boltons/tests/test_ioutils.py

445 lines
17 KiB
Python

import io
import os
import sys
import codecs
import random
import string
from tempfile import mkdtemp
from unittest import TestCase
from zipfile import ZipFile, ZIP_DEFLATED
from boltons import ioutils
CUR_FILE_PATH = os.path.abspath(__file__)
# Python2/3 compat
if sys.version_info[0] == 3:
text_type = str
binary_type = bytes
else:
text_type = unicode
binary_type = str
class AssertionsMixin(object):
def assertIsNone(self, item, msg=None):
self.assertTrue(item is None, msg)
class BaseTestMixin(object):
"""
A set of tests that work the same for SpooledBtyesIO and SpooledStringIO
"""
def test_getvalue_norollover(self):
"""Make sure getvalue function works with in-memory flo"""
self.spooled_flo.write(self.test_str)
self.assertEqual(self.spooled_flo.getvalue(), self.test_str)
def test_getvalue_rollover(self):
"""Make sure getvalue function works with on-disk flo"""
self.spooled_flo.write(self.test_str)
self.assertFalse(self.spooled_flo._rolled)
self.spooled_flo.rollover()
self.assertEqual(self.spooled_flo.getvalue(), self.test_str)
self.assertTrue(self.spooled_flo._rolled)
def test_rollover_custom_directory(self):
"""dir keyword argument is passed to TemporaryFile instantiation"""
custom_dir = mkdtemp()
try:
# Re-instantiate self.spooled_flo with the custom dir argument
_spooled_flo = type(self.spooled_flo)(dir=custom_dir)
self.assertEqual(_spooled_flo._dir, custom_dir)
# TemporaryFile is kind of a black box, we can't really test it
# since the directory entry for the file is removed immediately
# after the file is created. So we can't check path using fd.name
# or listdir(custom_dir). We could either convert rollover() to
# use NamedtemporaryFile-s or assume it's well tested enough that
# passing dir= into the constructor will work as expected. We'll
# call rollover() with the dir attribute set just to ensure
# nothing has gone absurdly wrong.
_spooled_flo.write(self.test_str)
_spooled_flo.rollover()
self.assertEqual(_spooled_flo.getvalue(), self.test_str)
self.assertTrue(_spooled_flo._rolled)
_spooled_flo.close()
finally:
os.rmdir(custom_dir)
def test_truncate_noargs_norollover(self):
"""Test truncating with no args with in-memory flo"""
self.spooled_flo.write(self.test_str)
self.spooled_flo.seek(10)
self.spooled_flo.truncate()
self.assertEqual(self.spooled_flo.getvalue(), self.test_str[:10])
def test_truncate_noargs_rollover(self):
"""Test truncating with no args with on-disk flo"""
self.spooled_flo.write(self.test_str)
self.spooled_flo.seek(10)
self.spooled_flo.rollover()
self.spooled_flo.truncate()
self.assertEqual(self.spooled_flo.getvalue(), self.test_str[:10])
def test_truncate_with_args_norollover(self):
"""Test truncating to a value with in-memory flo"""
self.spooled_flo.write(self.test_str)
self.spooled_flo.seek(5)
self.spooled_flo.truncate(10)
self.assertEqual(self.spooled_flo.getvalue(), self.test_str[:10])
def test_truncate_with_args_rollover(self):
"""Test truncating to a value with on-disk flo"""
self.spooled_flo.write(self.test_str)
self.spooled_flo.seek(5)
self.spooled_flo.rollover()
self.spooled_flo.truncate(10)
self.assertEqual(self.spooled_flo.getvalue(), self.test_str[:10])
def test_type_error_too_many_args(self):
"""Make sure TypeError raised if too many args passed to truncate"""
self.spooled_flo.write(self.test_str)
self.assertRaises(TypeError, self.spooled_flo.truncate, 0, 10)
def test_io_error_negative_truncate(self):
"""Make sure IOError raised trying to truncate with negative value"""
self.spooled_flo.write(self.test_str)
self.assertRaises(IOError, self.spooled_flo.truncate, -1)
def test_compare_different_instances(self):
"""Make sure two different instance types are not considered equal"""
a = ioutils.SpooledBytesIO()
a.write(binary_type(b"I am equal!"))
b = ioutils.SpooledStringIO()
b.write(text_type("I am equal!"))
self.assertNotEqual(a, b)
def test_compare_unequal_instances(self):
"""Comparisons of non-SpooledIOBase classes should fail"""
self.assertNotEqual("Bummer dude", self.spooled_flo)
def test_set_softspace_attribute(self):
"""Ensure softspace attribute can be retrieved and set"""
self.spooled_flo.softspace = True
self.assertTrue(self.spooled_flo.softspace)
def test_set_softspace_attribute_rolled(self):
"""Ensure softspace attribute can be retrieved and set if rolled"""
self.spooled_flo.softspace = True
self.assertTrue(self.spooled_flo.softspace)
self.spooled_flo.rollover()
self.spooled_flo.softspace = True
self.assertTrue(self.spooled_flo.softspace)
def test_iter(self):
"""Make sure iter works as expected"""
self.spooled_flo.write(self.test_str)
self.spooled_flo.seek(0)
self.assertEqual([x for x in self.spooled_flo][0], self.test_str)
self.assertEqual([x for x in self.spooled_flo][0], self.data_type())
def test_buf_property(self):
"""'buf' property returns the same value as getvalue()"""
self.assertEqual(self.spooled_flo.buf, self.spooled_flo.getvalue())
def test_pos_property(self):
"""'pos' property returns the same value as tell()"""
self.assertEqual(self.spooled_flo.pos, self.spooled_flo.tell())
def test_closed_property(self):
"""'closed' property works as expected"""
self.assertFalse(self.spooled_flo.closed)
self.spooled_flo.close()
self.assertTrue(self.spooled_flo.closed)
def test_readline(self):
"""Make readline returns expected values"""
self.spooled_flo.write(self.test_str_lines)
self.spooled_flo.seek(0)
self.assertEqual(self.spooled_flo.readline().rstrip(self.linesep),
self.test_str_lines.split(self.linesep)[0])
def test_readlines(self):
"""Make sure readlines returns expected values"""
self.spooled_flo.write(self.test_str_lines)
self.spooled_flo.seek(0)
self.assertEqual(
[x.rstrip(self.linesep) for x in self.spooled_flo.readlines()],
self.test_str_lines.split(self.linesep)
)
def test_next(self):
"""Make next returns expected values"""
self.spooled_flo.write(self.test_str_lines)
self.spooled_flo.seek(0)
self.assertEqual(self.spooled_flo.next().rstrip(self.linesep),
self.test_str_lines.split(self.linesep)[0])
def test_isatty(self):
"""Make sure we can check if the value is a tty"""
# This should simply not fail
self.assertTrue(self.spooled_flo.isatty() is True or
self.spooled_flo.isatty() is False)
def test_truthy(self):
"""Make sure empty instances are still considered truthy"""
self.spooled_flo.seek(0)
self.spooled_flo.truncate()
if not self.spooled_flo:
raise AssertionError("Instance is not truthy")
class TestSpooledBytesIO(TestCase, BaseTestMixin, AssertionsMixin):
linesep = os.linesep.encode('ascii')
def setUp(self):
self.spooled_flo = ioutils.SpooledBytesIO()
self.test_str = b"Armado en los EE, UU. para S. P. Richards co.,"
self.test_str_lines = (
"Text with:{0}newlines!".format(os.linesep).encode('ascii')
)
self.data_type = binary_type
def test_compare_not_equal_instances(self):
"""Make sure instances with different values fail == check."""
a = ioutils.SpooledBytesIO()
a.write(b"I am a!")
b = ioutils.SpooledBytesIO()
b.write(b"I am b!")
self.assertNotEqual(a, b)
def test_compare_two_equal_instances(self):
"""Make sure we can compare instances"""
a = ioutils.SpooledBytesIO()
a.write(b"I am equal!")
b = ioutils.SpooledBytesIO()
b.write(b"I am equal!")
self.assertEqual(a, b)
def test_auto_rollover(self):
"""Make sure file rolls over to disk after max_size reached"""
tmp = ioutils.SpooledBytesIO(max_size=10)
tmp.write(b"The quick brown fox jumped over the lazy dogs.")
self.assertTrue(tmp._rolled)
def test_use_as_context_mgr(self):
"""Make sure SpooledBytesIO can be used as a context manager"""
test_str = b"Armado en los EE, UU. para S. P. Richards co.,"
with ioutils.SpooledBytesIO() as f:
f.write(test_str)
self.assertEqual(f.getvalue(), test_str)
def test_len_no_rollover(self):
"""Make sure len works with in-memory flo"""
self.spooled_flo.write(self.test_str)
self.assertEqual(self.spooled_flo.len, len(self.test_str))
self.assertEqual(len(self.spooled_flo), len(self.test_str))
def test_len_rollover(self):
"""Make sure len works with on-disk flo"""
self.spooled_flo.write(self.test_str)
self.spooled_flo.rollover()
self.assertEqual(self.spooled_flo.len, len(self.test_str))
self.assertEqual(len(self.spooled_flo), len(self.test_str))
def test_invalid_type(self):
"""Ensure TypeError raised when writing unicode to SpooledBytesIO"""
self.assertRaises(TypeError, self.spooled_flo.write, u"hi")
def test_flush_after_rollover(self):
"""Make sure we can flush before and after rolling to a real file"""
self.spooled_flo.write(self.test_str)
self.assertIsNone(self.spooled_flo.flush())
self.spooled_flo.rollover()
self.assertIsNone(self.spooled_flo.flush())
def test_zip_compat(self):
"""Make sure object is compatible with ZipFile library"""
self.spooled_flo.seek(0)
self.spooled_flo.truncate()
doc = ZipFile(self.spooled_flo, 'w', ZIP_DEFLATED)
doc.writestr("content.txt", "test")
self.assertTrue('content.txt' in doc.namelist())
doc.close()
class TestSpooledStringIO(TestCase, BaseTestMixin, AssertionsMixin):
linesep = os.linesep
def setUp(self):
self.spooled_flo = ioutils.SpooledStringIO()
self.test_str = u"Remember kids, always use an emdash: '\u2014'"
self.test_str_lines = u"Text with\u2014{0}newlines!".format(os.linesep)
self.data_type = text_type
def test_compare_not_equal_instances(self):
"""Make sure instances with different values fail == check."""
a = ioutils.SpooledStringIO()
a.write(u"I am a!")
b = ioutils.SpooledStringIO()
b.write(u"I am b!")
self.assertNotEqual(a, b)
def test_compare_two_equal_instances(self):
"""Make sure we can compare instances"""
a = ioutils.SpooledStringIO()
a.write(u"I am equal!")
b = ioutils.SpooledStringIO()
b.write(u"I am equal!")
self.assertEqual(a, b)
def test_auto_rollover(self):
"""Make sure file rolls over to disk after max_size reached"""
tmp = ioutils.SpooledStringIO(max_size=10)
tmp.write(u"The quick brown fox jumped over the lazy dogs.")
self.assertTrue(tmp._rolled)
def test_use_as_context_mgr(self):
"""Make sure SpooledStringIO can be used as a context manager"""
test_str = u"Armado en los EE, UU. para S. P. Richards co.,"
with ioutils.SpooledStringIO() as f:
f.write(test_str)
self.assertEqual(f.getvalue(), test_str)
def test_len_no_rollover(self):
"""Make sure len property works with in-memory flo"""
self.spooled_flo.write(self.test_str)
self.assertEqual(self.spooled_flo.len, len(self.test_str))
def test_len_rollover(self):
"""Make sure len propery works with on-disk flo"""
self.spooled_flo.write(self.test_str)
self.spooled_flo.rollover()
self.assertEqual(self.spooled_flo.len, len(self.test_str))
def test_invalid_type(self):
"""Ensure TypeError raised when writing bytes to SpooledStringIO"""
self.assertRaises(TypeError, self.spooled_flo.write, b"hi")
def test_tell_codepoints(self):
"""Verify tell() returns codepoint position, not bytes position"""
self.spooled_flo.write(self.test_str)
self.spooled_flo.seek(0)
self.spooled_flo.read(40)
self.assertEqual(self.spooled_flo.tell(), 40)
self.spooled_flo.seek(10)
self.assertEqual(self.spooled_flo.tell(), 10)
def test_codepoints_all_enc(self):
""""Test getting read, seek, tell, on various codepoints"""
test_str = u"\u2014\u2014\u2014"
self.spooled_flo.write(test_str)
self.spooled_flo.seek(1)
self.assertEqual(self.spooled_flo.read(), u"\u2014\u2014")
self.assertEqual(len(self.spooled_flo), len(test_str))
def test_seek_codepoints_SEEK_END(self):
"""Make sure seek() moves to codepoints relative to file end"""
self.spooled_flo.write(self.test_str)
ret = self.spooled_flo.seek(0, os.SEEK_END)
self.assertEqual(ret, len(self.test_str))
def test_seek_codepoints_large_SEEK_END(self):
"""Make sure seek() moves to codepoints relative to file end"""
test_str = u"".join(random.choice(string.ascii_letters) for
x in range(34000))
self.spooled_flo.write(test_str)
ret = self.spooled_flo.seek(0, os.SEEK_END)
self.assertEqual(ret, len(test_str))
def test_seek_codepoints_SEEK_SET(self):
"""Make sure seek() moves to codepoints relative to file start"""
self.spooled_flo.write(self.test_str)
ret = self.spooled_flo.seek(3, os.SEEK_SET)
self.assertEqual(ret, 3)
def test_seek_codepoints_large_SEEK_SET(self):
"""Make sure seek() moves to codepoints relative to file start"""
test_str = u"".join(random.choice(string.ascii_letters) for
x in range(34000))
self.spooled_flo.write(test_str)
ret = self.spooled_flo.seek(33000, os.SEEK_SET)
self.assertEqual(ret, 33000)
def test_seek_codepoints_SEEK_CUR(self):
"""Make sure seek() moves to codepoints relative to current_position"""
test_str = u"\u2014\u2014\u2014"
self.spooled_flo.write(test_str)
self.spooled_flo.seek(1)
self.assertEqual(self.spooled_flo.tell(), 1)
ret = self.spooled_flo.seek(2, os.SEEK_CUR)
self.assertEqual(ret, 3)
def test_seek_codepoints_large_SEEK_CUR(self):
"""Make sure seek() moves to codepoints relative to current_position"""
test_str = u"".join(random.choice(string.ascii_letters) for
x in range(34000))
self.spooled_flo.write(test_str)
self.spooled_flo.seek(1)
ret = self.spooled_flo.seek(33000, os.SEEK_CUR)
self.assertEqual(ret, 33001)
def test_x80_codepoint(self):
"""Make sure x80 codepoint doesn't confuse read value"""
test_str = u'\x8000'
self.spooled_flo.write(test_str)
self.spooled_flo.seek(0)
self.assertEqual(len(self.spooled_flo.read(2)), 2)
self.assertEqual(self.spooled_flo.read(), '0')
def test_seek_encoded(self):
"""Make sure reading works when bytes exceeds read val"""
test_str = u"\u2014\u2014\u2014"
self.spooled_flo.write(test_str)
self.spooled_flo.seek(0)
self.assertEqual(self.spooled_flo.read(3), test_str)
class TestMultiFileReader(TestCase):
def test_read_seek_bytes(self):
r = ioutils.MultiFileReader(io.BytesIO(b'narf'), io.BytesIO(b'troz'))
self.assertEqual([b'nar', b'ftr', b'oz'],
list(iter(lambda: r.read(3), b'')))
r.seek(0)
self.assertEqual(b'narftroz', r.read())
def test_read_seek_text(self):
r = ioutils.MultiFileReader(io.StringIO(u'narf'), io.StringIO(u'troz'))
self.assertEqual([u'nar', u'ftr', u'oz'],
list(iter(lambda: r.read(3), u'')))
r.seek(0)
self.assertEqual(u'narftroz', r.read())
def test_no_mixed_bytes_and_text(self):
self.assertRaises(ValueError, ioutils.MultiFileReader,
io.BytesIO(b'narf'), io.StringIO(u'troz'))
def test_open(self):
with open(CUR_FILE_PATH, 'r') as f:
r_file_str = f.read()
with open(CUR_FILE_PATH, 'r') as f1:
with open(CUR_FILE_PATH, 'r') as f2:
mfr = ioutils.MultiFileReader(f1, f2)
r_double_file_str = mfr.read()
assert r_double_file_str == (r_file_str * 2)
with open(CUR_FILE_PATH, 'rb') as f:
rb_file_str = f.read()
with open(CUR_FILE_PATH, 'rb') as f1:
with open(CUR_FILE_PATH, 'rb') as f2:
mfr = ioutils.MultiFileReader(f1, f2)
rb_double_file_str = mfr.read()
assert rb_double_file_str == (rb_file_str * 2)
utf8_file_str = codecs.open(CUR_FILE_PATH, encoding='utf8').read()
f1, f2 = (codecs.open(CUR_FILE_PATH, encoding='utf8'),
codecs.open(CUR_FILE_PATH, encoding='utf8'))
mfr = ioutils.MultiFileReader(f1, f2)
utf8_double_file_str = mfr.read()
assert utf8_double_file_str == (utf8_file_str * 2)