2011-06-06 18:25:14 -03:00
|
|
|
import unittest
|
|
|
|
from os.path import join
|
|
|
|
|
2014-07-30 16:53:28 -03:00
|
|
|
from tests import tests_datadir
|
2011-06-06 18:25:14 -03:00
|
|
|
from scrapy.utils.gz import gunzip
|
|
|
|
|
|
|
|
SAMPLEDIR = join(tests_datadir, 'compressed')
|
|
|
|
|
|
|
|
class GzTest(unittest.TestCase):
|
|
|
|
|
|
|
|
def test_gunzip_basic(self):
|
|
|
|
with open(join(SAMPLEDIR, 'feed-sample1.xml.gz'), 'rb') as f:
|
|
|
|
text = gunzip(f.read())
|
|
|
|
self.assertEqual(len(text), 9950)
|
|
|
|
|
|
|
|
def test_gunzip_truncated(self):
|
|
|
|
with open(join(SAMPLEDIR, 'truncated-crc-error.gz'), 'rb') as f:
|
|
|
|
text = gunzip(f.read())
|
|
|
|
assert text.endswith('</html')
|
|
|
|
|
|
|
|
def test_gunzip_no_gzip_file_raises(self):
|
|
|
|
with open(join(SAMPLEDIR, 'feed-sample1.xml'), 'rb') as f:
|
|
|
|
self.assertRaises(IOError, gunzip, f.read())
|
|
|
|
|
2012-10-10 12:21:59 +03:00
|
|
|
def test_gunzip_truncated_short(self):
|
|
|
|
with open(join(SAMPLEDIR, 'truncated-crc-error-short.gz'), 'rb') as f:
|
|
|
|
text = gunzip(f.read())
|
|
|
|
assert text.endswith('</html>')
|