1
0
mirror of https://github.com/scrapy/scrapy.git synced 2025-02-24 09:44:15 +00:00
scrapy/tests/test_selector_lxmldocument.py

27 lines
910 B
Python
Raw Normal View History

2013-10-14 10:35:02 -02:00
import unittest
from scrapy.selector.lxmldocument import LxmlDocument
from scrapy.http import TextResponse, HtmlResponse
2013-10-14 16:37:14 -02:00
class LxmlDocumentTest(unittest.TestCase):
    """Tests for building ``LxmlDocument`` objects from response objects."""

    def test_caching(self):
        """Check document identity across repeated and copied responses.

        Two documents built from the same response must be the very same
        object, while a document built from a copy of that response must be
        a different object.
        """
        # Explicit bytes literal: the ``b`` prefix is a no-op on Python 2 and
        # keeps the body a byte string on Python 3.
        r1 = HtmlResponse('http://www.example.com',
                          body=b'<html><head></head><body></body></html>')
        r2 = r1.copy()

        doc1 = LxmlDocument(r1)
        doc2 = LxmlDocument(r1)
        doc3 = LxmlDocument(r2)

        # make sure it's cached
        # unittest assertion methods are used instead of bare ``assert`` so
        # the checks still run under ``python -O`` and report both operands
        # on failure.
        self.assertIs(doc1, doc2)
        self.assertIsNot(doc1, doc3)

    def test_null_char(self):
        """Check that a body containing a null char can be parsed.

        The test passes as long as constructing the document does not raise.
        """
        # make sure bodies with null char ('\x00') don't raise a TypeError exception
        body = b'test problematic \x00 body'
        response = TextResponse('http://example.com/catalog/product/blabla-123',
                                headers={'Content-Type': 'text/plain; charset=utf-8'},
                                body=body)
        LxmlDocument(response)