How to use the parsel.lxmldocument.LxmlDocument function in parsel

To help you get started, we’ve selected a few parsel examples, based on popular ways it is used in public projects.

Secure your code as it's written. Use Snyk Code to scan source code in minutes - no build needed - and fix issues immediately.

Source (GitHub): scrapy / parsel / tests / test_selector_lxmldocument.py (view on GitHub, external link)
def test_caching(self):
    """Check that LxmlDocument results are reused per response object.

    Two calls with the same response must yield the very same object,
    while a call with a copy of that response must yield a different one.
    """
    original = HtmlResponse('http://www.example.com', body='')
    duplicate = original.copy()

    # Order matters: the first call populates whatever is being reused.
    first_doc = LxmlDocument(original)
    repeat_doc = LxmlDocument(original)
    duplicate_doc = LxmlDocument(duplicate)

    # Same response -> identical object (i.e. it was cached).
    assert first_doc is repeat_doc
    # Copied response -> a distinct object.
    assert first_doc is not duplicate_doc
Source (GitHub): scrapy / parsel / tests / test_selector_lxmldocument.py (view on GitHub, external link)
def test_null_char(self):
    """Check that a body containing a null character can be turned into a document.

    The test passes as long as building the LxmlDocument does not raise
    (the original concern being a TypeError).
    """
    url = 'http://example.com/catalog/product/blabla-123'
    headers = {'Content-Type': 'text/plain; charset=utf-8'}
    # The embedded null character is the problematic input under test.
    body = 'test problematic \x00 body'

    response = TextResponse(url, headers=headers, body=body)

    # No assertion needed: reaching the end without an exception is the check.
    LxmlDocument(response)
Source (GitHub): scrapy / parsel / tests / test_selector_lxmldocument.py (view on GitHub, external link)
def test_caching(self):
    """Verify that LxmlDocument hands back the same object for the same response.

    A copy of the response is a different response object, so it must not
    share the document obtained for the original.
    """
    response = HtmlResponse('http://www.example.com', body='')
    response_copy = response.copy()

    # Build both documents for the original response before the copy's one.
    doc_a = LxmlDocument(response)
    doc_b = LxmlDocument(response)
    doc_copy = LxmlDocument(response_copy)

    # make sure it's cached
    assert doc_a is doc_b
    # ...and that the cache does not leak across distinct response objects
    assert doc_a is not doc_copy
Source (GitHub): scrapy / parsel / tests / test_selector_lxmldocument.py (view on GitHub, external link)
def test_caching(self):
    """Assert identity-based reuse of LxmlDocument results.

    Expected: same response object -> same document object;
    copied response object -> different document object.
    """
    source_response = HtmlResponse('http://www.example.com', body='')
    copied_response = source_response.copy()

    # Evaluated left to right, so the original response is processed twice
    # before the copy is processed once.
    initial, again = LxmlDocument(source_response), LxmlDocument(source_response)
    from_copy = LxmlDocument(copied_response)

    # Repeated call on the same response returns the cached object.
    assert initial is again
    # The copy gets its own object.
    assert initial is not from_copy