def test_content_select_xpath():
    """Check XPath selection on a ``Content`` built from the shared fixture.

    Each XPath query is run through ``content.select(..., method='xpath')``
    and the ``extract()`` result is compared with the expected list:
    a text node, attribute values, and serialized ``<a>`` elements.
    """
    # NOTE(review): a function with this same name is defined again later in
    # this file; if both live at module level the later one replaces this one
    # and only that one is collected -- confirm and deduplicate.
    content = Content(BASE_URL, CONTENT)

    # (query, expected extract() output), checked in this order.
    expectations = (
        ('//title/text()', ['Test content title']),
        (
            '//a/@href',
            ['link1', 'link2', 'link3', 'link4', 'link5', 'link6'],
        ),
        ('//p/a/@href', ['link4', 'link5', 'link6']),
        (
            '//p/a',
            [
                '<a href="link4">Link4</a>',
                '<a href="link5">Link5</a>',
                '<a href="link6">Link6</a>',
            ],
        ),
    )

    for query, expected in expectations:
        assert content.select(query, method='xpath').extract() == expected
def test_content_select_css():
    """Check CSS selection on a ``Content`` built from the shared fixture.

    Both a bare tag selector and a descendant selector are expected to
    extract the same serialized ``<title>`` element.
    """
    # NOTE(review): a function with this same name is defined again later in
    # this file; if both live at module level the later one replaces this one
    # and only that one is collected -- confirm and deduplicate.
    content = Content(BASE_URL, CONTENT)

    # (selector, expected extract() output), checked in this order.
    expectations = (
        ('title', ['<title>Test content title</title>']),
        ('html title', ['<title>Test content title</title>']),
    )

    for selector, expected in expectations:
        assert content.select(selector, method='css').extract() == expected
def test_content_select_xpath():
    """Verify the lists extracted by XPath queries against ``Content``.

    Covers a text-node query, two attribute queries (all anchors, and
    anchors nested in ``<p>``), and an element query whose results are
    compared as serialized markup.
    """
    # NOTE(review): an earlier definition with this same name appears in this
    # file; if both live at module level this one shadows it -- confirm and
    # remove the duplicate.
    content = Content(BASE_URL, CONTENT)

    def xpath(query):
        # Run one XPath query and return the extracted results.
        return content.select(query, method='xpath').extract()

    assert xpath('//title/text()') == ['Test content title']

    all_hrefs = xpath('//a/@href')
    assert all_hrefs == ['link1', 'link2', 'link3', 'link4', 'link5', 'link6']

    paragraph_hrefs = xpath('//p/a/@href')
    assert paragraph_hrefs == ['link4', 'link5', 'link6']

    paragraph_anchors = xpath('//p/a')
    assert paragraph_anchors == [
        '<a href="link4">Link4</a>',
        '<a href="link5">Link5</a>',
        '<a href="link6">Link6</a>',
    ]
def test_content_select_css():
    """Verify the lists extracted by CSS selectors against ``Content``.

    The selectors ``title`` and ``html title`` must each extract exactly
    one serialized ``<title>`` element.
    """
    # NOTE(review): an earlier definition with this same name appears in this
    # file; if both live at module level this one shadows it -- confirm and
    # remove the duplicate.
    content = Content(BASE_URL, CONTENT)
    expected_title = ['<title>Test content title</title>']

    by_tag = content.select('title', method='css').extract()
    assert by_tag == expected_title

    by_descendant = content.select('html title', method='css').extract()
    assert by_descendant == expected_title