Exemple #1
0
def test_content_select_xpath():
    """Verify that XPath queries on ``Content`` extract the expected values.

    Each query is run with ``method='xpath'`` and the ``extract()`` result
    is compared against the exact list expected for the ``CONTENT`` fixture.
    """
    content = Content(BASE_URL, CONTENT)

    # (query, expected extract() result) pairs, checked in order.
    expectations = (
        # Text node of the title element.
        ('//title/text()', ['Test content title']),
        # href attribute of every anchor.
        ('//a/@href', ['link1', 'link2', 'link3', 'link4', 'link5', 'link6']),
        # href attribute of anchors that are children of a <p>.
        ('//p/a/@href', ['link4', 'link5', 'link6']),
        # The anchor elements themselves, as serialized markup.
        (
            '//p/a',
            [
                '<a href="link4">Link4</a>',
                '<a href="link5">Link5</a>',
                '<a href="link6">Link6</a>',
            ],
        ),
    )
    for query, expected in expectations:
        assert content.select(query, method='xpath').extract() == expected
Exemple #2
0
def test_content_select_css():
    """Verify that CSS selectors on ``Content`` extract the title element.

    Both the bare ``title`` selector and the descendant selector
    ``html title`` are expected to yield the same single serialized element.
    """
    content = Content(BASE_URL, CONTENT)
    title_markup = ['<title>Test content title</title>']

    by_tag = content.select('title', method='css').extract()
    assert by_tag == title_markup

    by_descendant = content.select('html title', method='css').extract()
    assert by_descendant == title_markup
Exemple #3
0
def test_content_select_xpath():
    """Check the ``extract()`` output of several XPath queries on ``Content``.

    Covers a text-node query, attribute queries and an element query, all
    issued with ``method='xpath'`` against the ``CONTENT`` fixture.
    """
    content = Content(BASE_URL, CONTENT)

    # Text node of the title element.
    title_text = content.select('//title/text()', method='xpath').extract()
    assert title_text == ['Test content title']

    # href attribute of every anchor.
    all_hrefs = content.select('//a/@href', method='xpath').extract()
    assert all_hrefs == ['link1', 'link2', 'link3', 'link4', 'link5', 'link6']

    # href attribute of anchors that are children of a <p>.
    paragraph_hrefs = content.select('//p/a/@href', method='xpath').extract()
    assert paragraph_hrefs == ['link4', 'link5', 'link6']

    # The same anchors, extracted as serialized markup.
    paragraph_anchors = content.select('//p/a', method='xpath').extract()
    assert paragraph_anchors == [
        '<a href="link4">Link4</a>',
        '<a href="link5">Link5</a>',
        '<a href="link6">Link6</a>',
    ]
Exemple #4
0
def test_content_select_css():
    """Check that CSS selection of the title yields its serialized element.

    The selectors ``title`` and ``html title`` are each run with
    ``method='css'`` and must extract the same one-item list.
    """
    content = Content(BASE_URL, CONTENT)

    for selector in ('title', 'html title'):
        extracted = content.select(selector, method='css').extract()
        assert extracted == ['<title>Test content title</title>']