Example #1
0
def test_process_item_xlsx():
    """Check that ``process_item`` returns an item equal to a valid ``.xlsx`` File.

    The payload is an empty ``Workbook()`` serialised to bytes in memory.
    """
    # Local import keeps this test self-contained.
    import io

    spider = spider_with_crawler(unflatten=True)
    pipeline = Unflatten()

    # Serialise through Workbook.save() into an in-memory buffer instead of
    # save_virtual_workbook(): that helper is deprecated in openpyxl (assuming
    # Workbook is openpyxl's - TODO confirm) and absent from newer releases,
    # while saving to a file-like object yields the same bytes.
    buffer = io.BytesIO()
    Workbook().save(buffer)

    item = File({
        'file_name': 'test.xlsx',
        'data': buffer.getvalue(),
        'data_type': 'release_package',
        'url': 'http://test.com/test.xlsx',
    })

    assert pipeline.process_item(item, spider) == item
Example #2
0
def test_process_item_csv():
    """Check that ``process_item`` returns an item equal to the ``.csv`` File it is given."""
    crawler_spider = spider_with_crawler(unflatten=True)
    csv_fields = {
        'file_name': 'test.csv',
        'data': b'data',
        'data_type': 'release_package',
        'url': 'http://test.com/test.csv',
    }
    csv_file = File(csv_fields)

    processed = Unflatten().process_item(csv_file, crawler_spider)

    assert processed == csv_file
Example #3
0
def test_process_item_xlsx_error():
    """Expect ``BadXLSXZipFile`` when a ``.xlsx`` File carries the bytes ``b'data'``.

    The payload is not a real workbook, only four literal bytes.
    """
    crawler_spider = spider_with_crawler(unflatten=True)
    unflatten = Unflatten()
    broken_fields = {
        'file_name': 'test.xlsx',
        'data': b'data',
        'data_type': 'release_package',
        'url': 'http://test.com/test.xlsx',
    }
    broken_workbook = File(broken_fields)

    # Only the process_item call sits inside the context manager, so an error
    # raised while building the fixtures cannot satisfy the expectation.
    with pytest.raises(BadXLSXZipFile):
        unflatten.process_item(broken_workbook, crawler_spider)
Example #4
0
def test_process_item_extension_error():
    """Expect ``NotImplementedError`` for a File whose name (``'file'``) has no extension."""
    crawler_spider = spider_with_crawler(unflatten=True)
    unflatten = Unflatten()
    extensionless_fields = {
        'file_name': 'file',
        'data': b'data',
        'data_type': 'release_package',
        'url': 'http://test.com/file',
    }
    extensionless_file = File(extensionless_fields)

    # Only the process_item call sits inside the context manager, so an error
    # raised while building the fixtures cannot satisfy the expectation.
    with pytest.raises(NotImplementedError):
        unflatten.process_item(extensionless_file, crawler_spider)