Python file_reader示例，tablite.core.file_reader Python示例

示例#1

0

显示文件

文件： filereader_tests.py 项目： root-11/tablite

def test_filereader_gdocs1xlsx_import_single_sheet():
    path = Path(__file__).parent / "data" / 'gdocs1.xlsx'
    assert path.exists()

    # all sheets
    tables = list(file_reader(path, has_headers=False))
    assert len(tables) == 2

    # multiple sheets
    tables = list(
        file_reader(path, has_headers=False, sheet_names=['Sheet1', 'Sheet2']))
    assert len(tables) == 2

    tables = list(file_reader(path, has_headers=False, sheet_names='Sheet2'))
    assert len(tables) == 1

示例#2

0

显示文件

文件： filereader_tests.py 项目： root-11/tablite

def test_filereader_123csv():
    csv_file = Path(__file__).parent / "data" / "123.csv"

    table7 = Table(filename=csv_file.name)
    table7.metadata['filename'] = '123.csv'
    table7.add_column('A',
                      int,
                      data=[1, None, 8, 3, 4, 6, 5, 7, 9],
                      allow_empty=True)
    table7.add_column('B', int, data=[10, 100, 1, 1, 1, 1, 10, 10, 10])
    table7.add_column('C', int, data=[0, 1, 0, 1, 0, 1, 0, 1, 0])
    sort_order = {'B': False, 'C': False, 'A': False}
    table7.sort(**sort_order)

    headers = ", ".join([c for c in table7.columns])
    data = [headers]
    for row in table7.rows:
        data.append(", ".join(str(v) for v in row))

    s = "\n".join(data)
    print(s)
    csv_file.write_text(s)  # write
    tr_table = list(file_reader(csv_file))[0]  # read
    csv_file.unlink()  # cleanup

    tr_table.show()
    find_format(tr_table)

    assert tr_table == table7

示例#3

0

显示文件

文件： filereader_tests.py 项目： root-11/tablite

def test_filereader_book1xlsx():
    path = Path(__file__).parent / "data" / 'book1.xlsx'
    assert path.exists()
    start = process_time_ns()
    tables = list(file_reader(path))
    end = process_time_ns()

    fields = sum(len(t) * len(t.columns) for t in tables)
    print("{:,} fields/seccond".format(
        round(1e9 * fields / max(1, end - start), 0)))

    sheet1 = Table(filename=path.name, sheet_name='Sheet1')
    for column_name in list('abcdef'):
        sheet1.add_column(column_name, int, False)

    sheet2 = Table(
        filename=path.name,
        sheet_name='Sheet2 ')  # there's a deliberate white space at the end!
    sheet2.add_column('a', int, False)
    for column_name in list('bcdef'):
        sheet2.add_column(column_name, float, False)

    books = [sheet1, sheet2]

    for book, table in zip(books, tables):
        table.show(slice(5))
        assert table.compare(book)
        assert len(table) == 45, len(table)

示例#4

0

显示文件

文件： filereader_tests.py 项目： root-11/tablite

def test_filereader_saptxt():
    path = Path(__file__).parent / "data" / 'sap.txt'
    assert path.exists()
    # test part 1: split using user defined sequence.
    header = "    | Delivery |  Item|Pl.GI date|Route |SC|Ship-to   |SOrg.|Delivery quantity|SU| TO Number|Material    |Dest.act.qty.|BUn|Typ|Source Bin|Cty"
    split_sequence = ["|"] * header.count('|')
    table = list(file_reader(path, split_sequence=split_sequence))[0]
    table.show(slice(5))

    sap_sample = Table(filename=path.name)
    sap_sample.add_column('None', str, True)
    sap_sample.add_column('Delivery', int, False)
    sap_sample.add_column('Item', int, False)
    sap_sample.add_column('Pl.GI date', date, False)
    sap_sample.add_column('Route', str, False)
    sap_sample.add_column('SC', str, False)
    sap_sample.add_column('Ship-to', str, False)
    sap_sample.add_column('SOrg.', str, False)
    sap_sample.add_column('Delivery quantity', int, False)
    sap_sample.add_column('SU', str, False)
    sap_sample.add_column('TO Number', int, False)
    sap_sample.add_column('Material', str, False)
    sap_sample.add_column('Dest.act.qty.', int, False)
    sap_sample.add_column('BUn', str, False)
    sap_sample.add_column('Typ', str, False)
    sap_sample.add_column('Source Bin', str, False)
    sap_sample.add_column('Cty|', str, False)

    assert table.compare(sap_sample)
    assert len(table) == 20, len(table)

示例#5

0

显示文件

文件： filereader_tests.py 项目： root-11/tablite

def test_filereader_gdocs1xlsx_no_header():
    path = Path(__file__).parent / "data" / 'gdocs1.xlsx'
    assert path.exists()
    table = list(file_reader(path, has_headers=False))[0]
    table.show(slice(0, 10))

    gdocs1xlsx = Table(filename=path.name, sheet_name='Sheet1')
    for idx, _ in enumerate(list('abcdef'), 1):
        gdocs1xlsx.add_column(f"_{idx}", str)

    assert table.compare(gdocs1xlsx), table.compare(gdocs1xlsx)
    assert len(table) == 46

示例#6

0

显示文件

文件： filereader_tests.py 项目： root-11/tablite

def test_filereader_gdocs1csv_no_header():
    path = Path(__file__).parent / "data" / 'gdocs1.csv'
    assert path.exists()
    table = list(file_reader(path, has_headers=False))[0]
    table.show(slice(0, 10))

    book1_csv = Table(filename=path.name)
    for idx, _ in enumerate(list('abcdef'), 1):
        book1_csv.add_column(f"_{idx}", str)

    assert table.compare(book1_csv), table.compare(book1_csv)
    assert len(table) == 46

示例#7

0

显示文件

文件： filereader_tests.py 项目： root-11/tablite

def test_filereader_utf8sig_encoding_csv():
    path = Path(__file__).parent / "data" / 'utf8sig.csv'
    assert path.exists()
    table = list(file_reader(path, sep=','))[0]
    table.show(slice(0, 10))
    table.show(slice(-15))

    book1_csv = Table(filename=path.name)
    book1_csv.add_column('432', int)
    book1_csv.add_column('1', int)
    assert table.compare(book1_csv), table.compare(book1_csv)
    assert len(table) == 2, len(table)

示例#8

0

显示文件

文件： filereader_tests.py 项目： root-11/tablite

def test_filereader_gdocs1xlsx():
    path = Path(__file__).parent / "data" / 'gdocs1.xlsx'
    assert path.exists()
    table = list(file_reader(path))[0]
    table.show(slice(0, 10))

    gdocs1xlsx = Table(filename=path.name, sheet_name='Sheet1')
    for float_type in list('abcdef'):
        gdocs1xlsx.add_column(float_type, int)

    assert table.compare(gdocs1xlsx), table.compare(gdocs1xlsx)
    assert len(table) == 45

示例#9

0

显示文件

文件： filereader_tests.py 项目： root-11/tablite

def test_filereader_book1tsv():
    path = Path(__file__).parent / "data" / 'book1.tsv'
    assert path.exists()
    table = list(file_reader(path))[0]
    table.show(slice(0, 10))

    book1 = Table(filename=path.name)
    book1.add_column('a', int)
    for float_type in list('bcdef'):
        book1.add_column(float_type, float)

    assert table.compare(book1), table.compare(book1)
    assert len(table) == 45

示例#10

0

显示文件

文件： filereader_tests.py 项目： root-11/tablite

def test_filereader_exceldatesxlsx():
    path = Path(__file__).parent / "data" / 'excel_dates.xlsx'
    assert path.exists()
    table = list(file_reader(path))[0]
    table.show()

    sheet1 = Table(filename=path.name, sheet_name='Sheet1')
    sheet1.add_column('Date', datetime, False)
    sheet1.add_column('numeric value', int, False)
    sheet1.add_column('string', date, False)
    sheet1.add_column('bool', bool, False)

    assert table.compare(sheet1)
    assert len(table) == 2, len(table)

示例#11

0

显示文件

文件： filereader_tests.py 项目： root-11/tablite

def test_filereader_win1251_encoding_csv():
    path = Path(__file__).parent / "data" / 'win1250_test.csv'
    assert path.exists()
    table = list(file_reader(path, sep=';'))[0]
    table.show(slice(0, 10))
    table.show(slice(-15))

    book1_csv = Table(filename=path.name)
    book1_csv.add_column('Item', int)
    book1_csv.add_column('Materiál', str)
    book1_csv.add_column('Objem', float)
    book1_csv.add_column('Jednotka objemu', str)
    book1_csv.add_column('Free Inv Pcs', int)
    assert table.compare(book1_csv), table.compare(book1_csv)
    assert len(table) == 99, len(table)

示例#12

0

显示文件

文件： filereader_tests.py 项目： root-11/tablite

def test_filereader_zipped():
    path = Path(__file__).parent / 'data'
    assert path.exists()
    assert path.is_dir()
    zipped = Path(__file__).parent / 'new.zip'
    file_count = 0
    file_names = []
    with zipfile.ZipFile(zipped, 'w') as zipf:
        for file in path.iterdir():
            zipf.write(file)
            file_count += 1
            file_names.append(file.name)

    tables = list(file_reader(zipped))
    assert len(tables) >= file_count

    assert {t.metadata['filename'] for t in tables} == set(file_names)
    zipped.unlink()

示例#13

0

显示文件

文件： filereader_tests.py 项目： root-11/tablite

def test_filereader_gdocsc1ods_no_header():
    path = Path(__file__).parent / "data" / 'gdocs1.ods'
    assert path.exists()
    tables = file_reader(path, has_headers=False)

    sheet1 = Table(filename=path.name, sheet_name='Sheet1')
    for idx, _ in enumerate(list('abcdef'), 1):
        sheet1.add_column(f"_{idx}", str)

    sheet2 = Table(filename=path.name, sheet_name='Sheet2')
    for idx, _ in enumerate(list('abcdef'), 1):
        sheet2.add_column(f"_{idx}", str)

    sheets = [sheet1, sheet2]

    for sheet, table in zip(sheets, tables):
        table.show(slice(0, 10))
        table.compare(sheet)
        assert len(table) == 46, table.show(blanks="")

示例#14

0

显示文件

文件： filereader_tests.py 项目： root-11/tablite

def test_filereader_gdocsc1ods():
    path = Path(__file__).parent / "data" / 'gdocs1.ods'
    assert path.exists()
    tables = file_reader(path)

    sheet1 = Table(filename=path.name, sheet_name='Sheet1')
    for int_type in list('abcdef'):
        sheet1.add_column(int_type, int)

    sheet2 = Table(filename=path.name, sheet_name='Sheet2')
    sheet2.add_column('a', int)
    for float_type in list('bcdef'):
        sheet2.add_column(float_type, float)

    sheets = [sheet1, sheet2]

    for sheet, table in zip(sheets, tables):
        table.compare(sheet)
        assert len(table) == 45, table.show(blanks="")