Пример #1
0
# SimpleSQLite
# pip install simplesqlite
from simplesqlite import SimpleSQLite
import pandas as pd
import sys
import sqlite3

# read annotation file
print('reading annotation file...')
anno_df = pd.read_csv(sys.argv[1], sep='\t', index_col=0, header=0)

new_list = ['GeneID'] + list(anno_df.columns)

anno_df = anno_df.reindex(columns=new_list)

anno_df.GeneID = anno_df.index

print('connect gff sqlite3 database...')
con = SimpleSQLite(sys.argv[2])

print('create new table to gff sqlite3 database...')
con.create_table_from_dataframe(anno_df, table_name='anno')

print('create index to sqlite3 database...')
con.create_index_list(
    'anno', ['GeneID', 'Nr', 'Swissprot', 'KEGG', 'TrEMBL', 'Interpro'])

con.commit()
con.close()
Пример #2
0
print('reading expression file...')
anno_df = pd.read_csv(sys.argv[1], sep='\t', index_col=0, header=0)

new_list = ['Gene_id'] + list(anno_df.columns)

anno_df = anno_df.reindex(columns=new_list)

anno_df.Gene_id = anno_df.index

print('connect sqlite3 database...')
if os.path.exists(sys.argv[2]):
    os.remove(sys.argv[2])
    print("file exists! we will detele it.")
con = SimpleSQLite(sys.argv[2])

print('create new table to sqlite3 database...')
#con.create_table_from_dataframe(anno_df, table_name='exp',add_primary_key_column=1)

con.create_table_from_dataframe(anno_df,
                                table_name='exp',
                                primary_key='Gene_id')

# Migration
print('create index to sqlite3 database...')
con.create_index_list('exp', [
    'Gene_id',
])

con.commit()
con.close()