Python _blast6_to_data_frameの例、skbio.io.format.blast6._blast6_to_data_frame Pythonの例

コード例 #1

0

ファイルを表示

ファイル: test_blast6.py プロジェクト: ebolyen/scikit-bio

 def test_wrong_column_name_error(self):
     # The requested column list contains 'abcd'; the reader is expected to
     # raise a ValueError whose message names that column.
     path = get_data_path('blast6_default_single_line')
     requested = ['qseqid', 'sseqid', 'pident', 'length', 'mismatch',
                  'gapopen', 'qstart', 'qend', 'sstart', 'send', 'abcd',
                  'bitscore']
     with assertRaisesRegex(self, ValueError,
                            "Unrecognized column.*'abcd'"):
         _blast6_to_data_frame(path, columns=requested)

コード例 #2

0

ファイルを表示

 def test_wrong_column_name_error(self):
     # Passing a column list that includes 'abcd' must surface as a
     # ValueError matching the pattern below.
     expected_message = "Unrecognized column.*'abcd'"
     fixture = get_data_path('blast6_default_single_line')
     column_names = [
         'qseqid', 'sseqid', 'pident', 'length', 'mismatch', 'gapopen',
         'qstart', 'qend', 'sstart', 'send', 'abcd', 'bitscore',
     ]
     with self.assertRaisesRegex(ValueError, expected_message):
         _blast6_to_data_frame(fixture, columns=column_names)

コード例 #3

0

ファイルを表示

ファイル: test_blast6.py プロジェクト: ebolyen/scikit-bio

 def test_default_valid_single_line(self):
     # Parse the single-line fixture with default_columns=True and compare
     # the result with a hand-built one-row frame.
     path = get_data_path('blast6_default_single_line')
     observed = _blast6_to_data_frame(path, default_columns=True)

     header = ['qseqid', 'sseqid', 'pident', 'length', 'mismatch',
               'gapopen', 'qstart', 'qend', 'sstart', 'send', 'evalue',
               'bitscore']
     record = ['query1', 'subject2', 75.0, 8.0, 2.0, 0.0, 1.0, 8.0, 2.0,
               9.0, 0.06, 11.5]
     expected = pd.DataFrame([record], columns=header)

     assert_data_frame_almost_equal(observed, expected)

コード例 #4

0

ファイルを表示

ファイル: test_blast6.py プロジェクト: ebolyen/scikit-bio

 def test_custom_valid_single_line(self):
     # Read the single-line fixture using an explicit, caller-chosen column
     # list and check the resulting one-row frame.
     header = ['qacc', 'qseq', 'btop', 'sframe', 'ppos', 'positive', 'gaps']
     path = get_data_path('blast6_custom_single_line')
     # Hand the reader its own copy so the expected frame is built from an
     # independent list, as in a literal-per-call layout.
     observed = _blast6_to_data_frame(path, columns=list(header))

     record = ['query1', 'PAAWWWWW', 8.0, 1.0, 100.00, 8.0, 0.0]
     expected = pd.DataFrame([record], columns=header)
     assert_data_frame_almost_equal(observed, expected)

コード例 #5

0

ファイルを表示

ファイル: test_blast6.py プロジェクト: ebolyen/scikit-bio

 def test_valid_nan_handling(self):
     # The expected frame carries np.nan in both text and numeric positions;
     # the reader's output for the mixed-NaN fixture must match it.
     header = ['qacc', 'qseq', 'btop', 'sframe', 'ppos', 'positive', 'gaps']
     path = get_data_path('blast6_custom_mixed_nans')
     observed = _blast6_to_data_frame(path, columns=list(header))

     first_row = [np.nan, 'PAAWWWWW', 8.0, 1.0, 100.00, np.nan, 0.0]
     second_row = ['query1', np.nan, 8.0, 1.0, np.nan, 8.0, 0.0]
     expected = pd.DataFrame([first_row, second_row], columns=header)
     assert_data_frame_almost_equal(observed, expected)

コード例 #6

0

ファイルを表示

 def test_custom_valid_single_line(self):
     # One record, seven caller-specified columns.
     fixture = get_data_path('blast6_custom_single_line')
     parsed = _blast6_to_data_frame(
         fixture,
         columns=['qacc', 'qseq', 'btop', 'sframe', 'ppos', 'positive',
                  'gaps'])

     rows = [['query1', 'PAAWWWWW', 8.0, 1.0, 100.00, 8.0, 0.0]]
     wanted = pd.DataFrame(
         rows,
         columns=['qacc', 'qseq', 'btop', 'sframe', 'ppos', 'positive',
                  'gaps'])
     assert_data_frame_almost_equal(parsed, wanted)

コード例 #7

0

ファイルを表示

 def test_default_valid_single_line(self):
     # Default-column parse of the single-line fixture versus a literal
     # one-row frame with the same twelve column names.
     fixture = get_data_path('blast6_default_single_line')
     parsed = _blast6_to_data_frame(fixture, default_columns=True)

     rows = [
         ['query1', 'subject2', 75.0, 8.0, 2.0, 0.0, 1.0, 8.0, 2.0, 9.0,
          0.06, 11.5],
     ]
     names = [
         'qseqid', 'sseqid', 'pident', 'length', 'mismatch', 'gapopen',
         'qstart', 'qend', 'sstart', 'send', 'evalue', 'bitscore',
     ]
     wanted = pd.DataFrame(rows, columns=names)
     assert_data_frame_almost_equal(parsed, wanted)

コード例 #8

0

ファイルを表示

ファイル: test_blast6.py プロジェクト: ebolyen/scikit-bio

 def test_default_valid_multi_line(self):
     # Three records parsed with default_columns=True; each expected row is
     # spelled out on its own for readability.
     path = get_data_path('blast6_default_multi_line')
     observed = _blast6_to_data_frame(path, default_columns=True)

     header = ['qseqid', 'sseqid', 'pident', 'length', 'mismatch',
               'gapopen', 'qstart', 'qend', 'sstart', 'send', 'evalue',
               'bitscore']
     records = [
         ['query1', 'subject2', 100.00, 8.0, 0.0, 0.0, 1.0, 8.0, 3.0, 10.0,
          9e-05, 16.9],
         ['query1', 'subject2', 75.00, 8.0, 2.0, 0.0, 1.0, 8.0, 2.0, 9.0,
          0.060, 11.5],
         ['query2', 'subject1', 71.43, 7.0, 2.0, 0.0, 1.0, 7.0, 1.0, 7.0,
          0.044, 11.9],
     ]
     expected = pd.DataFrame(records, columns=header)
     assert_data_frame_almost_equal(observed, expected)

コード例 #9

0

ファイルを表示

ファイル: test_blast6.py プロジェクト: ebolyen/scikit-bio

 def test_custom_valid_multi_line(self):
     # Three records read with a caller-specified column list.
     header = ['sacc', 'score', 'gapopen', 'qcovs', 'sblastnames',
               'sallacc', 'qaccver']
     path = get_data_path('blast6_custom_multi_line')
     observed = _blast6_to_data_frame(path, columns=list(header))

     records = [
         ['subject2', 32.0, 0.0, 100.0, np.nan, 'subject2', 'query1'],
         ['subject2', 18.0, 0.0, 100.0, np.nan, 'subject2', 'query1'],
         ['subject1', 19.0, 0.0, 70.0, np.nan, 'subject1', 'query2'],
     ]
     expected = pd.DataFrame(records, columns=header)
     # 'sblastnames' holds only np.nan in the expected rows; it is cast to
     # object here, presumably to match the dtype the reader produces for
     # that column (confirm against the reader).
     expected['sblastnames'] = expected['sblastnames'].astype(object)
     assert_data_frame_almost_equal(observed, expected)

コード例 #10

0

ファイルを表示

 def test_valid_nan_handling(self):
     # Two records whose expected values mix np.nan with strings and floats.
     fixture = get_data_path('blast6_custom_mixed_nans')
     parsed = _blast6_to_data_frame(
         fixture,
         columns=['qacc', 'qseq', 'btop', 'sframe', 'ppos', 'positive',
                  'gaps'])

     names = ['qacc', 'qseq', 'btop', 'sframe', 'ppos', 'positive', 'gaps']
     rows = [
         [np.nan, 'PAAWWWWW', 8.0, 1.0, 100.00, np.nan, 0.0],
         ['query1', np.nan, 8.0, 1.0, np.nan, 8.0, 0.0],
     ]
     wanted = pd.DataFrame(rows, columns=names)
     assert_data_frame_almost_equal(parsed, wanted)

コード例 #11

0

ファイルを表示

 def test_custom_valid_multi_line(self):
     # Multi-record fixture read with seven caller-specified columns.
     fixture = get_data_path('blast6_custom_multi_line')
     parsed = _blast6_to_data_frame(
         fixture,
         columns=['sacc', 'score', 'gapopen', 'qcovs', 'sblastnames',
                  'sallacc', 'qaccver'])

     names = ['sacc', 'score', 'gapopen', 'qcovs', 'sblastnames',
              'sallacc', 'qaccver']
     rows = [
         ['subject2', 32.0, 0.0, 100.0, np.nan, 'subject2', 'query1'],
         ['subject2', 18.0, 0.0, 100.0, np.nan, 'subject2', 'query1'],
         ['subject1', 19.0, 0.0, 70.0, np.nan, 'subject1', 'query2'],
     ]
     wanted = pd.DataFrame(rows, columns=names)
     # The all-NaN 'sblastnames' column is re-typed as object before the
     # comparison (presumably mirroring the reader's dtype -- verify).
     blast_names = wanted['sblastnames'].astype(object)
     wanted['sblastnames'] = blast_names
     assert_data_frame_almost_equal(parsed, wanted)

コード例 #12

0

ファイルを表示

 def test_default_valid_multi_line(self):
     # Default-column parse of the three-record fixture.
     fixture = get_data_path('blast6_default_multi_line')
     parsed = _blast6_to_data_frame(fixture, default_columns=True)

     names = [
         'qseqid', 'sseqid', 'pident', 'length', 'mismatch', 'gapopen',
         'qstart', 'qend', 'sstart', 'send', 'evalue', 'bitscore',
     ]
     row_a = ['query1', 'subject2', 100.00, 8.0, 0.0, 0.0, 1.0, 8.0, 3.0,
              10.0, 9e-05, 16.9]
     row_b = ['query1', 'subject2', 75.00, 8.0, 2.0, 0.0, 1.0, 8.0, 2.0,
              9.0, 0.060, 11.5]
     row_c = ['query2', 'subject1', 71.43, 7.0, 2.0, 0.0, 1.0, 7.0, 1.0,
              7.0, 0.044, 11.9]
     wanted = pd.DataFrame([row_a, row_b, row_c], columns=names)
     assert_data_frame_almost_equal(parsed, wanted)

コード例 #13

0

ファイルを表示

 def test_no_columns_passed_error(self):
     # Calling the reader with neither `columns` nor `default_columns` is
     # expected to raise a ValueError matching the message below.
     path = get_data_path('blast6_default_single_line')
     self.assertRaisesRegex(
         ValueError, "Either `columns` or `default_columns`",
         _blast6_to_data_frame, path)

コード例 #14

0

ファイルを表示

 def test_wrong_amount_of_columns_error(self):
     # Parsing the fixture with default_columns=True is expected to raise a
     # ValueError whose message mentions "(12)" and, later, "(10)".
     fp = get_data_path('blast6_invalid_number_of_columns')
     # Raw string: "\(" and "\)" are regex escapes, not Python string
     # escapes; without the r-prefix they trigger an invalid-escape warning.
     with self.assertRaisesRegex(
             ValueError, r"Specified number of columns \(12\).*\(10\)"):
         _blast6_to_data_frame(fp, default_columns=True)

コード例 #15

0

ファイルを表示

 def test_different_data_in_same_column(self):
     # The fixture must make a default-column parse fail with ValueError.
     path = get_data_path('blast6_invalid_type_in_column')
     self.assertRaises(ValueError, _blast6_to_data_frame, path,
                       default_columns=True)

コード例 #16

0

ファイルを表示

ファイル: test_blast6.py プロジェクト: ebolyen/scikit-bio

 def test_different_data_in_same_column(self):
     # A ValueError is required when this fixture is read with the default
     # column set.
     fixture = get_data_path('blast6_invalid_type_in_column')
     self.assertRaises(
         ValueError, _blast6_to_data_frame, fixture, default_columns=True)

コード例 #17

0

ファイルを表示

 def test_custom_and_default_passed_error(self):
     # Supplying both `columns` and `default_columns` is expected to be
     # rejected with a ValueError that mentions both parameter names.
     path = get_data_path('blast6_default_single_line')
     self.assertRaisesRegex(
         ValueError, "`columns` and `default_columns`",
         _blast6_to_data_frame, path,
         columns=['qseqid'], default_columns=True)

コード例 #18

0

ファイルを表示

ファイル: test_blast6.py プロジェクト: ebolyen/scikit-bio

 def test_custom_and_default_passed_error(self):
     # Both column-selection arguments are given at once; a ValueError
     # matching the pattern below is required.
     expected_message = "`columns` and `default_columns`"
     path = get_data_path('blast6_default_single_line')
     with assertRaisesRegex(self, ValueError, expected_message):
         _blast6_to_data_frame(path, columns=['qseqid'],
                               default_columns=True)

コード例 #19

0

ファイルを表示

ファイル: test_blast6.py プロジェクト: ebolyen/scikit-bio

 def test_valid_minimal(self):
     # Smallest case exercised here: one column ('sacc'), one row.
     observed = _blast6_to_data_frame(
         get_data_path('blast6_custom_minimal'), columns=['sacc'])
     expected = pd.DataFrame([['subject2']], columns=['sacc'])
     assert_data_frame_almost_equal(observed, expected)

コード例 #20

0

ファイルを表示

ファイル: test_blast6.py プロジェクト: ebolyen/scikit-bio

 def test_wrong_amount_of_columns_error(self):
     # Parsing the fixture with default_columns=True is expected to raise a
     # ValueError whose message mentions "(12)" and, later, "(10)".
     fp = get_data_path('blast6_invalid_number_of_columns')
     # Raw string: "\(" and "\)" are regex escapes, not Python string
     # escapes; without the r-prefix they trigger an invalid-escape warning.
     with assertRaisesRegex(self, ValueError,
                            r"Specified number of columns \(12\).*\(10\)"):
         _blast6_to_data_frame(fp, default_columns=True)

コード例 #21

0

ファイルを表示

ファイル: test_blast6.py プロジェクト: ebolyen/scikit-bio

 def test_no_columns_passed_error(self):
     # No column selection is given at all; the reader is expected to raise
     # a ValueError matching the pattern below.
     expected_message = "Either `columns` or `default_columns`"
     path = get_data_path('blast6_default_single_line')
     with assertRaisesRegex(self, ValueError, expected_message):
         _blast6_to_data_frame(path)

コード例 #22

0

ファイルを表示

 def test_valid_minimal(self):
     # Single 'sacc' column, single record.
     only_column = ['sacc']
     fixture = get_data_path('blast6_custom_minimal')
     parsed = _blast6_to_data_frame(fixture, columns=list(only_column))
     wanted = pd.DataFrame([['subject2']], columns=only_column)
     assert_data_frame_almost_equal(parsed, wanted)