Python _taxonomy_formats_to_dataframe Examples, q2_types.feature_data._transformer._taxonomy_formats_to_dataframe Python Examples

Example #1

0

Show file

File: test_transformer.py Project: gregcaporaso/q2-types

    def test_3_columns(self):
        # '3-column.tsv' should yield 'Taxon' and 'Confidence' columns indexed
        # by 'Feature ID', both with the default has_header and with
        # has_header=True.
        relpath = os.path.join('taxonomy', '3-column.tsv')
        feature_ids = pd.Index(['seq1', 'seq2'], name='Feature ID',
                               dtype=object)
        expected = pd.DataFrame(
            [['k__Foo; p__Bar', '-1.0'],
             ['k__Foo; p__Baz', '-42.0']],
            index=feature_ids,
            columns=['Taxon', 'Confidence'],
            dtype=object)

        # has_header=None (default)
        default_result = _taxonomy_formats_to_dataframe(
            self.get_data_path(relpath))
        assert_frame_equal(default_result, expected)

        # has_header=True
        header_result = _taxonomy_formats_to_dataframe(
            self.get_data_path(relpath), has_header=True)
        assert_frame_equal(header_result, expected)

Example #2

0

Show file

File: test_transformer.py Project: nbokulich/q2-types

    def test_2_columns(self):
        # '2-column.tsv' should produce a single 'Taxon' column indexed by
        # 'Feature ID', with the default has_header and with has_header=True.
        taxa_rows = [['k__Bacteria; p__Proteobacteria'],
                     ['k__Bacteria']]
        expected = pd.DataFrame(
            taxa_rows,
            index=pd.Index(['seq1', 'seq2'], name='Feature ID', dtype=object),
            columns=['Taxon'],
            dtype=object)
        relpath = os.path.join('taxonomy', '2-column.tsv')

        def load(**options):
            # Resolve the fixture path on every call, once per case.
            return _taxonomy_formats_to_dataframe(
                self.get_data_path(relpath), **options)

        # has_header=None (default)
        assert_frame_equal(load(), expected)

        # has_header=True
        assert_frame_equal(load(has_header=True), expected)

Example #3

0

Show file

File: test_transformer.py Project: nbokulich/q2-types

    def test_3_columns(self):
        # The same expected frame ('Taxon' + 'Confidence', indexed by
        # 'Feature ID') must come back from '3-column.tsv' for both the
        # default has_header and has_header=True.
        expected_rows = [['k__Foo; p__Bar', '-1.0'],
                         ['k__Foo; p__Baz', '-42.0']]
        expected = pd.DataFrame(
            expected_rows,
            index=pd.Index(['seq1', 'seq2'], name='Feature ID', dtype=object),
            columns=['Taxon', 'Confidence'],
            dtype=object)
        relpath = os.path.join('taxonomy', '3-column.tsv')

        def load(**options):
            # Resolve the fixture path on every call, once per case.
            return _taxonomy_formats_to_dataframe(
                self.get_data_path(relpath), **options)

        # has_header=None (default)
        assert_frame_equal(load(), expected)

        # has_header=True
        assert_frame_equal(load(has_header=True), expected)

Example #4

0

Show file

File: test_transformer.py Project: gregcaporaso/q2-types

    def test_2_columns(self):
        # Loading '2-column.tsv' should give one 'Taxon' column indexed by
        # 'Feature ID', regardless of whether has_header is left at its
        # default or set to True.
        relpath = os.path.join('taxonomy', '2-column.tsv')
        feature_ids = pd.Index(['seq1', 'seq2'], name='Feature ID',
                               dtype=object)
        expected = pd.DataFrame(
            [['k__Bacteria; p__Proteobacteria'],
             ['k__Bacteria']],
            index=feature_ids,
            columns=['Taxon'],
            dtype=object)

        # has_header=None (default)
        default_result = _taxonomy_formats_to_dataframe(
            self.get_data_path(relpath))
        assert_frame_equal(default_result, expected)

        # has_header=True
        header_result = _taxonomy_formats_to_dataframe(
            self.get_data_path(relpath), has_header=True)
        assert_frame_equal(header_result, expected)

Example #5

0

Show file

File: test_transformer.py Project: gregcaporaso/q2-types

    def test_headerless(self):
        # 'headerless.tsv' should load with 'Taxon' plus two
        # 'Unnamed Column N' columns, both with the default has_header and
        # with has_header=False.
        relpath = os.path.join('taxonomy', 'headerless.tsv')
        expected = pd.DataFrame(
            [['k__Foo; p__Bar', 'some', 'another'],
             ['k__Foo; p__Baz', 'column', 'column!']],
            index=pd.Index(['seq1', 'seq2'], name='Feature ID', dtype=object),
            columns=['Taxon', 'Unnamed Column 1', 'Unnamed Column 2'],
            dtype=object)

        # has_header=None (default)
        default_result = _taxonomy_formats_to_dataframe(
            self.get_data_path(relpath))
        assert_frame_equal(default_result, expected)

        # has_header=False
        headerless_result = _taxonomy_formats_to_dataframe(
            self.get_data_path(relpath), has_header=False)
        assert_frame_equal(headerless_result, expected)

Example #6

0

Show file

    def test_headerless(self):
        # Expect 'Taxon', 'Unnamed Column 1' and 'Unnamed Column 2' from
        # 'headerless.tsv', for the default has_header and has_header=False.
        column_names = ['Taxon', 'Unnamed Column 1', 'Unnamed Column 2']
        feature_ids = pd.Index(['seq1', 'seq2'], name='Feature ID',
                               dtype=object)
        expected = pd.DataFrame(
            [['k__Foo; p__Bar', 'some', 'another'],
             ['k__Foo; p__Baz', 'column', 'column!']],
            index=feature_ids, columns=column_names, dtype=object)
        relpath = os.path.join('taxonomy', 'headerless.tsv')

        def load(**options):
            # Resolve the fixture path on every call, once per case.
            return _taxonomy_formats_to_dataframe(
                self.get_data_path(relpath), **options)

        # has_header=None (default)
        assert_frame_equal(load(), expected)

        # has_header=False
        assert_frame_equal(load(has_header=False), expected)

Example #7

0

Show file

File: test_transformer.py Project: gregcaporaso/q2-types

    def test_valid_but_messy_file(self):
        # 'valid-but-messy.tsv' should still load into a 'Taxon' /
        # 'Extra Column' frame indexed by 'Feature ID', with the default
        # has_header and with has_header=True.
        relpath = os.path.join('taxonomy', 'valid-but-messy.tsv')
        feature_ids = pd.Index(['SEQUENCE1', 'seq2'], name='Feature ID',
                               dtype=object)
        expected = pd.DataFrame(
            [['k__Bar; p__Baz', 'foo'],
             ['some; taxonomy; for; ya', 'bar baz']],
            index=feature_ids,
            columns=['Taxon', 'Extra Column'],
            dtype=object)

        # has_header=None (default)
        default_result = _taxonomy_formats_to_dataframe(
            self.get_data_path(relpath))
        assert_frame_equal(default_result, expected)

        # has_header=True
        header_result = _taxonomy_formats_to_dataframe(
            self.get_data_path(relpath), has_header=True)
        assert_frame_equal(header_result, expected)

Example #8

0

Show file

File: test_transformer.py Project: nbokulich/q2-types

    def test_valid_but_messy_file(self):
        # The expected frame ('Taxon' + 'Extra Column', indexed by
        # 'Feature ID') must come back from 'valid-but-messy.tsv' for both
        # the default has_header and has_header=True.
        expected_rows = [['k__Bar; p__Baz', 'foo'],
                         ['some; taxonomy; for; ya', 'bar baz']]
        expected = pd.DataFrame(
            expected_rows,
            index=pd.Index(['SEQUENCE1', 'seq2'], name='Feature ID',
                           dtype=object),
            columns=['Taxon', 'Extra Column'],
            dtype=object)
        relpath = os.path.join('taxonomy', 'valid-but-messy.tsv')

        def load(**options):
            # Resolve the fixture path on every call, once per case.
            return _taxonomy_formats_to_dataframe(
                self.get_data_path(relpath), **options)

        # has_header=None (default)
        assert_frame_equal(load(), expected)

        # has_header=True
        assert_frame_equal(load(has_header=True), expected)

Example #9

0

Show file

 def test_duplicate_columns(self):
     # Loading 'duplicate-columns.tsv' must raise a ValueError whose message
     # matches 'duplicated: Column1'.
     relpath = os.path.join('taxonomy', 'duplicate-columns.tsv')
     with self.assertRaisesRegex(ValueError, 'duplicated: Column1'):
         fixture = self.get_data_path(relpath)
         _taxonomy_formats_to_dataframe(fixture)

Example #10

0

Show file

 def test_has_header_with_headerless(self):
     # Forcing has_header=True on 'headerless.tsv' must raise a ValueError
     # whose message matches 'requires a header'.
     relpath = os.path.join('taxonomy', 'headerless.tsv')
     with self.assertRaisesRegex(ValueError, 'requires a header'):
         fixture = self.get_data_path(relpath)
         _taxonomy_formats_to_dataframe(fixture, has_header=True)

Example #11

0

Show file

 def test_jagged(self):
     # Loading 'jagged.tsv' is expected to raise pandas' ParserError.
     relpath = os.path.join('taxonomy', 'jagged.tsv')
     expected_error = pandas.errors.ParserError
     with self.assertRaises(expected_error):
         fixture = self.get_data_path(relpath)
         _taxonomy_formats_to_dataframe(fixture)

Example #12

0

Show file

 def test_empty(self):
     # Loading the 'empty' fixture is expected to raise pandas'
     # EmptyDataError.
     relpath = os.path.join('taxonomy', 'empty')
     expected_error = pandas.errors.EmptyDataError
     with self.assertRaises(expected_error):
         fixture = self.get_data_path(relpath)
         _taxonomy_formats_to_dataframe(fixture)

Example #13

0

Show file

 def test_header_only(self):
     # Loading 'header-only.tsv' must raise a ValueError whose message
     # matches 'one row of data'.
     relpath = os.path.join('taxonomy', 'header-only.tsv')
     with self.assertRaisesRegex(ValueError, 'one row of data'):
         fixture = self.get_data_path(relpath)
         _taxonomy_formats_to_dataframe(fixture)

Example #14

0

Show file

 def test_blanks_and_comments(self):
     # Loading the 'blanks-and-comments' fixture (presumably only blank and
     # comment lines -- confirm against the data file) must raise pandas'
     # EmptyDataError.
     #
     # The exception is referenced through pandas.errors, its documented
     # public home. The pandas.io.common alias is an internal re-export that
     # is not guaranteed to exist across pandas versions.
     with self.assertRaises(pandas.errors.EmptyDataError):
         _taxonomy_formats_to_dataframe(
             self.get_data_path(
                 os.path.join('taxonomy', 'blanks-and-comments')))

Example #15

0

Show file

 def test_one_column(self):
     # Loading '1-column.tsv' must raise a ValueError whose message matches
     # "two columns, found 1".
     relpath = os.path.join('taxonomy', '1-column.tsv')
     with self.assertRaisesRegex(ValueError, "two columns, found 1"):
         fixture = self.get_data_path(relpath)
         _taxonomy_formats_to_dataframe(fixture)

Example #16

0

Show file

File: test_transformer.py Project: gregcaporaso/q2-types

 def test_one_column(self):
     # A ValueError matching "two columns, found 1" is expected when
     # '1-column.tsv' is loaded.
     path_parts = ('taxonomy', '1-column.tsv')
     with self.assertRaisesRegex(ValueError, "two columns, found 1"):
         fixture = self.get_data_path(os.path.join(*path_parts))
         _taxonomy_formats_to_dataframe(fixture)

Example #17

0

Show file

File: test_transformer.py Project: gregcaporaso/q2-types

 def test_blanks_and_comments(self):
     # Loading the 'blanks-and-comments' fixture (presumably only blank and
     # comment lines -- confirm against the data file) must raise pandas'
     # EmptyDataError.
     #
     # The exception is referenced through pandas.errors, its documented
     # public home. The pandas.io.common alias is an internal re-export that
     # is not guaranteed to exist across pandas versions.
     with self.assertRaises(pandas.errors.EmptyDataError):
         _taxonomy_formats_to_dataframe(
             self.get_data_path(os.path.join('taxonomy',
                                             'blanks-and-comments')))

Example #18

0

Show file

File: test_transformer.py Project: gregcaporaso/q2-types

 def test_empty(self):
     # Loading the 'empty' fixture must raise pandas' EmptyDataError.
     #
     # The exception is referenced through pandas.errors, its documented
     # public home. The pandas.io.common alias is an internal re-export that
     # is not guaranteed to exist across pandas versions.
     with self.assertRaises(pandas.errors.EmptyDataError):
         _taxonomy_formats_to_dataframe(
             self.get_data_path(os.path.join('taxonomy', 'empty')))

Example #19

0

Show file

File: test_transformer.py Project: gregcaporaso/q2-types

 def test_header_only(self):
     # A ValueError matching 'one row of data' is expected when
     # 'header-only.tsv' is loaded.
     path_parts = ('taxonomy', 'header-only.tsv')
     with self.assertRaisesRegex(ValueError, 'one row of data'):
         fixture = self.get_data_path(os.path.join(*path_parts))
         _taxonomy_formats_to_dataframe(fixture)

Example #20

0

Show file

File: test_transformer.py Project: gregcaporaso/q2-types

 def test_duplicate_columns(self):
     # A ValueError matching 'duplicated: Column1' is expected when
     # 'duplicate-columns.tsv' is loaded.
     path_parts = ('taxonomy', 'duplicate-columns.tsv')
     with self.assertRaisesRegex(ValueError, 'duplicated: Column1'):
         fixture = self.get_data_path(os.path.join(*path_parts))
         _taxonomy_formats_to_dataframe(fixture)

Example #21

0

Show file

File: test_transformer.py Project: gregcaporaso/q2-types

 def test_jagged(self):
     # Loading 'jagged.tsv' must raise pandas' parser error.
     #
     # CParserError is the deprecated former name of ParserError, and
     # pandas.io.common is not its public home. Use the documented
     # pandas.errors.ParserError so the test keeps working on current
     # pandas releases.
     with self.assertRaises(pandas.errors.ParserError):
         _taxonomy_formats_to_dataframe(
             self.get_data_path(os.path.join('taxonomy', 'jagged.tsv')))

Example #22

0

Show file

File: test_transformer.py Project: gregcaporaso/q2-types

 def test_has_header_with_headerless(self):
     # A ValueError matching 'requires a header' is expected when
     # 'headerless.tsv' is loaded with has_header=True.
     path_parts = ('taxonomy', 'headerless.tsv')
     with self.assertRaisesRegex(ValueError, 'requires a header'):
         fixture = self.get_data_path(os.path.join(*path_parts))
         _taxonomy_formats_to_dataframe(fixture, has_header=True)