Python DataFrameGraph Beispiele, gauss.domains.rlang.graphs.DataFrameGraph Python Beispiele

Beispiel #1

0

Datei anzeigen

Datei: definition.py Projekt: yadavpa1/gauss-rise-camp

def _generate_example(
    component_name: str
) -> Tuple[List[pd.DataFrame], pd.DataFrame, str, Graph]:
    """Generate one (inputs, output, program, graph) example for a component.

    Fresh inputs are drawn and the component's generator is run repeatedly
    until an attempt yields a non-empty output frame without raising.

    Args:
        component_name: Key into ``datagen_dict`` and ``generator_dict``.

    Returns:
        A tuple ``(inputs, output, program, graph)`` taken from the first
        successful attempt; ``program`` has had its ``inp<i>`` placeholders
        filled in.

    Raises:
        KeyError: If ``component_name`` is missing from ``datagen_dict`` or
            ``generator_dict``.
    """
    import logging

    #  Resolve the per-component callables once, outside the retry loop.
    #  Doing the lookup inside the loop meant an unknown name raised a
    #  KeyError that was swallowed on every iteration, spinning forever.
    make_inputs = datagen_dict[component_name]
    gen = generator_dict[component_name]
    logger = logging.getLogger(__name__)

    while True:
        try:
            inputs, replay_map = make_inputs()
            #  Abstractions for the individual inputs.
            g_inputs = [DataFrameGraph(i) for i in inputs]
            strategy = RandomizedGraphStrategy()
            output, program, graph, _output_graph = gen.with_env(
                strategy=strategy, replay=replay_map).call(*inputs,
                                                           *g_inputs,
                                                           datagen=True)
            if 0 in output.shape:
                #  Empty dataframe: discard this attempt and retry.
                continue

            #  Populate the placeholders
            program = program.format(
                **{f"inp{i}": f"inp{i}"
                   for i in range(1,
                                  len(inputs) + 1)})
            return inputs, output, program, graph

        except Exception:
            #  Deliberate best-effort: any failure in a single attempt is
            #  discarded and a new attempt is made. Record it at debug level
            #  so a persistently failing component can be diagnosed.
            logger.debug("Example generation attempt failed for %r; retrying",
                         component_name, exc_info=True)

Beispiel #2

0

Datei anzeigen

Datei: test_rlang_domain.py Projekt: yadavpa1/gauss-rise-camp

    def test_df_graph(self):
        """Check that a DataFrameGraph carries the same values as its source frame."""
        from gauss.domains.rlang.graphs import DataFrameGraph
        frame = pd.DataFrame([['a', 'b', 'e'], ['c', 'd', 'f']], columns=['C1', 'C2', 'C3'])
        frame_graph = DataFrameGraph(frame)

        #  Column labels must match the values of the column nodes.
        expected_columns = list(frame.columns)
        column_values = [node.value for node in frame_graph.columns]
        self.assertListEqual(expected_columns, column_values)

        #  Index labels must match the values of the index nodes.
        expected_index = list(frame.index)
        index_values = [node.value for node in frame_graph.index]
        self.assertListEqual(expected_index, index_values)

        #  Every row of cell nodes must match the corresponding row of the frame.
        for expected_row, node_row in zip(frame.values, frame_graph.values):
            cell_values = [node.value for node in node_row]
            self.assertListEqual(list(expected_row), cell_values)

Beispiel #3

0

Datei anzeigen

Datei: test_rlang_domain.py Projekt: yadavpa1/gauss-rise-camp

    def test_gather(self):
        """Run gen_gather on a small frame and check the result and its call string."""
        from gauss.domains.rlang.generators import gen_gather, DataFrameGraph, RInterpreter
        #  `gather` and `df` stay bound under these exact names: the eval
        #  below resolves names in this scope (presumably the generated
        #  call string refers to `gather` -- confirm against the generator).
        gather = RInterpreter.gather
        df = pd.DataFrame([['a', 'b', 'e'], ['c', 'd', 'f']], columns=['C1', 'C2', 'C3'])
        produced, program_template, _graph, _res_graph = gen_gather.call(df, DataFrameGraph(df))

        #  The produced frame must differ from the input frame.
        with self.assertRaises(AssertionError):
            pd.testing.assert_frame_equal(df, produced)

        #  Evaluating the call string on the input must reproduce the result.
        expression = program_template.format(inp1='df')
        replayed = eval(expression)
        pd.testing.assert_frame_equal(produced, replayed)

Beispiel #4

0

Datei anzeigen

Datei: test_rlang_domain.py Projekt: yadavpa1/gauss-rise-camp

    def test_groupby(self):
        """Run gen_group_by_summarise on a small frame and check the result and its call string."""
        from gauss.domains.rlang.generators import gen_group_by_summarise, DataFrameGraph, RInterpreter
        #  `group_by`, `summarise` and `df` stay bound under these exact
        #  names: the eval below resolves names in this scope (presumably the
        #  generated call string refers to them -- confirm against the generator).
        group_by = RInterpreter.group_by
        summarise = RInterpreter.summarise

        df = pd.DataFrame([['A', 100], ['A', 200], ['B', 300]], columns=['C1', 'C2'])
        g_df = DataFrameGraph(df)
        strict_gen = gen_group_by_summarise.with_env(ignore_exceptions=False)
        produced, program_template, _graph, _res_graph = strict_gen.call(df, g_df)

        #  The produced frame must differ from the input frame.
        with self.assertRaises(AssertionError):
            pd.testing.assert_frame_equal(df, produced)

        #  Evaluating the call string on the input must reproduce the result.
        expression = program_template.format(inp1='df')
        replayed = eval(expression)
        pd.testing.assert_frame_equal(produced, replayed)

Beispiel #5

0

Datei anzeigen

Datei: test_rlang_domain.py Projekt: yadavpa1/gauss-rise-camp

    def test_inner_join(self):
        """Run gen_inner_join on two small frames and check the result and its call string."""
        from gauss.domains.rlang.generators import gen_inner_join, DataFrameGraph, RInterpreter
        #  `inner_join`, `df1` and `df2` stay bound under these exact names:
        #  the eval below resolves names in this scope (presumably the
        #  generated call string refers to them -- confirm against the generator).
        inner_join = RInterpreter.inner_join

        df1 = pd.DataFrame([['a', 'b', 'c'], ['d', 'g', 'c'], ['f', 'b', 'h']], columns=['c1', 'c2', 'c3'])
        df2 = pd.DataFrame([['x', 'g', 'z'], ['w', 'b', 'u'], ['y', 'g', 'j']], columns=['c4', 'c2', 'c5'])

        produced, program_template, _graph, _res_graph = gen_inner_join.call(
            df1, df2, DataFrameGraph(df1), DataFrameGraph(df2))

        #  The produced frame must differ from each of the two inputs.
        with self.assertRaises(AssertionError):
            pd.testing.assert_frame_equal(df1, produced)
        with self.assertRaises(AssertionError):
            pd.testing.assert_frame_equal(df2, produced)

        #  Evaluating the call string on the inputs must reproduce the result.
        expression = program_template.format(inp1='df1', inp2='df2')
        replayed = eval(expression)
        pd.testing.assert_frame_equal(produced, replayed)

Beispiel #6

0

Datei anzeigen