Esempi in Python per process_df

Linguaggio di programmazione: Python

Spazio dei nomi/nome del pacchetto: datapane.common.df_processor

Metodo/funzione: process_df

Esempi su hotexamples.com: 7

process_df in Python: 7 esempi trovati. Questi sono i migliori esempi reali in Python di datapane.common.df_processor.process_df, estratti da progetti open source. Puoi valutarli per aiutarci a migliorare la qualità dei nostri esempi.

Esempio n. 1

Mostra file

File: dp_object.py Progetto: zhiliangpersonal/datapane

 def _save_df(cls, df: pd.DataFrame) -> DPTmpFile:
     """Save ``df`` into a fresh ``DPTmpFile`` through ``ArrowFormat`` and return that file.

     The input is first passed through ``to_df`` and then ``process_df``;
     the size of the written file is reported at debug level.
     """
     fn = DPTmpFile(ArrowFormat.ext)
     frame = to_df(df)
     # The return value is not used here; presumably process_df mutates its
     # argument in place -- TODO confirm against its definition.
     process_df(frame)
     ArrowFormat.save_file(fn.name, frame)
     message = f"Saved df to {fn} ({os.path.getsize(fn.file)} bytes)"
     log.debug(message)
     return fn

Esempio n. 2

Mostra file

def check_df_equal(left: pd.DataFrame, right: pd.DataFrame, **kwargs):
    """
    Assert that two DataFrames are equal after each has gone through process_df.

    The comparison is delegated to pd.testing.assert_frame_equal with
    check_like=True, so the ordering of index and columns is ignored; any extra
    keyword arguments are forwarded to it unchanged.
    NOTE - both inputs are handed to process_df without copy=True, so they are mutated
    """
    processed_left, processed_right = process_df(left), process_df(right)
    pd.testing.assert_frame_equal(
        processed_left,
        processed_right,
        check_like=True,
        **kwargs,
    )

Esempio n. 3

Mostra file

    def convert_csv_pd_(string: str) -> pd.DataFrame:
        """Parse an (optionally indented) comma-separated string into a DataFrame.

        The ``timedelta_col1`` column is converted with ``pd.to_timedelta`` and
        the frame is then passed to ``process_df`` before being returned.
        """
        import textwrap
        from io import StringIO

        from datapane.common.df_processor import process_df

        csv_text = textwrap.dedent(string).strip()
        frame = pd.read_csv(StringIO(csv_text), engine="c", sep=",")
        frame["timedelta_col1"] = pd.to_timedelta(frame["timedelta_col1"])
        # Result is discarded; presumably process_df works in place -- TODO confirm.
        process_df(frame)
        return frame

Esempio n. 4

Mostra file

    def _test_order(df: pd.DataFrame):
        """Assert that column order is unchanged by process_df and by an Arrow save/load."""
        # column order after processing a copy of the frame
        processed = process_df(df, copy=True)
        assert list(df.columns) == list(processed.columns)

        # column order after writing the frame out and reading it back
        reloaded = save_load_arrow(tmp_path, df)
        assert list(df.columns) == list(reloaded.columns)

Esempio n. 5

Mostra file

    def _test_df(df: pd.DataFrame, expected_types: List[str]):
        """Check null positions, Arrow round-tripping and resulting dtypes for ``df``.

        ``expected_types`` lists the dtype names (as produced by ``str``) that
        the reloaded frame must have, in column order.
        """
        converted = df.convert_dtypes()
        processed = process_df(df, copy=True)

        # nulls must sit in the same cells in the input and in each derived frame
        for derived in (converted, processed):
            pd.testing.assert_frame_equal(pd.isnull(df), pd.isnull(derived))

        # the processed frame must come back unchanged from a save/load cycle
        reloaded = save_load_arrow(tmp_path, processed)
        pd.testing.assert_frame_equal(processed, reloaded)

        actual_types = list(map(str, reloaded.dtypes))
        assert actual_types == expected_types

Esempio n. 6

Mostra file

def convert_csv_pd(string: str, process: bool = False) -> pd.DataFrame:
    """Helper function to convert a well-formatted csv into a DataFrame.

    The text is dedented and stripped, then parsed with pandas' C engine using
    a comma separator. If that raises ``ParserError``, the parse is retried
    from the start of the text with the python engine and ``sep=None``.

    Args:
        string: CSV content, possibly indented (e.g. a triple-quoted literal).
        process: When true, pass the parsed frame through ``process_df``.

    Returns:
        The parsed (and, if requested, processed) DataFrame.
    """
    buf: TextIO = StringIO(textwrap.dedent(string).strip())

    try:
        df = pd.read_csv(buf, engine="c", sep=",")
    except ParserError as e:
        log.warning(f"Error parsing CSV file ({e}), trying python fallback")
        # The failed attempt has already read from the buffer; rewind so the
        # fallback parser sees the whole document instead of the leftover tail.
        buf.seek(0)
        df = pd.read_csv(buf, engine="python", sep=None)

    if process:
        df = process_df(df)
    return df

Esempio n. 7

Mostra file

def test_parse_categories_roundtrip(tmp_path: Path):
    """Compare a processed frame with the same frame after an Arrow save/load.

    The input has two string columns of 10000 rows: ``str1`` with all-distinct
    values and ``str2`` with only 25 distinct values.
    """
    row_count = 10000
    source = pd.DataFrame(
        {
            "str1": list(map(str, range(row_count))),
            "str2": [str(i % 25) for i in range(row_count)],
        }
    )

    # one copy goes through process_df, the original goes through the Arrow round trip
    processed = process_df(source, copy=True)
    reloaded = save_load_arrow(tmp_path, source)

    # presumably verifies that only "str2" ended up categorical -- TODO confirm
    _check_categories_parsed(reloaded, ["str2"])
    pd.testing.assert_frame_equal(processed, reloaded)