Python normalise Examples, morar.normalise.normalise Python Examples

Example #1

0

Show file

def test_normalise_errors_invalid_method():
    """An unrecognised ``method`` argument must raise ``ValueError``."""
    # three random feature columns, 50 values each
    features = [np.random.randn(50).tolist() for _ in range(3)]
    # five plates, ten consecutive rows per plate
    plate_names = ("plate1", "plate2", "plate3", "plate4", "plate5")
    plate = [name for name in plate_names for _ in range(10)]
    # every plate holds eight "drug" rows followed by two "DMSO" rows
    per_plate = ["drug"] * 8 + ["DMSO"] * 2
    compound = per_plate * 5
    rows = list(zip(*features, plate, compound))
    df = pd.DataFrame(
        rows, columns=["A", "B", "C", "Metadata_plate", "Metadata_compound"])
    with pytest.raises(ValueError):
        normalise.normalise(df, plate_id="Metadata_plate", method="invalid")

Example #2

0

Show file

def test_check_control_within_function():
    """A plate without any "DMSO" rows must make normalise raise RuntimeError."""
    features = [np.random.randn(50).tolist() for _ in range(3)]
    plate_names = ("plate1", "plate2", "plate3", "plate4", "plate5")
    plate = [name for name in plate_names for _ in range(10)]
    # first plate: ten "drug" rows and no "DMSO" rows at all
    compound = ["drug"] * 10
    # remaining four plates: eight "drug" rows then two "DMSO" rows
    for _ in range(4):
        compound.extend(["drug"] * 8)
        compound.extend(["DMSO"] * 2)
    rows = list(zip(*features, plate, compound))
    missing_control_df = pd.DataFrame(
        rows, columns=["A", "B", "C", "Metadata_plate", "Metadata_compound"])
    with pytest.raises(RuntimeError):
        normalise.normalise(missing_control_df, plate_id="Metadata_plate")

Example #3

0

Show file

def test_parallel_normalise():
    """Normalising with ``parallel=True`` must equal the default output."""
    features = [np.random.randn(50).tolist() for _ in range(3)]
    plate_names = ("plate1", "plate2", "plate3", "plate4", "plate5")
    plate = [name for name in plate_names for _ in range(10)]
    compound = [label
                for _ in range(5)
                for label in ["drug"] * 8 + ["DMSO"] * 2]
    rows = list(zip(*features, plate, compound))
    df = pd.DataFrame(
        rows, columns=["A", "B", "C", "Metadata_plate", "Metadata_compound"])
    # run the same input through both code paths
    standard_output = normalise.normalise(df, plate_id="Metadata_plate")
    parallel_kwargs = {"plate_id": "Metadata_plate", "parallel": True}
    parallel_output = normalise.normalise(df, **parallel_kwargs)
    assert standard_output.equals(parallel_output)

Example #4

0

Show file

File: dataframe.py Project: Swarchal/morar

 def normalise(self, **kwargs):
     """Normalise this frame via ``morar.normalise.normalise``.

     ``self.metadata_string`` and ``self.prefix`` are forwarded together
     with any extra keyword arguments, and the result is wrapped in a new
     ``DataFrame``.
     """
     # ``**kwargs`` has to be its own argument: without the separating comma
     # the expression parses as ``self.prefix ** kwargs`` (exponentiation).
     df = normalise.normalise(self,
                              metadata_string=self.metadata_string,
                              prefix=self.prefix,
                              **kwargs)
     # NOTE(review): the call above reads ``self.prefix`` while the wrapper
     # below reads ``self.metadata_prefix`` -- confirm both attributes exist.
     return DataFrame(df, metadata_string=self.metadata_string,
                      prefix=self.metadata_prefix)

Example #5

0

Show file

File: test_normalise.py Project: Swarchal/morar

def test_normalise_errors_invalid_method():
    """Passing ``method="invalid"`` to normalise must raise ``ValueError``."""
    # random feature values; the RNG is consumed in x, y, z order
    x, y, z = (np.random.randn(50).tolist() for _ in range(3))
    plate = []
    for name in ("plate1", "plate2", "plate3", "plate4", "plate5"):
        plate.extend([name] * 10)
    # eight "drug" rows then two "DMSO" rows, repeated for each of 5 plates
    compound = []
    for _ in range(5):
        compound += ["drug"] * 8 + ["DMSO"] * 2
    records = list(zip(x, y, z, plate, compound))
    header = ["A", "B", "C", "Metadata_plate", "Metadata_compound"]
    df = pd.DataFrame(records, columns=header)
    with pytest.raises(ValueError):
        normalise.normalise(df, plate_id="Metadata_plate", method="invalid")

Example #6

0

Show file

File: test_normalise.py Project: Swarchal/morar

def test_parallel_normalise():
    """The parallel code path must return the same frame as the default one."""
    x, y, z = (np.random.randn(50).tolist() for _ in range(3))
    plate = []
    for name in ("plate1", "plate2", "plate3", "plate4", "plate5"):
        plate.extend([name] * 10)
    one_plate = ["drug"] * 8 + ["DMSO"] * 2
    compound = one_plate * 5
    records = list(zip(x, y, z, plate, compound))
    header = ["A", "B", "C", "Metadata_plate", "Metadata_compound"]
    df = pd.DataFrame(records, columns=header)
    # default call first, then the same call with parallel=True
    standard_output = normalise.normalise(df, plate_id="Metadata_plate")
    parallel_output = normalise.normalise(
        df,
        plate_id="Metadata_plate",
        parallel=True,
    )
    assert standard_output.equals(parallel_output)

Example #7

0

Show file

File: dataframe.py Project: jwildenhain/morar

 def normalise(self, **kwargs):
     """Normalise this frame via ``morar.normalise.normalise``.

     ``self.metadata_string`` and ``self.prefix`` are forwarded together
     with any extra keyword arguments, and the result is wrapped in a new
     ``DataFrame``.
     """
     # ``**kwargs`` has to be its own argument: without the separating comma
     # the expression parses as ``self.prefix**kwargs`` (exponentiation).
     df = normalise.normalise(self,
                              metadata_string=self.metadata_string,
                              prefix=self.prefix,
                              **kwargs)
     # NOTE(review): the call above reads ``self.prefix`` while the wrapper
     # below reads ``self.metadata_prefix`` -- confirm both attributes exist.
     return DataFrame(df,
                      metadata_string=self.metadata_string,
                      prefix=self.metadata_prefix)

Example #8

0

Show file

File: test_normalise.py Project: Swarchal/morar

def test_normalise_subtract_returns_correct_values():
    """``method="subtract"`` on a tiny one-plate frame yields known values."""
    # three "drug" rows with f1 == 4 and two "DMSO" rows with f1 == 2
    values = [4] * 3 + [2] * 2
    labels = ["drug", "drug", "drug", "DMSO", "DMSO"]
    plates = ["plate_1" for _ in range(5)]
    rows = list(zip(values, labels, plates))
    simple_df = pd.DataFrame(
        rows, columns=["f1", "Metadata_compound", "Metadata_plate"]
    )
    out = normalise.normalise(
        simple_df,
        plate_id="Metadata_plate",
        method="subtract",
    )
    assert isinstance(out, pd.DataFrame)
    expected = [2, 2, 2, 0, 0]
    assert out["f1"].tolist() == expected

Example #9

0

Show file

File: test_normalise.py Project: Swarchal/morar

def test_check_control_within_function():
    """normalise must raise RuntimeError when one plate has no "DMSO" rows."""
    x, y, z = (np.random.randn(50).tolist() for _ in range(3))
    plate = []
    for name in ("plate1", "plate2", "plate3", "plate4", "plate5"):
        plate.extend([name] * 10)
    # the first plate is all "drug"; the other four each end in two "DMSO"
    without_control = ["drug"] * 10
    with_control = ["drug"] * 8 + ["DMSO"] * 2
    compound = without_control + with_control * 4
    records = list(zip(x, y, z, plate, compound))
    header = ["A", "B", "C", "Metadata_plate", "Metadata_compound"]
    missing_control_df = pd.DataFrame(records, columns=header)
    with pytest.raises(RuntimeError):
        normalise.normalise(missing_control_df, plate_id="Metadata_plate")

Example #10

0

Show file

def test_normalise_returns_dataframe_divide():
    """``method="divide"`` must hand back a pandas DataFrame."""
    # three random feature columns, 50 values each
    features = [np.random.randn(50).tolist() for _ in range(3)]
    plate_names = ("plate1", "plate2", "plate3", "plate4", "plate5")
    plate = [name for name in plate_names for _ in range(10)]
    per_plate = ["drug"] * 8 + ["DMSO"] * 2
    compound = per_plate * 5
    rows = list(zip(*features, plate, compound))
    df = pd.DataFrame(
        rows, columns=["A", "B", "C", "Metadata_plate", "Metadata_compound"])
    out = normalise.normalise(df,
                              plate_id="Metadata_plate",
                              method="divide")
    assert isinstance(out, pd.DataFrame)

Example #11

0

Show file

def test_normalise_divide_returns_correct_values():
    """``method="divide"`` on a tiny one-plate frame yields known values."""
    # three "drug" rows with f1 == 4 and two "DMSO" rows with f1 == 2
    values = [4] * 3 + [2] * 2
    labels = ["drug", "drug", "drug", "DMSO", "DMSO"]
    plates = ["plate_1" for _ in range(5)]
    rows = list(zip(values, labels, plates))
    simple_df = pd.DataFrame(
        rows, columns=["f1", "Metadata_compound", "Metadata_plate"])
    call_kwargs = {"plate_id": "Metadata_plate", "method": "divide"}
    out = normalise.normalise(simple_df, **call_kwargs)
    assert isinstance(out, pd.DataFrame)
    expected = [2, 2, 2, 1, 1]
    assert out["f1"].tolist() == expected

Example #12

0

Show file

def test_normalise_returns_correct_size():
    """The normalised frame must keep the input's row count."""
    features = [np.random.randn(50).tolist() for _ in range(3)]
    plate_names = ("plate1", "plate2", "plate3", "plate4", "plate5")
    plate = [name for name in plate_names for _ in range(10)]
    compound = [label
                for _ in range(5)
                for label in ["drug"] * 8 + ["DMSO"] * 2]
    rows = list(zip(*features, plate, compound))
    df = pd.DataFrame(
        rows, columns=["A", "B", "C", "Metadata_plate", "Metadata_compound"])
    out = normalise.normalise(df, plate_id="Metadata_plate")
    # compare the number of rows only
    n_rows_out = out.shape[0]
    n_rows_in = df.shape[0]
    assert n_rows_out == n_rows_in

Example #13

0

Show file

def test_normalise_non_default_cols():
    """normalise accepts custom compound / plate / metadata column names."""
    features = [np.random.randn(50).tolist() for _ in range(3)]
    plate_names = ("plate1", "plate2", "plate3", "plate4", "plate5")
    plate = [name for name in plate_names for _ in range(10)]
    per_plate = ["drug"] * 8 + ["DMSO"] * 2
    compound = per_plate * 5
    rows = list(zip(*features, plate, compound))
    # metadata columns use a "meta" prefix instead of "Metadata_"
    non_default_df = pd.DataFrame(
        rows, columns=["A", "B", "C", "meta_plate", "meta_cmpd"])
    call_kwargs = {
        "compound": "meta_cmpd",
        "plate_id": "meta_plate",
        "metadata_string": "meta",
    }
    out = normalise.normalise(non_default_df, **call_kwargs)
    assert isinstance(out, pd.DataFrame)

Example #14

0

Show file

File: test_normalise.py Project: Swarchal/morar

def test_normalise_returns_dataframe_divide():
    """Normalising with ``method="divide"`` must return a pandas DataFrame."""
    # random feature values; the RNG is consumed in x, y, z order
    x, y, z = (np.random.randn(50).tolist() for _ in range(3))
    plate = []
    for name in ("plate1", "plate2", "plate3", "plate4", "plate5"):
        plate.extend([name] * 10)
    compound = []
    for _ in range(5):
        compound += ["drug"] * 8 + ["DMSO"] * 2
    records = list(zip(x, y, z, plate, compound))
    header = ["A", "B", "C", "Metadata_plate", "Metadata_compound"]
    df = pd.DataFrame(records, columns=header)
    out = normalise.normalise(
        df,
        plate_id="Metadata_plate",
        method="divide",
    )
    assert isinstance(out, pd.DataFrame)

Example #15

0

Show file

File: test_normalise.py Project: Swarchal/morar

def test_normalise_returns_correct_size():
    """normalise must return as many rows as it was given."""
    x, y, z = (np.random.randn(50).tolist() for _ in range(3))
    plate = []
    for name in ("plate1", "plate2", "plate3", "plate4", "plate5"):
        plate.extend([name] * 10)
    one_plate = ["drug"] * 8 + ["DMSO"] * 2
    compound = one_plate * 5
    records = list(zip(x, y, z, plate, compound))
    header = ["A", "B", "C", "Metadata_plate", "Metadata_compound"]
    df = pd.DataFrame(records, columns=header)
    out = normalise.normalise(df, plate_id="Metadata_plate")
    # only the row count is compared
    rows_after, rows_before = out.shape[0], df.shape[0]
    assert rows_after == rows_before

Example #16

0

Show file

def test_normalise_extra_metadata_cols():
    """An additional metadata column must survive normalisation unchanged in
    shape and column order."""
    features = [np.random.randn(50).tolist() for _ in range(3)]
    plate_names = ("plate1", "plate2", "plate3", "plate4", "plate5")
    plate = [name for name in plate_names for _ in range(10)]
    per_plate = ["drug"] * 8 + ["DMSO"] * 2
    compound = per_plate * 5
    # extra metadata column alternating "A", "B" over all 50 rows
    extra_metadata = [label for _ in range(25) for label in ("A", "B")]
    rows = list(zip(*features, plate, compound, extra_metadata))
    df = pd.DataFrame(
        rows,
        columns=["A", "B", "C", "meta_plate", "meta_cmpd", "metadata_extra"])
    call_kwargs = {
        "metadata_string": "meta",
        "compound": "meta_cmpd",
        "plate_id": "meta_plate",
    }
    out = normalise.normalise(df, **call_kwargs)
    assert df.shape == out.shape
    assert df.columns.tolist() == out.columns.tolist()

Example #17

0

Show file

File: test_normalise.py Project: Swarchal/morar

def test_normalise_non_default_cols():
    """Custom column names passed as keywords still give a DataFrame back."""
    x, y, z = (np.random.randn(50).tolist() for _ in range(3))
    plate = []
    for name in ("plate1", "plate2", "plate3", "plate4", "plate5"):
        plate.extend([name] * 10)
    compound = []
    for _ in range(5):
        compound += ["drug"] * 8 + ["DMSO"] * 2
    records = list(zip(x, y, z, plate, compound))
    # metadata columns use a "meta" prefix instead of "Metadata_"
    header = ["A", "B", "C", "meta_plate", "meta_cmpd"]
    non_default_df = pd.DataFrame(records, columns=header)
    options = dict(
        compound="meta_cmpd",
        plate_id="meta_plate",
        metadata_string="meta",
    )
    out = normalise.normalise(non_default_df, **options)
    assert isinstance(out, pd.DataFrame)

Example #18

0

Show file

File: test_normalise.py Project: Swarchal/morar

def test_normalise_extra_metadata_cols():
    """With an extra metadata column present, the output must keep the
    input's shape and column order."""
    x, y, z = (np.random.randn(50).tolist() for _ in range(3))
    plate = []
    for name in ("plate1", "plate2", "plate3", "plate4", "plate5"):
        plate.extend([name] * 10)
    one_plate = ["drug"] * 8 + ["DMSO"] * 2
    compound = one_plate * 5
    # extra metadata column alternating "A", "B" over all 50 rows
    extra_metadata = ["A", "B"] * 25
    records = list(zip(x, y, z, plate, compound, extra_metadata))
    header = ["A", "B", "C", "meta_plate", "meta_cmpd", "metadata_extra"]
    df = pd.DataFrame(records, columns=header)
    out = normalise.normalise(
        df,
        metadata_string="meta",
        compound="meta_cmpd",
        plate_id="meta_plate",
    )
    assert df.shape == out.shape
    assert df.columns.tolist() == out.columns.tolist()