Python load_testdata示例，normpy.utils.load_testdata Python示例

示例#1

0

显示文件

文件： test.py 项目： lukauskas/normpy

def test_edgeR():
    """
    Reference call into EdgeR normalization.

    Loads the "pasilla" test data, builds an Experiment restricted to
    two untreated samples and asks EdgeR to normalize expression values
    with "untreated1" as the reference column. Nothing is asserted on
    the result.
    """
    pasilla_path = utils.load_testdata("pasilla")
    # Only a subset of the samples is used
    # (presumably display label -> counts column; verify against Experiment)
    sample_map = OrderedDict([("Untreated 1", "untreated1"),
                              ("Untreated 2", "untreated2")])
    # Build the experiment object and hand it straight to EdgeR
    pasilla_exp = experiment.Experiment(pasilla_path, sample_map)
    edgeR_utils.EdgeR(pasilla_exp).norm_expr_vals(ref_col="untreated1")

示例#2

0

显示文件

文件： test.py 项目： hjanime/normpy

def test_edgeR():
    """
    Reference call into EdgeR normalization.

    Loads the "pasilla" test data, builds an Experiment restricted to
    two untreated samples and asks EdgeR to normalize expression values
    with "untreated1" as the reference column. Nothing is asserted on
    the result.
    """
    pasilla_path = utils.load_testdata("pasilla")
    # Only a subset of the samples is used
    # (presumably display label -> counts column; verify against Experiment)
    sample_map = OrderedDict([("Untreated 1", "untreated1"),
                              ("Untreated 2", "untreated2")])
    # Build the experiment object and hand it straight to EdgeR
    pasilla_exp = experiment.Experiment(pasilla_path, sample_map)
    edgeR_utils.EdgeR(pasilla_exp).norm_expr_vals(ref_col="untreated1")

示例#3

0

显示文件

文件： test.py 项目： hjanime/normpy

def test_deseq():
    """
    Calls DESeq normalization. Prints raw counts then normed counts.

    Uses the "pasilla" test data restricted to two untreated samples.
    Output is printed for manual inspection; nothing is asserted.
    """
    counts_fname = utils.load_testdata("pasilla")
    # Consider only a subset of the samples
    samples = OrderedDict()
    samples["Untreated 1"] = "untreated1"
    samples["Untreated 2"] = "untreated2"
    exp_obj = experiment.Experiment(counts_fname, samples)
    norm_counts_df = normalizers.norm_deseq(exp_obj)
    # Single-argument print(...) calls behave identically on Python 2 and
    # Python 3, unlike the print statement, which is a syntax error on 3.
    print("\nDESeq Testing:")
    print("--------------")
    print("Pre-normalized counts: ")
    print(exp_obj.counts_df.head())
    print("Normalized counts: ")
    print(norm_counts_df.head())

示例#4

0

显示文件

文件： test.py 项目： lukauskas/normpy

def test_deseq():
    """
    Exercise DESeq normalization on the "pasilla" test data.

    Prints the head of the experiment's counts, then the head of the
    DESeq-normalized counts. Nothing is asserted.
    """
    pasilla_path = utils.load_testdata("pasilla")
    # Only a subset of the samples is used
    sample_map = OrderedDict([("Untreated 1", "untreated1"),
                              ("Untreated 2", "untreated2")])
    pasilla_exp = experiment.Experiment(pasilla_path, sample_map)
    deseq_df = normalizers.norm_deseq(pasilla_exp)
    # Banner
    print("\nDESeq Testing:")
    print("--------------")
    # Before normalization
    print("Pre-normalized counts: ")
    print(pasilla_exp.counts_df.head())
    # After normalization
    print("Normalized counts: ")
    print(deseq_df.head())

示例#5

0

显示文件

def test_quantile():
    """
    Calls quantile normalization. Prints raw counts then normed counts.

    Uses the "pasilla" test data restricted to two untreated samples.
    Output is printed for manual inspection; nothing is asserted.
    """
    counts_fname = utils.load_testdata("pasilla")
    # Consider only a subset of the samples
    samples = OrderedDict()
    samples["Untreated 1"] = "untreated1"
    samples["Untreated 2"] = "untreated2"
    exp_obj = experiment.Experiment(counts_fname, samples)
    norm_counts_df = normalizers.norm_q(exp_obj)
    # Single-argument print(...) calls behave identically on Python 2 and
    # Python 3, unlike the print statement, which is a syntax error on 3.
    print("\nQuantile Testing:")
    print("--------------")
    print("Pre-normalized counts: ")
    print(exp_obj.counts_df.head())
    print("Normalized counts: ")
    print(norm_counts_df.head())

示例#6

0

显示文件

def test_tmm():
    """
    Exercise TMM normalization on the "pasilla" test data.

    Prints the head of the experiment's counts, then the head of the
    TMM-normalized counts, and finally writes a completion note to
    stderr. Nothing is asserted.
    """
    pasilla_path = utils.load_testdata("pasilla")
    # Only a subset of the samples is used
    sample_map = OrderedDict([("Untreated 1", "untreated1"),
                              ("Untreated 2", "untreated2")])
    pasilla_exp = experiment.Experiment(pasilla_path, sample_map)
    tmm_df = normalizers.norm_tmm(pasilla_exp)
    # Banner
    print("\nTMM Testing:")
    print("--------------")
    # Before normalization
    print("Pre-normalized counts: ")
    print(pasilla_exp.counts_df.head())
    # After normalization
    print("Normalized counts: ")
    print(tmm_df.head())
    # Completion marker goes to stderr, not stdout
    sys.stderr.write("Test tmm done!\n")

示例#7

0

显示文件

文件： test.py 项目： hjanime/normpy

def test_lowess():
    """
    Tests lowess normalization.

    Runs MA-lowess normalization on the ("untreated1", "untreated2")
    pair of the "pasilla" test data, prints the head of the unnormalized
    and normalized frames, and passes both to plot_utils.plot_fcs under
    the label "lowess_test". Nothing is asserted.
    """
    counts_fname = utils.load_testdata("pasilla")
    # Consider only a subset of the samples
    samples = OrderedDict()
    samples["Untreated 1"] = "untreated1"
    samples["Untreated 2"] = "untreated2"
    exp_obj = experiment.Experiment(counts_fname, samples)
    pairs = [["untreated1", "untreated2"]]
    norm_df, unnorm_df = normalizers.norm_ma_lowess(exp_obj, pairs)
    # Single-argument print(...) calls behave identically on Python 2 and
    # Python 3, unlike the print statement, which is a syntax error on 3.
    print("\nLowess Testing:")
    print("--------------")
    print("Pre-normalized values: ")
    print(unnorm_df.head())
    print("Normalized counts: ")
    print(norm_df.head())
    # Compare LOWESS normalized to total counts
    pair = ["untreated1", "untreated2"]
    plot_utils.plot_fcs(norm_df, unnorm_df, pair, "lowess_test")

示例#8

0

显示文件

文件： test.py 项目： lukauskas/normpy

def test_lowess():
    """
    Exercise MA-lowess normalization on the "pasilla" test data.

    Normalizes the ("untreated1", "untreated2") pair, prints the head of
    the unnormalized and normalized frames, then passes both to
    plot_utils.plot_fcs under the label "lowess_test". Nothing is
    asserted.
    """
    pasilla_path = utils.load_testdata("pasilla")
    # Only a subset of the samples is used
    sample_map = OrderedDict([("Untreated 1", "untreated1"),
                              ("Untreated 2", "untreated2")])
    pasilla_exp = experiment.Experiment(pasilla_path, sample_map)
    # One sample pair to normalize against each other
    sample_pairs = [["untreated1", "untreated2"]]
    lowess_df, raw_df = normalizers.norm_ma_lowess(pasilla_exp, sample_pairs)
    # Banner
    print("\nLowess Testing:")
    print("--------------")
    # Before normalization
    print("Pre-normalized values: ")
    print(raw_df.head())
    # After normalization
    print("Normalized counts: ")
    print(lowess_df.head())
    # Compare LOWESS normalized to total counts (fresh list, not shared
    # with the one passed to the normalizer)
    plot_pair = ["untreated1", "untreated2"]
    plot_utils.plot_fcs(lowess_df, raw_df, plot_pair, "lowess_test")

示例#9

0

显示文件

def test_quantile_vs_tmm():
    """
    Test quantile normalization versus TMM
    in rank correlation of genes.

    Normalizes the same two-sample "pasilla" experiment with both
    methods, outer-merges the results on their index, takes log2 of the
    merged values (infinities replaced by NaN), draws a scatter matrix
    and saves it as "quantile_vs_tmm_corr" (png). Nothing is asserted.
    """
    counts_fname = utils.load_testdata("pasilla")
    # Consider only a subset of the samples
    samples = OrderedDict()
    samples["Untreated 1"] = "untreated1"
    samples["Untreated 2"] = "untreated2"
    exp_obj = experiment.Experiment(counts_fname, samples)
    quantile_counts_df = normalizers.norm_q(exp_obj)
    tmm_counts_df = normalizers.norm_tmm(exp_obj)
    print("\nQuantile versus TMM Testing:")
    print("--------------")
    print("Normalized quantile counts: ")
    print(quantile_counts_df.head())
    print("Normalized TMM counts: ")
    print(tmm_counts_df.head())
    print("Correlating the genes.")
    # Merge the dataframes together, indexing by gene
    combined_df = pandas.merge(quantile_counts_df,
                               tmm_counts_df,
                               left_index=True,
                               right_index=True,
                               suffixes=["_q", "_tmm"],
                               how="outer")
    # Get log of counts: get rid of infinite values
    # (log2(0) yields -inf, which would otherwise end up in the plot data)
    log_counts_df = combined_df.apply(np.log2).replace([-np.inf, np.inf],
                                                       np.nan)
    print("Combined dataframe: ")
    print(combined_df.head())
    print("Combined log dataframe: ")
    print(log_counts_df.head())
    # Plot correlation
    try:
        # Current home of scatter_matrix; pandas.tools.plotting has been
        # removed from recent pandas releases.
        from pandas.plotting import scatter_matrix
    except ImportError:
        # Fall back for old pandas versions that predate pandas.plotting
        from pandas.tools.plotting import scatter_matrix
    scatter_matrix(log_counts_df, alpha=0.2, figsize=(8, 7))
    plot_utils.save_fig("quantile_vs_tmm_corr", ext="png")
    sys.stderr.write("Test quantile vs tmm done!\n")

示例#10

0

显示文件

文件： test.py 项目： lukauskas/normpy

def test_tc():
    """
    Exercise total counts normalization on the "pasilla" test data.

    Runs the normalizer twice on the same experiment: once as loaded,
    and once after assigning explicit library sizes to the experiment.
    Heads of the resulting frames are printed; nothing is asserted.
    """
    pasilla_path = utils.load_testdata("pasilla")
    # Only a subset of the samples is used
    sample_map = OrderedDict([("Untreated 1", "untreated1"),
                              ("Untreated 2", "untreated2")])
    # Build the experiment object from the counts and the sample subset
    pasilla_exp = experiment.Experiment(pasilla_path, sample_map)
    # First pass: no explicit library sizes set on the experiment
    tc_df = normalizers.norm_tc(pasilla_exp)
    print("Pre-normalized counts: ")
    print(pasilla_exp.counts_df.head())
    print("Normalized counts: ")
    print(tc_df.head())
    # Second pass: library sizes supplied per sample
    pasilla_exp.lib_sizes = {
        "untreated1": 100,
        "untreated2": 200,
    }
    tc_df = normalizers.norm_tc(pasilla_exp)
    print("Normalized with library size: ")
    print(tc_df.head())

示例#11

0

显示文件

文件： test.py 项目： hjanime/normpy

def test_tc():
    """
    Test total counts normalization.

    Runs the normalizer twice on the same two-sample "pasilla"
    experiment: once as loaded, and once after assigning explicit
    library sizes. Output is printed for manual inspection; nothing is
    asserted.
    """
    counts_fname = utils.load_testdata("pasilla")
    # Consider only a subset of the samples
    samples = OrderedDict()
    samples["Untreated 1"] = "untreated1"
    samples["Untreated 2"] = "untreated2"
    # Make an experiment object out of them
    exp_obj = experiment.Experiment(counts_fname, samples)
    # Normalization without explicit library sizes
    norm_counts_df = normalizers.norm_tc(exp_obj)
    # Single-argument print(...) calls behave identically on Python 2 and
    # Python 3, unlike the print statement, which is a syntax error on 3.
    print("Pre-normalized counts: ")
    print(exp_obj.counts_df.head())
    print("Normalized counts: ")
    print(norm_counts_df.head())
    # Normalization with library sizes
    exp_obj.lib_sizes = {"untreated1": 100,
                         "untreated2": 200}
    norm_counts_df = normalizers.norm_tc(exp_obj)
    print("Normalized with library size: ")
    print(norm_counts_df.head())

示例#12

0

显示文件

文件： test.py 项目： hjanime/normpy

def test_quantile_vs_tmm():
    """
    Test quantile normalization versus TMM
    in rank correlation of genes.

    Normalizes the same two-sample "pasilla" experiment with both
    methods, outer-merges the results on their index, takes log2 of the
    merged values (infinities replaced by NaN), draws a scatter matrix
    and saves it as "quantile_vs_tmm_corr" (png). Nothing is asserted.
    """
    counts_fname = utils.load_testdata("pasilla")
    # Consider only a subset of the samples
    samples = OrderedDict()
    samples["Untreated 1"] = "untreated1"
    samples["Untreated 2"] = "untreated2"
    exp_obj = experiment.Experiment(counts_fname, samples)
    quantile_counts_df = normalizers.norm_q(exp_obj)
    tmm_counts_df = normalizers.norm_tmm(exp_obj)
    # Single-argument print(...) calls behave identically on Python 2 and
    # Python 3, unlike the print statement, which is a syntax error on 3.
    print("\nQuantile versus TMM Testing:")
    print("--------------")
    print("Normalized quantile counts: ")
    print(quantile_counts_df.head())
    print("Normalized TMM counts: ")
    print(tmm_counts_df.head())
    print("Correlating the genes.")
    # Merge the dataframes together, indexing by gene
    combined_df = pandas.merge(quantile_counts_df, tmm_counts_df,
                               left_index=True,
                               right_index=True,
                               suffixes=["_q", "_tmm"],
                               how="outer")
    # Get log of counts: get rid of infinite values
    # (log2(0) yields -inf, which would otherwise end up in the plot data)
    log_counts_df = combined_df.apply(np.log2).replace([-np.inf, np.inf],
                                                       np.nan)
    print("Combined dataframe: ")
    print(combined_df.head())
    print("Combined log dataframe: ")
    print(log_counts_df.head())
    # Plot correlation
    try:
        # Current home of scatter_matrix; pandas.tools.plotting has been
        # removed from recent pandas releases.
        from pandas.plotting import scatter_matrix
    except ImportError:
        # Fall back for old pandas versions that predate pandas.plotting
        from pandas.tools.plotting import scatter_matrix
    scatter_matrix(log_counts_df, alpha=0.2, figsize=(8, 7))
    plot_utils.save_fig("quantile_vs_tmm_corr", ext="png")