Python Dataset.features示例

编程语言: Python

命名空间/包名称: Data.Containers

类/类型: Dataset

方法/功能: features

hotexamples.com的示例: 2

Python Dataset.features - 已找到2个示例。这些是从开源项目中提取的最受好评的Data.Containers.Dataset.features现实Python示例。您可以评价示例，以帮助我们提高示例质量。

常用方法

显示隐藏

__init__(3)

features(2)

save(2)

uncompress(2)

compress(1)

df(1)

hit_val(1)

path(1)

示例#1

显示文件

文件： InitializeMut.py 项目： anyone1985/TCGA_Working

def is_one_gene(p):
    '''Test to see if most mutations are due to single gene.

    Reads the module-level ``hit_matrix`` and ``run.gene_sets``.

    p: key into ``run.gene_sets``; the value is used as a set of row
       labels of ``hit_matrix``.

    Returns a truthy value when the capped column total computed with the
    whole gene set exceeds the total computed without its top gene by more
    than half of the latter (i.e. with_top > 1.5 * without).

    NOTE: ``.ix``, ``Series.order`` and ``clip_upper`` belong to the older
    pandas API this file is written against.
    '''
    genes = run.gene_sets[p]
    subset = hit_matrix.ix[genes]

    # Row totals per gene; the gene with the largest total is the "top" gene.
    counts = subset.sum(1).dropna().order()
    top_gene = counts.idxmax()

    # Per-column totals capped at 1, then summed: once with every gene in
    # the set, once with the top gene removed.
    with_top = subset.sum().clip_upper(1).sum()
    without = hit_matrix.ix[genes - {top_gene}].sum().clip_upper(1).sum()

    # Equivalent to ((with_top - without) / without) > .5 for without > 0,
    # but written without a division: no divide-by-zero when nothing is left
    # after removing the top gene, and no truncating integer division under
    # Python 2 when the totals are integers.
    return (with_top - without) > .5 * without

# Restrict meta_matrix to whatever size_filter selects (size_filter is
# defined outside this excerpt).
meta_matrix = meta_matrix[size_filter(meta_matrix)] 
# Evaluate is_one_gene for every remaining row label and keep only the rows
# for which it returned False.
# NOTE: is_one_gene reads the module-level hit_matrix, which has not been
# size-filtered yet at this point -- the statement order matters.
s = Series({p: is_one_gene(p) for p in meta_matrix.index})
meta_matrix = meta_matrix.ix[s==False]
# Apply the same size filter to hit_matrix.
hit_matrix = hit_matrix[size_filter(hit_matrix)] 

'''Add passing features to the Data Object''' 
# features = rows of meta_matrix followed by rows of hit_matrix.
mut.features = meta_matrix.append(hit_matrix)
# NOTE(review): compress() immediately followed by uncompress(); the reason
# is not visible in this excerpt -- confirm against the Dataset class.
mut.compress()
mut.uncompress()

'''Save updated Data Object (with additional features field'''
mut.save()
# NOTE(review): presumably save() leaves the object compressed, hence the
# second uncompress() -- confirm against the Dataset class.
mut.uncompress()

'''Draw pathway_plots for pathway level features'''
# Feature labels that are also present in run.gene_sets.
meta_features = [f for f in mut.features.index if f in run.gene_sets]
pathway_plot_folder = mut.path + '/Figures/PathwayPlots/'
# Create the output folder (and any missing parents) on first use.
if not os.path.isdir(pathway_plot_folder):
    os.makedirs(pathway_plot_folder)
        
for i,p in enumerate(meta_features):
    # Rows of mut.df selected by the members of gene set p.
    # NOTE(review): the loop body may continue beyond this excerpt.
    df = mut.df.ix[run.gene_sets[p]]

示例#2

显示文件

文件： InitializeCN.py 项目： anyone1985/TCGA_Working

from Processing.Helpers import merge_redundant



# Command-line arguments: report directory, cancer type, data-type label.
report_path = sys.argv[1]
cancer_type = sys.argv[2]
data_type = sys.argv[3]
# Drop the first three characters of the label; the remainder is what the
# comparisons below ('broad', 'deletion', ...) are made against.
# NOTE(review): presumably this strips a 'CN_' prefix -- confirm with caller.
data_type = data_type[3:]

# Load in run and CN data.
# NOTE(security): pickle.load can execute arbitrary code from the file;
# report_path comes from the command line, so only use trusted directories.
# The context manager closes the file handle, which the bare open() did not.
with open(report_path + '/RunObject.p', 'rb') as run_file:
    run = pickle.load(run_file)
cancer = run.load_cancer(cancer_type)

# 'broad' data: the features are the data frame itself; save and stop here.
if data_type == 'broad':
    data = Dataset(cancer, run, 'CN_broad')
    data.features = data.df
    data.save()
    sys.exit(0)

data = Dataset(cancer, run, 'CN')
# Give each data type its own path by appending the label to data.path.
data.path = '_'.join([data.path, data_type])

# hit_val is the value in data.df that counts as a hit (see hit_matrix below).
# Any other data_type leaves data.hit_val untouched.
if data_type == 'deletion':
    data.hit_val = -2
elif data_type == 'amplification':
    data.hit_val = 2
elif data_type == 'amplification_low':
    # Rewrite 1 as 2 so that both values are matched by hit_val == 2.
    data.df = data.df.replace(1,2)
    data.hit_val = 2

# 1.0 where the entry equals hit_val, 0.0 elsewhere.
hit_matrix = (data.df==data.hit_val).astype(float)