Esempio n. 1
0
def mm9_15():
    """Build the mm9 dataset 15 ("BonaFide_CGI_Shore") region set.

    Two flank datasets are extracted from the len700 bona fide CGI regions,
    merged into a single support dataset, and the final ``.region`` dataset
    is derived from that merge.

    NOTE(review): the size arguments (2000, 0) / (0, 2000) presumably select
    2 kb outside each island border, as the "2kb_outsideCgi" suffix suggests
    -- confirm against ``dm.extractFlanks``.
    """
    cgi_regions = "mm9.5.BonaFide_CGI.cgiHunter_oe0.6_gc50_len700.region"
    shore_support = "mm9_support.15.BonaFide_CGI_Shore.cgiHunter_oe0.6_gc50_len700_2kb_outsideCgi"
    shore_final = "mm9.15.BonaFide_CGI_Shore.cgiHunter_oe0.6_gc50_len700_2kb_outsideCgi.region"

    # (flank dataset name, anchor, first size argument, second size argument)
    flank_specs = [
        ("mm9_support.15.CGI700_downstream", "start", 2000, 0),
        ("mm9_support.15.CGI700_upstream", "end", 0, 2000),
    ]
    for flank_name, anchor, first_size, second_size in flank_specs:
        dm.extractFlanks(cgi_regions, flank_name, False, anchor,
                         first_size, second_size)

    # Merge in the same order the flanks were produced: downstream, upstream.
    dm.mergeDatasets(shore_support, [spec[0] for spec in flank_specs])

    # NOTE(review): the fifth argument is None here, whereas mm9_14 and
    # mm9_16 pass "max" -- confirm the difference is intended.
    dm.deriveNewDataset(shore_final, shore_support, [], [], None, None, True)
Esempio n. 2
0
def mm9_14():
    """Build the mm9 dataset 14 ("CpG_Island_Shore") region set.

    Extracts two flank datasets from the len200 CpG island regions, merges
    them (upstream first, then downstream) into a support dataset, and
    derives the final ``.region`` dataset from the merge.

    NOTE(review): the size arguments (2000, 0) / (0, 2000) presumably select
    2 kb outside each island border, as the "2kb_outsideCgi" suffix suggests
    -- confirm against ``dm.extractFlanks``.
    """
    island_regions = "mm9.4.CpG_Island.cgiHunter_oe0.6_gc50_len200.region"
    downstream_flanks = "mm9_support.14.CGI200_downstream"
    upstream_flanks = "mm9_support.14.CGI200_upstream"
    shore_support = "mm9_support.14.CpG_Island_Shore.cgiHunter_oe0.6_gc50_len200_2kb_outsideCgi"
    shore_final = "mm9.14.CpG_Island_Shore.cgiHunter_oe0.6_gc50_len200_2kb_outsideCgi.region"

    # Flank anchored at "start", then flank anchored at "end".
    dm.extractFlanks(island_regions, downstream_flanks, False, "start", 2000, 0)
    dm.extractFlanks(island_regions, upstream_flanks, False, "end", 0, 2000)

    # The merge lists the upstream set before the downstream set.
    merge_inputs = [upstream_flanks, downstream_flanks]
    dm.mergeDatasets(shore_support, merge_inputs)

    dm.deriveNewDataset(shore_final, shore_support, [], [], "max", None, True)
Esempio n. 3
0
def mm9_16():
    """Build the mm9 dataset 16 ("BonaFide_CGI_Border") region set.

    For the len700 bona fide CGI regions, one flank dataset is extracted at
    the "start" anchor and one at the "end" anchor, each with size arguments
    (250, 250). Both are merged into a support dataset from which the final
    ``.region`` dataset is derived.

    NOTE(review): 250 + 250 presumably yields the 500 bp windows centred on
    the island borders that the dataset name describes -- confirm against
    ``dm.extractFlanks``.
    """
    cgi_regions = "mm9.5.BonaFide_CGI.cgiHunter_oe0.6_gc50_len700.region"
    border_support = "mm9_support.16.BonaFide_CGI_Border.cgiHunter_oe0.6_gc50_len700_500bp_centeredOnBorders"
    border_final = "mm9.16.BonaFide_CGI_Border.cgiHunter_oe0.6_gc50_len700_500bp_centeredOnBorders.region"

    # A disabled variant of these calls replaced the size argument on the
    # island side with the expression string
    # "int(min(250,(chromend-chromstart)*0.25))"; the fixed value 250 is
    # what is actually passed on both sides.
    half_window = 250

    anchored_flanks = (
        ("start", "mm9_support.16.500bp_centered_downstream"),
        ("end", "mm9_support.16.500bp_centered_upstream"),
    )
    for anchor, flank_name in anchored_flanks:
        dm.extractFlanks(cgi_regions, flank_name, False, anchor,
                         half_window, half_window)

    # Merge order follows extraction order: downstream, upstream.
    dm.mergeDatasets(border_support,
                     [flank_name for _, flank_name in anchored_flanks])

    dm.deriveNewDataset(border_final, border_support, [], [], "max", None, True)
Esempio n. 4
0
def hg18_12():
    """Build the hg18 dataset 12 open-chromatin region sets.

    Steps, in order:

    1. Derive the Boyle2008 T-cell support dataset from "hg18_DNAseCD4Sites".
    2. Register the Duke datasets in ``dm.regionDatasets``, merge them, and
       derive a dataset from the merge.
    3. Do the same for the Washington datasets.
    4. Merge the three derived support datasets.
    5. Derive the "noPromoter" ``.region`` dataset from that merge, passing
       the refSeq promoter dataset in the third argument.
    6. Derive the "downsampledTo500k" dataset from step 5, passing 500000 as
       the last argument.

    NOTE(review): the dataset names suggest the third argument lists
    datasets to exclude and the last argument is a downsampling target --
    confirm against ``dm.deriveNewDataset``.
    """
    def _register_merge_derive(source_datasets, unmerged_name, derived_name):
        # Make the source datasets known to dm, merge them under
        # unmerged_name, then derive derived_name from that merge.
        dm.regionDatasets.update(source_datasets)
        # NOTE(review): under Python 3 ``.keys()`` is a view, not a list --
        # confirm mergeDatasets only iterates over it.
        dm.mergeDatasets(unmerged_name, source_datasets.keys())
        dm.deriveNewDataset(derived_name, unmerged_name,
                            [], [], "max", None, True, True)

    boyle_tcell = "hg18_support.12.DNaseI_HS_site.hg18_tCell_DNaseI_hypersensitive_sites_Boyle2008"
    duke_derived = "hg18_support.12.Duke_GM12878_HelaS3_K562_hepg2"
    encode_derived = "hg18_support.12.Open_Chromatin.ENCODE_DNaseI_hypersensitive_sites"
    all_merged = "hg18_support.12.All_DNaseI_datasets_merged"
    no_promoter = "hg18.12.Open_Chromatin.DNase_FAIRE_peaks_ENCODE_noPromoter.region"
    downsampled = "hg18.12.Open_Chromatin.DNase_FAIRE_peaks_ENCODE_noPromoter_downsampledTo500k.region"
    promoter_regions = "hg18.2.Promoter_centered.refSeqGenes_minus_1000_to_1000_around_TSS.region"

    # Step 1: Boyle2008 T-cell sites.
    dm.deriveNewDataset(boyle_tcell, "hg18_DNAseCD4Sites",
                        [], [], None, None, True)

    # Step 2: Duke datasets.
    _register_merge_derive(
        regionDatasets_DNaseI_Duke,
        "hg18_support.12.Duke_GM12878_HelaS3_K562_hepg2_SortedNotMerged",
        duke_derived)

    # Step 3: Washington datasets.
    _register_merge_derive(
        regionDatasets_DNaseI_Washington,
        "hg18_support.12.Open_Chromatin.ENCODE_DNaseI_hypersensitive_sites_SortedNotMerged",
        encode_derived)

    # Step 4: combine the three support datasets.
    # NOTE(review): hg18_12_new merges into this same dataset name;
    # presumably running both overwrites it -- verify.
    dm.mergeDatasets(all_merged, [encode_derived, duke_derived, boyle_tcell])

    # Step 5: final region set, with the promoter dataset as third argument.
    dm.deriveNewDataset(no_promoter, all_merged,
                        [promoter_regions], [], "max", None, True, True)

    # Step 6: variant derived from step 5 with 500000 as the last argument.
    dm.deriveNewDataset(downsampled, no_promoter,
                        [], [], None, None, True, True, 500000)
Esempio n. 5
0
def hg18_12_new():
    """Build the "12_new" variant of the hg18 open-chromatin region set.

    Each of the three source datasets (Boyle2008 T-cell, Duke, Washington)
    is passed through ``dm.extractFlanks`` with the "whole_region" anchor to
    produce a "_1kb" dataset. The three "_1kb" datasets are merged, and the
    final ``.region`` dataset is derived from the merge with the refSeq
    promoter dataset passed in the third argument.

    NOTE(review): the size expression is passed as a string and presumably
    evaluated per region by ``extractFlanks``, padding regions shorter than
    1 kb symmetrically up to about 1 kb -- confirm against its
    implementation.
    """
    # Same expression string is used for both size arguments.
    pad_expr = "max(0,int(500-(chromend-chromstart)/2))"

    def _extract_1kb(source_name, padded_name):
        # Run extractFlanks over the whole region with the padding expression.
        dm.extractFlanks(source_name, padded_name, False, "whole_region",
                         pad_expr, pad_expr)

    boyle_1kb = "hg18_support.12.DNaseI_HS_site.hg18_tCell_DNaseI_hypersensitive_sites_Boyle2008_1kb"
    duke_unmerged = "hg18_support.12.Duke_GM12878_HelaS3_K562_hepg2_SortedNotMerged"
    duke_1kb = "hg18_support.12.Duke_GM12878_HelaS3_K562_hepg2_SortedNotMerged_1kb"
    encode_unmerged = "hg18_support.12.Open_Chromatin.ENCODE_DNaseI_hypersensitive_sites_SortedNotMerged"
    encode_1kb = "hg18_support.12.Open_Chromatin.ENCODE_DNaseI_hypersensitive_sites_SortedNotMerged_1kb"
    all_merged = "hg18_support.12.All_DNaseI_datasets_merged"

    # Boyle2008 T-cell sites.
    _extract_1kb(
        "hg18_support.12.DNaseI_HS_site.hg18_tCell_DNaseI_hypersensitive_sites_Boyle2008",
        boyle_1kb)

    # Duke datasets: register, merge, then pad.
    # NOTE(review): under Python 3 ``.keys()`` is a view, not a list --
    # confirm mergeDatasets only iterates over it.
    dm.regionDatasets.update(regionDatasets_DNaseI_Duke)
    dm.mergeDatasets(duke_unmerged, regionDatasets_DNaseI_Duke.keys())
    _extract_1kb(duke_unmerged, duke_1kb)

    # Washington datasets: register, merge, then pad.
    dm.regionDatasets.update(regionDatasets_DNaseI_Washington)
    dm.mergeDatasets(encode_unmerged, regionDatasets_DNaseI_Washington.keys())
    _extract_1kb(encode_unmerged, encode_1kb)

    # A disabled step here registered the three "_1kb" datasets in
    # dm.regionDatasets, each mapped to defaultFolder + <name> + ".txt".

    # NOTE(review): hg18_12 merges into this same dataset name; presumably
    # running both overwrites it -- verify.
    dm.mergeDatasets(all_merged, [boyle_1kb, duke_1kb, encode_1kb])

    dm.deriveNewDataset(
        "hg18.12_new.Open_Chromatin.DNase_FAIRE_peaks_ENCODE_noPromoter.region",
        all_merged,
        ["hg18.2.Promoter_centered.refSeqGenes_minus_1000_to_1000_around_TSS.region"],
        [],
        "max",
        None,
        True,
        True)