# but note that step2 is the bottleneck, so don't put too many events # in one output file here events_per_output=200, total_nevents=500000, # We have one input dummy file, so this must be True split_within_files=True, pset="psets/HIG-RunIIFall17wmLHEGS-01343_1_cfg_jhu.py", #cmssw_version = "CMSSW_9_3_6_patch2", cmssw_version="CMSSW_9_4_6_patch1", condor_submit_params={"sites": "T2_US_UCSD"}, scram_arch="slc6_amd64_gcc630", ) step2 = CMSSWTask( sample=DirectorySample( location=step1.get_outputdir(), dataset=step1.get_sample().get_datasetname().replace( "STEP1", "STEP2"), ), tag=proc_tag, special_dir=special_dir, open_dataset=True, files_per_output=1, pset="psets/HIG-RunIIFall17DRPremix-01240_1_cfg_jhu.py", cmssw_version="CMSSW_9_4_4", scram_arch="slc6_amd64_gcc630", ) step3 = CMSSWTask( sample=DirectorySample( location=step2.get_outputdir(),
sample=DirectorySample( location="/hadoop/cms/store/user/namin/yukawa_lhe/Events/run_{}/" .format(runstr), globber="*.lhe", dataset="/tttt-LOytscan/kt-{}_v2/LHE".format(ktstr), ), events_per_output=100, total_nevents=10000, pset="pset_gensim.py", cmssw_version="CMSSW_7_1_25_patch2", split_within_files=True, ) raw = CMSSWTask( sample=DirectorySample( location=lhe.get_outputdir(), dataset=lhe.get_sample().get_datasetname().replace( "LHE", "RAW"), ), open_dataset=True, files_per_output=1, pset="pset_raw.py", cmssw_version="CMSSW_8_0_21", ) aod = CMSSWTask( sample=DirectorySample( location=raw.get_outputdir(), dataset=raw.get_sample().get_datasetname().replace( "RAW", "AOD"), ),
def runall(special_dir, tag, total_nevents, events_per_output, config,
           n_passes=25, sleep_seconds=600,
           webdir="~/public_html/dump/metis/", proc_tag="v1"):
    """Drive the four-step CMSSW chain (STEP1 -> STEP4) for one sample.

    On every pass the four tasks are rebuilt, ``process()`` is called on
    each of them in order, their task summaries are collected into a dict
    keyed by dataset name and handed to ``StatsParser``, and then the
    function sleeps before starting the next pass.

    Args:
        special_dir: Forwarded as ``special_dir`` to every ``CMSSWTask``.
        tag: Sample label; the STEP1 dataset name is ``"/" + tag + "_STEP1"``
            and later steps are derived from it by string replacement.
        total_nevents: Forwarded as ``total_nevents`` to the STEP1 task.
        events_per_output: Forwarded as ``events_per_output`` to the STEP1
            task.
        config: Mapping that must provide ``cmssw_v_gensim``,
            ``pset_gensim``, ``scram_arch_gensim``, ``cmssw_v_aodsim``,
            ``pset_aodsim``, ``scram_arch_aodsim``, ``pset_aodsim2``,
            ``cmssw_v_miniaodsim``, ``pset_miniaodsim`` and
            ``scram_arch_miniaodsim``. Pset names are relative to
            ``psets/``.
        n_passes: Number of build/process/report passes (default 25).
        sleep_seconds: Pause after each pass, in seconds (default 600).
        webdir: Forwarded as ``webdir`` to ``StatsParser``.
        proc_tag: Forwarded as ``tag`` to every ``CMSSWTask``.

    Raises:
        KeyError: If ``config`` lacks one of the keys listed above.
    """
    # The configuration is the same for every pass, so read it once. The
    # lookup order is unchanged, so a missing key raises the same KeyError
    # before any task is created.
    cmssw_v_gensim = config["cmssw_v_gensim"]
    pset_gensim = config["pset_gensim"]
    scram_arch_gensim = config["scram_arch_gensim"]

    cmssw_v_aodsim = config["cmssw_v_aodsim"]
    pset_aodsim = config["pset_aodsim"]
    scram_arch_aodsim = config["scram_arch_aodsim"]

    # STEP3 has its own pset but deliberately reuses the STEP2 (aodsim)
    # CMSSW release and scram architecture; there are no separate
    # "*_aodsim2" release/arch keys in the config.
    pset_aodsim2 = config["pset_aodsim2"]
    cmssw_v_aodsim2 = cmssw_v_aodsim
    scram_arch_aodsim2 = scram_arch_aodsim

    cmssw_v_miniaodsim = config["cmssw_v_miniaodsim"]
    pset_miniaodsim = config["pset_miniaodsim"]
    scram_arch_miniaodsim = config["scram_arch_miniaodsim"]

    for _ in range(n_passes):
        step1 = CMSSWTask(
            # Change dataset to something more meaningful (but keep STEP1,
            # as it is used for string replacement later); keep N=1.
            sample=DummySample(N=1, dataset="/" + tag + "_STEP1"),
            # A unique identifier
            tag=proc_tag,
            special_dir=special_dir,
            # These two numbers control splitting. Note that step2 is the
            # bottleneck, so don't put too many events in one output file.
            events_per_output=events_per_output,
            total_nevents=total_nevents,
            # We have one input dummy file, so this must be True
            split_within_files=True,
            pset="psets/" + pset_gensim,
            cmssw_version=cmssw_v_gensim,
            scram_arch=scram_arch_gensim,
        )
        step2 = _runall_chained_step(
            step1, "STEP1", "STEP2", proc_tag, special_dir,
            pset_aodsim, cmssw_v_aodsim, scram_arch_aodsim)
        step3 = _runall_chained_step(
            step2, "STEP2", "STEP3", proc_tag, special_dir,
            pset_aodsim2, cmssw_v_aodsim2, scram_arch_aodsim2)
        # Site restriction previously tried for step4 and left disabled:
        #   condor_submit_params={"sites": "UAF,UCSD"}
        step4 = _runall_chained_step(
            step3, "STEP3", "STEP4", proc_tag, special_dir,
            pset_miniaodsim, cmssw_v_miniaodsim, scram_arch_miniaodsim,
            output_name="step4.root")

        # A fifth (NanoAOD) step is currently disabled. To re-enable it,
        # chain a task off step4 ("STEP4" -> "STEP5") with
        #   pset="psets/TOP-RunIIFall17NanoAODv7-00001_1_cfg.py",
        #   output_name="step5.root",  # should match the pset output name
        #   cmssw_version="CMSSW_10_2_22",
        #   scram_arch="slc6_amd64_gcc700",
        # and append it to the list processed below.

        total_summary = {}
        for task in [step1, step2, step3, step4]:
            # process() must run before the summary is read for this pass.
            task.process()
            dataset_name = task.get_sample().get_datasetname()
            total_summary[dataset_name] = task.get_task_summary()

        StatsParser(data=total_summary, webdir=webdir).do()
        time.sleep(sleep_seconds)


def _runall_chained_step(previous, old_label, new_label, proc_tag,
                         special_dir, pset, cmssw_version, scram_arch,
                         **extra):
    """Build the CMSSWTask that reads the output directory of ``previous``.

    The new dataset name is the previous task's dataset name with
    ``old_label`` replaced by ``new_label``. ``extra`` carries any
    additional ``CMSSWTask`` keyword arguments (e.g. ``output_name``).
    """
    return CMSSWTask(
        sample=DirectorySample(
            location=previous.get_outputdir(),
            dataset=previous.get_sample().get_datasetname().replace(
                old_label, new_label),
        ),
        tag=proc_tag,
        special_dir=special_dir,
        open_dataset=True,
        files_per_output=1,
        pset="psets/" + pset,
        cmssw_version=cmssw_version,
        scram_arch=scram_arch,
        **extra
    )