Exemple #1
0
    def test_SplitByFiles_split(self):
        """Check that SplitByFiles(filesPerJob=2) splits five files as 2+2+1.

        The same expectations are verified for two ways of supplying the
        input data: assigned directly to ``job.inputdata``, and written to an
        options file that is passed through ``job.application.optsfile``.
        """
        import shutil  # local import: only needed for the temp-dir cleanup

        dummy_files = ['pfn:f1.dst', 'pfn:f2.dst', 'pfn:f3.dst', 'pfn:f4.dst',
                       'pfn:f5.dst']
        # File names each subjob is expected to receive, in subjob order.
        expected_files = [('f1.dst', 'f2.dst'),
                          ('f3.dst', 'f4.dst'),
                          ('f5.dst',)]

        def check_split(job, suffix=''):
            """Prepare and split *job*, then verify every subjob's data.

            *suffix* is appended to each assertion message so a failure
            identifies which scenario was being exercised.
            """
            job.prepare()
            subjobs = job.splitter.split(job)
            assert len(subjobs) == len(expected_files), \
                'incorrect number of split jobs' + suffix
            # Build every job config up front, before inspecting any of them.
            jobconfigs = [
                LHCbGaudiRunTimeHandler().prepare(
                    subjobs[i].application, None, None, None)
                for i in range(len(expected_files))
            ]
            for index, names in enumerate(expected_files):
                # The generated data options live in the inputbox entry whose
                # name contains 'data.py'; the first match is the one checked.
                dataopts = [
                    entry for entry in jobconfigs[index].inputbox
                    if 'data.py' in entry.name
                ][0].getContents()
                ok = all(name in dataopts for name in names) \
                    and len(subjobs[index].inputdata) == len(names)
                assert ok, 'problem w/ subjob %d input data%s' % (
                    index, suffix)

        # Scenario 1: dataset attached directly to the job.
        job = Job(application=DaVinci())
        job.splitter = GPI.SplitByFiles(filesPerJob=2)
        job.inputdata = LHCbDataset(dummy_files)
        check_split(job)

        # Scenario 2: check also that data in the optsfiles was picked up.
        job = Job(application=DaVinci())
        job.splitter = GPI.SplitByFiles(filesPerJob=2)
        dataset = LHCbDataset(dummy_files)
        tdir = mkdtemp()
        try:
            opts_path = os.path.join(tdir, 'data.py')
            # Context manager guarantees the handle is closed even if the
            # write (or optionsString()) raises.
            with open(opts_path, 'w') as opts_file:
                opts_file.write(dataset.optionsString())
            job.application.optsfile = [opts_path]
            check_split(job, ', for data in optsfile')
        finally:
            # Do not leave the temporary directory behind after the test.
            shutil.rmtree(tdir, ignore_errors=True)