Exemplo n.º 1
0
def main():
    """
    Debugging helper for a single, hard-coded ACDC fileset.

    Fetches the fileset documents from the ACDCServer, merges them with
    mergeFilesInfo, prints how many files were retrieved, reports every file
    holding at least one of the lumis of interest and finally prints the lumi
    counts and the elapsed time. The function ends by calling sys.exit(1).
    """
    startTime = time.time()

    # Coordinates of the ACDC collection/fileset under investigation
    acdcInfo = dict(
        database="acdcserver",
        fileset="/pdmvserv_task_SUS-RunIIFall18wmLHEGS-00025__v1_T_181211_005112_2222/SUS-RunIIFall18wmLHEGS-00025_0",
        collection="pdmvserv_task_SUS-RunIIFall18wmLHEGS-00025__v1_T_181211_005112_2222",
        server="https://cmsweb.cern.ch/couchdb")

    service = DataCollectionService(acdcInfo["server"], acdcInfo["database"])

    rawFiles = service._getFilesetInfo(acdcInfo['collection'], acdcInfo['fileset'])
    # Dump the first raw document before merging, as a quick visual check
    print("%s" % pformat(rawFiles[0]))
    mergedFiles = mergeFilesInfo(rawFiles)

    # Keep only the fields needed below; lumis come from the first run entry
    acdcFileList = [{"lfn": entry["lfn"],
                     "first_event": entry["first_event"],
                     "lumis": entry["runs"][0]["lumis"],
                     "events": entry["events"]}
                    for entry in mergedFiles]
    print("Retrieved %d files from the ACDCServer" % len(acdcFileList))

    wantedLumis = set([252052, 240646])
    allLumis = []
    for info in acdcFileList:
        allLumis.extend(info['lumis'])
        if wantedLumis & set(info['lumis']):
            print("File: %s with events: %s, contains these lumis: %s" %
                  (info['lfn'], info['events'], info['lumis']))

    # Compare total vs unique to spot lumis listed more than once
    print("Total amount of lumis: %d, where unique are: %d" %
          (len(allLumis), len(set(allLumis))))

    elapsed = time.time() - startTime
    print("Spent %s secs running so far" % elapsed)
    sys.exit(1)
Exemplo n.º 2
0
def main():
    """
    Inspect one hard-coded ACDC fileset and summarise its lumi content.

    The fileset documents are read from the ACDCServer and merged with
    mergeFilesInfo. The number of files, the files containing any of the
    wanted lumis, the total/unique lumi counts and the elapsed time are
    printed to stdout, after which sys.exit(1) is called.
    """
    tStart = time.time()

    # ACDC coordinates of the fileset being debugged
    serverUrl = "https://cmsweb.cern.ch/couchdb"
    dbName = "acdcserver"
    collectionName = "pdmvserv_task_SUS-RunIIFall18wmLHEGS-00025__v1_T_181211_005112_2222"
    filesetName = "/pdmvserv_task_SUS-RunIIFall18wmLHEGS-00025__v1_T_181211_005112_2222/SUS-RunIIFall18wmLHEGS-00025_0"

    dcs = DataCollectionService(serverUrl, dbName)

    filesetDocs = dcs._getFilesetInfo(collectionName, filesetName)
    # Show the first unmerged document for reference
    print("%s" % pformat(filesetDocs[0]))
    filesetDocs = mergeFilesInfo(filesetDocs)

    acdcFileList = []
    for doc in filesetDocs:
        summary = {}
        summary["lfn"] = doc["lfn"]
        summary["first_event"] = doc["first_event"]
        # only the lumis of the first run entry are considered
        summary["lumis"] = doc["runs"][0]["lumis"]
        summary["events"] = doc["events"]
        acdcFileList.append(summary)
    print("Retrieved %d files from the ACDCServer" % len(acdcFileList))

    wantedLumis = set([252052, 240646])
    listLumis = []
    for summary in acdcFileList:
        fileLumis = summary['lumis']
        listLumis.extend(fileLumis)
        if not wantedLumis.intersection(set(fileLumis)):
            continue
        print("File: %s with events: %s, contains these lumis: %s" % (summary['lfn'],
                                                                      summary['events'],
                                                                      summary['lumis']))

    totalLumis = len(listLumis)
    uniqueLumis = len(set(listLumis))
    print("Total amount of lumis: %d, where unique are: %d" % (totalLumis, uniqueLumis))

    tEnd = time.time()
    print("Spent %s secs running so far" % (tEnd - tStart))
    sys.exit(1)
Exemplo n.º 3
0
    def testDataMergeFilesInfo(self):
        """
        _testDataMergeFilesInfo_

        Feed mergeFilesInfo with several ACDC-like records that share the
        same lfn and check that one record per lfn comes out, with the
        expected events, locations, parents and per-run lumi lists.
        """
        originalFiles = [
            {u'events': 165,
             u'lfn': u'/store/unmerged/fileA.root',
             u'locations': [u'T2_CH_CERN', u'T2_CH_CERNBOX'],
             u'parents': [],
             u'runs': [{u'lumis': [1810823], u'run_number': 1}]},
            {u'events': 165,
             u'lfn': u'/store/unmerged/fileA.root',
             u'locations': [u'T2_CH_CERN', u'T2_CH_CERNBOX'],
             u'parents': [],
             u'runs': [{u'lumis': [1810823], u'run_number': 2}]},
            {u'events': 50,
             u'lfn': u'/store/unmerged/fileB.root',
             u'locations': [u'T1_US_FNAL_MSS'],
             u'parents': ['file1', 'file3'],
             u'runs': [{u'lumis': [1, 2, 3], u'run_number': 1}]},
            {u'events': 165,
             u'lfn': u'/store/unmerged/fileA.root',
             u'locations': [u'T2_CH_CERN', u'T2_CH_CERNBOX'],
             u'parents': [],
             u'runs': [{u'lumis': [1810824], u'run_number': 1}]},
            {u'events': 50,
             u'lfn': u'/store/unmerged/fileB.root',
             u'locations': [u'T1_US_FNAL_MSS'],
             u'parents': ['file2'],
             u'runs': [{u'lumis': [4, 5, 6], u'run_number': 1},
                       {u'lumis': [9], u'run_number': 1},
                       {u'lumis': [7, 8], u'run_number': 7}]},
            {u'events': 10,
             u'lfn': u'/store/unmerged/fileC.root',
             u'locations': [u'T1_US_FNAL_Disk', u'T2_US_MIT'],
             u'parents': [],
             u'runs': [{u'lumis': [111], u'run_number': 222}]},
        ]

        mergedFiles = mergeFilesInfo(originalFiles)
        self.assertEqual(len(mergedFiles), 3, "Error: wrong number of files.")
        mergedLfns = [i['lfn'] for i in mergedFiles]
        self.assertItemsEqual(mergedLfns, ['/store/unmerged/fileA.root',
                                           '/store/unmerged/fileB.root',
                                           '/store/unmerged/fileC.root'])

        for item in mergedFiles:
            if item['lfn'] == '/store/unmerged/fileA.root':
                self.assertEqual(item['events'], 165)
                self.assertItemsEqual(item['locations'], ['T2_CH_CERN', 'T2_CH_CERNBOX'])
                # only runs 1 and 2 are expected for fileA
                for runInfo in item['runs']:
                    runNumber = runInfo['run_number']
                    if runNumber not in (1, 2):
                        raise AssertionError("This should never happen")
                    expectedLumis = [1810824, 1810823] if runNumber == 1 else [1810823]
                    self.assertItemsEqual(runInfo['lumis'], expectedLumis)
                self.assertEqual(item['parents'], [])
            elif item['lfn'] == '/store/unmerged/fileB.root':
                self.assertEqual(item['events'], 50)
                self.assertItemsEqual(item['locations'], ['T1_US_FNAL_MSS'])
                # only runs 1 and 7 are expected for fileB
                for runInfo in item['runs']:
                    runNumber = runInfo['run_number']
                    if runNumber not in (1, 7):
                        raise AssertionError("This should never happen")
                    expectedLumis = [1, 2, 3, 4, 5, 6, 9] if runNumber == 1 else [7, 8]
                    self.assertItemsEqual(runInfo['lumis'], expectedLumis)
                self.assertItemsEqual(item['parents'], ['file1', 'file2', 'file3'])
            elif item['lfn'] == '/store/unmerged/fileC.root':
                self.assertEqual(item['events'], 10)
                self.assertItemsEqual(item['locations'], ['T1_US_FNAL_Disk', 'T2_US_MIT'])
                self.assertItemsEqual(item['runs'], [{'lumis': [111], 'run_number': 222}])
                self.assertEqual(item['parents'], [])
Exemplo n.º 4
0
    def testFakeMergeFilesInfo(self):
        """
        _testFakeMergeFilesInfo_

        Pass mergeFilesInfo five MCFakeFile records spread over three lfns
        and check the number of merged records, the sum of their events and
        the amount of lumis in the first run entry of MCFakeFile-File1.
        """
        # (lfn, first_event, first lumi); each record carries 11 consecutive lumis
        fileSpecs = [('MCFakeFile-File1', 1, 1),
                     ('MCFakeFile-File2', 1000001, 21),
                     ('MCFakeFile-File1', 2000001, 41),
                     ('MCFakeFile-File3', 7000001, 81),
                     ('MCFakeFile-File3', 4000001, 51)]

        fakeFiles = []
        for lfn, firstEvent, firstLumi in fileSpecs:
            fakeFiles.append({'checksums': {},
                              'events': 500000,
                              'first_event': firstEvent,
                              'id': 40,
                              'last_event': 0,
                              'lfn': lfn,
                              'locations': ['T1_DE_KIT_Disk'],
                              'merged': '0',
                              'parents': [],
                              'runs': [{'lumis': list(range(firstLumi, firstLumi + 11)),
                                        'run_number': 1}],
                              'size': 0})

        mergedFiles = mergeFilesInfo(fakeFiles)
        self.assertEqual(len(mergedFiles), 3, "Error: wrong number of files.")

        totalEvents = sum(entry['events'] for entry in mergedFiles)
        self.assertEqual(totalEvents, 2500000, "Error: wrong number of total events.")

        for entry in mergedFiles:
            if entry['lfn'] != 'MCFakeFile-File1':
                continue
            # File1 appears twice in the input with 11 lumis each
            self.assertEqual(len(entry['runs'][0]['lumis']), 22)
Exemplo n.º 5
0
    def testDataMergeFilesInfo(self):
        """
        _testDataMergeFilesInfo_

        Verify that we can properly merge real input files coming from
        the ACDCServer.

        Six input records spread over three lfns (fileA, fileB, fileC) are
        passed to mergeFilesInfo; the result must contain one record per lfn
        and each of them is checked for events, locations, runs and parents.
        """
        originalFiles = [{u'events': 165,
                          u'lfn': u'/store/unmerged/fileA.root',
                          u'locations': [u'T2_CH_CERN', u'T2_CH_CERNBOX'],
                          u'parents': [],
                          u'runs': [{u'lumis': [1810823], u'run_number': 1}]},
                         {u'events': 165,
                          u'lfn': u'/store/unmerged/fileA.root',
                          u'locations': [u'T2_CH_CERN', u'T2_CH_CERNBOX'],
                          u'parents': [],
                          u'runs': [{u'lumis': [1810823], u'run_number': 2}]},
                         {u'events': 50,
                          u'lfn': u'/store/unmerged/fileB.root',
                          u'locations': [u'T1_US_FNAL_MSS'],
                          u'parents': ['file1', 'file3'],
                          u'runs': [{u'lumis': [1, 2, 3], u'run_number': 1}]},
                         {u'events': 165,
                          u'lfn': u'/store/unmerged/fileA.root',
                          u'locations': [u'T2_CH_CERN', u'T2_CH_CERNBOX'],
                          u'parents': [],
                          u'runs': [{u'lumis': [1810824], u'run_number': 1}]},
                         {u'events': 50,
                          u'lfn': u'/store/unmerged/fileB.root',
                          u'locations': [u'T1_US_FNAL_MSS'],
                          u'parents': ['file2'],
                          u'runs': [{u'lumis': [4, 5, 6], u'run_number': 1}, {u'lumis': [9], u'run_number': 1}]},
                         {u'events': 10,
                          u'lfn': u'/store/unmerged/fileC.root',
                          u'locations': [u'T1_US_FNAL_Disk', u'T2_US_MIT'],
                          u'parents': [],
                          u'runs': [{u'lumis': [111], u'run_number': 222}]}]

        mergedFiles = mergeFilesInfo(originalFiles)
        self.assertEqual(len(mergedFiles), 3, "Error: wrong number of files.")
        self.assertItemsEqual([i['lfn'] for i in mergedFiles], ['/store/unmerged/fileA.root',
                                                                '/store/unmerged/fileB.root',
                                                                '/store/unmerged/fileC.root'])

        for item in mergedFiles:
            if item['lfn'] == '/store/unmerged/fileA.root':
                self.assertEqual(item['events'], 165)
                self.assertItemsEqual(item['locations'], ['T2_CH_CERN', 'T2_CH_CERNBOX'])
                self.assertItemsEqual(item['runs'], [{'lumis': [1810823], 'run_number': 1},
                                                     {'lumis': [1810823], 'run_number': 2},
                                                     {'lumis': [1810824], 'run_number': 1}])
                self.assertEqual(item['parents'], [])
            elif item['lfn'] == '/store/unmerged/fileB.root':
                self.assertEqual(item['events'], 50)
                self.assertItemsEqual(item['locations'], ['T1_US_FNAL_MSS'])
                self.assertItemsEqual(item['runs'], [{'lumis': [1, 2, 3], 'run_number': 1},
                                                     {'lumis': [4, 5, 6], 'run_number': 1},
                                                     {'lumis': [9], 'run_number': 1}])
                self.assertItemsEqual(item['parents'], ['file1', 'file2', 'file3'])
            # This branch must match fileC: a second fileB comparison here would be
            # unreachable and the fileC record would never be validated.
            elif item['lfn'] == '/store/unmerged/fileC.root':
                self.assertEqual(item['events'], 10)
                self.assertItemsEqual(item['locations'], ['T1_US_FNAL_Disk', 'T2_US_MIT'])
                self.assertItemsEqual(item['runs'], [{'lumis': [111], 'run_number': 222}])
                self.assertEqual(item['parents'], [])
Exemplo n.º 6
0
    def testFakeMergeFilesInfo(self):
        """
        _testFakeMergeFilesInfo_

        Check that mergeFilesInfo collapses MCFakeFile records sharing the
        same lfn: five input records over three lfns must yield three
        records, 2500000 events in total and 22 lumis in the first run entry
        of MCFakeFile-File1.
        """

        def makeFakeFile(lfn, firstEvent, lumis):
            """Build one MCFakeFile record; only lfn, first_event and lumis vary."""
            return {'checksums': {},
                    'events': 500000,
                    'first_event': firstEvent,
                    'id': 40,
                    'last_event': 0,
                    'lfn': lfn,
                    'locations': ['T1_DE_KIT_Disk'],
                    'merged': '0',
                    'parents': [],
                    'runs': [{'lumis': lumis, 'run_number': 1}],
                    'size': 0}

        fakeFiles = [
            makeFakeFile('MCFakeFile-File1', 1, [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11]),
            makeFakeFile('MCFakeFile-File2', 1000001, [21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31]),
            makeFakeFile('MCFakeFile-File1', 2000001, [41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51]),
            makeFakeFile('MCFakeFile-File3', 7000001, [81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91]),
            makeFakeFile('MCFakeFile-File3', 4000001, [51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61]),
        ]

        mergedFiles = mergeFilesInfo(fakeFiles)
        self.assertEqual(len(mergedFiles), 3, "Error: wrong number of files.")

        totalEvents = sum(merged['events'] for merged in mergedFiles)
        self.assertEqual(totalEvents, 2500000, "Error: wrong number of total events.")

        for merged in mergedFiles:
            if merged['lfn'] != 'MCFakeFile-File1':
                continue
            # two File1 input records with 11 lumis each
            firstRunLumis = merged['runs'][0]['lumis']
            self.assertEqual(len(firstRunLumis), 22)