# Set up the repo-Topics collection run: load the repo list, the GraphQL
# query template and the auth header, then start the per-repo loop.
allData = {}

# Read repo info data file (to use as repo list)
dataObj = helpers.read_json("../github-data/labReposInfo.json")

# Populate repo list from the keys under "data"; sorted so the run order
# is deterministic.
print("Getting internal repos ...")
repolist = sorted(dataObj["data"])
print("Repo list complete. Found %d repos." % (len(repolist)))

# Read pretty GraphQL query
query_in = helpers.read_gql("../queries/repo-Topics.gql")

# Retrieve authorization token
authhead = helpers.get_gitauth()

# Iterate through internal repos
print("Gathering data across multiple paginated queries...")
collective = {u'data': {}}
tab = " "

for repo in repolist:
    # Every repo starts at the first page of results.
    pageNum = 1
    print("\n'%s'" % (repo))
    print(tab + "page " + str(pageNum))

    # NOTE(review): presumably each key is an "owner/name" string -- confirm
    # against labReposInfo.json. Only the part before the first "/" is used
    # here.
    repoSplit = repo.split("/")

    # Substitute the OWNNAME placeholder in the query template.
    print(tab + "Modifying query...")
    newqueryRep = re.sub('OWNNAME', repoSplit[0], query_in)
# Set up the repo-CreationDate collection run: load the repo list, the query
# templates and the auth header, then start the per-repo loop.

# Populate repo list from the keys under "data"; sorted so the run order
# is deterministic.
print("Getting internal repos ...")
repolist = sorted(dataObj["data"])
print("Repo list complete. Found %d repos." % (len(repolist)))

# Read pretty GraphQL query
query_in = helpers.read_gql("../queries/repo-CreationDate.gql")

# Rest endpoint query templates; OWNNAME, REPONAME and CREATETIME are
# placeholders to be substituted per repo.
query_commits_in = "/repos/OWNNAME/REPONAME/commits?until=CREATETIME&per_page=100"
query_commits_in2 = "/repos/OWNNAME/REPONAME/commits?per_page=100"

# Retrieve authorization token
authhead = helpers.get_gitauth()

# Iterate through internal repos
print("Gathering data across multiple paginated queries...")
collective = {u'data': {}}
tab = " "

for repo in repolist:
    # History doesn't change, only update new repos or those that had no
    # previous commits. A repo is skipped only when it already has a truthy
    # "firstCommitAt" value recorded.
    recorded = allData.get("data", {})
    if repo in recorded and recorded[repo]["firstCommitAt"]:
        print(tab + "Already recorded data for '%s'" % (repo))
        continue

    # Every repo that still needs data starts at the first page of results.
    pageNum = 1