def main():
    """Print cluster coverage between two cluster files given on the CLI.

    Parses the required ``--sourcefile`` and ``--tgtfile`` options, builds
    clusters from each file with ``buildclustersfromfile``, matches them via
    ``simcluster.calcmatchingclusters`` and prints the two values returned
    by ``simcluster.coverage`` (called once with ``True`` and once with
    ``False`` as its last argument).
    """
    parser = argparse.ArgumentParser()
    parser.add_argument('--sourcefile', type=str, required=True)
    parser.add_argument('--tgtfile', type=str, required=True)
    args = vars(parser.parse_args())
    sourcepath = args['sourcefile']
    tgtpath = args['tgtfile']

    # Context managers guarantee both handles are closed on every exit
    # path (the previous code never closed them).  All cluster processing
    # stays inside the blocks in case the parsed clusters read lazily.
    with open(sourcepath, 'r') as sourcefile:
        sourceclusters = buildclustersfromfile(sourcefile)
        with open(tgtpath, 'r') as tgtfile:
            tgtclusters = buildclustersfromfile(tgtfile)

            # NOTE(review): 0.66 and 1 are passed straight through to
            # calcmatchingclusters; their meaning is defined there
            # (presumably a match threshold) -- confirm.
            matched_cluster_triples = simcluster.calcmatchingclusters(
                sourceclusters, tgtclusters, 0.66, 1)

            # The last argument selects which coverage figure is computed:
            # True feeds the "source" report line, False the "target" one.
            srccvg = simcluster.coverage(
                sourceclusters, tgtclusters, matched_cluster_triples, True)
            tgtcvg = simcluster.coverage(
                sourceclusters, tgtclusters, matched_cluster_triples, False)

    # Report the file paths; formatting the file objects themselves would
    # print their repr (including a memory address) instead of the name.
    # A single parenthesised argument prints identically with the
    # Python 2 print statement and the Python 3 print function.
    print(' source coverage of source clusters from {0} to {1}: {2}'.format(
        sourcepath, tgtpath, srccvg))
    print(' target coverage of source clusters from {0} to {1}: {2}'.format(
        sourcepath, tgtpath, tgtcvg))
def compareTwoVersions(source, target):
    """Compute the coverage pair between two cluster files.

    Args:
        source: path of the source cluster file, opened for reading.
        target: path of the target cluster file, opened for reading.

    Returns:
        A ``(srccvg, tgtcvg)`` tuple holding the results of
        ``simcluster.coverage`` called with ``True`` and with ``False``
        as its last argument, respectively.
    """
    # Both handles are closed when the block exits, including on error
    # (the previous code leaked them).  The computation stays inside the
    # block in case the parsed clusters read from the files lazily.
    with open(source, 'r') as srcf, open(target, 'r') as tgtf:
        srcclusters = simcluster.buildclustersfromfile(srcf)
        tgtclusters = simcluster.buildclustersfromfile(tgtf)

        # NOTE(review): 0.66 and 1 are forwarded unchanged to
        # calcmatchingclusters; their meaning is defined there
        # (presumably a match threshold) -- confirm.
        matched_cluster_triples = simcluster.calcmatchingclusters(
            srcclusters, tgtclusters, 0.66, 1)

        # True -> value reported as source coverage,
        # False -> value reported as target coverage.
        srccvg = simcluster.coverage(
            srcclusters, tgtclusters, matched_cluster_triples, True)
        tgtcvg = simcluster.coverage(
            srcclusters, tgtclusters, matched_cluster_triples, False)
        return (srccvg, tgtcvg)
def runAnalysis(args, sortedfilesbyversion):
    """Print coverage figures for every (earlier, later) pair of versions.

    Args:
        args: object exposing an ``inputdir`` attribute; ``~`` in it is
            expanded and the result is joined with each file name.
        sortedfilesbyversion: sequence of ``(version, filename)`` pairs.
            Each entry is compared against every entry that follows it.
    """
    for srcidx, (srcversion, srcfile) in enumerate(sortedfilesbyversion):
        # Pair the current entry with each later entry only.
        for tgtversion, tgtfile in sortedfilesbyversion[srcidx + 1:]:
            inputdir = expanduser(args.inputdir)
            srcpath = os.path.join(inputdir, srcfile)
            tgtpath = os.path.join(inputdir, tgtfile)

            # The source file is re-read for every pair on purpose: it is
            # not visible here whether simcluster mutates the clusters.
            # The with-block closes both handles each iteration (they
            # were previously leaked, two per pair).
            with open(srcpath, 'r') as srcf, open(tgtpath, 'r') as tgtf:
                srcclusters = simcluster.buildclustersfromfile(srcf)
                tgtclusters = simcluster.buildclustersfromfile(tgtf)

                # NOTE(review): 0.66 and 1 are forwarded unchanged; their
                # meaning is defined by calcmatchingclusters -- confirm.
                matched_cluster_triples = simcluster.calcmatchingclusters(
                    srcclusters, tgtclusters, 0.66, 1)

                # True -> value reported as source coverage,
                # False -> value reported as target coverage.
                srccvg = simcluster.coverage(
                    srcclusters, tgtclusters, matched_cluster_triples, True)
                tgtcvg = simcluster.coverage(
                    srcclusters, tgtclusters, matched_cluster_triples, False)

            # Single-argument parenthesised print works the same with the
            # Python 2 print statement and the Python 3 print function.
            print(
                ' source coverage of source clusters from {0} to {1}: {2}'
                .format(srcversion, tgtversion, srccvg))
            print(
                ' target coverage of source clusters from {0} to {1}: {2}'
                .format(srcversion, tgtversion, tgtcvg))
            # NOTE(review): emitted once per pair here; the original
            # nesting level of this separator should be confirmed.
            print('\n')
def main():
    """Command-line entry point: report coverage between two cluster files.

    Requires ``--sourcefile`` and ``--tgtfile``.  Clusters are built from
    each file with ``buildclustersfromfile``, matched through
    ``simcluster.calcmatchingclusters``, and the two results of
    ``simcluster.coverage`` (last argument ``True`` / ``False``) are
    printed.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument('--sourcefile', type=str, required=True)
    parser.add_argument('--tgtfile', type=str, required=True)
    args = vars(parser.parse_args())
    src_path = args['sourcefile']
    tgt_path = args['tgtfile']

    # Open each file in a with-block so it is closed even when parsing or
    # matching raises; previously neither handle was ever closed.  The
    # cluster work is kept inside the blocks in case parsing is lazy.
    with open(src_path, 'r') as sourcefile:
        sourceclusters = buildclustersfromfile(sourcefile)
        with open(tgt_path, 'r') as tgtfile:
            tgtclusters = buildclustersfromfile(tgtfile)

            # NOTE(review): the literals 0.66 and 1 are handed to
            # calcmatchingclusters as-is; see that function for their
            # meaning (presumably a match threshold) -- confirm.
            matched_cluster_triples = simcluster.calcmatchingclusters(
                sourceclusters, tgtclusters, 0.66, 1)

            # Final flag: True yields the figure printed as "source
            # coverage", False the one printed as "target coverage".
            srccvg = simcluster.coverage(
                sourceclusters, tgtclusters, matched_cluster_triples, True)
            tgtcvg = simcluster.coverage(
                sourceclusters, tgtclusters, matched_cluster_triples, False)

    # Show the paths supplied by the user; str() of a file object gives
    # its repr with a memory address rather than a usable name.
    # Parenthesised single-argument print is valid on Python 2 and 3.
    print(' source coverage of source clusters from {0} to {1}: {2}'.format(
        src_path, tgt_path, srccvg))
    print(' target coverage of source clusters from {0} to {1}: {2}'.format(
        src_path, tgt_path, tgtcvg))
def runAnalysis(args, sortedfilesbyversion):
    """Compare each version's clusters with every later version's clusters.

    For each pair the two ``simcluster.coverage`` results are printed,
    labelled with the source and target version identifiers.

    Args:
        args: object with an ``inputdir`` attribute naming the directory
            that holds the cluster files (``~`` is expanded).
        sortedfilesbyversion: sequence of ``(version, filename)`` pairs;
            entry *i* is paired with entries *i+1 .. end*.
    """
    for srcidx, (srcversion, srcfile) in enumerate(sortedfilesbyversion):
        later_entries = sortedfilesbyversion[srcidx + 1:]
        for tgtversion, tgtfile in later_entries:
            basedir = expanduser(args.inputdir)

            # Files are opened per pair and closed by the with-block;
            # the earlier code left two handles open on every iteration.
            # Source clusters are rebuilt each time because it cannot be
            # seen from here whether simcluster modifies them in place.
            with open(os.path.join(basedir, srcfile), 'r') as srcf, \
                    open(os.path.join(basedir, tgtfile), 'r') as tgtf:
                srcclusters = simcluster.buildclustersfromfile(srcf)
                tgtclusters = simcluster.buildclustersfromfile(tgtf)

                # NOTE(review): 0.66 and 1 go to calcmatchingclusters
                # untouched; their semantics live there -- confirm.
                matched_cluster_triples = simcluster.calcmatchingclusters(
                    srcclusters, tgtclusters, 0.66, 1)

                # Last argument True -> reported as source coverage,
                # False -> reported as target coverage.
                srccvg = simcluster.coverage(
                    srcclusters, tgtclusters, matched_cluster_triples, True)
                tgtcvg = simcluster.coverage(
                    srcclusters, tgtclusters, matched_cluster_triples, False)

            # One parenthesised argument keeps print valid and identical
            # under both Python 2 and Python 3.
            print(
                ' source coverage of source clusters from {0} to {1}: {2}'
                .format(srcversion, tgtversion, srccvg))
            print(
                ' target coverage of source clusters from {0} to {1}: {2}'
                .format(srcversion, tgtversion, tgtcvg))
            # NOTE(review): separator printed after every pair; confirm
            # this matches the originally intended nesting level.
            print('\n')