Example #1
0
def main():
    """Compare the clusters of two files and print both coverage values.

    Command-line arguments (both required):
        --sourcefile  path of the file the source clusters are built from
        --tgtfile     path of the file the target clusters are built from

    The clusters are matched with ``simcluster.calcmatchingclusters`` and the
    two results of ``simcluster.coverage`` are printed to stdout.

    Raises IOError if either file cannot be opened.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument('--sourcefile', type=str, required=True)
    parser.add_argument('--tgtfile', type=str, required=True)

    args = vars(parser.parse_args())
    src_path = args['sourcefile']
    tgt_path = args['tgtfile']

    # Both handles are closed deterministically when the block exits.  The
    # whole computation stays inside the block because it is not visible here
    # whether the cluster objects still read from the files later on.
    with open(src_path, 'r') as sourcefile, open(tgt_path, 'r') as tgtfile:
        sourceclusters = buildclustersfromfile(sourcefile)
        tgtclusters = buildclustersfromfile(tgtfile)

        # 0.66 and 1 are handed to calcmatchingclusters unchanged; their
        # meaning is defined by simcluster -- TODO confirm and name them.
        matched_cluster_triples = simcluster.calcmatchingclusters(
            sourceclusters, tgtclusters, 0.66, 1)
        # Last argument True: coverage for the source clusters.
        srccvg = simcluster.coverage(sourceclusters, tgtclusters,
                                     matched_cluster_triples, True)
        # Last argument False: presumably coverage for the target clusters
        # (the result is reported as "target coverage") -- confirm against
        # simcluster.coverage.
        tgtcvg = simcluster.coverage(sourceclusters, tgtclusters,
                                     matched_cluster_triples, False)

    # Report the paths themselves; formatting the file objects would print
    # their repr (including a memory address) rather than the file names.
    # Single-argument print(...) behaves the same on Python 2 and 3.
    print(' source coverage of source clusters from {0} to {1}: {2}'.format(
        src_path, tgt_path, srccvg))
    print(' target coverage of source clusters from {0} to {1}: {2}'.format(
        src_path, tgt_path, tgtcvg))
Example #2
0
def compareTwoVersions(source, target):
    """Return the coverage pair for the cluster files at two paths.

    source: path of the file the source clusters are built from.
    target: path of the file the target clusters are built from.

    Returns a tuple ``(srccvg, tgtcvg)`` holding the two results of
    ``simcluster.coverage`` (called with True and False respectively).

    Raises IOError if either file cannot be opened.
    """
    # Both handles are closed deterministically when the block exits.  The
    # whole computation stays inside the block because it is not visible here
    # whether the cluster objects still read from the files later on.
    with open(source, 'r') as srcf, open(target, 'r') as tgtf:
        srcclusters = simcluster.buildclustersfromfile(srcf)
        tgtclusters = simcluster.buildclustersfromfile(tgtf)

        # 0.66 and 1 are handed to calcmatchingclusters unchanged; their
        # meaning is defined by simcluster -- TODO confirm and name them.
        matched_cluster_triples = simcluster.calcmatchingclusters(
            srcclusters, tgtclusters, 0.66, 1)
        # Last argument True: coverage for the source clusters.
        srccvg = simcluster.coverage(srcclusters, tgtclusters,
                                     matched_cluster_triples, True)
        # Last argument False: presumably coverage for the target clusters
        # -- confirm against simcluster.coverage.
        tgtcvg = simcluster.coverage(srcclusters, tgtclusters,
                                     matched_cluster_triples, False)
    return (srccvg, tgtcvg)
def runAnalysis(args, sortedfilesbyversion):
    """Print coverage values for every (earlier, later) pair of versions.

    args: object whose ``inputdir`` attribute names the directory holding
        the files; a leading ``~`` is expanded.
    sortedfilesbyversion: list of ``(version, filename)`` pairs.  Each entry
        is compared against every entry that follows it in the list.

    Nothing is returned.  Two lines are printed per pair, and a blank
    separator is printed after each source version.

    Raises IOError if a file cannot be opened.
    """
    # The input directory does not change between iterations.
    inputdir = expanduser(args.inputdir)

    for srcidx, (srcversion, srcfile) in enumerate(sortedfilesbyversion):
        srcpath = os.path.join(inputdir, srcfile)
        for tgtversion, tgtfile in sortedfilesbyversion[srcidx + 1:]:
            tgtpath = os.path.join(inputdir, tgtfile)
            # Close both handles at the end of every comparison instead of
            # leaving one pair of open files behind per iteration.  The
            # computation stays inside the block because it is not visible
            # here whether the cluster objects still read from the files.
            with open(srcpath, 'r') as srcf, open(tgtpath, 'r') as tgtf:
                srcclusters = simcluster.buildclustersfromfile(srcf)
                tgtclusters = simcluster.buildclustersfromfile(tgtf)
                # 0.66 and 1 are handed to calcmatchingclusters unchanged;
                # their meaning is defined by simcluster -- TODO confirm.
                matched_cluster_triples = simcluster.calcmatchingclusters(
                    srcclusters, tgtclusters, 0.66, 1)
                # True: coverage for the source clusters.
                srccvg = simcluster.coverage(
                    srcclusters, tgtclusters, matched_cluster_triples, True)
                # False: presumably coverage for the target clusters --
                # confirm against simcluster.coverage.
                tgtcvg = simcluster.coverage(
                    srcclusters, tgtclusters, matched_cluster_triples, False)
            # Single-argument print(...) behaves the same on Python 2 and 3.
            print(
                ' source coverage of source clusters from {0} to {1}: {2}'
                .format(srcversion, tgtversion, srccvg))
            print(
                ' target coverage of source clusters from {0} to {1}: {2}'
                .format(srcversion, tgtversion, tgtcvg))

        print('\n')
def main():
    """Compare the clusters of two files and print both coverage values.

    Command-line arguments (both required):
        --sourcefile  path of the file the source clusters are built from
        --tgtfile     path of the file the target clusters are built from

    The clusters are matched with ``simcluster.calcmatchingclusters`` and the
    two results of ``simcluster.coverage`` are printed to stdout.

    Raises IOError if either file cannot be opened.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument('--sourcefile', type=str, required=True)
    parser.add_argument('--tgtfile', type=str, required=True)

    args = vars(parser.parse_args())
    src_path = args['sourcefile']
    tgt_path = args['tgtfile']

    # Both handles are closed deterministically when the block exits.  The
    # whole computation stays inside the block because it is not visible here
    # whether the cluster objects still read from the files later on.
    with open(src_path, 'r') as sourcefile, open(tgt_path, 'r') as tgtfile:
        sourceclusters = buildclustersfromfile(sourcefile)
        tgtclusters = buildclustersfromfile(tgtfile)

        # 0.66 and 1 are handed to calcmatchingclusters unchanged; their
        # meaning is defined by simcluster -- TODO confirm and name them.
        matched_cluster_triples = simcluster.calcmatchingclusters(
            sourceclusters, tgtclusters, 0.66, 1)
        # Last argument True: coverage for the source clusters.
        srccvg = simcluster.coverage(sourceclusters, tgtclusters,
                                     matched_cluster_triples, True)
        # Last argument False: presumably coverage for the target clusters
        # (the result is reported as "target coverage") -- confirm against
        # simcluster.coverage.
        tgtcvg = simcluster.coverage(sourceclusters, tgtclusters,
                                     matched_cluster_triples, False)

    # Report the paths themselves; formatting the file objects would print
    # their repr (including a memory address) rather than the file names.
    # Single-argument print(...) behaves the same on Python 2 and 3.
    print(' source coverage of source clusters from {0} to {1}: {2}'.format(
        src_path, tgt_path, srccvg))
    print(' target coverage of source clusters from {0} to {1}: {2}'.format(
        src_path, tgt_path, tgtcvg))
Example #5
0
def runAnalysis(args, sortedfilesbyversion):
    """Print coverage values for every (earlier, later) pair of versions.

    args: object whose ``inputdir`` attribute names the directory holding
        the files; a leading ``~`` is expanded.
    sortedfilesbyversion: list of ``(version, filename)`` pairs.  Each entry
        is compared against every entry that follows it in the list.

    Nothing is returned.  Two lines are printed per pair, and a blank
    separator is printed after each source version.

    Raises IOError if a file cannot be opened.
    """
    # The input directory does not change between iterations.
    inputdir = expanduser(args.inputdir)

    for srcidx, (srcversion, srcfile) in enumerate(sortedfilesbyversion):
        srcpath = os.path.join(inputdir, srcfile)
        for tgtversion, tgtfile in sortedfilesbyversion[srcidx + 1:]:
            tgtpath = os.path.join(inputdir, tgtfile)
            # Close both handles at the end of every comparison instead of
            # leaving one pair of open files behind per iteration.  The
            # computation stays inside the block because it is not visible
            # here whether the cluster objects still read from the files.
            with open(srcpath, 'r') as srcf, open(tgtpath, 'r') as tgtf:
                srcclusters = simcluster.buildclustersfromfile(srcf)
                tgtclusters = simcluster.buildclustersfromfile(tgtf)
                # 0.66 and 1 are handed to calcmatchingclusters unchanged;
                # their meaning is defined by simcluster -- TODO confirm.
                matched_cluster_triples = simcluster.calcmatchingclusters(
                    srcclusters, tgtclusters, 0.66, 1)
                # True: coverage for the source clusters.
                srccvg = simcluster.coverage(
                    srcclusters, tgtclusters, matched_cluster_triples, True)
                # False: presumably coverage for the target clusters --
                # confirm against simcluster.coverage.
                tgtcvg = simcluster.coverage(
                    srcclusters, tgtclusters, matched_cluster_triples, False)
            # Single-argument print(...) behaves the same on Python 2 and 3.
            print(
                ' source coverage of source clusters from {0} to {1}: {2}'
                .format(srcversion, tgtversion, srccvg))
            print(
                ' target coverage of source clusters from {0} to {1}: {2}'
                .format(srcversion, tgtversion, tgtcvg))

        print('\n')