Пример #1
0
    print("@prefix m: <http://learningsparql.com/model#> .")
    print("@prefix dc: <http://purl.org/dc/elements/1.1/> .\n")
    # NOTE(review): the d: prefix used below is not declared in the lines
    # visible here; presumably it is printed just before this point - confirm.

    # Emit one dc:title triple per recipe, then one blank-node record for
    # every unordered pair of recipes (i1 < i2) holding the three cosine
    # similarities (XML, plain text and title embeddings).
    recipesToCompare = len(recipeDataArray)  # or some small number for tests

    for i1 in range(recipesToCompare):
        # Escape the title for a Turtle "..." literal. The backslash must be
        # handled first so the backslashes introduced by the later
        # replacements are not doubled; raw line breaks are not allowed in a
        # single-quoted-style literal either, so they become \n / \r escapes.
        title = (recipeDataArray[i1][recipeTitleField]
                 .replace('\\', '\\\\')
                 .replace('"', '\\"')
                 .replace('\n', '\\n')
                 .replace('\r', '\\r'))
        print('d:' + str(i1) + ' dc:title "' + title + '" .')

        # Only pairs with i2 > i1 are compared, so each pair is emitted once
        # and a recipe is never compared with itself.
        for i2 in range(i1 + 1, recipesToCompare):
            XMLCosinSim = obj.cos_sim(
                recipeDataArray[i1][recipeXMLEmbeddingField],
                recipeDataArray[i2][recipeXMLEmbeddingField])

            textCosinSim = obj.cos_sim(
                recipeDataArray[i1][recipePlainTextEmbeddingField],
                recipeDataArray[i2][recipePlainTextEmbeddingField])

            titleCosinSim = obj.cos_sim(
                recipeDataArray[i1][recipeTitleEmbeddingField],
                recipeDataArray[i2][recipeTitleEmbeddingField])

            # Output (spread over two lines) looks like:
            #   [ m:doc d:0, d:1 ; m:XMLCosinSim 0.82;
            #    m:textCosinSim 0.79 ; m:titleCosinSim 0.65 ] .
            print('[ m:doc d:' + str(i1) + ', d:' + str(i2) +
                  ' ; m:XMLCosinSim ' + str(XMLCosinSim) + '; ')
            print(' m:textCosinSim ' + str(textCosinSim) +
                  ' ; m:titleCosinSim ' + str(titleCosinSim) + ' ] .')
Пример #2
0
    # Merge the three partial arrays into the single list that is compared.
    recipeDataArray = a_f_array + g_p_array + q_z_array

    # Timestamps are written as '#' lines, which are comments in Turtle.
    print('# starting comparisons: ' + time.strftime('%H:%M:%S'))

    # output header of RDF
    print("@prefix d: <http://learningsparql.com/data#> .")
    print("@prefix m: <http://learningsparql.com/model#> .")
    print("@prefix dc: <http://purl.org/dc/elements/1.1/> .\n")

    # Emit one dc:title triple per recipe, then one blank-node record with
    # the cosine similarity for every unordered pair of recipes (i1 < i2).
    recipesToCompare = len(recipeDataArray)  # or some small number for tests

    for i1 in range(recipesToCompare):
        # NOTE(review): the URL is written between <...> without any
        # escaping; this assumes it contains no characters that are illegal
        # in a Turtle IRI (spaces, quotes, angle brackets, ...) - confirm.
        subjectIRI = '<' + recipeDataArray[i1][urlField] + '>'

        # Escape the title for a Turtle "..." literal. The backslash must be
        # handled first so the backslashes introduced by the later
        # replacements are not doubled; raw line breaks are not allowed in
        # this literal form either, so they become \n / \r escapes.
        title = (recipeDataArray[i1][recipeTitleField]
                 .replace('\\', '\\\\')
                 .replace('"', '\\"')
                 .replace('\n', '\\n')
                 .replace('\r', '\\r'))
        print(subjectIRI + '  dc:title "' + title + '" .')

        # Only pairs with i2 > i1 are compared, so each pair is emitted once
        # and a recipe is never compared with itself.
        for i2 in range(i1 + 1, recipesToCompare):
            recipeCosineSim = obj.cos_sim(
                recipeDataArray[i1][recipeEmbeddingField],
                recipeDataArray[i2][recipeEmbeddingField])

            # output triples like
            #   [ m:doc <url1>, <url2> ; m:recipeCosineSim 0.8249611 ] .
            print('[ m:doc ' + subjectIRI + ', <' +
                  recipeDataArray[i2][urlField] + '> ; m:recipeCosineSim ' +
                  str(recipeCosineSim) + ' ] . ')

# Closing marker with the wall-clock time; the leading '#' keeps the line a
# comment when the output is read as Turtle.
print('# finished: ', time.strftime('%H:%M:%S'), sep='')