Python UtilityMethods.updatePhraseTextAndDimensionsMap示例

编程语言: Python

命名空间/包名称: classes

类/类型: UtilityMethods

方法/功能: updatePhraseTextAndDimensionsMap

hotexamples.com的示例: 10

Python UtilityMethods.updatePhraseTextAndDimensionsMap - 已找到10个示例。这些是从开源项目中提取的、最受好评的 classes.UtilityMethods.updatePhraseTextAndDimensionsMap 真实 Python 示例。您可以为示例评分，以帮助我们提高示例质量。

常用方法

显示/隐藏

updateDimensions(6)

updatePhraseTextAndDimensionsMap(5)

updatePhraseTextToPhraseObject(5)

createOrAddNewPhraseObject(1)

pruneUnnecessaryPhrases(1)

pruningConditionDeterministic(1)

pruningConditionRandom(1)

示例#1

显示文件

文件： streaming_lsh_clustering.py 项目： greeness/streaming_lsh

 def getClusterForDocument(self, document):
     """Return the id of the best-matching cluster for ``document``, or None.

     The document is first run through
     ``UtilityMethods.updatePhraseTextAndDimensionsMap`` and given a
     signature. Candidate cluster ids are then gathered from every signature
     permutation and scored with ``cosineSimilarity`` against the document.
     The highest-scoring id is returned only if its score reaches
     ``self.thresholdForDocumentToBeInACluster``; in every other case the
     result is None.
     """
     UtilityMethods.updatePhraseTextAndDimensionsMap(
         document, self.phraseTextAndDimensionMap, **self.clustering_settings)
     document.setSignatureUsingVectorPermutations(
         self.unitVector, self.vectorPermutations,
         self.phraseTextAndDimensionMap)

     # Pool the candidates reported by each permutation into one set.
     candidateIds = set()
     for permutation in self.signaturePermutations:
         candidateIds.update(permutation.getNearestDocuments(document))
     if not candidateIds:
         return None

     scoredCandidates = [
         (clusterId, self.clusters[clusterId].cosineSimilarity(document))
         for clusterId in candidateIds]
     bestId, bestScore = max(scoredCandidates, key=itemgetter(1))
     if bestScore >= self.thresholdForDocumentToBeInACluster:
         return bestId
     return None

示例#2

显示文件

文件： nearest_neighbor_lsh.py 项目： greeness/streaming_lsh

 def getNearestDocument(self, document):
     """Return the id of the stored document most similar to ``document``, or None.

     The document is first run through
     ``UtilityMethods.updatePhraseTextAndDimensionsMap`` and given a
     signature. Candidate document ids are gathered from every signature
     permutation and scored with ``cosineSimilarity`` against ``document``.
     The best ``(docId, similarity)`` pair (or None when there were no
     candidates) is printed to stdout. The id is returned only if its
     similarity reaches ``self.nearestNeighborThreshold``; otherwise the
     result is None.
     """
     UtilityMethods.updatePhraseTextAndDimensionsMap(
         document, self.phraseTextAndDimensionMap, **self.settings)
     document.setSignatureUsingVectorPermutations(
         self.unitVector, self.vectorPermutations,
         self.phraseTextAndDimensionMap)
     predictedNeighbor = None
     # set().union(*iterables) replaces reduce(), which is a builtin only on
     # Python 2; the resulting set is the same.
     possibleNearestNeighbors = set().union(
         *[permutation.getNearestDocuments(document)
           for permutation in self.signaturePermutations])
     if possibleNearestNeighbors:
         predictedNeighbor = max(
             ((docId,
               self.documentIdToDocumentMap[docId].cosineSimilarity(document))
              for docId in possibleNearestNeighbors),
             key=itemgetter(1))
     # Parenthesised so the line parses on Python 3 as well as Python 2; with
     # a single argument the printed text is identical on both.
     print(predictedNeighbor)
     if (predictedNeighbor is not None
             and predictedNeighbor[1] >= self.nearestNeighborThreshold):
         return predictedNeighbor[0]
     return None

示例#3

显示文件

文件： nearest_neighbor_lsh.py 项目： greeness/streaming_lsh

 def update(self, newDocument):
     """Store ``newDocument``, replacing any document already held under its docId.

     The document is run through
     ``UtilityMethods.updatePhraseTextAndDimensionsMap``, recorded in
     ``self.documentIdToDocumentMap`` under ``newDocument.docId`` and given a
     signature. For every signature permutation, the document previously
     stored under that docId (if there was one) is removed and the new
     document is added.
     """
     UtilityMethods.updatePhraseTextAndDimensionsMap(
         newDocument, self.phraseTextAndDimensionMap, **self.settings)
     # Look up the old entry before it is overwritten so that it can still be
     # removed from each permutation below.
     currentDocument = self.documentIdToDocumentMap.get(newDocument.docId, None)
     self.documentIdToDocumentMap[newDocument.docId] = newDocument
     newDocument.setSignatureUsingVectorPermutations(
         self.unitVector, self.vectorPermutations,
         self.phraseTextAndDimensionMap)
     for permutation in self.signaturePermutations:
         # Identity test: ``!= None`` would dispatch to whatever comparison
         # methods the document class defines.
         if currentDocument is not None:
             permutation.removeDocument(currentDocument)
         permutation.addDocument(newDocument)

示例#4

显示文件

 def test_updatePhraseTextAndDimensionsMap_PhraseMapHasLesserDimensions(self):
     """With ``dimensions`` set to 4, the forward map must equal ``self.finalPhraseToIdMap``."""
     # NOTE(review): ``settings`` is not local to this test, so this override
     # remains in effect after the test returns -- confirm that is intended.
     settings['dimensions'] = 4
     UtilityMethods.updatePhraseTextAndDimensionsMap(
         self.phraseVector, self.phraseTextAndDimensionMap, **settings)
     forwardMap = self.phraseTextAndDimensionMap.getMap(TwoWayMap.MAP_FORWARD)
     self.assertEqual(self.finalPhraseToIdMap, forwardMap)

示例#5

显示文件

 def test_updatePhraseTextAndDimensionsMap_PhraseMapHasMaximumDimensions(self):
     """After an update, the forward map must equal the expected map minus two phrases.

     The 'streams' and 'highdimensional' entries are dropped from
     ``self.finalPhraseToIdMap`` before comparing (presumably because the map
     is already at its dimension limit -- confirm against the fixture).
     """
     UtilityMethods.updatePhraseTextAndDimensionsMap(
         self.phraseVector, self.phraseTextAndDimensionMap, **settings)
     for excludedPhrase in ('streams', 'highdimensional'):
         del self.finalPhraseToIdMap[excludedPhrase]
     forwardMap = self.phraseTextAndDimensionMap.getMap(TwoWayMap.MAP_FORWARD)
     self.assertEqual(self.finalPhraseToIdMap, forwardMap)

示例#6

显示文件

文件： nearest_neighbor_lsh.py 项目： greeness/streaming_lsh

 def update(self, newDocument):
     """Store ``newDocument``, replacing any document already held under its docId.

     The document is run through
     ``UtilityMethods.updatePhraseTextAndDimensionsMap``, recorded in
     ``self.documentIdToDocumentMap`` under ``newDocument.docId`` and given a
     signature. For every signature permutation, the document previously
     stored under that docId (if there was one) is removed and the new
     document is added.
     """
     UtilityMethods.updatePhraseTextAndDimensionsMap(
         newDocument, self.phraseTextAndDimensionMap, **self.settings)
     # Fetch the old entry before overwriting it; it is needed below to take
     # it out of each permutation.
     currentDocument = self.documentIdToDocumentMap.get(
         newDocument.docId, None)
     self.documentIdToDocumentMap[newDocument.docId] = newDocument
     newDocument.setSignatureUsingVectorPermutations(
         self.unitVector, self.vectorPermutations,
         self.phraseTextAndDimensionMap)
     for permutation in self.signaturePermutations:
         # ``is not None`` checks identity and never calls the document's
         # own ``__eq__``/``__ne__``, unlike ``!= None``.
         if currentDocument is not None:
             permutation.removeDocument(currentDocument)
         permutation.addDocument(newDocument)

示例#7

显示文件

 def getClusterForDocument(self, document):
     """Pick the cluster whose similarity to ``document`` is highest, if high enough.

     Steps: update the phrase/dimension map for the document, assign the
     document's signature, collect candidate cluster ids from each signature
     permutation, and score each candidate with ``cosineSimilarity``. Returns
     the top-scoring cluster id when its score is at least
     ``self.thresholdForDocumentToBeInACluster``; returns None otherwise
     (including when there are no candidates).
     """
     UtilityMethods.updatePhraseTextAndDimensionsMap(
         document, self.phraseTextAndDimensionMap, **self.clustering_settings)
     document.setSignatureUsingVectorPermutations(
         self.unitVector, self.vectorPermutations,
         self.phraseTextAndDimensionMap)

     # Merge the per-permutation candidate collections into one set.
     mergedCandidates = set()
     for permutation in self.signaturePermutations:
         mergedCandidates.update(permutation.getNearestDocuments(document))
     if not mergedCandidates:
         return None

     similarityPairs = []
     for clusterId in mergedCandidates:
         similarity = self.clusters[clusterId].cosineSimilarity(document)
         similarityPairs.append((clusterId, similarity))
     topCluster = max(similarityPairs, key=itemgetter(1))
     if topCluster[1] < self.thresholdForDocumentToBeInACluster:
         return None
     return topCluster[0]

示例#8

显示文件

文件： nearest_neighbor_lsh.py 项目： greeness/streaming_lsh

 def getNearestDocument(self, document):
     """Return the id of the stored document most similar to ``document``, or None.

     Updates the phrase/dimension map for the document, assigns its
     signature, gathers candidate document ids from every signature
     permutation and scores each with ``cosineSimilarity``. The best
     ``(docId, similarity)`` pair (None when there were no candidates) is
     printed to stdout. The id is returned only when the similarity is at
     least ``self.nearestNeighborThreshold``; otherwise None is returned.
     """
     UtilityMethods.updatePhraseTextAndDimensionsMap(
         document, self.phraseTextAndDimensionMap, **self.settings)
     document.setSignatureUsingVectorPermutations(
         self.unitVector, self.vectorPermutations,
         self.phraseTextAndDimensionMap)
     predictedNeighbor = None
     # Union via set().union(*...) rather than reduce(): reduce is a builtin
     # only on Python 2, while this form works unchanged on both versions.
     possibleNearestNeighbors = set().union(
         *[permutation.getNearestDocuments(document)
           for permutation in self.signaturePermutations])
     if possibleNearestNeighbors:
         predictedNeighbor = max(
             ((docId,
               self.documentIdToDocumentMap[docId].cosineSimilarity(document))
              for docId in possibleNearestNeighbors),
             key=itemgetter(1))
     # Function-call form: valid on Python 3 and, for a single argument,
     # prints exactly what the Python 2 statement form printed.
     print(predictedNeighbor)
     if (predictedNeighbor is not None
             and predictedNeighbor[1] >= self.nearestNeighborThreshold):
         return predictedNeighbor[0]
     return None

示例#9

显示文件

文件： classes_tests.py 项目： greeness/streaming_lsh

 def test_updatePhraseTextAndDimensionsMap_PhraseMapHasMaximumDimensions(self):
     """The forward map after an update must match the expected map without two phrases.

     'streams' and 'highdimensional' are deleted from
     ``self.finalPhraseToIdMap`` before the comparison.
     """
     UtilityMethods.updatePhraseTextAndDimensionsMap(
         self.phraseVector, self.phraseTextAndDimensionMap, **settings)
     for omittedPhrase in ('streams', 'highdimensional'):
         del self.finalPhraseToIdMap[omittedPhrase]
     actualForwardMap = self.phraseTextAndDimensionMap.getMap(
         TwoWayMap.MAP_FORWARD)
     self.assertEqual(self.finalPhraseToIdMap, actualForwardMap)

示例#10

显示文件

文件： classes_tests.py 项目： greeness/streaming_lsh

 def test_updatePhraseTextAndDimensionsMap_PhraseMapHasLesserDimensions(self):
     """After setting ``dimensions`` to 4, the forward map must equal ``self.finalPhraseToIdMap``."""
     # NOTE(review): ``settings`` comes from an outer scope, so this
     # assignment outlives the test -- verify no other test depends on the
     # previous value.
     settings['dimensions'] = 4
     UtilityMethods.updatePhraseTextAndDimensionsMap(
         self.phraseVector, self.phraseTextAndDimensionMap, **settings)
     actualForwardMap = self.phraseTextAndDimensionMap.getMap(
         TwoWayMap.MAP_FORWARD)
     self.assertEqual(self.finalPhraseToIdMap, actualForwardMap)