def _termDictsFromContext(self, context, symbol):
    """Build term dictionaries for a symbol across a context's neighbours.

    For every neighbour (plus the context's origin), extracts the
    expressions referring to *symbol* at the neighbour's location and
    records them both per-location (vecs) and globally (allNgrams).

    Returns a tuple (vecs, allNgrams), or None if no expressions were
    collected at all.
    """
    vecs = NameToDictMap()
    allNgrams = OccurrenceCounter()
    # Temporarily treat the origin as one more neighbour so it is processed
    # by the same loop; restore the list afterwards even if extraction raises.
    context.neighbours.append(context.origin)
    try:
        for neighbour in context.neighbours:
            location = neighbour.location
            expressions = self.treeToExprConverter.getExpressionsForSymbol(
                location, symbol)
            neighbour.setExpressions(expressions)
            # Add a null-vector for the function if it does not contain
            # expressions, so the location is still represented.
            if len(expressions) == 0:
                vecs.add(None, location)
            for expr in expressions:
                vecs.setItem(expr, location, 1.0)
                allNgrams.add(expr)
    finally:
        context.neighbours.pop()
    if len(vecs.d) == 0 or len(allNgrams.d) == 0:
        return None
    return (vecs, allNgrams)
def _termDictsFromContext(self, context, symbol):
    """Collect per-location expression vectors and global n-gram counts
    for *symbol*, scanning the context's neighbours plus its origin.

    Returns (vecs, allNgrams), or None when nothing was collected.
    """
    vecs = NameToDictMap()
    allNgrams = OccurrenceCounter()
    # The origin is scanned like any other neighbour for the duration
    # of this call; it is removed from the list again before returning.
    context.neighbours.append(context.origin)
    for nb in context.neighbours:
        nOcc = nb.nOccurrences
        loc = nb.location
        exprs = self.treeToExprConverter.getExpressionsForSymbol(loc, symbol)
        nb.setExpressions(exprs)
        if not exprs:
            # No expressions in this function: record it as a null-vector
            # so the location still shows up in the result.
            vecs.add(None, loc)
            continue
        for e in exprs:
            vecs.setItem(e, loc, 1.0)
            allNgrams.add(e)
    context.neighbours.pop()
    if not vecs.d or not allNgrams.d:
        return None
    return (vecs, allNgrams)
def relevancyWeighting(checkVectors, featureDir):
    """Down-weight checks that are also common among a function's neighbours.

    For every function location with a check vector, subtracts the
    distance-weighted mean check vector of its k nearest neighbours
    (k = 20) and clamps the resulting scores at zero.

    checkVectors: NameToDictMap of location -> {check name: score}.
    featureDir:   directory containing 'termDocMatrix.pickl' and the
                  condensed distance matrix 'D_euclidean.pickl'.

    Returns a NameToDictMap of re-weighted vectors.
    """
    k = 20
    # Use open()/'in'/items()/range() instead of the Python-2-only
    # file()/has_key()/iteritems()/xrange(), and close the pickle files
    # deterministically.
    with open(featureDir + 'termDocMatrix.pickl', 'rb') as f:
        termDocMatrix = pickle.load(f)
    functionLocations = termDocMatrix.index2Doc
    # It doesn't make much sense that we use euclidean distances here;
    # should be L1, but L1 can't be calculated on the sparse matrices for now.
    from scipy.spatial.distance import squareform
    with open(featureDir + 'D_euclidean.pickl', 'rb') as f:
        D = squareform(pickle.load(f))
    anomalyCalculator = AnomalyCalculator()
    (NNV, NNI) = anomalyCalculator.calculateNearestNeighbours(k, D)
    WDict = NameToDictMap()
    for i in range(len(functionLocations)):
        location = functionLocations[i]
        if location not in checkVectors.d:
            continue
        WDict.d[location] = checkVectors.d[location]
        indices = NNI[:, i]
        locations = [functionLocations[j] for j in indices]
        V = [checkVectors.d[l] for l in locations if l in checkVectors.d]
        distances = [NNV[j, i] for j in range(len(locations))
                     if locations[j] in checkVectors.d]
        # len(V) may be unequal to k if at least one of the nearest
        # neighbours has no checks. It is then a null-vector, so we're
        # implicitly adding it in mean-calculation.
        meanVector = {}
        for (v, d) in zip(V, distances):
            for (name, score) in v.items():
                meanVector[name] = (meanVector.get(name, 0.0)
                                    + (1 - d) * (float(score) / k))
        for (name, score) in checkVectors.d[location].items():
            if name in meanVector:
                score -= meanVector[name]
                if score < 0:
                    score = 0
            WDict.setItem(name, location, score)
    return WDict
def relevancyWeighting(checkVectors, featureDir):
    """For every function with a check vector, subtract the distance-weighted
    mean check vector of its k nearest neighbours and clamp scores at zero.

    Reads the term/document matrix and the condensed euclidean distance
    matrix from pickles under *featureDir*. Returns a NameToDictMap.
    """
    k = 20
    termDocMatrix = pickle.load(file(featureDir + 'termDocMatrix.pickl'))
    functionLocations = termDocMatrix.index2Doc
    # Euclidean distances are questionable here; L1 would be preferable,
    # but it cannot be computed on the sparse matrices for now.
    from scipy.spatial.distance import squareform
    D = squareform(pickle.load(file(featureDir + 'D_euclidean.pickl')))
    anomalyCalculator = AnomalyCalculator()
    NNV, NNI = anomalyCalculator.calculateNearestNeighbours(k, D)
    WDict = NameToDictMap()
    for i in xrange(len(functionLocations)):
        location = functionLocations[i]
        if location not in checkVectors.d:
            continue
        WDict.d[location] = checkVectors.d[location]
        neighbourIdx = NNI[:, i]
        # NOTE(review): gamma is computed but never used afterwards.
        gamma = float(numpy.sum(NNV[:, i])) / k
        neighbourLocs = [functionLocations[j] for j in neighbourIdx]
        vectors = [checkVectors.d[l] for l in neighbourLocs
                   if l in checkVectors.d]
        dists = [NNV[j, i] for j in xrange(len(neighbourLocs))
                 if neighbourLocs[j] in checkVectors.d]
        # Fewer than k vectors here means some neighbours contain no checks;
        # those are null-vectors and thus implicitly part of the mean.
        meanVector = {}
        for vec, dist in zip(vectors, dists):
            for name, score in vec.iteritems():
                meanVector[name] = (meanVector.get(name, 0.0)
                                    + (1 - dist) * (float(score) / k))
        for name, score in checkVectors.d[location].iteritems():
            if name in meanVector:
                score -= meanVector[name]
                if score < 0:
                    score = 0
            WDict.setItem(name, location, score)
    return WDict
def calculateCheckVectors(WFuncs, CFuncs, F, binary=True, alpha=1,
                          weighByF=False):
    """Project each function's symbol usage onto the check space.

    WFuncs:   NameToDictMap of function location -> {symbol: occurrences}.
    CFuncs:   NameToDictMap of function location -> {symbol: check count}.
    F:        mapping symbol -> weight; symbols absent from F are treated
              as never checked and scored 0.
    binary:   treat occurrence and check counts as 0/1 flags.
    alpha:    weight of the check count subtracted from the occurrences.
    weighByF: multiply each score by the symbol's weight from F.

    Returns a NameToDictMap with one score vector per function location.
    """
    WDict = NameToDictMap()
    # items() instead of the Python-2-only iteritems(); behaves the same
    # in both Python versions for this read-only iteration.
    for (functionLocation, symbols) in WFuncs.d.items():
        if functionLocation not in CFuncs.d:
            # The function does not contain any check; projected onto the
            # check-space, it's the NULL-vector.
            WDict.d[functionLocation] = {}
            continue
        CFunc = CFuncs.d[functionLocation]
        for (s, occurrences) in symbols.items():
            if binary:
                occurrences = 1
            if s not in F:
                # This symbol is never checked anywhere.
                WDict.setItem(s, functionLocation, 0)
                continue
            # Hoisted: the weight is the same in both remaining branches.
            w = F[s] if weighByF else 1.0
            if s in CFunc:
                nChecks = 1 if binary else CFunc[s]
                WDict.setItem(s, functionLocation,
                              (occurrences - alpha * nChecks) * w)
            else:
                WDict.setItem(s, functionLocation, occurrences * w)
    return WDict
def calculateCheckVectors(WFuncs, CFuncs, F, binary=True, alpha=1,
                          weighByF=False):
    """Build per-function check vectors from symbol usage and check counts.

    Symbols absent from F are scored 0; symbols checked inside the
    function score (occurrences - alpha * checks) * weight; all other
    symbols score occurrences * weight. With binary=True both counts are
    clamped to 1. Returns a NameToDictMap.
    """
    result = NameToDictMap()
    for functionLocation, symbols in WFuncs.d.iteritems():
        if functionLocation not in CFuncs.d:
            # No check in this function at all: its projection onto the
            # check space is the NULL-vector.
            result.d[functionLocation] = {}
            continue
        checkedSymbols = CFuncs.d[functionLocation]
        for symbol, occurrences in symbols.iteritems():
            count = 1 if binary else occurrences
            if symbol not in F:
                # This symbol is never checked anywhere.
                result.setItem(symbol, functionLocation, 0)
            elif symbol in checkedSymbols:
                weight = F[symbol] if weighByF else 1.0
                checks = 1 if binary else checkedSymbols[symbol]
                result.setItem(symbol, functionLocation,
                               (count - alpha * checks) * weight)
            else:
                weight = F[symbol] if weighByF else 1.0
                result.setItem(symbol, functionLocation, count * weight)
    return result