Python Util.histogram 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: sandbox.util.Util

클래스/타입: Util

메소드/함수: histogram

hotexamples.com에서의 예제들: 4

Python Util.histogram - 예제 4개를 찾았습니다. 아래는 오픈소스 프로젝트에서 추출한 Python sandbox.util.Util.Util.histogram의 실제 사용 예제 중 평가가 가장 높은 것들입니다. 예제를 평가해 주시면 예제의 품질을 높이는 데 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

savePickle(16)

loadPickle(12)

printIteration(11)

indSvd(10)

rank(9)

indEig(9)

abstract(8)

mdot(8)

mode(7)

randomChoice(4)

extendArray(4)

argmaxN(3)

computeMeanVar(3)

expandIntArray(3)

printConciseIteration(2)

matrixPowerh(2)

fitDiscretePowerLaw(2)

histogram(2)

distanceMatrix(2)

matrixPower(1)

incompleteCholesky2(1)

powerEigs(1)

powerLawProbs(1)

fitPowerLaw(1)

random2Choice(1)

entropy(1)

safeEigh(1)

safeSvd(1)

sampleWithoutReplacement(1)

cumMin(1)

setupScript(1)

svd(1)

예제 #1

파일 보기

    def splitNode(self, tree, X, Y, d, k):
        """
        Train a classifier on the examples held by the node stored at vertex
        (d, k) of the tree and use its predictions to split that node in two.

        The node's training indices and feature indices are read from the node
        itself. A learner is fitted on X[inds, :][:, featureInds] and Y[inds];
        if its predictions on those same examples take exactly two distinct
        values and the node holds at least self.minSplit examples, two child
        nodes are added at vertices (d+1, 2*k) and (d+1, 2*k+1). Otherwise the
        node is marked as a leaf and given a score.

        :param tree: the tree being grown; must provide getVertex, setVertex
            and addEdge.
        :param X: the example matrix, indexed as X[rows, :][:, columns].
        :param Y: the label array, indexed by the same row indices as X.
        :param d: first component of the vertex id of the node to split
            (children are stored under d+1).
        :param k: second component of the vertex id of the node to split
            (children are stored under 2*k and 2*k+1).
        :return: the same tree object, modified in place.
        """
        numFeatures = X.shape[1]

        # Identity test: "== None" can be overridden or evaluated elementwise
        # by the compared object, whereas "is None" cannot.
        if self.featureSize is None:
            # Default fraction of features given to each child: sqrt(p)/p
            featureSize = numpy.sqrt(numFeatures)/float(numFeatures)
        else:
            featureSize = self.featureSize

        node = tree.getVertex((d, k))
        inds = node.getTrainInds()
        featureInds = node.getFeatureInds()
        # Fraction of this node's labels that equal the best response
        alpha = numpy.sum(Y[inds]==self.bestResponse)/float(inds.shape[0])

        #Now classify

        #We have the following condition if we need to do cross validation within the node
        # Util.histogram returns a tuple whose first element holds the counts;
        # the configured learner is only used when the smallest count exceeds
        # self.minLabelCount, otherwise a MajorityPredictor is used.
        if Util.histogram(Y[inds])[0].min() > self.minLabelCount:
            self.leafRanklearner.setWeight(1-alpha)
            leafRank = self.leafRanklearner.generateLearner(X, Y)
        else:
            leafRank = MajorityPredictor()

        node.setLeafRank(leafRank)
        # Restrict the data to this node's examples and features
        nodeX = X[inds, :][:, featureInds]
        leafRank.learnModel(nodeX, Y[inds])
        predY = leafRank.predict(nodeX)

        if numpy.unique(predY).shape[0] == 2 and inds.shape[0] >= self.minSplit:
            # Number of randomly chosen features handed to each child
            numChildFeatures = int(numpy.round(numFeatures*featureSize))
            isLastLevel = d==self.maxDepth-1

            # Left child: examples predicted as the best response
            leftInds = inds[predY == self.bestResponse]
            featureInds = numpy.sort(numpy.random.permutation(numFeatures)[0:numChildFeatures])
            leftNode = RankNode(leftInds, featureInds)
            leftNode.setPure(numpy.unique(Y[leftInds]).shape[0] <= 1)
            leftNode.setIsLeafNode(isLastLevel or leftNode.isPure())
            leftNode.setScore((1 - float(2*k)/2**(d+1))*2**self.maxDepth)
            tree.addEdge((d, k), (d+1, 2*k))
            tree.setVertex((d+1, 2*k), leftNode)

            # Right child: all remaining examples, with a fresh random
            # feature subset drawn after the left child's subset
            rightInds = inds[predY != self.bestResponse]
            featureInds = numpy.sort(numpy.random.permutation(numFeatures)[0:numChildFeatures])
            rightNode = RankNode(rightInds, featureInds)
            rightNode.setPure(numpy.unique(Y[rightInds]).shape[0] <= 1)
            rightNode.setIsLeafNode(isLastLevel or rightNode.isPure())
            rightNode.setScore((1 - float(2*k+1)/2**(d+1))*2**self.maxDepth)
            tree.addEdge((d, k), (d+1, 2*k+1))
            tree.setVertex((d+1, 2*k+1), rightNode)
        else:
            # No usable split: this node becomes a leaf
            node.setIsLeafNode(True)
            node.setScore((1 - float(k)/2**d)*2**self.maxDepth)

        return tree

예제 #2

파일 보기

파일: UtilTest.py 프로젝트: charanpald/sandbox

 def testHistogram(self):
     """
     Check that Util.histogram returns the count of every distinct value
     together with the distinct values themselves.
     """
     values = numpy.array([0, 0, 1, 5, 0, 2, 2, 2, 5])
     # 0 occurs three times, 1 once, 2 three times and 5 twice
     expectedFreq = numpy.array([3, 1, 3, 2])
     expectedItems = numpy.array([0, 1, 2, 5])

     freq, items = Util.histogram(values)

     self.assertTrue((freq == expectedFreq).all())
     self.assertTrue((items == expectedItems).all())

예제 #3

파일 보기

파일: CheckData.py 프로젝트: charanpald/wallhack

    # Question ids selecting which columns are read for egos and for alters
    egoQuestionIds = eCsvReader.getEgoQuestionIds()
    alterQuestionIds = eCsvReader.getAlterQuestionIds()

    # Value passed to readFile as its "missing" argument
    missing = 0

    # Read the ego data and replace the age column by its categories
    egoX, titles = eCsvReader.readFile(egoFileName, egoQuestionIds, missing)
    egoX[:, eCsvReader.ageIndex] = eCsvReader.ageToCategories(egoX[:, eCsvReader.ageIndex])

    # Same for the alter data (titles is overwritten by this second read)
    alterX, titles = eCsvReader.readFile(alterFileName, alterQuestionIds, missing)
    alterX[:, eCsvReader.ageIndex] = eCsvReader.ageToCategories(alterX[:, eCsvReader.ageIndex])

    numFeatures = egoX.shape[1]
    numEgoExamples = egoX.shape[0]
    numAlterExamples = alterX.shape[0]

    # For every column, print the distinct values seen in each data set, the
    # values present in only one of them, and the counts divided by the
    # number of examples
    for i in range(numFeatures):
        histE, uniqElementsE = Util.histogram(egoX[:, i])
        histA, uniqElementsA = Util.histogram(alterX[:, i])

        print(str(i) + " " + str(egoQuestionIds[i]))
        print("Ego   " + str(uniqElementsE))
        print("Alter " + str(uniqElementsA))
        print(numpy.setxor1d(uniqElementsE, uniqElementsA))
        print(histE/numEgoExamples)
        print(histA/numAlterExamples)

    """
    Conclusion is that the distributions are broadly the same. The problem occurs
    with missing data handling. For example in Ego there are values with [ 0.  8.]
    with most zero, and in alter [ 0.  5.]. The means will be approx 8 for ego and 5 for
    alter.
    """

예제 #4

파일 보기

    def testHistogram(self):
        """
        Check that Util.histogram returns the count of every distinct value
        together with the distinct values themselves.
        """
        values = numpy.array([0, 0, 1, 5, 0, 2, 2, 2, 5])
        # 0 occurs three times, 1 once, 2 three times and 5 twice
        expectedFreq = numpy.array([3, 1, 3, 2])
        expectedItems = numpy.array([0, 1, 2, 5])

        freq, items = Util.histogram(values)

        self.assertTrue((freq == expectedFreq).all())
        self.assertTrue((items == expectedItems).all())