Python count_distinct_objects示例

编程语言: Python

命名空间/包名称: jrs_knn_multilabel

方法/功能: count_distinct_objects

hotexamples.com的示例: 4

Python count_distinct_objects - 共找到 4 个示例。以下是从开源项目中提取的、评价最高的 jrs_knn_multilabel.count_distinct_objects 真实 Python 用法示例。您可以为示例评分，帮助我们提高示例质量。

示例#1

显示文件

文件： jrs_fraction_knn_trained.py 项目： pszostek/research-python-backup

    def calculate_label_counts(self, distances, records, train_labels, k, list_of_all_labels):
        """
        Calculates the label counts c and c_prim.

        For every index in ``records`` the labels of its ``k + 1`` nearest
        neighbours are obtained from ``knn_repetitions_multilabel`` and tallied
        with ``count_distinct_objects``; one occurrence of each of the record's
        own labels is then subtracted from the tally. Finally, for every label
        in ``list_of_all_labels`` the remaining occurrence count ``n`` is
        recorded in a histogram: ``c[n]`` when the record carries the label,
        ``c_prim[n]`` when it does not.

        Args:
            distances: indexable by record index; ``distances[ind]`` is handed
                to ``knn_repetitions_multilabel`` as the distance vector.
            records: iterable of record indices; iterated here and also passed
                through to ``knn_repetitions_multilabel``.
            train_labels: indexable by record index; ``train_labels[ind]`` is
                an iterable of the labels assigned to that record.
            k: neighbourhood size, not counting the record itself.
            list_of_all_labels: labels to build histograms for. It is iterated
                once up front and once per record, so it must be re-iterable.

        Returns:
            dict mapping each label to ``{"c": defaultdict, "c_prim":
            defaultdict}``; both inner mappings go from an occurrence count to
            the number of records observed with that count (missing keys read
            as 0).
        """
        # init c and c' per a class.
        # defaultdict(int) gives the same zero default as a lambda factory but,
        # unlike a lambda, keeps the returned histograms picklable.
        label_counts = {}
        for label in list_of_all_labels:
            label_counts[label] = {"c": defaultdict(int), "c_prim": defaultdict(int)}

        # find c and c' per a class:
        for ind in records:
            # k+1 because we will consider the sample itself
            labels = knn_repetitions_multilabel(distances[ind], records, train_labels, k + 1)
            neigh_counts = count_distinct_objects(labels)

            own_labels = train_labels[ind]
            # subtract all the labels of the sample being classified
            # NOTE(review): presumably the sample is always among its own k+1
            # nearest neighbours, so each of its labels is present in
            # neigh_counts -- confirm against knn_repetitions_multilabel.
            for self_label in own_labels:
                neigh_counts[self_label] -= 1

            oracle_ans = set(own_labels)

            for label in list_of_all_labels:
                # "c" when the label is in the oracle labelling, "c_prim" otherwise
                histogram = "c" if label in oracle_ans else "c_prim"
                label_counts[label][histogram][neigh_counts.get(label, 0)] += 1
        return label_counts

示例#2

显示文件

文件： jrs_fraction_knn_trained.py 项目： pszostek/research-python-backup

    def classify(self, sample_distances):
        """
        Returns the labels whose neighbour count reaches the label's threshold.

        The labels of the ``self.k`` nearest training records are fetched with
        ``knn_repetitions_multilabel`` and tallied with
        ``count_distinct_objects``. A label from ``self.list_of_all_labels`` is
        reported when its tally is greater than or equal to
        ``self.fraction_knn_thresholds[label]``.

        Args:
            sample_distances: distance vector of the sample being classified,
                passed unchanged to ``knn_repetitions_multilabel``.

        Returns:
            list of the accepted labels, in ``self.list_of_all_labels`` order.

        Raises:
            Whatever ``self.fraction_knn_thresholds[label]`` raises for a label
            without a threshold (``KeyError`` for a plain dict).
        """
        nearest_labels = knn_repetitions_multilabel(sample_distances,
                                                    self.records,
                                                    self.train_labels, self.k)
        neigh_counts = count_distinct_objects(nearest_labels)

        result = []
        #for each label check the threshold:
        for label in self.list_of_all_labels:
            # A label that none of the neighbours carries counts as 0; .get()
            # avoids a KeyError on a plain mapping and mirrors how the tally
            # is read in calculate_label_counts.
            count = neigh_counts.get(label, 0)
            threshold = self.fraction_knn_thresholds[label]
            PRINTER(
                '[classify]: condidering label, neigh_counts[label],  self.fraction_knn_thresholds[label] '
                + str(label) + ", " + str(count) + ", " + str(threshold))
            if count >= threshold:
                result.append(label)
        PRINTER('[classify]: result ' + str(result))
        return result

示例#3

显示文件

文件： jrs_fraction_knn_trained.py 项目： pszostek/research-python-backup

    def classify(self, sample_distances):
        """
        Returns the labels whose neighbour count reaches the label's threshold.

        Looks up the labels of the ``self.k`` nearest training records via
        ``knn_repetitions_multilabel``, tallies them with
        ``count_distinct_objects`` and keeps every label of
        ``self.list_of_all_labels`` whose tally is at least
        ``self.fraction_knn_thresholds[label]``.

        Args:
            sample_distances: distance vector of the sample being classified,
                passed unchanged to ``knn_repetitions_multilabel``.

        Returns:
            list of the accepted labels, in ``self.list_of_all_labels`` order.

        Raises:
            Whatever ``self.fraction_knn_thresholds[label]`` raises for a label
            without a threshold (``KeyError`` for a plain dict).
        """
        nearest_labels = knn_repetitions_multilabel(sample_distances, self.records, self.train_labels, self.k)
        neigh_counts = count_distinct_objects(nearest_labels)

        result = []
        # for each label check the threshold:
        for label in self.list_of_all_labels:
            # Read the tally with a 0 default so a label absent from the
            # neighbourhood cannot raise KeyError; calculate_label_counts reads
            # the same kind of tally the same way.
            count = neigh_counts.get(label, 0)
            threshold = self.fraction_knn_thresholds[label]
            PRINTER(
                "[classify]: condidering label, neigh_counts[label],  self.fraction_knn_thresholds[label] "
                + str(label)
                + ", "
                + str(count)
                + ", "
                + str(threshold)
            )
            if count >= threshold:
                result.append(label)
        PRINTER("[classify]: result " + str(result))
        return result

示例#4

显示文件

文件： jrs_fraction_knn_trained.py 项目： pszostek/research-python-backup

    def calculate_label_counts(self, distances, records, train_labels, k,
                               list_of_all_labels):
        '''
        Calculates the label counts c and c_prim.

        For every index in ``records`` the labels of its ``k + 1`` nearest
        neighbours are obtained from ``knn_repetitions_multilabel`` and tallied
        with ``count_distinct_objects``; one occurrence of each of the record's
        own labels is then subtracted from the tally. For every label in
        ``list_of_all_labels`` the remaining occurrence count ``n`` is recorded
        in ``c[n]`` when the record carries the label and in ``c_prim[n]``
        when it does not.

        Args:
            distances: indexable by record index; ``distances[ind]`` is handed
                to ``knn_repetitions_multilabel`` as the distance vector.
            records: iterable of record indices; iterated here and also passed
                through to ``knn_repetitions_multilabel``.
            train_labels: indexable by record index; ``train_labels[ind]`` is
                an iterable of the labels assigned to that record.
            k: neighbourhood size, not counting the record itself.
            list_of_all_labels: labels to build histograms for. It is iterated
                once up front and once per record, so it must be re-iterable.

        Returns:
            dict mapping each label to ``{'c': defaultdict, 'c_prim':
            defaultdict}``; both inner mappings go from an occurrence count to
            the number of records observed with that count (missing keys read
            as 0).
        '''
        #init c and c' per a class:
        #(int as the factory yields the same 0 default as a lambda, and the
        # returned histograms stay picklable)
        label_counts = {}
        for label in list_of_all_labels:
            label_counts[label] = {
                'c': defaultdict(int),
                'c_prim': defaultdict(int)
            }

        #find c and c' per a class:
        for ind in records:
            distance_vector = distances[ind]
            labels = knn_repetitions_multilabel(
                distance_vector, records, train_labels,
                k + 1)  #k+1 because we will consider the sample itself
            neigh_counts = count_distinct_objects(labels)

            sample_labels = train_labels[ind]
            #subtract all the labels of the sample being classified
            #NOTE(review): presumably the sample is always among its own k+1
            #nearest neighbours, so each of its labels is present in
            #neigh_counts -- confirm against knn_repetitions_multilabel.
            for self_label in sample_labels:
                neigh_counts[self_label] -= 1

            oracle_ans = set(sample_labels)

            for label in list_of_all_labels:
                #'c' when the label is in the oracle labelling, else 'c_prim'
                if label in oracle_ans:
                    histogram = label_counts[label]['c']
                else:
                    histogram = label_counts[label]['c_prim']
                histogram[neigh_counts.get(label, 0)] += 1
        return label_counts