Python LogisticRegression.densify 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: sklearn.linear_model

클래스/타입: LogisticRegression

메소드/함수: densify

hotexamples.com에서의 예제들: 4

Python LogisticRegression.densify - 4개의 예제가 발견되었습니다. 이것들은 오픈소스 프로젝트에서 추출된 Python의 sklearn.linear_model.LogisticRegression.densify에 대한 실세계 최고 등급의 예제들입니다. 예제들을 평가하여 예제의 품질 향상에 도움을 줄 수 있습니다.

자주 사용되는 메소드들

보기 숨기기

C(30)

decision_function(30)

coef_(30)

LogisticRegression(30)

add(30)

classes_(24)

compile(21)

__init__(15)

_predict_proba_lr(3)

deserialize_from_bundle(3)

densify(3)

computeModel(3)

class_weight(2)

booster(2)

accuracy_score(2)

append(2)

__repr__(2)

cost_complexity_pruning_path(1)

__doc__(1)

compute(1)

computeCrossValidation(1)

computeExample(1)

__dir__(1)

conf_int(1)

_objective(1)

classify(1)

SerializeToString(1)

degree(1)

Predict(1)

Logit(1)

do_fastgrad(1)

do_grad_descent(1)

cuda(1)

__str__(1)

_objective_long_way(1)

alpha(1)

_more_tags(1)

_set_callbacks(1)

_vectorizer(1)

accuracy(1)

_grad_long_way(1)

_grad(1)

_get_param_names(1)

_decision_function(1)

auc(1)

batch_fit(1)

batch_predict(1)

bias_(1)

_estimator_type(1)

build(1)

예제 #1

파일 보기

파일: multi_class_classifier_logistic.py 프로젝트: wsgan001/so_project

def train_custom_one_vs_all(X_train, X_test, Y_train, topk):
    """Train one binary logistic regression per label and rank labels per example.

    For every column (label) of ``Y_train`` a separate ``LogisticRegression``
    is fitted on ``X_train`` and scored on ``X_test``. For each test example
    only the ``topk`` labels with the largest decision values are retained.

    Args:
        X_train: Training feature matrix, passed unchanged to ``clf.fit``.
        X_test: Test feature matrix; ``X_test.shape[0]`` is the number of
            test examples.
        Y_train: Sparse label-indicator matrix with one column per label
            (must support ``tocsc()`` and ``getcol()``).
        topk: Maximum number of labels kept per test example.

    Returns:
        A list with one entry per test example. Each entry is a list of
        column indices of ``Y_train``, in the heap's internal order (it is
        NOT sorted by decision value).
    """
    # CSC (column-compressed) layout: the loop below extracts one column per
    # label, which is the access pattern this format is meant for.
    Y_train = Y_train.tocsc()
    num_classes = Y_train.shape[1]
    num_test_examples = X_test.shape[0]

    # One min-heap of (decision value, label) per test example. The smallest
    # retained score sits at the root, so it is the one evicted when a better
    # label shows up.
    topk_class_distances = [[] for _ in range(num_test_examples)]

    for j in range(num_classes):
        # Binary target vector for label j over all training examples.
        y = numpy.ravel(Y_train.getcol(j).toarray())

        clf = LogisticRegression(penalty='l2',
                                 dual=False,
                                 tol=0.0001,
                                 C=0.8,
                                 fit_intercept=True,
                                 intercept_scaling=1)

        clf.fit(X_train, y)
        # Single-argument print() emits the same text on Python 2 and 3.
        print("Trained for class %d" % j)

        # densify() returns the estimator itself, so the call can be chained.
        decision = clf.densify().decision_function(X_test)

        for i in range(num_test_examples):
            h = topk_class_distances[i]
            entry = (decision[i], j)
            if len(h) < topk:
                heapq.heappush(h, entry)
            else:
                # Heap is full: push the new entry and drop the current minimum.
                heapq.heappushpop(h, entry)
        print("Predicted for class %d" % j)

    # Drop the decision values and keep only the label indices.
    return [[label for _, label in heap] for heap in topk_class_distances]

예제 #2

파일 보기

파일: multi_class_classifier_logistic.py 프로젝트: adirastogi/so_project

def train_custom_one_vs_all(X_train,X_test,Y_train,topk):
    """Fit a one-vs-all set of logistic regressions and pick top-k labels.

    Each column of ``Y_train`` is treated as an independent binary problem:
    a ``LogisticRegression`` is fitted on ``X_train`` for that column and its
    decision values on ``X_test`` compete for a place among the ``topk`` best
    labels of every test example.

    Args:
        X_train: Training feature matrix handed to ``clf.fit``.
        X_test: Test feature matrix; its first dimension is the number of
            test examples.
        Y_train: Sparse label-indicator matrix, one column per label
            (must provide ``tocsc()`` and ``getcol()``).
        topk: Upper bound on the number of labels returned per test example.

    Returns:
        A list of lists: for every test example, the retained label (column)
        indices in heap order, i.e. not sorted by decision value.
    """
    # Column-compressed storage, because labels are read column by column.
    Y_train = Y_train.tocsc()
    num_classes = Y_train.shape[1]
    num_test_examples = X_test.shape[0]

    # Per-example min-heaps holding (decision value, label) pairs; the root
    # is always the weakest label currently kept.
    topk_class_distances = [[] for _ in range(num_test_examples)]

    for j in range(num_classes):
        # 1-D binary target for label j.
        y = numpy.ravel(Y_train.getcol(j).toarray())

        clf = LogisticRegression(penalty='l2',dual=False,tol=0.0001,C=0.8,fit_intercept=True,intercept_scaling=1)
        clf.fit(X_train,y)
        # Formatted single-argument print keeps the output identical on
        # Python 2 and Python 3.
        print("Trained for class %d" % j)

        # densify() hands back the estimator, which is why it can be chained.
        decision = clf.densify().decision_function(X_test)

        for i, h in enumerate(topk_class_distances):
            candidate = (decision[i],j)
            if len(h) < topk:
                heapq.heappush(h,candidate)
            else:
                # Full heap: insert the candidate and evict the smallest entry.
                heapq.heappushpop(h,candidate)
        print("Predicted for class %d" % j)

    # Strip the decision values, leaving only label indices.
    return [[label for _,label in h] for h in topk_class_distances]

예제 #3

파일 보기

파일: code2.py 프로젝트: JaredLLewis/IPReputationProject


# Fit a random forest first and print its score on the test split.
# X_train / y_train / X_test / y_test come from earlier in the script
# (not visible in this fragment).
clf = RandomForestClassifier(n_estimators=100, max_depth=2,
                              random_state=0)
clf.fit(X_train, y_train)
print("Accuracy ",clf.score(X_test, y_test))

# Model Building
# Fit a logistic regression on the same split and print its score and
# learned parameters.
print("TRAINING PHASE")
logit = LogisticRegression()	
logit.fit(X_train, y_train)
print("Accuracy ",logit.score(X_test, y_test))
print("coefficient :\n",logit.coef_)
print("Intercept:\n",logit.intercept_)
# densify() and sparsify() both return the estimator itself, so these two
# lines print the model's repr rather than a coefficient matrix.
# NOTE(review): sparsify() converts coef_ to a scipy.sparse matrix in place,
# so the model pickled below carries a sparse coef_ - confirm this is intended.
print(logit.densify())
print(logit.sparsify())
# url_list is defined outside this fragment; it is materialised as a list here.
url_list = list(url_list)






# Despite the banner, the visible code only serialises the fitted model and
# the vectorizer. X_predict is assigned but not used in this fragment.
print("TESTING PHASE")
X_predict = ["8.8.8.8"]
# protocol=2 is a binary pickle format that Python 2 can also read.
with open('logit.pickle', 'wb') as handle:
    pickle.dump(logit, handle, protocol=2)
with open('vectorizer.pickle', 'wb') as handle:
    pickle.dump(vectorizer, handle, protocol=2)

예제 #4

파일 보기

파일: logistic_reg_binary.py 프로젝트: hrdavidge/georgette_heyer

    solver='liblinear',  # for use with small datasets
    multi_class='ovr')  # stating this is a binary problem)

# Train the model (clf is constructed just above this fragment).
clf.fit(x_train, y_train)

# Fitted attributes
classes = clf.classes_  # class labels known to the classifier
coeff = clf.coef_  # coefficients of the model
intercept = clf.intercept_  # the intercept of the model
n_iter = clf.n_iter_  # number of iterations run by the solver - in the binary case it only holds one value

# Now a tour of the estimator's methods
dec_func = clf.decision_function(
    x_test)  # the confidence score for each test sample
density = clf.densify()  # converts coef_ to a dense array in place; returns the estimator itself, not the matrix
get_param = clf.get_params()  # returns the hyper-parameters
predicted_array = clf.predict(
    x_test
)  # running the test dataset through the model, giving an array of predicted values
predic_log_proba = clf.predict_log_proba(
    x_test)  # log of probability estimate for each class
predic_prob = clf.predict_proba(x_test)  # the probability for each class
mean_accuracy = clf.score(x_test,
                          y_test)  # returns the mean accuracy on the test set
sparsify = clf.sparsify()  # converts coef_ to a sparse matrix in place; returns the estimator itself, not the matrix

print('The mean accuracy of the test set is: %.3f' % mean_accuracy)

# Next: build the confusion matrix for the data.
# We first need to convert the 1 and 2 to 'female' and 'male'.