Example #1
0
print "moving to a sparse representation..."
train_feat = sparsify(train_feat)
test_feat = sparsify(test_feat)

train_labl = [s.labels for s in train_sequences]
train_labl = [item for sublist in train_labl for item in sublist]

obsr_labl = [s.labels for s in test_sequences]
test_seq = [" ".join(x) for x in obsr_labl]
test_tok = [item for sublist in obsr_labl for item in sublist]

obsr_list = get_observations(test_feat, test_sequences)

memm = MEMM(10, 0.0001)
memm.fit(train_feat, train_labl, fe.num_feats)
pred_tok, pred_seq = memm.predict_sequences(obsr_list)


# Structured Perceptron using viterbi in the inference step

"""percep = StructuredPerceptron(10, fe, 0.1)
percep.fit(train_sequences)
pred_tok, pred_seq = percep.predict_sequences(test_sequences)

obsr_labl = [s.labels for s in test_sequences]
test_seq = [" ".join(x) for x in obsr_labl]
test_tok = [item for sublist in obsr_labl for item in sublist]"""


# print results
print metrics.classification_report(test_tok, pred_tok)
Example #2
0
print "moving to a sparse representation..."
train_feat = sparsify(train_feat)
test_feat = sparsify(test_feat)

train_labl = [s.labels for s in train_sequences]
train_labl = [item for sublist in train_labl for item in sublist]

obsr_labl = [s.labels for s in test_sequences]
test_seq = [" ".join(x) for x in obsr_labl]
test_tok = [item for sublist in obsr_labl for item in sublist]

obsr_list = get_observations(test_feat, test_sequences)

memm = MEMM(10, 0.0001)
memm.fit(train_feat, train_labl, fe.num_feats)
pred_tok, pred_seq = memm.predict_sequences(obsr_list)

# Structured Perceptron using viterbi in the inference step
'''percep = StructuredPerceptron(10, fe, 0.1)
percep.fit(train_sequences)
pred_tok, pred_seq = percep.predict_sequences(test_sequences)

obsr_labl = [s.labels for s in test_sequences]
test_seq = [" ".join(x) for x in obsr_labl]
test_tok = [item for sublist in obsr_labl for item in sublist]'''

# print results
print metrics.classification_report(test_tok, pred_tok)
print metrics.accuracy_score(test_tok, pred_tok)
print metrics.accuracy_score(test_seq, pred_seq)