Python tree_from_backtrace 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: infinite_parser.pcfg

메소드/함수: tree_from_backtrace

hotexamples.com에서의 예제들: 3

Python tree_from_backtrace - 3개의 예제가 발견되었습니다. 아래는 오픈소스 프로젝트에서 추출한, Python의 infinite_parser.pcfg.tree_from_backtrace를 실제로 사용한 예제 중 평가가 가장 높은 것들입니다. 각 예제를 평가하면 예제 품질을 높이는 데 도움이 됩니다.

예제 #1

파일 보기

파일: test_inside_outside.py 프로젝트: hans/infinite-pcfg

def test_inside_outside2():
  """Parse "c d d" with a fixed-weight toy grammar and verify the results.

  The grammar has start symbol "x", one nonterminal ("x"), one preterminal
  ("b"), and explicit binary/unary weights. The test prints the alpha and
  beta charts, pretty-prints the tree rebuilt from the backtrace, and then
  asserts both the tree shape and the alpha values for "x" and "b".
  """
  from pprint import pprint

  grammar = FixedPCFG(
      "x",
      terminals=["c", "d"],
      nonterminals=["x"],
      preterminals=["b"],
      productions=[("b", "b"), ("b", "x")],
      binary_weights=np.array([[0.25, 0.75]]),
      unary_weights=np.array([[0.5, 0.5]]),
  )

  words = "c d d".split()
  alphas, betas, backtrace = parse(grammar, words)

  # Dump both charts, paired with the nonterminal names, for debugging.
  for chart in (alphas, betas):
    pprint(list(zip(grammar.nonterminals, chart)))

  # Show the recovered tree, then rebuild it and compare with the expected one.
  tree_from_backtrace(grammar, words, backtrace).pretty_print()
  recovered_tree = tree_from_backtrace(grammar, words, backtrace)
  expected_tree = Tree.fromstring("(x (b c) (x (b d) (b d)))")
  assert_equal(recovered_tree, expected_tree)

  # check alpha[x]
  expected_alpha_x = [
      [0, 0.0625, 0.023438],
      [0, 0, 0.0625],
      [0, 0, 0],
  ]
  np.testing.assert_allclose(alphas[0], expected_alpha_x, atol=1e-5)

  # check alpha[b] (preterminals)
  expected_alpha_b = [
      [0.5, 0, 0],
      [0, 0.5, 0],
      [0, 0, 0.5],
  ]
  np.testing.assert_allclose(alphas[1], expected_alpha_b)

예제 #2

파일 보기

파일: test_inside_outside.py 프로젝트: hans/infinite-pcfg

def test_inside_outside_em_update():
  """Check that repeated EM updates never decrease the sentence probability.

  Builds a toy grammar (no explicit weights are passed), then for 20
  iterations: parses "c d d", pretty-prints the tree rebuilt from the
  backtrace, prints the total probability read from the alpha chart, asserts
  that it has not decreased relative to the previous iteration (up to a
  small floating-point tolerance), and replaces the grammar with the result
  of `update_em`.
  """
  pcfg = FixedPCFG("x",
                   terminals=["c", "d"],
                   nonterminals=["x"],
                   preterminals=["b"],
                   productions=[("b", "b"), ("b", "x")])

  sentence = "c d d".split()

  # Largest decrease that is still attributed to float round-off rather than
  # to a genuine drop in probability.
  tolerance = 1e-10

  prev_total_prob = 0

  for i in range(20):
    alphas, betas, backtrace = parse(pcfg, sentence)
    # Chart entry for the start symbol over the span from the first to the
    # last token of the sentence.
    total_prob = alphas[pcfg.nonterm2idx[pcfg.start], 0, len(sentence) - 1]
    tree_from_backtrace(pcfg, sentence, backtrace).pretty_print()
    print("%d\t%f" % (i, total_prob))

    # NB include small tolerance due to float imprecision: once EM has
    # converged, successive values may differ by round-off in either
    # direction, which must not fail the test.
    assert total_prob - prev_total_prob >= -tolerance, \
        "Total prob should never decrease: %f -> %f (iter %d)" % \
        (prev_total_prob, total_prob, i)
    prev_total_prob = total_prob

    pcfg = update_em(pcfg, sentence)

예제 #3

파일 보기

파일: pcfg_em.py 프로젝트: hans/infinite-pcfg

# Initial grammar with start symbol "S" over the corpus vocabulary; no
# explicit rule weights are passed here.
pcfg = P.FixedPCFG("S",
                   terminals=list(vocabulary),
                   nonterminals=["S", "NP", "VP", "VP$"],
                   preterminals=["N", "V", "D"],
                   productions=[("NP", "VP"), ("V", "NP"), ("V", "VP$"),
                                ("NP", "NP"), ("D", "N")])

# Train for at most 40 epochs, stopping early once the corpus
# log-likelihood stops improving.
prev_ll = -np.inf
for e in trange(40, desc="Epoch"):
    # One EM update per sentence; each update yields the grammar used for
    # the next sentence.
    for sentence in tqdm(sentences):
        pcfg = I.update_em(pcfg, sentence)

    # Calculate total log-probability of the corpus under the current grammar.
    ll = 0
    for sentence in tqdm(sentences):
        alphas, betas, _ = I.parse(pcfg, sentence)
        # Chart entry for the start symbol over the span from the first to
        # the last token of the sentence.
        total_prob = alphas[pcfg.nonterm2idx[pcfg.start], 0, len(sentence) - 1]
        ll += np.log(total_prob)

    tqdm.write("%i ll: %f" % (e, ll))

    # Converged when the log-likelihood improved by at most 1e-3. Zero
    # improvement counts as converged too; requiring a strictly positive
    # gain would keep training for all remaining epochs after reaching an
    # exact fixed point. A decrease (negative improvement) does not stop
    # training. On the first epoch the improvement is +inf, so at least two
    # epochs always run.
    improvement = ll - prev_ll
    if 0 <= improvement <= 1e-3:
        break
    prev_ll = ll

# Show the tree rebuilt from the backtrace for every sentence under the
# trained grammar.
for sentence in sentences:
    print(" ".join(sentence))
    alphas, betas, backtrace = I.parse(pcfg, sentence)
    tree = P.tree_from_backtrace(pcfg, sentence, backtrace)
    tree.pretty_print()