Python WordMatrix.get_tokens Examples

Programming Language: Python

Namespace/Package Name: matrix_management

Class/Type: WordMatrix

Method/Function: get_tokens

Examples at hotexamples.com: 4

Python WordMatrix.get_tokens - 4 examples found. These are the top-rated real-world Python examples of matrix_management.WordMatrix.get_tokens, extracted from open-source projects. You can rate the examples to help us improve their quality.

Frequently Used Methods

Show Hide

get_tokens(2)

WordMatrix(1)

add(1)

get(1)

kn_columns(1)

kn_cooccurences(1)

Example #1

Show file

File: converter.py Project: VOVAN1993/python2012

win_start = 0
while win_start + window_size <= len(normalized_tokens):
    window = normalized_tokens[win_start:win_start + window_size]
    first = 0
    second = 1
    while first < len(window):
        second = first + 1
        while second < len(window):
            matrix.add(window[first], window[second], window_size - second + first + 1)
            second += 1
        first += 1
    win_start += 1

print "Co-occurence counted"
print "Keys quantity:", len(matrix.get_tokens())

for key in matrix.get_tokens():
    if key <> "*":
        pass#print key, matrix.kn_cooccurences(key, 6)

print "Done"

def get_token_by_word(word):
    """Return the stem of the first run of ASCII letters found in `word`.

    The run is lower-cased and handed to the module-level `stemmer`.
    Raises IndexError when `word` contains no ASCII letters at all.
    """
    letter_runs = re.findall(r"[A-Za-z]+", word)
    leading_run = letter_runs[0]
    lowered = leading_run.lower()
    return stemmer.stem(lowered)

def get_euclidean_vector_by_token(n, token):
    """Query the module-level `matrix` for `token` using its Euclidean column distance.

    Prints the incoming token, then returns
    matrix.kn_columns(token, n, matrix.dist_cols_euclidean) when the token is
    in matrix.token_set.

    NOTE(review): presumably `n` is the number of nearest columns requested --
    confirm against WordMatrix.kn_columns.
    """
    print "Incoming token:", token
    # As excerpted here, a token missing from matrix.token_set falls through
    # and the function implicitly returns None.
    if token in matrix.token_set:
        return matrix.kn_columns(token, n, matrix.dist_cols_euclidean)

Example #2

Show file

File: converter.py Project: kimank/python2012

    normalized_tokens += [stemmer.stem(token)]

window_size = 5

matrix = WordMatrix()

win_start = 0
while win_start + window_size <= len(normalized_tokens):
    window = normalized_tokens[win_start : win_start + window_size]
    first = 0
    second = 1
    while first < len(window):
        second = first + 1
        while second < len(window):
            matrix.add(window[first], window[second], window_size - second + first + 1)
            second += 1
        first += 1
    win_start += 1

# todo: tabs stuff, cool printing
s = "    "

s += " " + " ".join(matrix.get_tokens())

for token0 in matrix.get_tokens():
    s += "\n" + token0
    for token1 in matrix.get_tokens():
        s += " " + str(matrix.get(token0, token1))

print s

Example #3

Show file

win_start = 0
while win_start + window_size <= len(normalized_tokens):
    window = normalized_tokens[win_start:win_start + window_size]
    first = 0
    second = 1
    while first < len(window):
        second = first + 1
        while second < len(window):
            matrix.add(window[first], window[second],
                       window_size - second + first + 1)
            second += 1
        first += 1
    win_start += 1

print "Co-occurence counted"
print "Keys quantity:", len(matrix.get_tokens())

for key in matrix.get_tokens():
    if key <> "*":
        print key, matrix.kn_cooccurences(key, 6)

print "Now to more sophisticated analysis"

for key in matrix.get_tokens():
    if key <> "*":
        print key, matrix.kn_columns(key, 6, matrix.dist_cols_euclidean)

print "Done"
"""
for token0 in matrix.get_tokens():
    s += "\n" + token0

Example #4

Show file

File: converter.py Project: viosng/python2012

    normalized_tokens += [stemmer.stem(token)]

window_size = 5

matrix = WordMatrix()

win_start = 0
while win_start + window_size <= len(normalized_tokens):
    window = normalized_tokens[win_start:win_start + window_size]
    first = 0
    second = 1
    while first < len(window):
        second = first + 1
        while second < len(window):
            matrix.add(window[first], window[second],
                       window_size - second + first + 1)
            second += 1
        first += 1
    win_start += 1

# todo: tabs stuff, cool printing
s = "    "

s += " " + " ".join(matrix.get_tokens())

for token0 in matrix.get_tokens():
    s += "\n" + token0
    for token1 in matrix.get_tokens():
        s += " " + str(matrix.get(token0, token1))

print s