예제 #1
0
def searchKwordWindowsOpt(text, k, left, right, skipBothFlag=False):
    """Count the k-word windows of *text* and those holding both terms.

    The text is tokenized with ``getTokenizer`` and the tokens are grouped
    into consecutive, non-overlapping windows: a new window is opened at
    every token index that is a multiple of ``k``, so the last window may
    hold fewer tokens than the others.

    If tokenization raises, ``genericErrorInfo`` is called and the text is
    treated as having no tokens, so both counts come back as 0.

    Args:
        text: Input handed to ``getTokenizer``.
        k: Window size, in tokens.
        left: First token to look for inside a window.
        right: Second token to look for inside a window.
        skipBothFlag: When true, the co-occurrence scan is skipped and
            ``'both'`` stays 0.

    Returns:
        A dict with two keys:
        ``'left'`` - the total number of windows (despite the key name,
        this is not the number of occurrences of ``left``);
        ``'both'`` - the number of windows containing both ``left`` and
        ``right``.

    Raises:
        ZeroDivisionError: If ``k`` is 0 and there is at least one token.
    """
    tokens = []
    try:
        tokens = getTokenizer(text)
    except Exception:
        # Best effort: report the failure and carry on with no tokens.
        # Only Exception is caught so KeyboardInterrupt/SystemExit propagate.
        genericErrorInfo()

    windows = []
    for index, token in enumerate(tokens):
        # Index 0 always opens the first window, so windows[-1] exists below.
        if index % k == 0:
            windows.append([])
        windows[-1].append(token)

    counts = {'left': len(windows), 'both': 0}

    if not skipBothFlag:
        counts['both'] = sum(
            1 for window in windows if left in window and right in window
        )

    return counts
def getKwordWindowsOpt(text, k):
    """Split *text* into consecutive, non-overlapping k-word windows.

    The text is tokenized with ``getTokenizer``; a new window is opened at
    every token index that is a multiple of ``k``, so the last window may
    hold fewer tokens than the others.

    If tokenization raises, ``genericErrorInfo`` is called and an empty
    list is returned.

    Args:
        text: Input handed to ``getTokenizer``.
        k: Window size, in tokens.

    Returns:
        A list of windows, each a list of tokens in their original order.

    Raises:
        ZeroDivisionError: If ``k`` is 0 and there is at least one token.
    """
    tokens = []
    try:
        tokens = getTokenizer(text)
    except Exception:
        # Best effort: report the failure and carry on with no tokens.
        # Only Exception is caught so KeyboardInterrupt/SystemExit propagate.
        genericErrorInfo()

    windows = []
    for index, token in enumerate(tokens):
        # Index 0 always opens the first window, so windows[-1] exists below.
        if index % k == 0:
            windows.append([])
        windows[-1].append(token)

    return windows