def searchKwordWindowsOpt(text, k, left, right, skipBothFlag=False):
    """Count k-token windows of ``text`` and those containing both terms.

    ``text`` is tokenized with ``getTokenizer`` and the tokens are grouped,
    in order, into consecutive non-overlapping windows of ``k`` tokens (the
    final window may hold fewer). If tokenization raises, the error is
    reported through ``genericErrorInfo`` and the text is treated as having
    no tokens.

    Args:
        text: Input handed unchanged to ``getTokenizer``.
        k: Number of tokens per window. ``k == 0`` raises
            ``ZeroDivisionError`` as soon as there is at least one token.
        left: First token looked up in each window.
        right: Second token looked up in each window.
        skipBothFlag: Only when this compares equal to ``False`` (the
            default) are the windows scanned for ``left``/``right``;
            for any other value ``'both'`` stays 0.

    Returns:
        A dict with two keys:
            ``'left'``: the total number of windows built.
            ``'both'``: the number of windows containing both ``left`` and
            ``right``.

    NOTE(review): despite its name, ``'left'`` holds the total window count,
    not the number of windows containing ``left`` -- confirm against callers.
    """
    try:
        tokens = getTokenizer(text)
    except Exception:
        # Best effort: report the failure and continue with no tokens.
        # ``Exception`` (rather than a bare ``except``) lets
        # KeyboardInterrupt / SystemExit propagate.
        genericErrorInfo()
        tokens = []

    windows = []
    for index, token in enumerate(tokens):
        # Every k-th token opens a new window.
        if index % k == 0:
            windows.append([])
        windows[-1].append(token)

    counts = {'left': len(windows), 'both': 0}

    # Deliberately ``== False`` and not ``not skipBothFlag``: values such as
    # None or '' do not compare equal to False and therefore skip the scan,
    # exactly as before.
    if skipBothFlag == False:  # noqa: E712
        counts['both'] = sum(
            1 for window in windows if left in window and right in window
        )

    return counts
def getKwordWindowsOpt(text, k):
    """Split ``text`` into consecutive, non-overlapping windows of k tokens.

    ``text`` is tokenized with ``getTokenizer``. If tokenization raises, the
    error is reported through ``genericErrorInfo`` and an empty list is
    returned.

    Args:
        text: Input handed unchanged to ``getTokenizer``.
        k: Number of tokens per window. ``k == 0`` raises
            ``ZeroDivisionError`` as soon as there is at least one token.

    Returns:
        A list of lists of tokens, in original order; every window has
        ``k`` tokens except possibly the last, which holds the remainder.
    """
    try:
        tokens = getTokenizer(text)
    except Exception:
        # Best effort: report the failure and continue with no tokens.
        # ``Exception`` (rather than a bare ``except``) lets
        # KeyboardInterrupt / SystemExit propagate.
        genericErrorInfo()
        tokens = []

    windows = []
    for index, token in enumerate(tokens):
        # Every k-th token opens a new window.
        if index % k == 0:
            windows.append([])
        windows[-1].append(token)

    return windows