Python Helper.cleanWordForInitialAddの例

プログラミング言語: Python

名前空間/パッケージ名: Helper

クラス/型: Helper

メソッド/関数: cleanWordForInitialAdd

hotexamples.comのコード掲載数: 2

Python Helper.cleanWordForInitialAdd - 2件のコード例が見つかりました。すべてオープンソースプロジェクトから抽出されたPythonのHelper.Helper.cleanWordForInitialAddの実例で、最も評価が高いものを厳選しています。コード例の評価を行っていただくことで、より質の高いコード例が表示されるようになります。

よく使われるメソッド

表示 / 非表示

Helper(30)

getCategoryKey(8)

_get_faller_cells(7)

close(6)

GetUnixMilliseconds(6)

downloadString(6)

delFolder(5)

GetJson(5)

copy(4)

_get_matched_cells(3)

cleanWord(3)

getRandomSubset(3)

cleanTextAndTokenize(3)

createBarplot(3)

create_folder(3)

calculate_f1(2)

getBandwidth(2)

create_tfidf(2)

check_game_over(2)

cleanWordForInitialAdd(2)

convertPrefixToAddress(2)

convertToAsn32(2)

angle_between_two_points(2)

getRepresentativeRows(2)

getUserKey(2)

createDictionary(2)

decoding(2)

makeDateObject(2)

_empty_under_cell(2)

parseGenderBlogDatasetWithLabels(2)

debug(2)

GetUploadSize(2)

deductscore(1)

displayData(1)

determine_current_time(1)

decimaltohex(1)

daysAsPrettyLength(1)

dataHandler(1)

determine_right_left(1)

GenerateFileKeys(1)

display_menu(1)

display_points(1)

display_population(1)

display_rects(1)

distance_between(1)

formatDateStringIntoCleanedString(1)

getItemKey(1)

getSaveName(1)

hash_string(1)

listToGrid(1)

コード例 #1

ファイルを表示

ファイル: WordFrequenciesClass.py プロジェクト: dirkstahlecker/WordFrequencies

    def readFile(self, url):
        """Read a text file and append a marked-up copy of it to the markup file.

        Every line of the input is split on single spaces. Each word is passed
        through Helper.cleanWordForInitialAdd, which yields the text before the
        word, the word itself and the text after it. Words whose cleaned form is
        in self.namesSet are resolved through self.getMarkUnderWord; all other
        words go through WordClass.addWordOrMarkup. The markup of each word,
        wrapped in its surrounding text, is appended to self.markUpFilePath.

        If the input file cannot be opened the user is prompted for another
        path and the read is retried with it.

        Args:
            url: Path of the text file to read.
        """
        try:
            f = open(url, 'r')
        except OSError:
            # Only failures to open the file lead to the prompt; interrupts such
            # as Ctrl-C are no longer swallowed here.
            print('File not found')
            newPath = input('Enter new path > ')
            return self.readFile(newPath) #TODO: this doesn't work for entirely unknown reasons

        # need to change from smart quotes to regular
        smartQuoteTable = str.maketrans({'‘': "'", '’': "'"})

        # NOTE(review): allWords is collected but not returned in this method -
        # confirm whether callers expect it.
        allWords = []

        with f:  # guarantees the input file is closed, even on error
            # Separate this run's output from whatever the markup file already holds.
            with open(self.markUpFilePath, 'a') as markupFile:
                markupFile.write('\n\n\n')

            for line in f:
                # The markup file is reopened for every line so that the output
                # is closed (and therefore flushed) after each processed line.
                with open(self.markUpFilePath, 'a') as markupFile:
                    # Up to the last 20 raw words of the current line, ending in
                    # the current word; gives the user context for a name.
                    last20Words = []
                    for word_str in line.split(' '):
                        if len(last20Words) >= 20:
                            last20Words.pop(0)
                        last20Words.append(word_str)

                        (word_beforeStuff, word_str, word_afterStuff) = Helper.cleanWordForInitialAdd(word_str)

                        if Helper.cleanWord(word_str, stripApostropheS=True) in self.namesSet:
                            wasPluralWithApostrophe = False
                            word_str = word_str.translate(smartQuoteTable)
                            if word_str.endswith("'s"):
                                word_str = word_str[:-2]
                                wasPluralWithApostrophe = True
                            word_class = self.getMarkUnderWord(word_str, last20Words, wasPluralWithApostrophe)
                        else:
                            word_class = WordClass.addWordOrMarkup(word_str)
                        allWords.append(word_class)
                        # need to manually add a space since they're removed in the split
                        #TODO: add spaces back only where they were taken from
                        markupFile.write(word_beforeStuff + word_class.printMarkup() + word_afterStuff + ' ')

コード例 #2

ファイルを表示

ファイル: WordFrequenciesClass.py プロジェクト: dirkstahlecker/WordFrequencies

    def addLine(self, line, currentDate):
        """Tally the words and names found in one line of text.

        The line is split on single spaces. Every non-blank token is passed
        through Helper.cleanWordForInitialAdd, wrapped in a WordClass, cleaned
        with Helper.cleanWord and, when Helper.valid accepts it, recorded in
        the word and name counters kept on this instance.

        Args:
            line: The raw text line to process.
            currentDate: The date value stored alongside every count that is
                updated for this line.

        Returns:
            A tuple (wordsToCount, namesFound): the number of valid words in
            the line and the set of names that were recognised in it.
        """
        wordsToCount = 0 #used to calculate the length of entries - don't want to include invalid words in the word count TODO: rethink this?
        namesFound = set()
        for word in line.split(' '):
            # Consecutive spaces yield empty tokens; tabs and newlines yield
            # whitespace-only tokens. Neither is a word.
            if not word or word.isspace():
                continue

            # The text surrounding the word is not needed for counting.
            (_beforeStuff, word, _afterStuff) = Helper.cleanWordForInitialAdd(word)

            word = WordClass(word) #words are represented by the WordClass, which is basically an encapsulation of normal words and markup names in one object

            if self.prefs.COMBINE_PLURALS:
                # NOTE(review): relies on WordClass providing endswith() and
                # len() - confirm against WordClass before changing.
                if word.endswith("'s"):
                    word = WordClass.addWordOrMarkup(word.toString()[:len(word)-2]) #TODO: this is broken

            wasUpper = word.toString()[:1].isupper()
            word = Helper.cleanWord(word) #this strips off all punctuation and other information that we want to pass into markup.

            if not Helper.valid(word):
                continue
            wordsToCount += 1

            #names
            # Capitalisation is only demanded when the preference asks for it;
            # with the preference off every known name counts.
            if word in self.namesSet and (wasUpper or not Preferences.REQUIRE_CAPS_FOR_NAMES):
                namesFound.add(word)

                try:
                    previousCount = self.namesDict[word][0]
                except KeyError:
                    previousCount = 0
                self.namesDict[word] = (previousCount + 1, currentDate)

                #names per day
                try:
                    perDayEntry = self.namesPerDayDict[word]
                except KeyError:
                    self.namesPerDayDict[word] = (1, currentDate)
                else:
                    # Only the first occurrence on a given date bumps the count.
                    if perDayEntry[1] != currentDate:
                        self.namesPerDayDict[word] = (perDayEntry[0] + 1, currentDate)

                #names for graphing purposes
                #{ word : [ [ date , count ] ] }
                try:
                    history = self.namesToGraphDict[word]
                except KeyError: #this name hasn't been encountered yet
                    self.namesToGraphDict[word] = [[currentDate, 1]]
                else:
                    if history[-1][0] == currentDate: #increment count
                        history[-1][1] += 1
                    else: #start a new entry with a new date
                        history.append([currentDate, 1])

                #names for graph, counting on unique occurences
                #{ word : [ date ] }
                try:
                    self.namesToGraphDictUniqueOccurences[word].append(currentDate)
                except KeyError:
                    self.namesToGraphDictUniqueOccurences[word] = [currentDate]

            #words
            if self.wordDict.exists(word):
                self.wordDict.addOrReplaceWord(word, self.wordDict.getCount(word) + 1, currentDate, self.wordDict.getFirstOccurrence(word), wasUpper)
            else:
                self.wordDict.addWord(word, 1, currentDate, currentDate, wasUpper) #TODO: wasUpper wasn't there originally

            #words per day
            if self.wordsPerDayDict.exists(word):
                self.wordsPerDayDict.addWord(word, self.wordsPerDayDict.getCount(word), currentDate) #TODO: was addOrReplaceWord, need to think what it should be
            else:
                # Must go through addWord like the branch above; calling the
                # dictionary object itself was a mistake.
                self.wordsPerDayDict.addWord(word, 1, currentDate)

            #TODO: mark-under output for names is being moved to its own class to be called separately

        return (wordsToCount, namesFound)