def main():
    """Build a dictionary from the word files named on the command line.

    Every word parsed from each input file is added to a fresh Dictionary,
    which is then written to 'words.dat'.
    """
    input_paths = sys.argv[1:]
    dictionary = Dictionary()
    for path in input_paths:
        for token in parseWords(path):
            dictionary.add_word(token)
    dictionary.save("words.dat")
def file_to_dict(path):
    """Build a Dictionary from a word-list file.

    Each line consisting solely of lowercase letters (a-z) is added as a
    word; all other lines are skipped. A progress message is printed every
    25000 lines.

    :param path: path to the word-list file, one word per line.
    :return: the populated Dictionary, with its word count updated.
    """
    # Hoisted out of the loop: compile the pattern once instead of per line.
    word_pattern = re.compile(r'^[a-z]+$')
    dictionary = Dictionary()
    counter = 0
    # 'with' guarantees the file is closed even if add_word raises
    # (the original leaked the handle on any exception).
    with open(path, 'r') as word_file:
        for line in word_file:
            # '$' matches just before the trailing newline, so plain
            # lowercase words pass without stripping first.
            if word_pattern.match(line) is not None:
                dictionary.add_word(line.strip())
            if counter % 25000 == 0:
                # Original used the Python 2 print statement, a syntax
                # error under Python 3 (which the rest of this file uses).
                print("Loading Dictionary...")
            counter += 1
    dictionary.update_word_count()
    return dictionary
def load_sentence_dict(data_file, max_len=0, remove_stop=False, encoding='utf8',
                       split_symbol='\t', low_case=False, language='english'):
    """Build a Dictionary from a labelled-sentence file.

    Each line has the form ``<label><split_symbol><sentence>``. The sentence
    is tokenised with generate_sentence_token and every token is added to
    the dictionary; labels are read but not stored.

    :param data_file: path to the input file.
    :param max_len: forwarded to generate_sentence_token (0 = no limit).
    :param remove_stop: whether to drop stop words during tokenisation.
    :param encoding: text encoding of data_file.
    :param split_symbol: separator between the label and the sentence.
    :param low_case: whether to lower-case tokens.
    :param language: language passed to the tokeniser.
    :return: the populated Dictionary.
    """
    d = Dictionary()
    # Bug fix: the original opened in text mode ('r') and then called
    # line.decode(encoding). In Python 3 text-mode lines are str, which has
    # no .decode(), so this raised AttributeError on the first line. Decode
    # at the I/O boundary instead by passing the encoding to open().
    with open(data_file, 'r', encoding=encoding) as fin:
        for line in fin:
            # Exactly two fields are expected; extra separators raise
            # ValueError, matching the original's strict unpacking.
            label, sentence = line.strip().split(split_symbol)
            sentence_token = generate_sentence_token(sentence, max_len=max_len,
                                                     remove_stop=remove_stop,
                                                     low_case=low_case,
                                                     language=language)
            for token in sentence_token:
                d.add_word(token)
    return d
def _load_dictionary(self, path):
    """Parse a dictionary definition file into a Dictionary.

    Blank lines and lines starting with '#' are skipped. Remaining lines
    are split on whitespace into cells; the last cell is a comma-separated
    list of definitions. Two cells mean a whole-word entry whose first cell
    is a '+'-joined tag chain; three cells mean a morpheme entry
    (text, tag, definitions). Any other shape raises.

    :param path: path to the UTF-8 dictionary file.
    :return: the populated Dictionary.
    :raises Exception: on a line with fewer than 2 or more than 3 cells.
    """
    dictionary = Dictionary(self)
    with open(path, encoding="utf-8") as f:
        for line in f:
            # Skip blank lines and comment lines.
            if line.isspace() or line[0] == "#":
                continue
            # Normalise spaces to tabs, split, drop empty fields, strip each.
            # (Filtering happens before stripping, as in the original, so a
            # whitespace-only field strips down to an empty cell.)
            cells = [cell.strip()
                     for cell in line.replace(" ", "\t").split("\t") if cell]
            text = cells[0]
            definitions = [d.strip(" \n\t") for d in cells[-1].split(",")]
            if len(cells) == 2:
                # tag-chain + definitions -> whole word entry
                tags = text.split("+")
                dictionary.add_word(dictionary.to_word(tags, definitions))
            elif len(cells) == 3:
                # text + tag + definitions -> morpheme entry
                dictionary.add_morpheme(cells[1], text, definitions)
            else:
                raise Exception("Bad line '{}'".format(cells))
    return dictionary
class TestDictionary(unittest.TestCase):
    """Unit tests for the Dictionary class and its statistics helper."""

    DEFAULT_TABLE_SIZE = 250727
    DEFAULT_HASH_BASE = 31
    DEFAULT_TIMEOUT = 10
    FILENAMES = ['english_small.txt', 'english_large.txt', 'french.txt']
    RANDOM_STR = 'FIT1008 is the best subject!'

    def setUp(self) -> None:
        """ Used by our test cases """
        self.dictionary = Dictionary(TestDictionary.DEFAULT_HASH_BASE,
                                     TestDictionary.DEFAULT_TABLE_SIZE)

    def test_init(self) -> None:
        """ Testing type of our table and the length is 0 """
        self.assertEqual(type(self.dictionary.hash_table), LinearProbeHashTable)
        self.assertEqual(len(self.dictionary.hash_table), 0)

    def test_load_dictionary_statistics(self) -> None:
        """ For each file, doing some basic testing on the statistics generated """
        print("Testing load dictionary statistics method......")
        statistics = Statistics()
        for filename in TestDictionary.FILENAMES:
            # 'elapsed' rather than 'time' so we don't shadow the time module.
            (words, elapsed, collision_count, probe_total,
             probe_max, rehash_count) = statistics.load_statistics(
                TestDictionary.DEFAULT_HASH_BASE,
                TestDictionary.DEFAULT_TABLE_SIZE * 2,
                filename,
                TestDictionary.DEFAULT_TIMEOUT)
            self.assertGreater(words, 0)
            self.assertLess(elapsed, TestDictionary.DEFAULT_TIMEOUT)
            # test case 1: every count returned by load_statistics must be an
            # integer. Use assertTrue instead of a bare assert, which is
            # silently stripped when Python runs with -O.
            integers = [words, collision_count, probe_total, probe_max, rehash_count]
            self.assertTrue(all(isinstance(item, int) for item in integers))

    def test_load_dictionary(self) -> None:
        """ Reading a dictionary and ensuring the number of lines matches the number of words
        Also testing the various exceptions are raised correctly """
        for filename in TestDictionary.FILENAMES:
            self.dictionary = Dictionary(TestDictionary.DEFAULT_HASH_BASE,
                                         TestDictionary.DEFAULT_TABLE_SIZE)
            words = self.dictionary.load_dictionary(filename)
            lines = file_len(filename)
            self.assertEqual(words, lines, "Number of words should match number of lines")
        # test case 1: loading a missing file must not raise
        # FileNotFoundError and should report zero words loaded.
        print("Testing load dictionary method......work on it")
        filename_2 = 'engli.txt'
        bucket = Dictionary(TestDictionary.DEFAULT_HASH_BASE,
                            TestDictionary.DEFAULT_TABLE_SIZE)
        words = bucket.load_dictionary(filename_2)
        self.assertEqual(words, 0, "Number of words should be 0")

    def test_add_word(self) -> None:
        """ Testing the ability to add words """
        print("Testing add word......")
        # test case 1: inserting a single word grows the table to size 1
        self.dictionary.add_word("Hello")
        current_size = len(self.dictionary.hash_table)
        self.assertEqual(current_size, 1, "add word method not working properly")
        # test case 2: inserting several distinct words updates the count
        test_list_2 = ['to', 'customize', 'exception', 'parameters', 'while',
                       'giving', 'you', 'complete', 'control', 'of', 'the active']
        test_list_2_size = len(test_list_2)
        for item in test_list_2:
            self.dictionary.add_word(item)
        current_size = len(self.dictionary.hash_table)
        self.assertEqual(current_size, test_list_2_size + 1,
                         "add word method not working properly")

    def test_find_word(self) -> None:
        """ Ensuring both valid and invalid words """
        print("Testing find word......")
        # test case 1: words were stored lower-case by test_add_word; querying
        # in upper case should still find them (find_word is expected to
        # normalise the case and return True).
        self.test_add_word()
        test_list_2 = ['TO', 'CUSTOMIZE', 'EXCEPTION', 'PARAMETERS', 'WHILE',
                       'GIVING', 'YOU', 'COMPLETE', 'CONTROL', 'OF', 'THE ACTIVE']
        for item in test_list_2:
            result = self.dictionary.find_word(item)
            # Fixed copy-paste bug: the failure message previously blamed
            # the add word method.
            self.assertEqual(result, True, "find word method not working properly")
        # test case 2: a word not in the dictionary must return False
        word = "AMAKOHIA"
        result = self.dictionary.find_word(word)
        self.assertEqual(result, False, "find word method not working properly")

    def test_delete_word(self) -> None:
        """ Deleting valid words and ensuring we can't delete invalid words """
        print("Testing delete word......")
        self.dictionary.load_dictionary('english_small.txt')
        table_size = len(self.dictionary.hash_table)
        # Deleting a word that is not present must raise KeyError and leave
        # the table size unchanged.
        with self.assertRaises(KeyError):
            self.dictionary.delete_word(TestDictionary.RANDOM_STR)
        self.assertEqual(len(self.dictionary.hash_table), table_size)
        # Deleting an existing word shrinks the table by exactly one.
        self.dictionary.delete_word('test')
        self.assertEqual(len(self.dictionary.hash_table), table_size - 1)
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
"""Generate a dictionary file from a plain word list.

Usage: generate_dictionary.py <input file> <output dictionary>
"""
from dictionary import Dictionary
import sys

if len(sys.argv) != 3:
    # Fixed typo in the usage message ("ouput" -> "output").
    sys.exit("Usage: generate_dictionary.py <input file> <output dictionary>")

with open(sys.argv[1], 'r') as input_file:
    d = Dictionary()
    d.open(sys.argv[2])
    # try/finally ensures the dictionary handle is closed even if a word
    # fails to load part-way through (the original leaked it on error).
    try:
        d.clear()
        for word in input_file:
            d.add_word(word.strip())
        d.save()
    finally:
        d.close()
"""Build a word Dictionary from a text file and pickle it to disk.

Words are ranked by descending frequency (ties broken alphabetically) and
at most --max_vocab entries are kept, counting words already present in
the fresh Dictionary.
"""
import argparse
import os
import pickle

from dictionary import Dictionary

parser = argparse.ArgumentParser()
parser.add_argument('data', help='text file to make dictionary from')
parser.add_argument('out', help='path to write dictionary pickle to')
parser.add_argument('--max_vocab', type=int, default=100000,
                    help='max_words in dictionary')
args = parser.parse_args()

# parser.error gives a clean usage message and exit code 2; the original
# used assert, which is silently stripped when Python runs with -O.
if not os.path.exists(args.data):
    parser.error("data file not found: {}".format(args.data))

dic = Dictionary()

# Count whitespace-separated word frequencies.
freq = {}
with open(args.data, 'r') as f:
    for line in f:
        for word in line.split():
            freq[word] = freq.get(word, 0) + 1

# Negating the count sorts by descending frequency while keeping the
# alphabetical tie-break from the tuple's second element. Budget leaves
# room for words the Dictionary already holds.
budget = args.max_vocab - len(dic.idx2word)
for _, word in sorted([(-count, w) for w, count in freq.items()])[:budget]:
    dic.add_word(word)

with open(args.out, 'wb') as out_file:
    pickle.dump(dic, out_file)