Python Nlp_util.reset_widx Exemples

Langage de programmation: Python

Espace de noms/Paquet : common.word_format.df_utils

Class/Type: Nlp_util

Méthode/Fonction: reset_widx

Exemples sur hotexamples.com : 4

Python Nlp_util.reset_widx - 4 exemples trouvés. Ce sont les exemples réels les mieux notés de common.word_format.df_utils.Nlp_util.reset_widx extraits de projets open source. Vous pouvez noter les exemples pour nous aider à en améliorer la qualité.

Méthodes fréquemment utilisées

Afficher Cacher

are_words1_words2_words3_in_order(20)

make_noun_list(8)

make_verb_list(7)

get_idx_list_of_word(7)

get_idx_list_of_idiom(6)

reset_widx(4)

is_first_subject_in(4)

get_idx_list_of_word_list(4)

get_idx_list_of_idiom_list(2)

get_wordsDF_of_wordlist_after_idx(2)

exists_any_noun_verb_pair(1)

exist_subj_for_first_verb(1)

convert_objective_noun_to_nominative(1)

is_any_verb_before_first_noun(1)

is_any_verb_for_first_noun(1)

is_first_adj_after_first_sub_in(1)

convert_nominative_noun_to_objective(1)

is_first_verb_in(1)

make_adj_list(1)

change_subject_other_way_around(1)

change_object_pronoun_to_pronoun(1)

adjust_be_verb_for_changed_subject(1)

Méthodes fréquemment utilisées

are_words1_words2_words3_in_order (20)

make_noun_list (8)

make_verb_list (7)

get_idx_list_of_word (7)

get_idx_list_of_idiom (6)

reset_widx (4)

is_first_subject_in (4)

get_idx_list_of_word_list (4)

get_idx_list_of_idiom_list (2)

get_wordsDF_of_wordlist_after_idx (2)

Méthodes fréquemment utilisées

exists_any_noun_verb_pair (1)

exist_subj_for_first_verb (1)

convert_objective_noun_to_nominative (1)

is_any_verb_before_first_noun (1)

is_any_verb_for_first_noun (1)

is_first_adj_after_first_sub_in (1)

convert_nominative_noun_to_objective (1)

is_first_verb_in (1)

make_adj_list (1)

change_subject_other_way_around (1)

change_object_pronoun_to_pronoun (1)

adjust_be_verb_for_changed_subject (1)

Méthodes fréquemment utilisées

change_object_pronoun_to_pronoun (1)

adjust_be_verb_for_changed_subject (1)

Exemple #1

0

Afficher le fichier

def cut_sent_by_interjection(cls, df):
    """Split sentences in ``df`` at separator words accepted by the class check.

    Rows whose ``word`` is one of the separators listed below and whose
    ``widx`` is not 0 are scanned in row order. For the first candidate that
    ``cls.__exists_SV_around_cc`` accepts, ``sidx`` is incremented on every
    row with ``sidx`` >= the separator's and index label >= the separator's,
    ``widx`` is recomputed through ``Nlp_util.reset_widx`` and the scan starts
    over. The function returns once a full scan cuts nothing.

    Args:
        cls: Object providing ``__exists_SV_around_cc(df, candidates, row)``.
        df: pandas DataFrame with ``word``, ``pos``, ``widx`` and ``sidx``
            columns. The ``sidx`` column may be modified in place.

    Returns:
        The re-segmented DataFrame. If any exception is raised it is logged
        and the frame as it stands at that point is returned.
    """
    separators = [",", "and", "but", "or", "then", "so", "plus", "cause", "because"]
    try:
        while True:
            # A separator at widx 0 already starts a sentence, so it is skipped.
            candidates = df[df.word.isin(separators) & (df.widx != 0)]
            for idx, separator in candidates.iterrows():
                # "so" tagged RB and "cause" not tagged VB are never cut points.
                if separator.word == 'so' and separator.pos == 'RB':
                    continue
                if separator.word == 'cause' and separator.pos != 'VB':
                    continue
                if cls.__exists_SV_around_cc(df, candidates, separator):
                    # Push the separator and everything after it one sentence later.
                    df.loc[(df.sidx >= separator.sidx) & (df.index >= idx), "sidx"] += 1
                    df = Nlp_util.reset_widx(df)
                    break
            else:
                # NOTE(review): the source formatting was collapsed; this
                # ``else`` is read as belonging to the ``for`` loop (no cut
                # was made in a full scan, so the work is done) -- confirm.
                return df
    except Exception:
        # Best effort: log and hand back whatever state the frame is in.
        logging.exception('')
        return df

Exemple #2

0

Afficher le fichier

def cut_sent_by_unimportant_words_at_head(cls, df):
    """Separate or remove unwanted leading words of multi-word sentences.

    Each pass looks at the first row of every sentence (rows sharing a
    ``sidx``) that has more than one row:

    * if its word is listed in ``UNIMPORTANT_WORDS_FOR_REPEAT.word``, ``sidx``
      is incremented on every row whose index label is greater than the head
      row's, and ``widx`` is recomputed through ``Nlp_util.reset_widx``;
    * otherwise, if the word is neither alphabetic nor all digits, the row is
      removed through ``cls.__remove_nums_n_symbols``.

    After any change the scan restarts; it stops when a pass changes nothing
    or the frame becomes empty.

    Args:
        cls: Object providing ``__remove_nums_n_symbols(fixed_df, sidx)``.
        df: pandas DataFrame with ``word`` and ``sidx`` columns. Its ``sidx``
            column may be modified in place.

    Returns:
        The adjusted DataFrame. If any exception is raised it is logged and
        the ``df`` argument is returned instead.
    """
    try:
        fixed_df = df
        while len(fixed_df):
            modified = False
            for sidx in set(fixed_df.sidx):
                sentence = fixed_df[fixed_df.sidx == sidx]
                if len(sentence) == 1:
                    # A one-word sentence has nothing to split off.
                    continue
                head_row = sentence.iloc[0]
                head_word = head_row.word
                if head_word in UNIMPORTANT_WORDS_FOR_REPEAT.word.values:
                    # Leave the head word alone in its sentence; shift the rest.
                    fixed_df.loc[fixed_df.index > head_row.name, "sidx"] += 1
                    fixed_df = Nlp_util.reset_widx(fixed_df)
                    modified = True
                    break
                if not head_word.isalpha() and not head_word.isdigit():
                    fixed_df = cls.__remove_nums_n_symbols(fixed_df, sidx)
                    modified = True
                    break
            if not modified:
                break
        return fixed_df
    except Exception:
        # Best effort: log and fall back to the caller's frame.
        logging.exception('')
        return df

Exemple #3

0

Afficher le fichier

def __remove_nums_n_symbols(cls, fixed_df, sidx):
    """Drop the first row of sentence ``sidx`` and renumber that sentence.

    The first row whose ``sidx`` matches is dropped, the index is rebuilt as
    0..n-1, and the remaining rows of that sentence are replaced by the result
    of ``Nlp_util.reset_widx`` applied to them.

    Args:
        cls: Unused by this function.
        fixed_df: pandas DataFrame with a ``sidx`` column.
        sidx: Identifier of the sentence whose head row is removed.

    Returns:
        The updated DataFrame. If any exception is raised it is logged and
        ``fixed_df`` is returned in whatever state it had reached (unchanged
        when no row matches ``sidx``).
    """
    try:
        head_label = fixed_df[fixed_df.sidx == sidx].iloc[0].name
        fixed_df = fixed_df.drop(head_label).reset_index(drop=True)
        # Build the mask only after re-indexing so it lines up with the new index.
        in_sentence = fixed_df.sidx == sidx
        fixed_df.loc[in_sentence] = Nlp_util.reset_widx(fixed_df.loc[in_sentence])
        return fixed_df
    except Exception:
        logging.exception('')
        return fixed_df

Exemple #4

0

Afficher le fichier

def remove_unimportant_words_at_tail(df):
    """Strip trailing filler words and commas from each sentence in ``df``.

    For every sentence (rows sharing a ``sidx``) the row whose ``widx`` equals
    the sentence length minus one is examined. While the sentence has more
    than one row and that word is ``","`` or is listed in
    ``UNIMPORTANT_WORDS_FOR_REPEAT.word``, the row is dropped and ``widx`` is
    recomputed through ``Nlp_util.reset_widx``. A trailing ``'well'`` is kept
    when its ``widx`` is greater than half the sentence length.

    Args:
        df: pandas DataFrame with ``word``, ``sidx`` and ``widx`` columns.

    Returns:
        The trimmed DataFrame with its index rebuilt as 0..n-1. If any
        exception is raised it is logged and the frame as it stands at that
        point is returned.
    """
    try:
        for sidx in set(df.sidx.values):
            while True:
                sentence_len = len(df[df.sidx == sidx])
                if sentence_len == 1:
                    # Never remove the last remaining word of a sentence.
                    break
                tail_row = df.loc[(df.sidx == sidx) & (df.widx == sentence_len - 1)]
                tail_word = tail_row.word.values[0]
                if tail_word != "," and tail_word not in UNIMPORTANT_WORDS_FOR_REPEAT.word.values:
                    break
                if tail_word == 'well' and tail_row.widx.values[0] > sentence_len / 2:
                    break
                df = df.drop(tail_row.index[0])
                df = Nlp_util.reset_widx(df)
        # NOTE(review): the source formatting was collapsed; the index reset is
        # placed after the sentence loop -- confirm against the upstream file.
        df = df.reset_index(drop=True)
        return df
    except Exception:
        # Best effort: log and hand back whatever state the frame is in.
        logging.exception('')
        return df