def __init__(self, i):
    """Set up word-forming helpers and relevance bookkeeping for index task *i*.

    Args:
        i: the indexing task(s) handed to this instance (opaque here;
           presumably produced by the caller — TODO confirm its shape).
    """
    self.wordFormer = FormWords()
    self.indexTasks = i
    self.constants = ConstantVars()
    # Object arrays of 100 independent empty dicts — one slot per candidate
    # document, it seems; NOTE(review): the fixed size 100 is assumed by
    # callers elsewhere, confirm before changing.
    self.relatedDocs = np.array([dict() for _ in range(100)])
    self.notRelatedDocs = np.array([dict() for _ in range(100)])
    self.notRelatedCounts = 0
def __init__(self):
    """Hold Persian text-normalization data: alphabet, verb affixes, suffixes
    and compiled multi-word expression rewrite patterns.
    """
    # Persian letters plus ZWNJ (U+200C) and diacritic/hamza forms.
    self.alphabet = [
        'پ', 'چ', 'ج', 'ح', 'خ', 'ه', 'ع', 'غ', 'ف', 'ق', 'ث', 'ص', 'ض',
        'گ', 'ک', 'م', 'ن', 'ت', 'ا', 'ل', 'ب', 'آ', 'ی', 'س', 'ش', 'و',
        'ئ', 'د', 'ذ', 'ر', 'ز', 'ط', 'ظ', 'أ', 'ژ', '\u200c', 'ُ', 'ّ',
        'ة', 'ۀ', 'ؤ', 'ء', 'إ',
    ]
    self.constants = ConstantVars()
    # Clitics that may follow / precede verb stems.
    self.after_verbs = {'ام', 'ای', 'ایم', 'اید', 'اند'}
    self.before_verbs = {'می', 'نمی'}
    self.suffixes = {
        'ی', 'ای', 'ها', 'های', 'تر', 'تری', 'ترین',
        'گر', 'گری', 'ام', 'ات', 'اش',
    }
    # (spaced form, canonical ZWNJ-joined form) rewrite pairs, compiled once.
    expression_pairs = [
        ('علی ای حال', 'علی\u200cای\u200cحال'),
        ('بنا بر این', 'بنابراین'),
        ('بنابر این', 'بنابراین'),
        ('مع ذالک', 'مع\u200cذالک'),
        ('فی ما بین', 'فی\u200cمابین'),
        ('فی مابین', 'فی\u200cمابین'),
        ('چنان چه', 'چنان\u200cچه'),
        ('در واقع', 'درواقع'),
        ('فی کل حال', 'فی\u200cکل\u200cحال'),
    ]
    self.expression = compile_patterns(expression_pairs)
def __init__(self):
    """Initialize index-construction state: I/O helpers, an empty term
    dictionary and a pre-sized posting-list array.
    """
    self.input = FileInOut()
    self.wordFormer = FormWords()
    self.constants = ConstantVars()
    self.dictionary = dict()
    # Pre-allocated object array of 150000 independent dicts — presumably one
    # postings dict per dictionary term slot; TODO confirm the capacity bound.
    self.posting_list = np.array([dict() for _ in range(150000)])
    # Cursors into the dictionary / documents, plus a general counter.
    self.dicIndex = 0
    self.docIndex = 0
    self.c = 0
def __init__(self):
    """Load the persisted dictionary, doc-ID and posting-list files and reset
    per-query relevance bookkeeping.
    """
    self.input = FileInOut()
    # Persisted index artifacts read back from disk via the I/O layer.
    self.Dic = self.input.readDic()
    self.DocID_file = self.input.readDocID()
    self.posting_file = self.input.readPostingList()
    self.wordFormer = FormWords()
    self.constants = ConstantVars()
    # Relevance-feedback accumulators, empty until a query is processed.
    self.relatedDocs = []
    self.notRelatedDocs = []
    self.relatedDocsPos = []
    self.notRelatedDocsPos = []
    self.notRelatedCounts = 0
def get_query_termList(query):
    """Turn a raw query string into a cleaned list of lemmatized terms.

    Pipeline: normalize -> tokenize -> drop punctuation/stop-words ->
    uniform -> stem -> lemmatize -> drop stray double-quote tokens.

    Args:
        query: the raw user query string.

    Returns:
        list[str]: lemmatized query terms with punctuation, stop-words and
        '"' tokens removed.
    """
    wordFormer = FormWords()
    constants = ConstantVars()
    query = wordFormer.normalize(query)
    query_tokens = wordFormer.tokenize(query)
    # BUG FIX: the original called query_tokens.remove(token) while iterating
    # query_tokens, which skips the element following each removal, so
    # consecutive stop-words/punctuation survived. Filter into a new list.
    # Also hoist the (presumably pure — TODO confirm) constant lookups out of
    # the per-token test.
    punctuations = constants.punctuations()
    stop_words = constants.StopWords()
    query_tokens = [
        token for token in query_tokens
        if token not in punctuations and token not in stop_words
    ]
    query_tokens = wordFormer.uniform(query_tokens)
    stemmed_tokens = wordFormer.stemmWords(query_tokens)
    lemmatized_tokens = wordFormer.lemmatizeWords(stemmed_tokens)
    # Drop stray double-quote tokens left over from phrase-query syntax.
    return [token for token in lemmatized_tokens if token != '"']
# Ad-hoc demo: run the full token pipeline on a sample query, printing the
# intermediate result of every stage. (Removed a large block of commented-out
# lemmatizer code that had been pasted here.)
from DataLayer.constants import ConstantVars
from BusinessLayer.textOperations import FormWords

wordFormer = FormWords()
constants = ConstantVars()

query_tokens = wordFormer.tokenize("شفاف سازی")
print('query tokens')
print(query_tokens)

postaged_tokens = wordFormer.posTagging(query_tokens)
print(postaged_tokens)

# NOTE(review): these calls pass extra length/POS arguments that the query
# path (get_query_termList) does not — confirm which signature is current.
stemmed_tokens = wordFormer.stemmWords(query_tokens, len(query_tokens))
print(stemmed_tokens)

lemmatized_tokens = wordFormer.lemmatizeWords(stemmed_tokens, postaged_tokens,
                                              len(query_tokens))
print(lemmatized_tokens)

# BUG FIX: the original removed items from lemmatized_tokens while iterating
# it, skipping the element after each removal. Filter into a new list instead.
punctuations = constants.punctuations()
stop_words = constants.StopWords()
lemmatized_tokens = [
    token for token in lemmatized_tokens
    if token not in punctuations and token not in stop_words
]
print(lemmatized_tokens)