Example 1
 def info(self, info='', col_bits=5, pagenum=100):
     keywords = PreDeal.seg(info)
     # 1. Extract keywords
     keys = jieba.analyse.textrank(info,
                                   topK=10,
                                   withWeight=False,
                                   allowPOS=('ns', 'n', 'vn', 'v'))
     # 2. Use a search engine to crawl related web pages
     # 2.1 Crawl the result links
     spider_link = SpiderLink(keys, self.root)
     spider_link.crawl(pagenum)
     # 2.2 Crawl the page content
     filename = '_'.join(keys) + '.html'
     spider_to = SpiderTo(filename)
     spider_to.crawl()
     # 3. Preprocess the text: deduplicate, remove stop words, segment, and keep the url and keyword set
     p = PreDeal()
     filepath = os.path.join(config.spidertext, '_'.join(keys))
     propath = os.path.join(config.prepapath, '_'.join(keys))
     p.savetexts(filepath=filepath, prepath=propath)
     # 4. Build the index and retrieve web pages that contain the keyword information
     # 4.1 Build the index
     indexpath = os.path.join(config.indexpath, '_'.join(keys))
     Index.build(datapath=propath, indexpath=indexpath)
     search = Search(keys=keys, pindexp=indexpath)
     # 4.2 Search and save the results
     search.retrieve(keywords=keywords)
     # 5. Pick the best pages, describe their location information, and encode it
     info_kws = keywords[:]
     loc = Location(keywords=info_kws, col_bits=col_bits)
     name = '_'.join(keys)
     res_list = loc.describe(name)
     return res_list
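
The keyword-extraction step in both examples uses jieba's built-in TextRank extractor. A minimal standalone sketch of that call, with an illustrative sample sentence that is not part of the original project:

 import jieba.analyse

 text = '自然语言处理是人工智能领域的一个重要方向'
 # Top-10 keywords, limited to place names, nouns, verbal nouns, and verbs.
 keys = jieba.analyse.textrank(text,
                               topK=10,
                               withWeight=False,
                               allowPOS=('ns', 'n', 'vn', 'v'))
 print(keys)
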
Example 2
 def info(self, fi='', pagenum=100):
     info = FileUtil.readfile(fi)
     keywords = PreDeal.seg(info)
     # 1. Extract keywords
     keys = jieba.analyse.textrank(info,
                                   topK=10,
                                   withWeight=False,
                                   allowPOS=('ns', 'n', 'vn', 'v'))
     # 2. Use a search engine to crawl related web pages
     # 2.1 Crawl the result links
     spider_link = SpiderLink(keys, self.root)
     spider_link.crawl(pagenum)
     # 2.2 Crawl the page content
     filename = '_'.join(keys) + '.html'
     spider_to = SpiderTo(filename)
     spider_to.crawl()
     # 3. Preprocess the text: deduplicate, remove stop words, segment, and keep the url and keyword set
     p = PreDeal()
     filepath = os.path.join(config.spidertext, '_'.join(keys))
     prepath = os.path.join(config.prepapath, '_'.join(keys))
     p.savetexts(filepath=filepath, prepath=prepath)
     # 4. Build the index and retrieve web pages that contain the keyword information
     # 4.1 Build the index
     indexpath = os.path.join(config.indexpath, '_'.join(keys))
     idx = Index()
     idx.build(datapath=prepath, indexpath=indexpath)
     search = Search1(filename=fi, pindexp=indexpath)
     # 4.2 Search and save the results
     info_k = keywords[:]
     num = search.retrieve(keywords=info_k)
     return keywords, num
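
Neither example shows the enclosing class or its constructor, so a call site can only be sketched. In the hypothetical snippet below, the class name Analyzer and the root search URL are assumptions, not part of the original code:

 # Hypothetical usage; Analyzer and its root argument are assumed,
 # since the examples only show the info() method itself.
 analyzer = Analyzer(root='https://www.baidu.com/s?wd=')
 keywords, num = analyzer.info(fi='query.txt', pagenum=50)
 print(keywords, num)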