# -*- coding: utf-8 -*-

'''Save the search results for the first 1000 keywords so they can be compared against the results after later search adjustments.'''

import io
import time

from libs.parameter import generateEnv
from lnc.search.simple import Simple

# Open a search session against the 'alpha' environment.
simple = Simple(generateEnv('alpha'))
simple.login()

# Everything after login runs under try/finally so the session is always
# closed and logged out, even when a search or a file operation fails.
try:
    # Pause after login (presumably to let the session become ready --
    # TODO confirm why five seconds are needed).
    time.sleep(5)

    keyword_file = 'input/keywords.txt'
    # One keyword per line, stored as UTF-8 bytes; decode to unicode up front.
    with open(keyword_file, 'r') as keyword_source:
        keywords = [unicode(k.strip(), 'utf-8') for k in keyword_source]

    # io.open encodes the unicode rows as UTF-8 on write. A plain Python 2
    # file object would fall back to the ASCII codec and raise
    # UnicodeEncodeError on any non-ASCII keyword or title.
    with io.open('output/after-adjust.csv', 'a', encoding='utf-8') as output:
        for keyword in keywords:
            res = simple.get_results_list(keyword)
            if not res:
                continue

            # Row layout: keyword|total|time|title. Only the first row of a
            # keyword carries keyword/total/time; every further title gets a
            # row whose first three columns are empty. A keyword with no
            # titles still produces one row with an empty title column.
            summary = [keyword, res['total'], res['time']]
            padding = [None, None, None]
            titles = list(res['title']) or [None]
            for index, title in enumerate(titles):
                row = (summary if index == 0 else padding) + [title]
                cells = [u'' if cell is None else cell for cell in row]
                output.write(u"%s|%s|%s|%s\n" % tuple(cells))

            # A blank line separates the result groups of consecutive keywords.
            output.write(u"\n")
            # Flush per keyword so partial results survive an interrupted run.
            output.flush()
finally:
    simple.close(logout=True)

Example #2
0
#-*- coding: utf-8 -*-

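'''
Read titles from the file input/exact_title.txt,
then search for each one and check whether the first result matches the title exactly.
Note that the title of an attachment is followed by a pair of parentheses containing the attachment's file name.
'''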

import re, time
from libs.parameter import generateEnv
from lnc.search.simple import Simple

# Load the titles to check, one per line. Each line is stripped and decoded
# from UTF-8 to unicode; the with-block closes the input file as soon as the
# list has been built instead of leaving the handle open.
with open('input/exact_title.txt') as title_source:
    input_titles = [unicode(x.strip(), 'utf-8') for x in title_source]

# Open a search session against the 'alpha' environment.
lnc_simple = Simple(generateEnv('alpha'))
lnc_simple.login()
# Pause after login (presumably to let the session become ready -- TODO confirm).
time.sleep(5)

# Pattern for the parenthesised suffix that follows an attachment's title:
# "(", one or more digits, any single character, up to four ASCII letters, ")".
# Written as a raw string so the backslashes reach the regex engine without
# relying on Python passing unknown string escapes through unchanged.
# NOTE(review): the "." is unescaped and therefore matches any character; if
# it is meant to be the literal dot before a file extension it should be
# r"\." -- confirm before tightening, since that changes what matches.
p = re.compile(r"\(\d+.[a-zA-Z]{,4}\)", re.IGNORECASE)

# Results file, opened in append mode so earlier runs are preserved.
output = open('logs/exact_title.csv', 'a')

for it in input_titles:
    title_list = lnc_simple.get_results_list(it)
    first_equal = False
    if title_list:
        if len(title_list[0]) > len(it) and title_list[0].find(it) > -1:
            remain_title = title_list[0][len(it):].strip()
            if p.match(remain_title):
                first_equal = True
        elif it == title_list[0]: