Esempio n. 1
0
def get_param(table):
    """Prune low-follow products from ``table`` and queue the rest.

    First deletes every row of ``table`` whose shop has ``follow < 10000``
    in the ``shop`` table.  Then collects the ``url`` of every remaining row
    whose ``update_time`` is NULL, loads those URLs into the shared thread
    queue and starts the workers with the ``'get_param'`` task.

    :param table: name of the product table.  It is concatenated into the
        SQL text as-is, so it must be a trusted identifier.
    """
    # Delete the products that belong to shops with few followers.
    sql = 'delete from '+table+' where sku in (select a.sku from (select a.sku from '+table+' a,shop b where a.shop_id=b.shop_id and b.follow<10000) a)'
    database_util.update_sql(sql, None)

    sql = 'SELECT url FROM '+table+' where update_time is null'
    result = database_util.search_sql(sql, None)
    url_list = []
    # The other loaders in this file only read result[1] when the status in
    # result[0] is not -1; apply the same guard here instead of reading the
    # payload unconditionally.
    if result[0] != -1:
        url_list = [row[0] for row in result[1]]
    thread_queue.fill_queue(url_list)
    thread_queue.use_threading(['get_param', table])
def get_shop_id(table):
    """Queue every SKU of ``table`` whose ``shop_id`` is still NULL.

    Rows with a NULL ``sku`` are reported on stdout and skipped.  The
    collected SKUs are loaded into the shared thread queue and the workers
    are started with the ``'get_shop_id'`` task.

    :param table: name of the product table (concatenated into the SQL).
    """
    query = 'SELECT sku FROM ' + table + ' where shop_id is null'
    outcome = database_util.search_sql(query, None)
    pending = []
    # A status of -1 in outcome[0] means the rows are not read at all.
    if outcome[0] != -1:
        for row in outcome[1]:
            value = row[0]
            if value is None:
                print("sku is null")
                continue
            pending.append(value)
    thread_queue.fill_queue(pending)
    thread_queue.use_threading(['get_shop_id', table])
Esempio n. 3
0
def get_shop_info(table=None):
    """Queue every shop whose ``update_time`` is still NULL.

    Selects ``shop_id`` from the ``shop`` table, skips (and reports on
    stdout) NULL ids, loads the rest into the shared thread queue and starts
    the workers with the ``'update_shop_info'`` task.

    :param table: value forwarded to the workers as the second task
        argument.  The original body read a free variable named ``table``
        that was never defined in the function; when this argument is
        omitted, a module-level ``table`` is used if one exists, otherwise
        ``None`` is forwarded instead of raising ``NameError``.
    """
    if table is None:
        # Backward compatibility with callers that relied on a module-level
        # `table` being picked up by the old body.
        table = globals().get('table')

    sql = 'SELECT shop_id FROM shop where update_time is null'
    result = database_util.search_sql(sql, None)
    shop_id = []
    # A status of -1 in result[0] means the rows are not read at all.
    if result[0] != -1:
        for row in result[1]:
            if row[0] is not None:
                shop_id.append(row[0])
            else:
                print("shop_id is null")
    thread_queue.fill_queue(shop_id)
    thread_queue.use_threading(['update_shop_info', table])
def get_comment(table):
    """Queue every SKU of ``table`` whose comments were never fetched.

    Selects the ``sku`` of rows whose ``update_comment_time`` is NULL,
    reports NULL SKUs on stdout and skips them, loads the rest into the
    shared thread queue and starts the workers with the ``'get_comment'``
    task.

    :param table: name of the product table (concatenated into the SQL).
    """
    query = 'SELECT sku FROM ' + table + ' where update_comment_time is null'
    outcome = database_util.search_sql(query, None)
    pending = []
    # A status of -1 in outcome[0] means the rows are not read at all.
    if outcome[0] != -1:
        for row in outcome[1]:
            value = row[0]
            if value is None:
                print("sku is null")
                continue
            pending.append(value)
    thread_queue.fill_queue(pending)
    # The third task argument is how many pages of comment data to fetch.
    task = ['get_comment', table, 100]
    thread_queue.use_threading(task)
def update_price(table):
    """Queue the price statistics of rows whose price is at least a day old.

    Selects ``sku``, ``max_price``, ``min_price``, ``avg_price`` and
    ``price_times`` for every row of ``table`` where
    ``TO_DAYS(NOW()) - TO_DAYS(update_price_time) >= 1``.  Each row becomes a
    dict (prices as ``float``, ``price_times`` as ``int``); the dicts are
    loaded into the shared thread queue and the workers are started with the
    ``'update_price'`` task.

    :param table: name of the product table (concatenated into the SQL).
    """
    query = 'SELECT sku,max_price,min_price,avg_price,price_times  FROM ' + table + ' where TO_DAYS(NOW()) - TO_DAYS(update_price_time) >=1'
    outcome = database_util.search_sql(query, None)
    records = []
    # A status of -1 in outcome[0] means the rows are not read at all.
    if outcome[0] != -1:
        records = [
            {
                'sku': row[0],
                'max_price': float(row[1]),
                'min_price': float(row[2]),
                'avg_price': float(row[3]),
                'price_times': int(row[4]),
            }
            for row in outcome[1]
        ]
    thread_queue.fill_queue(records)
    thread_queue.use_threading(['update_price', table])
Esempio n. 6
0
def get_url(url,table):
    """Crawl up to 39 listing pages of ``url`` and queue the item URLs found.

    Fetches ``url`` once to read the page count; returns without doing
    anything else if that fetch reports status -1.  Then requests
    ``url + "&page=<n>"`` for ``n`` from 1 up to the smaller of the page
    count and 39, skipping pages whose fetch reports status -1, and loads
    the item URLs of each page into the shared thread queue.  Finally starts
    the workers with the ``'insert_url'`` task.

    :param url: listing URL; ``&page=<n>`` is appended to it verbatim.
    :param table: forwarded to the workers as the second task argument.
    """
    crawler = jd_spider.Spider()
    landing = crawler.get_html(url)
    if landing[0] == -1:
        return

    total_pages = int(html_analysis.get_page_count(landing[1]))
    # Never walk past page 39, nor past the last page the site reports.
    last_page = min(total_pages, 39)
    for page in range(1, last_page + 1):
        response = crawler.get_html(url + "&page=" + str(page))
        if response[0] != -1:
            links = html_analysis.get_items_url(response[1])
            print('page:%s' % page)
            thread_queue.fill_queue(links)
    thread_queue.use_threading(['insert_url', table])
def update_shop_info(table):
    """Refresh stale shops, then copy per-brand ``follow`` into ``brand_hot``.

    Step 1: selects every ``shop_id`` from ``shop`` whose ``update_time`` is
    at least one day old, loads the ids into the shared thread queue and
    starts the workers with the ``'update_shop_info'`` task.

    Step 2: selects ``brand, follow`` from ``table`` grouped by brand and,
    for each returned row, sets ``brand_hot`` to that ``follow`` value on
    all rows of ``table`` with the same brand.

    :param table: name of the product table (concatenated into the SQL) and
        second task argument for the workers.
    """
    sql = 'SELECT shop_id FROM shop where TO_DAYS(NOW()) - TO_DAYS(update_time) >=1'
    result = database_util.search_sql(sql, None)
    shop_id = []
    # A status of -1 in result[0] means the rows are not read at all.
    if result[0] != -1:
        shop_id = [row[0] for row in result[1]]
    thread_queue.fill_queue(shop_id)
    thread_queue.use_threading(['update_shop_info', table])

    sql = 'select brand,follow from ' + table + ' group by brand order by follow'
    result = database_util.search_sql(sql, None)
    # Only walk the rows when the query reported success.  Previously the
    # loop ran unconditionally, so a -1 status made it iterate over the raw
    # (status, payload) result and index into the status value.
    if result[0] != -1:
        # The statement text does not depend on the row; build it once.
        update_stmt = 'update ' + table + ' set brand_hot=%s where brand=%s'
        for row in result[1]:
            database_util.update_sql(update_stmt, [row[1], row[0]])