Python Jd_Db.db_query_extend Examples

Programming Language: Python

Namespace/Package Name: jd_db

Class/Type: Jd_Db

Method/Function: db_query_extend

Examples at hotexamples.com: 4

Python Jd_Db.db_query_extend - 4 examples found. These are the top-rated real-world Python examples of jd_db.Jd_Db.db_query_extend extracted from open source projects. You can rate examples to help us improve the quality of examples.

Frequently Used Methods

Show Hide

Jd_Db(3)

db_query_extend(2)

db_query_process(1)

db_unprocess_count(1)

Example #1

Show file

File: suning_spider.py Project: taozhijiang/dust_repos

    def run(self):
        """Worker loop: fetch one URL at a time from the database and expand it.

        Each iteration calls ``jdb.db_query_extend()`` while holding
        ``gdb_lock`` and then hands the returned URL to ``get_product_ids``
        outside the lock. When the query returns nothing, the thread waits
        20 seconds and polls again. The loop has no exit condition, so this
        method only ends if an exception propagates.
        """
        print ("启动线程 %d ...\n" % self.threadID)
        jdb = Jd_Db()
        while True:
            # NOTE: a back-pressure check used to run here (sleep 60 s while
            # jdb.db_unprocess_count() > 200000); it is currently disabled.

            # Hold the global lock only for the query itself. Waiting for new
            # work happens outside the lock so that other threads needing
            # gdb_lock are not blocked for the whole sleep.
            with gdb_lock:
                full_url = jdb.db_query_extend()

            if not full_url:
                # Nothing to process yet: back off, then poll again.
                time.sleep(20)
                continue

            print("线程[%d]正在处理：%s" % (self.threadID, full_url) )
            get_product_ids(full_url, jdb, self.threadID)

        # NOTE(review): unreachable -- the loop above never breaks.
        print ("退出线程 %d ..." % self.threadID)

Example #2

Show file

    def run(self):
        """Run the worker: poll the database for URLs and process each one.

        A URL is requested through ``jdb.db_query_extend()`` under
        ``gdb_lock``; the lock is released before either sleeping (when no
        URL came back) or calling ``get_product_ids`` on the URL. The outer
        loop never terminates on its own.
        """
        print("启动线程 %d ...\n" % self.threadID)
        jdb = Jd_Db()
        while True:
            # NOTE: a disabled throttle lived here -- it paused for 60 s
            # whenever jdb.db_unprocess_count() exceeded 200000.

            while True:
                # Lock only around the query; never sleep while holding
                # gdb_lock, otherwise every other thread that needs the lock
                # stalls until this worker finally receives a URL.
                with gdb_lock:
                    full_url = jdb.db_query_extend()
                if full_url:
                    break
                time.sleep(20)

            print("线程[%d]正在处理：%s" % (self.threadID, full_url))
            get_product_ids(full_url, jdb, self.threadID)

        # NOTE(review): unreachable -- the outer loop has no break.
        print("退出线程 %d ..." % self.threadID)

Example #3

Show file

File: jd_spider.py Project: dream1986/jd_spider

 def run(self):
     """Worker loop: throttle on backlog, then fetch and expand one URL.

     While ``jdb.db_unprocess_count()`` is above 200000 the thread sleeps
     60 seconds and re-checks. Otherwise it polls
     ``jdb.db_query_extend()`` under ``gdb_lock`` until a URL is returned
     and passes that URL to ``get_product_ids``. The outer loop never
     terminates on its own.
     """
     print ("启动线程 %d ...\n" % self.threadID)
     jdb = Jd_Db(jd_config.SQLITE_DB)
     while True:
         if jdb.db_unprocess_count() > 200000:
             # Backlog too large: pause before expanding more pages.
             time.sleep(60)
             continue

         while True:
             # Take the lock per query rather than around the whole polling
             # loop, so an empty queue does not keep gdb_lock held.
             with gdb_lock:
                 full_url = jdb.db_query_extend()
             if full_url:
                 # NOTE: a disabled filter used to sit here; it dropped URLs
                 # on certain jd.com subdomains (help, red, tuan, ...) and
                 # under /compare/ or /consultation/ via
                 # jdb.db_drop_rubbish(full_url) instead of processing them.
                 break
             # Back off between empty polls instead of spinning on the
             # database at full speed.
             time.sleep(20)

         print("线程[%d]正在处理：%s" % (self.threadID, full_url) )
         get_product_ids(full_url, jdb, self.threadID)

     # NOTE(review): unreachable -- the outer loop has no break.
     print ("退出线程 %d ..." % self.threadID)

Example #4

Show file

    def run(self):
        """Run the worker: respect the backlog limit, then process one URL.

        The thread sleeps 60 seconds whenever ``jdb.db_unprocess_count()``
        exceeds 200000. Otherwise it asks ``jdb.db_query_extend()`` for a
        URL (holding ``gdb_lock`` only for that call), waits 20 seconds
        between empty answers, and forwards the URL to ``get_product_ids``.
        There is no exit condition for the outer loop.
        """
        print("启动线程 %d ...\n" % self.threadID)
        jdb = Jd_Db(jd_config.SQLITE_DB)
        while True:
            if jdb.db_unprocess_count() > 200000:
                # Too many unprocessed entries: hold off on expanding pages.
                time.sleep(60)
                continue

            full_url = None
            while not full_url:
                # gdb_lock is released between polls so that an empty queue
                # cannot pin the lock and starve other threads.
                with gdb_lock:
                    full_url = jdb.db_query_extend()
                if not full_url:
                    # Avoid a tight busy-wait against the database.
                    time.sleep(20)

            # NOTE: a disabled filter once rejected URLs on certain jd.com
            # subdomains (help, red, tuan, ...) and under /compare/ or
            # /consultation/ by calling jdb.db_drop_rubbish(full_url).

            print("线程[%d]正在处理：%s" % (self.threadID, full_url))
            get_product_ids(full_url, jdb, self.threadID)

        # NOTE(review): unreachable -- the outer loop has no break.
        print("退出线程 %d ..." % self.threadID)