# NOTE(review): this physical line is whitespace-collapsed Python 2 source and
# holds two separate pieces of logic; nesting below is inferred from statement
# order, not from indentation -- confirm against a properly formatted copy.
#
# 1. `cur2.execute(sql, args) except: ... raise RuntimeError(msg)` is the tail
#    of a try/except whose `try:` (and enclosing definition) begins before this
#    line. It appears to replace any failure of the execute call with
#    RuntimeError("db error"); the bare `except:` keeps no detail of the
#    original error.
#
# 2. `while True:` loop. Each pass re-runs `cur.execute(sql)` and leaves the
#    loop once `cur.rowcount == 0`. The bare `print` (Python 2 statement)
#    emits an empty line, apparently once per batch. For every fetched row:
#      - the whole row is formatted with '%s-%s-%d-%d-%d' to build `stem`, so
#        the row must have exactly five fields, the last three accepted by %d;
#        row[0] is taken as `lang` and row[4] as `tid`;
#      - `getSgmDir(stem)` yields `sgm`, which is passed to `langid(sgm, lang)`;
#        if that raises RuntimeError, `score` becomes None and `err` holds the
#        exception message;
#      - `update_score(tid, score)` is called afterwards in every case, also
#        when `score` is None; a RuntimeError from it overwrites `err`.
#    `err` is assigned but not read within this line -- presumably consumed
#    by code that follows; verify.
#    The same `sql` is executed on every pass, so termination depends on the
#    result set becoming empty -- presumably as a side effect of
#    update_score(); TODO confirm, otherwise this loop never ends.
cur2.execute(sql, args) except: msg = "db error" raise RuntimeError(msg) while True: cur.execute(sql) if cur.rowcount == 0: break print for row in cur.fetchall(): stem = '%s-%s-%d-%d-%d' % row sgm = getSgmDir(stem) lang = row[0] tid = row[4] err = None try: score = langid(sgm, lang) except RuntimeError, e: score = None err = e.message try: update_score(tid, score) except RuntimeError, e: err = e.message
# NOTE(review): whitespace-collapsed Python 2 source. This line is the interior
# of a loop whose header lies before it (the `break` below needs an enclosing
# loop); nesting is inferred from statement order -- confirm against a
# properly formatted copy.
#
# Per pass: runs `db2.cur.execute(sql, offset)` and breaks out when
# `db2.cur.rowcount <= 0`. Every fetched row is unpacked as
# (lang, genre, site, grp, thr, errno), then:
#   - rows with any bit of mask 0x000A set in `errno` are skipped after
#     printing errno in hex. In Python `&` binds tighter than `!=`, so the
#     test reads as `(errno & 0x000A) != 0`;
#   - `stem` is the five fields joined with '-'; rows for which the path
#     returned by `mycurl.getHtmlDir(stem)` does not exist are skipped;
#   - `mycurl.createBaseDir(...)` is called on `mycurl.getSgmDir(stem)` before
#     the converter lookup, so it also runs for rows that are later skipped
#     for lack of a converter;
#   - the converter name starts as 'c' and gains '<site>', '-<grp>' and
#     '-<thr>' for each level present in `h` (the checks appear to be nested:
#     `h`, `h[site]`, `h[site][grp]`), i.e. the most specific name registered
#     in `h` is chosen; it is then joined onto SCRIPTBASE;
#   - rows whose converter path does not exist are reported with
#     "no converter for <stem>" and skipped.
# `offset` is not changed anywhere in the visible code -- presumably advanced
# elsewhere in the loop; verify. What is done with CONVERTER for rows that pass
# the final check is not visible on this line.
db2.cur.execute(sql, offset) if db2.cur.rowcount <= 0: break for row in db2.cur.fetchall(): lang, genre, site, grp, thr, errno = row if errno & 0x000A != 0: print "%x" % errno continue stem = "%s-%s-%s-%s-%s" % (lang,genre,site,grp,thr) html = mycurl.getHtmlDir(stem) if not os.path.exists(html): continue sgm = mycurl.getSgmDir(stem) mycurl.createBaseDir(sgm) CONVERTER = 'c' if site in h: CONVERTER += '%d' % site if grp in h[site]: CONVERTER += '-%d' % grp if thr in h[site][grp]: CONVERTER += '-%d' % thr CONVERTER = os.path.join(SCRIPTBASE, CONVERTER) if not os.path.exists(CONVERTER): print "no converter for %s" % stem continue