def _fetch_valid_user(uid):
    """Fetch and parse the profile page for *uid* until it parses as valid.

    Each attempt prints a progress line, builds a fresh ``User`` and
    downloads the page.  When ``http_get`` returns ``None`` the attempt is
    repeated after a 10 second pause; when the parsed user is not valid,
    ``login()`` is called and the attempt is repeated.

    NOTE(review): there is no upper bound on retries, so a uid that never
    yields a valid user keeps this loop running forever -- confirm whether
    that is intended.
    """
    url = 'http://mac.pcbeta.com/space-uid-%s.html' % uid
    while True:
        print('processing uid#%s' % uid)
        user = User()
        html = http_get(url)
        if html is None:
            time.sleep(10)
            continue
        user.parse(html)
        if user.is_valid():
            return user
        # Not valid: call login() and try the same uid again.
        login()


def get_user_info(save_file, uid_list, start):
    """Append one line per user in *uid_list* to *save_file*.

    Args:
        save_file: path of the output file, opened in append mode.
        uid_list: sequence of uid strings to process, in order.
        start: ``-1`` to process every uid.  Otherwise every entry up to
            and including the one equal to ``str(start)`` is skipped and
            processing resumes with the entry after it; if no entry
            matches, nothing is processed.

    Both files are closed even when fetching or parsing raises.
    """
    resume_marker = str(start)
    resumed = (start == -1)
    # 'log' is never written to here; it is still opened so the file keeps
    # being created exactly as before.
    with open(save_file, 'a') as out, open('log', 'a'):
        for uid in uid_list:
            if not resumed:
                # The marker entry itself is skipped, not processed.
                resumed = (uid == resume_marker)
                continue
            user = _fetch_valid_user(uid)
            out.write(str(user) + '\n')
            print('write to file')
def get_all_uid(start_page, end_page=7754):
    """Append the uids found on member-list pages to the file ``uid``.

    Pages ``start_page`` .. ``end_page - 1`` are fetched in order.  For each
    page the uids are written on one line, each followed by a single space.
    Scraping stops early as soon as a page cannot be fetched (``http_get``
    returns ``None``) or yields no uids.

    Args:
        start_page: first page number to fetch.
        end_page: page number to stop before; defaults to the previously
            hard-coded limit of 7754.

    The output file is closed on every exit path, including the early
    returns and any exception.
    """
    url_template = ('http://mac.pcbeta.com/member.php?action=list&listgid='
                    '&srchmem=&order=uid&type=&page=%s')
    with open('uid', 'a') as out:
        for page in range(start_page, end_page):
            print('getting uid from page %s' % page)
            html = http_get(url_template % page)
            if html is None:
                return
            uid_list = get_uid_list(html)
            if not uid_list:
                return
            print(uid_list)
            # One write per page; the trailing space after every uid is
            # kept so the file format stays unchanged.
            out.write(''.join(str(uid) + ' ' for uid in uid_list) + '\n')
            print('write to file')
self.info[k] = 'None' print self.info except Exception, e: print 'exception: %s' % str(e) def parse_from_str(self, s): # too sb............................. keys = [ 'username', 'qq', 'aliww', 'uid', 'birth', 'yahoo', 'site', 'pc', 'ichat', 'taobao', 'interest', 'device', 'home', 'icq', 'sex', 'os' ] if not len(s) == len(keys): print 'invalid string' else: for i in range(len(s)): self.info[keys[i]] = s[i] def __str__(self): s = '' for k in self.info.keys(): s += self.info[k] + ', ' return s if __name__ == '__main__': user = User() login.login() html = http_utils.http_get('http://mac.pcbeta.com/space-uid-2570038.html') user.parse(html) print str(user)
if len(m) > 0 and len(m[0]) > 0: self.info[k] = m[0] else: self.info[k] = 'None' print self.info except Exception, e: print 'exception: %s' % str(e) def parse_from_str(self, s): # too sb............................. keys = ['username', 'qq', 'aliww', 'uid', 'birth', 'yahoo', 'site', 'pc', 'ichat', 'taobao', 'interest', 'device', 'home', 'icq', 'sex', 'os'] if not len(s) == len(keys): print 'invalid string' else: for i in range(len(s)): self.info[keys[i]] = s[i] def __str__(self): s = '' for k in self.info.keys(): s += self.info[k] + ', ' return s if __name__ == '__main__': user = User() login.login() html = http_utils.http_get('http://mac.pcbeta.com/space-uid-2570038.html') user.parse(html) print str(user)