def get_newarticle_Id(uid_upwd, title, headers):
    """Ask liveinternet.ru's autosave endpoint for the id of a new post.

    Args:
        uid_upwd: Indexable credentials. ``uid_upwd[0]`` is sent as the
            ``bbuserid`` cookie value and as the journal id.
        title: Text sent as the ``headerofpost`` form field.
        headers: Request headers dict. It is updated in place with the
            Accept, Content-Type, Cookie, Origin and Referer entries.

    Returns:
        The id string captured from an ``OK<id>|`` response on success.
        ``-1`` when ``requestsW.post`` returns ``-1``.
        ``1`` when the response text contains ``NOAccess denied``.
        ``-2`` when no id can be extracted or any exception is raised
        (``g_var.ERR_CODE``/``ERR_MSG`` are set in the exception case).
    """
    try:
        journal_id = uid_upwd[0]
        headers['Accept'] = '*/*'
        headers['Content-Type'] = 'application/x-www-form-urlencoded'
        # NOTE(review): the value appended after 'bbpassword=' is masked in
        # the reviewed source; uid_upwd[1] is an assumption -- confirm.
        headers['Cookie'] = ('bbuserid=' + journal_id
                             + '; bbpassword=' + uid_upwd[1])
        headers['Origin'] = 'https://www.liveinternet.ru'
        headers['Referer'] = (
            'https://www.liveinternet.ru/journal_post.php?journalid='
            + journal_id)

        data = {
            'postid': '0',
            'journalid': journal_id,
            'headerofpost': title,
            'message': None,
            'tags': None,
        }
        url_id = 'https://www.liveinternet.ru/journal_autosave.php?doajax=1'
        response = requestsW.post(url_id, data=data, headers=headers)
        if response == -1:
            return -1
        if 'NOAccess denied' in response.text:
            return 1

        # Raw string: '\|' is not a valid escape in a plain string literal.
        blog_Id = re.findall(r'OK(.*?)\|', response.text)
        if not blog_Id:
            g_var.logger.info("获取新文章ID失败...")
            return -2
        return blog_Id[0]
    except Exception as e:
        g_var.logger.info(e)
        g_var.ERR_CODE = 5000
        g_var.ERR_MSG = "获取新文章ID出现异常..."
        g_var.logger.info("获取新文章ID出现异常...")
        return -2
def __register_one(self): g_var.logger.info("register。。。") # 获取authenticity_token、_csrf_token、_rapgenius_session值 authenticity_token, csrf_token, rapgenius_session = get_authenticity_token_signup( ) if authenticity_token == 0: return -1 elif authenticity_token == -1: return -2 # 获取headers headers = generate_headers(0, csrf_token, rapgenius_session) if headers == -1: g_var.logger.info("获取headers失败。。。") return -2 # 注册数据 registerData = generate_register_data(authenticity_token) url_register = 'https://genius.com/account' g_var.logger.info("提交注册中。。。") html = requestsW.post(url_register, proxies=ip_proxy("ch"), data=registerData, headers=headers, timeout=g_var.TIMEOUT, vpn='ch') if html == -1: return html # 注册成功验证 user_id_list = re.findall('CURRENT_USER = {"id":(.*?),"login":'******'_rapgenius_session=(.*?);', html.headers['Set-Cookie']) # 插入数据库 try: sql = "INSERT INTO genius_com(username, password, mail, user_id) VALUES('" + registerData['user[login]'] + \ "', '" + registerData['user[password]'] + "', '" + registerData['user[email]'] + "', '" + user_id_list[0] +"');" last_row_id = MysqlHandler().insert(sql) if last_row_id != -1: registerData["id"] = last_row_id registerData["user_id"] = user_id_list[0] registerData["name"] = registerData['user[login]'] registerData["rapgenius_session"] = session_list[0] return registerData else: g_var.ERR_CODE = 2004 g_var.ERR_MSG = "数据库插入用户注册数据失败..." g_var.logger.error("数据库插入用户注册数据失败...") return 0 except Exception as e: g_var.logger.info(e) g_var.ERR_CODE = 2004 g_var.ERR_MSG = "数据库插入用户注册数据出现异常..." g_var.logger.error("数据库插入用户注册数据出现异常...") return 0
def register() -> (str, str, str):
    """Submit a reddit.com sign-up form with random credentials.

    Generates a random user name and password, fetches the register page to
    obtain its cookies and ``csrf_token``, then posts the sign-up form and
    prints the outcome. The module-level ``headers`` dict is used for both
    requests.

    NOTE(review): the annotation promises a 3-tuple, but no value is
    returned on any path; confirm the intended contract before relying on
    the return value.
    """
    user = project_util.generate_random_string(12, 16)
    pwd = project_util.generate_random_string(10, 12)
    email = user + "@qq.com"

    # The original also built a requests session that was never used (and
    # never closed); it has been dropped.
    proxies = ip_proxy()
    res = requestsW.get(
        "https://www.reddit.com/register/?actionSource=header_signup",
        proxies=proxies,
        headers=headers,
        timeout=5)
    # requestsW signals a failed request with -1 elsewhere in this file.
    if res == -1:
        print("register page request failed")
        return
    cookies = res.cookies.get_dict()
    print(cookies)
    print("已经响应", res)

    re_res = re.search(
        r'<input type="hidden" name="csrf_token" value="(.*?)">', res.text)
    if re_res is None:
        # Page layout changed or a block page was served.
        print("csrf_token not found in register page")
        return
    csrf_token = re_res.group(1)

    print("正在打码中")
    # A fixed reCAPTCHA response is used here; the captcha() solver call was
    # disabled in the original code.
    g_recaptcha_response = "03AGdBq24tyZjh-Ini2ud5ISBy1Eb-UYEpSKYdgxsNNLLvMRQT4VXCVW4Z1EuXrtX4GwlERbjJkS1x9cJtcPbKmGYwzvqRfajGUvFyq9CEfRSzohkPv54Lnk1BlU3OHE8suDOSrKwc90uj7TPeTL12VUhdyCk-H73quiajTYNuwd3pJm1xdWbbo4JthN8N0hvMIrsdM7_XYAclp_BN9QTWkwmhjDTpR8-CM2zWJ48JKug-9KZzaVM-Bmxzb7LVr4NcG5XozTrhsIdbS89eLSo8aoS7V-frd8Hb6xFpBpvjtsCQMnE25FoR7FqPmL2ER0bNV7QgowFX6Z8OFZ95fDDTub5S9qCQUr7Zactpz57_W38T6opn4u4swVH_EcEGUpkT1IhUgy5GVVsBgvidVR3F0j7F5tfLQ2_GKg"
    print("打印验证码:", g_recaptcha_response)

    data = {
        "csrf_token": csrf_token,
        "g-recaptcha-response": g_recaptcha_response,
        "dest": "https://www.reddit.com",
        "password": pwd,
        "username": user,
        "email": email,
    }
    res = requestsW.post("https://www.reddit.com/register",
                         headers=headers,
                         proxies=proxies,
                         cookies=cookies,
                         data=data,
                         timeout=5)
    if res == -1:
        print("register request failed")
        return
    print(res.cookies)
    print("注册结果:", res.text)
def __register_one(self, present_website, email_info):
    """Register one wattpad.com account, confirm it by e-mail and store it.

    Args:
        present_website: Passed through to ``generate_register_data``.
        email_info: Mailbox information, passed to
            ``generate_register_data`` and ``get_verify_url``.

    Returns:
        The registration data dict, extended with ``"id"`` (inserted row id)
        and ``"token"`` (value of the ``token`` cookie), on success.
        ``0`` when the database insert reports ``-1``.
        ``-1`` when a ``requestsW`` call returns ``-1``.
        ``-2`` when headers or registration data cannot be produced, the
        sign-up response lacks the ``Hi @<username>`` marker, or no
        ``token`` cookie is present in the response.
        ``-3`` when no verification URL is found or the verification request
        does not answer with HTTP 200.
    """
    g_var.logger.info("register...")
    headers = generate_headers(0)
    if headers == -1:
        g_var.logger.info("获取注册headers失败...")
        return -2

    registerData = generate_register_data(present_website, email_info)
    g_var.logger.info(registerData)
    if registerData == -1:
        g_var.logger.info("未生成正确注册数据...")
        return -2

    url_register = 'https://www.wattpad.com/signup?nextUrl=/home'
    g_var.logger.info("提交注册中...")
    html = requestsW.post(url_register,
                          proxies=ip_proxy("en"),
                          data=registerData,
                          headers=headers,
                          timeout=g_var.TIMEOUT)
    if html == -1:
        return -1

    # The landing page greets the new user by name when sign-up succeeded.
    prove_info = 'Hi @' + registerData['username']
    if prove_info not in html.text:
        g_var.logger.info(html.text)
        g_var.logger.info("IP被封等原因...")
        return -2

    # Fail early when the token cookie is missing instead of raising
    # KeyError/IndexError (the latter previously only after the DB insert).
    token_list = re.findall('token=(.*?);',
                            html.headers.get('Set-Cookie', ''))
    if not token_list:
        g_var.logger.info("no token cookie in the sign-up response")
        return -2

    # The verification GET reuses the headers without the form-post fields.
    for form_only_header in ('Origin', 'Content-Type', 'Referer'):
        headers.pop(form_only_header, None)

    time.sleep(2)
    verify_url = get_verify_url(email_info)
    if verify_url == -1:
        g_var.logger.info("未读取到邮箱验证的url...")
        return -3

    g_var.logger.info("邮件的url正在验证中...")
    html = requestsW.get(url=verify_url,
                         proxies=ip_proxy("en"),
                         headers=headers,
                         timeout=g_var.TIMEOUT)
    if html == -1:
        return -1
    if html.status_code != 200:
        g_var.ERR_CODE = 3006
        g_var.ERR_MSG = "邮箱验证失败..."
        g_var.logger.error("邮箱验证失败!\n")
        return -3

    # NOTE(review): SQL is assembled by string concatenation; values that
    # contain quotes will break the statement. Parameterize if the
    # MysqlHandler API allows it.
    sql = "INSERT INTO wattpad_com(username, password, mail, status) VALUES('" + registerData['username'] + \
          "', '" + registerData['password'] + "', '" + registerData['email'] + "', '" + str(0) + "');"
    last_row_id = MysqlHandler().insert(sql)
    if last_row_id == -1:
        g_var.ERR_CODE = 2004
        g_var.ERR_MSG = "数据库插入用户注册数据失败..."
        g_var.logger.error("数据库插入用户注册数据失败...")
        return 0

    registerData["id"] = last_row_id
    registerData["token"] = token_list[0]
    return registerData
def __send_profile(self, userData):
    """Publish a title/link pair in the user's sbnation.com profile.

    Args:
        userData: Account dict; ``username`` and ``id`` are read here and
            the whole dict is passed to ``get_authenticity_token``.

    Returns:
        ``0`` on success (profile updated and the profile URL stored).
        ``1`` when the token lookup reports ``-2`` or when storing the URL
        in the database fails or raises.
        ``-1`` when headers, the token/session lookup or the title/link
        lookup report ``-1``, or when ``requestsW.post`` returns ``-1``.
        ``-2`` when the update request does not answer with HTTP 200.
    """
    g_var.logger.info('send profile......')
    headers = generate_headers(1)
    if headers == -1:
        return -1

    g_var.logger.info('authenticity_token, session_id...')
    authenticity_token, session_id = get_authenticity_token(userData)
    if authenticity_token == -1 or session_id == -1:
        return -1
    elif authenticity_token == -2 or session_id == -2:
        return 1

    profile_base = 'https://www.sbnation.com/users/' + userData['username']
    headers['Referer'] = profile_base + '/edit_profile'
    headers['Cookie'] = '_session_id=' + session_id

    titleLink = get_new_title_and_link()
    if titleLink == -1:
        return -1

    fields = {
        'utf8': '✓',
        '_method': 'patch',
        'authenticity_token': authenticity_token,
        'profile_image[filename]': ('', '', 'application/octet-stream'),
        'profile_image[filename_cache]': '',
        'network_membership[bio]': '',
        'network_membership[signature]': '',
        'network_membership[public_email]': '',
        'network_membership[website_name]': titleLink[0],
        'network_membership[website_url]': titleLink[1],
        # The original literal listed this key twice; a dict keeps one.
        'network_membership[facebook_page_url]': '',
    }
    # One key/value pair of form fields per league, in the form's order.
    league_names = (
        'MLB', 'NFL', 'NBA', 'NHL', 'NCAAF', 'NCAAB', 'MMA', 'Golf',
        'NASCAR', 'Boxing', 'Soccer', 'MLS', 'EPL',
        'Football League Championship', 'FIFA', 'Bundesliga', 'Serie A',
        'La Liga', 'Cycling', 'Tennis', 'General',
    )
    item_prefix = 'network_membership[network_membership_items_attributes]'
    for index, league in enumerate(league_names):
        fields['%s[%d][key]' % (item_prefix, index)] = league
        fields['%s[%d][value]' % (item_prefix, index)] = ''
    fields['commit'] = 'Update'

    multipart_encoder = MultipartEncoder(
        fields=fields,
        boundary='----WebKitFormBoundary' + generate_random_string(
            16, 16, 'abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ'),
    )
    headers['Content-Type'] = multipart_encoder.content_type

    g_var.logger.info("发布个人简介的链接...")
    url_link = profile_base + '/update_profile'
    html = requestsW.post(url_link,
                          proxies=ip_proxy("en"),
                          data=multipart_encoder,
                          headers=headers,
                          timeout=g_var.TIMEOUT)
    if html == -1:
        return html
    if html.status_code != 200:
        g_var.logger.info('链接发布失败。。。')
        g_var.logger.info(html.text)
        return -2

    try:
        url = profile_base
        sql = "INSERT INTO sbnation_com_article(url, user_id) VALUES('" + url + "', '" + str(
            userData["id"]) + "');"
        last_row_id = MysqlHandler().insert(sql)
        g_var.logger.info(last_row_id)
        if last_row_id != -1:
            g_var.logger.info('链接发送成功!' + userData['username'])
            return 0
        g_var.ERR_CODE = 2004
        g_var.ERR_MSG = "数据库插入用户注册数据失败..."
        g_var.logger.error("数据库插入用户注册数据失败...")
        return 1
    except Exception as e:
        g_var.logger.info(e)
        g_var.ERR_CODE = 2004
        g_var.ERR_MSG = "数据库插入用户注册数据异常..."
        g_var.logger.error("数据库插入用户注册数据异常...")
        return 1
def login(self, present_website, VPN, userData):
    """Log an account in through the Vox Media auth endpoint.

    Args:
        present_website: Not used by this method.
        VPN: Not used by this method.
        userData: Account dict; ``username`` and ``password`` are read, and
            on success ``cookie`` is set to the ``_session_id`` value taken
            from the response's ``Set-Cookie`` header.

    Returns:
        ``userData`` (updated in place with ``cookie``) on success.
        ``1`` when the response is not valid JSON, does not report
        ``logged_in`` as true, or carries no ``_session_id`` cookie.
        ``-1`` when headers cannot be generated or ``requestsW.post``
        returns ``-1``.
    """
    g_var.logger.info('login ......')
    headers = generate_headers(2)
    if headers == -1:
        return -1

    login_session_id = get_login_session_id()
    headers['Cookie'] = login_session_id

    login_data = {
        'username': userData['username'],
        'password': userData['password'],
        'remember_me': 'false',
        'g-recaptcha-response': '',
    }
    login_url = 'https://auth.voxmedia.com/chorus_auth/initiate_password_auth.json'
    g_var.logger.info('登录中 ......')
    html = requestsW.post(login_url,
                          proxies=ip_proxy("en"),
                          data=login_data,
                          headers=headers,
                          timeout=g_var.TIMEOUT)
    if html == -1:
        return html

    try:
        g_var.logger.info(html.text)
        res_data = json.loads(html.text)
    except Exception as e:
        g_var.logger.info(e)
        g_var.logger.info('登录失败,返回信息解析失败。。。')
        g_var.logger.info(html.text)
        return 1

    # A payload without a 'logged_in' key (or that is not an object at all)
    # is treated as a failed login rather than raising.
    logged_in = isinstance(res_data, dict) and res_data.get('logged_in')
    if not logged_in:
        g_var.logger.info('登录失败。。。')
        g_var.logger.info(html.text)
        return 1

    # A response without a Set-Cookie header yields no match -> failure.
    session_id_article = re.findall('_session_id=(.*?);',
                                    html.headers.get('Set-Cookie', ''))
    if not session_id_article:
        return 1

    userData['cookie'] = session_id_article[0]
    return userData
def __register_one(self, present_website):
    """Register one account with random credentials and store it.

    Args:
        present_website: Table name used in the INSERT statement.

    Returns:
        A dict with ``id`` (inserted row id), ``username`` and ``password``
        on success.
        ``0`` when the database insert reports ``-1`` or raises.
        ``-1`` when headers or the session id cannot be obtained (``-1``),
        or when ``requestsW.post`` returns ``-1``.
        ``-2`` when the session id lookup reports ``-2``, the captcha
        solver fails, the response is not valid JSON, or the response does
        not report ``success``.
    """
    g_var.logger.info('register......')
    headers = generate_headers(0)
    if headers == -1:
        return -1

    g_var.logger.info('session_id......')
    session_id = get_session_id()
    if session_id == -1:
        return -1
    elif session_id == -2:
        return -2

    googlekey = '6LefyhkTAAAAANpeEKwwgimNneiKWXRQtEqFZbat'
    captcha_value = google_captcha(
        "", googlekey,
        'https://auth.voxmedia.com/signup?return_to=https://www.sbnation.com/'
    )
    if captcha_value == -1:
        return -2
    headers['cookie'] = session_id

    username = generate_random_string(8, 12)
    password = generate_random_string(10, 14)
    community_id = random.randint(210, 299)
    g_var.logger.info('community_id.....')
    g_var.logger.info(community_id)
    email = username + '@hotmail.com'

    registerData = {
        'g-recaptcha-response': captcha_value,
        'user[username]': username,
        'user[password]': password,
        'user[email]': email,
        'user[newsletter]': 'false',
        'community_id': community_id,
    }
    g_var.logger.info('开始提交注册信息...')
    # NOTE(review): this URL literal appears masked in the reviewed source;
    # it is kept byte-for-byte -- confirm the real endpoint.
    url_login = '******'
    html = requestsW.post(url_login,
                          proxies=ip_proxy("en"),
                          data=registerData,
                          headers=headers,
                          timeout=g_var.TIMEOUT)
    if html == -1:
        return html

    try:
        g_var.logger.info(html.text)
        res_data = json.loads(html.text)
    except Exception as e:
        g_var.logger.info(e)
        g_var.logger.info('注册失败,返回信息解析失败。。。')
        g_var.logger.info(html.text)
        return -2

    # A payload without a 'success' key is a failed registration, not a
    # KeyError.
    succeeded = isinstance(res_data, dict) and res_data.get('success')
    if not succeeded:
        g_var.logger.info('注册失败。。。')
        g_var.logger.info(html.text)
        return -2

    try:
        sql = "INSERT INTO " + present_website + "(username, password, mail) VALUES('" + \
              username + "', '" + password + "', '" + email + "');"
        last_row_id = MysqlHandler().insert(sql)
        g_var.logger.info(last_row_id)
        if last_row_id != -1:
            g_var.logger.info('注册成功!' + username)
            userData = {
                'id': last_row_id,
                'username': username,
                'password': password,
            }
            return userData
        g_var.ERR_CODE = 2004
        g_var.ERR_MSG = "数据库插入用户注册数据失败..."
        g_var.logger.error("数据库插入用户注册数据失败...")
        return 0
    except Exception as e:
        g_var.logger.info(e)
        g_var.ERR_CODE = 2004
        g_var.ERR_MSG = "数据库插入用户注册数据异常..."
        g_var.logger.error("数据库插入用户注册数据异常...")
        return 0
def __register_one(self, Session, present_website: str, email_and_passwd): """ 注册一个账户 Args: Session:Session对象 present_website:当前网站名,用于数据库表名 email_and_passwd:邮箱账户和密码,email_and_passwd[0]是邮箱,[1]是密码 Returns: 注册成功返回注册数据字典对象registerData,需要包含user_id, username, password, email user_id这样获取:(示例) # 将注册的账户写入数据库(sql自己写,这边只是个示例) sql = "INSERT INTO "+present_website+"(username, password, mail, status) VALUES('" + name + \ "', '" + psd + "', '" + email_and_passwd[0] + "', '" + str(0) + "');" last_row_id = MysqlHandler().insert(sql) if last_row_id != -1: registerData["id"] = last_row_id return registerData else: g_var.logger.error("数据库插入用户注册数据失败") return 0 注册失败返回状态码 0:更换email 返回0 或其他错误,但是激活失败或插入数据库失败 -1:表示requests请求页面失败,需要更换代理 -2:注册失败,可能是邮箱密码不符合要求、或ip被封等原因,需要排查 """ user = project_util.generate_random_string(12, 16) pwd = project_util.generate_random_string(10, 12) email_list = email_and_passwd if email_list == -1: g_var.SPIDER_STATUS = 2 g_var.ERR_MSG = g_var.ERR_MSG + "|_|NO email" g_var.logger.info("NO email") return 0 verify_email = Session.get( "https://www.diigo.com/user_mana2/check_email?email=" + email_list[0], timeout=g_var.TIMEOUT, headers=self.headers, proxies=Session.proxies) # 验证邮箱是否可用 verify_user = Session.get( "https://www.diigo.com/user_mana2/check_name?username="******"1": g_var.SPIDER_STATUS = 2 g_var.ERR_MSG = g_var.ERR_MSG + "|_|账号密码或邮箱已经被注册" g_var.logger.info("账号密码或邮箱已经被注册") return 0 # time.sleep(3) google_captchas = google_captcha( "", "6Ld23sMSAAAAALfyXkI9d0nHmzOH9jZZNuh66nql", "https://www.diigo.com/sign-up?plan=free") if google_captchas == -1: g_var.SPIDER_STATUS = 2 g_var.ERR_MSG = g_var.ERR_MSG + "|_|谷歌打码失败" g_var.logger.info("谷歌打码失败") return -2 res = requestsW.get("https://www.diigo.com/", headers=self.headers, proxies=Session.proxies) # 打开首页 if res == -1: return res cookies = res.cookies.get_dict() i = 0 while i < g_var.ERR_COUNT: i += 1 try: Session.proxies = ip_proxy() res = requests.get("https://www.diigo.com/sign-up?plan=free", headers=self.headers, 
cookies=cookies, proxies=Session.proxies, verify=False) user_input = re.search('id="username" name="(\w{32})">', res.text) email_input = re.search('id=\'email\' name="(\w{32})">', res.text) pwd_input = re.search('id=\'password\' name="(\w{32})"', res.text) if not user_input and email_input and pwd_input: # TODO 获取不到参数 return "注册无法打开网页" else: user_input = user_input.group(1) email_input = email_input.group(1) pwd_input = pwd_input.group(1) data = { "plan": "free", "g-recaptcha-response": google_captchas, user_input: user, email_input: email_and_passwd[0], pwd_input: pwd, } self.headers["X-Requested-With"] = "XMLHttpRequest" self.headers[ "Referer"] = "https://www.diigo.com/sign-up?plan=free" self.headers[ "Content-Type"] = "application/x-www-form-urlencoded; charset=UTF-8" res = requests.post( "https://www.diigo.com/user_mana2/register_2", headers=self.headers, cookies=cookies, data=data, proxies=Session.proxies, verify=False) print(res.json()) if project_util.dictExistValue(res.json(), "status"): if res.json()["status"] == 1: cookies.update(res.cookies.get_dict()) savec = cookies res = requestsW.post( "https://www.diigo.com/user_mana2/resend_verify", cookies=cookies, headers=self.headers, data={"email": email_and_passwd[0]}, proxies=Session.proxies) print("重新发送邮箱:", res.text) emailinfo = EmailVerify( email_and_passwd[0], email_and_passwd[1], 'href="(https://www.diigo.com/user_mana2/register_verify/\w{32})"' ).execute_Start() print("这里是邮箱参数:", emailinfo) if emailinfo["data"] != -1: Session = requestsW.session() res = Session.get(emailinfo["data"], headers=self.headers, proxies=Session.proxies, cookies=cookies) sql = """INSERT INTO %s (username, password, mail, status, cookie) VALUES("%s", "%s", "%s", "%s", "%s");""" % ( "diigo_com", user, pwd, email_and_passwd[0], 0, savec) g_var.logger.info(sql) last_row_id = MysqlHandler().insert(sql) if last_row_id != -1: registerData = { "username": user, "password": pwd, "email": email_and_passwd[0], "cookie": savec, } 
registerData["id"] = int(last_row_id) return registerData return { "user": user, "pwd": pwd, "email": email_and_passwd[0], "cookies": Session.cookies.get_dict() } # if project_util.dictExistValue(res.cookies.get_dict(),"diigoandlogincookie"): # 注册成功并登陆cookie # saveCookie = str(Session.cookies.get_dict()) # # print({"user": user, "pwd": pwd, "email": email_and_passwd[0], "cookies": saveCookie}) # return {"user": user, "pwd": pwd, "email": email_and_passwd[0], "cookies": saveCookie} elif res.json()["status"] == -2: if "captcha error" in res.json()["status"]: g_var.SPIDER_STATUS = 2 g_var.ERR_MSG = g_var.ERR_MSG + "|_|谷歌打码失败" g_var.logger.info("谷歌打码失败") return -2 return -2 except Exception as e: res = requestsW.get("https://www.diigo.com/", headers=self.headers, proxies=Session.proxies, verify=False) # 打开首页 cookies = res.cookies.get_dict() g_var.logger.info(e) g_var.logger.info("正在换ip", e) return 0
def __postMessage(self, Session, loginData: dict, present_website):
    """Save one bookmark on diigo.com and record it in the article table.

    Args:
        Session: Session object; its ``cookies`` attribute is overwritten
            with the stored cookie text.
        loginData: Account dict; ``cookie``, ``username`` and ``id`` are
            read.
        present_website: Prefix of the ``<present_website>_article`` table.

    Returns:
        ``0`` when the bookmark was saved and the row inserted.
        ``-1`` when no title/link is available, ``requestsW.post`` returns
        ``-1``, the response has no ``items`` value, or the insert reports
        ``-1``.
        ``-4`` when ``loginData["cookie"]`` is empty.
    """
    cookie_text = loginData["cookie"]
    if not cookie_text:
        # Without a stored cookie the request cannot be authenticated (and
        # evaluating an empty string below would raise).
        return -4
    # NOTE(review): this assigns the raw stored text to Session.cookies, as
    # the original did; Session is not used for the request below.
    Session.cookies = cookie_text

    title_link = get_new_title_and_link()
    if title_link == -1:
        return -1
    postUrl = title_link[1]
    users = loginData["username"]

    self.headers[
        "Content-Type"] = "application/x-www-form-urlencoded; charset=UTF-8"
    self.headers["Referer"] = "https://www.diigo.com/user/t3wjogvjklzwh3zi"
    self.headers["Origin"] = "https://www.diigo.com"
    self.headers["X-Requested-With"] = "XMLHttpRequest"

    data = {
        "title": title_link[0],
        "tags": title_link[0],
        "description": title_link[0],
        "unread": False,
        "private": False,
        "url": postUrl,
        "lists": "",
        "groups": "",
    }
    # SECURITY(review): eval() runs whatever text is stored in the cookie
    # column. If that text is always the str() of a plain dict,
    # ast.literal_eval is a safe replacement -- confirm and switch.
    request_cookies = eval(cookie_text)
    res = requestsW.post("https://www.diigo.com/item/save/bookmark",
                         cookies=request_cookies,
                         headers=self.headers,
                         data=data)
    if res == -1:
        return res
    g_var.logger.info(res.text)
    g_var.logger.info(loginData)

    if not project_util.dictExistValue(res.json(), "items"):
        return -1

    res_url = "https://www.diigo.com/user/" + users
    sql = "INSERT INTO %s_article(url, keyword, user_id) VALUES('%s', '%s', '%s');" % (
        present_website, res_url, title_link[0], loginData["id"])
    if g_var.insert_article_lock.acquire():
        # Release on every path; the early return on a failed insert used
        # to leave the lock held.
        try:
            last_row_id = MysqlHandler().insert(sql)
        finally:
            g_var.insert_article_lock.release()
        if last_row_id == -1:
            return -1
    return 0
def register_one(Session=None) -> dict: MysqlHandler().startDB() if Session == None: Session = requests.session() Session.proxies = ip_proxy() res = requestsW.get("https://www.diigo.com/", headers=headers, proxies=ip_proxy(), verify=False) #打开首页 cookies = res.cookies.get_dict() print("这里是cookies", cookies) str_cookies = str(res.cookies.get_dict()) cookies = eval(str_cookies) user = project_util.generate_random_string(12, 16) pwd = project_util.generate_random_string(10, 12) email_and_passwd = get_email("https://www.diigo.com") if email_and_passwd == -1: return "NO email" else: print("这里是邮箱", email_and_passwd) verify_user = requestsW.get( "https://www.diigo.com/user_mana2/check_name?username="******"https://www.diigo.com/user_mana2/check_email?email=" + email_and_passwd[0], cookies=cookies, headers=headers, proxies=Session.proxies, verify=False) #验证邮箱是否可用 if not verify_user.text == verify_email.text == "1": print("错误") return "账号密码或邮箱已经被注册" # time.sleep(3) google_captchas = google_captcha( "", "6Ld23sMSAAAAALfyXkI9d0nHmzOH9jZZNuh66nql", "https://www.diigo.com/sign-up?plan=free") # google_captchas ="google_captchas" if google_captchas == -1: return "谷歌打码失败" # requestsW.get("https://www.diigo.com/interact_api/load_user_premium_info",headers=headers,cookies=cookies,proxies=Session.proxies,verify=False)#必须访问 i = 0 while i < 20: try: Session.proxies = ip_proxy() res = requests.get("https://www.diigo.com/sign-up?plan=free", headers=headers, cookies=cookies, proxies=Session.proxies, verify=False) user_input = re.search('id="username" name="(\w{32})">', res.text) email_input = re.search('id=\'email\' name="(\w{32})">', res.text) pwd_input = re.search('id=\'password\' name="(\w{32})"', res.text) if not user_input and email_input and pwd_input: # TODO 获取不到参数 return "注册无法打开网页" else: user_input = user_input.group(1) email_input = email_input.group(1) pwd_input = pwd_input.group(1) data = { "plan": "free", "g-recaptcha-response": google_captchas, user_input: user, email_input: 
email_and_passwd[0], pwd_input: pwd, } headers["X-Requested-With"] = "XMLHttpRequest" headers["Referer"] = "https://www.diigo.com/sign-up?plan=free" headers[ "Content-Type"] = "application/x-www-form-urlencoded; charset=UTF-8" print("准备提交") print(cookies) res = requests.post("https://www.diigo.com/user_mana2/register_2", headers=headers, cookies=cookies, data=data, proxies=Session.proxies, verify=False) print(res.json()) if project_util.dictExistValue(res.json(), "status"): if res.json()["status"] == 1: cookies.update(res.cookies.get_dict()) savec = cookies res = requestsW.post( "https://www.diigo.com/user_mana2/resend_verify", cookies=cookies, headers=headers, data={"email": email_and_passwd[0]}, proxies=Session.proxies) print("重新发送邮箱:", res.text) emailinfo = MyEmail( email_and_passwd[0], email_and_passwd[1], 'href="(https://www.diigo.com/user_mana2/register_verify/\w{32})"' ).execute_Start() print("这里是邮箱参数:", emailinfo) if emailinfo["data"] != -1: Session = requestsW.session() res = Session.get(emailinfo["data"], headers=headers, proxies=Session.proxies, cookies=cookies) sql = """INSERT INTO %s (username, password, mail, status, cookie) VALUES("%s", "%s", "%s", "%s", "%s");""" % ( "diigo_com", user, pwd, email_and_passwd[0], 0, savec) g_var.logger.info(sql) last_row_id = MysqlHandler().insert(sql) if last_row_id != -1: registerData = { "username": user, "password": pwd, "email": email_and_passwd[0], } registerData["user_id"] = last_row_id return registerData return { "user": user, "pwd": pwd, "email": email_and_passwd[0], "cookies": Session.cookies.get_dict() } # if project_util.dictExistValue(res.cookies.get_dict(),"diigoandlogincookie"): # 注册成功并登陆cookie # saveCookie = str(Session.cookies.get_dict()) # # print({"user": user, "pwd": pwd, "email": email_and_passwd[0], "cookies": saveCookie}) # return {"user": user, "pwd": pwd, "email": email_and_passwd[0], "cookies": saveCookie} return "res:" + res.text except (ConnectTimeout, ReadTimeout, ConnectionError) as e: 
res = requestsW.get("https://www.diigo.com/", headers=headers, proxies=Session.proxies, verify=False) # 打开首页 cookies = res.cookies.get_dict() i += 1 print(e) print("正在换ip", e)
def __postMessage(self, loginData, present_website, googlekey):
    """Publish one article through editor.ex.co and record its URL.

    Args:
        loginData: Account dict; ``cookie``, ``id`` and ``firstName`` are
            read here and the dict is passed to
            ``generate_post_article_data``.
        present_website: Table whose ``cookie`` column is cleared when the
            token is rejected.
        googlekey: reCAPTCHA site key handed to ``google_captcha``.

    Returns:
        ``0`` when the article was published and stored.
        ``1`` when clearing a rejected cookie in the database fails.
        ``-1`` when the cookie is empty, headers or article content are
        unavailable, ``requestsW.post`` returns ``-1``, or the response
        carries no item id.
        ``-2`` when the captcha solver fails.
        ``-3`` when storing the article row fails or raises.
        ``-4`` when the token was rejected and the stored cookie cleared.
    """
    g_var.logger.info('post article......')
    item_id = str(uuid.uuid4())
    sections_id = str(uuid.uuid4())

    g_var.logger.info('正在获取headers。。。')
    # Check the cookie before building headers from it.
    if loginData['cookie'] == "":
        g_var.logger.info("获取headers失败...")
        return -1
    headers = generate_headers(2, loginData['cookie'], item_id)
    if headers == -1:
        g_var.logger.info("获取headers失败...")
        return -1

    captcha_url = 'https://app.ex.co/create/new/preview'
    captcha_value = google_captcha('', googlekey, captcha_url)
    if captcha_value == -1:
        return -2

    title, ops = get_article()
    if title == -1 or ops == -1:
        g_var.logger.info("未能获取对应文章格式内容...")
        return -1

    article_data = generate_post_article_data(loginData, item_id,
                                              sections_id, captcha_value,
                                              title, ops)
    g_var.logger.info("文章发送中...")
    url = 'https://editor.ex.co/item/publish'
    res = requestsW.post(url,
                         proxies=ip_proxy("en"),
                         json=article_data,
                         headers=headers,
                         timeout=g_var.TIMEOUT)
    if res == -1:
        return res

    # The service answers with exactly this body when the token is rejected.
    cookie_prove = '401 - "Failed to authenticate token"'
    if cookie_prove == res.text:
        g_var.logger.info('cookie 失效 ......')
        # Drop the stale cookie so the next run logs in again.
        sql = "UPDATE " + present_website + " SET cookie='' WHERE id=" + str(
            loginData['id']) + ";"
        status = MysqlHandler().update(sql)
        if status == 0:
            g_var.logger.info("cookie失效,清除cookie update OK")
            return -4
        g_var.logger.error("数据库清除cookie错误!")
        return 1

    # Raw string: '\{' is not a valid escape in a plain string literal.
    res_article = re.findall(r'"item":\{"id":"(.*?)","tags"', res.text)
    if not res_article:
        g_var.ERR_CODE = 5000
        g_var.ERR_MSG = "文章发送失败,IP异常等原因..."
        g_var.logger.info('文章发送失败,IP异常等原因...')
        return -1

    try:
        url = 'https://app.ex.co/stories/item/' + item_id
        # NOTE(review): the title is concatenated into the SQL text; a title
        # containing a quote breaks the statement. Parameterize if the
        # MysqlHandler API allows it.
        sql = "INSERT INTO playbuzz_com_article(url, keyword, user_id) VALUES('" + url + "', '" + title + "', '" + str(
            loginData["id"]) + "');"
        last_row_id = MysqlHandler().insert(sql)
        g_var.logger.info(last_row_id)
        if last_row_id != -1:
            g_var.logger.info('文章成功!' + loginData['firstName'])
            return 0
        g_var.ERR_CODE = 2004
        g_var.ERR_MSG = "数据库插入用户注册数据失败..."
        g_var.logger.error("数据库插入用户注册数据失败...")
        return -3
    except Exception as e:
        g_var.logger.info(e)
        g_var.ERR_CODE = 2004
        g_var.ERR_MSG = "数据库插入用户注册数据异常..."
        g_var.logger.error("数据库插入用户注册数据异常...")
        return -3
def __login(self, present_website, VPN, userInfo, googlekey):
    """Return login data for an account, logging in only when needed.

    When ``userInfo[5]`` already holds a cookie, it is reused and no request
    is made. Otherwise the account is logged in with e-mail and password,
    and the returned access token is stored in the ``cookie`` column.

    Args:
        present_website: Table updated with the new cookie.
        VPN: Not used by this method.
        userInfo: Indexable account row; indices 0 (id), 1 (first name),
            2 (password), 3 (e-mail), 5 (cookie) and 6 (user id) are read.
        googlekey: reCAPTCHA site key handed to ``google_captcha``.

    Returns:
        A dict with ``id``, ``firstName``, ``password``, ``cookie`` and
        ``userId`` on success.
        ``0`` when storing the cookie in the database fails or raises.
        ``-1`` when headers cannot be generated or ``requestsW.post``
        returns ``-1``.
        ``-2`` when the captcha solver fails, the response does not report
        success, or it carries no access token.
    """
    stored_cookie = userInfo[5]
    if stored_cookie is not None and stored_cookie != "":
        g_var.logger.info('login, cookie....')
        return {
            'id': userInfo[0],
            'firstName': userInfo[1],
            'password': userInfo[2],
            'cookie': stored_cookie,
            'userId': userInfo[6],
        }

    g_var.logger.info('login, no cookie....')
    # NOTE(review): this URL literal appears masked in the reviewed source;
    # it is kept byte-for-byte -- confirm the real endpoint.
    url_login = '******'
    headers = generate_headers(0)
    # Check for the failure sentinel before treating the result as a dict;
    # the original assigned the Referer first and raised TypeError on -1.
    if headers == -1:
        g_var.logger.info("获取headers失败...")
        return -1
    headers['Referer'] = 'https://login.ex.co/login'

    captcha_value = google_captcha('', googlekey, url_login)
    if captcha_value == -1:
        return -2

    loginData = {
        "email": userInfo[3],
        "password": userInfo[2],
        "loginType": "Email",
        "captchaResponse": captcha_value,
    }
    g_var.logger.info("登录中...")
    html = requestsW.post(url_login,
                          proxies=ip_proxy("en"),
                          json=loginData,
                          headers=headers,
                          timeout=g_var.TIMEOUT)
    if html == -1:
        return html
    if '"response":"success"' not in html.text:
        g_var.logger.info('登录失败。。。')
        g_var.logger.info(html.text)
        return -2

    token_matches = re.findall('"accessToken":"(.*?)"}', html.text)
    if not token_matches:
        # Success marker present but no token: report failure instead of
        # raising IndexError.
        g_var.logger.info('登录失败。。。')
        g_var.logger.info(html.text)
        return -2
    accessToken = token_matches[0]

    try:
        # Persist the token so later runs can skip the login request.
        sql = "UPDATE " + present_website + " SET cookie='" + accessToken + "' WHERE id=" + str(
            userInfo[0]) + ";"
        status = MysqlHandler().update(sql)
        if status == 0:
            g_var.logger.info("update cookie OK")
        else:
            g_var.ERR_CODE = 2004
            g_var.ERR_MSG = "数据库更新cookie错误..."
            g_var.logger.error("数据库更新cookie错误...")
            return 0
    except Exception as e:
        g_var.logger.info(e)
        g_var.ERR_CODE = 2004
        g_var.ERR_MSG = "数据库更新cookie异常..."
        g_var.logger.error("数据库更新cookie异常...")
        return 0

    return {
        'id': userInfo[0],
        'firstName': userInfo[1],
        'password': userInfo[2],
        'cookie': accessToken,
        'userId': userInfo[6],
    }
def __register_one(self, present_website, email_info, googlekey):
    """Register one account in two steps and store it in the database.

    Step one posts the generated registration data (with a captcha answer) to
    the signup endpoint and extracts ``accessToken`` and ``UserId`` from the
    response. Step two posts company details to the additional-data endpoint
    using headers built from that token. The account is then inserted into
    the ``present_website`` table.

    Args:
        present_website: Table name interpolated into the INSERT statement.
        email_info: Indexable mailbox record; index 0 is stored as ``mail``
            and the whole object is forwarded to ``generate_register_data``.
        googlekey: Site key forwarded to ``google_captcha``.

    Returns:
        On success the ``registerData`` dict extended with ``id`` (inserted
        row id), ``cookie`` (access token) and ``userId``. On failure an int:
            -1: ``generate_headers`` or ``requestsW.post`` returned -1.
            -2: the captcha failed, a step was rejected by the site, or the
                token / user id could not be extracted from the response.
             0: the database insert reported an error or raised.
    """
    url_register_one = 'https://login.ex.co/api/signup'

    headers = generate_headers(0)
    # Test the failure sentinel before mutating the result: -1 is an int and
    # item assignment on it would raise TypeError instead of returning -1.
    if headers == -1:
        g_var.logger.info("获取headers失败...")
        return -1
    headers['Referer'] = 'https://login.ex.co/signup'

    captcha_value = google_captcha("", googlekey, url_register_one)
    if captcha_value == -1:
        return -2

    registerData = generate_register_data(email_info, captcha_value)
    g_var.logger.info("提交注册中...")
    html = requestsW.post(url_register_one, proxies=ip_proxy("en"),
                          json=registerData, headers=headers,
                          timeout=g_var.TIMEOUT)
    if html == -1:
        return html
    if '"success":true' not in html.text:
        g_var.logger.info('注册失败。。。')
        g_var.logger.info(html.text)
        return -2

    tokens = re.findall('accessToken":"(.*?)"}}', html.text)
    user_ids = re.findall('"UserId":"(.*?)",', html.text)
    if not tokens or not user_ids:
        # The response claimed success but lacks the fields needed for step
        # two; report it instead of raising IndexError.
        g_var.logger.info("accessToken or UserId not found in signup response")
        g_var.logger.info(html.text)
        return -2
    accessToken = tokens[0]
    userId = user_ids[0]

    # Step two uses a different header set derived from the new token.
    headers = generate_headers(1, accessToken)
    if headers == -1:
        g_var.logger.info("获取第二步注册验证的headers失败...")
        return -1

    company = generate_random_string(10, 12)
    data = {
        "company": company,
        "industryType": 'Freelancer',
        "companySize": "",
        "userIntent": "",
    }
    url_register_two = 'https://login.ex.co/api/additional-data'
    g_var.logger.info("第二步提交注册中...")
    html = requestsW.post(url_register_two, proxies=ip_proxy("en"), json=data,
                          headers=headers, timeout=g_var.TIMEOUT)
    if html == -1:
        return html
    if html.text != '{"success":true}':
        g_var.logger.info('第二步注册失败。。。')
        g_var.logger.info(html.text)
        return -2

    # Store the new account.
    try:
        # NOTE(review): the statement is built by string concatenation from
        # server-supplied values; switch to a parameterized query if
        # MysqlHandler supports one.
        sql = "INSERT INTO " + present_website + \
            "(username, password, mail, cookie, userId) VALUES('" + \
            registerData['firstName'] + "', '" + registerData['password'] + \
            "', '" + email_info[0] + "', '" + accessToken + "', '" + \
            str(userId) + "');"
        last_row_id = MysqlHandler().insert(sql)
        g_var.logger.info(last_row_id)
        if last_row_id != -1:
            g_var.logger.info('注册成功!' + registerData['firstName'])
            registerData["id"] = last_row_id
            registerData["cookie"] = accessToken
            registerData["userId"] = str(userId)
            return registerData
        g_var.ERR_CODE = 2004
        g_var.ERR_MSG = "数据库插入用户注册数据失败..."
        g_var.logger.error("数据库插入用户注册数据失败...")
        return 0
    except Exception as e:
        g_var.logger.info(e)
        g_var.ERR_CODE = 2004
        g_var.ERR_MSG = "数据库插入用户注册数据异常..."
        g_var.logger.error("数据库插入用户注册数据异常...")
        return 0
def __postMessage(self, userData, present_website):
    """Publish one article for a logged-in user and record its URL.

    The method fetches an article and its encoded content, obtains the
    posting token and an autosave post id, submits the multipart post form,
    then reads the user's blog page to find the URL of the new post and
    inserts it into ``liveinternet_ru_article``.

    Args:
        userData: Dict with at least ``id``, ``username`` and ``cookie``.
            ``cookie`` is split on ``'|_|'``; the first part is used as the
            ``bbuserid`` / journal id.
        present_website: Not used by this method.

    Returns:
        ``'ok'`` on success. On failure an int:
             1: ``get_newarticle_Id`` returned 1.
             0: the site did not confirm the post, the new post URL was not
                found on the blog page, or the database insert failed/raised.
            -1: headers, token, autosave id or an HTTP request returned -1.
            -2: article, content, token or autosave id lookup returned its
                soft-failure code.
    """
    g_var.logger.info("post article ...")
    headers = generate_headers(0)
    if headers == -1:
        g_var.logger.info("获取headers失败...")
        return -1

    g_var.logger.info("article ...")
    article = get_new_article()
    if article == -1:
        return -2
    content = get_code_content(article[1])
    if content == -2:
        return -2

    g_var.logger.info("postarticle_tok ...")
    uid_upwd = userData['cookie'].split('|_|')
    postarticle_tok = get_postarticle_tok(uid_upwd[0])
    if postarticle_tok == -1:
        return -1
    elif postarticle_tok == -2:
        return -2

    g_var.logger.info("new_article_Id ...")
    new_article_Id = get_newarticle_Id(uid_upwd, article[0], headers)
    if new_article_Id == -1:
        return -1
    elif new_article_Id == -2:
        return -2
    elif new_article_Id == 1:
        return 1

    headers['Origin'] = 'https://www.liveinternet.ru'
    headers['Referer'] = \
        'https://www.liveinternet.ru/journal_post.php?journalid=' + uid_upwd[0]
    # NOTE(review): the text between "bbpassword=" and the first form field
    # was masked in the reviewed copy. The cookie tail and the
    # MultipartEncoder opener below are restored from the later uses of
    # `multipart_encoder` and the "uid|_|password" cookie layout - confirm
    # against the original file.
    headers['Cookie'] = 'bbuserid=' + uid_upwd[0] + '; bbpassword=' + uid_upwd[1]
    multipart_encoder = MultipartEncoder(
        fields={
            'action': 'newpost',
            'parsing': '',
            'journalid': uid_upwd[0],
            'backurl': '',
            'selectforum': '/journal_post.php?journalid=' + uid_upwd[0],
            'headerofpost': article[0],
            'mode': str(0),
            'status': 'Use these controls to insert vBcode',
            'LiNewPostForm': content,  # article body
            'tags': article[-1],  # tags
            'uploader_count': str(0),
            'music': '',
            'mood': '',
            'attachfile1': ("", '', 'application/octet-stream'),
            'MAX_FILE_SIZE': '',
            'nocomment': str(0),
            'commentsubscribe': 'yes',
            'parseurl': 'yes',
            'autosave_postid': new_article_Id,  # id from the autosave call
            'close_level': str(0),
            'tok': postarticle_tok,
        },
        boundary='------WebKitFormBoundary' + generate_random_string(
            16, 16, 'abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ'),
    )
    # The encoder's content type carries the boundary chosen above.
    headers['Content-Type'] = multipart_encoder.content_type

    g_var.logger.info("正在发布文章 ...")
    url_article = 'https://www.liveinternet.ru/journal_addpost.php'
    html = requestsW.post(url_article, proxies=ip_proxy("en"),
                          data=multipart_encoder, headers=headers)
    if html == -1:
        return -1

    # The site answers with this sentence when the post was accepted.
    prove = 'Вы добавили сообщение в Ваш дневник'
    if prove not in html.text:
        g_var.ERR_CODE = 5000
        g_var.ERR_MSG = "文章发送失败,IP异常等原因..."
        g_var.logger.info('文章发送失败,IP异常等原因...')
        return 0

    del headers['Origin']
    headers['Accept'] = 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.9'
    g_var.logger.info("正在获取新文章id ...")
    url_new_article = 'https://www.liveinternet.ru/users/' + \
        userData['username'] + '/blog/'
    res = requestsW.get(url_new_article, proxies=ip_proxy("en"),
                        headers=headers)
    if res == -1:
        return -1

    article_url = re.search(
        'https://www.liveinternet.ru/users/' + userData['username'].lower() +
        '/post(.*?)/', res.text)
    if not article_url:
        # The original had this message as a bare expression, so the failure
        # was silent; it is now actually logged.
        g_var.logger.info('获取新发布文章url失败。。。')
        return 0

    try:
        new_article_url = article_url.group()
        # NOTE(review): the statement is built by string concatenation;
        # switch to a parameterized query if MysqlHandler supports one.
        sql = "INSERT INTO liveinternet_ru_article(url, keyword, user_id) VALUES('" + \
            new_article_url + "', '" + article[0] + "', '" + \
            str(userData["id"]) + "');"
        last_row_id = MysqlHandler().insert(sql)
        g_var.logger.info(last_row_id)
        if last_row_id != -1:
            g_var.logger.info('文章成功!' + userData['username'])
            return 'ok'
        g_var.ERR_CODE = 2004
        g_var.ERR_MSG = "数据库插入用户注册数据失败..."
        g_var.logger.error("数据库插入用户注册数据失败...")
        return 0
    except Exception as e:
        g_var.logger.info(e)
        g_var.ERR_CODE = 2004
        g_var.ERR_MSG = "数据库插入用户注册数据异常..."
        g_var.logger.error("数据库插入用户注册数据异常...")
        return 0
def login(self, present_website, VPN, userInfo):
    """Return login data for a user, logging in only when no cookie is stored.

    When ``userInfo[5]`` is non-empty it is returned as the cookie without
    any request. Otherwise the username and password are posted to the login
    endpoint, ``bbuserid`` and ``bbpassword`` are read from the ``Set-Cookie``
    response header, joined as ``"<bbuserid>|_|<bbpassword>"`` and written to
    the ``cookie`` column of the ``present_website`` table.

    Args:
        present_website: Table name interpolated into the UPDATE statement.
        VPN: Not used by this method.
        userInfo: Indexable user record. Indexes read here: 0 (row id),
            1 (username), 2 (password) and 5 (cookie).

    Returns:
        On success a dict with the keys ``id``, ``username``, ``password``
        and ``cookie``. On failure:
             1: the response carried no ``Set-Cookie`` header.
             0: parsing the cookie or updating the database failed/raised.
            the value returned by ``requestsW.post`` when it equals -1.
    """
    g_var.logger.info("login ...")

    stored_cookie = userInfo[5]
    if stored_cookie != None and stored_cookie != "":
        # A stored cookie short-circuits the whole login round trip.
        g_var.logger.info("返回cookie" + stored_cookie)
        return {
            'id': userInfo[0],
            'username': userInfo[1],
            'password': userInfo[2],
            'cookie': stored_cookie,
        }

    # No cookie stored: log in with username and password.
    url_login = '******'
    form = {
        's': '',
        'url': 'https://www.liveinternet.ru/journal_register.php',
        'action': 'login',
        'username': userInfo[1],
        'password': userInfo[2],
    }
    g_var.logger.info("登录中...")
    html = requestsW.post(
        url_login,
        proxies=ip_proxy("en"),
        data=form,
        allow_redirects=False,
        timeout=g_var.TIMEOUT,
    )
    if html == -1:
        return html

    if not html.headers.get('Set-Cookie', None):
        g_var.logger.info('登陆失败......')
        return 1

    try:
        raw_cookie = html.headers['Set-Cookie']
        uid_matches = re.findall('bbuserid=(.*?);', raw_cookie)
        pwd_matches = re.findall('bbpassword=(.*?);', raw_cookie)
        cookie = uid_matches[0] + '|_|' + pwd_matches[0]

        # Persist the cookie so the next call can skip the login request.
        sql = "".join((
            "UPDATE ", present_website,
            " SET cookie='", cookie,
            "' WHERE id=", str(userInfo[0]), ";",
        ))
        status = MysqlHandler().update(sql)
        if status != 0:
            g_var.ERR_CODE = 2004
            g_var.ERR_MSG = "数据库更新cookie错误..."
            g_var.logger.error("数据库更新cookie错误...")
            return 0
        g_var.logger.info("update cookie OK")
    except Exception as e:
        g_var.logger.info(e)
        g_var.ERR_CODE = 2004
        g_var.ERR_MSG = "数据库更新cookie异常..."
        g_var.logger.error("数据库更新cookie异常...")
        return 0

    return {
        'id': userInfo[0],
        'username': userInfo[1],
        'password': userInfo[2],
        'cookie': cookie,
    }
def __register_one(self, present_website, email_and_passwd):
    """Register one account, confirm it by email and store it in the database.

    Step one posts the registration form (with a page token and a captcha
    answer) and is treated as successful when the email address appears
    exactly twice in the response. Step two reads the verification URL from
    the mailbox, fetches its token, solves a second captcha and submits the
    profile form; the ``Set-Cookie`` header of that response provides the
    ``bbuserid`` / ``bbpassword`` pair stored as the account cookie.

    Args:
        present_website: Table name interpolated into the INSERT statement.
        email_and_passwd: Indexable mailbox record; index 0 is the email
            address. The whole object is forwarded to
            ``generate_register_data`` and ``get_verify_url``.

    Returns:
        On success a dict with the keys ``id`` (inserted row id),
        ``username``, ``password`` and ``cookie``. On failure an int:
            -1: headers, page token or an HTTP request returned -1.
            -2: the page token lookup returned -2, the first captcha failed,
                or step one was not confirmed by the response.
             0: any failure in the email-verification step, or the database
                insert failed/raised.
    """
    g_var.logger.info('register......')
    url = 'http://www.liveinternet.ru/journal_register.php'
    headers = generate_headers(0)
    if headers == -1:
        g_var.logger.info("获取headers失败...")
        return -1

    tok = get_tok(url, headers)
    if tok == -1:
        return -1
    elif tok == -2:
        return -2

    googlekey = '6Lcl3BYUAAAAAG1gTAOhNtJIeTrPn68melrC1gbV'
    captcha_value = google_captcha("", googlekey, url)
    if captcha_value == -1:
        return -2

    registerData = generate_register_data(email_and_passwd, captcha_value, tok)
    headers['Origin'] = 'http://www.liveinternet.ru'
    headers['Referer'] = 'http://www.liveinternet.ru/journal_register.php'
    headers['Content-Type'] = 'application/x-www-form-urlencoded'
    g_var.logger.info("提交注册中...")
    html = requestsW.post(url, proxies=ip_proxy("en"), data=registerData,
                          headers=headers, timeout=g_var.TIMEOUT)
    if html == -1:
        return html

    # Step-one check: the address must occur exactly twice in the response.
    # The address is escaped because it is data, not a pattern - "." and "+"
    # are regex metacharacters and would otherwise distort the count.
    result = re.findall(re.escape(email_and_passwd[0]), html.text)
    if len(result) != 2:
        g_var.logger.info("第一步注册失败...")
        g_var.logger.info(html.status_code)
        return -2

    # Email verification.
    time.sleep(2)
    verify_url = get_verify_url(email_and_passwd)
    if verify_url == 0:
        g_var.logger.info("未读取到邮箱验证的url...")
        return 0

    # Token for the verification form; both failure codes map to 0 here.
    email_tok = get_tok_email(verify_url)
    if email_tok in (-1, -2):
        return 0

    id_matches = re.findall('id=(.*?)&', verify_url)
    h_matches = re.findall('h=(.*)', verify_url)
    if not id_matches or not h_matches:
        # A verification URL without both parameters cannot be submitted;
        # fail like the other verification errors instead of raising.
        g_var.logger.info("verification url is missing the id/h parameters")
        return 0
    verify_id = id_matches[0]
    verify_h = h_matches[0]

    headers['Referer'] = verify_url
    captcha_value = google_captcha("", googlekey, verify_url)
    if captcha_value == -1:
        return 0

    username = generate_random_string(
        10, 12, "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ")
    day = str(random.randint(1, 28))
    month = str(random.randint(1, 12))
    year = str(random.randint(1980, 2010))
    sex = ['M', 'W']
    multipart_encoder = MultipartEncoder(
        fields={
            'username': username,
            'comm': '0',
            'sexchar': random.choice(sex),
            'day': day,
            'month': month,
            'year': year,
            'city': '1870',
            'icq': '',
            'emails': '',
            'addinfo': username,
            'avatarfile': ('', '', 'application/octet-stream'),
            'g-recaptcha-response': captcha_value,
            'dailynews': '1',
            'Submit.x': '80',
            'Submit.y': '20',
            'familyname': '',
            'firstname': '',
            'password': registerData['password1'],
            'email': email_and_passwd[0],
            'passwordconfirm': registerData['password1'],
            'imagehash': '',
            'regkey': '',
            'invite_id': '0',
            'regkeynb': '',
            'url_redirect': '',
            'url2': '',
            'action': 'add_step1',
            'h': verify_h,
            'id': verify_id,
            'tok': email_tok,
        },
        boundary='----WebKitFormBoundary' + generate_random_string(
            16, 16, 'abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ'),
    )
    # The encoder's content type carries the boundary chosen above.
    headers['Content-Type'] = multipart_encoder.content_type

    g_var.logger.info("注册第二步,邮箱验证提交信息中...")
    url_email_prove = 'http://www.liveinternet.ru/journal_register.php'
    html = requestsW.post(url_email_prove, proxies=ip_proxy("en"),
                          data=multipart_encoder, headers=headers,
                          allow_redirects=False, timeout=g_var.TIMEOUT)
    if html == -1:
        return html
    if not html.headers.get('Set-Cookie', None):
        g_var.logger.info('第二步邮箱验证信息提交失败...')
        return 0

    # Store the new account.
    try:
        set_cookie = html.headers['Set-Cookie']
        user_Id = re.findall('bbuserid=(.*?);', set_cookie)
        user_password = re.findall('bbpassword=(.*?);', set_cookie)
        cookie = user_Id[0] + '|_|' + user_password[0]
        # NOTE(review): the statement is built by string concatenation;
        # switch to a parameterized query if MysqlHandler supports one.
        sql = "INSERT INTO " + present_website + \
            "(username, password, mail, cookie) VALUES('" + \
            username + "', '" + registerData['password1'] + "', '" + \
            email_and_passwd[0] + "', '" + cookie + "');"
        last_row_id = MysqlHandler().insert(sql)
        g_var.logger.info(last_row_id)
        if last_row_id != -1:
            g_var.logger.info('注册成功!' + username)
            return {
                'id': last_row_id,
                'username': username,
                'password': registerData['password1'],
                'cookie': cookie,
            }
        g_var.ERR_CODE = 2004
        g_var.ERR_MSG = "数据库插入用户注册数据失败..."
        g_var.logger.error("数据库插入用户注册数据失败...")
        return 0
    except Exception as e:
        g_var.logger.info(e)
        g_var.ERR_CODE = 2004
        g_var.ERR_MSG = "数据库插入用户注册数据异常..."
        g_var.logger.error("数据库插入用户注册数据异常...")
        return 0