Пример #1
0
    def registers(self, present_website, VPN):
        """Register accounts until the assigned quota is met or a fatal error occurs.

        Each outer iteration obtains a session from ``get_Session(VPN)`` and a
        mailbox from ``get_email(present_website)``, then calls
        ``__register_one`` up to ``g_var.RETRY_COUNT_MAX`` times, requesting a
        new proxy from ``ip_proxy(VPN)`` after every failed attempt.

        Args:
            present_website: Site identifier forwarded to ``get_email`` and
                ``__register_one``.
            VPN: Proxy selector forwarded to ``get_Session`` and ``ip_proxy``.

        Returns:
            None. Progress is recorded on ``self.success_count``,
            ``self.failed_count`` and ``self.proxy_err_count``; when every
            retry of one registration fails, ``g_var.SPIDER_STATUS`` is set to
            3 and ``g_var.ERR_MSG`` is filled in.
        """
        while self.success_count < self.assignment_num:
            # Check the current error state on every iteration.
            if self.__monitor_status() == -1:
                break
            self.now_count = self.now_count + 1

            Session = get_Session(VPN)
            if Session == -1:
                self.failed_count = self.failed_count + 1
                continue

            # Fetch a mailbox for this registration.
            email_and_passwd = get_email(present_website)
            if email_and_passwd == -1:
                self.failed_count = self.failed_count + 1
                continue

            retry_count = 0
            while retry_count < g_var.RETRY_COUNT_MAX:
                retry_count = retry_count + 1
                registerData = self.__register_one(Session, present_website,
                                                   email_and_passwd)
                if registerData == -1 or registerData == -2:
                    # Both failure codes are handled the same way (count the
                    # error, rotate the proxy); only the log line differs.
                    if registerData == -1:
                        g_var.logger.info("代理错误")
                    else:
                        g_var.logger.info("注册失败,可能是邮箱密码不符合要求、或ip被封等原因,请排查!")
                    self.proxy_err_count = self.proxy_err_count + 1
                    proxies = ip_proxy(VPN)
                    if proxies == {"error": -1}:
                        g_var.logger.info("获取代理错误")
                        self.failed_count = self.failed_count + 1
                    else:
                        # Never install the error sentinel as the session's
                        # proxy mapping; keep the previous proxies instead.
                        Session.proxies = proxies
                elif registerData == 0:
                    # Registered, but activation failed.
                    g_var.logger.info("注册成功,但激活失败!")
                    break
                else:
                    # Registered successfully.
                    self.success_count = self.success_count + 1
                    self.failed_count = 0
                    self.proxy_err_count = 0
                    break
                time.sleep(g_var.SLEEP_TIME)
            else:
                # Reached only when the retry loop ran out without a `break`,
                # i.e. every attempt failed. Comparing retry_count with the
                # maximum would also fire when the last attempt succeeded.
                g_var.SPIDER_STATUS = 3
                g_var.ERR_MSG = "连续注册出错,程序停止"
                g_var.logger.error("连续注册失败!程序停止")
                break

        g_var.logger.info("g_var.SPIDER_STATUS" + str(g_var.SPIDER_STATUS))
        g_var.logger.info("本线程共成功注册'self.success_count'=" +
                          str(self.success_count) + "个账户")
def get_authenticity_token_signup():
    """Fetch the tokens needed to submit the genius.com sign-up form.

    Requests ``https://genius.com/signup`` and extracts the form's
    ``authenticity_token`` from the page body, plus the ``_csrf_token`` and
    ``_rapgenius_session`` values from the JSON-serialised response headers.

    Returns:
        A 3-tuple ``(authenticity_token, csrf_token, rapgenius_session)`` on
        success; ``(0, 0, 0)`` when ``requestsW.get`` returns ``-1``;
        ``(-1, -1, -1)`` when any value cannot be extracted or an exception
        is raised.
    """
    try:
        url = 'https://genius.com/signup'
        res = requestsW.get(url,
                            proxies=ip_proxy('ch'),
                            timeout=g_var.TIMEOUT,
                            vpn='ch')
        if res == -1:
            return 0, 0, 0
        token_list = re.findall(
            'name="authenticity_token" type="hidden" value="(.*?)" /></div>',
            res.text)
        res_headers = json.dumps(dict(res.headers))
        csrf_token_list = re.findall('_csrf_token=(.*?);', res_headers)
        session_list = re.findall('_rapgenius_session=(.*?);', res_headers)
        if not token_list or not csrf_token_list or not session_list:
            g_var.ERR_CODE = "2001"
            g_var.ERR_MSG = g_var.ERR_MSG + "|_|" + "获取注册authenticity_token值或_csrf_token值或_rapgenius_session值失败。。。"
            g_var.logger.info(
                '获取注册authenticity_token值或_csrf_token值或_rapgenius_session值失败。。。'
            )
            return -1, -1, -1
        return token_list[0], csrf_token_list[0], session_list[0]
    except Exception as e:
        # `except Exception` (not a bare `except:`) lets KeyboardInterrupt and
        # SystemExit propagate; the cause is logged instead of being dropped.
        g_var.logger.info(e)
        g_var.logger.info("访问注册页失败。。。")
        return -1, -1, -1
def get_authenticity_token(userData):
    """Fetch the edit-profile form token and a fresh session id from sbnation.com.

    Args:
        userData: Mapping read for the keys ``'username'`` and ``'cookie'``.

    Returns:
        ``(authenticity_token, session_id)`` on success; ``(-1, -1)`` when
        ``requestsW.get`` returns ``-1``; ``(-2, -2)`` when either value is
        missing from the response or any exception is raised.
    """
    try:
        profile_url = 'https://www.sbnation.com/users/' + userData['username']
        request_headers = {
            'Host': 'www.sbnation.com',
            'User-Agent':
            'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/81.0.4044.122 Safari/537.36',
            'Accept':
            'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.9',
            'Referer': profile_url,
            'Cookie': '_session_id=' + userData['cookie'],
        }
        res = requestsW.get(profile_url + '/edit_profile',
                            proxies=ip_proxy("en"),
                            headers=request_headers)
        if res == -1:
            return -1, -1

        # The form token is embedded in the page body.
        tokens = re.findall('name="authenticity_token" value="(.*?)" />',
                            res.text)
        if not tokens:
            g_var.logger.info('获取修改个人网址的authenticity_token失败。。。')
            return -2, -2

        # The session id comes from the Set-Cookie response header.
        session_ids = re.findall('_session_id=(.*?);',
                                 res.headers['Set-Cookie'])
        if not session_ids:
            g_var.logger.info('获取修改个人网址的session_id失败。。。')
            return -2, -2

        return tokens[0], session_ids[0]
    except Exception as e:
        g_var.logger.info(e)
        g_var.ERR_CODE = 5000
        g_var.ERR_MSG = "获取authenticity_token出现异常..."
        g_var.logger.info("获取authenticity_token出现异常...")
        return -2, -2
def get_session_id():
    """Request the Vox Media sign-up page and return its first Set-Cookie segment.

    Returns:
        The text before the first ``;`` of the ``Set-Cookie`` header on
        success; the ``-1`` result of ``requestsW.get`` when the request
        fails; ``-2`` when the header is empty or an exception is raised.
    """
    signup_url = 'https://auth.voxmedia.com/signup?return_to=https://www.sbnation.com/'
    try:
        request_headers = {
            'accept':
            'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.9',
            'user-agent':
            'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/81.0.4044.113 Safari/537.36',
        }
        res = requestsW.get(signup_url,
                            proxies=ip_proxy("en"),
                            headers=request_headers,
                            timeout=g_var.TIMEOUT)
        if res == -1:
            return res

        raw_cookie = res.headers['Set-Cookie']
        if not raw_cookie:
            g_var.logger.info('获取session_id值失败。。。')
            return -2

        cookie_parts = raw_cookie.split(';')
        # str.split with a separator always yields at least one element, so
        # this guard is defensive only; it is kept to mirror the original flow.
        if not cookie_parts:
            g_var.logger.info('获取_session_id值失败。。。')
            return -2
        return cookie_parts[0]
    except Exception as e:
        g_var.logger.info(e)
        g_var.ERR_CODE = 5000
        g_var.ERR_MSG = "获取session_id出现异常..."
        g_var.logger.info("获取session_id出现异常...")
        return -2
    def __register_one(self):
        # Register one genius.com account and store it in the genius_com table.
        #
        # Return values visible in this block:
        #   -1  get_authenticity_token_signup() reported 0, or the POST
        #       returned -1 (the -1 result is returned as-is)
        #   -2  get_authenticity_token_signup() reported -1, or
        #       generate_headers() returned -1
        #    0  the database insert returned -1 or raised
        #   registerData (dict) on success, extended with the keys "id",
        #       "user_id", "name" and "rapgenius_session"
        g_var.logger.info("register。。。")
        # Fetch the authenticity_token, _csrf_token and _rapgenius_session values.
        authenticity_token, csrf_token, rapgenius_session = get_authenticity_token_signup(
        )
        if authenticity_token == 0:
            return -1
        elif authenticity_token == -1:
            return -2
        # Build the request headers.
        headers = generate_headers(0, csrf_token, rapgenius_session)
        if headers == -1:
            g_var.logger.info("获取headers失败。。。")
            return -2

        # Registration form data.
        registerData = generate_register_data(authenticity_token)
        url_register = 'https://genius.com/account'
        g_var.logger.info("提交注册中。。。")
        html = requestsW.post(url_register,
                              proxies=ip_proxy("ch"),
                              data=registerData,
                              headers=headers,
                              timeout=g_var.TIMEOUT,
                              vpn='ch')
        if html == -1:
            return html

        # Verify that the registration succeeded.
        # NOTE(review): the next statement looks corrupted/redacted in this
        # copy ('******' is spliced into the middle of the expression); it
        # presumably was two re.findall calls producing user_id_list and
        # session_list. session_list is used below but never visibly assigned
        # - restore from the original source before relying on this method.
        user_id_list = re.findall('CURRENT_USER = {"id":(.*?),"login":'******'_rapgenius_session=(.*?);',
                                  html.headers['Set-Cookie'])
        # Insert the new account into the database.
        # NOTE(review): the SQL is built by string concatenation; values are
        # not escaped here.
        try:
            sql = "INSERT INTO genius_com(username, password, mail, user_id) VALUES('" + registerData['user[login]'] + \
                  "', '" + registerData['user[password]'] + "', '" + registerData['user[email]'] + "', '" + user_id_list[0] +"');"
            last_row_id = MysqlHandler().insert(sql)
            if last_row_id != -1:
                registerData["id"] = last_row_id
                registerData["user_id"] = user_id_list[0]
                registerData["name"] = registerData['user[login]']
                registerData["rapgenius_session"] = session_list[0]
                return registerData
            else:
                g_var.ERR_CODE = 2004
                g_var.ERR_MSG = "数据库插入用户注册数据失败..."
                g_var.logger.error("数据库插入用户注册数据失败...")
                return 0
        except Exception as e:
            # Also reached when user_id_list is empty (IndexError on [0]).
            g_var.logger.info(e)
            g_var.ERR_CODE = 2004
            g_var.ERR_MSG = "数据库插入用户注册数据出现异常..."
            g_var.logger.error("数据库插入用户注册数据出现异常...")
            return 0
Пример #6
0
    def registers(self, present_website: str, VPN: str):
        """Register accounts until the assigned quota is met or retries run out.

        Each outer iteration builds a fresh ``requests.Session`` with a proxy
        from ``ip_proxy(VPN)`` and calls ``__register_one`` up to
        ``g_var.RETRY_COUNT_MAX`` times, rotating the proxy after each failure.

        Args:
            present_website: Site identifier forwarded to ``__register_one``.
            VPN: Proxy selector forwarded to ``ip_proxy``.

        Returns:
            None. Progress is recorded on ``self.success_count`` and
            ``self.failed_count``; when every retry fails,
            ``g_var.SPIDER_STATUS`` is set to 3 and ``g_var.ERR_MSG`` is set.
        """
        while self.success_count < self.assignment_num:
            # Check the current error state on every iteration.
            if self.__monitor_status() == -1:
                break
            self.now_count = self.now_count + 1

            Session = requests.Session()
            # Obtain the proxy settings.
            proxies = ip_proxy(VPN)
            if proxies == {"error": -1}:
                self.failed_count = self.failed_count + 1
                continue
            self.failed_count = 0
            # NOTE(review): here the ip_proxy result is wrapped per scheme,
            # while the retry path below assigns it directly - confirm which
            # shape ip_proxy actually returns.
            Session.proxies = {
                "http": proxies,
                "https": proxies,
            }
            # Limit transport-level retries to one.
            Session.mount('http://', HTTPAdapter(max_retries=1))
            Session.mount('https://', HTTPAdapter(max_retries=1))

            retry_count = 0
            while retry_count < g_var.RETRY_COUNT_MAX:
                retry_count = retry_count + 1
                registerData = self.__register_one(Session, present_website)
                if registerData != -1:
                    # Anything other than -1 means the registration succeeded.
                    self.success_count = self.success_count + 1
                    self.failed_count = 0
                    break
                self.failed_count = self.failed_count + 1
                proxies = ip_proxy(VPN)
                Session.proxies = proxies
                time.sleep(g_var.SLEEP_TIME)
            else:
                # Runs only when the retry loop finished without a `break`,
                # i.e. every attempt failed. Comparing retry_count with the
                # maximum would also stop the spider when the final attempt
                # succeeded.
                g_var.SPIDER_STATUS = 3
                g_var.ERR_MSG = "连续注册出错,程序停止"
                g_var.logger.error("register:连续注册失败!程序停止")
                break

        g_var.logger.info("g_var.SPIDER_STATUS" + str(g_var.SPIDER_STATUS))
        g_var.logger.info("本线程共成功注册'self.success_count'=" + str(self.success_count) + "个账户")
Пример #7
0
    def __login(self, VPN, userInfo):
        """Log in with username and password and return the data needed to post.

        Args:
            VPN: Proxy selector forwarded to ``ip_proxy`` after a failed request.
            userInfo: Indexable user record; index 0 is used as the row id,
                index 1 as the username and index 2 as the password.

        Returns:
            A dict with the keys ``'id'``, ``'username'`` and ``'token'`` on
            success; ``1`` when the response status is not 200 (the row is
            flagged ``status=1`` in ``wattpad_com``); ``-1`` when headers cannot
            be generated, every attempt raised, or the response carries no
            token cookie.
        """
        user_id = userInfo[0]
        loginData = {
            'username': userInfo[1],
            'password': userInfo[2],
        }
        url_login = '******'

        # NOTE(review): `Session` is not a parameter of this method and is not
        # assigned in it; it must resolve from an outer scope - confirm.
        retry_count = 0
        while retry_count < g_var.RETRY_COUNT_MAX:
            retry_count = retry_count + 1
            try:
                g_var.logger.info("使用账号密码登录...")
                headers = generate_headers(0)
                if headers == -1:
                    return -1
                html = Session.post(url_login,
                                    headers=headers,
                                    data=loginData,
                                    timeout=g_var.TIMEOUT)
                self.proxy_err_count = 0
                break
            except Exception:
                # `except Exception` instead of a bare `except:` so that
                # KeyboardInterrupt / SystemExit are not swallowed.
                g_var.logger.error("账号密码登录超时")
                self.proxy_err_count = self.proxy_err_count + 1
                time.sleep(g_var.SLEEP_TIME)
                proxies = ip_proxy(VPN)
                Session.proxies = proxies
        else:
            # Runs only when no attempt reached `break`. Comparing
            # retry_count with the maximum would also reject a login that
            # succeeded on the final attempt.
            g_var.SPIDER_STATUS = 3
            g_var.logger.error("连续登录失败!程序停止")
            return -1

        if html.status_code != 200:
            # Login failed: flag the account as abnormal in the database.
            sql = "UPDATE wattpad_com SET status=1 WHERE id=" + str(
                user_id) + ";"
            MysqlHandler().update(sql)
            return 1  # Abnormal account; the caller picks another one.

        # A missing Set-Cookie header or token is reported as a login error
        # instead of raising KeyError / IndexError.
        token_list = re.findall('token=(.*?);',
                                html.headers.get('Set-Cookie', ''))
        if not token_list:
            g_var.logger.error("登录响应中未获取到token")
            return -1

        # On success, hand the token and username to the posting step.
        loginSuccessData = {
            'id': user_id,
            'username': loginData['username'],
            'token': token_list[0],
        }
        return loginSuccessData
    def __postMessage(self, loginData):
        """Publish a link on the user's genius.com profile and record it.

        Args:
            loginData: Mapping read for the keys ``'user_id'``, ``'name'`` and
                ``'id'``; it is also forwarded to ``generate_headers``.

        Returns:
            ``loginData`` on success; ``-1`` when headers or link data cannot
            be obtained, or when ``requestsW.put`` returns ``-1``; ``0`` when
            the response status is not 200 or the database insert returns -1.
        """
        # Build the request headers.
        headers = generate_headers(2, loginData=loginData)
        if headers == -1:
            g_var.logger.info("获取headers失败。。。")
            return -1

        data = generate_new_link_data()
        g_var.logger.info(data)
        if data == -1:
            # No link available: signal the spider to stop.
            g_var.SPIDER_STATUS = 3
            return -1

        url_postLink = 'https://genius.com/api/users/' + str(
            loginData['user_id']) + '?text_format=html,markdown'
        g_var.logger.info("发送链接中...")
        res = requestsW.put(url_postLink,
                            proxies=ip_proxy("ch"),
                            headers=headers,
                            json=data,
                            timeout=g_var.TIMEOUT,
                            vpn='ch')
        if res == -1:
            return res

        if res.status_code != 200:
            g_var.logger.error("链接发送失败!" + str(res.status_code))
            g_var.ERR_CODE = 5000
            g_var.ERR_MSG = g_var.ERR_MSG + "|_|" + "链接发送失败,未知错误!"
            return 0

        g_var.logger.info("链接发送成功!" + loginData["name"])
        # Store the profile URL and the user id in the article table.
        url = 'https://genius.com/' + loginData["name"]
        sql = "INSERT INTO genius_com_article(url, user_id) VALUES('" + url + "', '" + str(
            loginData['id']) + "');"
        # Hold the lock through a context manager so it is released even when
        # the insert raises; the manual acquire/release pair leaked it.
        with g_var.insert_article_lock:
            last_row_id = MysqlHandler().insert(sql)
        if last_row_id == -1:
            g_var.logger.error("数据库插入连接数据错误!")
            return 0
        g_var.logger.info("insert article OK")
        return loginData
Пример #9
0
def get_tok_email(url):
    """Fetch ``url`` and return the hidden ``tok`` form value found in the page.

    Args:
        url: Address of the e-mail verification page to request.

    Returns:
        The first ``tok`` value found; the ``-1`` result of ``requestsW.get``
        when the request fails; ``-2`` when no ``tok`` is present or an
        exception is raised.
    """
    tok_pattern = '<input type=hidden name=tok value=(.*?) /></form>'
    try:
        res = requestsW.get(url, proxies=ip_proxy("en"), timeout=g_var.TIMEOUT)
        if res == -1:
            return res
        matches = re.findall(tok_pattern, res.text)
        if matches:
            return matches[0]
        g_var.logger.info("未获取到邮箱验证的tok...")
        return -2
    except Exception as e:
        g_var.logger.info(e)
        g_var.ERR_CODE = 5000
        g_var.ERR_MSG = "获取邮箱验证的tok出现异常..."
        g_var.logger.info("获取邮箱验证的tok出现异常...")
        return -2
Пример #10
0
    def __postMessage(self, loginData):
        """Set the website link on the user's wattpad.com profile and record it.

        Args:
            loginData: Mapping read for the keys ``'username'`` and ``'id'``;
                it is also forwarded to ``generate_headers``.

        Returns:
            The ``{'website': link}`` payload on success; ``-1`` when headers
            or a link cannot be obtained, or when ``requestsW.put`` returns
            ``-1``; ``0`` when the response status is not 200 or the database
            insert returns -1.
        """
        headers = generate_headers(1, loginData)
        if headers == -1:
            return -1
        link = get_new_link()
        if link == -1:
            # No link available: signal the spider to stop.
            g_var.SPIDER_STATUS = 3
            return -1

        url_putLink = 'https://www.wattpad.com/api/v3/users/' + loginData[
            'username']
        linkData = {
            'website': link,
        }
        g_var.logger.info("发送链接中...")
        html = requestsW.put(url_putLink,
                             proxies=ip_proxy("en"),
                             headers=headers,
                             json=linkData,
                             timeout=g_var.TIMEOUT)
        if html == -1:
            return html

        if html.status_code != 200:
            # status_code is an int; it must be converted before being
            # concatenated, otherwise this error path raises TypeError.
            g_var.logger.error("链接发送失败!\n" + str(html.status_code))
            g_var.ERR_CODE = 5000
            g_var.ERR_MSG = g_var.ERR_MSG + "|_|" + "链接发送失败,未知错误!"
            return 0

        g_var.logger.info("链接发送成功!" + loginData["username"])
        url = 'https://www.wattpad.com/user/' + loginData["username"]
        # Store the profile URL and the user id in wattpad_com_article.
        sql = "INSERT INTO wattpad_com_article(url, user_id) VALUES('" + url + "', '" + str(
            loginData['id']) + "');"
        # Hold the lock through a context manager so it is released even when
        # the insert raises.
        with g_var.insert_article_lock:
            last_row_id = MysqlHandler().insert(sql)
        if last_row_id == -1:
            g_var.logger.error("数据库插入链接错误!")
            return 0
        g_var.logger.info("insert article OK")
        return linkData
Пример #11
0
def get_postarticle_tok(uid):
    """Fetch the liveinternet.ru post page and return its hidden ``tok`` value.

    Args:
        uid: Journal id appended to the post-page URL by string concatenation.

    Returns:
        The first ``tok`` value found; ``-1`` when ``requestsW.get`` returns
        ``-1``; ``-2`` when no ``tok`` is present or an exception is raised.
    """
    tok_pattern = '<input type=hidden name=tok value=(.*?) /></form>'
    try:
        post_page = 'https://www.liveinternet.ru/journal_post.php?journalid=' + uid
        response = requestsW.get(post_page, proxies=ip_proxy("en"))
        if response == -1:
            return -1
        matches = re.findall(tok_pattern, response.text)
        if matches:
            return matches[0]
        g_var.logger.info("未获取到文章发布页tok...")
        return -2
    except Exception as e:
        g_var.logger.info(e)
        g_var.ERR_CODE = 5000
        g_var.ERR_MSG = "获取文章发布页tok出现异常..."
        g_var.logger.info("获取文章发布页tok出现异常...")
        return -2
    def registers(self, present_website, VPN):
        """Register accounts until the assigned quota is met or retries run out.

        Each outer iteration obtains a session from ``get_Session(VPN)`` and
        calls ``__register_one`` up to ``g_var.RETRY_COUNT_MAX`` times,
        rotating the proxy through ``ip_proxy(VPN)`` after each failure.

        Args:
            present_website: Not used in this method body.
            VPN: Proxy selector forwarded to ``get_Session`` and ``ip_proxy``.

        Returns:
            None. Progress is recorded on ``self.success_count`` and
            ``self.failed_count``; when every retry fails,
            ``g_var.SPIDER_STATUS`` is set to 3 and ``g_var.ERR_MSG`` is set.
        """
        while self.success_count < self.assignment_num:
            # Check the current error state on every iteration.
            if self.__monitor_status() == -1:
                break
            self.now_count = self.now_count + 1

            # Create the session object.
            Session = get_Session(VPN)
            if Session == -1:
                self.failed_count = self.failed_count + 1
                continue

            retry_count = 0
            while retry_count < g_var.RETRY_COUNT_MAX:
                retry_count = retry_count + 1
                registerData = self.__register_one(Session)
                if registerData != -1:
                    # Anything other than -1 means the registration succeeded.
                    self.success_count = self.success_count + 1
                    self.failed_count = 0
                    break
                g_var.logger.info("更换代理...")
                self.failed_count = self.failed_count + 1
                proxies = ip_proxy(VPN)
                Session.proxies = proxies
                time.sleep(g_var.SLEEP_TIME)
            else:
                # Runs only when the retry loop finished without a `break`,
                # i.e. every attempt failed. Comparing retry_count with the
                # maximum would also stop the spider when the final attempt
                # succeeded.
                g_var.SPIDER_STATUS = 3
                g_var.ERR_MSG = "连续注册出错,程序停止"
                g_var.logger.error("register:连续注册失败!程序停止")
                break

        g_var.logger.info("g_var.SPIDER_STATUS" + str(g_var.SPIDER_STATUS))
        g_var.logger.info("本线程共成功注册'self.success_count'=" +
                          str(self.success_count) + "个账户")
    def loginAndPostMessage(self, present_website, VPN):
        """Log in with stored accounts and post links until the quota is met.

        Each outer iteration runs three stages - log in, fetch personal data,
        post the link - and retries each one up to ``g_var.RETRY_COUNT_MAX``
        times. When a stage exhausts its retries, ``g_var.SPIDER_STATUS`` is
        set to 3 and the method stops.

        Args:
            present_website: Site identifier forwarded to
                ``generate_login_data``.
            VPN: Proxy selector forwarded to ``get_Session``, ``__login`` and
                ``ip_proxy``.

        Returns:
            ``{"error": -1}`` when ``generate_login_data`` returns ``None``;
            otherwise ``None`` once the loop ends.
        """
        while self.success_count < self.assignment_num:
            # Check the current error state on every iteration.
            if self.__monitor_status() == -1:
                break
            self.now_count = self.now_count + 1

            Session = get_Session(VPN)
            if Session == -1:
                self.failed_count = self.failed_count + 1
                continue

            userInfo = generate_login_data(present_website)
            if userInfo is None:
                g_var.logger.error("数据库中获取用户失败,本线程停止!")
                return {"error": -1}

            # 1. Log in.
            retry_count = 0
            login_signal = 0
            while retry_count < g_var.RETRY_COUNT_MAX:
                retry_count = retry_count + 1
                loginData = self.__login(Session, VPN, userInfo)
                if loginData == -1:
                    # Login error: rotate the proxy and retry.
                    g_var.ERR_MSG = "登录出错"
                    self.failed_count = self.failed_count + 1
                    time.sleep(g_var.SLEEP_TIME)
                    proxies = ip_proxy(VPN)
                    Session.proxies = proxies
                    continue
                elif loginData == 1:
                    # Abnormal account: fetch a new account and start over.
                    self.failed_count = self.failed_count + 1
                    login_signal = 1
                    break
                else:
                    self.failed_count = 0
                    self.proxy_err_count = 0
                    break
            else:
                # Runs only when no attempt reached `break`; comparing
                # retry_count with the maximum would also fire when the final
                # attempt succeeded.
                g_var.SPIDER_STATUS = 3
                g_var.ERR_MSG = "连续登录出错,程序停止"
                g_var.logger.error("login:连续登录失败!程序停止")
                break

            if login_signal == 1:
                continue

            # 2. Fetch personal data.
            retry_count = 0
            personal_signal = 0
            while retry_count < g_var.RETRY_COUNT_MAX:
                retry_count = retry_count + 1
                personalData = self.__personal_data(Session, loginData)
                if personalData == -1:
                    g_var.ERR_MSG = "个人数据获取出错"
                    self.failed_count = self.failed_count + 1
                    time.sleep(g_var.SLEEP_TIME)
                    proxies = ip_proxy(VPN)
                    Session.proxies = proxies
                    continue
                elif personalData == 1:
                    # Abnormal account: fetch a new account and start over.
                    self.failed_count = self.failed_count + 1
                    personal_signal = 1
                    break
                else:
                    self.failed_count = 0
                    self.proxy_err_count = 0
                    break
            else:
                # Every attempt failed (see the login stage for why `else`).
                # NOTE(review): the messages below still say "login" although
                # this is the personal-data stage; left unchanged.
                g_var.SPIDER_STATUS = 3
                g_var.ERR_MSG = "连续登录出错,程序停止"
                g_var.logger.error("login:连续登录失败!程序停止")
                break

            if personal_signal == 1:
                continue

            # 3. Post the link.
            retry_count = 0
            while retry_count < g_var.RETRY_COUNT_MAX:
                retry_count = retry_count + 1
                status = self.__postMessage(Session, loginData, personalData)
                if status == 0:  # Link posted successfully.
                    self.success_count = self.success_count + 1
                    self.failed_count = 0
                    self.proxy_err_count = 0
                    break
                elif status == 1:
                    self.failed_count = self.failed_count + 1
                    self.proxy_err_count = self.proxy_err_count + 1
                    time.sleep(g_var.SLEEP_TIME)
                    proxies = ip_proxy(VPN)
                    Session.proxies = proxies
                    continue
                elif status == -1:
                    # No link could be obtained; give up on this account.
                    self.failed_count = self.failed_count + 1
                    break
                # Any other status falls through and is retried immediately.
            else:
                # Every attempt failed (see the login stage for why `else`).
                g_var.SPIDER_STATUS = 3
                g_var.ERR_MSG = "连续发链接出错,程序停止"
                g_var.logger.error("连续发链接出错,程序停止")
                break
        g_var.logger.info("成功发送" + str(self.success_count) + "个链接。")
    def __login(self, present_website, VPN, userInfo, googlekey):
        """Log in, reusing a stored cookie when one is available.

        When ``userInfo[5]`` holds a cookie, the login data is built from it
        directly and no request is made. Otherwise a captcha is solved, a
        login request is posted, and the returned access token is saved to
        the ``cookie`` column of the ``present_website`` table.

        Args:
            present_website: Current site name, used as the database table name.
            VPN: Not used in this method body.
            userInfo: Indexable user record; the indexes read here are 0 (id),
                1 (first name), 2 (password), 3 (email), 5 (cookie) and
                6 (user id).
            googlekey: Site key forwarded to ``google_captcha``.

        Returns:
            On success, a dict::

                {
                    'id': ...,
                    'firstName': ...,
                    'password': ...,
                    'cookie': ...,
                    'userId': ...,
                }

            On failure, a status value:
                -1: headers could not be generated, or ``requestsW.post``
                    returned -1
                -2: the captcha failed, the response did not report success,
                    or no access token was found in the response
                0: the database update failed or raised
        """
        if userInfo[5] is not None and userInfo[5] != "":
            g_var.logger.info('login, cookie....')
            # userInfo[5] stores the cookie; reuse it when it is not empty.
            loginData = {
                'id': userInfo[0],
                'firstName': userInfo[1],
                'password': userInfo[2],
                'cookie': userInfo[5],
                'userId': userInfo[6],
            }
            return loginData

        g_var.logger.info('login, no cookie....')
        url_login = '******'
        # No cookie: log in with e-mail and password.
        headers = generate_headers(0)
        # The failure check must come before any item assignment; writing
        # headers['Referer'] on the -1 sentinel would raise TypeError.
        if headers == -1:
            g_var.logger.info("获取headers失败...")
            return -1
        headers['Referer'] = 'https://login.ex.co/login'
        captcha_value = google_captcha('', googlekey, url_login)
        if captcha_value == -1:
            return -2
        loginData = {
            "email": userInfo[3],
            "password": userInfo[2],
            "loginType": "Email",
            "captchaResponse": captcha_value,
        }
        g_var.logger.info("登录中...")
        html = requestsW.post(url_login,
                              proxies=ip_proxy("en"),
                              json=loginData,
                              headers=headers,
                              timeout=g_var.TIMEOUT)
        if html == -1:
            return html
        if '"response":"success"' not in html.text:
            g_var.logger.info('登录失败。。。')
            g_var.logger.info(html.text)
            return -2
        # A response without an access token is reported as -2 instead of
        # raising IndexError.
        token_matches = re.findall('"accessToken":"(.*?)"}', html.text)
        if not token_matches:
            g_var.logger.info('登录响应中未获取到accessToken。。。')
            return -2
        accessToken = token_matches[0]
        try:
            # Save the access token as the cookie in the database.
            # NOTE(review): the SQL is built by concatenating a value taken
            # from the remote response; switch to a parameterized query if
            # MysqlHandler supports one.
            sql = "UPDATE " + present_website + " SET cookie='" + accessToken + "' WHERE id=" + str(
                userInfo[0]) + ";"
            status = MysqlHandler().update(sql)
            if status == 0:
                g_var.logger.info("update cookie OK")
            else:
                g_var.ERR_CODE = 2004
                g_var.ERR_MSG = "数据库更新cookie错误..."
                g_var.logger.error("数据库更新cookie错误...")
                return 0
        except Exception as e:
            g_var.logger.info(e)
            g_var.ERR_CODE = 2004
            g_var.ERR_MSG = "数据库更新cookie异常..."
            g_var.logger.error("数据库更新cookie异常...")
            return 0
        loginData = {
            'id': userInfo[0],
            'firstName': userInfo[1],
            'password': userInfo[2],
            'cookie': accessToken,
            'userId': userInfo[6],
        }
        return loginData
 def __send_profile(self, userData):
     """
     发个人简介
     Args:
         Session:Session对象
         loginData:用户信息,包括user_id,username,password,email,cookie
     Returns:
         成功返回:0
         失败返回状态值:
             1:数据库存储失败
             -1:连续代理错误或页面发生改变等取不到关键数据等,需要停止程序
             -2:本次出错,继续循环
     """
     g_var.logger.info('send profile......')
     headers = generate_headers(1)
     if headers == -1:
         return -1
     g_var.logger.info('authenticity_token, session_id...')
     authenticity_token, session_id = get_authenticity_token(userData)
     if authenticity_token == -1 or session_id == -1:
         return -1
     elif authenticity_token == -2 or session_id == -2:
         return 1
     headers['Referer'] = 'https://www.sbnation.com/users/' + userData[
         'username'] + '/edit_profile'
     headers['Cookie'] = '_session_id=' + session_id
     titleLink = get_new_title_and_link()
     if titleLink == -1:
         return -1
     multipart_encoder = MultipartEncoder(
         fields={
             'utf8':
             '✓',
             '_method':
             'patch',
             'authenticity_token':
             authenticity_token,
             'profile_image[filename]':
             ('', '', 'application/octet-stream'),
             'profile_image[filename_cache]':
             '',
             'network_membership[bio]':
             '',
             'network_membership[signature]':
             '',
             'network_membership[public_email]':
             '',
             'network_membership[website_name]':
             titleLink[0],
             'network_membership[website_url]':
             titleLink[1],
             'network_membership[facebook_page_url]':
             '',
             'network_membership[facebook_page_url]':
             '',
             'network_membership[network_membership_items_attributes][0][key]':
             'MLB',
             'network_membership[network_membership_items_attributes][0][value]':
             '',
             'network_membership[network_membership_items_attributes][1][key]':
             'NFL',
             'network_membership[network_membership_items_attributes][1][value]':
             '',
             'network_membership[network_membership_items_attributes][2][key]':
             'NBA',
             'network_membership[network_membership_items_attributes][2][value]':
             '',
             'network_membership[network_membership_items_attributes][3][key]':
             'NHL',
             'network_membership[network_membership_items_attributes][3][value]':
             '',
             'network_membership[network_membership_items_attributes][4][key]':
             'NCAAF',
             'network_membership[network_membership_items_attributes][4][value]':
             '',
             'network_membership[network_membership_items_attributes][5][key]':
             'NCAAB',
             'network_membership[network_membership_items_attributes][5][value]':
             '',
             'network_membership[network_membership_items_attributes][6][key]':
             'MMA',
             'network_membership[network_membership_items_attributes][6][value]':
             '',
             'network_membership[network_membership_items_attributes][7][key]':
             'Golf',
             'network_membership[network_membership_items_attributes][7][value]':
             '',
             'network_membership[network_membership_items_attributes][8][key]':
             'NASCAR',
             'network_membership[network_membership_items_attributes][8][value]':
             '',
             'network_membership[network_membership_items_attributes][9][key]':
             'Boxing',
             'network_membership[network_membership_items_attributes][9][value]':
             '',
             'network_membership[network_membership_items_attributes][10][key]':
             'Soccer',
             'network_membership[network_membership_items_attributes][10][value]':
             '',
             'network_membership[network_membership_items_attributes][11][key]':
             'MLS',
             'network_membership[network_membership_items_attributes][11][value]':
             '',
             'network_membership[network_membership_items_attributes][12][key]':
             'EPL',
             'network_membership[network_membership_items_attributes][12][value]':
             '',
             'network_membership[network_membership_items_attributes][13][key]':
             'Football League Championship',
             'network_membership[network_membership_items_attributes][13][value]':
             '',
             'network_membership[network_membership_items_attributes][14][key]':
             'FIFA',
             'network_membership[network_membership_items_attributes][14][value]':
             '',
             'network_membership[network_membership_items_attributes][15][key]':
             'Bundesliga',
             'network_membership[network_membership_items_attributes][15][value]':
             '',
             'network_membership[network_membership_items_attributes][16][key]':
             'Serie A',
             'network_membership[network_membership_items_attributes][16][value]':
             '',
             'network_membership[network_membership_items_attributes][17][key]':
             'La Liga',
             'network_membership[network_membership_items_attributes][17][value]':
             '',
             'network_membership[network_membership_items_attributes][18][key]':
             'Cycling',
             'network_membership[network_membership_items_attributes][18][value]':
             '',
             'network_membership[network_membership_items_attributes][19][key]':
             'Tennis',
             'network_membership[network_membership_items_attributes][19][value]':
             '',
             'network_membership[network_membership_items_attributes][20][key]':
             'General',
             'network_membership[network_membership_items_attributes][20][value]':
             '',
             'commit':
             'Update',
         },
         boundary='----WebKitFormBoundary' + generate_random_string(
             16, 16,
             'abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ'),
     )
     headers['Content-Type'] = multipart_encoder.content_type
     g_var.logger.info("发布个人简介的链接...")
     url_link = 'https://www.sbnation.com/users/' + userData[
         'username'] + '/update_profile'
     html = requestsW.post(url_link,
                           proxies=ip_proxy("en"),
                           data=multipart_encoder,
                           headers=headers,
                           timeout=g_var.TIMEOUT)
     if html == -1:
         return html
     if html.status_code != 200:
         g_var.logger.info('链接发布失败。。。')
         g_var.logger.info(html.text)
         return -2
     try:
         url = 'https://www.sbnation.com/users/' + userData['username']
         sql = "INSERT INTO sbnation_com_article(url, user_id) VALUES('" + url + "', '" + str(
             userData["id"]) + "');"
         last_row_id = MysqlHandler().insert(sql)
         g_var.logger.info(last_row_id)
         if last_row_id != -1:
             g_var.logger.info('链接发送成功!' + userData['username'])
             return 0
         else:
             g_var.ERR_CODE = 2004
             g_var.ERR_MSG = "数据库插入用户注册数据失败..."
             g_var.logger.error("数据库插入用户注册数据失败...")
             return 1
     except Exception as e:
         g_var.logger.info(e)
         g_var.ERR_CODE = 2004
         g_var.ERR_MSG = "数据库插入用户注册数据异常..."
         g_var.logger.error("数据库插入用户注册数据异常...")
         return 1
 def login(self, present_website, VPN, userData):
     """
     Log an account in through the Vox Media password-auth endpoint.

     Args:
         present_website: Current site name. Not referenced in this method.
         VPN: Proxy selector. Not referenced in this method; the request
             is always sent through ``ip_proxy("en")``.
         userData: Account dict. ``username`` and ``password`` are read;
             on success ``cookie`` is written into this same dict.

     Returns:
         On success, ``userData`` (mutated in place) with ``cookie`` set to
         the ``_session_id`` value found in the ``Set-Cookie`` header.
         On failure, a status code:
             1: the response is not valid JSON, does not report
                ``logged_in``, or carries no ``_session_id`` cookie
             -1: request headers could not be generated, or
                 ``requestsW.post`` returned -1
     """
     g_var.logger.info('login ......')
     headers = generate_headers(2)
     if headers == -1:
         return -1
     headers['Cookie'] = get_login_session_id()
     login_data = {
         'username': userData['username'],
         'password': userData['password'],
         'remember_me': 'false',
         'g-recaptcha-response': '',
     }
     login_url = 'https://auth.voxmedia.com/chorus_auth/initiate_password_auth.json'
     g_var.logger.info('登录中 ......')
     html = requestsW.post(
         login_url,
         proxies=ip_proxy("en"),
         data=login_data,
         headers=headers,
         timeout=g_var.TIMEOUT,
     )
     if html == -1:
         return html
     try:
         g_var.logger.info(html.text)
         res_data = json.loads(html.text)
     except Exception as e:
         g_var.logger.info(e)
         g_var.logger.info('登录失败,返回信息解析失败。。。')
         g_var.logger.info(html.text)
         return 1
     # A body that is valid JSON but not an object, or that lacks the
     # "logged_in" key, is a failed login rather than a reason to raise.
     if not isinstance(res_data, dict) or not res_data.get('logged_in'):
         g_var.logger.info('登录失败。。。')
         g_var.logger.info(html.text)
         return 1
     # The header may be absent; fall back to an empty string so the
     # lookup yields "no cookie found" instead of a KeyError.
     set_cookie = html.headers.get('Set-Cookie') or ''
     session_ids = re.findall('_session_id=(.*?);', set_cookie)
     if not session_ids:
         return 1
     userData['cookie'] = session_ids[0]
     return userData
 def __register_one(self, present_website):
     """
     Register one account and store it in the ``present_website`` table.

     The username and password are random strings and the e-mail address
     is ``<username>@hotmail.com``; a Google captcha token is requested
     before the form is posted.

     Args:
         present_website: Current site name, used as the database table
             name in the INSERT statement.

     Returns:
         On success, a dict with ``id`` (value returned by
         ``MysqlHandler().insert``), ``username`` and ``password``.
         On failure, a status code:
             0: the database insert returned -1 or raised
             -1: headers or session id unavailable, or
                 ``requestsW.post`` returned -1
             -2: ``get_session_id`` returned -2, the captcha failed, the
                 response was not valid JSON, or it did not report
                 ``success``
     """
     g_var.logger.info('register......')
     headers = generate_headers(0)
     if headers == -1:
         return -1
     g_var.logger.info('session_id......')
     session_id = get_session_id()
     if session_id == -1:
         return -1
     if session_id == -2:
         return -2
     googlekey = '6LefyhkTAAAAANpeEKwwgimNneiKWXRQtEqFZbat'
     captcha_value = google_captcha(
         "", googlekey,
         'https://auth.voxmedia.com/signup?return_to=https://www.sbnation.com/'
     )
     if captcha_value == -1:
         return -2
     headers['cookie'] = session_id
     username = generate_random_string(8, 12)
     password = generate_random_string(10, 14)
     community_id = random.randint(210, 299)
     g_var.logger.info('community_id.....')
     g_var.logger.info(community_id)
     email = username + '@hotmail.com'
     register_form = {
         'g-recaptcha-response': captcha_value,
         'user[username]': username,
         'user[password]': password,
         'user[email]': email,
         'user[newsletter]': 'false',
         'community_id': community_id,
     }
     g_var.logger.info('开始提交注册信息...')
     # NOTE(review): the endpoint literal is masked in this copy of the
     # source; it is kept exactly as found.
     url_login = '******'
     html = requestsW.post(
         url_login,
         proxies=ip_proxy("en"),
         data=register_form,
         headers=headers,
         timeout=g_var.TIMEOUT,
     )
     if html == -1:
         return html
     try:
         g_var.logger.info(html.text)
         res_data = json.loads(html.text)
     except Exception as e:
         g_var.logger.info(e)
         g_var.logger.info('注册失败,返回信息解析失败。。。')
         g_var.logger.info(html.text)
         return -2
     # A JSON body that is not an object, or that has no "success" key,
     # is reported as a failed registration instead of raising.
     if not isinstance(res_data, dict) or not res_data.get('success'):
         g_var.logger.info('注册失败。。。')
         g_var.logger.info(html.text)
         return -2
     try:
         sql = "INSERT INTO " + present_website + "(username, password, mail) VALUES('" + \
               username + "', '" + password + "', '" + email + "');"
         last_row_id = MysqlHandler().insert(sql)
         g_var.logger.info(last_row_id)
         if last_row_id != -1:
             g_var.logger.info('注册成功!' + username)
             return {
                 'id': last_row_id,
                 'username': username,
                 'password': password,
             }
         g_var.ERR_CODE = 2004
         g_var.ERR_MSG = "数据库插入用户注册数据失败..."
         g_var.logger.error("数据库插入用户注册数据失败...")
         return 0
     except Exception as e:
         g_var.logger.info(e)
         g_var.ERR_CODE = 2004
         g_var.ERR_MSG = "数据库插入用户注册数据异常..."
         g_var.logger.error("数据库插入用户注册数据异常...")
         return 0
    def __postMessage(self, loginData, present_website, googlekey):
        """
        Publish one article on ex.co and record its URL in the database.

        Args:
            loginData: Account dict. ``cookie`` and ``id`` are read;
                ``firstName`` is used for the success log line if present.
            present_website: Current site name, used as the table name when
                an expired cookie is cleared.
            googlekey: reCAPTCHA site key passed to ``google_captcha``.

        Returns:
            0: article published and its URL inserted
            1: cookie expired and clearing it in the database failed
            -1: headers unavailable or empty cookie, no article content,
                ``requestsW.post`` returned -1, or the publish response
                contains no item id
            -2: captcha solving failed
            -3: the database insert returned -1 or raised
            -4: cookie expired and was cleared in the database
        """
        g_var.logger.info('post article......')
        item_id = str(uuid.uuid4())
        sections_id = str(uuid.uuid4())
        g_var.logger.info('正在获取headers。。。')
        headers = generate_headers(2, loginData['cookie'], item_id)
        if headers == -1 or loginData['cookie'] == "":
            g_var.logger.info("获取headers失败...")
            return -1
        captcha_url = 'https://app.ex.co/create/new/preview'
        captcha_value = google_captcha('', googlekey, captcha_url)
        if captcha_value == -1:
            return -2
        title, ops = get_article()
        if title == -1 or ops == -1:
            g_var.logger.info("未能获取对应文章格式内容...")
            return -1
        article_data = generate_post_article_data(
            loginData, item_id, sections_id, captcha_value, title, ops)
        g_var.logger.info("文章发送中...")
        url = 'https://editor.ex.co/item/publish'
        res = requestsW.post(
            url,
            proxies=ip_proxy("en"),
            json=article_data,
            headers=headers,
            timeout=g_var.TIMEOUT,
        )
        if res == -1:
            return res

        # The service answers with this exact body when the token is rejected.
        cookie_prove = '401 - "Failed to authenticate token"'
        if cookie_prove == res.text:
            g_var.logger.info('cookie 失效 ......')
            # Clear the stale cookie so the account is logged in again with
            # its username/password the next time it is picked.
            sql = "UPDATE " + present_website + " SET cookie='' WHERE id=" + str(
                loginData['id']) + ";"
            status = MysqlHandler().update(sql)
            if status == 0:
                g_var.logger.info("cookie失效,清除cookie update OK")
                return -4
            g_var.logger.error("数据库清除cookie错误!")
            return 1

        # Raw string: "\{" is not a valid escape in a normal string literal.
        if not re.search(r'"item":\{"id":"(.*?)","tags"', res.text):
            g_var.ERR_CODE = 5000
            g_var.ERR_MSG = "文章发送失败,IP异常等原因..."
            g_var.logger.info('文章发送失败,IP异常等原因...')
            return -1
        try:
            url = 'https://app.ex.co/stories/item/' + item_id
            # NOTE(review): title is interpolated into the SQL text as-is; a
            # quote character in it would break the statement.
            sql = "INSERT INTO playbuzz_com_article(url, keyword, user_id) VALUES('" + url + "', '" + title + "', '" + str(
                loginData["id"]) + "');"
            last_row_id = MysqlHandler().insert(sql)
            g_var.logger.info(last_row_id)
            if last_row_id != -1:
                # .get(): a missing "firstName" must not turn a successful
                # insert into the -3 database-error path below.
                g_var.logger.info('文章成功!' + str(loginData.get('firstName', '')))
                return 0
            g_var.ERR_CODE = 2004
            g_var.ERR_MSG = "数据库插入用户注册数据失败..."
            g_var.logger.error("数据库插入用户注册数据失败...")
            return -3
        except Exception as e:
            g_var.logger.info(e)
            g_var.ERR_CODE = 2004
            g_var.ERR_MSG = "数据库插入用户注册数据异常..."
            g_var.logger.error("数据库插入用户注册数据异常...")
            return -3
Пример #19
0
    def start(self, present_website, VPN):
        """
        Register, log in and post one article per account until the quota is met.

        Every round of the outer loop builds a fresh ``requests.Session``
        behind a newly fetched proxy and then runs three stages (register,
        login, post). Each stage is retried up to ``g_var.RETRY_COUNT_MAX``
        times; only when a stage uses up all its attempts without leaving
        its loop is ``g_var.SPIDER_STATUS`` set to 3 and the run stopped.
        A stage that succeeds on its final attempt is treated as a success.

        Args:
            present_website: Current site name, forwarded to
                ``__register_one``.
            VPN: Proxy selector forwarded to ``ip_proxy`` and ``__login``.

        Returns:
            None. Progress is kept in the counters on ``self`` and in
            ``g_var``.
        """
        while self.success_count < self.assignment_num:
            # Check the current error state at the top of every round.
            if self.__monitor_status() == -1:
                break
            self.now_count = self.now_count + 1
            # Set up the Session object.
            Session = requests.Session()
            proxies = ip_proxy(VPN)
            if proxies == {"error": -1}:
                self.failed_count = self.failed_count + 1
                continue
            Session.proxies = proxies
            Session.mount('http://', HTTPAdapter(max_retries=1))
            Session.mount('https://', HTTPAdapter(max_retries=1))

            # 1. Register. The ``else`` of a ``while`` runs only when the
            # loop condition became false, i.e. no attempt hit ``break``.
            retry_count = 0
            while retry_count < g_var.RETRY_COUNT_MAX:
                retry_count = retry_count + 1
                registerData = self.__register_one(Session, present_website)
                if registerData != -1:  # registration succeeded
                    break
                # Failed: switch proxy and try again.
                g_var.logger.info("注册失败" + str(registerData))
                time.sleep(g_var.SLEEP_TIME)
                Session.proxies = ip_proxy(VPN)
            else:
                # Consecutive failures mean something is wrong; stop.
                g_var.SPIDER_STATUS = 3
                g_var.logger.error("start:连续注册失败!程序停止")
                break

            # 2. Log in with a userInfo tuple built from the registration data.
            userInfo = (registerData['user_id'], registerData['name'],
                        registerData['password'], registerData['mail'],
                        '0', "")
            retry_count = 0
            while retry_count < g_var.RETRY_COUNT_MAX:
                retry_count = retry_count + 1
                loginData = self.__login(Session, VPN, userInfo)
                if loginData == {"error": -1}:
                    # Login error: switch proxy and retry.
                    g_var.ERR_MSG = "登录出错"
                    self.failed_count = self.failed_count + 1
                    time.sleep(g_var.SLEEP_TIME)
                    Session.proxies = ip_proxy(VPN)
                elif loginData == {"error": 1}:
                    # Account problem: count it and retry.
                    self.failed_count = self.failed_count + 1
                else:
                    self.failed_count = 0
                    self.proxy_err_count = 0
                    break
            else:
                g_var.SPIDER_STATUS = 3
                g_var.logger.error("start:连续登录失败!程序停止")
                break

            # 3. Post the article.
            retry_count = 0
            while retry_count < g_var.RETRY_COUNT_MAX:
                retry_count = retry_count + 1
                status = self.__postMessage(Session, loginData)
                if status == {"ok": 0}:  # article posted
                    self.success_count = self.success_count + 1
                    self.failed_count = 0
                    self.proxy_err_count = 0
                    break
                elif status == {"error": 1}:
                    self.failed_count = self.failed_count + 1
                    self.proxy_err_count = self.proxy_err_count + 1
                    time.sleep(g_var.SLEEP_TIME)
                    Session.proxies = ip_proxy(VPN)
                elif status == {"error": -1}:
                    # No article available: give up on this account.
                    self.failed_count = self.failed_count + 1
                    break
            else:
                # Consecutive failures mean something is wrong; stop.
                g_var.SPIDER_STATUS = 3
                g_var.ERR_MSG = "连续发文章出错,程序停止"
                g_var.logger.error("连续发文章出错,程序停止")
                break
        g_var.logger.info("成功注册账户并发送文章" + str(self.success_count) + "篇")
Пример #20
0
    def __register_one(self, Session, present_website: str, email_and_passwd):
        """
        Register one diigo.com account and verify it through its e-mail.

        Args:
            Session: Session object; used for the availability checks and as
                the holder of the current ``proxies``.
            present_website: Current site name. Not referenced in this
                method; the INSERT below uses the literal "diigo_com".
            email_and_passwd: Mailbox credentials, ``[0]`` is the address
                and ``[1]`` its password; -1 means no mailbox is available.
        Returns:
            On success, a dict with ``username``, ``password``, ``email``,
            ``cookie`` and ``id`` (row id from ``MysqlHandler().insert``).
            If the verification link was opened but the insert returned -1,
            a dict with the keys ``user``, ``pwd``, ``email``, ``cookies``.
            Otherwise:
                0: no mailbox, name/e-mail already taken, or every attempt
                   in the retry loop raised
                -1: opening the home page through ``requestsW`` returned -1
                -2: captcha failure, or an attempt finished without
                    reaching one of the returns above
                "注册无法打开网页": the sign-up form check failed
        """

        user = project_util.generate_random_string(12, 16)
        pwd = project_util.generate_random_string(10, 12)
        email_list = email_and_passwd
        if email_list == -1:
            g_var.SPIDER_STATUS = 2
            g_var.ERR_MSG = g_var.ERR_MSG + "|_|NO email"
            g_var.logger.info("NO email")
            return 0

        verify_email = Session.get(
            "https://www.diigo.com/user_mana2/check_email?email=" +
            email_list[0],
            timeout=g_var.TIMEOUT,
            headers=self.headers,
            proxies=Session.proxies)  # check whether the e-mail address is available

        # NOTE(review): the next statement is corrupted in this copy of the
        # source (part of it was replaced by "******"), so it is not valid
        # Python as it stands. Presumably it finished the username check and
        # opened an ``if`` on the two check results; restore it from the
        # upstream file before running this method.
        verify_user = Session.get(
            "https://www.diigo.com/user_mana2/check_name?username="******"1":
            g_var.SPIDER_STATUS = 2
            g_var.ERR_MSG = g_var.ERR_MSG + "|_|账号密码或邮箱已经被注册"
            g_var.logger.info("账号密码或邮箱已经被注册")
            return 0

        # time.sleep(3)

        google_captchas = google_captcha(
            "", "6Ld23sMSAAAAALfyXkI9d0nHmzOH9jZZNuh66nql",
            "https://www.diigo.com/sign-up?plan=free")
        if google_captchas == -1:
            g_var.SPIDER_STATUS = 2
            g_var.ERR_MSG = g_var.ERR_MSG + "|_|谷歌打码失败"
            g_var.logger.info("谷歌打码失败")
            return -2

        res = requestsW.get("https://www.diigo.com/",
                            headers=self.headers,
                            proxies=Session.proxies)  # open the home page
        if res == -1: return res
        cookies = res.cookies.get_dict()
        i = 0
        while i < g_var.ERR_COUNT:
            i += 1
            try:
                # A new proxy is fetched for every attempt.
                Session.proxies = ip_proxy()
                res = requests.get("https://www.diigo.com/sign-up?plan=free",
                                   headers=self.headers,
                                   cookies=cookies,
                                   proxies=Session.proxies,
                                   verify=False)
                # The form field names are 32-character tokens read from the page.
                user_input = re.search('id="username" name="(\w{32})">',
                                       res.text)
                email_input = re.search('id=\'email\' name="(\w{32})">',
                                        res.text)
                pwd_input = re.search('id=\'password\' name="(\w{32})"',
                                      res.text)
                # NOTE(review): as written this is
                # ``(not user_input) and email_input and pwd_input``; a missing
                # e-mail or password field falls through to ``.group`` on None.
                # Presumably "any field missing" was intended - TODO confirm.
                if not user_input and email_input and pwd_input:  # TODO: parameters could not be read
                    return "注册无法打开网页"
                else:
                    user_input = user_input.group(1)
                    email_input = email_input.group(1)
                    pwd_input = pwd_input.group(1)
                data = {
                    "plan": "free",
                    "g-recaptcha-response": google_captchas,
                    user_input: user,
                    email_input: email_and_passwd[0],
                    pwd_input: pwd,
                }
                # These header changes are made on self.headers and therefore
                # stay in place for later requests.
                self.headers["X-Requested-With"] = "XMLHttpRequest"
                self.headers[
                    "Referer"] = "https://www.diigo.com/sign-up?plan=free"
                self.headers[
                    "Content-Type"] = "application/x-www-form-urlencoded; charset=UTF-8"

                res = requests.post(
                    "https://www.diigo.com/user_mana2/register_2",
                    headers=self.headers,
                    cookies=cookies,
                    data=data,
                    proxies=Session.proxies,
                    verify=False)
                print(res.json())
                if project_util.dictExistValue(res.json(), "status"):
                    if res.json()["status"] == 1:
                        cookies.update(res.cookies.get_dict())
                        # savec is the same dict object as cookies, not a copy.
                        savec = cookies
                        # Ask the site to send the verification mail again.
                        res = requestsW.post(
                            "https://www.diigo.com/user_mana2/resend_verify",
                            cookies=cookies,
                            headers=self.headers,
                            data={"email": email_and_passwd[0]},
                            proxies=Session.proxies)
                        print("重新发送邮箱:", res.text)

                        # Fetch the verification link from the mailbox.
                        emailinfo = EmailVerify(
                            email_and_passwd[0], email_and_passwd[1],
                            'href="(https://www.diigo.com/user_mana2/register_verify/\w{32})"'
                        ).execute_Start()
                        print("这里是邮箱参数:", emailinfo)
                        if emailinfo["data"] != -1:
                            # Rebinds the local name; the caller's Session is
                            # not the one used from here on.
                            Session = requestsW.session()
                            res = Session.get(emailinfo["data"],
                                              headers=self.headers,
                                              proxies=Session.proxies,
                                              cookies=cookies)
                            sql = """INSERT INTO %s (username, password, mail, status, cookie) VALUES("%s", "%s", "%s", "%s", "%s");""" % (
                                "diigo_com", user, pwd, email_and_passwd[0], 0,
                                savec)
                            g_var.logger.info(sql)
                            last_row_id = MysqlHandler().insert(sql)

                            if last_row_id != -1:
                                registerData = {
                                    "username": user,
                                    "password": pwd,
                                    "email": email_and_passwd[0],
                                    "cookie": savec,
                                }
                                registerData["id"] = int(last_row_id)
                                return registerData
                            # Insert failed: the account data is still returned,
                            # but under different key names and without an id.
                            return {
                                "user": user,
                                "pwd": pwd,
                                "email": email_and_passwd[0],
                                "cookies": Session.cookies.get_dict()
                            }
                            # Disabled alternative kept from the original author:
                            # if project_util.dictExistValue(res.cookies.get_dict(),"diigoandlogincookie"):  # registered and login cookie present
                            #     saveCookie = str(Session.cookies.get_dict())
                            #     # print({"user": user, "pwd": pwd, "email": email_and_passwd[0], "cookies": saveCookie})
                            #     return {"user": user, "pwd": pwd, "email": email_and_passwd[0], "cookies": saveCookie}
                    elif res.json()["status"] == -2:
                        # NOTE(review): "status" equals the int -2 here, so the
                        # ``in`` test below raises TypeError and control goes to
                        # the except handler; presumably another response field
                        # was meant - TODO confirm.
                        if "captcha error" in res.json()["status"]:
                            g_var.SPIDER_STATUS = 2
                            g_var.ERR_MSG = g_var.ERR_MSG + "|_|谷歌打码失败"
                            g_var.logger.info("谷歌打码失败")
                            return -2
                # Reached whenever the attempt got this far without returning.
                return -2

            except Exception as e:
                # Re-open the home page to get fresh cookies for the next attempt.
                # NOTE(review): if requestsW.get returns -1 here, ``res.cookies``
                # raises outside any handler - verify against requestsW.
                res = requestsW.get("https://www.diigo.com/",
                                    headers=self.headers,
                                    proxies=Session.proxies,
                                    verify=False)  # open the home page
                cookies = res.cookies.get_dict()
                g_var.logger.info(e)
                # NOTE(review): ``e`` is passed as a format argument but the
                # message has no placeholder - confirm how g_var.logger handles it.
                g_var.logger.info("正在换ip", e)
        return 0
Пример #21
0
    def login(self, Session, present_website: str, VPN, userInfo):
        """
        Log a diigo.com account in, reusing a stored cookie when there is one.

        1. If ``userInfo[5]`` holds a cookie, the login data is built from it
           and no request is made.
        2. Otherwise a captcha is solved, the sign-in form is posted (retried
           up to ``g_var.ERR_COUNT`` times, with a new proxy per attempt) and
           the resulting cookies are written to the database.

        Args:
            Session: Session object; only its ``proxies`` attribute is used.
            present_website: Current site name, used as the table name in the
                UPDATE statement.
            VPN: Proxy selector. Not referenced in this method.
            userInfo: Account record, ``[0]`` id, ``[1]`` username,
                ``[2]`` password, ``[5]`` cookie.

        Returns:
            On success a dict with ``id``, ``username``, ``password`` and
            ``cookie``. Otherwise one of the following (kept as in the
            original so existing callers see the same values):
                "谷歌打码失败": captcha solving failed
                "为获取登陆cookie": no ``loginToken`` on the sign-in page
                -2: the sign-in response does not contain ``"status":1``
                -1: every attempt raised, or the response cookies lack
                    ``diigoandlogincookie``
                {"error": 1}: storing the cookie in the database failed
        """
        user_id = userInfo[0]
        username = userInfo[1]
        password = userInfo[2]
        cookie = userInfo[5]
        if cookie is not None and cookie != "":
            # A stored cookie short-circuits the whole login flow.
            g_var.logger.info("返回cookie" + cookie)
            return {
                'id': user_id,
                'username': username,
                'password': password,
                'cookie': str(cookie),
            }

        sign_in_url = "https://www.diigo.com/sign-in?referInfo=https%3A%2F%2Fwww.diigo.com"
        google_captchas = google_captcha(
            "", "6Ld23sMSAAAAALfyXkI9d0nHmzOH9jZZNuh66nql", sign_in_url)
        if google_captchas == -1:
            return "谷歌打码失败"

        i = 0
        while i < g_var.ERR_COUNT:
            i += 1
            try:
                Session.proxies = ip_proxy()
                res = requests.get(sign_in_url,
                                   headers=self.headers,
                                   proxies=Session.proxies)
                # Raw string: "\w" is not a valid escape in a normal literal.
                login_token = re.search(
                    r'name="loginToken" value="(\w{32})"', res.text)
                if not login_token:
                    return "为获取登陆cookie"
                login_token = login_token.group(1)
                print(login_token)
                cookies = res.cookies.get_dict()
                data = {
                    "referInfo": "https://www.diigo.com",
                    "loginToken": login_token,
                    "username": username,
                    "password": password,
                    "g-recaptcha-response": google_captchas,
                    "recaptcha": "v2",
                }
                # Set after the GET on purpose: the first page load goes out
                # with the unmodified headers, as before.
                self.headers["X-Requested-With"] = "XMLHttpRequest"
                self.headers["Referer"] = sign_in_url
                self.headers[
                    "Content-Type"] = "application/x-www-form-urlencoded; charset=UTF-8"
                g_var.logger.info("正在登录中")
                res = requests.post("https://www.diigo.com/sign-in",
                                    headers=self.headers,
                                    data=data,
                                    cookies=cookies,
                                    proxies=Session.proxies)
                g_var.logger.info("登录结束")
                g_var.logger.info(res.text)
                if '"status":1' not in res.text:
                    return -2
                break
            except Exception as e:
                g_var.logger.info("正在换ip" + str(e))
        else:
            # No attempt completed: ``res`` is either unbound or a stale
            # sign-in page response, so there is no login cookie to read.
            return -1

        save_cookies = str(res.cookies.get_dict())
        if "diigoandlogincookie" not in save_cookies:
            return -1

        sql = "UPDATE %s SET cookie=\"%s\" WHERE id=%s ;" % (
            present_website, save_cookies, user_id)
        g_var.logger.info(sql)
        status = MysqlHandler().update(sql)
        if status == 0:
            # The log texts below are kept from the original; they mention
            # clearing, but this branch stores the new cookie.
            g_var.logger.info("cookie失效,清除cookie update OK")
            return {
                'id': user_id,
                'username': username,
                'password': password,
                'cookie': save_cookies,
            }
        g_var.logger.error("数据库清除cookie错误!")
        return {"error": 1}
Пример #22
0
    # Manual test driver body: store the run parameters in g_var, load the
    # site configuration, then exercise one stage of PastebinCom by hand.
    # args = get_command_line_arguments()
    g_var.ALL_COUNT = count
    g_var.INTERFACE_HOST = host
    g_var.UUID = uuid
    # Load the configuration parameters.
    get_global_params(present_website, True)

    # 1. Registration test
    # PastebinCom(1).registers(present_website, VPN)

    # 2. Login test
    # s = requestsW.session()
    # userInfo = generate_login_data(present_website, "D:\qianwei_gitrepo\SendArticle\pastebin_com\config.json")  # absolute path of the site's json file
    # loginData = PastebinCom(1).login(s, present_website, VPN, userInfo)

    # 3. Article/profile sending test
    s = requestsW.session()
    s.proxies = ip_proxy("en")
    # NOTE(review): the path is a non-raw string containing backslashes and is
    # specific to one developer machine.
    userInfo = generate_login_data(
        present_website,
        "D:\qianwei_gitrepo\SendArticle\pastebin_com\config.json"
    )  # absolute path of the site's json file
    # NOTE(review): eval() runs whatever text is stored in userInfo[5];
    # presumably that is a str()-serialised cookie dict - confirm, and prefer
    # ast.literal_eval if so.
    loginData = {
        'id': userInfo[0],
        'username': userInfo[1],
        'password': userInfo[2],
        'email': userInfo[3],
        'cookie': eval(userInfo[5]),
    }
    PastebinCom(1).send_profile(s, loginData)
Пример #23
0
    def loginAndPostMessage(self, present_website, VPN):
        """Log stored accounts in and post articles until the quota is met.

        Every outer round takes one account from the database, logs it in
        (swapping the proxy on proxy errors) and then posts one article.
        The loop ends when ``self.success_count`` reaches
        ``self.assignment_num``, when ``self.__monitor_status()`` returns -1,
        or when a step fails on every one of its ``g_var.RETRY_COUNT_MAX``
        attempts.

        Args:
            present_website: Site name handed to ``generate_login_data``,
                ``self.__login`` and ``self.__postMessage``.
            VPN: Proxy selector handed to ``get_Session`` and ``ip_proxy``.

        Returns:
            -1 when no account could be loaded from the database,
            otherwise None.
        """
        while self.success_count < self.assignment_num:
            # Check the current error state at the start of every round.
            if self.__monitor_status() == -1:
                break
            self.now_count = self.now_count + 1

            Session = get_Session(VPN)
            if Session == -1:
                self.failed_count = self.failed_count + 1
                continue

            # Load one account from the database.
            userInfo = generate_login_data(present_website)
            g_var.logger.info(userInfo)
            if userInfo is None:
                g_var.ERR_CODE = 2001
                g_var.ERR_MSG = g_var.ERR_MSG + "无法获取proxy!"
                g_var.logger.error("数据库中获取用户失败,本线程停止!")
                return -1

            # 1. Log in.
            login_signal = 0  # becomes 1 when the account itself is unusable
            # Track the outcome explicitly: comparing retry_count with the
            # maximum would misread a success on the final attempt as
            # "all attempts failed".
            logged_in = False
            retry_count = 0
            while retry_count < g_var.RETRY_COUNT_MAX:
                retry_count = retry_count + 1

                loginData = self.__login(Session, present_website, VPN,
                                         userInfo)
                if loginData == -1:
                    # Proxy problem: switch to another proxy and retry.
                    g_var.ERR_MSG = "登录出错"
                    self.failed_count = self.failed_count + 1
                    time.sleep(g_var.SLEEP_TIME)
                    proxies = ip_proxy(VPN)
                    if proxies == {"error": -1}:
                        self.failed_count = self.failed_count + 1
                        continue
                    Session.proxies = proxies
                    continue
                elif loginData == -2:
                    # Account problem: give up on this account.
                    self.failed_count = self.failed_count + 1
                    login_signal = 1
                    break
                else:
                    self.failed_count = 0
                    self.proxy_err_count = 0
                    logged_in = True
                    break
            if login_signal == 1:
                # Move on to the next account.
                continue
            if not logged_in:
                # Every attempt failed, so something is wrong: stop.
                g_var.SPIDER_STATUS = 3
                g_var.ERR_MSG = "连续登录出错,程序停止"
                g_var.logger.error("login:连续登录失败!程序停止")
                break

            # 2. Post the article.
            post_settled = False  # True once the loop is left via break
            retry_count = 0
            while retry_count < g_var.RETRY_COUNT_MAX:
                time.sleep(g_var.SLEEP_TIME)
                retry_count = retry_count + 1
                status = self.__postMessage(Session, loginData,
                                            present_website)
                if status == 0:  # article posted
                    self.success_count = self.success_count + 1
                    self.failed_count = 0
                    self.proxy_err_count = 0
                    post_settled = True
                    break
                elif status == -1:
                    # -1: proxy problem, switch to another proxy.
                    self.failed_count = self.failed_count + 1
                    self.proxy_err_count = self.proxy_err_count + 1
                    time.sleep(g_var.SLEEP_TIME)
                    proxies = ip_proxy(VPN)
                    if proxies == {"error": -1}:
                        self.failed_count = self.failed_count + 1
                        continue
                    Session.proxies = proxies
                elif status == -2:
                    # -2: an error that requires the program to stop.
                    self.failed_count = self.failed_count + 1
                    g_var.SPIDER_STATUS = 3
                    post_settled = True
                    break
                elif status == -3:
                    # -3: database error, retry.
                    self.failed_count = self.failed_count + 1
            if not post_settled:
                # Every attempt failed, so something is wrong: stop.
                g_var.SPIDER_STATUS = 3
                g_var.ERR_MSG = "连续发文章出错,程序停止"
                g_var.logger.error("连续发文章出错,程序停止")
                break
        g_var.logger.info("成功发送" + str(self.success_count) + "篇文章")
Пример #24
0
    def __login(self, Session, VPN, userInfo) -> dict:
        """Log a stored Reddit account in, reusing its saved cookie if any.

        Args:
            Session: HTTP session used for the requests; its ``proxies`` are
                replaced with ``ip_proxy(VPN)`` whenever a login POST raises.
            VPN: Proxy selector handed to ``ip_proxy``.
            userInfo: Account row. Index 0 is the id, 1 the username, 2 the
                password and 5 the saved cookie (None or "" when absent).

        Returns:
            ``{'id', 'name', 'cookie'}`` when the saved cookie is reused,
            ``{'id', 'name'}`` after a fresh password login,
            ``{"error": -1}`` when no CSRF token is found or every login
            POST raised, and ``{"error": 1}`` when the response carries no
            ``reddit_session`` cookie, the cookie cannot be stored, or an
            unexpected exception occurs.
        """
        try:
            # A saved cookie lets us skip the login flow entirely; only
            # accounts without one go through the password login below.
            saved_cookie = userInfo[5]
            if saved_cookie is not None and saved_cookie != "":
                print("正在获取cookie")
                g_var.logger.info("返回cookie" + saved_cookie)
                # Three keys: this loginData carries the cookie.
                return {
                    'id': userInfo[0],
                    'name': userInfo[1],
                    'cookie': saved_cookie
                }

            print("用账号密码登录中")
            user_id = userInfo[0]
            username = userInfo[1]
            password = userInfo[2]

            res = Session.get("https://www.reddit.com/register/?actionSource=header_signup",
                              proxies=Session.proxies,
                              timeout=g_var.TIMEOUT)
            re_res = re.search('<input type="hidden" name="csrf_token" value="(.*?)">', res.text)
            # re.search returns None when nothing matches; test for that
            # before touching the match object.
            if re_res is None:
                g_var.logger.info("注册未获取到token")
                return {"error": -1}
            csrf_token = re_res.group(1)

            data = {
                "csrf_token": csrf_token,
                "otp": "",
                "dest": "https://www.reddit.com",
                "password": password,
                "username": username,
            }
            print("正在提交参数", data)

            # `cookie` stays None until one POST completes, which tells a
            # success on the final attempt apart from exhausted retries.
            cookie = None
            retry_count = 0
            while retry_count < g_var.RETRY_COUNT_MAX:
                retry_count = retry_count + 1
                try:
                    g_var.logger.info("使用账号密码登录...")
                    res = Session.post("https://www.reddit.com/login",
                                       proxies=Session.proxies,
                                       data=data,
                                       timeout=g_var.TIMEOUT)
                    cookie = res.cookies.get_dict()
                    print("这里是cookie", cookie)
                    self.proxy_err_count = 0
                    break
                except Exception as e:
                    # Append the exception text to the message instead of
                    # passing it as a stray logging argument.
                    g_var.logger.error("账号密码登录超时:" + str(e))
                    self.proxy_err_count = self.proxy_err_count + 1
                    time.sleep(g_var.SLEEP_TIME)
                    Session.proxies = ip_proxy(VPN)
            if cookie is None:
                g_var.SPIDER_STATUS = 3
                g_var.logger.error("连续登录失败!程序停止")
                return {"error": -1}

            if not self.__dictExistValue(cookie, "reddit_session"):
                # TODO: on a failed login, mark the account abnormal in the DB:
                # sql = "UPDATE reddit_com SET status=1 WHERE id=" + str(user_id) + ";"
                # MysqlHandler().update(sql)
                return {"error": 1}  # account problem: take another account

            print("正在存入cookie")
            # NOTE(review): the statement is assembled by string
            # concatenation; switch to a parameterized query if
            # MysqlHandler supports one.
            sql = "UPDATE reddit_com SET cookie=\"" + str(cookie) + "\" WHERE id=" + str(
                user_id) + ";"
            status = MysqlHandler().update(sql)
            if status != 0:
                g_var.logger.error("数据库更新cookie错误!")
                return {"error": 1}
            g_var.logger.info("update cookie OK")
            # Two keys: loginData of a fresh password login.
            return {
                'id': user_id,
                'name': username
            }
        except Exception as e:
            g_var.ERR_CODE = "2100"
            g_var.ERR_MSG = g_var.ERR_MSG + "|_|"+"ip出现问题 请求失败"
            g_var.logger.error("登录错误:" + str(e))
            return {"error": 1}
Пример #25
0
    def __register_one(self, present_website, email_info):
        """Register one wattpad.com account and confirm it through e-mail.

        Args:
            present_website: Site name handed to ``generate_register_data``.
            email_info: Mailbox data handed to ``generate_register_data``
                and ``get_verify_url``.

        Returns:
            The registration dict extended with ``"id"`` (inserted row id)
            and ``"token"`` on success; otherwise a status code:
            -1 when a request helper returned -1,
            -2 when headers or form data could not be built or the sign-up
               response lacks the greeting for the new user,
            -3 when no verification URL was read or the verification
               request did not answer with status 200,
            0 when the account could not be written to the database.
        """
        log = g_var.logger

        log.info("register...")
        headers = generate_headers(0)
        if headers == -1:
            log.info("获取注册headers失败...")
            return -2

        registerData = generate_register_data(present_website, email_info)
        log.info(registerData)
        if registerData == -1:
            log.info("未生成正确注册数据...")
            return -2

        log.info("提交注册中...")
        signup_resp = requestsW.post(
            'https://www.wattpad.com/signup?nextUrl=/home',
            proxies=ip_proxy("en"),
            data=registerData,
            headers=headers,
            timeout=g_var.TIMEOUT)
        if signup_resp == -1:
            return -1

        # A successful sign-up page greets the new user by name.
        greeting = 'Hi @' + registerData['username']
        if greeting not in signup_resp.text:
            log.info(signup_resp.text)
            log.info("IP被封等原因...")
            return -2

        tokens = re.findall('token=(.*?);', signup_resp.headers['Set-Cookie'])
        # These form-post headers are dropped before the verification GET.
        for form_header in ('Origin', 'Content-Type', 'Referer'):
            del headers[form_header]
        time.sleep(2)

        verify_url = get_verify_url(email_info)
        if verify_url == -1:
            log.info("未读取到邮箱验证的url...")
            return -3

        log.info("邮件的url正在验证中...")
        verify_resp = requestsW.get(url=verify_url,
                                    proxies=ip_proxy("en"),
                                    headers=headers,
                                    timeout=g_var.TIMEOUT)
        if verify_resp == -1:
            return -1

        if verify_resp.status_code != 200:
            g_var.ERR_CODE = 3006
            g_var.ERR_MSG = "邮箱验证失败..."
            log.error("邮箱验证失败!\n")
            return -3

        sql = "".join([
            "INSERT INTO wattpad_com(username, password, mail, status) VALUES('",
            registerData['username'],
            "', '",
            registerData['password'],
            "', '",
            registerData['email'],
            "', '",
            str(0),
            "');",
        ])
        row_id = MysqlHandler().insert(sql)
        if row_id == -1:
            g_var.ERR_CODE = 2004
            g_var.ERR_MSG = "数据库插入用户注册数据失败..."
            log.error("数据库插入用户注册数据失败...")
            return 0

        registerData["id"] = row_id
        registerData["token"] = tokens[0]
        return registerData
Пример #26
0
    def start(self, present_website, VPN):
        """Register, log in and post until ``assignment_num`` posts succeed.

        Every outer round registers a fresh account with a mailbox from
        ``get_email``, logs it in and posts one article. The loop ends when
        ``self.success_count`` reaches ``self.assignment_num``, when
        ``self.__monitor_status()`` returns -1, when no mailbox is left, or
        when a step ends without success (``g_var.SPIDER_STATUS`` is then
        set to 3).

        Args:
            present_website: Site name; also used as the table name when the
                stored cookie is cleared.
            VPN: Proxy selector handed to ``get_Session`` and ``ip_proxy``.

        Returns:
            ``{"error": 1}`` when clearing a stale cookie in the database
            fails, otherwise None.
        """
        while self.success_count < self.assignment_num:
            # Check the current error state at the start of every round.
            if self.__monitor_status() == -1:
                break
            self.now_count = self.now_count + 1

            # Set up the session object.
            Session = get_Session(VPN)
            if Session == -1:
                self.failed_count = self.failed_count + 1
                continue

            # 1. Register.
            # Outcomes are tracked with explicit flags: comparing retry_count
            # with the maximum would misread a success on the final attempt
            # as "all attempts failed".
            registered = False
            retry_count = 0
            email_and_passwd = get_email(present_website)
            if email_and_passwd == -1:
                # No mailbox left. Skip the registration loop so the check
                # below stops the program; jumping back to the top of the
                # outer loop would only repeat this failure.
                retry_count = g_var.RETRY_COUNT_MAX
                g_var.ERR_MSG = g_var.ERR_MSG + "|_|没有邮箱了"
                g_var.logger.error("没有邮箱了")
            while retry_count < g_var.RETRY_COUNT_MAX:
                retry_count = retry_count + 1
                registerData = self.__register_one(Session, present_website,
                                                   email_and_passwd)
                if registerData == -1:
                    # Proxy error: force the loop to end.
                    g_var.ERR_MSG = g_var.ERR_MSG + "|_|代理连续错误"
                    g_var.logger.info("代理错误")
                    retry_count = g_var.RETRY_COUNT_MAX
                elif registerData == -2:
                    g_var.logger.info("注册失败,可能是邮箱密码不符合要求、或ip被封等原因,请排查!")
                    self.proxy_err_count = self.proxy_err_count + 1
                    proxies = ip_proxy(VPN)
                    if proxies == {"error": -1}:
                        g_var.logger.info("获取代理错误")
                        self.failed_count = self.failed_count + 1
                    Session.proxies = proxies
                elif registerData == 0:
                    # Status 0: take a new mailbox and start the retry
                    # budget over.
                    email_and_passwd = get_email(present_website)
                    if email_and_passwd == -1:
                        retry_count = g_var.RETRY_COUNT_MAX
                        g_var.ERR_MSG = g_var.ERR_MSG + "|_|没有邮箱了"
                        g_var.logger.error("没有邮箱了")
                        continue
                    retry_count = 0
                else:
                    # Registration succeeded.
                    self.failed_count = 0
                    registered = True
                    break
            if not registered:
                # Registration never succeeded, so something is wrong: stop.
                g_var.SPIDER_STATUS = 3
                g_var.ERR_MSG = g_var.ERR_MSG + "|_|连续注册出错,程序停止"
                g_var.logger.error("start:连续注册失败!程序停止")
                break

            # 2. Log in.
            Session = get_Session(VPN)
            if Session == -1:
                self.failed_count = self.failed_count + 1
                continue
            # Build a userInfo row from the registration data.
            g_var.logger.info(registerData)
            userInfo = [
                int(registerData['id']), registerData['username'],
                registerData['password'], registerData['email'], 0,
                str(registerData['cookie'])
            ]

            login_signal = 0  # becomes 1 when the account itself is unusable
            logged_in = False
            retry_count = 0
            while retry_count < g_var.RETRY_COUNT_MAX:
                retry_count = retry_count + 1

                loginData = self.login(Session, present_website, VPN, userInfo)
                if loginData == -1:
                    # Proxy error: force the loop to end.
                    g_var.ERR_MSG = g_var.ERR_MSG + "|_|代理连续错误"
                    g_var.logger.info("代理错误")
                    retry_count = g_var.RETRY_COUNT_MAX
                elif loginData == -2:
                    # Account problem: give up on this account.
                    self.failed_count = self.failed_count + 1
                    login_signal = 1
                    break
                else:
                    self.failed_count = 0
                    self.proxy_err_count = 0
                    logged_in = True
                    break
            if login_signal == 1:
                continue
            if not logged_in:
                g_var.SPIDER_STATUS = 3
                g_var.ERR_MSG = g_var.ERR_MSG + "|_|连续登录出错,程序停止"
                g_var.logger.error("start:连续登录失败!程序停止")
                break

            # 3. Post the article.
            post_settled = False  # True once the loop is left via break
            retry_count = 0
            while retry_count < g_var.RETRY_COUNT_MAX:
                retry_count = retry_count + 1
                status = self.__postMessage(Session, loginData,
                                            present_website)
                if status == 0:  # article posted
                    self.success_count = self.success_count + 1
                    self.failed_count = 0
                    self.proxy_err_count = 0
                    post_settled = True
                    break
                elif status == -1:
                    # Proxy error: force the loop to end.
                    g_var.ERR_MSG = g_var.ERR_MSG + "|_|代理连续错误"
                    g_var.logger.info("代理错误")
                    retry_count = g_var.RETRY_COUNT_MAX
                elif status == -2:
                    # An error that requires the program to stop.
                    self.failed_count = self.failed_count + 1
                    g_var.SPIDER_STATUS = 3
                    post_settled = True
                    break
                elif status == -3:
                    self.failed_count = self.failed_count + 1
                elif status == -4:
                    # Clear the stored cookie for this account.
                    sql = "UPDATE %s SET cookie=null WHERE id=%s ;" % (
                        present_website, loginData["id"])
                    g_var.logger.info(sql)
                    update_status = MysqlHandler().update(sql)
                    if update_status != 0:
                        g_var.logger.error("数据库清除cookie错误!")
                        return {"error": 1}
                    post_settled = True
                    break
            if not post_settled:
                # Posting never settled, so something is wrong: stop.
                g_var.SPIDER_STATUS = 3
                g_var.ERR_MSG = g_var.ERR_MSG + "|_|连续发文章出错,程序停止"
                g_var.logger.error("连续发文章出错,程序停止")
                break
        g_var.logger.info("成功注册账户并发送文章" + str(self.success_count) + "篇")
    def __register_one(self, Session, present_website: str, email_and_passwd):
        """Register one boredpanda.com account, activate it and store it.

        The method signs up with the given mailbox, follows the activation
        link found in the mailbox, writes the account to the database, fills
        in the profile links, makes the profile public and records the
        profile URL in the ``<present_website>_article`` table.

        Args:
            Session: Session object supplied by the caller.
                NOTE(review): it is replaced below by a fresh
                ``requestsW.Session()`` with ``ip_proxy()`` proxies, so the
                caller's session is not used.
            present_website: Current site name, used as the table name.
            email_and_passwd: Mailbox credentials; index 0 is the address,
                index 1 the password.

        Returns:
            On success, a registration dict with the keys ``id``,
            ``username``, ``password``, ``email`` and ``cookie``.
            On failure, a status code. The template this method implements
            defines:
            0: an error that needs a different mailbox (the only code
               returned here);
            -1: repeated proxy errors or a changed page, the program must
                stop;
            -2: registration failed but the mailbox is still usable.
        """
        email = email_and_passwd[0]
        emailpwd = email_and_passwd[1]
        Session = requestsW.Session()
        Session.proxies = ip_proxy()
        ajax_url = "https://www.boredpanda.com/blog/wp-admin/admin-ajax.php"
        headers = {
            "User-Agent": get_user_agent(),
            "referer": "https://www.boredpanda.com/add-new-post/",
            "content-type": "application/x-www-form-urlencoded; charset=UTF-8",
        }
        user = email.split("@")[0]
        pwd = emailpwd

        # Step 1: submit the sign-up form.
        data = {
            "action": "contribution_signup",
            "user_email": email,
            "user_full_name": user,
            "user_pass": pwd,
            "redirect": "https://www.boredpanda.com/add-new-post/"
        }
        res = Session.post(ajax_url, proxies=Session.proxies, data=data)
        if 'user_id' not in res.text:
            g_var.ERR_MSG = g_var.ERR_MSG + "|_|发送邮箱,注册失败"
            g_var.logger.info("|_|发送邮箱,注册失败")
            return 0

        # Step 2: fetch the activation link from the mailbox and open it.
        # TODO: new e-mail method
        # Raw string: the pattern contains regex escapes (\w, \?).
        res = EmailVerify(
            username=email,
            password=emailpwd,
            re_text=
            r'Click .{0,50} href="(http://\w{5,15}.ct.sendgrid.net/ls/click\?upn=.{300,600})">here</a>'
        ).execute_Start()
        if res == -1:
            g_var.ERR_MSG = g_var.ERR_MSG + "|_|邮箱激活失败"
            g_var.logger.info("|_|邮箱激活失败")
            return 0
        res = Session.get(res["data"], headers=headers)
        if "boredpanda_auth" not in Session.cookies.get_dict():
            g_var.ERR_MSG = g_var.ERR_MSG + "|_|邮箱获取链接后,请求失败"
            g_var.logger.info("|_|邮箱获取链接后,请求失败")
            return 0

        # Step 3: store the account.
        # NOTE(review): the statement is assembled by string formatting;
        # switch to a parameterized query if MysqlHandler supports one.
        sql = """INSERT INTO %s (username, password, mail, status, cookie) VALUES("%s", "%s", "%s", "%s", "%s");""" % (
            present_website, user, pwd, email_and_passwd[0], 0,
            str(Session.cookies.get_dict()))
        g_var.logger.info(sql)
        user_id = MysqlHandler().insert(sql)
        if user_id == -1:
            g_var.ERR_MSG = g_var.ERR_MSG + "|_|数据库插入失败"
            g_var.logger.info("|_|数据库插入失败")
            return 0

        # Step 4: put the promoted title/link into the profile.
        tlList = get_new_title_and_link()
        title, url = tlList[0], tlList[1]
        data = {
            "action": "save_settings_form",
            "settingsDisplay": title,
            "settingsWebsite": url,
            "settingsFacebook": url,
            "settingsTwitter": url,
            "settingsFlickr": url,
            "settingsSlack": "",
            "settingsBio": title,
            "settingsAdminBox": ""
        }
        res = Session.post(ajax_url,
                           proxies=Session.proxies,
                           headers=headers,
                           data=data)
        if "success" not in res.text:
            g_var.ERR_MSG = g_var.ERR_MSG + "|_|修改个人链接,请求失败"
            g_var.logger.info("|_|修改个人链接,请求失败")
            return 0

        # Step 5: make the profile publicly visible.
        data = {
            "action": "save_privacy_settings_form",
            "allowContactMe": "true",
            "ninjaPanda": "false",
        }
        res = Session.post(ajax_url,
                           headers=headers,
                           proxies=Session.proxies,
                           data=data)
        if "success" not in res.text:
            g_var.ERR_MSG = g_var.ERR_MSG + "|_|允许个人资料访问,请求失败"
            g_var.logger.info("|_|允许个人资料访问,请求失败")
            return 0

        # Step 6: record the profile URL. The lock is released on every
        # path; leaving it held would block every later acquire.
        sql = "INSERT INTO %s_article(url, keyword, user_id) VALUES('%s', '%s', '%s');" % (
            present_website, "https://www.boredpanda.com/author/%s/" % user,
            title, user_id)
        g_var.insert_article_lock.acquire()
        try:
            article_row_id = MysqlHandler().insert(sql)
        finally:
            g_var.insert_article_lock.release()
        if article_row_id == -1:
            g_var.ERR_MSG = g_var.ERR_MSG + "|_|MYSQL插入文章失败"
            g_var.logger.info("|_|MYSQL插入文章失败")
            return 0

        # Hand the account back to the caller, which reads these five keys.
        return {
            "id": user_id,
            "username": user,
            "password": pwd,
            "email": email,
            "cookie": Session.cookies.get_dict(),
        }
Пример #28
0
    def loginAndPostMessage(self, VPN: str):
        """Log stored reddit_com accounts in and post until the quota is met.

        Every outer round builds a session with a fresh proxy, logs an
        account in (taking another account or proxy on failure) and posts
        one article. The loop ends when ``self.success_count`` reaches
        ``self.assignment_num``, when ``self.__monitor_status()`` returns -1,
        or when a step fails on every one of its ``g_var.RETRY_COUNT_MAX``
        attempts.

        Args:
            VPN: Proxy selector handed to ``ip_proxy``.

        Returns:
            ``{"error": -1}`` when no account could be loaded from the
            database, otherwise None.
        """
        while self.success_count < self.assignment_num:
            # Check the current error state at the start of every round.
            if self.__monitor_status() == -1:
                break
            self.now_count = self.now_count + 1

            Session = requests.Session()
            # Fetch the proxy settings.
            proxies = ip_proxy(VPN)
            if proxies == {"error": -1}:
                self.failed_count = self.failed_count + 1
                continue

            Session.proxies = proxies
            Session.mount('http://', HTTPAdapter(max_retries=1))
            Session.mount('https://', HTTPAdapter(max_retries=1))

            # 1. Log in.
            # The outcome is tracked with a flag: comparing retry_count with
            # the maximum would misread a success on the final attempt as
            # "all attempts failed".
            logged_in = False
            retry_count = 0
            while retry_count < g_var.RETRY_COUNT_MAX:
                retry_count = retry_count + 1
                # Load one account from the database.
                userInfo = generate_login_data("reddit_com")
                if userInfo is None:
                    g_var.logger.error("数据库中获取用户失败,本线程停止!")
                    return {"error": -1}

                loginData = self.__login(Session, VPN, userInfo)
                if loginData == {"error": -1}:
                    # Login raised an error: switch proxy and retry.
                    g_var.ERR_MSG = "登录出错"
                    self.failed_count = self.failed_count + 1
                    time.sleep(g_var.SLEEP_TIME)
                    proxies = ip_proxy(VPN)
                    Session.proxies = proxies
                    continue
                elif loginData == {"error": 1}:
                    # Account problem: retry with another account.
                    self.failed_count = self.failed_count + 1
                    continue
                else:
                    self.failed_count = 0
                    self.proxy_err_count = 0
                    logged_in = True
                    break
            if not logged_in:
                # Every attempt failed, so something is wrong: stop.
                g_var.SPIDER_STATUS = 3
                g_var.ERR_MSG = "连续登录出错,程序停止"
                g_var.logger.error("login:连续登录失败!程序停止")
                break

            # 2. Post the article.
            post_settled = False  # True once the loop is left via break
            retry_count = 0
            while retry_count < g_var.RETRY_COUNT_MAX:
                retry_count = retry_count + 1
                status = self.__postMessage(Session, loginData)
                if status == {"ok": 0}:  # article posted
                    self.success_count = self.success_count + 1
                    self.failed_count = 0
                    self.proxy_err_count = 0
                    post_settled = True
                    break
                elif status == {"error": 1}:
                    # Switch proxy and retry.
                    self.failed_count = self.failed_count + 1
                    self.proxy_err_count = self.proxy_err_count + 1
                    time.sleep(g_var.SLEEP_TIME)
                    proxies = ip_proxy(VPN)
                    Session.proxies = proxies
                elif status == {"error": -1}:
                    # No article available: leave the posting loop.
                    self.failed_count = self.failed_count + 1
                    post_settled = True
                    break
            if not post_settled:
                # Every attempt failed, so something is wrong: stop.
                g_var.SPIDER_STATUS = 3
                g_var.ERR_MSG = "连续发文章出错,程序停止"
                g_var.logger.error("连续发文章出错,程序停止")
                break
        g_var.logger.info("成功发送" + str(self.success_count) + "篇文章")
Пример #29
0
    def loginAndPostMessage(self, present_website, VPN):
        """Log stored accounts in and post links until the quota is met.

        Every outer round logs an account in (taking another account on
        failure) and posts one link. The loop ends when
        ``self.success_count`` reaches ``self.assignment_num``, when
        ``self.__monitor_status()`` returns -1, or when a step fails on
        every one of its ``g_var.RETRY_COUNT_MAX`` attempts.

        Args:
            present_website: Site name handed to ``generate_login_data``.
            VPN: Proxy selector handed to ``self.__login`` and ``ip_proxy``.

        Returns:
            ``{"error": -1}`` when no account could be loaded from the
            database, otherwise None.
        """
        while self.success_count < self.assignment_num:
            # Check the current error state at the start of every round.
            if self.__monitor_status() == -1:
                break
            self.now_count = self.now_count + 1

            # 1. Log in.
            # The outcome is tracked with a flag: comparing retry_count with
            # the maximum would misread a success on the final attempt as
            # "all attempts failed".
            logged_in = False
            retry_count = 0
            while retry_count < g_var.RETRY_COUNT_MAX:
                retry_count = retry_count + 1
                # Load one account from the database.
                userInfo = generate_login_data(present_website)
                g_var.logger.error('...userInfo...')
                g_var.logger.error(userInfo)
                if userInfo is None:
                    g_var.logger.error("数据库中获取用户失败,本线程停止!")
                    return {"error": -1}

                loginData = self.__login(VPN, userInfo)
                if loginData == -1:
                    # Login raised an error: switch proxy and retry.
                    g_var.logger.error("登录出错,更换代理。。。")
                    g_var.ERR_MSG = "登录出错"
                    self.failed_count = self.failed_count + 1
                    time.sleep(g_var.SLEEP_TIME)
                    proxies = ip_proxy(VPN)
                    # NOTE(review): `Session` is not bound anywhere in this
                    # method; unless a module-level `Session` exists this
                    # line raises NameError. Confirm and rework.
                    Session.proxies = proxies
                    continue
                elif loginData == 1:
                    # Account problem: retry with another account.
                    self.failed_count = self.failed_count + 1
                    continue
                else:
                    self.failed_count = 0
                    self.proxy_err_count = 0
                    logged_in = True
                    break
            if not logged_in:
                # Every attempt failed, so something is wrong: stop.
                g_var.SPIDER_STATUS = 3
                # This is the login step, so the message names login rather
                # than registration.
                g_var.ERR_MSG = g_var.ERR_MSG + "|_|连续登录出错,程序停止"
                g_var.logger.error("login:连续登录失败!程序停止")
                break

            # 2. Post the link.
            post_settled = False  # True once the loop is left via break
            retry_count = 0
            while retry_count < g_var.RETRY_COUNT_MAX:
                retry_count = retry_count + 1
                status = self.__postMessage(loginData)
                if status == 0:  # link posted
                    self.success_count = self.success_count + 1
                    self.failed_count = 0
                    self.proxy_err_count = 0
                    post_settled = True
                    break
                elif status == 1:
                    # Switch proxy and retry.
                    self.failed_count = self.failed_count + 1
                    self.proxy_err_count = self.proxy_err_count + 1
                    time.sleep(g_var.SLEEP_TIME)
                    proxies = ip_proxy(VPN)
                    # NOTE(review): `Session` is not bound in this method
                    # (see the login step above).
                    Session.proxies = proxies
                elif status == -1:
                    # No link available: leave the posting loop.
                    self.failed_count = self.failed_count + 1
                    post_settled = True
                    break
            if not post_settled:
                # Every attempt failed, so something is wrong: stop.
                g_var.SPIDER_STATUS = 3
                g_var.ERR_MSG = "连续发文章出错,程序停止"
                g_var.logger.error("连续发文章出错,程序停止")
                break
        g_var.logger.info("成功发送" + str(self.success_count) + "个链接")
def register_test():
    """Manually exercise the boredpanda.com sign-up flow with a fixed mailbox.

    Steps: submit the sign-up form, read the activation link from the
    mailbox via ``EmailVerify``, open it, save profile settings, then save
    privacy settings. Intermediate responses are printed for inspection.

    Returns:
        A short status string naming the first step that failed. In the
        visible code the success path ends with a print and no explicit
        return.
    """
    # Hard-coded test mailbox credentials.
    email = "*****@*****.**"
    emailpwd = "dqS72ijG"
    Session = requestsW.Session()
    Session.proxies = ip_proxy()
    print(Session.proxies)
    headers = {
        "User-Agent":
        "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_4) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/81.0.4044.129 Safari/537.36"
    }
    # headers["x-requested-with"] = "XMLHttpRequest"
    headers["referer"] = "https://www.boredpanda.com/add-new-post/"
    headers[
        "content-type"] = "application/x-www-form-urlencoded; charset=UTF-8"
    # The local part of the address doubles as the user's full name.
    user = email.split("@")[0]
    pwd = emailpwd

    # Step 1: submit the sign-up form.
    data = {
        "action": "contribution_signup",
        "user_email": email,
        "user_full_name": user,
        "user_pass": pwd,
        "redirect": "https://www.boredpanda.com/add-new-post/"
    }
    res = Session.post(
        "https://www.boredpanda.com/blog/wp-admin/admin-ajax.php",
        proxies=Session.proxies,
        data=data)
    print(res.text)
    # The response is expected to mention 'user_id' when sign-up worked.
    if 'user_id' not in res.text:
        return "注册失败"
    # TODO: new e-mail method
    # Step 2: pull the activation link out of the mailbox and open it.
    res = EmailVerify(
        username=email,
        password=emailpwd,
        re_text=
        'Click .{0,50} href="(http://\w{5,15}.ct.sendgrid.net/ls/click\?upn=.{300,600})">here</a>'
    ).execute_Start()
    if res == -1:
        return "获取邮箱失败"
    res = Session.get(res["data"], headers=headers)
    print(Session.cookies.get_dict())
    print(res.text)  # site user marker: <a href=".*?">My Profile</a>

    # The session must hold a 'boredpanda_auth' cookie after activation.
    if "boredpanda_auth" not in Session.cookies.get_dict():
        return "未打开注册页面,重新注册"
    print("已经打开注册")
    # Step 3: save the profile settings with a placeholder link.
    url = "https://www.baidu.com"
    data = {
        "action": "save_settings_form",
        "settingsDisplay": user,
        "settingsWebsite": url,
        "settingsFacebook": url,
        "settingsTwitter": url,
        "settingsFlickr": url,
        "settingsSlack": "",
        "settingsBio": "这里是我的个人啊12323",
        "settingsAdminBox": ""
    }

    res = Session.post(
        "https://www.boredpanda.com/blog/wp-admin/admin-ajax.php",
        proxies=Session.proxies,
        headers=headers,
        data=data)
    # NOTE(review): `success` is assigned but not read in the visible code.
    success = 0
    if "success" not in res.text:
        return "修改个人资料失败"

    print("修改个人资料:", res.text)  # {"success":"1"}

    # Step 4: save the privacy settings.
    data = {
        "action": "save_privacy_settings_form",
        "allowContactMe": "true",
        "ninjaPanda": "false",
    }
    # proxies=ip_proxy()
    res = Session.post(
        "https://www.boredpanda.com/blog/wp-admin/admin-ajax.php",
        headers=headers,
        proxies=Session.proxies,
        data=data)
    if "success" not in res.text:
        return "修改可见失败"

    # Print the public profile URL of the new account.
    print("https://www.boredpanda.com/author/%s/" % user)