示例#1
0
 def insert_item(self, item):
     """Store one crawled position unless it was already stored today.

     A row counts as a duplicate when a ``Lagoutables`` record with the same
     ``positionID`` and today's ``crawl_date`` already exists.

     Args:
         item: Object subscriptable by the string keys read below
             (``positionId``, ``longitude``, ``latitude``, ``positionName``,
             ``workYear``, ``education``, ``jobNature``, ``financeStage``,
             ``companySize``, ``industryField``, ``city``,
             ``positionAdvantage``, ``companyShortName``,
             ``companyFullName``, ``district``, ``companyLabelList``,
             ``salary``). ``companyLabelList`` must be an iterable of
             strings because it is joined with ``','``.

     Raises:
         Exception: Whatever ``add()``/``commit()`` raised; the session is
             rolled back first so later calls can keep using it.
     """
     # Local date, formatted YYYY-MM-DD; used both as the stored crawl date
     # and as part of the duplicate check.
     date = time.strftime("%Y-%m-%d", time.localtime())

     # Built before the lookup on purpose: an item with a missing key fails
     # here, before any database work is attempted.
     # NOTE(review): ','.join raises TypeError if companyLabelList is None -
     # confirm the upstream data always supplies a list.
     data = Lagoutables(
         positionID=item['positionId'],
         longitude=item['longitude'],
         latitude=item['latitude'],
         positionName=item['positionName'],
         workYear=item['workYear'],
         education=item['education'],
         jobNature=item['jobNature'],
         financeStage=item['financeStage'],
         companySize=item['companySize'],
         industryField=item['industryField'],
         city=item['city'],
         positionAdvantage=item['positionAdvantage'],
         companyShortName=item['companyShortName'],
         companyFullName=item['companyFullName'],
         district=item['district'],
         companyLabelList=','.join(item['companyLabelList']),
         salary=item['salary'],
         crawl_date=date,
     )

     # Has this position already been recorded today?
     query_result = (
         self.mysql_session.query(Lagoutables)
         .filter(
             Lagoutables.crawl_date == date,
             Lagoutables.positionID == item["positionId"],
         )
         .first()
     )
     if query_result:
         print("该岗位信息已存在%s:%s:%s" % (item["positionId"], item["city"], item["positionName"]))
         return

     # assumes self.mysql_session is a SQLAlchemy Session (it is used through
     # query/filter/first/add/commit) - TODO confirm. A failed commit must be
     # rolled back, otherwise the session stays in a failed transaction and
     # every later insert on it fails as well.
     try:
         self.mysql_session.add(data)
         self.mysql_session.commit()
     except Exception:
         self.mysql_session.rollback()
         raise
     print("新增岗位信息%s" % item["positionId"])
示例#2
0
    def insert_item(self, item):
        """Store one crawled position unless it was already stored today.

        A row counts as a duplicate when a ``Lagoutables`` record with the
        same ``positionID`` and today's ``crawl_date`` already exists;
        duplicates are skipped silently.

        Args:
            item: Object subscriptable by the string keys read below.
                ``companyLabelList`` must be an iterable of strings because
                it is joined with ``','``.

        Raises:
            Exception: Whatever ``add()``/``commit()`` raised; the session
                is rolled back first so later calls can keep using it.
        """
        # Today's local date (YYYY-MM-DD).
        date = time.strftime("%Y-%m-%d", time.localtime())

        # Row to store. Built before the lookup on purpose: an item with a
        # missing key fails here, before any database work is attempted.
        # NOTE(review): ','.join raises TypeError if companyLabelList is
        # None - confirm the upstream data always supplies a list.
        data = Lagoutables(
            # Position ID
            positionID=item['positionId'],
            # Longitude
            longitude=item['longitude'],
            # Latitude
            latitude=item['latitude'],
            # Position name
            positionName=item['positionName'],
            # Years of work experience
            workYear=item['workYear'],
            # Education level
            education=item['education'],
            # Job nature
            jobNature=item['jobNature'],
            # Company type
            financeStage=item['financeStage'],
            # Company size
            companySize=item['companySize'],
            # Business field
            industryField=item['industryField'],
            # City
            city=item['city'],
            # Position tags
            positionAdvantage=item['positionAdvantage'],
            # Company short name
            companyShortName=item['companyShortName'],
            # Company full name
            companyFullName=item['companyFullName'],
            # District the company is located in
            district=item['district'],
            # Company benefit labels, stored comma-separated
            companyLabelList=','.join(item['companyLabelList']),
            salary=item['salary'],
            # Crawl date
            crawl_date=date,
        )

        # Before storing, check whether the table already holds this
        # position for today.
        query_result = (
            self.mysql_session.query(Lagoutables)
            .filter(
                Lagoutables.crawl_date == date,
                Lagoutables.positionID == item['positionId'],
            )
            .first()
        )
        if query_result:
            # Already stored today: nothing to do.
            return

        # assumes self.mysql_session is a SQLAlchemy Session (it is used
        # through query/filter/first/add/commit) - TODO confirm. A failed
        # commit must be rolled back, otherwise the session stays in a
        # failed transaction and every later insert on it fails as well.
        try:
            # Stage the row and write it to the database.
            self.mysql_session.add(data)
            self.mysql_session.commit()
        except Exception:
            self.mysql_session.rollback()
            raise
示例#3
0
    def insert_item(self, item):
        """Store one crawled position unless it was already stored today.

        A row counts as a duplicate when a ``Lagoutables`` record with the
        same ``positionId``, the tag ``KD`` and today's ``crawl_date``
        already exists.

        Args:
            item: Object subscriptable by the string keys read below.
                ``companyLabelList`` must be an iterable of strings because
                it is joined with ``','``.

        Raises:
            Exception: Whatever ``add()``/``commit()`` raised; the session
                is rolled back first so later calls can keep using it.
        """
        # Today's local date (YYYY-MM-DD).
        date = time.strftime("%Y-%m-%d", time.localtime())

        # Row to store. Built before the lookup on purpose: an item with a
        # missing key fails here, before any database work is attempted.
        # NOTE(review): ','.join raises TypeError if companyLabelList is
        # None - confirm the upstream data always supplies a list.
        data = Lagoutables(
            positionId=item['positionId'],
            longitude=item['longitude'],
            latitude=item['latitude'],
            positionName=item['positionName'],
            workYear=item['workYear'],
            education=item['education'],
            jobNature=item['jobNature'],
            financeStage=item['financeStage'],
            companySize=item['companySize'],
            industryField=item['industryField'],
            city=item['city'],
            positionAdvantage=item['positionAdvantage'],
            companyShortName=item['companyShortName'],
            companyFullName=item['companyFullName'],
            district=item['district'],
            companyLabelList=','.join(item['companyLabelList']),
            salary=item['salary'],
            crawl_date=date,
            # KD is defined outside this method; presumably the search
            # keyword for this crawl - verify against its definition.
            tag=KD,
        )

        # Before storing, check whether this position was already recorded
        # today under the same tag.
        query_result = (
            self.mysql_session.query(Lagoutables)
            .filter(
                Lagoutables.crawl_date == date,
                Lagoutables.tag == KD,
                Lagoutables.positionId == item['positionId'],
            )
            .first()
        )
        if query_result:
            print('该岗位信息已存在%s:%s:%s' %
                  (item['positionId'], item['city'], item['positionName']))
            return

        # assumes self.mysql_session is a SQLAlchemy Session (it is used
        # through query/filter/first/add/commit) - TODO confirm. A failed
        # commit must be rolled back, otherwise the session stays in a
        # failed transaction and every later insert on it fails as well.
        try:
            # Stage the row and write it to the database.
            self.mysql_session.add(data)
            self.mysql_session.commit()
        except Exception:
            self.mysql_session.rollback()
            raise
        print('新增岗位信息%s' % item['positionId'])