コード例 #1
0
ファイル: scraper.py プロジェクト: jgmc3012/dashboard_go_shop
    def scan_product(self, list_ids):
        path = '/items'
        params = [{
            'ids': ids,
            'attributes': 'id,pictures',
        } for ids in self.split_ids(list_ids)]
        results = self.map_pool_get([path] * len(params), params)

        products_draw = {
            product['body']['id']: product
            for product in results if product.get('body')
        }
        products = Product.objects.filter(
            provider_sku__in=products_draw.keys(), available=True)
        product_with_img = Picture.objects.filter(
            product__in=products).values_list('product', flat=True)
        if product_with_img:
            products = products.exclude(id__in=product_with_img)

        bulk_mgr = BulkCreateManager(250)
        for product in products:
            sku = product.provider_sku
            if not products_draw[sku].get('body'):
                logging.getLogger('log_three').warning(
                    f'Error en la peticion de {product}. Res: {products_draw[sku]}'
                )
                continue
            elif not products_draw[sku]['body'].get('pictures'):
                logging.getLogger('log_three').warning(
                    f'Al producto {product} no se le encontraron imagenes')
                continue

            for image in products_draw[sku]['body']['pictures']:
                if 'resources/frontend/statics/processing' in image[
                        'secure_url']:
                    logging.getLogger('log_three').warning(
                        'Imagen [Procesando por Meli]')
                    continue
                picture = Picture(src=image['secure_url'], product=product)
                bulk_mgr.add(picture)
        bulk_mgr.done()
コード例 #2
0
ファイル: scraper.py プロジェクト: jgmc3012/dashboard_go_shop
    def scan_for_seller(self, seller_id):
        params = {'seller_id': seller_id}
        result = self.get(self.path, params)
        if not result:
            return []
        total = result['paging'][
            'total'] if result['paging']['total'] <= 1000 else 1000
        limit = result['paging']['limit']
        seller_draw = result['seller']
        products_draw = result['results']

        seller = Seller.objects.get(id=seller_draw['id'])
        seller.nickname = seller_draw['nickname']
        seller.save()

        list_params = [{
            'seller_id': seller_id,
            'offset': offset,
            'limit': 50,
            'attributes': 'results'
        } for offset in range(limit, total, limit)]
        products_api = self.map_pool_get(paths=[self.path] * len(list_params),
                                         params=list_params)

        for product in products_api:
            products_draw += product['results']

        categories = ScraperCategory()

        BM = BusinessModel.objects.get(pk=self.SELLER_ID)
        bulk_mgr = BulkCreateManager()

        ids_products = list()
        for product_ in products_draw:
            if ((not product_['shipping']['free_shipping'])
                    or (not product_['condition'] == 'new')):
                continue

            elif (not int(product_['category_id'][3:]) in categories.ids):
                categories.update(product_['category_id'])

            category_id = int(product_['category_id'][3:])
            category_father_id = categories.array[category_id].father
            if not categories.array[category_father_id].approved:
                continue

            cost_price = ceil(product_['price'] / BM.trm)
            sales_cost = ceil((cost_price + BM.shipping_vzla) *
                              (1 + BM.meli_tax / 100) * (1 + BM.utility / 100))
            key_category = category_father_id
            product = Product.objects.get_or_create(
                seller=seller,
                title=product_['title'],
                cost_price=cost_price,
                sale_price=sales_cost,
                provider_sku=product_['id'],
                provider_link=product_['permalink'],
                image=product_['thumbnail'].replace('http', 'https'),
                category=categories.array[key_category],
                quantity=product_['initial_quantity'])
            if product[1]:
                product = product[0]
                ids_products.append(product_['id'])
                for _attribute in product_['attributes']:
                    if _attribute['value_name'] and (350 < len(
                            _attribute['value_name'])):
                        bulk_mgr.add(
                            Attribute(id_meli=_attribute['id'],
                                      value=_attribute['value_name'],
                                      value_id=_attribute.get('value_id'),
                                      product=product))
        bulk_mgr.done()
        return self.scan_product(ids_products)
コード例 #3
0
ファイル: scraper.py プロジェクト: jgmc3012/dashboard_go_shop
    def new_products(self, ids: list, business):
        products = self.get(path=f'/items',
                            params={
                                'ids': ids,
                                'include_internal_attributes': True
                            },
                            auth=True)

        bulk_mgr = BulkCreateManager(200)
        categories = ScraperCategory()
        count_products = 0
        logging.getLogger('log_three').info(f'scaneando 20 productos')
        for _product in products:
            if not _product['body'].get('id'):
                continue

            _product_ = _product['body']
            sku = _product_.get('seller_custom_field')
            if not sku:
                logging.getLogger('log_three').info(f'No se encontro el sku')
                continue

            product = Product.objects.filter(provider_sku=sku).first()
            if not product:
                category_id = int(_product_['category_id'][3:])
                if (not category_id in categories.ids):
                    categories.update(_product_['category_id'])

                product = Product.objects.create(
                    seller=None,
                    title=_product_['title'],
                    cost_price=0,
                    ship_price=0,
                    description=_product_['descriptions'][0].get('id'),
                    provider_sku=sku,
                    provider_link=f"https://www.amazon.com/-/es/dp/{sku}?psc=1",
                    image=_product_['secure_thumbnail'],
                    quantity=0)
                for _attribute in _product_['attributes']:
                    if _attribute['value_name'] and (100 > len(
                            _attribute['value_name'])):
                        bulk_mgr.add(
                            Attribute(
                                id_meli=_attribute['id'],
                                value=_attribute['value_name'],
                                value_id=_attribute.get('value_id'),
                                product=product,
                            ))
                for image in _product_['pictures']:
                    if 'resources/frontend/statics/processing' in image[
                            'secure_url']:
                        continue
                    picture = Picture(src=image['secure_url'], product=product)
                    bulk_mgr.add(picture)
            else:
                logging.getLogger('log_three').info(
                    f'Producto {sku} Ya existente')

            bulk_mgr.add(
                ProductForStore(store=business,
                                product=product,
                                sale_price=0,
                                sku=_product_['id'],
                                category=categories.array[category_id]))
            count_products += 1
        bulk_mgr.done()
        logging.getLogger('log_three').info(
            f'{count_products} Productos sincronizados')
コード例 #4
0
ファイル: scraper.py プロジェクト: jgmc3012/dashboard_go_shop
    def scan_for_category(self, category):
        params = {
            'offset': 0,
            'sort': 'relevance',
            'shipping': 'mercadoenvios',
            'power_seller': 'yes',
            'has_pictures': 'yes',
            'shipping_cost': 'free',
            'ITEM_CONDITION': 2230284,
            'category': f'MCO{category.id}'
        }

        result_draw = self.get(self.path, params)

        result = self.get(self.path, params)
        if not result:
            return []
        total = result['paging'][
            'total'] if result['paging']['total'] <= 10_000 else 10_000
        limit = result['paging']['limit']
        products_draw = result['results']

        list_params = [{
            'offset': offset,
            'sort': 'relevance',
            'shipping': 'mercadoenvios',
            'power_seller': 'yes',
            'has_pictures': 'yes',
            'shipping_cost': 'free',
            'ITEM_CONDITION': 2230284,
            'category': f'MCO{category.id}',
            'attribute': 'results'
        } for offset in range(limit, total, limit)]

        logging.getLogger('log_three').info(f'Scrapeando {total} productos')
        products_api = self.map_pool_get(paths=[self.path] * len(list_params),
                                         params=list_params,
                                         auths=[True] * len(list_params))

        for product in products_api:
            products_draw += product['results']

        BM = BusinessModel.objects.get(pk=self.SELLER_ID)
        bulk_mgr = BulkCreateManager(200)

        ids_products = list()
        sellers = ScraperSeller()
        bad_sellers = Seller.objects.filter(bad_seller=True).values_list(
            'id', flat=True)
        for product_ in products_draw:
            seller_id = int(product_['seller']['id'])
            if seller_id in bad_sellers:
                continue
            elif seller_id not in sellers.ids:
                sellers.update(seller_id)

            cost_price = ceil(product_['price'] / BM.trm)
            sales_cost = ceil((cost_price + BM.shipping_vzla) *
                              (1 + BM.meli_tax / 100) * (1 + BM.utility / 100))
            product = Product.objects.filter(
                provider_sku=product_['id']).first()
            if not product:
                product = Product.objects.create(
                    seller=sellers.array[seller_id],
                    title=product_['title'],
                    cost_price=cost_price,
                    sale_price=sales_cost,
                    provider_sku=product_['id'],
                    provider_link=product_['permalink'],
                    image=product_['thumbnail'].replace('http', 'https'),
                    category=category,
                    quantity=product_['available_quantity'])
                for _attribute in product_['attributes']:
                    if _attribute['value_name'] and (350 < len(
                            _attribute['value_name'])):
                        bulk_mgr.add(
                            Attribute(id_meli=_attribute['id'],
                                      value=_attribute['value_name'],
                                      value_id=_attribute.get('value_id'),
                                      product=product))

            ids_products.append(product_['id'])

        bulk_mgr.done()
        return self.scan_product(ids_products)