Python scrape 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: scrape_schema_recipe

메소드/함수: scrape

hotexamples.com에서의 예제들: 14

Python scrape 예제 14개를 찾았습니다. 아래는 오픈소스 프로젝트에서 추출한, Python의 scrape_schema_recipe.scrape 실제 사용 예제 가운데 평가가 가장 높은 것들입니다. 예제를 평가해 주시면 예제 품질을 높이는 데 도움이 됩니다.

예제 #1

파일 보기

        def preparse(self):
            """Collect pre-parsed elements from the recipe data scraped out of ``self.text``.

            Runs ``scrape_schema_recipe.scrape`` on ``self.text`` and, for every
            key of ``self.schema_org_mappings`` found in the first scraped
            recipe, appends ``(text, output_key)`` tuples to
            ``self.preparsed_elements``: strings as they are, lists entry by
            entry, and ``timedelta`` values rendered as ``"N h"`` (whole hours)
            or ``"N min"`` (anything else). Values of other types are ignored.

            Delegates to ``BaseParser.preparse`` when the scrape yields nothing
            or when no element was collected; otherwise sets
            ``self.ignore_unparsed`` to ``True``.
            """
            self.preparsed_elements = []
            self.data = scrape_schema_recipe.scrape(self.text,
                                                    python_objects=True)

            # Nothing scraped: let the base parser handle the text.
            if not self.data:
                BaseParser.preparse(self)
                return

            # Only the first scraped recipe is used.
            recipe = self.data[0]
            self.recipe = recipe

            for schema_key, output_key in self.schema_org_mappings.items():
                if schema_key not in recipe:
                    continue

                value = recipe[schema_key]
                if isinstance(value, str):
                    self.preparsed_elements.append((value, output_key))
                elif isinstance(value, list):
                    self.preparsed_elements.extend(
                        (entry, output_key) for entry in value)
                elif isinstance(value, timedelta):
                    whole_minutes = int(value.total_seconds() // 60)
                    hours, leftover = divmod(whole_minutes, 60)
                    if leftover:
                        # Not full hours: report the duration in minutes.
                        text = "{} min".format(whole_minutes)
                    else:
                        # Full hours.
                        text = "{} h".format(hours)
                    self.preparsed_elements.append((text, output_key))

            # Nothing usable was mapped: fall back to the base parser.
            if not self.preparsed_elements:
                BaseParser.preparse(self)
                return

            self.ignore_unparsed = True

예제 #2

파일 보기

    def test_recipe2(self):
        """Check the keys of the first recipe scraped from the truffles fixture.

        The fixture is scraped with ``python_objects=True`` and
        ``migrate_old_schema=False``; the resulting keys are compared to the
        expected ones through ``lists_are_equal``.
        """
        expected_keys = [
            "prepTime",
            "cookTime",
            "name",
            "recipeYield",
            "recipeCategory",
            "image",
            "description",
            "@type",
            "author",
            "aggregateRating",
            "ingredients",
            "recipeInstructions",
            "totalTime",
            "@context",
        ]

        first_recipe = scrape(
            f"{DATA_PATH}/sweetestkitchen-truffles.html",
            python_objects=True,
            migrate_old_schema=False,
        )[0]

        assert lists_are_equal(expected_keys, list(first_recipe.keys()))

예제 #3

파일 보기

파일: test_scrape.py 프로젝트: squareinc/scrape-schema-recipe

    def test_recipe2(self):
        """Check the keys of the first recipe scraped from the truffles fixture.

        The fixture is scraped with ``python_objects=True`` and
        ``migrate_old_schema=False``; the resulting keys are compared to the
        expected ones through ``lists_are_equal``.
        """
        expected_keys = [
            'prepTime', 'cookTime', 'name', 'recipeYield',
            'recipeCategory', 'image', 'description', '@type',
            'author', 'aggregateRating', 'ingredients',
            'recipeInstructions', 'totalTime', '@context',
        ]

        first_recipe = scrape('test_data/sweetestkitchen-truffles.html',
                              python_objects=True,
                              migrate_old_schema=False)[0]

        assert lists_are_equal(expected_keys, list(first_recipe.keys()))

예제 #4

파일 보기

 def setUpClass(cls):
     """Scrape the allrecipes-moscow-mule.html fixture and store the results on the class."""
     fixture = f"{DATA_PATH}/allrecipes-moscow-mule.html"
     scraped = scrape(fixture, python_objects=True)
     cls.recipes = scraped
     # The first scraped recipe is kept separately as ``cls.recipe``.
     cls.recipe = scraped[0]

예제 #5

파일 보기

 def test_scrape(self):
     """Scrape ``self.url`` and check that the first recipe is named "Irish Coffee"."""
     scraped = scrape(self.url)
     self.recipes = scraped
     first_recipe = scraped[0]
     self.recipe = first_recipe
     assert first_recipe["name"] == "Irish Coffee"

예제 #6

파일 보기

 def test_scrape(self):
     """``scrape`` must raise ``SSRTypeError`` when it is handed an integer."""
     self.assertRaises(SSRTypeError, scrape, 0xBEE)

예제 #7

파일 보기

 def setUpClass(cls):
     """Scrape the crumb-lemon-tea-cakes-2018.html fixture and store the results on the class."""
     fixture = f"{DATA_PATH}/crumb-lemon-tea-cakes-2018.html"
     scraped = scrape(fixture, python_objects=True)
     cls.recipes = scraped
     # The first scraped recipe is kept separately as ``cls.recipe``.
     cls.recipe = scraped[0]

예제 #8

파일 보기

 def setUpClass(cls):
     """Scrape the bevvy-irish-coffee-2018.html fixture and store the results on the class."""
     fixture = f"{DATA_PATH}/bevvy-irish-coffee-2018.html"
     scraped = scrape(fixture)
     cls.recipes = scraped
     # The first scraped recipe is kept separately as ``cls.recipe``.
     cls.recipe = scraped[0]

예제 #9

파일 보기

 def setUpClass(cls):
     """Scrape the sweetestkitchen-truffles.html fixture and store the results on the class."""
     fixture = f"{DATA_PATH}/sweetestkitchen-truffles.html"
     scraped = scrape(fixture, python_objects=True)
     cls.recipes = scraped
     # The first scraped recipe is kept separately as ``cls.recipe``.
     cls.recipe = scraped[0]

예제 #10

파일 보기

파일: test_scrape.py 프로젝트: throttleup/scrape-schema-recipe

 def setUpClass(cls):
     """Scrape the sweetestkitchen-truffles.html test file and store the results on the class."""
     scraped = scrape(
         'test_data/sweetestkitchen-truffles.html',
         python_objects=True,
     )
     cls.recipes = scraped
     # The first scraped recipe is kept separately as ``cls.recipe``.
     cls.recipe = scraped[0]

예제 #11

파일 보기

파일: test_scrape.py 프로젝트: throttleup/scrape-schema-recipe

 def test_scrape(self):
     """Scrape ``self.url`` and check that the first recipe is named 'Irish Coffee'."""
     scraped = scrape(self.url)
     self.recipes = scraped
     first_recipe = scraped[0]
     self.recipe = first_recipe
     assert first_recipe['name'] == 'Irish Coffee'

예제 #12

파일 보기

파일: test_scrape.py 프로젝트: throttleup/scrape-schema-recipe

 def setUpClass(cls):
     """Scrape the crumb-lemon-tea-cakes-2018.html test file and store the results on the class."""
     scraped = scrape(
         'test_data/crumb-lemon-tea-cakes-2018.html',
         python_objects=True,
     )
     cls.recipes = scraped
     # The first scraped recipe is kept separately as ``cls.recipe``.
     cls.recipe = scraped[0]

예제 #13

파일 보기

파일: test_scrape.py 프로젝트: throttleup/scrape-schema-recipe

 def setUpClass(cls):
     """Scrape the bevvy-irish-coffee-2018.html test file and store the results on the class."""
     scraped = scrape('test_data/bevvy-irish-coffee-2018.html')
     cls.recipes = scraped
     # The first scraped recipe is kept separately as ``cls.recipe``.
     cls.recipe = scraped[0]

예제 #14

파일 보기

    urls = list(f.readlines())

# Build the cleaned URL list: prepend the 'https:' scheme to every line read
# from the file and strip its leading/trailing newline characters.
# NOTE(review): presumably the stored URLs are protocol-relative (begin with
# '//'), which is why only 'https:' is prepended - confirm against the input.
urls_cleaned = [
    'https:' + line.strip('\n')
    for line in urls
]
# For a quick trial run, work on a slice instead, e.g. urls_cleaned[:5].

# Accumulator for the recipes gathered by the scraping loop below.
recipes = list()

# loop through list of cleaned urls
for url in urls_cleaned:

    try:

        # scrape url and obtain page information
        recipe_list = scrape_schema_recipe.scrape(url)

        # get relevant information out of the page
        recipe = recipe_list[0]
        # print('Recipe: \n', recipe)

        # transform the time values to a string of the total time of the recipes
        transform_time(recipe)

        # add recipe to list of recipes
        recipes.append(recipe)

        # print that the page has finished being scraped
        print('Page Done')
        print(url)