Python ARMHarvester.retrieve_record 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: schema_org.arm

클래스/타입: ARMHarvester

메소드/함수: retrieve_record

hotexamples.com에서의 예제들: 3

Python ARMHarvester.retrieve_record - 3개의 예제가 발견되었습니다. 이것들은 오픈소스 프로젝트에서 추출된 Python의 schema_org.arm.ARMHarvester.retrieve_record에 대한 실세계 최고 등급의 예제들입니다. 예제들을 평가하여 예제의 품질 향상에 도움을 줄 수 있습니다.

자주 사용되는 메소드들

보기 숨기기

ARMHarvester(8)

retrieve_record(3)

run(3)

extract_series_identifier(2)

예제 #1

파일 보기

    def test__read_record__invalid_jsonld(self):
        """
        SCENARIO:  The landing page download succeeds, but the JSON-LD
        carried by the page is not valid.

        EXPECTED RESULT:  A JsonLdError is raised.
        """
        harvester = ARMHarvester()

        landing_page_url = (
            'https://www.archive.arm.gov/metadata/adc/html/'
            'nsaqcrad1longC2.c2.invalid_jsonld.html'
        )

        # NOTE(review): the URL names "invalid_jsonld" while the mocked body
        # is the "no_dataset_in_jsonld" fixture -- confirm this is intended.
        page_bytes = ir.read_binary(
            'tests.data.arm',
            'nsaqcrad1longC2.c2.no_dataset_in_jsonld.html',
        )

        # Any GET whose URL matches this pattern receives the canned page.
        url_pattern = re.compile('https://www.archive.arm.gov/metadata/adc')

        with aioresponses() as mocked:
            mocked.get(
                url_pattern,
                body=page_bytes,
                status=200,
                headers={'Content-Type': 'text/html'},
            )

            # assertRaises stays outermost, so the exception passes through
            # assertLogs before being caught.
            with self.assertRaises(JsonLdError), \
                    self.assertLogs(logger=harvester.logger, level='DEBUG'):
                asyncio.run(harvester.retrieve_record(landing_page_url))

예제 #2

파일 보기

    def test__landing_page_is_empty(self):
        """
        SCENARIO:  The landing page is retrieved, but it has absolutely no
        content.

        EXPECTED RESULT:  A RuntimeError is raised.
        """
        harvester = ARMHarvester()

        landing_page_url = (
            'https://www.archive.arm.gov/metadata/adc/html/met.html'
        )
        page_bytes = ir.read_binary('tests.data.arm', 'met.html')

        # Any GET whose URL matches this pattern receives the canned page.
        url_pattern = re.compile('https://www.archive.arm.gov/metadata/adc')

        with aioresponses() as mocked:
            mocked.get(
                url_pattern,
                body=page_bytes,
                status=200,
                headers={'Content-Type': 'text/html'},
            )

            # assertRaises stays outermost, so the exception passes through
            # assertLogs before being caught.
            with self.assertRaises(RuntimeError), \
                    self.assertLogs(logger=harvester.logger, level='DEBUG'):
                asyncio.run(harvester.retrieve_record(landing_page_url))

예제 #3

파일 보기

    def test__retrieve_record__bad_series_identifier(self):
        """
        SCENARIO:  We have a valid landing page URL but the JSON-LD document
        has a series identifier that is not in the format that we want.

        EXPECTED RESULT:  RuntimeError
        """
        landing_page_url = (
            'https://www.archive.arm.gov/metadata/adc/html/wsacrcrcal.html'
        )

        harvester = ARMHarvester()

        # Mocked external calls, registered in this order:
        #
        #   1) HTML document for the landing page
        #   2) XML document associated with the landing page
        #
        # Each body is paired with its own headers so the two cannot drift
        # out of step; both responses use the same status code.
        status_code = 200
        responses = [
            (
                ir.read_binary('tests.data.arm', 'wsacrcrcal.bad_series_id.html'),
                {'Content-Type': 'text/html'},
            ),
            (
                ir.read_binary('tests.data.arm', 'wsacrcrcal.xml'),
                {'Content-Type': 'application/xml'},
            ),
        ]

        with aioresponses() as m:
            for body, response_headers in responses:
                m.get(self.regex,
                      body=body, status=status_code, headers=response_headers)

            # assertLogs is outermost here: assertRaises swallows the
            # expected RuntimeError first, so the log check still runs.
            with self.assertLogs(logger=harvester.logger, level='DEBUG'):
                with self.assertRaises(RuntimeError):
                    asyncio.run(harvester.retrieve_record(landing_page_url))