예제 #1
0
    def test_extract_named_tmp_file_id_dropped(self):
        # A plain (not percent-encoded) key under "type=dropped" must expose
        # both the type and the trailing id that precedes ".jl.gz".
        key = "type=dropped/retailer_code=au-bec-and-bridge/year=2019/month=5/day=17/crawl_id=20190517010849__au-bec-and-bridge/20190517010849__au-bec-and-bridge--dropped_v2.0-enriched--e3w9fvyi.jl.gz"
        record = EventRecord(
            bucket_name="test1", object_key=key, event_name="ObjectCreated:Put"
        )

        self.assertEqual(record.type, "dropped")
        self.assertEqual(record.named_tmp_file_id, "e3w9fvyi")
예제 #2
0
    def test_extract_walmart(self):
        # The key arrives percent-encoded ("%3D" in place of "=") and its file
        # name carries an extra "--business" segment; the record is still
        # expected to report type "parsed" and the id "00onxyom".
        key = "type%3Dparsed/retailer_code%3Denus-walmart/year%3D2019/month%3D3/day%3D1/crawl_id%3D20190301110826__enus-walmart/20190301110826__enus-walmart--business--parsed_v2.0--00onxyom.jl.gz"
        record = EventRecord(
            bucket_name="test1", object_key=key, event_name="ObjectCreated:Put"
        )

        self.assertEqual(record.type, "parsed")
        self.assertEqual(record.named_tmp_file_id, "00onxyom")
예제 #3
0
    def test_extract_named_tmp_file_id_ingested(self):
        # Plain key under "type=ingested" whose file name also mentions
        # "alternated"; the type must come out as "ingested".
        key = "type=ingested/retailer_code=au-camilla-and-marc/year=2019/month=5/day=17/crawl_id=20190517010856__au-camilla-and-marc/20190517010856__au-camilla-and-marc--ingested_v2.0-alternated--z0298d5o.jl.gz"
        record = EventRecord(
            bucket_name="test1", object_key=key, event_name="ObjectCreated:Put"
        )

        self.assertEqual(record.type, "ingested")
        self.assertEqual(record.named_tmp_file_id, "z0298d5o")
예제 #4
0
    def test_extract_named_tmp_file_id_alternated(self):
        # Percent-encoded key under "type%3Dalternated"; expects type
        # "alternated" and the id taken from the end of the file name.
        key = "type%3Dalternated/retailer_code%3Dau-ssense/year%3D2019/month%3D3/day%3D1/crawl_id%3D20190301110826__au-ssense/20190301110826__au-ssense--alternated_v2.0--00onxyom.jl.gz"
        record = EventRecord(
            bucket_name="test1", object_key=key, event_name="ObjectCreated:Put"
        )

        self.assertEqual(record.type, "alternated")
        self.assertEqual(record.named_tmp_file_id, "00onxyom")
예제 #5
0
    def test_extract_named_tmp_file_id_enriched(self):
        # Percent-encoded key under "type%3Denriched"; expects type "enriched"
        # and the id "j9icejmp".
        # NOTE(review): the "/.../" segment is passed to EventRecord literally;
        # it looks like an abbreviated path - confirm this is intentional.
        key = "type%3Denriched/retailer_code%3Dau-ssense/.../20181005212630__au-ssense--enriched_v2.0--j9icejmp.jl.gz"
        record = EventRecord(
            bucket_name="test1", object_key=key, event_name="ObjectCreated:Put"
        )

        self.assertEqual(record.type, "enriched")
        self.assertEqual(record.named_tmp_file_id, "j9icejmp")
예제 #6
0
    def test_extract_walmart_spider_name_timestamp_in_path(self):
        # Key layout with "spider_name" and "timestamp" partitions instead of
        # retailer_code/year/month/day; type and id are still expected to be
        # "parsed" and "00onxyom".
        # NOTE(review): "timestamp%3D019-03-01" looks like a typo for
        # "2019-03-01"; left untouched because it is fixture data - confirm.
        key = "type%3Dparsed/spider_name%3Denus-walmart--business/timestamp%3D019-03-01/crawl_id%3D20190301110826__enus-walmart/20190301110826__enus-walmart--business--parsed_v2.0--00onxyom.jl.gz"
        record = EventRecord(
            bucket_name="test1", object_key=key, event_name="ObjectCreated:Put"
        )

        self.assertEqual(record.type, "parsed")
        self.assertEqual(record.named_tmp_file_id, "00onxyom")
예제 #7
0
    def test_event_record_create(self):
        # The record is built from a percent-encoded key ("%3D") and is
        # expected to expose the same key with "=" restored, along with the
        # type and the id parsed from it.
        encoded_key = "type%3Dfetched/retailer_code%3Dau-ssense/year%3D2018/month%3D10/day%3D5/crawl_id%3D20181005212630__au-ssense/20181005212630__au-ssense--fetched_v2.0--j9icejmp.jl.gz"
        decoded_key = "type=fetched/retailer_code=au-ssense/year=2018/month=10/day=5/crawl_id=20181005212630__au-ssense/20181005212630__au-ssense--fetched_v2.0--j9icejmp.jl.gz"
        record = EventRecord(
            bucket_name="test1",
            object_key=encoded_key,
            event_name="ObjectCreated:Put",
        )

        self.assertEqual(record.object_key, decoded_key)
        self.assertEqual(record.type, "fetched")
        self.assertEqual(record.named_tmp_file_id, "j9icejmp")