def get_list_datasets_update_number_download():
    """Return the short identifier of every dataset in the triple store.

    Selects all resources typed ``dcat:Dataset`` from the
    ``<dcatapop-public>`` and ``<dcatapop-private>`` graphs, then reduces
    each dataset URI to the text after its final ``/``.

    Returns:
        list: One identifier string per result row. ``None`` is returned
        when the query or the post-processing fails; the failure is logged
        and not re-raised.
    """
    # Function-local import kept from the original code; presumably it
    # avoids an import cycle -- TODO confirm before hoisting it.
    from ckanext.ecportal.virtuoso.utils_triplestore_crud_helpers import TripleStoreCRUDHelpers

    try:
        tsch = TripleStoreCRUDHelpers()
        sparql_query = """
            select ?dataset
            from <dcatapop-public>
            from <dcatapop-private>
            where {
                ?dataset a <http://www.w3.org/ns/dcat#Dataset>
            }
        """
        result = tsch.execute_select_query_auth(sparql_query)
        # Each row is assumed to be a SPARQL-JSON style binding, i.e.
        # {'dataset': {'value': <uri>, ...}} -- verify against the helper.
        dataset_uris = [row.get('dataset').get('value') for row in result]
        log.info(
            '[Dataset] [get_list_datasets_update_number_download] [SUCCESS] [Number of datasets: {0}]'
            .format(len(dataset_uris)))
        # Keep only the last path segment of each URI.
        return [uri.split('/')[-1] for uri in dataset_uris]
    except Exception:
        # format_exc() returns the traceback as text; print_exc() writes to
        # stderr and returns None, so logging its result recorded nothing.
        log.error(traceback.format_exc())
        log.error(
            '[Dataset] [get_list_datasets_update_number_download] [Failed]'
        )
        return None
def get_list_incorrect_datasets_issued_date(self):
    """Return URIs of datasets whose catalog record has issued == modified.

    Queries the ``<dcatapop-public>`` and ``<dcatapop-private>`` graphs for
    ``dcat:CatalogRecord`` resources whose ``dcterms:issued`` equals their
    ``dcterms:modified`` and whose issued value, compared as a string, is
    greater than ``"2019-07-10T12:59:20"``. Rows are ordered by the
    modified value.

    Returns:
        list: The ``?dataset`` value (the record's ``foaf:primaryTopic``)
        of each matching row. ``None`` is returned when the query fails;
        the failure is logged and not re-raised.
    """
    # Function-local import kept from the original code; presumably it
    # avoids an import cycle -- TODO confirm before hoisting it.
    from ckanext.ecportal.virtuoso.utils_triplestore_crud_helpers import TripleStoreCRUDHelpers

    try:
        tsch = TripleStoreCRUDHelpers()
        # NOTE(review): the cut-off timestamp is hard-coded; it looks like
        # the date a specific regression was introduced -- confirm.
        sparql_query = """
            PREFIX dcat: <http://www.w3.org/ns/dcat#>
            select ?dataset ?cr ?issued ?modified
            from <dcatapop-public>
            from <dcatapop-private>
            where {
                ?cr a <http://www.w3.org/ns/dcat#CatalogRecord> .
                ?cr <http://xmlns.com/foaf/0.1/primaryTopic> ?dataset .
                ?cr <http://purl.org/dc/terms/issued> ?issued .
                ?cr <http://purl.org/dc/terms/modified> ?modified
                filter ((?issued = ?modified) && (str(?issued) > "2019-07-10T12:59:20"))
            }
            order by ?modified
        """
        result = tsch.execute_select_query_auth(sparql_query)
        # Each row is assumed to be a SPARQL-JSON style binding, i.e.
        # {'dataset': {'value': <uri>, ...}} -- verify against the helper.
        return [row.get('dataset').get('value') for row in result]
    except Exception:
        # format_exc() returns the traceback as text; print_exc() writes to
        # stderr and returns None, so logging its result recorded nothing.
        log.error(traceback.format_exc())
        log.error('[get_list_incorrect_datasets_issued_date] [Failed]')
        return None
def get_list_empty_datasets(self):
    """Return URIs of datasets lacking a catalog record with a modified date.

    Queries the ``<dcatapop-public>`` graph for ``dcat:Dataset`` resources
    for which no resource exists that both has the dataset as its
    ``foaf:primaryTopic`` and carries a ``dcterms:modified`` value.

    Returns:
        list: The ``?dataset`` value of each matching row. ``None`` is
        returned when the query fails; the failure is logged and not
        re-raised.
    """
    # Function-local import kept from the original code; presumably it
    # avoids an import cycle -- TODO confirm before hoisting it.
    from ckanext.ecportal.virtuoso.utils_triplestore_crud_helpers import TripleStoreCRUDHelpers

    try:
        tsch = TripleStoreCRUDHelpers()
        # OPTIONAL + !bound(?o) keeps only datasets where the optional
        # pattern found no match.
        sparql_query = """
            select ?dataset
            from <dcatapop-public>
            where {
                ?dataset a <http://www.w3.org/ns/dcat#Dataset>.
                optional{
                    ?cr <http://xmlns.com/foaf/0.1/primaryTopic> ?dataset .
                    ?cr <http://purl.org/dc/terms/modified> ?o .
                }
                filter (!bound(?o))
            }
        """
        result = tsch.execute_select_query_auth(sparql_query)
        # Each row is assumed to be a SPARQL-JSON style binding, i.e.
        # {'dataset': {'value': <uri>, ...}} -- verify against the helper.
        return [row.get('dataset').get('value') for row in result]
    except Exception:
        # format_exc() returns the traceback as text; print_exc() writes to
        # stderr and returns None, so logging its result recorded nothing.
        log.error(traceback.format_exc())
        log.error('[Rollback Dataset] [get_list_empty_datasets] [Failed]')
        return None