def oai_process_pcurio(*args):
    """Build the URI dictionary for a PUC-Rio (Maxwell) record.

    Identifiers are collected with ``helpers.gather_identifiers`` and split
    into provider and object URIs with
    ``helpers.seperate_provider_object_uris``. Any URI containing
    ``'resultadon'`` has the ``resultadonrSeq=`` prefix stripped and the
    ``resultado&nrSeq=`` prefix put in front of what remains, which restores
    the ``&`` missing from the query string.

    Returns:
        A dict with keys ``canonicalUri``, ``objectUris`` and
        ``providerUris``. The canonical URI is the first provider URI, or
        the first object URI when there are no provider URIs.

    Raises:
        ValueError: if there are neither provider nor object URIs.
    """
    broken_prefix = 'http://www.maxwell.vrac.puc-rio.br/Busca_etds.php?strSecao=resultadonrSeq='
    fixed_prefix = 'http://www.maxwell.vrac.puc-rio.br/Busca_etds.php?strSecao=resultado&nrSeq='

    identifiers = helpers.gather_identifiers(args)
    provider_uris, object_uris = helpers.seperate_provider_object_uris(identifiers)

    # Both lists get the same repair, applied in place and in the same order
    # (provider URIs first, then object URIs).
    for uri_list in (provider_uris, object_uris):
        for position, candidate in enumerate(uri_list):
            if 'resultadon' not in candidate:
                continue
            uri_list[position] = fixed_prefix + candidate.replace(broken_prefix, '')

    combined = provider_uris + object_uris
    try:
        canonical_uri = combined[0]
    except IndexError:
        raise ValueError('No Canonical URI was returned for this record.')

    return {
        'canonicalUri': canonical_uri,
        'objectUris': object_uris,
        'providerUris': provider_uris
    }
def oai_process_pcurio(*args):
    """Return canonical, object and provider URIs for a PUC-Rio record.

    The identifiers gathered from ``args`` are separated into provider and
    object URIs by the ``helpers`` module. Entries containing
    ``'resultadon'`` are rewritten so that they start with the
    ``...strSecao=resultado&nrSeq=`` form of the Maxwell search URL instead
    of the ``...strSecao=resultadonrSeq=`` form.

    Returns:
        dict: ``canonicalUri`` (first of the provider URIs followed by the
        object URIs), ``objectUris`` and ``providerUris``.

    Raises:
        ValueError: when no URI at all is available for the record.
    """
    malformed = 'http://www.maxwell.vrac.puc-rio.br/Busca_etds.php?strSecao=resultadonrSeq='
    wellformed = 'http://www.maxwell.vrac.puc-rio.br/Busca_etds.php?strSecao=resultado&nrSeq='

    def repair_in_place(uris):
        # Overwrite each affected entry inside the list it was found in.
        for slot, value in enumerate(uris):
            if 'resultadon' in value:
                document_id = value.replace(malformed, '')
                uris[slot] = wellformed + document_id

    provider_uris, object_uris = helpers.seperate_provider_object_uris(
        helpers.gather_identifiers(args))

    repair_in_place(provider_uris)
    repair_in_place(object_uris)

    try:
        canonical_uri = (provider_uris + object_uris)[0]
    except IndexError:
        raise ValueError('No Canonical URI was returned for this record.')

    return {
        'canonicalUri': canonical_uri,
        'objectUris': object_uris,
        'providerUris': provider_uris
    }
def test_gather_identifiers(self):
    """Check that ``helpers.gather_identifiers`` flattens nested identifiers.

    The input mixes plain strings with lists of strings; the expected
    result is one flat list holding every string in its original order.
    """
    nested_input = [
        ['doi:10.whateverwhatever', 'http://viewcontent.cgi/iamacoolpdf'],
        '451???462 [http://dx.doi.org/10.1680/geot.11.P.130]',
        'I am a bunch of text but I also have a doi:10.10.thisisarealdoi',
        ['http://bubbaray.com', 'http://devon.net'],
    ]
    expected_flat = [
        'doi:10.whateverwhatever',
        'http://viewcontent.cgi/iamacoolpdf',
        '451???462 [http://dx.doi.org/10.1680/geot.11.P.130]',
        'I am a bunch of text but I also have a doi:10.10.thisisarealdoi',
        'http://bubbaray.com',
        'http://devon.net',
    ]

    assert helpers.gather_identifiers(nested_input) == expected_flat
def test_gather_identifiers(self):
    """Verify the flat list produced by ``helpers.gather_identifiers``.

    Two of the four input entries are lists and two are bare strings; the
    gathered output must contain all six strings, un-nested, in order.
    """
    doi_and_pdf = ['doi:10.whateverwhatever', 'http://viewcontent.cgi/iamacoolpdf']
    bracketed_doi = '451???462 [http://dx.doi.org/10.1680/geot.11.P.130]'
    embedded_doi = 'I am a bunch of text but I also have a doi:10.10.thisisarealdoi'
    plain_urls = ['http://bubbaray.com', 'http://devon.net']

    result = helpers.gather_identifiers(
        [doi_and_pdf, bracketed_doi, embedded_doi, plain_urls])

    assert result == [
        'doi:10.whateverwhatever',
        'http://viewcontent.cgi/iamacoolpdf',
        '451???462 [http://dx.doi.org/10.1680/geot.11.P.130]',
        'I am a bunch of text but I also have a doi:10.10.thisisarealdoi',
        'http://bubbaray.com',
        'http://devon.net'
    ]
def format_uris_pubmedcentral(*args):
    """Build the URI dictionary for a PubMed Central record.

    Identifiers are collected with ``helpers.gather_identifiers`` and split
    into provider and object URIs with
    ``helpers.seperate_provider_object_uris``. The canonical URI is derived
    from an argument whose first element contains the
    ``oai:pubmedcentral.nih.gov:`` OAI prefix: the prefix is removed and the
    remainder is appended to the PMC article URL. If several arguments
    match, the last one wins.

    Returns:
        A dict with keys ``canonicalUri``, ``objectUris`` and
        ``providerUris``.

    Raises:
        ValueError: if no argument carries a PubMed Central OAI identifier.
    """
    identifiers = helpers.gather_identifiers(args)
    provider_uris, object_uris = helpers.seperate_provider_object_uris(identifiers)

    oai_prefix = 'oai:pubmedcentral.nih.gov:'

    # Bound before the loop so that a record without a matching identifier
    # reaches the ValueError below instead of failing with UnboundLocalError.
    canonical_uri = None
    for arg in args:
        # Empty arguments are skipped; only the first element is inspected.
        if arg and oai_prefix in arg[0]:
            pmc_id = arg[0].replace(oai_prefix, '')
            canonical_uri = 'http://www.ncbi.nlm.nih.gov/pmc/articles/PMC' + pmc_id

    if not canonical_uri:
        raise ValueError('No Canonical URI was returned for this record.')

    return {
        'canonicalUri': canonical_uri,
        'objectUris': object_uris,
        'providerUris': provider_uris
    }
def format_uris_pubmedcentral(*args):
    """Return canonical, object and provider URIs for a PubMed Central record.

    The provider and object URIs come from the ``helpers`` module. The
    canonical URI is ``http://www.ncbi.nlm.nih.gov/pmc/articles/PMC``
    followed by whatever remains of an argument's first element once the
    ``oai:pubmedcentral.nih.gov:`` prefix is removed. When more than one
    argument matches, the last match is used.

    Returns:
        dict: ``canonicalUri``, ``objectUris`` and ``providerUris``.

    Raises:
        ValueError: when none of the arguments contains the PubMed Central
            OAI prefix, so no canonical URI can be built.
    """
    identifiers = helpers.gather_identifiers(args)
    provider_uris, object_uris = helpers.seperate_provider_object_uris(
        identifiers)

    # Must exist even when the loop never matches; otherwise the check
    # below raises UnboundLocalError rather than the documented ValueError.
    canonical_uri = None

    for arg in args:
        if not arg:
            continue
        first = arg[0]
        if 'oai:pubmedcentral.nih.gov:' in first:
            pmc_id = first.replace('oai:pubmedcentral.nih.gov:', '')
            canonical_uri = 'http://www.ncbi.nlm.nih.gov/pmc/articles/PMC' + pmc_id

    if not canonical_uri:
        raise ValueError('No Canonical URI was returned for this record.')

    return {
        'canonicalUri': canonical_uri,
        'objectUris': object_uris,
        'providerUris': provider_uris
    }
def oai_process_uris_addis_ababa(*args):
    """Build the URI dictionary for an Addis Ababa University record.

    Every gathered identifier has ``http://hdl.handle.net/123456789/``
    replaced by ``http://etd.aau.edu.et/handle/123456789/`` before the
    identifiers are split into provider and object URIs by
    ``helpers.seperate_provider_object_uris``.

    Returns:
        A dict with keys ``canonicalUri``, ``objectUris`` and
        ``providerUris``. The canonical URI is the first provider URI, or
        the first object URI when there are no provider URIs.

    Raises:
        ValueError: if there are neither provider nor object URIs.
    """
    handle_prefix = 'http://hdl.handle.net/123456789/'
    repository_prefix = 'http://etd.aau.edu.et/handle/123456789/'

    rewritten = [
        identifier.replace(handle_prefix, repository_prefix)
        for identifier in helpers.gather_identifiers(args)
    ]
    provider_uris, object_uris = helpers.seperate_provider_object_uris(rewritten)

    candidates = provider_uris + object_uris
    try:
        canonical_uri = candidates[0]
    except IndexError:
        raise ValueError('No Canonical URI was returned for this record.')

    return {
        'canonicalUri': canonical_uri,
        'objectUris': object_uris,
        'providerUris': provider_uris
    }
def oai_process_uris_addis_ababa(*args):
    """Return canonical, object and provider URIs for an Addis Ababa record.

    Identifiers gathered from ``args`` are rewritten so that the
    ``hdl.handle.net/123456789/`` handle prefix becomes the
    ``etd.aau.edu.et/handle/123456789/`` prefix, then separated into
    provider and object URIs by the ``helpers`` module.

    Returns:
        dict: ``canonicalUri`` (first of the provider URIs followed by the
        object URIs), ``objectUris`` and ``providerUris``.

    Raises:
        ValueError: when no URI at all is available for the record.
    """
    relocated = []
    for raw_identifier in helpers.gather_identifiers(args):
        relocated.append(
            raw_identifier.replace(
                'http://hdl.handle.net/123456789/',
                'http://etd.aau.edu.et/handle/123456789/'))

    provider_uris, object_uris = helpers.seperate_provider_object_uris(relocated)

    try:
        canonical_uri = (provider_uris + object_uris)[0]
    except IndexError:
        raise ValueError('No Canonical URI was returned for this record.')

    return {
        'canonicalUri': canonical_uri,
        'objectUris': object_uris,
        'providerUris': provider_uris
    }