コード例 #1
0
# Script excerpt: walk every Omeka item, optionally delete its HTML files,
# then look for word-processor files to convert. The excerpt ends before the
# conversion body, so only the selection logic is visible here.
# The client is built from the UTF-8-encoded endpoint, a logger and an API key.
omeka_client = OmekaClient(endpoint.encode("utf-8"), logger, apikey)

# Fetch the "items" resource; the response body is decoded as JSON.
# NOTE(review): resp is not used in the visible part of the script.
resp, cont = omeka_client.get("items")
items = json.loads(cont)
# Scratch directory; presumably used by the conversion step, which is not
# visible in this excerpt -- confirm.
temp_dir = tempfile.mkdtemp()
os.chmod(temp_dir, 0o2770) # rwx for owner and group, nothing for others, plus the setgid bit (0o2000); the sticky bit would be 0o1000

# Counters. Only num_html_deleted is updated in the visible part of the script.
num_docs_found = 0
num_html_uploaded = 0
num_html_deleted = 0
for item in items:
    logger.info('Looking at %s', item['id'])
  
    # First pass - delete HTML files if requested via args['delete_html']
    if args['delete_html']:
        for f in omeka_client.get_files_for_item(item['id']):
            fname = f['original_filename']
            name, ext = os.path.splitext(fname)

            # The extension comparison is case-insensitive.
            if ext.lower() == ".html":
                logger.info("Deleting html file: %s",  f['id'])
                # The counter is incremented before the delete call is made.
                num_html_deleted += 1
                omeka_client.delete('files', f['id'])
            
    # Second pass - do the conversion unless args['do_not_convert'] is set.
    # The file list is fetched again rather than reused from the first pass
    # (presumably so it reflects any deletions above -- confirm).
    if not args['do_not_convert']:   
        for f in omeka_client.get_files_for_item(item['id']):
            fname = f['original_filename']
            name, ext = os.path.splitext(fname)

            # Select word-processor files by extension (case-insensitive);
            # the body of this branch lies beyond the end of this excerpt.
            if  ext.lower() in [".docx", ".doc", ".odt", ".rtf"]:
コード例 #2
0
# Script excerpt: walk every Omeka item, optionally delete its HTML files,
# then look for word-processor files to convert. The excerpt ends before the
# conversion body, so only the selection logic is visible here.
# The client is built from the UTF-8-encoded endpoint, a logger and an API key.
omeka_client = OmekaClient(endpoint.encode("utf-8"), logger, apikey)

# Fetch the "items" resource; the response body is decoded as JSON.
# NOTE(review): resp is not used in the visible part of the script.
resp, cont = omeka_client.get("items")
items = json.loads(cont)
# Scratch directory; presumably used by the conversion step, which is not
# visible in this excerpt -- confirm.
temp_dir = tempfile.mkdtemp()
os.chmod(temp_dir, 0o2770)  # rwx for owner and group, nothing for others, plus the setgid bit (0o2000); the sticky bit would be 0o1000

# Counters. Only num_html_deleted is updated in the visible part of the script.
num_docs_found = 0
num_html_uploaded = 0
num_html_deleted = 0
for item in items:
    logger.info('Looking at %s', item['id'])

    # First pass - delete HTML files if requested via args['delete_html']
    if args['delete_html']:
        for f in omeka_client.get_files_for_item(item['id']):
            fname = f['original_filename']
            name, ext = os.path.splitext(fname)

            # The extension comparison is case-insensitive.
            if ext.lower() == ".html":
                logger.info("Deleting html file: %s", f['id'])
                # The counter is incremented before the delete call is made.
                num_html_deleted += 1
                omeka_client.delete('files', f['id'])

    # Second pass - do the conversion unless args['do_not_convert'] is set.
    # The file list is fetched again rather than reused from the first pass
    # (presumably so it reflects any deletions above -- confirm).
    if not args['do_not_convert']:
        for f in omeka_client.get_files_for_item(item['id']):
            fname = f['original_filename']
            name, ext = os.path.splitext(fname)

            # Select word-processor files by extension (case-insensitive);
            # the body of this branch lies beyond the end of this excerpt.
            if ext.lower() in [".docx", ".doc", ".odt", ".rtf"]: