コード例 #1
0
            # Split the filename so the extension can be tested on its own.
            name, ext = os.path.splitext(fname)

            # Case-insensitive match on ".html": log the file id, bump the
            # deletion counter and ask the Omeka client to delete the file.
            if ext.lower() == ".html":
                logger.info("Deleting html file: %s",  f['id'])
                num_html_deleted += 1
                omeka_client.delete('files', f['id'])
            
    # Second pass: unless conversion is disabled, download every office
    # document attached to the item, convert it to HTML and upload the result.
    if not args['do_not_convert']:
        for f in omeka_client.get_files_for_item(item['id']):
            # Keep only the final path component so a server-supplied name
            # cannot make the paths below point outside temp_dir.
            fname = os.path.basename(f['original_filename'])
            name, ext = os.path.splitext(fname)

            if ext.lower() in (".docx", ".doc", ".odt", ".rtf"):
                num_docs_found += 1
                res, data = omeka_client.get_file(f['file_urls']['original'])
                download_file = os.path.join(temp_dir, fname)
                # The context manager closes the handle even if the write fails.
                with open(download_file, 'wb') as out:
                    out.write(data)
                logger.info("Converting office doc file %s to HTML", f['id'])
                html_file = os.path.join(temp_dir, name + ".html")
                word2html.convert(download_file, html_file, True, True, False)

                # Only count and log the upload when the client reports success.
                if omeka_client.post_file_from_filename(html_file, item['id']):
                    num_html_uploaded += 1
                    logger.info("Uploaded  %s successfully", f['id'])
                
        
logger.info("********************")
コード例 #2
0
            # Split the filename so the extension can be tested on its own.
            name, ext = os.path.splitext(fname)

            # Case-insensitive match on ".html": log the file id, bump the
            # deletion counter and ask the Omeka client to delete the file.
            if ext.lower() == ".html":
                logger.info("Deleting html file: %s", f['id'])
                num_html_deleted += 1
                omeka_client.delete('files', f['id'])

    # Second pass: unless conversion is disabled, download every office
    # document attached to the item, convert it to HTML and upload the result.
    if not args['do_not_convert']:
        for f in omeka_client.get_files_for_item(item['id']):
            # Keep only the final path component so a server-supplied name
            # cannot make the paths below point outside temp_dir.
            fname = os.path.basename(f['original_filename'])
            name, ext = os.path.splitext(fname)

            if ext.lower() in (".docx", ".doc", ".odt", ".rtf"):
                num_docs_found += 1
                res, data = omeka_client.get_file(f['file_urls']['original'])
                download_file = os.path.join(temp_dir, fname)
                # The context manager closes the handle even if the write fails.
                with open(download_file, 'wb') as out:
                    out.write(data)
                logger.info("Converting office doc file %s to HTML", f['id'])
                html_file = os.path.join(temp_dir, name + ".html")
                word2html.convert(download_file, html_file, True, True, False)

                # Only count and log the upload when the client reports success.
                if omeka_client.post_file_from_filename(html_file, item['id']):
                    num_html_uploaded += 1
                    logger.info("Uploaded  %s successfully", f['id'])

logger.info("********************")
logger.info("SUMMARY:")