def main(argv): (options, input_files) = parser.parse_args(args=argv[1:]) out = sys.stdout if len(input_files) < 1: parser.error("no imput warc file(s)") for name in input_files: fh = ArcRecord.open_archive(name, gzip="auto") for record in fh: content = record.content headers = [ (WarcRecord.TYPE, "response"), (WarcRecord.ID, "<urn:uuid:%s>"%uuid.UUID(hashlib.sha1(record.url+record.date).hexdigest()[0:32])), ] version = "WARC/1.0" url = record.url if url: headers.append((WarcRecord.URL,url)) date = record.date if date: headers.append((WarcRecord.DATE,date)) warcrecord = WarcRecord(headers=headers, content=content, version=version) warcrecord.write_to(out, gzip=options.gzip) fh.close() return 0