Python Utils.cleanOutputFolder 예제들

프로그래밍 언어: Python

클래스/타입: Utils

메소드/함수: cleanOutputFolder

hotexamples.com에서의 예제들: 4

Python Utils.cleanOutputFolder - 4개의 예제가 발견되었습니다. 아래는 오픈소스 프로젝트에서 추출한 Python Utils.cleanOutputFolder 사용 예제 중 실제 환경에서 가장 높은 평가를 받은 것들입니다. 예제를 평가하면 예제의 품질 향상에 도움을 줄 수 있습니다.

자주 사용되는 메소드들

보기 숨기기

AdjustGridSize(29)

executeOnServer(18)

errorCode(17)

format_Directory_Path(8)

bytesToInt(7)

dprint(7)

add_one(6)

assertPathExists(6)

allow_methods(5)

bytesToString(5)

convertNetToGefx(5)

extract_stochastics_values(5)

ApplyKPhaseShifts(4)

ensure_dir_exists(4)

encodeAuthToken(4)

__htmlpage_soup(4)

add_query_to_url(4)

extract_links(4)

constructQueries(4)

cleanOutputFolder(4)

create_build_command(4)

extract_results_single_page(4)

bitflip(4)

clearElem(4)

closestCentroidList(3)

expectNevents(3)

check_color(3)

findCollocations1(3)

checkIsFile(3)

ceil_key(3)

copyFirstBoot(3)

flatten_lines(3)

date_to_httpdate(3)

AddArrayLine(3)

drawCenteredOnTitle(3)

AppendLogFile(3)

generateCfgFile(3)

convertEncoding(3)

drawArray(2)

capstring(2)

dnorm(2)

file_exist(2)

csize(2)

create_ht_marc(2)

create_label_list(2)

create_document_term_matrix(2)

createSources(2)

clean_price_string(2)

drawRec(2)

electLeader(2)

예제 #1

파일 보기

파일: Cleaner.py 프로젝트: atbradley/eaccpf-indexer

 def run(self):
     """
     Execute the clean operation using specified parameters.

     Sequence: optionally load the file hash index (update mode), make sure
     the output folder exists, call Utils.cleanOutputFolder on it when not
     updating, verify the source and output paths, run self.clean(), purge
     orphaned index records and output files (update mode only), and write
     the file hash index back to the output folder. The elapsed time is
     logged and printed at the end.

     Raises:
         AssertionError: if the source or output path does not exist. The
             error is logged before it is raised.

     @todo this needs to be cleaned up and simplified
     """
     with Timer.Timer() as t:
         # create an index of file hashes, so that we can track what has changed
         if self.update:
             self.hashIndex = Utils.loadFileHashIndex(self.output)
         # make sure the output folder exists; it is only cleaned when this
         # is not an update run
         if not os.path.exists(self.output):
             os.makedirs(self.output)
         if not self.update:
             Utils.cleanOutputFolder(self.output)
         # check state. Explicit raises are used instead of `assert` so the
         # checks still run under `python -O` and the exception carries the
         # message (the logger call returns None, which is what the assert
         # form attached to the exception).
         if not os.path.exists(self.source):
             message = "Source path does not exist: " + self.source
             self.log.error(message)
             raise AssertionError(message)
         if not os.path.exists(self.output):
             message = "Output path does not exist: " + self.output
             self.log.error(message)
             raise AssertionError(message)
         # clean data
         records = self.clean()
         if self.update:
             # remove records from the index that were deleted in the source
             self.log.info("Clearing orphaned records from the file hash index")
             Utils.purgeIndex(records, self.hashIndex)
             # remove files from the output that are not in the index
             self.log.info("Clearing orphaned files from the output folder")
             Utils.purgeFolder(self.output, self.hashIndex)
         # write the updated file hash index
         # NOTE(review): self.hashIndex is only assigned in this method when
         # self.update is set; presumably it is initialised elsewhere for
         # full runs -- confirm.
         Utils.writeFileHashIndex(self.hashIndex, self.output)
     # log execution time (also echoed to stdout)
     finished = "Cleaner finished in {0}:{1}:{2}".format(t.hours, t.minutes, t.seconds)
     self.log.info(finished)
     print(finished)

예제 #2

파일 보기

파일: Transformer.py 프로젝트: atbradley/eaccpf-indexer

 def run(self):
     """
     Execute transformations on source documents as specified. Write results
     to the output path.

     The output folder is created if missing and passed to
     Utils.cleanOutputFolder when 'clear' is among self.actions. Each
     remaining entry in self.actions then triggers the matching transform
     or merge step, in the fixed order written below. The elapsed time is
     logged at the end.

     Raises:
         AssertionError: if the output path does not exist after the
             create/clear step. The error is logged before it is raised.
     """
     with Timer.Timer() as t:
         # create output folder
         if not os.path.exists(self.output):
             os.makedirs(self.output)

         #TODO: Use the output flag instead.
         if 'clear' in self.actions:
             Utils.cleanOutputFolder(self.output)
         # Explicit raise instead of `assert`: the check must survive
         # `python -O`, and the exception should carry the message rather
         # than the None returned by the logger call.
         if not os.path.exists(self.output):
             message = "Output path does not exist: {0}".format(self.output)
             self.log.error(message)
             raise AssertionError(message)
         # execute processing actions
         if "digitalobjects-to-sid" in self.actions:
             self.transformDigitalObjectsToSID(self.sources, self.output)
         if "eaccpf-to-sid" in self.actions:
             transform = Utils.loadTransform(self.xslt)
             self.transformEacCpfsToSID(self.sources, self.output, transform)
         if "html-to-sid" in self.actions:
             self.transformHtmlsToSid(self.sources, self.output)
         if 'merge-digitalobjects' in self.actions:
             self.mergeDigitalObjectsIntoSID(self.sources, self.output)
         if "merge-inferred" in self.actions:
             self.mergeInferredRecordsIntoSID(self.sources, self.output)
         # field values are only applied when none of the configured
         # entries is an empty string
         if "set-fields" in self.actions and '' not in self.set_fields:
             self.setFieldValue(self.output)
         if 'boost' in self.actions:
             self.setBoosts(self.output)
         if "validate" in self.actions:
             # placeholder: the action is recognised but does nothing here
             pass

     # log execution time
     self.log.info("Transformer finished in {0}:{1}:{2}".format(t.hours, t.minutes, t.seconds))

예제 #3

파일 보기

파일: Grapher.py 프로젝트: atbradley/eaccpf-indexer

 def run(self):
     """
     Execute analysis operations using specified parameters.

     Calls Utils.cleanOutputFolder on the output path, verifies that the
     source and output paths exist, builds the entity graph, and saves it
     as a PDF and as a GEXF file (per the save_graph_as_* method names).

     Raises:
         AssertionError: if the source or output path does not exist. The
             error is logged before it is raised.
     """
     # prepare the output folder
     # NOTE(review): the folder is not created in this method; presumably
     # Utils.cleanOutputFolder or the caller guarantees it exists -- confirm.
     Utils.cleanOutputFolder(self.output)
     # check state. Explicit raises are used instead of `assert` so the
     # checks still run under `python -O` and the exception carries the
     # message rather than the None returned by the logger call.
     if not os.path.exists(self.source):
         message = "Source path does not exist: " + self.source
         self.log.error(message)
         raise AssertionError(message)
     if not os.path.exists(self.output):
         message = "Output path does not exist: " + self.output
         self.log.error(message)
         raise AssertionError(message)
     # execute actions
     self.graph_entities()
     # generate a PDF of the graph
     self.save_graph_as_pdf()
     # write graph file
     self.save_graph_as_gexf()

예제 #4

파일 보기

파일: Crawler.py 프로젝트: atbradley/eaccpf-indexer

 def run(self):
     """
     Execute crawl operation.

     Verifies the source, prepares the output folder, purges the image
     cache on a full (non-update) run, crawls either a web site or the
     file system depending on self.source, synchronises the hash index,
     output folder and image cache in update mode, and writes the file
     hash index. The elapsed time is logged at the end.

     Raises:
         AssertionError: if a file system source does not exist, or if the
             output path does not exist after it has been prepared. The
             error is logged before it is raised.
     """
     with Timer.Timer() as t:
         # A source containing an http(s) scheme is crawled as a web site.
         # Such a source is never a local path, so the existence check
         # applies to file system sources only; checking it unconditionally
         # made the web site branch below unreachable.
         is_web_source = 'http://' in self.source or 'https://' in self.source
         # check state before starting. Explicit raises are used instead of
         # `assert` so the checks still run under `python -O` and the
         # exception carries the message.
         if not is_web_source and not os.path.exists(self.source):
             message = "Input path does not exist: {0}".format(self.source)
             self.log.error(message)
             raise AssertionError(message)
         if not os.path.exists(self.output):
             os.makedirs(self.output)
         Utils.cleanOutputFolder(self.output, Update=self.update)
         if not os.path.exists(self.output):
             message = "Output path does not exist: {0}".format(self.output)
             self.log.error(message)
             raise AssertionError(message)
         # purge the image cache
         if not self.update:
             self.cache.purge()
         # create an index of files hashes so that we can track which files
         # have changed since the last run
         self.records = []
         if self.update:
             self.hashIndex = Utils.loadFileHashIndex(self.output)
         # crawl the document source
         if is_web_source:
             self.crawlWebSite()
         else:
             self.crawlFileSystem()
         # if the crawl was executed as an update, then synchronize the file
         # index, metadata cache, and image cache folders with the source
         if self.update:
             # remove records from the index that were deleted in the source
             self.log.info("Clearing orphaned records from the file hash index")
             Utils.purgeIndex(self.records, self.hashIndex)
             # remove files from the metadata cache that are not in the index
             self.log.info("Clearing orphaned files from the output folder")
             Utils.purgeFolder(self.output, self.hashIndex)
             # remove files from the image cache that are not in the index
             self.log.info("Clearing orphaned files from the image cache")
             self.cache.purge(list(self.hashIndex.keys()))
         # write the updated file index
         # NOTE(review): self.hashIndex is only assigned in this method when
         # self.update is set; presumably it is initialised elsewhere for
         # full runs -- confirm.
         Utils.writeFileHashIndex(self.hashIndex, self.output)
     # log execution time
     self.log.info("Crawler finished in {0}:{1}:{2}".format(t.hours, t.minutes, t.seconds))