Exemplo n.º 1
0
 def __init__(self,
              package_name=None,
              path=None,
              run_locally=False,
              CONSYN=False,
              journal_mappings={},
              extract_nations=False,
              no_harvest=False):
     self.CONSYN = CONSYN
     self.doi_package_name_mapping = []
     try:
         self.logger = create_logger("Elsevier",
                                     filename=join(CFG_LOGDIR,
                                                   'scoap3_harvesting.log'))
     except IOError:  # Could not access log file
         # Use std.out for logging
         self.logger = self
         self.info = print
         self.warning = print
         self.error = print
         self.debug = print
     if self.CONSYN:
         self.journal_mappings = journal_mappings
     else:
         if not no_harvest:
             self.package_name = package_name
             self.path = path
             self.found_articles = []
             self._found_issues = []
             if run_locally:
                 from harvestingkit.contrast_out import ContrastOutConnector
                 self.conn = ContrastOutConnector(self.logger)
                 self.conn.run(run_locally)
             else:
                 if not path and package_name:
                     self.logger.info("Got package: %s" % (package_name, ))
                     self._extract_package()
                 elif not path and not package_name:
                     from harvestingkit.contrast_out import ContrastOutConnector
                     self.conn = ContrastOutConnector(self.logger)
                     self.conn.run()
             self._crawl_elsevier_and_find_main_xml()
             self._crawl_elsevier_and_find_issue_xml()
             self._build_doi_mapping()
     self.extract_nations = extract_nations