Ejemplo n.º 1
0
 def __init__(self, format=ReferenceFormat.BIBTEX):
     """Initialise the importer for a given reference format.

     :param format: reference format stored on the instance and passed to
         the ReferencesController created here. Defaults to
         ``ReferenceFormat.BIBTEX``.
     """
     super(ReferenceImporter, self).__init__()
     self.name = 'Importer'
     self.path = ''
     self.format = format

     # One factory instance is kept on the importer and shared with the
     # references controller.
     factory = UtilFactory()
     self.util_factory = factory
     self.ref_controller = ReferencesController(factory, format)
Ejemplo n.º 2
0
 def __init__(self,
              basepath='/home/rxuriguera/benchmark/pdfsets/pageHeader/',
              basename='pageHeader',
              results_cache_filename='customHeaders_cache_file.txt'):
     """Create the controllers, browser and file locations used by this object.

     Every parameter is optional. The defaults are the values that used to
     be hard-coded, so constructing the object without arguments behaves
     exactly as before; passing them lets the object run on machines where
     the original absolute path does not exist.

     :param basepath: value stored in ``self.basepath``.
     :param basename: value stored in ``self.basename``.
     :param results_cache_filename: value stored in
         ``self.results_cache_filename``.
     """
     self.factory = UtilFactory()
     # The two positional 10s are forwarded untouched to RCEController;
     # their meaning is defined by that class.
     self.rce = controllers.RCEController(self.factory, 10, 10)
     self.ir = controllers.IRController(self.factory)
     self.results_cache_filename = results_cache_filename
     self.results_cache = {}
     self.browser = Browser()
     self.basepath = basepath
     self.basename = basename
     self.len_range = range(4, 15)
Ejemplo n.º 3
0
    def __init__(self):
        """Set up the configuration values and controllers held by this object."""
        self.info = {}

        self.nexamples = 4
        self.base_path = '/home/rxuriguera/benchmark/pages/'
        # NOTE(review): 'addres' is spelled with a single trailing 's';
        # confirm what consumes these names before changing it.
        self.fields = [
            'addres', 'author', 'isbn', 'issn', 'journal', 'number',
            'pages', 'publisher', 'title', 'volume', 'year',
        ]
        # Only 'informaworld' is enabled. The full list that was previously
        # kept next to it: acm, citeulike, computerorg, econpapers, ideas,
        # informaworld, sciencedirect, scientificcommons, springer.
        self.libraries = ['informaworld']

        # A single factory instance is shared by both controllers.
        factory = UtilFactory()
        self.factory = factory
        self.iec = IEController(
            factory,
            secs_between_reqs=0,
            wrapper_gen_examples=self.nexamples,
        )
        self.rec = ReferencesController(factory)
Ejemplo n.º 4
0
 def setUp(self):
     """Create the IEController and the fixtures stored on the test instance."""
     self.iec = IEController(UtilFactory(), ReferenceFormat.BIBTEX)

     result_urls = (
         'http://portal.acm.org/citation.cfm?id=507338.507355',
         'http://www.springerlink.com/index/D7X7KX6772HQ2135.pdf',
     )
     # Both results are created with the same first argument, 'result01'.
     # NOTE(review): possibly a copy-paste leftover; confirm before changing.
     self.top_results = [SearchResult('result01', url)
                         for url in result_urls]

     self.empty_page = BeautifulSoup("<html><head/><body/></html>")
     # Page obtained through the instance's own _get_soup helper.
     self.page = self._get_soup('acm01.html')
     self.text = 'ss'
 def setUp(self):
     """Create the UtilFactory instance stored on the test as ``self.uf``."""
     self.uf = UtilFactory()
 def setUp(self):
     """Create the ReferencesController and resolve the BibTeX fixture path."""
     self.rec = ReferencesController(UtilFactory(), ReferenceFormat.BIBTEX)

     # The fixture location is expressed relative to this file's directory
     # and then normalised.
     fixture = '../../../../tests/fixtures/references/bibtex/import.bib'
     here = dirname(__file__)
     self.path = normpath(join(here, fixture))
Ejemplo n.º 7
0
 def __init__(self, url):
     """Initialise the generator for the given URL.

     :param url: value stored on the instance as ``self.url``.
     """
     super(WrapperGenerator, self).__init__()
     self.name = 'WrapTrainer'
     self.url = url

     # The same factory instance is kept on the object and handed to the
     # IEController.
     factory = UtilFactory()
     self.factory = factory
     self.ie_controller = IEController(factory)
Ejemplo n.º 8
0
 def __init__(self, format=ReferenceFormat.BIBTEX):
     """Store the reference format and create the gateway and utility factory.

     :param format: reference format kept as ``self.format``. Defaults to
         ``ReferenceFormat.BIBTEX``.
     """
     self.format = format
     # Collaborators are created in the same order as before: gateway
     # first, then the factory.
     gateway = ReferenceGateway()
     self.reference_gw = gateway
     self.util_factory = UtilFactory()
 def setUp(self):
     """Create the RCEController and resolve the PDF fixture path."""
     self.rcec = RCEController(UtilFactory())

     # The fixture location is expressed relative to this file's directory
     # and then normalised.
     fixture = '../../../../tests/fixtures/extraction/article.pdf'
     here = dirname(__file__)
     self.pdf = normpath(join(here, fixture))
Ejemplo n.º 10
0
 def __init__(self):
     # Keep a UtilFactory instance on the object as ``self.factory``.
     self.factory = UtilFactory()