Example #1
0
 def __init__(self, rsrcmgr, pageno=1, laparams=None):
     """Initialise the base aggregator and the per-instance collections.

     Args:
         rsrcmgr: Forwarded unchanged to ``PDFPageAggregator.__init__``.
         pageno: Forwarded to ``PDFPageAggregator.__init__`` (default 1).
         laparams: Forwarded to ``PDFPageAggregator.__init__``
             (default None).
     """
     PDFPageAggregator.__init__(
         self,
         rsrcmgr,
         pageno=pageno,
         laparams=laparams,
     )
     self.rows = []
     self.page_number = 0
     # Starts off False, i.e. "not an outline page".
     self.outline = False
     # Only filled when there is outline info.
     self.interesting_text = []
     # Possibly helpful info, but it may be mixed.
     self.aux_text = []
 def __init__(self, rsrcmgr, pageno=1, laparams=None):
     """Initialise the base aggregator, then reset the row/page state.

     Args:
         rsrcmgr: Forwarded unchanged to ``PDFPageAggregator.__init__``.
         pageno: Forwarded to ``PDFPageAggregator.__init__`` (default 1).
         laparams: Forwarded to ``PDFPageAggregator.__init__``
             (default None).
     """
     PDFPageAggregator.__init__(self, rsrcmgr, pageno=pageno, laparams=laparams)
     # Per-instance state: an empty row list and a page counter at zero.
     self.rows = []
     self.page_number = 0
Example #3
0
    def __init__(self, rsrcmgr, pageno=1, laparams=None):
        """Initialise the base aggregator and the two string counters.

        Args:
            rsrcmgr: Forwarded unchanged to ``PDFPageAggregator.__init__``.
            pageno: Forwarded to ``PDFPageAggregator.__init__`` (default 1).
            laparams: Forwarded to ``PDFPageAggregator.__init__``
                (default None).
        """
        PDFPageAggregator.__init__(self, rsrcmgr, pageno=pageno, laparams=laparams)

        # Both counters start at 1.
        self.stringNumber = 1
        self.stringNumberAbs = 1
 def __init__(self, rsrcmgr, pageno=1, laparams: LAParams = None):
     """Initialise the base aggregator, row/page state and a Crossref client.

     Args:
         rsrcmgr: Forwarded unchanged to ``PDFPageAggregator.__init__``.
         pageno: Forwarded to ``PDFPageAggregator.__init__`` (default 1).
         laparams: Forwarded to ``PDFPageAggregator.__init__``
             (default None).
     """
     PDFPageAggregator.__init__(self, rsrcmgr, pageno=pageno, laparams=laparams)
     self.rows = []
     self.page_number = 0
     # No DOI is known at construction time.
     self.doi = None
     # A Crossref instance is created eagerly, once per aggregator.
     self.cr = Crossref(mailto='*****@*****.**')
Example #5
0
 def __init__(self, rsrcmgr, pageno=1, laparams=None):
     """Initialise the base aggregator and the outline-related state.

     Args:
         rsrcmgr: Forwarded unchanged to ``PDFPageAggregator.__init__``.
         pageno: Forwarded to ``PDFPageAggregator.__init__`` (default 1).
         laparams: Forwarded to ``PDFPageAggregator.__init__``
             (default None).
     """
     PDFPageAggregator.__init__(self, rsrcmgr, pageno=pageno, laparams=laparams)
     self.rows = []
     self.page_number = 0
     # Initially flagged as "not an outline page".
     self.outline = False
     # Filled only if there is any outline info.
     self.interesting_text = []
     # Possibly helpful info, but maybe mixed.
     self.aux_text = []
Example #6
0
 def __init__(self, rsrcmgr, pageno=1, laparams=None):
     """Initialise the base aggregator and the empty per-line accumulators.

     Args:
         rsrcmgr: Forwarded unchanged to ``PDFPageAggregator.__init__``.
         pageno: Forwarded to ``PDFPageAggregator.__init__`` (default 1).
         laparams: Forwarded to ``PDFPageAggregator.__init__``
             (default None).
     """
     PDFPageAggregator.__init__(
         self,
         rsrcmgr,
         pageno=pageno,
         laparams=laparams,
     )
     self.rows = []
     self.itemz = []
     self.page_number = 0
     # The line number in which the page starts.
     self.line2page = []
     # Number of times 19 or 20 are found in one line.
     self.nyears = []
     self.allnNames = []
     self.coords = []
     self.ncommas = []
     self.ndots = []
 def __init__(self, rsrcmgr, pageno=1, laparams=None,
              imagewriter=None, imagename=None):
     """Initialise the base aggregator and remember the image settings.

     Args:
         rsrcmgr: Forwarded unchanged to ``PDFPageAggregator.__init__``.
         pageno: Forwarded to ``PDFPageAggregator.__init__`` (default 1).
         laparams: Forwarded to ``PDFPageAggregator.__init__``
             (default None).
         imagewriter: Stored as-is on ``self.imagewriter``.
         imagename: Stored on ``self.imagename`` after conversion with
             ``str()``.
     """
     PDFPageAggregator.__init__(self, rsrcmgr, pageno=pageno, laparams=laparams)
     self.rows = []
     self.page_number = 0
     self.imagewriter = imagewriter
     # NOTE: str() is applied unconditionally, so the default None is
     # stored as the string 'None'.
     self.imagename = str(imagename)
 def __init__(self, rsrcmgr, boxes=None, pageno=1, laparams=None, onlyInside=False):
     """Configure the crop boxes and flags, then initialise the base aggregator.

     Args:
         rsrcmgr: Forwarded unchanged to ``PDFPageAggregator.__init__``.
         boxes: Crop boxes handed to ``self.setCropBoxes``. When omitted
             (or None), a fresh single-box list
             ``[(0, 0, 1080.0, 1440.0)]`` is used.
         pageno: Forwarded to ``PDFPageAggregator.__init__`` (default 1).
         laparams: Forwarded to ``PDFPageAggregator.__init__``
             (default None).
         onlyInside: Stored as-is on ``self.onlyInside``.
     """
     # A list literal as the default would be created once and shared by
     # every instance; build a new list per call instead so one instance
     # can never alter another's default boxes.
     if boxes is None:
         boxes = [(0, 0, 1080.0, 1440.0)]
     # The crop/flag state is assigned before the base initialiser runs,
     # matching the original statement order.
     self.setCropBoxes(boxes)
     self.onlyInside = onlyInside
     self.inFigure = False
     PDFPageAggregator.__init__(self, rsrcmgr, pageno=pageno, laparams=laparams)
Example #9
0
 def __init__(self, rsrcmgr, pageno=1, laparams=None):
     """Initialise the base aggregator and start with no rows on page 0.

     Args:
         rsrcmgr: Forwarded unchanged to ``PDFPageAggregator.__init__``.
         pageno: Forwarded to ``PDFPageAggregator.__init__`` (default 1).
         laparams: Forwarded to ``PDFPageAggregator.__init__``
             (default None).
     """
     PDFPageAggregator.__init__(
         self,
         rsrcmgr,
         pageno=pageno,
         laparams=laparams,
     )
     self.rows = []
     self.page_number = 0
 def __init__(self, rsrcmgr, pageno=1, laparams=None):
     """Delegate construction to ``PDFPageAggregator.__init__``.

     All three arguments are forwarded positionally; no additional
     instance state is set here.
     """
     PDFPageAggregator.__init__(
         self,
         rsrcmgr,
         pageno,
         laparams,
     )
 def __init__(self, rsrcmgr, pageno=1, laparams=None):
     """Pass-through constructor for the base ``PDFPageAggregator``.

     ``rsrcmgr``, ``pageno`` and ``laparams`` are handed on positionally
     and nothing else is initialised in this method.
     """
     PDFPageAggregator.__init__(
         self,
         rsrcmgr,
         pageno,
         laparams,
     )