예제 #1
0
 def __init__(
         self,
         rsrcmgr,
         outfp,
         codec='utf-8',
         pageno=1,
         laparams=None,
         showpageno=False,
         imagewriter=None):
     """Run ``TextConverter.__init__`` and start with an empty ``text``.

     ``showpageno`` and ``imagewriter`` are not forwarded to
     ``TextConverter.__init__``; they are stored on the instance here
     after the delegated initialiser has run.
     """
     TextConverter.__init__(
         self,
         rsrcmgr,
         outfp,
         codec=codec,
         pageno=pageno,
         laparams=laparams,
     )
     self.text = ''
     self.imagewriter = imagewriter
     self.showpageno = showpageno
예제 #2
0
 def __init__(self, rsrcmgr, codec='cp1251', pageno=1, laparams=None):
     """Initialise via ``TextConverter.__init__`` with a throwaway stream.

     A fresh ``io.StringIO`` is passed as ``outfp``; this method keeps no
     reference to it. The annotation set and the sentence-tracking
     attributes all start out empty.
     """
     TextConverter.__init__(
         self,
         rsrcmgr,
         outfp=io.StringIO(),
         codec=codec,
         pageno=pageno,
         laparams=laparams,
     )
     self.annots = set()
     self.current_sentence = ''
     self.current_sentence_should_be_added_to_these_annotations_on_end = set()
예제 #3
0
 def __init__(self, rsrcmgr, codec='utf-8', pageno=1, laparams=None):
     """Initialise via ``TextConverter.__init__`` and create ``annots``.

     The caller supplies no output stream: an in-memory ``io.StringIO``
     is passed as ``outfp`` instead. ``annots`` starts as an empty set.
     """
     sink = io.StringIO()
     TextConverter.__init__(
         self, rsrcmgr, outfp=sink, codec=codec, pageno=pageno, laparams=laparams)
     self.annots = set()
예제 #4
0
파일: pdf_in.py 프로젝트: yask123/moin-2.0
 def __init__(self, rsrcmgr, pageno=1, laparams=None, showpageno=False):
     """Initialise via ``TextConverter.__init__`` and create a text list.

     ``None`` is passed both as the positional argument following
     ``rsrcmgr`` (presumably the output stream -- confirm against
     ``TextConverter``) and as ``codec``. The private ``__text``
     attribute starts as an empty list.
     """
     TextConverter.__init__(
         self, rsrcmgr, None, codec=None,
         pageno=pageno, laparams=laparams, showpageno=showpageno)
     self.__text = []
예제 #5
0
 def __init__(self, rsrcmgr, outfp, codec='utf-8', pageno=1, laparams=None,
              showpageno=False, imagewriter=None):
     """Forward every argument unchanged to ``TextConverter.__init__``.

     No additional instance state is set up here.
     """
     TextConverter.__init__(
         self, rsrcmgr, outfp,
         codec=codec, pageno=pageno, laparams=laparams,
         showpageno=showpageno, imagewriter=imagewriter)
예제 #6
0
 def __init__(self, rsrcmgr, outfp, codec='utf-8', pageno=1, laparams=None,
              showpageno=False, imagewriter=None):
     """Run ``TextConverter.__init__`` and set up per-page bookkeeping.

     ``showpageno`` and ``imagewriter`` are not forwarded to
     ``TextConverter.__init__``; they are stored on the instance here.
     ``textlines`` starts as an empty dict and ``pagenumber`` as 0.
     """
     TextConverter.__init__(
         self, rsrcmgr, outfp, codec=codec, pageno=pageno, laparams=laparams)
     self.pagenumber = 0
     self.textlines = {}  # per page number
     self.imagewriter = imagewriter
     self.showpageno = showpageno
예제 #7
0
 def __init__(self, *args, **kwargs):
     """Hand every argument straight to ``TextConverter.__init__``."""
     TextConverter.__init__(self, *args, **kwargs)
예제 #8
0
 def __init__(self, *args, **kwargs):
     """Hand every argument straight to ``TextConverter.__init__``.

     Nothing else is initialised here.
     """
     TextConverter.__init__(self, *args, **kwargs)
예제 #9
0
파일: pdf2text.py 프로젝트: zaim/bukutip
 def __init__(self, *args, **kwargs):
     """Create an empty ``results`` list, then run ``TextConverter.__init__``.

     All positional and keyword arguments are forwarded unchanged.
     """
     # Assigned before the delegated initialiser runs, so the attribute
     # already exists while TextConverter.__init__ executes.
     self.results = []
     TextConverter.__init__(self, *args, **kwargs)
예제 #10
0
파일: pdf_in.py 프로젝트: pombredanne/moin2
 def __init__(self, rsrcmgr, pageno=1, laparams=None, showpageno=False):
     """Initialise via ``TextConverter.__init__`` and create a text list.

     ``None`` is passed both as the positional argument following
     ``rsrcmgr`` (presumably the output stream -- confirm against
     ``TextConverter``) and as ``codec``. The private ``__text``
     attribute starts as an empty list.
     """
     TextConverter.__init__(
         self,
         rsrcmgr,
         None,
         codec=None,
         pageno=pageno,
         laparams=laparams,
         showpageno=showpageno,
     )
     self.__text = []
예제 #11
0
 def __init__(self, separator=',', threshold=1.5, *args, **kwargs):
     """Store ``separator`` and ``threshold``; forward everything else.

     Because the two settings precede ``*args`` in the signature, the
     first two positional arguments bind to them; any remaining
     positional and keyword arguments go to ``TextConverter.__init__``
     unchanged.
     """
     TextConverter.__init__(self, *args, **kwargs)
     self.threshold = threshold
     self.separator = separator
예제 #12
0
 def __init__(self, rsrcmgr, outfp, laparams=laparams):
     """Forward ``rsrcmgr``, ``outfp`` and ``laparams`` to ``TextConverter.__init__``.

     NOTE(review): the default for ``laparams`` is whatever the name
     ``laparams`` refers to in the enclosing scope at the moment this
     method is defined; that scope is not visible here -- confirm the
     name exists there and that capturing it is intended.
     """
     TextConverter.__init__(
         self,
         rsrcmgr,
         outfp,
         laparams=laparams,
     )
예제 #13
0
파일: f.py 프로젝트: kamekame/alpha
 def __init__(self, *args, **kwargs):
     """Run ``TextConverter.__init__`` and store ``separator``/``threshold``.

     All positional and keyword arguments are forwarded unchanged.

     NOTE(review): ``separator`` and ``threshold`` are neither parameters
     nor locals of this method; they must resolve from an enclosing or
     module scope that is not visible here -- confirm they are defined
     there before this initialiser can run.
     """
     TextConverter.__init__(self, *args, **kwargs)
     self.separator = separator
     self.threshold = threshold
예제 #14
0
 def __init__(self, *args, **kwargs):
     """Run ``TextConverter.__init__``, then create an empty ``pages`` dict.

     All positional and keyword arguments are forwarded unchanged.
     """
     TextConverter.__init__(self, *args, **kwargs)
     self.pages = {}