Python tameWhitespace 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: parliament.core.parsetools

메소드/함수: tameWhitespace

hotexamples.com에서의 예제들: 10

Python tameWhitespace - 10개의 예제를 찾았습니다. 다음은 오픈소스 프로젝트에서 추출한, Python의 parliament.core.parsetools.tameWhitespace에 대한 실제 사용 예제 중 가장 높은 평가를 받은 것들입니다. 예제를 평가하면 예제의 품질 향상에 도움이 됩니다.

예제 #1

파일 보기

파일: common.py 프로젝트: hlainchb/openlegislature

 def saveProceedingsStatement(self, text, t):
     """Record a block of proceedings text as a ``Statement``.

     The stripped text is passed through ``parsetools.tameWhitespace`` and
     ``parsetools.sane_quotes``. If the result is empty, nothing is recorded.
     Otherwise a ``Statement`` attributed to ``'Proceedings'`` is appended to
     ``self.statements`` and ``self.statement_index`` is advanced by one.

     Args:
         text: Raw proceedings text.
         t: Mapping whose ``'timestamp'`` entry is either a ``datetime.time``
             (combined with ``self.date``) or a complete
             ``datetime.datetime`` (used unchanged).
     """
     text = parsetools.sane_quotes(parsetools.tameWhitespace(text.strip()))
     if not text:
         return
     timestamp = t['timestamp']
     if not isinstance(timestamp, datetime.datetime):
         # datetime.combine() only accepts a datetime.time as its second
         # argument, so a full datetime must bypass it.
         timestamp = datetime.datetime.combine(self.date, timestamp)
     statement = Statement(hansard=self.hansard,
         time=timestamp,
         text=text, sequence=self.statement_index,
         who='Proceedings')
     self.statement_index += 1
     self.statements.append(statement)

예제 #2

파일 보기

파일: __init__.py 프로젝트: DevinMonroe-HalcyonWebDesign/openparliament

def _getHansardNumber(page):
    title = re.search(r'<title>([^<]+)</title>', page).group(1)
    match = re.search(r'Number +(\d+\S*) ', parsetools.tameWhitespace(title)) # New format: Number 079
    if match:
        return re.sub('^0+', '', match.group(1))
    else:
        match = re.search(r'\((\d+\S*)\)', title) # Old format (079)
        if match:
            return re.sub('^0+', '', match.group(1))
        else:
            raise Exception("Couldn't parse number from Hansard title: %s" % title)

예제 #3

파일 보기

파일: common.py 프로젝트: orenmazor/openparliament

 def saveProceedingsStatement(self, text, t):
     """Store proceedings text as a new ``Statement`` in ``self.statements``.

     ``text`` is stripped, then run through ``parsetools.tameWhitespace`` and
     ``parsetools.sane_quotes``. An empty result is ignored. Otherwise the
     statement is created with ``who='Proceedings'`` and the current
     ``self.statement_index``, which is then incremented.

     Args:
         text: Raw proceedings text.
         t: Mapping with a ``'timestamp'`` entry. A ``datetime.time`` value is
             combined with ``self.date``; a ``datetime.datetime`` value is
             used as given.
     """
     text = parsetools.sane_quotes(parsetools.tameWhitespace(text.strip()))
     if not text:
         return
     when = t['timestamp']
     if not isinstance(when, datetime.datetime):
         # Passing a full datetime to datetime.combine() raises TypeError,
         # so only bare time values are combined with the date.
         when = datetime.datetime.combine(self.date, when)
     statement = Statement(hansard=self.hansard,
                           time=when,
                           text=text,
                           sequence=self.statement_index,
                           who='Proceedings')
     self.statement_index += 1
     self.statements.append(statement)

예제 #4

파일 보기

파일: common.py 프로젝트: AskMP/openparliament

 def saveProceedingsStatement(self, text, t):
     """Record a block of proceedings text as a ``Statement``.

     The stripped text goes through ``parsetools.tameWhitespace`` and then
     ``parsetools.sane_quotes``. When the result is empty the call is a
     no-op. Otherwise a ``Statement`` with ``who='Proceedings'`` is appended
     to ``self.statements`` and ``self.statement_index`` is incremented.

     Args:
         text: Raw proceedings text.
         t: Mapping whose ``'timestamp'`` entry is a ``datetime.datetime`` or
             a ``datetime.time``.
     """
     cleaned = parsetools.tameWhitespace(text.strip())
     cleaned = parsetools.sane_quotes(cleaned)
     if not cleaned:
         return

     when = t['timestamp']
     if not isinstance(when, datetime.datetime):
         # The older parser provides only datetime.time objects
         when = datetime.datetime.combine(self.date, when)

     entry = Statement(
         hansard=self.hansard,
         time=when,
         text=cleaned,
         sequence=self.statement_index,
         who='Proceedings')
     self.statement_index += 1
     self.statements.append(entry)

예제 #5

파일 보기

파일: __init__.py 프로젝트: orenmazor/openparliament

def _getHansardNumber(page):
    title = re.search(r'<title>([^<]+)</title>', page).group(1)
    match = re.search(
        r'Number +(\d+\S*) ',
        parsetools.tameWhitespace(title))  # New format: Number 079
    if match:
        return re.sub('^0+', '', match.group(1))
    else:
        match = re.search(r'\((\d+\S*)\)', title)  # Old format (079)
        if match:
            return re.sub('^0+', '', match.group(1))
        else:
            raise Exception("Couldn't parse number from Hansard title: %s" %
                            title)

예제 #6

파일 보기

 def saveProceedingsStatement(self, text, t):
     """Store proceedings text as a new ``Statement`` in ``self.statements``.

     ``text`` is stripped and passed through ``parsetools.tameWhitespace``
     and ``parsetools.sane_quotes``. Nothing happens if the result is empty.
     Otherwise the statement is built with the current
     ``self.statement_index`` and ``who='Proceedings'``, the index is
     incremented, and the statement is appended.

     Args:
         text: Raw proceedings text.
         t: Mapping with a ``'timestamp'`` entry holding either a
             ``datetime.datetime`` or a ``datetime.time``.
     """
     body = parsetools.sane_quotes(
         parsetools.tameWhitespace(text.strip()))
     if not body:
         return

     stamp = t['timestamp']
     if isinstance(stamp, datetime.datetime):
         moment = stamp
     else:
         # The older parser provides only datetime.time objects
         moment = datetime.datetime.combine(self.date, stamp)

     fields = dict(hansard=self.hansard,
                   time=moment,
                   text=body,
                   sequence=self.statement_index,
                   who='Proceedings')
     record = Statement(**fields)
     self.statement_index += 1
     self.statements.append(record)

예제 #7

파일 보기

파일: common.py 프로젝트: AskMP/openparliament

 def addText(self, text, blockquote=False):
     """Append a cleaned block of text to ``self._textbuffer``.

     Does nothing while ``self._ignoretext`` is set. The stripped text is
     passed through ``parsetools.tameWhitespace`` and
     ``parsetools.sane_quotes``. A leading colon and the leading phrases
     ``'He said: '`` / ``'She said: '`` are then removed. Text that ends up
     empty or all whitespace is discarded.

     Args:
         text: Raw text to add.
         blockquote: When true, the text is stored with a ``'> '`` prefix.
             The prefix is also applied when the text starts with
             ``'moved '`` and ``self.hasText()`` is false.
     """
     if self._ignoretext:
         return

     cleaned = parsetools.sane_quotes(
         parsetools.tameWhitespace(text.strip()))
     if cleaned.startswith(':'):
         # Strip initial colon
         cleaned = cleaned[1:].strip()
     # Each offset stops one character short of the prefix length; the
     # remaining space is removed by strip().
     for prefix, offset in (('He said: ', 8), ('She said: ', 9)):
         if cleaned.startswith(prefix):
             cleaned = cleaned[offset:].strip()

     if len(cleaned) == 0 or cleaned.isspace():
         return

     quoted = blockquote or (
         cleaned.startswith('moved ') and not self.hasText())
     self._textbuffer.append((u'> ' + cleaned) if quoted else cleaned)

예제 #8

파일 보기

 def addText(self, text, blockquote=False):
     """Add a new entry to ``self._textbuffer`` after cleaning ``text``.

     The call is ignored when ``self._ignoretext`` is true. Cleaning applies
     ``parsetools.tameWhitespace`` to the stripped text, then
     ``parsetools.sane_quotes``, then drops an initial ``':'`` and an initial
     ``'He said: '`` or ``'She said: '``. Nothing is added if the cleaned
     text is empty or only whitespace.

     Args:
         text: Raw text to add.
         blockquote: If true, the entry is prefixed with ``'> '``. The same
             prefix is used when the text begins with ``'moved '`` and
             ``self.hasText()`` returns a false value.
     """
     if self._ignoretext:
         return

     line = parsetools.tameWhitespace(text.strip())
     line = parsetools.sane_quotes(line)

     if line.startswith(':'):
         # Strip initial colon
         line = line[1:].strip()
     if line.startswith('He said: '):
         line = line[8:].strip()
     if line.startswith('She said: '):
         line = line[9:].strip()

     if not (len(line) > 0 and not line.isspace()):
         return

     if blockquote:
         as_quote = True
     else:
         as_quote = line.startswith('moved ') and not self.hasText()

     if as_quote:
         line = u'> ' + line
     self._textbuffer.append(line)

예제 #9

파일 보기

파일: common.py 프로젝트: AskMP/openparliament

 def appendToText(self, text, italic=False):
     """Extend the last entry of ``self._textbuffer`` with more text.

     Nothing happens unless ``self.hasText()`` is true and
     ``self._ignoretext`` is false. The stripped text is passed through
     ``parsetools.tameWhitespace``; an empty or all-whitespace result is
     dropped.

     Args:
         text: Raw text to append.
         italic: When true, the text is wrapped as ``' <em>...</em> '``
             (with surrounding spaces) before being appended.
     """
     if not self.hasText() or self._ignoretext:
         return

     fragment = parsetools.tameWhitespace(text.strip())
     if not fragment or fragment.isspace():
         return

     if italic:
         fragment = u' <em>' + fragment + u'</em> '
     self._textbuffer[-1] += fragment

예제 #10

파일 보기

 def appendToText(self, text, italic=False):
     """Concatenate cleaned ``text`` onto the final ``self._textbuffer`` item.

     The call has no effect when ``self.hasText()`` is false or
     ``self._ignoretext`` is true. It also has no effect when the text, once
     stripped and passed through ``parsetools.tameWhitespace``, is empty or
     only whitespace.

     Args:
         text: Raw text to append.
         italic: If true, the appended piece is ``' <em>'`` + text +
             ``'</em> '``.
     """
     if self.hasText() and not self._ignoretext:
         piece = parsetools.tameWhitespace(text.strip())
         if len(piece) == 0 or piece.isspace():
             return
         piece = (u' <em>' + piece + u'</em> ') if italic else piece
         self._textbuffer[-1] += piece