Python nth_occurrence 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: munge.util.str_utils

메소드/함수: nth_occurrence

hotexamples.com에서의 예제들: 8

Python nth_occurrence - 8개의 예제를 찾았습니다. 아래는 오픈소스 프로젝트에서 추출한 Python munge.util.str_utils.nth_occurrence의 실제 사용 예제 중 평가가 가장 높은 것들입니다. 각 예제를 평가해 주시면 예제 품질을 높이는 데 도움이 됩니다.

예제 #1

파일 보기

파일: io.py 프로젝트: Oneplus/cnccgbank

 def derivation_with_index(self, filename, index=None):
     """Parse ``filename`` in full, or only the part selected by ``index``.

     Args:
         filename: Path of the file to open for reading.
         index: When truthy, forwarded to ``nth_occurrence`` as ``N`` so
             that only the selected lines are parsed. When falsy
             (``None`` or ``0``) the whole file is parsed.

     Returns:
         Whatever ``self.parse_file`` returns for the selected text.
     """
     # Both the ``when`` and ``until`` predicates test for a line that
     # begins with "(".
     def opens_derivation(line):
         return re.match(r"^\(", line)

     with open(filename, 'r') as treebank:
         if not index:
             return self.parse_file(treebank.read())

         # A file object already iterates line by line; the deprecated
         # xreadlines() (gone in Python 3) merely returned the file itself.
         # NOTE(review): nth_occurrence presumably yields the lines of the
         # N-th matching span - confirm against munge.util.str_utils.
         selected = nth_occurrence(treebank,
                                   N=index,
                                   when=opens_derivation,
                                   until=opens_derivation)
         return self.parse_file(''.join(selected))

예제 #2

파일 보기

 def derivation_with_index(self, filename, index=None):
     """Read ``filename`` and hand its text (or one slice of it) to the parser.

     Args:
         filename: Path of the file to open for reading.
         index: Falsy (``None``/``0``) to parse the entire file; otherwise
             the value passed to ``nth_occurrence`` as ``N``.

     Returns:
         The result of ``self.parse_file`` on the chosen text.
     """
     with open(filename, 'r') as source:
         if index:
             # Iterate the file object directly: xreadlines() is deprecated
             # in Python 2 and absent in Python 3, and only returned the
             # file itself anyway.
             # NOTE(review): the exact span semantics of nth_occurrence are
             # not visible here; start and stop predicates both look for a
             # line beginning with "(".
             chunk = nth_occurrence(
                 source,
                 N=index,
                 when=lambda line: re.match(r"^\(", line),
                 until=lambda line: re.match(r"^\(", line))
             text = ''.join(chunk)
         else:
             text = source.read()
         return self.parse_file(text)

예제 #3

파일 보기

 def derivation_with_index(self, filename, index=None):
     """Return an iterator over right-stripped lines of ``filename``.

     Args:
         filename: Path of the file to open for reading.
         index: Falsy (``None``/``0``) to iterate every line. Otherwise the
             entry number used, together with ``self.sec_no`` and
             ``self.doc_no``, to build the ``ID=wsj_<sec><doc>.<index> ``
             header that selects the lines to return.

     Returns:
         An iterator of lines with trailing whitespace removed.

     The file handle is stored on ``self.file`` and is not closed here,
     because the stripped-line iterator reads from it lazily.
     """
     self.file = open(filename, 'r')

     # A generator expression over the file object is as lazy as
     # imap(..., xreadlines()) but does not rely on Python-2-only names.
     base = (line.rstrip() for line in self.file)
     if not index:
         return base

     # The dot is escaped so it only matches a literal "."; the trailing
     # space ensures we match the whole ID token.
     header = re.compile(
         r"^ID=wsj_%02d%02d\.%d " % (self.sec_no, self.doc_no, index))
     # NOTE(review): nth_occurrence presumably returns the first span that
     # starts at the header and runs until an "ID" line - confirm.
     lines = nth_occurrence(base,
                            N=1,
                            when=header.match,
                            until=lambda line: re.match(r"^ID", line))
     return iter(lines)

예제 #4

파일 보기

파일: io.py 프로젝트: VikingMew/cnccgbank

    def derivation_with_index(self, filename, index=None):
        """Open ``filename`` and iterate its lines with trailing whitespace removed.

        Args:
            filename: Path of the file to open for reading.
            index: When falsy (``None``/``0``) all lines are yielded. When
                truthy, only the lines that ``nth_occurrence`` selects for
                the header ``ID=wsj_<sec><doc>.<index> `` (formatted from
                ``self.sec_no`` and ``self.doc_no``) are returned.

        Returns:
            An iterator over the selected, right-stripped lines.

        The opened file is kept on ``self.file`` and is not closed by this
        method; the returned iterator consumes it lazily.
        """
        self.file = open(filename, "r")

        # Lazy line stripping without the Python-2-only imap()/xreadlines().
        stripped = (raw.rstrip() for raw in self.file)
        if not index:
            return stripped

        # Escape the dot so it cannot match an arbitrary character, and
        # keep the space after the pattern to match the whole token.
        wanted_id = re.compile(
            r"^ID=wsj_%02d%02d\.%d " % (self.sec_no, self.doc_no, index)
        )
        # NOTE(review): span semantics of nth_occurrence are defined in
        # munge.util.str_utils and are not visible here.
        lines = nth_occurrence(
            stripped,
            N=1,
            when=wanted_id.match,
            until=lambda line: re.match(r"^ID", line),
        )
        return iter(lines)

예제 #5

파일 보기

파일: io.py 프로젝트: Oneplus/cnccgbank

 def derivation_with_index(self, filename, i=None):
     """Feed ``filename`` (or one ``<S>`` block of it) to a fresh SGMLBag and parse it.

     Args:
         filename: Path of the file to open for reading.
         i: Falsy (``None``/``0``) to feed the whole file; otherwise passed
             to ``nth_occurrence`` as ``N`` to pick the block delimited by
             a line starting with ``<S`` and a line starting with ``</S``.

     Returns:
         The result of ``parse_tree`` on the collected ``'s'`` contents, or
         on the empty string when no ``'s'`` contents were collected.
     """
     self.contents = SGMLBag()
     with open(filename, 'r') as sgml_file:
         if i:
             # Iterate the file object directly; xreadlines() is deprecated
             # in Python 2, removed in Python 3, and returned the file itself.
             block = nth_occurrence(sgml_file,
                                    N=i,
                                    when=lambda line: re.match(r'^<S', line),
                                    until=lambda line: re.match(r'^</S', line))
             text = ''.join(block)
         else:
             text = sgml_file.read()

         self.contents.feed(text)

     # HACK HACK HACK:
     # Sometimes <S>...</S> encloses more than one root (3:7 has some);
     # in which case, counting <S> will undercount the number of sentences
     sentences = self.contents['s']
     if sentences is None:
         return parse_tree('', AugmentedPennParser)

     return parse_tree('\n'.join(sentences), AugmentedPennParser)

예제 #6

파일 보기

파일: io.py 프로젝트: Oneplus/cnccgbank

    def derivation_with_index(self, filename, i=None):
        """Parse the contents of the first ``<HEADLINE>`` block in ``filename``.

        Args:
            filename: Path of the file to open for reading.
            i: When truthy, used as an index into the headline lines that
                follow the opening tag, so only that line is fed to the
                bag. When falsy, all of those lines are fed.

        Returns:
            ``None`` if ``nth_occurrence`` finds nothing; otherwise the
            result of ``parse_tree`` on the collected ``'s'`` contents.

        Raises:
            CPTBParseException: If the first selected line does not start
                with ``<HEADLINE``.
        """
        self.contents = SGMLBag()
        with open(filename, 'r') as source:
            block = nth_occurrence(
                source,
                N=1,
                when=lambda line: re.match(r'^<HEADLINE', line),
                until=lambda line: re.match(r'^</HEADLINE', line))
            if not block:
                return None

            opening = block[0]
            if not opening.startswith('<HEADLINE'):
                raise CPTBParseException('Expected to find a <HEADLINE> line.')

            # Everything after the opening <HEADLINE> tag line.
            body = block[1:]
            text = ''.join(body[i]) if i else '\n'.join(body)

            self.contents.feed(text)

        return parse_tree('\n'.join(self.contents['s']), AugmentedPennParser)

예제 #7

파일 보기

    def derivation_with_index(self, filename, i=None):
        """Load ``filename`` into a new SGMLBag and parse its ``'s'`` contents.

        Args:
            filename: Path of the file to open for reading.
            i: When truthy, forwarded to ``nth_occurrence`` as ``N`` to
                select the block bounded by a line starting with ``<S`` and
                a line starting with ``</S``. When falsy, the entire file
                is fed to the bag.

        Returns:
            The result of ``parse_tree`` on the newline-joined ``'s'``
            contents, or on ``''`` when the bag holds ``None`` for ``'s'``.
        """
        self.contents = SGMLBag()
        with open(filename, 'r') as handle:
            if not i:
                text = handle.read()
            else:
                # The file object is its own line iterator; the deprecated
                # xreadlines() (removed in Python 3) is not needed.
                text = ''.join(
                    nth_occurrence(handle,
                                   N=i,
                                   when=lambda line: re.match(r'^<S', line),
                                   until=lambda line: re.match(r'^</S', line)))

            self.contents.feed(text)

        # HACK HACK HACK:
        # Sometimes <S>...</S> encloses more than one root (3:7 has some);
        # in which case, counting <S> will undercount the number of sentences
        collected = self.contents['s']
        if collected is None:
            return parse_tree('', AugmentedPennParser)

        return parse_tree('\n'.join(collected), AugmentedPennParser)

예제 #8

파일 보기

    def derivation_with_index(self, filename, i=None):
        """Extract the first ``<HEADLINE>`` block of ``filename`` and parse it.

        Args:
            filename: Path of the file to open for reading.
            i: Truthy to feed only the line at position ``i`` among the
                lines following the opening tag; falsy to feed all of them
                joined by newlines.

        Returns:
            ``None`` when ``nth_occurrence`` yields nothing, else the
            result of ``parse_tree`` on the bag's ``'s'`` contents.

        Raises:
            CPTBParseException: When the first selected line does not begin
                with ``<HEADLINE``.
        """
        def is_open_tag(line):
            return re.match(r'^<HEADLINE', line)

        def is_close_tag(line):
            return re.match(r'^</HEADLINE', line)

        self.contents = SGMLBag()
        with open(filename, 'r') as fh:
            found = nth_occurrence(fh, N=1, when=is_open_tag, until=is_close_tag)
            if not found:
                return None

            if not found[0].startswith('<HEADLINE'):
                raise CPTBParseException('Expected to find a <HEADLINE> line.')

            # Drop the opening <HEADLINE> line before selecting content.
            remainder = found[1:]
            if i:
                text = ''.join(remainder[i])
            else:
                text = '\n'.join(remainder)

            self.contents.feed(text)

        joined = '\n'.join(self.contents['s'])
        return parse_tree(joined, AugmentedPennParser)