Ejemplo n.º 1
0
 def read_block(self, stream, tagspec=None, elt_handler=None):
     """
     Read one block through ``XMLCorpusView.read_block`` and drop ``None`` items.

     ``stream``, ``tagspec`` and ``elt_handler`` are forwarded unchanged.
     The remaining elements are returned as a list, in their original order.
     """
     elements = XMLCorpusView.read_block(self, stream, tagspec, elt_handler)
     return [elt for elt in elements if elt is not None]
Ejemplo n.º 2
0
 def read_block(self, stream, tagspec=None, elt_handler=None):
     """
     Return the block produced by ``XMLCorpusView.read_block`` without ``None``.

     The three arguments are passed straight through; only elements that are
     not ``None`` are kept, and their relative order is preserved.
     """
     block = XMLCorpusView.read_block(self, stream, tagspec, elt_handler)
     return [item for item in block if item is not None]
Ejemplo n.º 3
0
 def handle_query(self):
     """
     Read every block from the view's stream and return them as one list.

     Opens the stream with ``self._open()``, calls
     ``XMLCorpusView.read_block`` repeatedly until it returns an empty
     block, and concatenates the elements of all blocks.

     Returns:
         A list with the elements of every block, in reading order.

     Raises:
         Any exception raised while opening or reading propagates to the
         caller; the stream is still closed if reading fails.
     """
     self._open()
     header = []
     try:
         while True:
             segm = XMLCorpusView.read_block(self, self._stream)
             if not segm:
                 # An empty block marks the end of the stream.
                 break
             header.extend(segm)
     finally:
         # Close on the error path as well, so a failing read does not
         # leave the stream open.
         self.close()
     return header
Ejemplo n.º 4
0
 def handle_query(self):
     """
     Read every block from the view's stream and return them as one list.

     Opens the stream with ``self._open()``, calls
     ``XMLCorpusView.read_block`` repeatedly until it returns an empty
     block, and concatenates the elements of all blocks.

     Returns:
         A list with the elements of every block, in reading order.

     Raises:
         Any exception raised while opening or reading propagates to the
         caller; the stream is still closed if reading fails.
     """
     self._open()
     header = []
     try:
         while True:
             segm = XMLCorpusView.read_block(self, self._stream)
             if not segm:
                 # An empty block marks the end of the stream.
                 break
             header.extend(segm)
     finally:
         # Close on the error path as well, so a failing read does not
         # leave the stream open.
         self.close()
     return header
Ejemplo n.º 5
0
    def read_block(self, stream, tagspec=None, elt_handler=None):
        """
        Read the rest of ``stream`` and return its text as a single string.

        ``XMLCorpusView.read_block`` is called with ``stream`` only
        (``tagspec`` and ``elt_handler`` are accepted but not forwarded)
        until it returns an empty block.  All collected parts are joined
        with single spaces and returned wrapped in a one-element list.
        """
        pieces = []
        while True:
            block = XMLCorpusView.read_block(self, stream)
            if len(block) == 0:
                break
            pieces.extend(block)

        joined = ' '.join(pieces)
        return [joined]
Ejemplo n.º 6
0
    def read_block(self, stream, tagspec=None, elt_handler=None):
        """
        Drain ``stream`` and return the space-joined text in a one-item list.

        Blocks are fetched with ``XMLCorpusView.read_block(self, stream)``
        until an empty block comes back; ``tagspec`` and ``elt_handler``
        are accepted but not passed on.  The parts of every block are joined
        with a single space between them.
        """
        collected = []
        while True:
            chunk = XMLCorpusView.read_block(self, stream)
            if len(chunk) == 0:
                break
            collected.extend(chunk)

        text = ' '.join(collected)
        return [text]
Ejemplo n.º 7
0
 def handle_query(self):
     """
     Collect every non-``None`` element of the stream into one list.

     Opens the stream, reads blocks with ``XMLCorpusView.read_block`` until
     an empty block is returned, and keeps each element that is not
     ``None``.

     Returns:
         A list of the non-``None`` elements, in reading order.

     Raises:
         Whatever exception the open/read/close steps raise, propagated
         unchanged so the caller sees the real error type and message.
     """
     try:
         self._open()
         words = []
         try:
             while True:
                 segm = XMLCorpusView.read_block(self, self._stream)
                 if not segm:
                     # An empty block marks the end of the stream.
                     break
                 words.extend(part for part in segm if part is not None)
         finally:
             # Close the stream whether or not reading succeeded.
             self.close()
         return words
     finally:
         # Always drop the preprocessed file, on success and on failure.
         # Using ``finally`` instead of ``except ...: raise Exception``
         # keeps the original exception intact.
         self.xml_tool.remove_preprocessed_file()
Ejemplo n.º 8
0
 def handle_query(self):
     """
     Build the list of sentences found in the stream.

     Opens the stream and reads blocks with ``XMLCorpusView.read_block``
     until an empty block is returned.  Each element of a block is passed
     through ``self.remove_choice`` and then ``self.get_sentences``; the
     results are appended to the returned list.

     Returns:
         A list with one ``self.get_sentences(...)`` result per element.

     Raises:
         Whatever exception the open/read/processing/close steps raise,
         propagated unchanged so the caller sees the real error.
     """
     try:
         self._open()
         sentences = []
         try:
             while True:
                 sent_segm = XMLCorpusView.read_block(self, self._stream)
                 if not sent_segm:
                     # An empty block marks the end of the stream.
                     break
                 for segm in sent_segm:
                     segm = self.remove_choice(segm)
                     sentences.append(self.get_sentences(segm))
         finally:
             # Close the stream whether or not reading succeeded.
             self.close()
         return sentences
     finally:
         # Always drop the preprocessed file, on success and on failure.
         # Using ``finally`` instead of ``except ...: raise Exception``
         # keeps the original exception intact.
         self.xml_tool.remove_preprocessed_file()
Ejemplo n.º 9
0
 def handle_query(self):
     """
     Collect every non-``None`` element of the stream into one list.

     Opens the stream, reads blocks with ``XMLCorpusView.read_block`` until
     an empty block is returned, and keeps each element that is not
     ``None``.

     Returns:
         A list of the non-``None`` elements, in reading order.

     Raises:
         Whatever exception the open/read/close steps raise, propagated
         unchanged so the caller sees the real error type and message.
     """
     try:
         self._open()
         words = []
         try:
             while True:
                 segm = XMLCorpusView.read_block(self, self._stream)
                 if not segm:
                     # An empty block marks the end of the stream.
                     break
                 words.extend(part for part in segm if part is not None)
         finally:
             # Close the stream whether or not reading succeeded.
             self.close()
         return words
     finally:
         # Always drop the preprocessed file, on success and on failure.
         # Using ``finally`` instead of ``except ...: raise Exception``
         # keeps the original exception intact.
         self.xml_tool.remove_preprocessed_file()
Ejemplo n.º 10
0
 def handle_query(self):
     """
     Build the list of sentences found in the stream.

     Opens the stream and reads blocks with ``XMLCorpusView.read_block``
     until an empty block is returned.  Each element of a block is passed
     through ``self.remove_choice`` and then ``self.get_sentences``; the
     results are appended to the returned list.

     Returns:
         A list with one ``self.get_sentences(...)`` result per element.

     Raises:
         Whatever exception the open/read/processing/close steps raise,
         propagated unchanged so the caller sees the real error.
     """
     try:
         self._open()
         sentences = []
         try:
             while True:
                 sent_segm = XMLCorpusView.read_block(self, self._stream)
                 if not sent_segm:
                     # An empty block marks the end of the stream.
                     break
                 for segm in sent_segm:
                     segm = self.remove_choice(segm)
                     sentences.append(self.get_sentences(segm))
         finally:
             # Close the stream whether or not reading succeeded.
             self.close()
         return sentences
     finally:
         # Always drop the preprocessed file, on success and on failure.
         # Using ``finally`` instead of ``except ...: raise Exception``
         # keeps the original exception intact.
         self.xml_tool.remove_preprocessed_file()