def _getLucene(self, path):
    """
    Open a Lucene index stored under ``path``.

    :param path: filesystem location of the index directory.
    :return: a ``(writer, reader, searcher)`` tuple; the reader is obtained
        from the writer and the searcher wraps that reader.
    """
    # No analyzer is configured for this writer (None is passed on purpose).
    writer_config = IndexWriterConfig(None)
    # Both settings below are speed tweaks; the compound-file switch
    # applies to Lucene 4.4 and later.
    writer_config.setRAMBufferSizeMB(256.0)
    writer_config.setUseCompoundFile(False)

    index_writer = IndexWriter(FSDirectory.open(Paths.get(path)), writer_config)
    index_reader = index_writer.getReader()
    return index_writer, index_reader, IndexSearcher(index_reader)
def __init__(self, index_dir):
    """
    Set up an index writer on ``index_dir``, creating the directory if needed.

    Stores the directory path in ``self.indexDir``, the analyzer in
    ``self.analyzer`` and the opened writer in ``self.writer``.

    :param index_dir: the dir where to store the index. Missing parent
        directories are created as well.
    :raises OSError: if the directory does not exist and cannot be created.
    """
    self.indexDir = index_dir
    if not os.path.exists(index_dir):
        try:
            # makedirs (unlike mkdir) also creates missing parent directories.
            os.makedirs(index_dir)
        except OSError:
            # Another process may have created the directory between the
            # existence check and makedirs; only re-raise a real failure.
            if not os.path.isdir(index_dir):
                raise
    self.analyzer = MyPythonEnglishAnalyzer(
        stopwords=self.ENGLISH_STOP_WORDS_SET)
    conf = IndexWriterConfig(self.analyzer)
    conf.setUseCompoundFile(False)
    directory = FSDirectory.open(Paths.get(index_dir))
    self.writer = IndexWriter(directory, conf)