def __init__(self, indexDir, analyzer):
    """Create an ``IndexWriter`` over ``indexDir`` and keep it on ``self.writer``.

    Args:
        indexDir: Handed to ``IndexWriter`` as the index location
            (presumably a Lucene ``Directory`` -- confirm against callers).
        analyzer: Handed to ``IndexWriterConfig`` as the analyzer.
    """
    # Start the JVM before any Lucene class is instantiated below.
    lucene.initVM()
    logger.info("RAM index")

    cfg = IndexWriterConfig(analyzer)
    # Score with the project's own similarity instead of Lucene's default.
    cfg.setSimilarity(mySimilarity())
    active_similarity = cfg.getSimilarity()
    logger.debug('writer similarity func: {}'.format(active_similarity))

    self.writer = IndexWriter(indexDir, cfg)
def __init__(self):
    """Set up an ``IndexWriter`` over a new ``RAMDirectory``.

    The directory is stored on ``self.indexDir`` and the writer on
    ``self.writer``. Text is analyzed with ``SmartChineseAnalyzer``.
    """
    # NOTE(review): lucene.initVM() is not called here; presumably the JVM
    # has already been started by the time this runs -- confirm.
    ram_dir = RAMDirectory()
    cfg = IndexWriterConfig(SmartChineseAnalyzer())

    # CREATE mode starts from a fresh index, dropping any documents that
    # were indexed previously.
    cfg.setOpenMode(IndexWriterConfig.OpenMode.CREATE)
    cfg.setSimilarity(mySimilarity())
    active_similarity = cfg.getSimilarity()
    logger.debug('search similarity:{}'.format(active_similarity))

    self.indexDir = ram_dir
    self.writer = IndexWriter(ram_dir, cfg)
def __init__(self, lang):
    """Open an ``IndexWriter`` on the on-disk index at ``config.IDX_SSQA``.

    The writer is stored on ``self.writer``. Text is analyzed with
    ``SmartChineseAnalyzer`` and scored with ``mySimilarity``.

    Args:
        lang: Language code of the index. Only ``'zh'`` is handled here.

    Raises:
        ValueError: If ``lang`` is anything other than ``'zh'``.
    """
    # Validate up front so an unsupported language fails before the JVM is
    # started or the index directory is opened.
    if lang != 'zh':
        # Only 'zh' is implemented, so the message must not list "en" as
        # an accepted value.
        raise ValueError(
            'lang should be "zh", {} is invalid!'.format(lang))

    lucene.initVM()
    logger.info("index directory:{}".format(config.IDX_SSQA))
    indexDir = SimpleFSDirectory(Paths.get(str(config.IDX_SSQA)))
    analyzer = SmartChineseAnalyzer()

    writerConfig = IndexWriterConfig(analyzer)
    # Score with the project's own similarity instead of Lucene's default.
    writerConfig.setSimilarity(mySimilarity())
    logger.debug('writer similarity func: {}'.format(
        writerConfig.getSimilarity()))
    self.writer = IndexWriter(indexDir, writerConfig)