import logging
import os
import sys
import time

# Project-specific imports; the module paths below are assumptions -- adjust
# them to wherever readCoNLL and ELMoWordEmbeddings live in your codebase.
from util.preprocessing import readCoNLL
from neuralnets.ELMoWordEmbeddings import ELMoWordEmbeddings


def create_cache(args):
    """Precompute ELMo embeddings for a dataset's splits and store them as a pickle cache."""
    datasetName = args.datasetName
    tokenColId = args.tokenColumnId
    cudaDevice = args.cuda_device
    elmo_options_file = args.elmo_options
    elmo_weight_file = args.elmo_weights
    # Example pretrained model paths:
    #elmo_options_file = 'pretrained/elmo_2x4096_512_2048cnn_2xhighway_5.5B_options.json'
    #elmo_weight_file = 'pretrained/elmo_2x4096_512_2048cnn_2xhighway_5.5B_weights.hdf5'
    #elmo_options_file = 'pretrained/velmo_options.json'
    #elmo_weight_file = 'pretrained/velmo_weights.hdf5'

    # :: Logging level ::
    loggingLevel = logging.INFO
    logger = logging.getLogger()
    logger.setLevel(loggingLevel)

    ch = logging.StreamHandler(sys.stdout)
    ch.setLevel(loggingLevel)
    formatter = logging.Formatter('%(message)s')
    ch.setFormatter(formatter)
    logger.addHandler(ch)

    # Only the token column is needed to build the embedding cache
    commentSymbol = None
    columns = {tokenColId: 'tokens'}

    #picklePath = "embeddings/elmo_cache_" + datasetName + ".pkl"
    #picklePath = "embeddings/velmo_cache_conll2000_data_perturbed_03.pkl"
    #picklePath = "embeddings/velmo_cache_conll2000_data_clean.pkl"
    picklePath = args.pkl_path

    embLookup = ELMoWordEmbeddings(None, elmo_options_file, elmo_weight_file, elmo_cuda_device=cudaDevice)

    print("ELMo Cache Generation")
    print("Output file:", picklePath)
    print("CUDA Device:", cudaDevice)

    # Embed every sentence from each split and add it to the in-memory cache
    splitFiles = ['train.txt', 'dev.txt', 'test.txt']
    for splitFile in splitFiles:
        inputPath = os.path.join('data', datasetName, splitFile)
        print("Adding file to cache: " + inputPath)
        sentences = readCoNLL(inputPath, columns, commentSymbol)
        tokens = [sentence['tokens'] for sentence in sentences]

        start_time = time.time()
        embLookup.addToCache(tokens)
        end_time = time.time()
        print("%s processed in %.1f seconds" % (splitFile, end_time - start_time))
        print("\n---\n")

    # Persist the cache to disk once all splits are processed
    print("Store file at:", picklePath)
    embLookup.storeCache(picklePath)
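
# A minimal command-line driver for create_cache(). This block is a sketch,
# not part of the original script: the argument names match the attributes
# the function reads (args.datasetName, args.tokenColumnId, args.cuda_device,
# args.elmo_options, args.elmo_weights, args.pkl_path), but the defaults and
# help texts are assumptions and may need adjusting.
if __name__ == '__main__':
    import argparse

    parser = argparse.ArgumentParser(description='Precompute an ELMo embedding cache for a dataset.')
    parser.add_argument('datasetName', help='Dataset directory under data/')
    parser.add_argument('tokenColumnId', type=int, help='Index of the token column in the CoNLL files')
    parser.add_argument('pkl_path', help='Output path for the pickled embedding cache')
    parser.add_argument('--cuda_device', type=int, default=-1, help='CUDA device id (-1 for CPU)')
    parser.add_argument('--elmo_options', required=True, help='Path to the ELMo options JSON file')
    parser.add_argument('--elmo_weights', required=True, help='Path to the ELMo weights HDF5 file')

    create_cache(parser.parse_args())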