Python getDataFromFile 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: DataProcessing.Utilities

메소드/함수: getDataFromFile

hotexamples.com에서의 예제들: 8

Python getDataFromFile - 8개의 예제를 찾았습니다. 아래는 오픈소스 프로젝트에서 추출한 Python DataProcessing.Utilities.getDataFromFile의 실제 사용 예제 중 평가가 가장 높은 것들입니다. 예제를 평가해 주시면 예제의 품질을 개선하는 데 도움이 됩니다.

예제 #1

파일 보기

def getTrainingData(text_features=True):
    '''
        Reads the training file, builds state features from it and returns
        the feature probabilities computed by findProbabilityForFeatures.

        text_features: when truthy, features come from findFeaturesForText
        applied to the output of findLowFrequencyWord; otherwise they come
        from findFeaturesForPOS. The result is also saved to disk and
        pretty-printed before being returned.
    '''
    #Read and parse the training file located at dir_path + training_file
    handle = loadFile(dir_path + training_file)
    token_ner, token_pos = parseTrainingData(getDataFromFile(handle))

    if text_features:
        #Similarity based classifier: restricted to low frequency words
        #(the original note says "count less than 3"; the actual threshold
        #lives in findLowFrequencyWord - TODO confirm)
        kind = "text_features"
        features = findFeaturesForText(findLowFrequencyWord(token_ner))
    else:
        #POS based classifier: uses every token
        kind = "pos_features"
        features = findFeaturesForPOS(token_pos, token_ner)

    #Turn the features into probabilities, persist them and echo them
    probabilities = findProbabilityForFeatures(features)
    saveFeaturesToDisk(probabilities, kind)
    pprint(probabilities)
    return probabilities

예제 #2

파일 보기

파일: HandleLowFrequencyWords.py 프로젝트: gkeswani92/Named-Entity-Recognition

def getTrainingData(text_features=True):
    """
        Loads the training file, derives state features and returns their
        probabilities as computed by findProbabilityForFeatures.

        The text_features flag picks the feature extractor (text based when
        truthy, POS based otherwise) and the label handed to
        saveFeaturesToDisk. The probabilities are pretty-printed as well.
    """
    # Read the raw training data and split it into its two parsed parts
    source = loadFile(dir_path + training_file)
    raw_data = getDataFromFile(source)
    token_ner, token_pos = parseTrainingData(raw_data)

    if not text_features:
        # POS based classifier: all words are considered
        label = "pos_features"
        extracted = findFeaturesForPOS(token_pos, token_ner)
    else:
        # Similarity based classifier: only low frequency words are used
        # (original note: count less than 3 - the threshold itself is set
        # inside findLowFrequencyWord; TODO confirm)
        label = "text_features"
        rare_tokens = findLowFrequencyWord(token_ner)
        extracted = findFeaturesForText(rare_tokens)

    # Compute, store and display the probabilities for the features
    result = findProbabilityForFeatures(extracted)
    saveFeaturesToDisk(result, label)
    pprint(result)
    return result

예제 #3

파일 보기

파일: DynamicTagger.py 프로젝트: gkeswani92/Named-Entity-Recognition

def getTrainingData():
    '''
        Loads the training file and returns a pair: the output of
        processTrainingData and the value getMaxLengthKey reports for it.
    '''
    #Read the raw contents of the training file
    raw = getDataFromFile(loadFile(dir_path + training_file))

    #Parse into the three components and combine them
    context, pos, ner = parseTrainingData(raw)
    processed = processTrainingData(context, pos, ner)

    return processed, getMaxLengthKey(processed)

예제 #4

파일 보기

파일: DynamicTagger.py 프로젝트: gkeswani92/Named-Entity-Recognition

def getTrainingData():
    '''
        Reads the training file from dir_path, processes it and returns
        (processed training data, result of getMaxLengthKey on that data).
    '''
    #Open the training file and pull its contents
    source = loadFile(dir_path + training_file)
    contents = getDataFromFile(source)

    #Parse the contents, then build the processed training structure
    parsed_context, parsed_pos, parsed_ner = parseTrainingData(contents)
    prepared = processTrainingData(parsed_context, parsed_pos, parsed_ner)

    #Pair the processed data with its largest key size
    key_size = getMaxLengthKey(prepared)
    outcome = (prepared, key_size)
    return outcome

예제 #5

파일 보기

파일: LoadData.py 프로젝트: gkeswani92/Named-Entity-Recognition

def getTestData(HMM=False):
    '''
        Loads the test file and returns the (context, pos, index) triple
        produced by the parser selected through the HMM flag.

        HMM: when truthy parseTestDataHMM is used, otherwise parseTestData.
    '''
    #Read the raw contents of the test file
    raw = getDataFromFile(loadFile(dir_path + test_file))

    #Only the parser differs between the two modes
    parser = parseTestDataHMM if HMM else parseTestData
    context, pos, index = parser(raw)
    return context, pos, index

예제 #6

파일 보기

파일: LoadData.py 프로젝트: cfan2012/Named-Entity-Recognition

def getTestData(HMM=False):
    '''
        Reads the test file from dir_path and returns a
        (context, pos, index) tuple.

        HMM: selects parseTestDataHMM when truthy and parseTestData
        otherwise.
    '''
    #Open the test file and pull its contents
    source = loadFile(dir_path + test_file)
    contents = getDataFromFile(source)

    #Run the parser that matches the requested mode
    if HMM:
        parsed = parseTestDataHMM(contents)
    else:
        parsed = parseTestData(contents)

    #Both parsers are unpacked into exactly three parts
    context, pos, index = parsed
    return context, pos, index

예제 #7

파일 보기

파일: LoadData.py 프로젝트: gkeswani92/Named-Entity-Recognition

def getTrainingData(HMM=False):
    '''
        Loads the training file and returns it in the form required by the
        selected mode.

        HMM: when truthy, returns the (context, pos, ner) triple from
        parseTrainingDataHMM; otherwise returns the result of
        processTrainingData applied to the parseTrainingData output.
    '''
    #Read the raw contents of the training file
    raw = getDataFromFile(loadFile(dir_path + training_file))

    #HMM mode hands back the parsed parts untouched
    if HMM:
        context, pos, ner = parseTrainingDataHMM(raw)
        return context, pos, ner

    #Default mode combines the parsed parts into one structure
    context, pos, ner = parseTrainingData(raw)
    return processTrainingData(context, pos, ner)

예제 #8

파일 보기

파일: LoadData.py 프로젝트: cfan2012/Named-Entity-Recognition

def getTrainingData(HMM=False):
    '''
        Reads the training file from dir_path and prepares it for the
        requested mode.

        HMM: falsy -> the parts from parseTrainingData are passed through
        processTrainingData and that result is returned; truthy -> the
        (context, pos, ner) tuple from parseTrainingDataHMM is returned.
    '''
    #Open the training file and pull its contents
    source = loadFile(dir_path + training_file)
    contents = getDataFromFile(source)

    if HMM:
        #HMM mode: return the three parsed parts as they are
        hmm_context, hmm_pos, hmm_ner = parseTrainingDataHMM(contents)
        outcome = (hmm_context, hmm_pos, hmm_ner)
    else:
        #Default mode: merge the parsed parts via processTrainingData
        plain_context, plain_pos, plain_ner = parseTrainingData(contents)
        outcome = processTrainingData(plain_context, plain_pos, plain_ner)
    return outcome