Example #1
0
def createInstanceObjectList(processed_dataset):
    '''
    Create a list of Instance objects from pre-processed (text, label) records.

    Parameters:
        processed_dataset: iterable of indexable records where item[1] is the
            raw text line and item[2] is the label.

    Returns:
        list of Instance objects, each with a 1-based tokenDictionary of
        Token objects, optionally normalized per the feature configuration.
    '''
    print('Reading instances...')
    instanceObjects = []
    for item in processed_dataset:
        data = item[1].strip('\n')
        # BUGFIX: the original only assigned `content` when `data` was
        # non-empty, so an empty first line raised UnboundLocalError and a
        # later empty line silently reused the previous line's content.
        # Skip empty records instead.
        if not data:
            continue
        all_words = word_tokenize(data)
        content = ' '.join(str(elem) for elem in all_words)
        label = item[2]
        instanceObject = Instance(content, label)
        # Token positions are 1-based, consistent with the file-based loader.
        for i, token in enumerate(content.split()):
            instanceObject.tokenDictionary[i + 1] = Token(token)
        if FeatureSelection.getInstance(featureFile).normalizeInstances:
            instanceObject.tokenDictionary = instanceObject.normalizeTokens()
        instanceObjects.append(instanceObject)
    return instanceObjects
Example #2
0
def createInstanceObjectList(inputFileName):
    '''
    Create a list of Instance objects from a tab-separated input file, which
    contains all the (linguistic) information needed to extract the features
    for sentiment polarity classification.

    Parameters:
        inputFileName: path to a UTF-8 file with one "content<TAB>label"
            record per line.

    Returns:
        list of Instance objects, each with a 1-based tokenDictionary of
        Token objects, optionally normalized per the feature configuration.
    '''
    print('Reading instances...')
    instanceObjects = []
    with codecs.open(inputFileName, 'r', 'utf8') as inputFile:
        # BUGFIX: the original mixed a tab with spaces on the `for` line,
        # which is a TabError under Python 3; indentation is now uniform.
        for line in inputFile:
            stripped = line.strip()
            # BUGFIX: a blank line made split('\t') return [''] and the
            # two-value unpack raise ValueError; skip blank lines instead.
            if not stripped:
                continue
            content, label = stripped.split('\t')
            instanceObject = Instance(content, label)
            # Token positions are 1-based, consistent with the dataset loader.
            for i, token in enumerate(content.split()):
                instanceObject.tokenDictionary[i + 1] = Token(token)
            if FeatureSelection.getInstance(featureFile).normalizeInstances:
                instanceObject.tokenDictionary = instanceObject.normalizeTokens()
            instanceObjects.append(instanceObject)
    return instanceObjects