Exemples de Token.tokenize en Python

Langage de programmation: Python

Espace de noms/Paquet : tokenizer

Class/Type: Token

Méthode/Fonction: tokenize

Exemples sur hotexamples.com : 2

Python Token.tokenize - 2 exemples trouvés. Ce sont les exemples réels les mieux notés de tokenizer.Token.tokenize extraits de projets open source. Vous pouvez noter les exemples pour nous aider à en améliorer la qualité.

Méthodes fréquemment utilisées

Afficher Cacher

Token(30)

append(16)

getWord(2)

tokenize(2)

type(2)

bool_val(1)

getPosition(1)

get_math_operators(1)

matches(1)

name(1)

tknOut(1)

tokenType(1)

val(1)

value(1)

xmlFrmt(1)

Méthodes fréquemment utilisées

Token (30)

append (16)

getWord (2)

tokenize (2)

type (2)

bool_val (1)

getPosition (1)

get_math_operators (1)

matches (1)

name (1)

Méthodes fréquemment utilisées

tknOut (1)

tokenType (1)

val (1)

value (1)

xmlFrmt (1)

Exemple #1

0

Afficher le fichier

Fichier : py-node.py Projet : theaiinstitute/aii-platform

def run():
    """Run the chat bot: load the model and Q&A data, then serve Socket.IO events.

    Loads a sent2vec model and the question/answer mapping from
    ``nlp/qas.json``, tokenizes and embeds every known question, registers
    the Socket.IO handlers below, connects to ``http://localhost:5000`` and
    then calls ``sio.wait()``.
    """
    model = sent2vec.Sent2vecModel()
    model.load_model(
        '/home/redlcamille/workspace/sent2vec/torontobooks_unigrams.bin')
    # Use a context manager so the file handle is closed right after parsing
    # instead of being left to the garbage collector.
    with open('nlp/qas.json') as qa_file:
        QAs = json.load(qa_file)
    sio = socketio.Client()
    questions = list(QAs)
    tk = Token()
    toks = tk.tokenize(questions)
    embeds = [model.embed_sentence(q) for q in toks]
    print(toks)

    def send_msg(event, msg):
        """Emit an 'is typing' notice, pause one second, then emit *msg* as *event*."""
        sio.emit('is typing', {'sender': msg['sender'], 'dest': msg['dest']})
        sleep(1)
        sio.emit(event, msg)

    @sio.event
    def connect():
        print('connection established')

    # The two handlers below are registered under an explicit event name, so
    # each gets its own function name rather than both being `on_message`
    # (the second definition used to shadow the first).
    @sio.on('ask for hints')
    def on_ask_for_hints(typed):
        """Reply with known questions whose embedding is close to the typed text."""
        emb = model.embed_sentence(typed['msg'])
        hints = []
        for i, q in enumerate(QAs):
            confid = 1.0 - cosine(embeds[i], emb)
            if confid > 0.7:
                hints.append({'hint': q, 'confidence': '%.2f' % confid})
        # Sorted on the formatted confidence string, best match first.
        hints.sort(key=lambda u: u['confidence'], reverse=True)
        sio.emit('hints', {'dest': typed['sender'], 'hints': hints})

    @sio.on('new chat')
    def on_new_chat(msg):
        """Handle a chat message addressed to the bot."""
        if msg['dest'] != 'bot':
            return

        if 'referral' in msg:
            # A reply to a forwarded question: relay it to the original
            # asker, truncating long replies to 150 characters.
            if len(msg['msg']) > 150:
                send_msg(
                    'new chat', {
                        'sender': 'bot',
                        'dest': msg['referral'],
                        'msg': msg['msg'][:150] + '...',
                        'fullanswer': "Prof's reply: %s" % msg['msg'],
                        'type': 'answer'
                    })
                return
            send_msg(
                'new chat', {
                    'sender': 'bot',
                    'dest': msg['referral'],
                    'msg': "Prof's reply:%s" % msg['msg'],
                    'type': 'answer'
                })
            return

        q = msg['msg']
        # Lower-case once and reuse the result for the lookup.
        key = q.lower()
        known = key in QAs
        print(known)
        if known:
            match = QAs[key]
            answer = match['answer']
            # Send the stored answer one sentence at a time.
            for sent in nlp(answer).sents:
                send_msg(
                    'new chat', {
                        'sender': 'bot',
                        'dest': msg['sender'],
                        'msg': sent.text,
                        'type': 'answer'
                    })
            if 'courses' in match or 'toread' in match:
                res = {
                    'sender': 'bot',
                    'dest': msg['sender'],
                    'msg': 'more insights'
                }
                if 'courses' in match:
                    res['courses'] = match['courses']
                if 'toread' in match:
                    res['toread'] = match['toread']
                send_msg('new chat', res)
        elif q.endswith('?'):
            # Unknown question: apologise to the sender, then forward the
            # question to 'Prof. Alpha' with the sender as the referral.
            excuses = [
                "I'm not qualified to answer this!",
                "I'll deliver this question to someone capable!"
            ]
            for s in excuses:
                send_msg('new chat', {
                    'sender': 'bot',
                    'dest': msg['sender'],
                    'msg': s
                })
            send_msg(
                'new chat', {
                    'sender': 'bot',
                    'dest': 'Prof. Alpha',
                    'msg': 'A student (%s) has the following question: %s' %
                           (msg['sender'], msg['msg']),
                    'referral': msg['sender']
                })

    @sio.event
    def disconnect():
        print('disconnected from server')

    sio.connect('http://localhost:5000')
    sio.wait()

Exemple #2

0

Afficher le fichier

# Script fragment: compute an embedding for every row of the 'question'
# table and store it back. `f`, `tk` and `mod` are defined earlier in the
# file, outside this excerpt.
dbconfig = json.load(f)

# connect to the server
# Keyword arguments are used instead of a hand-formatted DSN string so that
# values containing spaces or quotes (e.g. the password) need no escaping.
conn = psycopg2.connect(
    dbname=dbconfig['database'],
    user=dbconfig['user'],
    host=dbconfig['host'],
    port=dbconfig['port'],
    password=dbconfig['password'],
)
try:
    cur = conn.cursor()
    try:
        # extract all questions from the table 'question'
        cur.execute("SELECT id, question_text FROM question;")
        questions = cur.fetchall()

        # iterate over all questions
        processed = 0
        total = 0
        for idx, text in questions:
            tks = tk.tokenize([text])[0]
            embeddings = mod.encode([tks])[0].tolist()
            cur.execute(
                "update question set dimensions=%s, vectorisation=%s where id=%s",
                [len(embeddings), embeddings, idx])
            # Count the row before reporting so the running total includes it.
            processed += 1
            print('done for question with %d - total processed questions: %d' %
                  (idx, processed))
        conn.commit()
    finally:
        cur.close()
finally:
    # close the database (also on error, so the connection is never leaked)
    conn.close()