Ejemplo n.º 1
0
 def on_post(self, req, resp):
     """Handle POST requests: classify a document sent as a JSON body.

     Sets the CORS and cache-control response headers, reads the raw request
     body, parses it as JSON, cleans the ``title`` and ``content`` fields and
     hands them to ``self.bert_classification``. Whatever that call returns is
     assigned to ``resp.media``.

     Args:
         req: Incoming request. Its body is expected to be a JSON object
             with ``title`` and ``content`` keys.
         resp: Outgoing response; headers and ``media`` are set on it.

     Raises:
         ValueError: If the body is not valid JSON (``json.loads`` failure,
             which includes an empty body).
         KeyError: If ``title`` or ``content`` is missing from the payload.
     """
     resp.set_header('Access-Control-Allow-Origin', 'http://localhost:8081')
     resp.set_header('Access-Control-Allow-Methods', '*')
     resp.set_header('Access-Control-Allow-Headers', '*')
     resp.set_header('Access-Control-Allow-Credentials', 'true')
     resp.set_header("Cache-Control", "no-cache")
     # content_length is None when the client sends no Content-Length header;
     # fall back to 0 so the stream is never read with an unbounded size.
     data = req.stream.read(req.content_length or 0)
     jsondata = json.loads(data)
     # json.loads yields a dict for a JSON object, so fields must be read by
     # key; attribute access (jsondata.title) raises AttributeError.
     clean_title = shortenlines(jsondata['title'])
     clean_content = cleanall(jsondata['content'])
     resp.media = self.bert_classification(clean_title, clean_content)
Ejemplo n.º 2
0
 def on_get(self, req, resp):
     """Handle GET requests: classify text passed as query parameters.

     The query parameter ``1`` carries the title and ``2`` carries the
     content. Both are fetched with the second positional argument set to
     ``True``, cleaned, and passed to ``self.bert_classification``; the
     result is assigned to ``resp.media``. A log line is written on entry
     and on exit.

     Args:
         req: Incoming request providing the ``1`` and ``2`` query parameters.
         resp: Outgoing response; CORS headers and ``media`` are set on it.
     """
     logger.info("...")
     cors_headers = (
         ('Access-Control-Allow-Origin', 'http://localhost:8081'),
         ('Access-Control-Allow-Methods', '*'),
         ('Access-Control-Allow-Headers', '*'),
         ('Access-Control-Allow-Credentials', 'true'),
     )
     for header_name, header_value in cors_headers:
         resp.set_header(header_name, header_value)
     # Fetch both parameters before any cleaning so a failure on either one
     # happens before the helpers run.
     raw_title = req.get_param('1', True)
     raw_content = req.get_param('2', True)
     resp.media = self.bert_classification(
         shortenlines(raw_title),
         cleanall(raw_content),
     )
     logger.info("###")
Ejemplo n.º 3
0
 def on_post(self, req, resp):
     """Handle POST requests: classify a document sent as a JSON body.

     Sets the CORS and cache-control response headers, reads the raw request
     body, parses it as JSON, cleans the values stored under the keys ``'1'``
     (title) and ``'2'`` (content) and hands them to
     ``self.bert_classification``. Whatever that call returns is assigned to
     ``resp.media``. The CPU time spent from JSON parsing through
     classification is logged in nanoseconds.

     Args:
         req: Incoming request. Its body is expected to be a JSON object
             with ``'1'`` and ``'2'`` keys.
         resp: Outgoing response; headers and ``media`` are set on it.

     Raises:
         ValueError: If the body is not valid JSON (``json.loads`` failure,
             which includes an empty body).
         KeyError: If ``'1'`` or ``'2'`` is missing from the payload.
     """
     # NOTE(review): browsers reject a wildcard Access-Control-Allow-Origin
     # when Access-Control-Allow-Credentials is 'true'. If credentialed
     # cross-origin calls are needed, send an explicit origin instead --
     # confirm the intended clients before changing this.
     resp.set_header('Access-Control-Allow-Origin', '*')
     resp.set_header('Access-Control-Allow-Methods', '*')
     resp.set_header('Access-Control-Allow-Headers', '*')
     resp.set_header('Access-Control-Allow-Credentials', 'true')
     resp.set_header("Cache-Control", "no-cache")
     # content_length is None when the client sends no Content-Length header;
     # fall back to 0 so the stream is never read with an unbounded size.
     data = req.stream.read(req.content_length or 0)
     # process_time_ns counts CPU time of this process, not wall-clock time,
     # so time spent waiting on I/O is not included in the figure below.
     start = time.process_time_ns()
     jsondata = json.loads(data)
     clean_title = shortenlines(jsondata['1'])
     clean_content = cleanall(jsondata['2'])
     resp.media = self.bert_classification(clean_title, clean_content)
     logger.info("tot:{}ns".format(time.process_time_ns() - start))
     logger.info("###")
Ejemplo n.º 4
0
import json

import pandas
import urllib3
from classmerge import match
from dataclean import cleanall

# Evaluate the classification service against the labelled validation set.
# For every CSV row (column 0 = label, column 1 = title, column 2 = content)
# the service is queried over HTTP, its first answer is written back into the
# frame, and the share of answers accepted by `match` is printed at the end.
df = pandas.read_csv("data/valid1.csv")
http = urllib3.PoolManager()
correct = 0
for index, row in df.iterrows():
    # Columns are addressed by position; .iloc makes that explicit instead of
    # relying on the deprecated integer-key fallback of Series.__getitem__.
    label = row.iloc[0]
    # Strip ".docx" before ".doc": in the opposite order ".doc" is removed
    # first and "name.docx" is left as "namex".
    title = row.iloc[1].replace(".docx", "").replace(".doc", "")
    content = cleanall(row.iloc[2])
    # NOTE(review): title and content are inserted into the query string
    # without percent-encoding, so characters such as '&' or '#' in the text
    # would alter the request. Left as is because encoding changes how the
    # length cap below applies -- confirm against the server before changing.
    url = "http://192.168.0.161:58080/z?1={}&2={}".format(title, content)
    print(url)
    # Cap the request URL at 9999 characters (the full URL is printed above).
    url = url[:9999]
    response = http.request('GET', url)
    result = json.loads(response.data)
    predicted = result['answer'][0]
    print(label, predicted)
    df.at[index, 'type1'] = predicted
    df.at[index, 'title'] = title
    df.at[index, 'content'] = content
    if match(predicted, label):
        correct += 1
df.to_csv("data/valid1-filled.csv", index=False)
# An empty CSV would otherwise raise ZeroDivisionError; report 0.0 instead.
total = len(df)
accuracy = correct * 100.0 / total if total else 0.0
print('ACCURACY:{}%'.format(accuracy))
Ejemplo n.º 5
0
import json

import pandas
import urllib3
from classmerge import class_case
from dataclean import cleanall

# Evaluate the classification service against the labelled test set.
# For every CSV row (column 0 = 1-based class number, column 1 = title,
# column 2 = content) the service is queried over HTTP and its first answer is
# compared with the expected entry of `class_case`; the hit rate is printed.
df = pandas.read_csv("data/test.csv")
http = urllib3.PoolManager()
correct = 0
for index, row in df.iterrows():
    # Columns are addressed by position; .iloc makes that explicit instead of
    # relying on the deprecated integer-key fallback of Series.__getitem__.
    label = row.iloc[0]
    title = str(row.iloc[1])  #.replace(".doc","").replace(".docx","")
    content = cleanall(str(row.iloc[2]))
    # NOTE(review): title and content are inserted into the query string
    # without percent-encoding, so characters such as '&' or '#' in the text
    # would alter the request. Left as is because encoding changes how the
    # length cap below applies -- confirm against the server before changing.
    url = "http://192.168.0.161:58081/z?1={}&2={}".format(title, content)
    print(url)
    # Cap the request URL at 9999 characters (the full URL is printed above).
    url = url[:9999]
    response = http.request('GET', url)
    result = json.loads(response.data)
    predicted = result['answer'][0]
    print(class_case[label - 1], predicted)
    # df.at[index, 'category'] = result['answer'][0]
    # df.at[index, 'title'] = title
    # df.at[index, 'fulltext'] = content
    try:
        is_hit = class_case.index(predicted) == label - 1
    except ValueError:
        # The service returned a label that is not in class_case: count it as
        # a miss rather than aborting the whole evaluation run.
        is_hit = False
    if is_hit:
        correct += 1
#df.to_csv("eval/test-bert.csv", index=False)
# An empty CSV would otherwise raise ZeroDivisionError; report 0.0 instead.
total = len(df)
accuracy = correct * 100.0 / total if total else 0.0
print('ACCURACY:{}%'.format(accuracy))