Python TextApi.TextApi 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: cortical.textApi

클래스/타입: TextApi

메소드/함수: TextApi

hotexamples.com에서의 예제들: 4

Python TextApi.TextApi - 4개의 예제를 찾았습니다. 다음은 오픈소스 프로젝트에서 추출한 Python cortical.textApi.TextApi.TextApi의 실제 사용 예제 가운데 평가가 가장 높은 것들입니다. 각 예제를 평가해 주시면 예제 품질을 높이는 데 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

TextApi(4)

getRepresentationsForBulkText(2)

decode(1)

getKeywordsForText(1)

getLanguage(1)

getRepresentationForText(1)

getSlicesForText(1)

getTokensForText(1)

예제 #1

파일 보기

파일: testTextApi.py 프로젝트: nickkimer/boxer.ai

 def setUp(self):
     """Bind a TextApi built from testConfiguration.client to self.api."""
     client = testConfiguration.client
     self.api = TextApi(client)

예제 #2

파일 보기


def gettokens(txt):
    """Return api.getTokensForText() for `txt` on the retina named in config.

    Reads the module-level `api`, which must be assigned before this is called.
    """
    retina_name = config.RETINA_NAME
    return api.getTokensForText(retina_name, txt)


def getslices(txt):
    """Return api.getSlicesForText() for `txt` on the retina named in config.

    Reads the module-level `api`, which must be assigned before this is called.
    """
    retina_name = config.RETINA_NAME
    return api.getSlicesForText(retina_name, txt)


if __name__ == '__main__':
    # `api` is assigned at module level here; the helper functions that call
    # api.get...ForText() read this binding.
    client = config.client
    api = TextApi(client)

    scpr = scraper()
    kwords = []
    tokens = []
    targettxt = url2txt(scpr, TARGET_COMPANY_URL)
    candidatetxts = PDF2txt("resume.pdf")

    # Accumulate keywords and tokens text by text, keeping the per-text call
    # order (keywords first, then tokens).
    for candidate in candidatetxts:
        kwords.extend(getkw(candidate))
        tokens.extend(gettokens(candidate))

    print("Keywords extracted, Tokens ready")

    if testing_slate:
        # Dump both collections UTF-8 encoded: keywords first, then tokens.
        for collected in (kwords, tokens):
            print([item.encode('utf-8') for item in collected])

예제 #3

파일 보기

파일: summarization.py 프로젝트: calvinsadewa/text_summarization

def summarize(text, len_sentences = 5, retina = retina, apiKey = apiKey,
              min_length = min_length, similarity_measure = similarity_measure) :
    """Select sentences from `text` by PageRank over a similarity graph.

    `text` is split on "." and pieces shorter than `min_length` characters are
    discarded. The remaining sentences are sent in one bulk request to the
    Cortical text API, and every pair of returned fingerprints is compared with
    `cosine_similarity` on their `.positions` to weight a graph whose vertices
    are sentence positions. The `len_sentences` highest-ranked vertices are
    then connected by their pairwise similarity, a minimum spanning tree is
    taken over that subgraph, and sentences are emitted in depth-first order
    over the tree.

    Args:
        text: The document to summarize.
        len_sentences: Maximum number of sentences to select.
        retina: Retina name passed to getRepresentationsForBulkText.
        apiKey: API key handed to ApiClient.
        min_length: Minimum character length for a piece to count as a sentence.
        similarity_measure: Accepted for interface compatibility; this body
            does not read it (the comparison always uses cosine_similarity).

    Returns:
        A list of sentence strings. Sentences only enter the graphs as edge
        endpoints, so the list is empty when fewer than two sentences are
        available or selected.
    """
    sentences = [sentence for sentence in text.split(".") if len(sentence) >= min_length]

    # One {"text": ...} entry per sentence, serialized for the bulk request.
    request_body = json.dumps([{"text": s} for s in sentences])

    client = ApiClient(apiKey=apiKey, apiServer="http://api.cortical.io/rest")
    api = TextApi(client)
    fingerprints = api.getRepresentationsForBulkText(retina, request_body)

    # Similarity graph: graph[a][b]['weight'] is the edge between the sentences
    # at positions a and b.
    graph = nx.Graph()
    pos_fingerprints = zip(range(0, len(sentences)), fingerprints)
    for (pos1, finger1), (pos2, finger2) in itertools.combinations(pos_fingerprints, 2):
        graph.add_weighted_edges_from([(pos1, pos2,
                                        cosine_similarity(finger1.positions,
                                                          finger2.positions))])
        print(pos1,pos2)

    # Compute pagerank for every vertex, refer to https://en.wikipedia.org/wiki/PageRank
    page_rank = nx.pagerank(graph)

    # Highest rank first; ties fall back to the larger sentence position.
    sorted_rank = sorted(((page_rank[key], key) for key in page_rank), reverse=True)
    summaries = [pos for weight, pos in sorted_rank[:len_sentences]]

    # Connect the selected sentences using the weights of the edges between
    # those same sentences. The lookup must be keyed by the sentence positions
    # themselves, not by their index inside `summaries`.
    summary_graph = nx.Graph()
    for first, second in itertools.combinations(summaries, 2):
        summary_graph.add_weighted_edges_from([(first, second,
                                                graph[first][second]['weight'])])

    gr = nx.minimum_spanning_tree(summary_graph)

    # Walk the tree edges depth-first, emitting each sentence the first time
    # its position appears.
    visited = set()
    summary = []
    for edge in nx.dfs_edges(gr):
        for position in edge:
            if position not in visited:
                visited.add(position)
                summary.append(sentences[position])

    return summary

예제 #4

파일 보기

파일: GenerateFingerprint.py 프로젝트: nickkimer/boxer.ai

# Prints the fingerprint positions and the keyword list for one text, then
# wraps the text in a JSON object.
#
# To use an inline string instead of a file, assign it directly, e.g.
# body = "Semantic fingerprints are cool."
import json

# Name of the .txt file, looked up inside Company_Descriptions/
file_name = "15_UTX.txt"

with open('Company_Descriptions/' + file_name, "r") as myfile:
    # Newlines are removed outright, not replaced by spaces.
    body = myfile.read().replace('\n', '')

####################################################
######### Code for fingerprint (vector) ############
####################################################

# Choose either the en_synonymous or the en_associative retina
text = TextApi(client).getRepresentationForText("en_synonymous", body)
# Single-argument print(...) behaves the same on Python 2 and Python 3.
print(text[0].positions)

####################################################
############# Code for keywords list ###############
####################################################

# Choose either the en_synonymous or the en_associative retina
terms = TextApi(client).getKeywordsForText("en_synonymous", body)
print(terms)

#####################################################
########## Code for fingerprint (image) #############
#####################################################

# Wrap the text in a {"text": ...} JSON object. json.dumps escapes quotes and
# backslashes, which plain %-formatting would leave raw and so yield invalid
# JSON for such input.
body = json.dumps({"text": body})