def on_search(self, request):
    if request.method == "GET":
        return self.render_template('search.html')
    elif request.method == "POST":
        search_string = request.form.get("keywords", None)
        if search_string:
            search_string_norm = normalize_keyword(search_string)
            words = search_string_norm.split()
            id_ = self.searcher.start_search(words)
            return redirect("/search/%s" % "+".join(words))
    return redirect("/")
def on_search(self, request):
    if request.method == "GET":
        return self.render_template('search.html')
    elif request.method == "POST":
        search_string = request.form.get("keywords", None)
        search_string = urllib.unquote_plus(search_string)
        if search_string:
            search_string_norm = normalize_keyword(search_string)
            words = search_string_norm.split()
            self.searcher.start_search(words)
            return redirect("/search/%s" % "+".join(words))
    return redirect("/")
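The second variant differs from the first only in the urllib.unquote_plus step applied to the posted keywords before normalizing them. A minimal sketch of the round-trip those handlers rely on (assuming Python 2's urllib, as in the code above; the sample value is illustrative):

    # Sketch (assumption: Python 2 urllib, matching the handlers above) of the
    # round-trip between the '+'-joined redirect URL and the decoded keyword list.
    import urllib

    posted = "python+web+server"              # hypothetical URL-quoted "keywords" value
    decoded = urllib.unquote_plus(posted)     # -> "python web server"
    words = decoded.split()                   # -> ["python", "web", "server"]

    # on_search redirects to the '+'-joined form that on_search_results later receives as `key`
    print "/search/%s" % "+".join(words)      # -> /search/python+web+server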
def on_search_results(self, request, key):
    search_string_norm = normalize_keyword(key)
    words = search_string_norm.split()

    start = int(request.args.get("start", 0))
    quantity = int(request.args.get("quantity", config.SEARCH_RESULTS))

    id_ = self.searcher.start_search(words)
    results = self.searcher.get_results(id_, start, quantity)

    CLEAN = re.compile("[(),]")

    # group by link, giving priority to the title of the original articles
    grouped_results = {}
    for link, title, ptje, original, texto in results:
        # remove 3 dirs from link and add the proper base url
        link = "%s/%s" % (ARTICLES_BASE_URL, to3dirs.from_path(link))

        # convert tokens to lower case
        tit_tokens = set(CLEAN.sub("", x.lower()) for x in title.split())

        if link in grouped_results:
            (tit, prv_ptje, tokens, txt) = grouped_results[link]
            tokens.update(tit_tokens)
            if original:
                # save the info of the original article
                tit = title
                txt = texto
            grouped_results[link] = (tit, prv_ptje + ptje, tokens, txt)
        else:
            grouped_results[link] = (title, ptje, tit_tokens, texto)

    # clean the tokens
    for link, (tit, ptje, tokens, texto) in grouped_results.iteritems():
        tit_tokens = set(CLEAN.sub("", x.lower()) for x in tit.split())
        tokens.difference_update(tit_tokens)

    # sort the results
    candidates = ((k,) + tuple(v) for k, v in grouped_results.iteritems())
    sorted_results = sorted(candidates, key=operator.itemgetter(2), reverse=True)

    return self.render_template('search.html',
                                search_words=words,
                                results=sorted_results,
                                start=start,
                                quantity=quantity)
def on_search_results(self, request, key):
    search_string_norm = urllib.unquote_plus(normalize_keyword(key))
    words = search_string_norm.split()

    start = int(request.args.get("start", 0))
    quantity = int(request.args.get("quantity", config.SEARCH_RESULTS))

    id_ = self.searcher.start_search(words)
    results = self.searcher.get_results(id_, start, quantity)

    CLEAN = re.compile("[(),]")

    # group by link, giving priority to the title of the original articles
    grouped_results = {}
    for link, title, ptje, original, texto in results:
        # remove 3 dirs from link and add the proper base url
        link = "%s/%s" % (ARTICLES_BASE_URL, to3dirs.from_path(link))

        # convert tokens to lower case
        tit_tokens = set(CLEAN.sub("", x.lower()) for x in title.split())

        if link in grouped_results:
            (tit, prv_ptje, tokens, txt) = grouped_results[link]
            tokens.update(tit_tokens)
            if original:
                # save the info of the original article
                tit = title
                txt = texto
            grouped_results[link] = (tit, prv_ptje + ptje, tokens, txt)
        else:
            grouped_results[link] = (title, ptje, tit_tokens, texto)

    # clean the tokens
    for link, (tit, ptje, tokens, texto) in grouped_results.iteritems():
        tit_tokens = set(CLEAN.sub("", x.lower()) for x in tit.split())
        tokens.difference_update(tit_tokens)

    # sort the results
    candidates = ((k,) + tuple(v) for k, v in grouped_results.iteritems())
    sorted_results = sorted(candidates, key=operator.itemgetter(2), reverse=True)

    return self.render_template('search.html',
                                search_words=words,
                                results=sorted_results,
                                start=start,
                                quantity=quantity)
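Both versions of on_search_results share the same grouping pass: results that resolve to the same link are merged, their scores are added, and the original article's title and text win over redirects. A simplified, self-contained sketch of that pass (illustrative data, title-token bookkeeping omitted, Python 2 to match the code above):

    # Standalone sketch (illustrative data, not from the original project) of the
    # grouping step: rows with the same link are merged, scores are accumulated,
    # and the merged rows are sorted by total score.
    import operator

    # (link, title, score, is_original, text) -- the tuple shape the loop above unpacks
    results = [
        ("a/b/c/Foo", "Foo", 10, True, "original text"),
        ("a/b/c/Foo", "Foo (redirect)", 3, False, "redirect text"),
        ("x/y/z/Bar", "Bar", 7, True, "bar text"),
    ]

    grouped = {}
    for link, title, score, original, text in results:
        if link in grouped:
            tit, prev_score, txt = grouped[link]
            if original:          # the original article wins title and text
                tit, txt = title, text
            grouped[link] = (tit, prev_score + score, txt)
        else:
            grouped[link] = (title, score, text)

    candidates = ((k,) + v for k, v in grouped.iteritems())
    for row in sorted(candidates, key=operator.itemgetter(2), reverse=True):
        print row
    # ('a/b/c/Foo', 'Foo', 13, 'original text') comes first, then ('x/y/z/Bar', 'Bar', 7, 'bar text')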