Exemple #1
0
def get_position_summary(request, source_uuid):
    """Return the saved tag-position summary for one stored page as JSON.

    The ``UrlContentStore`` document whose id equals ``source_uuid`` is looked
    up and its ``tag_position_summary`` is sent back under the ``POSITION``
    key. ``request`` is accepted but not read.

    Raises:
        HtmlViewerWebException: with ``HTTP_400_BAD_REQUEST`` when no stored
            document matches ``source_uuid``.
    """
    stored_page = UrlContentStore.objects(id=source_uuid).first()
    if stored_page is not None:
        payload = json.dumps({POSITION: stored_page.tag_position_summary})
        return HttpResponse(payload, content_type="application/json")
    # Nothing was stored under this id.
    raise HtmlViewerWebException("Invalid url reference",
                                 HTTP_400_BAD_REQUEST)
Exemple #2
0
def get_url_content(request):
    """Fetch a URL, store its prettified HTML and tag summaries, reply as JSON.

    The ``url`` query parameter is handed to ``validate_url``, which returns
    the HTML source together with a handle that has to be closed. The markup
    is prettified with BeautifulSoup, fed through ``HTMLTagParser`` and saved,
    along with the parser's two summaries, in a new ``UrlContentStore``
    document.

    Returns:
        HttpResponse: JSON object holding the HTML-escaped source
        (``CONTENT``), the stored document id (``UUID``) and the URLs of the
        count and position summaries (``COUNT_URL``, ``POSITION_URL``).

    Any exception raised by ``validate_url`` or by parsing propagates to the
    caller; the handle is closed in either case.
    """
    url = request.GET.get('url')
    html_source, uf = validate_url(url)
    try:
        # No parser is named here, so BeautifulSoup chooses one on its own.
        soup = BeautifulSoup(html_source)
        html_source = soup.prettify()
    finally:
        # Close the handle even when parsing fails, so it is never leaked.
        uf.close()

    parser = HTMLTagParser()
    parser.feed(html_source)

    url_content = UrlContentStore()
    url_content.content = html_source
    url_content.tag_count_summary = parser.tag_count_summary
    url_content.tag_position_summary = parser.tag_position_summary
    url_content.save()

    # The id is read after save() and reused for every link in the response.
    source_id = str(url_content.id)
    response_dict = {
        CONTENT: html.escape(html_source),
        UUID: source_id,
        COUNT_URL: SOURCE_URL + source_id + "/" + COUNT,
        POSITION_URL: SOURCE_URL + source_id + "/" + POSITION,
    }
    return HttpResponse(json.dumps(response_dict),
                        content_type="application/json")
Exemple #3
0
def get_url_content(request):
    """Download a page, persist its pretty-printed HTML, and describe it as JSON.

    Steps:
      1. Read ``url`` from the query string and pass it to ``validate_url``,
         which returns the HTML source and a handle that must be closed.
      2. Pretty-print the markup with BeautifulSoup.
      3. Run ``HTMLTagParser`` over the result to get the tag count and tag
         position summaries.
      4. Save the markup and both summaries in a new ``UrlContentStore``.

    Returns:
        HttpResponse: JSON with the HTML-escaped markup (``CONTENT``), the id
        of the stored document (``UUID``), and the count / position summary
        URLs (``COUNT_URL``, ``POSITION_URL``).

    Exceptions from ``validate_url`` or from parsing are not caught here; the
    handle is still closed when parsing fails.
    """
    url = request.GET.get("url")
    html_source, uf = validate_url(url)
    try:
        # BeautifulSoup is called without a parser name and selects one itself.
        html_source = BeautifulSoup(html_source).prettify()
    finally:
        # Guarantee the handle is released on the error path as well.
        uf.close()

    parser = HTMLTagParser()
    parser.feed(html_source)

    url_content = UrlContentStore()
    url_content.content = html_source
    url_content.tag_count_summary = parser.tag_count_summary
    url_content.tag_position_summary = parser.tag_position_summary
    url_content.save()

    # Both summary URLs share the same "<SOURCE_URL><id>/" prefix.
    stored_id = str(url_content.id)
    summary_base = SOURCE_URL + stored_id + "/"
    response_dict = {
        CONTENT: html.escape(html_source),
        UUID: stored_id,
        COUNT_URL: summary_base + COUNT,
        POSITION_URL: summary_base + POSITION,
    }
    return HttpResponse(json.dumps(response_dict), content_type="application/json")
Exemple #4
0
def get_position_summary(request, source_uuid):
    """Serve the tag-position summary of a previously stored page.

    Fetches the first ``UrlContentStore`` document with id ``source_uuid`` and
    returns ``{POSITION: tag_position_summary}`` as a JSON response. The
    ``request`` argument is not used.

    Raises:
        HtmlViewerWebException: with ``HTTP_400_BAD_REQUEST`` if the lookup
            finds no document.
    """
    matches = UrlContentStore.objects(id=source_uuid)
    document = matches.first()
    if document is None:
        raise HtmlViewerWebException("Invalid url reference", HTTP_400_BAD_REQUEST)

    body = json.dumps({POSITION: document.tag_position_summary})
    return HttpResponse(body, content_type="application/json")