Python html_to_text примеры использования

Язык программирования: Python

Пространство имен/Пакет: xmodule.annotator_mixin

Метод/Функция: html_to_text

Примеров на hotexamples.com: 10

Python html_to_text — найдено 10 примеров. Это лучшие примеры кода на Python для xmodule.annotator_mixin.html_to_text, взятые из проектов с открытым исходным кодом. Вы можете оценить каждый пример, чтобы помочь нам улучшить качество подборки.

Пример #1

Показать файл

def escape_html_characters(content):
    """
    Remove HTML leftovers that shouldn't be indexed by the ElasticSearch indexer.

    This method is complementary to the html_to_text method found in
    xmodule/annotator_mixin.py: the text returned by html_to_text is
    whitespace-normalised, then CDATA sections and HTML comments that are
    still present are removed.

    Args:
        content (str): variable to escape html characters from

    Returns:
        content (str): content ready to be indexed by ElasticSearch

    """
    # Collapse every run of whitespace, HTML-encoded non-breaking spaces and
    # "//" into a single space. Because "\s" also matches newlines, the text
    # handed to the next two substitutions contains no line breaks.
    text = re.sub(r"(\s|&nbsp;|//)+", " ", html_to_text(content))

    # Remove CDATA sections. The quantifier is non-greedy so that each section
    # is removed on its own; a greedy ".*" would also delete any real text
    # sitting between the first and the last section.
    text = re.sub(r"<!\[CDATA\[.*?\]\]>", "", text)

    # Remove HTML comments, one comment at a time for the same reason.
    return re.sub(r"<!--.*?-->", "", text)

Пример #2

Показать файл

def strip_html_content_to_text(html_content):
    """
    Get only the textual part of html content - useful for building text to be searched.

    The output of html_to_text is whitespace-normalised, after which any
    CDATA sections and HTML comments still present are removed.

    Args:
        html_content (str): markup to reduce to plain text

    Returns:
        str: the cleaned-up text
    """
    # Collapse runs of whitespace (newlines included), HTML-encoded
    # non-breaking spaces and "//" into a single space.
    text_content = re.sub(r"(\s|&nbsp;|//)+", " ", html_to_text(html_content))
    # Remove CDATA sections. Non-greedy, so text between two separate
    # sections is kept instead of being swallowed by one giant match.
    text_content = re.sub(r"<!\[CDATA\[.*?\]\]>", "", text_content)
    # Remove HTML comments, again one comment per match.
    text_content = re.sub(r"<!--.*?-->", "", text_content)

    return text_content

Пример #3

Показать файл

Файл: imageannotation_module.py Проект: uncletomiwa/edx-platform

    def __init__(self, *args, **kwargs):
        """
        Build the module state from the XML held in ``self.data``.

        Sets ``instructions`` (result of ``_extract_instructions``),
        ``openseadragonjson`` (the ``json`` child element serialised to text
        and passed through ``html_to_text``) and ``user`` (the ``email`` of
        the object returned by ``runtime.get_real_user`` when that hook is
        set, otherwise an empty string).
        """
        super(ImageAnnotationModule, self).__init__(*args, **kwargs)

        root = etree.fromstring(self.data)
        self.instructions = self._extract_instructions(root)

        json_node = root.find('json')
        json_markup = etree.tostring(json_node, encoding='unicode')
        self.openseadragonjson = html_to_text(json_markup)

        self.user = ""
        if self.runtime.get_real_user is None:
            # The runtime offers no lookup hook; keep the empty default.
            return
        real_user = self.runtime.get_real_user(self.runtime.anonymous_student_id)
        self.user = real_user.email

Пример #4

Показать файл

Файл: courseware_index.py Проект: marcore/edx-platform

def strip_html_content_to_text(html_content):
    """
    Get only the textual part of html content - useful for building text to be searched.

    Args:
        html_content (str): markup to reduce to plain text

    Returns:
        str: output of html_to_text with whitespace normalised and any
        remaining CDATA sections and HTML comments removed
    """
    text_content = html_to_text(html_content)
    # Each step rewrites the text produced by the previous one. The order
    # matters: whitespace is collapsed first, so newlines are already gone
    # when the CDATA and comment patterns run.
    # The CDATA and comment patterns are non-greedy so that text lying
    # between two separate sections or comments is preserved.
    substitutions = (
        (r"(\s|&nbsp;|//)+", " "),      # whitespace, &nbsp; and "//" runs
        (r"<!\[CDATA\[.*?\]\]>", ""),   # CDATA sections
        (r"<!--.*?-->", ""),            # HTML comments
    )
    for pattern, replacement in substitutions:
        text_content = re.sub(pattern, replacement, text_content)

    return text_content

Пример #5

Показать файл

Файл: html_module.py Проект: sigberto/edx-platform

 def index_dictionary(self):
     """
     Return the parent's index dictionary extended with this block's text.

     The text is ``html_to_text(self.data)`` with whitespace normalised and
     any remaining CDATA sections and HTML comments removed. It is stored
     under ``content["html_content"]`` next to ``display_name``, and
     ``content_type`` is set to ``"Text"``.
     """
     xblock_body = super(HtmlDescriptor, self).index_dictionary()
     # Collapse runs of whitespace (newlines included), HTML-encoded
     # non-breaking spaces and "//" into a single space.
     html_content = re.sub(r"(\s|&nbsp;|//)+", " ", html_to_text(self.data))
     # Remove CDATA sections. Non-greedy so that text between two separate
     # sections is not deleted along with them.
     html_content = re.sub(r"<!\[CDATA\[.*?\]\]>", "", html_content)
     # Remove HTML comments, one comment per match for the same reason.
     html_content = re.sub(r"<!--.*?-->", "", html_content)
     html_body = {"html_content": html_content, "display_name": self.display_name}
     # Merge into an existing "content" entry rather than replacing it, so
     # keys supplied by the parent class are kept.
     if "content" in xblock_body:
         xblock_body["content"].update(html_body)
     else:
         xblock_body["content"] = html_body
     xblock_body["content_type"] = "Text"
     return xblock_body

Пример #6

Показать файл

Файл: imageannotation_module.py Проект: CDOT-EDX/edx-platform

    def __init__(self, *args, **kwargs):
        """
        Build the module state from the XML held in ``self.data``.

        Sets ``instructions``, ``openseadragonjson`` (the ``json`` child
        element serialised to text and passed through ``html_to_text``),
        ``is_course_staff`` (True when the runtime reports the role
        'instructor' or 'staff') and ``user_email``.
        """
        super(ImageAnnotationModule, self).__init__(*args, **kwargs)

        root = etree.fromstring(self.data)
        self.instructions = self._extract_instructions(root)

        json_node = root.find('json')
        json_markup = etree.tostring(json_node, encoding='unicode')
        self.openseadragonjson = html_to_text(json_markup)

        self.user_email = ""
        self.is_course_staff = False
        role = self.runtime.get_user_role()
        if role in ['instructor', 'staff']:
            self.is_course_staff = True

        if self.runtime.get_real_user is not None:
            try:
                real_user = self.runtime.get_real_user(self.runtime.anonymous_student_id)
                self.user_email = real_user.email
            except Exception:  # pylint: disable=broad-except
                # Any failure in the lookup falls back to a placeholder message.
                self.user_email = _("No email address found.")

Пример #7

Показать файл

Файл: imageannotation_module.py Проект: devs1991/test_edx_docmode

    def __init__(self, *args, **kwargs):
        """
        Initialise the annotation module from the XML stored in ``self.data``.

        Populates ``instructions``, ``openseadragonjson``, ``user_email`` and
        ``is_course_staff``. The e-mail lookup only runs when the runtime
        provides ``get_real_user``; if the lookup raises, a placeholder
        message is stored instead.
        """
        super(ImageAnnotationModule, self).__init__(*args, **kwargs)

        parsed = etree.fromstring(self.data)

        self.instructions = self._extract_instructions(parsed)
        raw_json = etree.tostring(parsed.find('json'), encoding='unicode')
        self.openseadragonjson = html_to_text(raw_json)

        self.user_email = ""
        self.is_course_staff = False
        has_staff_role = self.runtime.get_user_role() in ['instructor', 'staff']
        if has_staff_role:
            self.is_course_staff = True

        if self.runtime.get_real_user is None:
            # No lookup hook on the runtime; keep the empty default.
            return
        try:
            anonymous_id = self.runtime.anonymous_student_id
            self.user_email = self.runtime.get_real_user(anonymous_id).email
        except Exception:  # pylint: disable=broad-except
            self.user_email = _("No email address found.")

Пример #8

Показать файл

Файл: html_module.py Проект: echines/edx-platform

 def index_dictionary(self):
     """
     Return the parent's index dictionary extended with this block's text.

     ``html_to_text(self.data)`` is whitespace-normalised and stripped of
     any remaining CDATA sections and HTML comments. The result is stored
     as ``content["html_content"]`` together with ``display_name``, and
     ``content_type`` is set to ``"Text"``.
     """
     xblock_body = super(HtmlDescriptor, self).index_dictionary()
     # Collapse runs of whitespace (newlines included), HTML-encoded
     # non-breaking spaces and "//" into a single space.
     html_content = re.sub(r"(\s|&nbsp;|//)+", " ", html_to_text(self.data))
     # Remove CDATA sections. The match is non-greedy: a greedy ".*" would
     # span from the first opener to the last closer and drop the text
     # between separate sections.
     html_content = re.sub(r"<!\[CDATA\[.*?\]\]>", "", html_content)
     # Remove HTML comments, non-greedy for the same reason.
     html_content = re.sub(r"<!--.*?-->", "", html_content)
     html_body = {
         "html_content": html_content,
         "display_name": self.display_name,
     }
     # Keep whatever the parent already put under "content".
     if "content" in xblock_body:
         xblock_body["content"].update(html_body)
     else:
         xblock_body["content"] = html_body
     xblock_body["content_type"] = "Text"
     return xblock_body

Пример #9

Показать файл

Файл: test_annotator_mixin.py Проект: tiwariricha/edx-platform

 def test_html_to_text(self):
     """Check that html_to_text reduces ``self.sample_html`` to the expected text."""
     expected = "Testing here and not bolded here"
     actual = html_to_text(self.sample_html)
     assert expected == actual

Пример #10

Показать файл

 def test_html_to_text(self):
     """Check that html_to_text reduces ``self.sample_html`` to the expected text."""
     wanted = "Testing here and not bolded here"
     produced = html_to_text(self.sample_html)
     self.assertEqual(wanted, produced)