Python leaf_div_elements_into_paragraphs示例

编程语言: Python

命名空间/包名称: breadability.readable

方法/功能: leaf_div_elements_into_paragraphs

hotexamples.com的示例: 6

Python leaf_div_elements_into_paragraphs - 已找到6个示例。这些是从开源项目中提取的、评价最高的breadability.readable.leaf_div_elements_into_paragraphs真实Python示例。您可以对示例进行评价，以帮助我们提高示例质量。

示例#1

显示文件

def test_dont_transform_div_with_div():
    """Check that a <div> wrapping another <div> is kept as a <div>.

    Only the innermost (leaf) <div> is expected to come back as a <p>; the
    text around it must stay inside the untouched outer <div>.
    """
    source_html = ("<html><body><div>text<div>child</div>"
                   "aftertext</div></body></html>")
    expected_html = ("<html><body><div>text<p>child</p>"
                     "aftertext</div></body></html>")

    tree = document_fromstring(source_html)
    # Serialize the transformed tree first, then normalize the expectation,
    # so both sides of the comparison are unicode strings.
    actual = tounicode(leaf_div_elements_into_paragraphs(tree))
    expected = to_unicode(expected_html)

    assert actual == expected

示例#2

显示文件

def test_misused_divs_transform():
    """Leaf <div> nodes must come back as <p> nodes with unchanged content.

    Two inputs are checked, in order: a <div> holding only text, and a <div>
    holding text followed by an inline <a> link.

    """
    # (input markup, expected serialized output) pairs.
    cases = (
        ("<html><body><div>simple</div></body></html>",
         "<html><body><p>simple</p></body></html>"),
        ('<html><body><div>simple<a href="">link</a>'
         '</div></body></html>',
         '<html><body><p>simple<a href="">link</a></p></body></html>'),
    )

    for markup, wanted in cases:
        parsed = document_fromstring(markup)
        converted = leaf_div_elements_into_paragraphs(parsed)
        assert tounicode(converted) == to_unicode(wanted)

示例#3

显示文件

文件： test_readable.py 项目： bookieio/breadability

def test_misused_divs_transform():
    """Check that a leaf <div> is rewritten as a <p> with the same content.

    The first case uses a text-only <div>; the second adds an inline <a>
    child, which must survive inside the resulting <p>.

    """
    # Case 1: <div> containing nothing but text.
    plain_doc = document_fromstring(
        "<html><body><div>simple</div></body></html>")
    plain_actual = tounicode(leaf_div_elements_into_paragraphs(plain_doc))
    plain_expected = to_unicode("<html><body><p>simple</p></body></html>")
    assert plain_actual == plain_expected

    # Case 2: <div> containing text plus an inline link.
    link_doc = document_fromstring(
        '<html><body><div>simple<a href="">link</a></div></body></html>')
    link_actual = tounicode(leaf_div_elements_into_paragraphs(link_doc))
    link_expected = to_unicode(
        '<html><body><p>simple<a href="">link</a></p></body></html>')
    assert link_actual == link_expected

示例#4

显示文件

文件： custom_article.py 项目： suraj-yadav-001/noclick

 def dom(self):
     """Return the cleaned lxml tree (DOM) of the given html.

     The tree is read from ``self._original_document.dom``, cleaned in
     place, and then passed through ``leaf_div_elements_into_paragraphs``.

     Returns ``None`` if any of those steps raises ``ValueError``.
     """
     try:
         tree = self._original_document.dom
         # html_cleaner has no useful return value; it edits ``tree`` itself.
         html_cleaner(tree)
         transformed = leaf_div_elements_into_paragraphs(tree)
     except ValueError:
         return None
     else:
         return transformed

示例#5

显示文件

文件： custom_article.py 项目： GTFObob/NoClick

 def dom(self):
     """Build the lxml tree (Document Object Model) for the given html.

     Steps: fetch the tree from the original document, run the cleaner over
     it (the cleaner mutates its argument rather than returning a new tree),
     then hand it to ``leaf_div_elements_into_paragraphs``.

     A ``ValueError`` raised at any step results in ``None``.
     """
     result = None
     try:
         document_tree = self._original_document.dom
         html_cleaner(document_tree)  # in-place cleanup, nothing returned
         result = leaf_div_elements_into_paragraphs(document_tree)
     except ValueError:
         return None
     return result

示例#6

显示文件

文件： test_readable.py 项目： bookieio/breadability

def test_dont_transform_div_with_div():
    """Only the nested leaf <div> becomes a <p>; its parent <div> is kept."""
    markup = "<html><body><div>text<div>child</div>" "aftertext</div></body></html>"
    parsed = document_fromstring(markup)

    # Transform, then serialize, before building the expected value.
    converted = leaf_div_elements_into_paragraphs(parsed)
    serialized = tounicode(converted)

    wanted = to_unicode(
        "<html><body><div>text<p>child</p>" "aftertext</div></body></html>"
    )
    assert serialized == wanted