Python GopherHTMLParser.GopherHTMLParserの例、gopher_render.GopherHTMLParser.GopherHTMLParser Pythonの例

コード例 #1

0

ファイルを表示

ファイル: test_html.py プロジェクト: khoulihan/gopher-render

    def test_blockquote_default(self):
        """
        Render a blockquote containing two paragraphs with default settings.

        The output must begin and end with a newline and split into five
        lines. Each of the three inner lines starts with '> ' and is 67
        characters wide; the middle one, separating the two paragraphs,
        holds nothing but the quote marker.
        """
        renderer = GopherHTMLParser(optimise=False)
        renderer.feed("<blockquote><p>One</p><p>Two</p></blockquote>")
        renderer.close()
        rendered = renderer.parsed

        # Newline at both ends of the rendered block.
        assert rendered.startswith("\n")
        assert rendered.endswith("\n")

        # Five pieces in total, so nothing was wrapped.
        rows = rendered.split('\n')
        assert len(rows) == 5

        # Drop the empty first and last pieces and inspect the quoted rows.
        _, first, separator, second, _ = rows
        for row in (first, separator, second):
            assert row.startswith("> ")
            assert len(row) == 67
        assert separator.strip() == '>'

コード例 #2

0

ファイルを表示

ファイル: test_html.py プロジェクト: khoulihan/gopher-render

    def test_p_tag_default_long(self):
        """
        Render a long paragraph with default settings.

        The output must end with a newline, split into ten lines, and every
        line between the first and last pieces must be exactly 67 characters
        wide.
        """
        # Same text as six repetitions of the phrase followed by a short tail.
        phrase = "Paragraph Text Paragraph Text Paragraph Text Paragraph Text Paragraph "
        tail = "Text Paragraph Text Paragraph Text Paragraph Text</p>"
        renderer = GopherHTMLParser(optimise=False)
        renderer.feed("<p>" + phrase * 6 + tail)
        renderer.close()
        rendered = renderer.parsed

        # The paragraph is followed by a newline.
        assert rendered.endswith("\n")

        # Wrapped output; the count includes the empty pieces.
        rows = rendered.split('\n')
        assert len(rows) == 10

        # An initial-line indent check is currently disabled:
        #assert lines[1].startswith(' ' * 8)

        # Every row between the outer pieces is padded to full width.
        for row in rows[1:-1]:
            assert len(row) == 67

コード例 #3

0

ファイルを表示

ファイル: test_html.py プロジェクト: khoulihan/gopher-render

    def test_code_block_default(self):
        """
        Where a code tag's parent is a pre tag, its content should NOT be
        surrounded by backticks.

        The rendered output must start and end with a newline, split into
        five lines, and each code line must appear prefixed with four spaces
        (trailing whitespace is ignored in the comparison).
        """
        code = "\n".join([
            "def func():",
            "    print('Some nonsense')",
            "    return True",
        ])
        html = "<pre><code>{}</code></pre>".format(code)
        parser = GopherHTMLParser()
        parser.feed(html)
        parser.close()
        output = parser.parsed

        # Blank lines before and after.
        assert output.startswith("\n")
        assert output.endswith("\n")

        # No wrapping should occur (line count includes blanks)
        lines = output.split('\n')
        assert len(lines) == 5

        codelines = code.split('\n')

        # Check every code line. The previous range(1, 3) stopped one short
        # and never verified the final line of the block.
        for rendered, source in zip(lines[1:-1], codelines):
            assert rendered.rstrip() == "    {}".format(source)
コード例 #4

0

ファイルを表示

ファイル: test_html.py プロジェクト: khoulihan/gopher-render

    def _header(self, html, result):
        """
        Render ``html`` and check the output against an expected header.

        Asserts that the output with surrounding whitespace stripped equals
        ``result``, that it starts and ends with a newline, and that its
        total length is 69 characters.
        """
        renderer = GopherHTMLParser(optimise=False)
        renderer.feed(html)
        renderer.close()
        rendered = renderer.parsed

        # Content first, then the surrounding newlines, then overall size.
        assert rendered.strip() == result
        assert rendered.startswith('\n')
        assert rendered.endswith('\n')
        assert len(rendered) == 69

コード例 #5

0

ファイルを表示

ファイル: test_html.py プロジェクト: khoulihan/gopher-render

    def test_code_span_in_p_default(self):
        """
        A code tag inside a p tag should render with its content wrapped in
        backticks, leaving the rest of the paragraph text as it was.
        """
        renderer = GopherHTMLParser()
        renderer.feed(
            "<p>This paragrah includes a <code>ClassName</code> in a code tag.</p>"
        )
        renderer.close()
        rendered = renderer.parsed

        # Compare with surrounding whitespace stripped.
        expected = "This paragrah includes a `ClassName` in a code tag."
        assert rendered.strip() == expected

コード例 #6

0

ファイルを表示

ファイル: test_html.py プロジェクト: khoulihan/gopher-render

    def test_span_default(self):
        """
        A span rendered with default settings should come out as its bare
        content: nine characters on a single line.
        """
        renderer = GopherHTMLParser()
        renderer.feed("<span>ClassName</span>")
        renderer.close()
        rendered = renderer.parsed

        # First and last characters are those of the content itself.
        assert rendered.startswith("C")
        assert rendered.endswith("e")

        # Nothing added around the nine-character content.
        assert len(rendered) == 9

        # No newline anywhere in the output.
        assert len(rendered.split('\n')) == 1

コード例 #7

0

ファイルを表示

ファイル: test_html.py プロジェクト: khoulihan/gopher-render

    def test_ol_default(self):
        """
        Render a three-item ordered list with default settings.

        The output must start and end with a newline and split into five
        lines; each item line starts with its number followed by '. ' and
        is 67 characters wide.
        """
        renderer = GopherHTMLParser(optimise=False)
        renderer.feed("<ol><li>One</li><li>Two</li><li>Three</li></ol>")
        renderer.close()
        rendered = renderer.parsed

        assert rendered.startswith("\n")
        assert rendered.endswith("\n")

        rows = rendered.split('\n')
        assert len(rows) == 5

        # Items occupy rows 1-3 and are numbered from 1.
        for number, row in enumerate(rows[1:4], start=1):
            assert row.startswith("{}. ".format(number))
            assert len(row) == 67

コード例 #8

0

ファイルを表示

ファイル: test_html.py プロジェクト: khoulihan/gopher-render

    def test_ins_default(self):
        """
        An ins tag rendered with default settings should wrap its content in
        a single pair of underscores and stay on one line.
        """
        renderer = GopherHTMLParser()
        renderer.feed("<ins>ClassName</ins>")
        renderer.close()
        rendered = renderer.parsed

        # Underscore at each end.
        assert rendered.startswith("_")
        assert rendered.endswith("_")

        # Nine characters of content plus the two underscores.
        assert len(rendered) == 11

        # No newline anywhere in the output.
        assert len(rendered.split('\n')) == 1

コード例 #9

0

ファイルを表示

ファイル: test_html.py プロジェクト: khoulihan/gopher-render

    def test_strong_default(self):
        """
        A strong tag rendered with default settings should wrap its content
        in double asterisks and stay on one line.
        """
        renderer = GopherHTMLParser()
        renderer.feed("<strong>ClassName</strong>")
        renderer.close()
        rendered = renderer.parsed

        # Double asterisk at each end.
        assert rendered.startswith("**")
        assert rendered.endswith("**")

        # Nine characters of content plus four asterisks.
        assert len(rendered) == 13

        # No newline anywhere in the output.
        assert len(rendered.split('\n')) == 1

コード例 #10

0

ファイルを表示

ファイル: test_html.py プロジェクト: khoulihan/gopher-render

    def test_code_span_default(self):
        """
        A standalone code tag rendered with default settings should wrap its
        content in a single pair of backticks and stay on one line.
        """
        renderer = GopherHTMLParser()
        renderer.feed("<code>ClassName</code>")
        renderer.close()
        rendered = renderer.parsed

        # Backtick at each end.
        assert rendered.startswith("`")
        assert rendered.endswith("`")

        # Nine characters of content plus the two backticks.
        assert len(rendered) == 11

        # No newline anywhere in the output.
        assert len(rendered.split('\n')) == 1

コード例 #11

0

ファイルを表示

ファイル: test_html.py プロジェクト: khoulihan/gopher-render

    def test_div_default(self):
        """
        A div rendered with default settings (and optimise disabled) should
        yield its content padded out to 67 characters on a single line.
        """
        renderer = GopherHTMLParser(optimise=False)
        renderer.feed("<div>ClassName</div>")
        renderer.close()
        rendered = renderer.parsed

        # Content starts at the first column; the end is checked after
        # stripping the padding.
        assert rendered.startswith("C")
        assert rendered.strip().endswith("e")

        # Content plus padding fills the full width.
        assert len(rendered) == 67

        # No newline anywhere in the output.
        assert len(rendered.split('\n')) == 1

コード例 #12

0

ファイルを表示

ファイル: test_html.py プロジェクト: khoulihan/gopher-render

    def test_del_default(self):
        """
        A del tag rendered with default settings should wrap its content in
        double tildes and stay on one line.
        """
        renderer = GopherHTMLParser()
        renderer.feed("<del>ClassName</del>")
        renderer.close()
        rendered = renderer.parsed

        # Double tilde at each end.
        assert rendered.startswith("~~")
        assert rendered.endswith("~~")

        # Nine characters of content plus four tildes.
        assert len(rendered) == 13

        # No newline anywhere in the output.
        assert len(rendered.split('\n')) == 1

コード例 #13

0

ファイルを表示

ファイル: test_html.py プロジェクト: khoulihan/gopher-render

    def test_whitespace(self):
        """
        Check whitespace handling inside a paragraph.

        Runs of spaces, tabs and line breaks in the source are expected to
        come out as single spaces, with nothing left at either end of the
        rendered line.
        """
        source_rows = [
            "<p>  This \t\t\tparagraph  ",
            "     has a \tbunch of",
            "whitespace   in between    ",
            "the lines  </p>",
        ]
        renderer = GopherHTMLParser()
        renderer.feed("\n".join(source_rows))
        renderer.close()
        rendered = renderer.parsed

        rows = rendered.split('\n')
        assert len(rows) == 3

        # The paragraph text sits on the second piece of the split output.
        expected = "This paragraph has a bunch of whitespace in between the lines"
        assert rows[1] == expected

コード例 #14

0

ファイルを表示

ファイル: test_html.py プロジェクト: khoulihan/gopher-render

    def test_closed_br_tag_default(self):
        """
        A self-closed br tag inside a paragraph should produce a line break
        that survives the paragraph formatting.

        The output must end with a newline and split into four lines, with
        'Paragraph' and 'Text' on the second and third, neither carrying
        any surrounding whitespace.
        """
        renderer = GopherHTMLParser()
        renderer.feed("<p>Paragraph<br/>Text</p>")
        renderer.close()
        rendered = renderer.parsed

        # The paragraph is followed by a newline.
        assert rendered.endswith("\n")

        # One more piece than a plain short paragraph, because of the br.
        rows = rendered.split('\n')
        assert len(rows) == 4

        before_break = rows[1]
        assert before_break.strip() == "Paragraph"
        assert len(before_break) == len(before_break.strip())

        after_break = rows[2]
        assert after_break.strip() == 'Text'
        assert len(after_break) == len(after_break.strip())

コード例 #15

0

ファイルを表示

ファイル: test_html.py プロジェクト: khoulihan/gopher-render

    def test_dl_default(self):
        """
        Render a definition list with two terms using default settings.

        The output must start and end with a newline and split into eight
        lines. The definition lines (index 2, 5 and 6) start with ': ', and
        lines 1 through 6 are all 67 characters wide.
        """
        source = (
            "<dl><dt>One</dt><dd>Definition One</dd><dt>Two</dt>"
            "<dd>Definition Two One</dd><dd>Definition Two Two</dd></dl>"
        )
        renderer = GopherHTMLParser(optimise=False)
        renderer.feed(source)
        renderer.close()
        rendered = renderer.parsed

        assert rendered.startswith("\n")
        assert rendered.endswith("\n")

        rows = rendered.split('\n')
        assert len(rows) == 8

        # Definition belonging to the first term.
        assert rows[2].startswith(": ")

        # The two definitions belonging to the second term.
        for row in rows[5:7]:
            assert row.startswith(": ")
            assert len(row) == 67

        # Every row between the outer pieces is padded to full width.
        for row in rows[1:7]:
            assert len(row) == 67

コード例 #16

0

ファイルを表示

ファイル: test_html.py プロジェクト: khoulihan/gopher-render

    def test_nested_lists_default(self):
        """
        Render an unordered list nested inside an ordered list.

        The output must start and end with a newline and split into seven
        lines. The outer items are numbered ('1. ', '2. ', '3. '), the
        nested items start with '   * ', and every item line is 67
        characters wide.
        """
        html = "<ol><li>One</li><li>Two<ul><li>Two Point One</li><li>Two Point Two</li></ul></li><li>Three</li></ol>"
        parser = GopherHTMLParser(optimise=False)
        parser.feed(html)
        parser.close()
        output = parser.parsed

        assert output.startswith("\n")
        assert output.endswith("\n")

        lines = output.split('\n')
        assert len(lines) == 7

        # First two outer items, numbered from 1.
        for i in range(1, 3):
            assert lines[i].startswith("{}. ".format(i))
            assert len(lines[i]) == 67

        # Nested bullet items under the second outer item.
        for i in range(3, 5):
            assert lines[i].startswith("   * ")
            assert len(lines[i]) == 67

        # Third outer item. The prefix is a plain literal: the earlier
        # .format(i) call had no placeholder to fill and only passed a
        # stale loop variable.
        assert lines[5].startswith("3. ")
        assert len(lines[5]) == 67

コード例 #17

0

ファイルを表示

ファイル: test_html.py プロジェクト: khoulihan/gopher-render

    def test_p_tag_default_short(self):
        """
        Render a short paragraph with default settings.

        The output must end with a newline and split into three lines: the
        paragraph text with no surrounding whitespace on the second, and an
        empty third.
        """
        renderer = GopherHTMLParser()
        renderer.feed("<p>Paragraph Text</p>")
        renderer.close()
        rendered = renderer.parsed

        # The paragraph is followed by a newline.
        assert rendered.endswith("\n")

        # Three pieces in total, so nothing was wrapped.
        rows = rendered.split('\n')
        assert len(rows) == 3

        # An initial-line indent check is currently disabled:
        #assert lines[1].startswith(' ' * 8)

        text_row = rows[1]
        assert text_row.strip() == "Paragraph Text"
        assert len(text_row) == len(text_row.strip())
        assert rows[2] == ''

コード例 #18

0

ファイルを表示

ファイル: test_html.py プロジェクト: khoulihan/gopher-render

    def test_whitespace_around_tags(self):
        """
        Check that whitespace next to inline tags inside a paragraph is kept.

        The paragraph spans several source lines and contains em and strong
        tags; the rendered text line is compared against the expected text
        padded with spaces to 67 characters.
        """
        source_rows = [
            "<p>A first line,",
            "an <em>emphasised</em> second.",
            "<strong>Strong start </strong>to a third.",
            "</p>"
        ]
        renderer = GopherHTMLParser()
        renderer.feed("\n".join(source_rows))
        renderer.close()
        rendered = renderer.parsed

        rows = rendered.split('\n')
        assert len(rows) == 3

        # Expected paragraph text before padding. The double space after the
        # full stop is part of the expected output.
        text = "A first line, an _emphasised_ second.  **Strong start **to a third."
        # Pad on the right with spaces up to the 67-character width.
        expected = text.ljust(67)
        assert rows[1] == expected