Python build_whole_regtree示例，regparser.tree.build.build_whole_regtree Python示例

示例#1

0

显示文件

文件： tree_build_tests.py 项目： cfpb/regulations-parser

    def test_build_whole_regtree_missing_interp(self):
        """Not all regs have an interpretation section."""
        text = "PART 200-Regulation Q\n"
        text += u"§ 200.1 First section.\n"
        text += "Section content\n"
        text += "Appendix A to Part 200 - Appendix Title\n"
        text += "Appendix content"

        node200_1 = Node("\nSection content\n", label=['200', '1'],
                         title=u"§ 200.1 First section.", children=[],
                         node_type=Node.REGTEXT)
        nodeA = Node("\nAppendix content", label=["200", "A"],
                     title="Appendix A to Part 200 - Appendix Title",
                     children=[], node_type=Node.APPENDIX)
        nodeEP = Node('', label=['200', 'Subpart'], title='',
                      children=[node200_1], node_type=Node.EMPTYPART)

        #   Convert to JSON so we can ignore some unicode issues
        enc = NodeEncoder(sort_keys=True)
        self.assertEqual(
            enc.encode(build.build_whole_regtree(text)),
            enc.encode(Node("\n", label=["200"], title="PART 200-Regulation Q",
                            children=[nodeEP, nodeA]))
        )

示例#2

0

显示文件

文件： builder.py 项目： khandelwal/regulations-parser

 def reg_tree(reg_str):
     if reg_str[:1] == '<':  # XML
         return reg_text.build_tree(reg_str)
     else:
         return build_whole_regtree(reg_str)

示例#3

0

显示文件

 def reg_tree(reg_str):
     if reg_str[:1] == '<':  # XML
         return reg_text.build_tree(reg_str)
     else:
         return build_whole_regtree(reg_str)

示例#4

0

显示文件

文件： tree_build_tests.py 项目： cfpb/regulations-parser

    def test_build_whole_regtree(self):
        """Integration test for the plain-text regulation tree parser"""
        text = "PART 200-Regulation Q\n"
        text += u"§ 200.1 First section.\n"
        text += "(a) First par\n"
        text += "(b) Second par\n"
        text += u"§ 200.2 Second section.\n"
        text += "Content without sub pars\n"
        text += "Appendix A to Part 200 - Appendix Title\n"
        text += "A-1 Appendix 1\n"
        text += "(a) Appendix par 1\n"
        text += "Supplement I to Part 200 - Official Interpretations\n"
        text += "Section 200.2 Second section\n"
        text += "2(a)(5) First par\n"
        text += "1. Commentary 1\n"
        text += "2. Commentary 2\n"

        node201 = Node(
            "\n", label=['200', '1'], title=u"§ 200.1 First section.",
            children=[Node(u"(a) First par\n", label=["200", "1", "a"]),
                      Node(u"(b) Second par\n", label=["200", "1", "b"])])
        node202 = Node("\nContent without sub pars\n", label=["200", "2"],
                       title=u"§ 200.2 Second section.")
        nodeA = Node(
            "\n", label=["200", "A"], node_type=Node.APPENDIX,
            title="Appendix A to Part 200 - Appendix Title", children=[
                Node("\n",
                     label=["200", "A", "1"],
                     title="A-1 Appendix 1",
                     node_type=Node.APPENDIX,
                     children=[Node("(a) Appendix par 1\n",
                                    node_type=Node.APPENDIX,
                                    label=["200", "A", "1", "a"])])
            ]
        )
        nodeI1 = Node('1. Commentary 1\n', node_type=Node.INTERP,
                      label=['200', '2', 'a', '5', Node.INTERP_MARK, '1'])
        nodeI2 = Node('2. Commentary 2\n', node_type=Node.INTERP,
                      label=['200', '2', 'a', '5', Node.INTERP_MARK, '2'])
        nodeI = Node(
            '\n', label=['200', Node.INTERP_MARK], node_type=Node.INTERP,
            title='Supplement I to Part 200 - Official Interpretations',
            children=[
                Node('\n', label=['200', '2', Node.INTERP_MARK],
                     node_type=Node.INTERP,
                     title='Section 200.2 Second section',
                     children=[
                         Node('\n', label=['200', '2', 'a', '5',
                                           Node.INTERP_MARK],
                              node_type=Node.INTERP, title='2(a)(5) First par',
                              children=[nodeI1, nodeI2])])
            ]
        )
        nodeEP = Node('', label=['200', 'Subpart'], title='',
                      children=[node201, node202], node_type=Node.EMPTYPART)

        #   Convert to JSON so we can ignore some unicode issues
        enc = NodeEncoder(sort_keys=True)
        self.assertEqual(
            enc.encode(build.build_whole_regtree(text)),
            enc.encode(Node("\n", label=["200"], title="PART 200-Regulation Q",
                            children=[nodeEP, nodeA, nodeI]))
        )

示例#5

0

显示文件

文件： build_from.py 项目： dclegalhackers/regulations-parser

if __name__ == "__main__":
    if len(sys.argv) < 6:
        print("Usage: python build_from.py regulation.txt title "
              + "notice_doc_# act_title act_section (Generate diffs? "
              + "True/False)")
        print("  e.g. python build_from.py rege.txt 12 2011-31725 15 1693 "
              + "False")
        exit()

    writer = api_writer.Client()

    with codecs.open(sys.argv[1], encoding='utf-8') as f:
        reg = unicode(f.read())

    #   First, the regulation tree
    reg_tree = build_whole_regtree(reg)
    cfr_part = reg_tree.label_id()
    cfr_title = sys.argv[2]
    doc_number = sys.argv[3]
    #   Hold off on writing the regulation until after we know we have a valid
    #   doc number

    #   Next, notices
    notices = fetch_notices(cfr_title, cfr_part)
    modify_effective_dates(notices)
    notices = applicable_notices(notices, doc_number)
    #  Didn't include the provided version
    if not notices:
        print "Could not find notice_doc_#, %s" % doc_number
        exit()
    for notice in notices: