Ejemplo n.º 1
0
    along with Docket.  If not, see <http://www.gnu.org/licenses/>.
"""
import os, sys
from docket.explore import Explorer


if __name__ == '__main__':
    # Build the path to the xml file
    data_path = 'law_data/InnocentiveYear2005DCTExtract'
    xml_file = 'DCTInnoExtY20050420DCTInnoExtY20050420_N_DFEDDISTCV12_2015042064336.nxo.xml'
    path = os.path.join(os.getcwd(), data_path, xml_file)

    help_msg = ("""Usage: $ python -m docket tag-set: The set of all tags\n"""
        """       $ python -m docket grab <tag>: Grabs the text from tag\n""")

    x = Explorer(path)
    numargs = len(sys.argv)

    # Exit if no command line arguments
    if numargs > 1:
        op = sys.argv[1]
    else:
        print(help_msg)
        sys.exit(1)

    if op == 'tag-set':
        print("All Possible Tags:")
        for tag in x.tag_set():
            print(tag)
        sys.exit(0)
    elif op == 'grab':
Ejemplo n.º 2
0
 def setup_class(self):
     """Record where the XML extract lives and open it with ``Explorer``.

     Sets ``data_path``, ``xml_file``, ``path`` and ``x`` on ``self``; the
     path is resolved against the current working directory.
     """
     extract_dir = 'law_data/InnocentiveYear2005DCTExtract'
     extract_name = 'DCTInnoExtY20050420DCTInnoExtY20050420_N_DFEDDISTCV12_2015042064336.nxo.xml'
     full_path = os.path.join(os.getcwd(), extract_dir, extract_name)

     self.data_path, self.xml_file = extract_dir, extract_name
     self.path = full_path
     self.x = Explorer(full_path)
     print("SETUP!")
Ejemplo n.º 3
0
class TestExplorer(unittest.TestCase):
    """Check ``Explorer.tag_set()`` against a fixed docket XML extract.

    NOTE(review): ``setup_class`` / ``teardown_class`` are not the hook names
    unittest itself calls (``setUpClass`` / ``tearDownClass``); presumably the
    test runner in use (nose or pytest) invokes them -- confirm.
    """

    @classmethod
    def setup_class(cls):
        """Build the ``Explorer`` used by the tests and store it on the class.

        The extract path is resolved against the current working directory.
        """
        cls.data_path = 'law_data/InnocentiveYear2005DCTExtract'
        cls.xml_file = 'DCTInnoExtY20050420DCTInnoExtY20050420_N_DFEDDISTCV12_2015042064336.nxo.xml'
        cls.path = os.path.join(os.getcwd(), cls.data_path, cls.xml_file)
        cls.x = Explorer(cls.path)
        print("SETUP!")

    @classmethod
    def teardown_class(cls):
        """Drop the class-level ``Explorer`` created by ``setup_class``."""
        del cls.x
        print("TEAR DOWN!")

    def test_tag_set(self):
        """``tag_set()`` must equal the expected set of tag names."""
        print("Testing tag_set()")
        expected_tags = {
            'md.jurisdiction', 'n-metadata', 'knos.level1',
            'cause.block', 'number', 'judge', 'court.citelist',
            'md.jurisstate', 'case.type', 'md.title', 'col.key',
            'image.block', 'case.ref.to', 'md.jurisnum',
            'party.aka.block', 'md.subjects', 'state.source',
            'case.number.hidden', 'md.sourcepubid',
            'firm.fax.block', 'md.subject', 'court.pretty',
            'n-docbody', 'mlmd.judgment.record', 'md.doctype.name',
            'summary', 'party.type', 'court', 'n-metadoc',
            'party.block', 'docket.entry', 'n-document', 'state',
            'c', 'sct.jurisdiction.number', 'case.number.block',
            'party.terminated', 'jury.demand.block',
            'lead.docket.number', 'bop', 'knos.level2', 'bos',
            'case.status.flag', 'pc', 'docket.number',
            'n-extract-response', 'other.dockets.block',
            'md.contributors', 'n-field', 'gateway.image.link',
            'cta.jurisdiction.number', 'docket.block',
            'knos.level3.block', 'other.party', 'p', 'label',
            'md.uuid', 'nature.of.suit.code',
            'firm.address.combined', 'md.jurisabbrev',
            'court.block', 'firm.address.block', 'firm.phone.block',
            'md.pubid', 'eop', 'jurisdiction',
            'key.nature.of.suit.block', 'filing.date.block',
            'jury.demand', 'image.gateway.link', 'cite.query',
            'minor.link.metadata.block', 'party.name', 'city',
            'md.dates', 'md.createddatetime', 'firm.name.block',
            'docket.description', 'case.ref.to.block', 'link',
            'demand.amount', 'higher.court.information',
            'party.aka', 'number.block', 'jurisdiction.block',
            'panel.block', 'cause', 'knos.level2.block',
            'lead.docket.block', 'md.juriscourt', 'court.norm',
            'date', 'r', 'prism-clipdate', 'party.name.block',
            'title.block', 'knos.code', 'md.jurisdictions',
            'attorney.status', 'closed.date.block',
            'md.descriptions', 'docket.entries.block',
            'other.dockets', 'metadata.block', 'case.status.block',
            'scrape.date', 'md.filedate', 'md.docketnum',
            'convert.date', 'zip', 'firm.phone', 'md.publication',
            'party.attorney.block', 'attorney.terminated',
            'legacy.id', 'md.royalty', 'send.runner.link',
            'md.doctype.rank', 'private', 'case.number',
            'filing.date', 'closed.date', 'prism-stylesheet',
            'nature.of.suit.block', 'defendant.party',
            'attorney.name', 'data.source.type',
            'party.terminated.block', 'md.publications', 'firm.fax',
            'lead.docket.number.INF', 'md.doc.family.uuid',
            'md.westlawids', 'firm.name', 'platform', 'street',
            'md.judge', 'md.identifiers', 'md.publicationgroup',
            'knos.level1.block', 'md.infotype', 'md.royalty.code',
            'eos', 'nature.of.suit', 'demand.amount.block',
            'attorney.terminated.block', 'knos.level3',
            'md.royalty.number', 'cluster.name', 'md.jurislevel',
            'md.attorney', 'primary.title', 'plaintiff.party',
            'attorney.email',
        }

        # Use the TestCase's own assertion rather than the free function
        # ``assert_equals``: it needs no extra import and does not depend on
        # the deprecated ``assertEquals`` alias.
        self.assertEqual(self.x.tag_set(), expected_tags)
Ejemplo n.º 4
0
 def setup_class(self):
     """Locate the docket XML extract and wrap it in an ``Explorer``.

     Stores ``data_path``, ``xml_file``, ``path`` and ``x`` on ``self``; the
     file is looked up relative to the current working directory.
     """
     folder = 'law_data/InnocentiveYear2005DCTExtract'
     filename = 'DCTInnoExtY20050420DCTInnoExtY20050420_N_DFEDDISTCV12_2015042064336.nxo.xml'

     self.data_path = folder
     self.xml_file = filename
     self.path = location = os.path.join(os.getcwd(), folder, filename)
     self.x = Explorer(location)
     print("SETUP!")
Ejemplo n.º 5
0
class TestExplorer(unittest.TestCase):
    """Verify the tag names ``Explorer`` reports for a known XML extract.

    NOTE(review): the fixture hooks are named ``setup_class`` /
    ``teardown_class`` rather than unittest's ``setUpClass`` /
    ``tearDownClass``; presumably the runner in use (nose or pytest) calls
    them -- confirm.
    """

    @classmethod
    def setup_class(cls):
        """Create the ``Explorer`` for the extract and keep it on the class.

        The path is built from the current working directory, the data
        directory and the XML file name.
        """
        cls.data_path = 'law_data/InnocentiveYear2005DCTExtract'
        cls.xml_file = 'DCTInnoExtY20050420DCTInnoExtY20050420_N_DFEDDISTCV12_2015042064336.nxo.xml'
        cls.path = os.path.join(os.getcwd(), cls.data_path, cls.xml_file)
        cls.x = Explorer(cls.path)
        print("SETUP!")

    @classmethod
    def teardown_class(cls):
        """Remove the ``Explorer`` stored on the class by ``setup_class``."""
        del cls.x
        print("TEAR DOWN!")

    def test_tag_set(self):
        """The set returned by ``tag_set()`` must match the expected tags."""
        print("Testing tag_set()")
        test_set = {
            'md.jurisdiction', 'n-metadata', 'knos.level1', 'cause.block',
            'number', 'judge', 'court.citelist', 'md.jurisstate', 'case.type',
            'md.title', 'col.key', 'image.block', 'case.ref.to', 'md.jurisnum',
            'party.aka.block', 'md.subjects', 'state.source',
            'case.number.hidden', 'md.sourcepubid', 'firm.fax.block',
            'md.subject', 'court.pretty', 'n-docbody', 'mlmd.judgment.record',
            'md.doctype.name', 'summary', 'party.type', 'court', 'n-metadoc',
            'party.block', 'docket.entry', 'n-document', 'state', 'c',
            'sct.jurisdiction.number', 'case.number.block', 'party.terminated',
            'jury.demand.block', 'lead.docket.number', 'bop', 'knos.level2',
            'bos', 'case.status.flag', 'pc', 'docket.number',
            'n-extract-response', 'other.dockets.block', 'md.contributors',
            'n-field', 'gateway.image.link', 'cta.jurisdiction.number',
            'docket.block', 'knos.level3.block', 'other.party', 'p', 'label',
            'md.uuid', 'nature.of.suit.code', 'firm.address.combined',
            'md.jurisabbrev', 'court.block', 'firm.address.block',
            'firm.phone.block', 'md.pubid', 'eop', 'jurisdiction',
            'key.nature.of.suit.block', 'filing.date.block', 'jury.demand',
            'image.gateway.link', 'cite.query', 'minor.link.metadata.block',
            'party.name', 'city', 'md.dates', 'md.createddatetime',
            'firm.name.block', 'docket.description', 'case.ref.to.block',
            'link', 'demand.amount', 'higher.court.information', 'party.aka',
            'number.block', 'jurisdiction.block', 'panel.block', 'cause',
            'knos.level2.block', 'lead.docket.block', 'md.juriscourt',
            'court.norm', 'date', 'r', 'prism-clipdate', 'party.name.block',
            'title.block', 'knos.code', 'md.jurisdictions', 'attorney.status',
            'closed.date.block', 'md.descriptions', 'docket.entries.block',
            'other.dockets', 'metadata.block', 'case.status.block',
            'scrape.date', 'md.filedate', 'md.docketnum', 'convert.date',
            'zip', 'firm.phone', 'md.publication', 'party.attorney.block',
            'attorney.terminated', 'legacy.id', 'md.royalty',
            'send.runner.link', 'md.doctype.rank', 'private', 'case.number',
            'filing.date', 'closed.date', 'prism-stylesheet',
            'nature.of.suit.block', 'defendant.party', 'attorney.name',
            'data.source.type', 'party.terminated.block', 'md.publications',
            'firm.fax', 'lead.docket.number.INF', 'md.doc.family.uuid',
            'md.westlawids', 'firm.name', 'platform', 'street', 'md.judge',
            'md.identifiers', 'md.publicationgroup', 'knos.level1.block',
            'md.infotype', 'md.royalty.code', 'eos', 'nature.of.suit',
            'demand.amount.block', 'attorney.terminated.block', 'knos.level3',
            'md.royalty.number', 'cluster.name', 'md.jurislevel',
            'md.attorney', 'primary.title', 'plaintiff.party', 'attorney.email'
        }

        # The TestCase's built-in assertion replaces the free function
        # ``assert_equals``, which requires an external import and relies on
        # the deprecated ``assertEquals`` alias.
        self.assertEqual(self.x.tag_set(), test_set)
Ejemplo n.º 6
0
    along with Docket.  If not, see <http://www.gnu.org/licenses/>.
"""
import os, sys
from docket.explore import Explorer

if __name__ == '__main__':
    # Build the path to the xml file
    data_path = 'law_data/InnocentiveYear2005DCTExtract'
    xml_file = 'DCTInnoExtY20050420DCTInnoExtY20050420_N_DFEDDISTCV12_2015042064336.nxo.xml'
    path = os.path.join(os.getcwd(), data_path, xml_file)

    help_msg = (
        """Usage: $ python -m docket tag-set: The set of all tags\n"""
        """       $ python -m docket grab <tag>: Grabs the text from tag\n""")

    x = Explorer(path)
    numargs = len(sys.argv)

    # Exit if no command line arguments
    if numargs > 1:
        op = sys.argv[1]
    else:
        print(help_msg)
        sys.exit(1)

    if op == 'tag-set':
        print("All Possible Tags:")
        for tag in x.tag_set():
            print(tag)
        sys.exit(0)
    elif op == 'grab':