Example #1
0
 def __init__(self, pinyin):
     """
     Build the handler on top of ParserBase and log a start message.

     :param pinyin: passed through unchanged to ParserBase.__init__.
     """
     ParserBase.__init__(self, pinyin)
     # NOTE: the initMapper() call is disabled in this constructor.
     # The logged text reads "ChongqingHandler construction started".
     start_message = u"ChongqingHandler构造开始"
     self.log.info(start_message)
Example #2
0
 def __init__(self, pinyin):
     """
     Build the handler on top of ParserBase and register extra ignored keys.

     :param pinyin: passed through unchanged to ParserBase.__init__.
     """
     ParserBase.__init__(self, pinyin)
     # self.ignore_key_list must already exist at this point
     # (presumably created by ParserBase -- confirm against the base class).
     extra_ignored_keys = ["gdxq_html", u'gdxx.详情']
     self.ignore_key_list.extend(extra_ignored_keys)
     # The logged text reads "LiaoningHandler construction complete".
     done_message = "LiaoningHandler 构造完成"
     self.log.info(done_message)
Example #3
0
 def __init__(self, pinyin):
     """
     Build the handler on top of ParserBase, then run initMapper().

     :param pinyin: passed through unchanged to ParserBase.__init__.
     """
     ParserBase.__init__(self, pinyin)
     self.initMapper()
     # The logged text reads "JiangsuHandler construction complete".
     done_message = "JiangsuHandler 构造完成"
     self.log.info(done_message)
Example #4
0
 def __init__(self, pinyin):
     """
     Build the handler on top of ParserBase, register extra ignored keys
     and three JSON mapper configurations.

     :param pinyin: passed through unchanged to ParserBase.__init__.
     """
     ParserBase.__init__(self, pinyin)

     extra_ignored_keys = [u"gdxq_html", u'gdxx.详情']
     self.ignore_key_list.extend(extra_ignored_keys)

     # (json key, field mapping) pairs, registered in exactly this order.
     # Each mapping also carries a 'primary_key' entry naming some of its
     # own fields as a comma separated string.
     json_mapper_configs = (
         (u'bgxx_json', {
             'altFiledName': u'bgxx.变更事项',
             'altBe': u'bgxx.变更前内容',
             'altAf': u'bgxx.变更后内容',
             'altDate': u'bgxx.变更日期',
             'primary_key': 'altDate, altFiledName, altAf'
         }),
         (u'baxx_json', {
             'name': u'baxx.姓名',
             'position': u'baxx.职务',
             'primary_key': 'name, position'
         }),
         (u'fzjg_json', {
             'regNO': u'fzjg.注册号',
             'brName': u'fzjg.名称',
             'regOrg': u'fzjg.登记机关',
             'primary_key': 'regNO, brName'
         }),
     )
     for json_key, field_mapping in json_mapper_configs:
         self.appendJsonMapperConfig(json_key, field_mapping)

     # The logged text reads "GuangdongHandler construction complete".
     self.log.info(u"GuangdongHandler 构造完成")
    def __init__(self, special_list=None,
                 in_path='/u/arvie/PHD/Neural_Language_Models/penn_tree_bank_data/',
                 out_root='/u/arvie/PHD/Neural_Language_Models/penn_tree_bank_data/out/'):
        """
        Set up the input/output locations and the data file names.

        :param special_list: forwarded to ParserBase.__init__ as
            ``special_list``. When omitted (or None) a fresh empty list is
            created for this instance.
        :param in_path: stored as ``self.data_in_path``.
        :param out_root: stored as ``self.data_out_root``.
        """
        # A literal ``[]`` default is evaluated once and would be the same
        # list object for every instance built without an explicit argument.
        if special_list is None:
            special_list = []
        ParserBase.__init__(self, special_list=special_list)

        self.data_in_path = in_path
        self.data_out_root = out_root
        # Called after both paths are assigned and before the file names
        # are set; that ordering is kept as it was.
        self.update_out_path()

        self.data_files = ['train.txt', 'valid.txt', 'test.txt']
        # Equals len('.txt'), the extension of the files above.
        self.extention_length = 4
    def __init__(self, special_list=None,
                 in_path='/u/arvie/PHD/Neural_Language_Models/botha_data/icml14-data/',
                 out_root='/u/arvie/PHD/Neural_Language_Models/botha_data/out/'):
        """
        Set up the input/output locations, file names and data set names.

        :param special_list: forwarded to ParserBase.__init__ as
            ``special_list``. When omitted (or None) a fresh empty list is
            created for this instance.
        :param in_path: stored as ``self.data_in_path`` and
            ``self.data_in_path_original``.
        :param out_root: stored as ``self.data_out_root`` and
            ``self.data_out_root_original``.
        """
        # A literal ``[]`` default is evaluated once and would be the same
        # list object for every instance built without an explicit argument.
        if special_list is None:
            special_list = []
        ParserBase.__init__(self, special_list=special_list)

        self.data_in_path = in_path
        self.data_out_root = out_root
        # The initial values are also kept under separate "_original" names.
        self.data_in_path_original = in_path
        self.data_out_root_original = out_root

        self.data_files = ['train.in', 'test.in', 'finaltest.in']
        # Equals len('.in'), the extension of the files above.
        self.extention_length = 3

        # In each pair the data set language is the second one,
        # i.e. en, cs, de, es, fr, ru.
        self.data_set_languages = ['cs-en', 'en-cs', 'en-de', 'en-es', 'en-fr', 'en-ru']
        self.data_sets = ['1m-mono', 'mono']
Example #7
0
    def __init__(self, pinyin):
        """
        Build the handler on top of ParserBase, register extra ignored keys
        and install the result mapper configuration.

        :param pinyin: passed through unchanged to ParserBase.__init__.
        """
        ParserBase.__init__(self, pinyin)

        extra_ignored_keys = ["gdxq_html", u'gdxx.详情']
        self.ignore_key_list.extend(extra_ignored_keys)

        # Pattern-like keys (Chinese section titles followed by ".*") mapped
        # to short prefixed targets. Entry order is kept as written.
        # NOTE(review): one entry targets "gdxq.*" while the neighbouring
        # shareholder/investor entries target "gdxx.*" -- confirm intended.
        section_to_target = {
            u"合伙人信息.*": u"gdxx.*",
            u"基本信息.*": ".*",
            u"股东信息.*": u"gdxx.*",
            u"股东及出资信息.*": u"gdxx.*",
            u"投资人信息.*": u"gdxx.*",
            u"投资人及出资信息.*": u"gdxq.*",
            u"发起人.*": u"gdxx.*",
            u"变更信息.*": u"bgxx.*",
            u"主要人员信息.*": u"baxx.*",
            u"备案信息.*": u"baxx.*",
            u"成员名册.*": u"baxx.*",
            u"分支机构信息.*": u"fzjg.*",
            u"行政处罚信息.*": u"xzcf.*"
        }
        self.rslt_mapper_config = section_to_target

        # The logged text reads "SiChuanHandler construction complete".
        done_message = u"SiChuanHandler 构造完成"
        self.log.info(done_message)
Example #8
0
 def __init__(self, pinyin):
     """
     Build the handler on top of ParserBase and log completion.

     :param pinyin: passed through unchanged to ParserBase.__init__.
     """
     ParserBase.__init__(self, pinyin)
     # The logged text reads "NeimengguHandler construction complete".
     done_message = u"NeimengguHandler 构造完成"
     self.log.info(done_message)
Example #9
0
 def __init__(self, pinyin):
     """
     Build the handler on top of ParserBase and register extra ignored keys.

     :param pinyin: passed through unchanged to ParserBase.__init__.
     """
     ParserBase.__init__(self, pinyin)
     # self.ignore_key_list must already exist at this point
     # (presumably created by ParserBase -- confirm against the base class).
     extra_ignored_keys = [u"gdxq_html", u'gdxx.详情']
     self.ignore_key_list.extend(extra_ignored_keys)
     # The logged text reads "HainanHandler construction complete".
     done_message = u"HainanHandler 构造完成"
     self.log.info(done_message)
Example #10
0
 def __init__(self, pinyin):
     """
     Build the handler on top of ParserBase and log completion.

     :param pinyin: passed through unchanged to ParserBase.__init__.
     """
     ParserBase.__init__(self, pinyin)
     # The logged text reads "HeilongjiangHandler construction complete".
     done_message = u"HeilongjiangHandler 构造完成"
     self.log.info(done_message)