def split_eduexp_block(text):
    """Split ``text`` into blocks using ``edu_reg`` as the boundary test.

    The work is delegated to ``divideModule.divideExpBlock``; this function
    only supplies the predicate, which flags line ``i`` whenever ``edu_reg``
    matches anywhere in that line.

    NOTE(review): presumably a flagged line opens a new block -- confirm
    against ``divideExpBlock``.
    NOTE(review): a second ``split_eduexp_block`` (keyed on ``timestamps``)
    also appears in this source; if both live in one module the later
    definition shadows this one -- verify.

    :param text: section text, forwarded unchanged to ``divideExpBlock``.
    :return: the value returned by ``divideExpBlock``.
    """

    def _matches_edu_pattern(idx, rows):
        # re.search yields a match object or None; report it as a plain bool.
        return re.search(edu_reg, rows[idx]) is not None

    return divideModule.divideExpBlock(text, isSplit=_matches_edu_pattern)
def split_skill_block(text):
    """Split ``text`` into blocks using ``skill_reg`` as the boundary test.

    The work is delegated to ``divideModule.divideExpBlock``; this function
    only supplies the predicate. A line is flagged when ``skill_reg`` matches
    somewhere in it, unless the line starts with the header text "技能名称"
    ("skill name").

    NOTE(review): presumably a flagged line opens a new block -- confirm
    against ``divideExpBlock``.
    NOTE(review): a second ``split_skill_block`` (keyed on proficiency
    words) also appears in this source; if both live in one module the later
    definition shadows this one -- verify.

    :param text: section text, forwarded unchanged to ``divideExpBlock``.
    :return: the value returned by ``divideExpBlock``.
    """

    def _is_skill_boundary(idx, rows):
        row = rows[idx]
        if re.search(skill_reg, row) is None:
            return False
        # A matching line that is just the column header is not a boundary.
        return not row.startswith(u"技能名称")

    return divideModule.divideExpBlock(text, isSplit=_is_skill_boundary)
def split_certificate_block(text):
    """Split ``text`` into blocks using ``certi_reg`` as the boundary test.

    The work is delegated to ``divideModule.divideExpBlock``; this function
    only supplies the predicate, which flags line ``i`` whenever
    ``certi_reg`` matches anywhere in that line.

    NOTE(review): presumably a flagged line opens a new block -- confirm
    against ``divideExpBlock``.

    :param text: section text, forwarded unchanged to ``divideExpBlock``.
    :return: the value returned by ``divideExpBlock``.
    """

    def _matches_certificate_pattern(idx, rows):
        # re.search yields a match object or None; report it as a plain bool.
        return re.search(certi_reg, rows[idx]) is not None

    return divideModule.divideExpBlock(
        text, isSplit=_matches_certificate_pattern
    )
def split_language_block(text):
    """Split ``text`` into blocks, one per line that begins with a language.

    The work is delegated to ``divideModule.divideExpBlock``; this function
    only supplies the predicate. A line is flagged when its first
    whitespace-delimited token is accepted by ``match_basic.match_language``.

    NOTE(review): presumably a flagged line opens a new block -- confirm
    against ``divideExpBlock``.

    :param text: section text, forwarded unchanged to ``divideExpBlock``.
    :return: the value returned by ``divideExpBlock``.
    """

    def _starts_with_language(idx, rows):
        # Raw string: "\s" in a plain literal is an invalid escape sequence
        # (a warning on current Python 3). The pattern itself is unchanged.
        # If the line starts with whitespace, re.split yields "" as the first
        # element, so the empty string is what gets tested.
        first_token = re.split(r"\s+", rows[idx])[0]
        return bool(match_basic.match_language(first_token))

    return divideModule.divideExpBlock(text, isSplit=_starts_with_language)
def split_eduexp_block(text):
    """Split ``text`` into blocks using the ``timestamps`` patterns.

    The work is delegated to ``divideModule.divideExpBlock``; this function
    only supplies the predicate, which flags line ``i`` as soon as any
    pattern in ``timestamps`` matches somewhere in that line.

    NOTE(review): presumably a flagged line opens a new block -- confirm
    against ``divideExpBlock``.
    NOTE(review): an earlier ``split_eduexp_block`` (keyed on ``edu_reg``)
    also appears in this source; if both live in one module this definition
    shadows it -- verify.

    :param text: section text, forwarded unchanged to ``divideExpBlock``.
    :return: the value returned by ``divideExpBlock``.
    """

    def _has_timestamp(idx, rows):
        # any() stops at the first matching pattern, like the explicit loop.
        return any(re.search(pattern, rows[idx]) for pattern in timestamps)

    return divideModule.divideExpBlock(text, isSplit=_has_timestamp)
def split_skill_block(text):
    """Split ``text`` into skill entries keyed on proficiency words.

    The proficiency words are 熟练 (proficient), 精通 (expert), 良好 (good)
    and 一般 (average). The function works in two passes:

    1. ``divideModule.divideExpBlock`` is called with a predicate that flags
       line ``i`` when the *next* line starts with a proficiency word, or
       when line ``i`` itself contains at least two characters, then
       whitespace, then a proficiency word.
    2. Each returned block is searched for two consecutive
       "<text><proficiency>" runs. On a match the block is replaced by the
       two stripped halves; otherwise it is kept as is. Only one such split
       is attempted per block.

    NOTE(review): presumably a flagged line opens a new block and each block
    is a string -- confirm against ``divideExpBlock``.
    NOTE(review): an earlier ``split_skill_block`` (keyed on ``skill_reg``)
    also appears in this source; if both live in one module this definition
    shadows it -- verify.

    :param text: section text, forwarded unchanged to ``divideExpBlock``.
    :return: list of blocks after the second pass.
    """
    # "\\s" keeps the same pattern text while avoiding the invalid "\s"
    # escape sequence in a non-raw literal.
    next_line_level = u"^(熟练|精通|良好|一般)"
    same_line_level = u".{2,}\\s+(熟练|精通|良好|一般)"
    two_entries = (
        u"(?P<o>(.+)(熟练|精通|良好|一般))(?P<t>(.+)(熟练|精通|良好|一般))"
    )

    def _is_skill_start(idx, rows):
        # The bounds check guards only the look-ahead; the current-line test
        # below always runs when the look-ahead does not match.
        has_next = idx + 1 < len(rows)
        if has_next and re.search(next_line_level, rows[idx + 1]):
            return True
        return bool(re.search(same_line_level, rows[idx]))

    exp_blocks = divideModule.divideExpBlock(text, isSplit=_is_skill_start)

    exp_blocks_final = []
    for block in exp_blocks:
        pair = re.search(two_entries, block)
        if pair:
            # Two entries ended up in one block: emit them separately.
            exp_blocks_final.append(pair.group("o").strip())
            exp_blocks_final.append(pair.group("t").strip())
        else:
            exp_blocks_final.append(block)
    return exp_blocks_final