Python find_key_val_line示例

编程语言: Python

命名空间/包名称: wikipedia_parser.infobox.wikitext_helpers

方法/功能: find_key_val_line

hotexamples.com的示例: 2

Python find_key_val_line - 共找到 2 个示例。以下是从开源项目中提取的、评分最高的 wikipedia_parser.infobox.wikitext_helpers.find_key_val_line 真实 Python 代码示例。您可以为示例评分，帮助我们提高示例质量。

示例#1

显示文件

文件： wikitext_parser.py 项目： ijjoyce/wikipedia_parser

def get_simple_text(wtext, key, clean=True):
    """Return the text stored under ``key`` in the wikitext, or a falsy value.

    Args:
        wtext: Raw wikitext to search.
        key: A single key, or a list of candidate keys tried in order.
        clean: When true, a found value is passed through
            ``clean_help.clean_text`` before being returned.

    Returns:
        The value found for the first key that yields a truthy result.
        If no key yields one, the last falsy value seen is returned
        (``None`` when nothing was ever looked up).
    """
    # isinstance (rather than an exact type check) so list subclasses are
    # treated as a list of candidate keys instead of one unhashable key.
    keys = key if isinstance(key, list) else [key]

    template_dict = adapter.template_dict(wtext)
    wtext_lines = wtext_help.get_wtext_lines(wtext)

    text = None
    for possible_key in keys:
        # First choice: the value from the parsed template dict.
        if template_dict:
            text = template_dict.get(possible_key)

        # Fallback: find a "key = value" line among the wikitext lines.
        # NOTE(review): the lines are passed here (not the raw string) to
        # match the guard above and the call in extract_page_links; confirm
        # against find_key_val_line's signature.
        if not text and wtext_lines:
            matched_line = wtext_help.find_key_val_line(wtext_lines, possible_key)
            if matched_line:
                # Split on the first "=" only, so values containing "="
                # are kept whole.
                key_val = matched_line.strip(' \t\n\r').split("=", 1)
                if len(key_val) == 2:
                    text = key_val[1].strip()

        # Later keys could not change the result once a value is found.
        if text:
            break

    if text and clean:
        text = clean_help.clean_text(text)

    return text

示例#2

显示文件

文件： wikitext_parser.py 项目： ijjoyce/wikipedia_parser

def extract_page_links(wtext, key):
    """Return the page titles linked from the value stored under ``key``.

    Args:
        wtext: Raw wikitext to search.
        key: A single key, or a list of candidate keys tried in order.

    Returns:
        A list of link targets (the text before any ``|`` inside each
        ``[[...]]``) taken from the first key that yields at least one
        link, or an empty list when no key does.
    """
    # isinstance (rather than an exact type check) so list subclasses are
    # treated as a list of candidate keys instead of one unhashable key.
    keys = key if isinstance(key, list) else [key]

    template_dict = adapter.template_dict(wtext)
    wtext_lines = wtext_help.get_wtext_lines(wtext)

    links = []
    for possible_key in keys:
        # First choice: the value from the parsed template dict.
        if template_dict:
            value = template_dict.get(possible_key)
            if value:
                links = _wikilink_targets(value)

        # Fallback: find a "key = value" line among the wikitext lines.
        if not links and wtext_lines:
            matched_line = wtext_help.find_key_val_line(wtext_lines, possible_key)
            if matched_line:
                # Split on the first "=" only: values often contain "="
                # themselves (e.g. <ref name="...">), and an unbounded
                # split would make the length check fail and drop links.
                key_val = matched_line.strip(' \t\n\r').split("=", 1)
                if len(key_val) == 2:
                    links = _wikilink_targets(key_val[1].strip())

        # Later keys could not change the result once links are found.
        if links:
            break

    return links


def _wikilink_targets(text):
    """Return the target of every ``[[target|label]]`` link in ``text``."""
    # Raw string: "\[" in a normal literal is an invalid escape sequence.
    matches = re.findall(r"\[\[(.*?)\]\]", text)
    return [link.split("|", 1)[0] for link in matches]