def test_extract_phrases():
    phrases = [("machine",), ("machine", "learning"), ("algorithm",)]
    phrase_map = tokenization._build_phrase_map(phrases)
    sentence = "the new machine learning algorithm".split()

    # "keep" leaves out-of-vocabulary tokens unchanged
    all_phrases = tokenization._extract_phrases(phrase_map, sentence, "keep")
    assert all_phrases == [
        ("the",),
        ("new",),
        ("machine", "learning"),
        ("algorithm",),
    ]

    # out-of-vocabulary tokens are replaced by the placeholder token
    all_phrases = tokenization._extract_phrases(
        phrase_map, sentence, tokenization.OUT_OF_VOC_TOKEN
    )
    assert all_phrases == [
        (tokenization.OUT_OF_VOC_TOKEN,),
        (tokenization.OUT_OF_VOC_TOKEN,),
        ("machine", "learning"),
        ("algorithm",),
    ]

    # "[]" and "{}" wrap out-of-vocabulary tokens in the given delimiters
    all_phrases = tokenization._extract_phrases(phrase_map, sentence, "[]")
    assert all_phrases == [
        ("[the]",),
        ("[new]",),
        ("machine", "learning"),
        ("algorithm",),
    ]

    all_phrases = tokenization._extract_phrases(phrase_map, sentence, "{}")
    assert all_phrases == [
        ("{the}",),
        ("{new}",),
        ("machine", "learning"),
        ("algorithm",),
    ]
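
# A minimal sketch of the greedy phrase extraction the test above exercises
# (not the actual implementation in `tokenization`): at each position it
# follows the phrase-map trie as far as possible and keeps the longest match
# whose end is marked by the "" key. Unmatched tokens are handled according
# to `out_of_voc`: "keep" leaves them as-is, a two-character string such as
# "[]" is treated here as a pair of wrapping delimiters (an assumption
# inferred from the assertions), and any other string replaces the token.
def _extract_phrases_sketch(phrase_map, sentence, out_of_voc):
    result, i = [], 0
    while i < len(sentence):
        node, best_end = phrase_map, None
        for j in range(i, len(sentence)):
            if sentence[j] not in node:
                break
            node = node[sentence[j]]
            if "" in node:
                best_end = j + 1  # longest complete phrase seen so far
        if best_end is not None:
            result.append(tuple(sentence[i:best_end]))
            i = best_end
        else:
            token = sentence[i]
            if out_of_voc == "keep":
                result.append((token,))
            elif len(out_of_voc) == 2:
                result.append((out_of_voc[0] + token + out_of_voc[1],))
            else:
                result.append((out_of_voc,))
            i += 1
    return result
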
def test_build_phrase_map():
    phrases = [
        ("machine", "learning"),
        ("default", "mode", "network"),
        ("resting", "state"),
        ("learning",),
        ("network",),
        ("brain",),
        ("machine",),
        ("speech", "perception"),
        ("speech", "production"),
        ("speech",),
    ]
    phrase_map = tokenization._build_phrase_map(phrases)
    assert phrase_map == {
        "brain": {"": {}},
        "default": {"mode": {"network": {"": {}}}},
        "learning": {"": {}},
        "machine": {"": {}, "learning": {"": {}}},
        "network": {"": {}},
        "resting": {"state": {"": {}}},
        "speech": {"": {}, "perception": {"": {}}, "production": {"": {}}},
    }
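
# A minimal sketch of the nested-dict trie the assertion above spells out
# (again, not the actual `tokenization._build_phrase_map`): each phrase is
# inserted word by word, and an empty-string key marks every position where
# a complete phrase ends, which is how ("machine",) and ("machine", "learning")
# can coexist under the same root key.
def _build_phrase_map_sketch(phrases):
    phrase_map = {}
    for phrase in phrases:
        node = phrase_map
        for word in phrase:
            node = node.setdefault(word, {})
        node[""] = {}  # terminal marker for a complete phrase
    return phrase_map
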