# coding: utf-8
import extract
import json
import re

# Whole-line category declaration: "[[Category:<name>]]", optionally followed
# by a "|..." suffix before the closing brackets (presumably the MediaWiki
# sort key -- confirm against the data).  Group 1 is the name without that
# suffix.  Written as a raw string so "\[", "\|" and "\]" reach the regex
# engine as-is instead of relying on Python passing unknown string escapes
# through unchanged.
_CATEGORY_DECLARATION = re.compile(r"^\[\[Category:(.*?)(|\|.*)\]\]$")

# Fetch the article once and share its lines between both passes below.
# NOTE(review): assumes extract.inp returns the same record for the same
# title on every call -- confirm against the extract module.
data = extract.inp(u"イギリス")
sentence = data["text"].split("\n")

# original
# Naive pass: for every line containing "Category", strip leading/trailing
# "[" and "]" characters and print the text between the first and second ":".
# Any "|..." suffix is left in the printed value.
for line in sentence:
    if "Category" in line:
        lie = line.strip("[]").split(":")
        # A line can mention "Category" without containing ":"; skip it
        # rather than fail with IndexError on lie[1].
        if len(lie) > 1:
            print(lie[1])

# Blank separator line between the two listings.  print("") is used because
# a bare print() would output "()" under Python 2.
print("")

# answer with regular expression
# Regex pass: only lines that consist entirely of a category declaration
# match, and only the bare category name (group 1) is printed.
for line in sentence:
    category_line = _CATEGORY_DECLARATION.search(line)
    if category_line is not None:
        print(category_line.group(1))
# coding: utf-8
import re
import json
import extract

# Matches a line that starts with "File:" or "ファイル:", followed by a name
# ending in ".jpg" that is immediately followed by "|".  Group 1 is that name
# (greedy, so it runs up to the last ".jpg|" on the line).
# Backslashes are doubled instead of using a raw literal: the pattern must be
# a unicode string for the Japanese prefix, and the ur"" prefix is not valid
# on Python 3.
_JPG_FILE_LINE = re.compile(u"^(?:File|ファイル):(.*\\.jpg)\\|")

# Load the article and split its text into lines.
data = extract.inp(u"イギリス")
data = data["text"].split("\n")

# Print the captured file name for every matching line.
for line in data:
    asd = _JPG_FILE_LINE.search(line)
    if asd is not None:
        print(asd.group(1))
# coding: utf-8
import extract
import json

# Title passed to extract.inp to obtain the article record.
f = u"イギリス"
data = extract.inp(f)

# Keep only the lines of the article text that contain the substring
# "Category", then print them in their original order.
matching_rows = [row for row in data["text"].split("\n") if "Category" in row]
for row in matching_rows:
    print(row)