/
fix_latin_raw_head_form.py
66 lines (55 loc) · 2.03 KB
/
fix_latin_raw_head_form.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
import pywikibot, re, sys, argparse
import blib
from blib import getparam, rmparam, msg, errandmsg, site, tname, pname
import lalib
pos_to_template = {
"noun form": "la-noun-form",
"noun forms": "la-noun-form",
"proper noun form": "la-proper noun-form",
"proper noun forms": "la-proper noun-form",
"pronoun form": "la-pronoun-form",
"pronoun forms": "la-pronoun-form",
"verb form": "la-verb-form",
"verb forms": "la-verb-form",
"adjective form": "la-adj-form",
"adjective forms": "la-adj-form",
"participle form": "la-part-form",
"participle forms": "la-part-form",
"numeral form": "la-numeral-form",
"numeral forms": "la-numeral-form",
"suffix form": "la-suffix-form",
"suffix forms": "la-suffix-form",
}
def process_text_on_page(index, pagename, text):
def pagemsg(txt):
msg("Page %s %s: %s" % (index, pagename, txt))
def errandpagemsg(txt):
errandmsg("Page %s %s: %s" % (index, pagename, txt))
pagemsg("Processing")
notes = []
parsed = blib.parse_text(text)
for t in parsed.filter_templates():
tn = tname(t)
if tn == "head" and getparam(t, "1") == "la":
pos = getparam(t, "2")
if pos not in pos_to_template:
pagemsg("WARNING: Saw unrecognized part of speech %s: %s" % (pos, str(t)))
continue
if getparam(t, "3") or getparam(t, "head"):
pagemsg("WARNING: Saw 3= or head=: %s" % str(t))
continue
origt = str(t)
t.add("1", pagename)
blib.set_template_name(t, pos_to_template[pos])
rmparam(t, "2")
t.add("FIXME", "1")
pagemsg("Replaced %s with %s" % (origt, str(t)))
notes.append("replace {{head|la|%s}} with {{%s}}" % (pos, tname(t)))
return str(parsed), notes
parser = blib.create_argparser("Fix Latin raw-form {{head|la|... form}} usages",
include_pagefile=True, include_stdin=True)
args = parser.parse_args()
start, end = blib.parse_start_end(args.start, args.end)
blib.do_pagefile_cats_refs(args, start, end, process_text_on_page, edit=True, stdin=True)