-
Notifications
You must be signed in to change notification settings - Fork 0
/
correct_simplified.py
91 lines (86 loc) · 1.62 KB
/
correct_simplified.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
import sys
# Lookup table used by correct(): upper-cased input label -> simplified label.
# An empty-string value means the label has no simplified counterpart.
# NOTE(review): value casing is mixed (e.g. 'MT' vs 'ne'); it is reproduced
# exactly as found -- confirm with the consumer of the output before
# normalising it.
correct_registers = {
    # Labels that keep their own two-letter code.
    'MT': 'MT',
    'NA': 'NA',
    'LY': 'LY',
    'SP': 'SP',
    'ID': 'ID',
    'IT': 'IT',
    'NE': 'ne',
    'SR': 'sr',
    'RE': 're',
    'HI': 'HI',
    'EN': 'en',
    'RA': 'ra',
    'FI': 'fi',
    'LT': 'lt',
    'IN': 'IN',
    'RV': 'rv',
    'OB': 'ob',
    'RS': 'rs',
    'AV': 'av',
    'OP': 'OP',
    'DS': 'ds',
    'ED': 'ed',
    'IP': 'IP',  # up to here: the labels that remain the same
    # Labels that are merged into another label or mapped to ''.
    'HT': '',
    'RP': '',
    'IB': '',
    'CM': '',
    'OI': '',
    'OH': '',
    'JD': 'dtp',
    'PO': '',
    'OO': '',
    'TR': '',
    'AD': '',
    'LE': '',
    'MA': '',
    'ON': '',
    'OE': '',
    'OF': '',
    'FH': 'fi',  # FAQ about how-to, combined with informational FAQ
    'FA': 'fi',  # FAQ for some languages
    'EB': 'ed',  # news blogs / editorials under IP
    'TS': '',
    'OL': '',
    'SL': '',
    'PR': '',
    'OS': '',
    'TA': '',
    'TV': '',
    'FS': '',
    'RR': '',
    'QA': '',
    'DF': '',
    'TB': 'nb',
    'PB': 'nb',
    'CB': 'nb',
    'OA': '',
    'SS': '',
    'FC': '',
    'DT': 'dtp',
    'DP': 'dtp',
    'PA': '',
    'HA': '',
    'SO': '',
    'IG': '',
}
def correct(tags):  # can include several
    """Map a line of space-separated labels to their simplified forms.

    The input is stripped and upper-cased, the special ``IG`` label is
    resolved, and each remaining label is looked up in ``correct_registers``.

    Args:
        tags: One or more labels separated by single spaces. Surrounding
            whitespace (such as a trailing newline) is ignored.

    Returns:
        The looked-up values joined by single spaces. A label whose value is
        the empty string still occupies a position, so the result may contain
        leading, trailing or doubled spaces. A label that is missing from
        ``correct_registers`` is treated the same way (empty string); before
        this, the ``None`` returned by the lookup made ``str.join`` raise
        ``TypeError``.
    """
    tags = tags.strip().upper()
    # "IG" becomes "IP" when "DS" also occurs in the line, otherwise it is
    # removed. Both tests are substring tests on the whole line.
    if "IG" in tags:
        tags = tags.replace("IG", "IP" if "DS" in tags else "")
    # Strip again: removing "IG" can leave whitespace at either end.
    # Empty pieces produced by consecutive spaces are skipped.
    return " ".join(
        correct_registers.get(label, "")
        for label in tags.strip().split(" ")
        if label
    )
# Filter mode: read label lines from standard input and print the simplified
# labels for each one, in order, one output line per input line.
for simplified in map(correct, sys.stdin):
    print(simplified)