Coverage for src / wiktextract / tags.py: 79%

33 statements  

« prev     ^ index     » next       coverage.py v7.14.0, created at 2026-05-11 04:48 +0000

1# -*- fundamental -*- 

2# 

3# Lists of valid tags and mappings for tags canonicalization. 

4# 

5# Copyright (c) 2020-2022 Tatu Ylonen. See file LICENSE and https://ylonen.org 

6 

7import re 

8 

9# Mappings for tags in template head line ends outside parentheses. These are 

10# also used to parse final tags from translations. 

xlat_head_map = {
    # Maps raw gender/number/animacy/aspect/noun-class abbreviations, as they
    # appear at the end of a head line (outside parentheses) or at the end of
    # a translation, to space-separated canonical tags. Values that start
    # with "?" and entries marked XXX are kept exactly as the original
    # authors left them.
    "m": "masculine",
    "f": "feminine",
    "m/f": "masculine feminine",
    "m./f.": "masculine feminine",
    "m or f": "masculine feminine",
    "m or n": "masculine neuter",
    "m or c": "masculine common-gender",
    "f or m": "feminine masculine",
    "f or n": "feminine neuter",
    "f or n.": "feminine neuter",  # fimmtíu/Icelandic
    "f or c": "feminine common-gender",  # sustainability/Tr/Norwegian
    "n or f": "neuter feminine",
    "n or m": "neuter masculine",
    "n or c": "neuter common-gender",
    "c or m": "common-gender masculine",
    "c or f": "common-gender feminine",  # picture book/Tr/Norwegian
    "c or n": "common-gender neuter",  # ethylene/Eng/Tr/Danish
    "m or f or n": "masculine feminine neuter",
    "f or m or n": "feminine masculine neuter",
    "m or f or c": "masculine feminine common-gender",
    "f or m or c": "feminine masculine common-gender",
    "m or c or n": "masculine common-gender neuter",
    "f or c or n": "feminine common-gender neuter",
    "m or n or c": "masculine neuter common-gender",
    "f or n or c": "feminine neuter common-gender",
    "c or f or n": "common-gender feminine neuter",
    "c or m or n": "common-gender masculine neuter",
    "n or f or c": "neuter feminine common-gender",
    "n or m or c": "neuter masculine common-gender",
    "n or m or f": "neuter masculine feminine",
    "n or f or m": "neuter feminine masculine",
    "c or m or f": "common-gender masculine feminine",
    "c or f or m": "common-gender masculine feminine",
    "f or n or m": "feminine neuter masculine",
    "m or n or f": "masculine neuter feminine",  # cataract/Tr/Dutch
    "f or c or m": "feminine common-gender masculine",
    "m or c or f": "masculine common-gender feminine",
    "m or f or m": "?masculine feminine",  # fantasma,soldado/Portuguese
    "m pl": "masculine plural",
    "f pl": "feminine plural",
    "n pl": "neuter plural",
    "m sg": "masculine singular",
    "f sg": "feminine singular",
    "n sg": "neuter singular",
    # "f or pl": "feminine singular plural", # XXX information/Eng/Tr/Latgalian
    # "m or pl": "masculine singular plural", # XXX information/Eng/Tr/Latga...
    # "n or pl": "neuter singular plural", # XXX table scrap/Tr/Greek
    # "c or pl": "common-gender singular plural",
    "pl or f": "feminine singular plural",  # XXX grit/Eng/Tr(husked...)/German
    "pl or m": "masculine singular plural",
    "pl or n": "neuter singular plural",  # ordnance/Tr/German
    "pl or c": "common-gender singular plural",  # "you don't say"/Tr/Romanian
    "sg or f": "singular feminine",
    "sg or m": "singular masculine",
    "sg or n": "singular neuter",
    "sg or c": "singular common-gender",
    # "m or sg": "masculine singular",
    "f or sg": "feminine singular",
    # "m or sg": "neuter singular",
    "c or sg": "common-gender singular",
    "m or pl": "masculine plural",
    "f or pl": "feminine plural",
    "n or pl": "neuter plural",
    "c or pl": "common-gender plural",
    "m or f pl": "masculine feminine plural",
    "c or n or n pl": "common-gender neuter singular plural",  # XXX augmentation/Tr
    "pl or m or f": "masculine feminine singular plural",  # XXX suc* my co*/Tr
    "m or f or sg or pl": "masculine feminine singular plural",  # Ainu/Russian
    "m or f or pl": "masculine feminine plural",  # that/Tr/Dutch
    "m or f sg": "masculine feminine singular",
    "pl or f or m or n": "",  # Sindhi/Tr(language)/Spanish
    "pl or f or n": "masculine feminine neuter plural singular singular",  # XXX
    # crush/Portuguese head
    "m or m f": "?masculine feminine",
    # beginner/Eng/Tr/Polish
    "m or m pl": "masculine singular plural",
    "f or f pl": "feminine singular plural",
    "n or n pl": "neuter singular plural",
    "c or c pl": "common-gender singular plural",
    "f pl or n pl": "feminine neuter plural",  # diurnal/Eng/Tr/Polish
    "f pl or n or n pl": "feminine neuter singular plural",  # veneral/Tr/Polish
    "m or m pl or f or f pl or n or n pl": "",  # "a lot"/Tr/Latin
    "pl or n or n pl": "neuter singular plural",  # salt/Tr/Greek
    "f or f": "feminine",
    "topo.": "toponymic",  # E.g., p/Egyptian
    "n": "neuter",
    "c": "common-gender",  # common gender in at least West Frisian
    "sg": "singular",
    "pl": "plural",
    "pl or sg": "plural singular",
    "sg or pl": "singular plural",
    "m sg or m pl": "masculine singular plural",  # valenki/Tr/German
    "f sg or f pl": "feminine singular plural",
    "n sg or n pl": "neuter singular plural",
    "c sg or c pl": "common-gender singular plural",
    "m pl or f pl": "masculine feminine plural",  # comedian/English/Tr/Welsh
    "m pl or n pl": "masculine neuter plural",  # whose/Tr/Latin
    "m pl or n": "?masculine neuter plural singular",  # pimpernel/Tr/Bulgarian
    "m sg or f sg": "masculine singular feminine",  # your/Eng/Tr/Walloon
    "f sg or m sg": "masculine singular feminine",  # your/Eng/Tr/Walloon
    # Both halves of the key are neuter singular; the value used to be a
    # copy of the masculine/feminine entries above.
    "n sg or n sg": "neuter singular",
    "n sg or m sg": "neuter masculine singular",  # vulgus/Latin
    # copacetic/English/Tr/Hebrew:
    "m or m pl or f or f pl": "masculine feminine singular plural",
    # your/Eng/Tr/Norwegian:
    "m pl or f pl or n pl": "masculine feminine neuter plural",
    "m sg or f sg or n sg": "masculine feminine neuter singular",
    "m pl or f or f pl": "masculine feminine singular plural",
    "c pl or n pl": "common-gender neuter plural",  # which/Tr/Danish
    "inan": "inanimate",
    "Inanimate": "inanimate",  # e.g., "James Bay"/English/Tr/Northern East Cree
    "inan or anim": "inanimate animate",
    "anim or inan": "animate inanimate",
    "anim": "animate",
    "f anim": "feminine animate",
    "m anim": "masculine animate",
    "n anim": "neuter animate",
    "f inan": "feminine inanimate",
    "m inan": "masculine inanimate",
    "n inan": "neuter inanimate",
    "f anim sg": "feminine animate singular",
    "m anim sg": "masculine animate singular",
    "n anim sg": "neuter animate singular",
    "f inan sg": "feminine inanimate singular",
    "m inan sg": "masculine inanimate singular",
    "n inan sg": "neuter inanimate singular",
    "f anim pl": "feminine animate plural",
    "m anim pl": "masculine animate plural",
    "n anim pl": "neuter animate plural",
    "f inan pl": "feminine inanimate plural",
    "m inan pl": "masculine inanimate plural",
    "n inan pl": "neuter inanimate plural",
    "f anim or f inan": "feminine animate inanimate",
    "f inan or f anim": "feminine inanimate animate",
    "m anim or m inan": "masculine animate inanimate",
    "m inan or m anim": "masculine inanimate animate",
    "m anim or f anim": "masculine animate feminine",
    # NOTE(review): "anum" looks like a typo of "anim"; the correctly spelled
    # key "f anim or m anim" is listed further down with the same value. The
    # misspelled key is kept so that existing lookups keep working.
    "f anim or m anum": "feminine animate masculine",
    "f inan or f inan pl": "feminine inanimate singular plural",
    "m inan or m inan pl": "masculine inanimate singular plural",
    "n inan or n inan pl": "neuter inanimate singular plural",
    "n inan or m inan": "neuter masculine inanimate",
    "f anim or f anim pl": "feminine animate singular plural",
    "m anim or m anim pl": "masculine animate singular plural",
    "n anim or n anim pl": "neuter animate singular plural",
    "f anim or m anim": "feminine animate masculine",
    "f inan or n inan": "feminine inanimate neuter",
    "m inan pl or m anim pl": "masculine inanimate animate plural",
    "f inan or m inan": "feminine masculine inanimate",
    "f inan or m inan or f inan pl": "feminine masculine inanimate singular plural",
    "f inan or m inan or f inan pl or m inan pl": "feminine masculine inanimate singular plural",
    "m inan pl or m anim pl or f anim pl": "masculine feminine inanimate animate plural",
    "f anim or f inan or f anim pl": "feminine animate inanimate singular plural",
    "f anim or f inan or f anim pl or f inan pl": "feminine animate inanimate singular plural",
    "f anim pl or f inan or f inan pl": "feminine animate inanimate singular plural",  # XXX
    "f inan pl or f anim or f anim pl": "feminine inanimate animate singular plural",  # XXX
    "f anim or f anim pl or f inan": "feminine animate inanimate singular plural",
    "f anim or f anim pl or f inan or f inan pl": "feminine animate inanimate singular plural",
    "m anim pl or f anim pl": "masculine feminine animate plural",
    "m anim pl or f anim pl or f inan or f inan pl": "masculine animate plural feminine inanimate",
    "m anim pl or f anim pl or f inan": "masculine animate feminine plural inanimate singular",  # XXX
    "f anim pl or f inan pl": "feminine animate inanimate plural",
    "f anim pl or f inan pl or m anim pl": "feminine masculine animate inanimate plural",
    "m anim pl or f anim pl or f inan pl": "masculine animate feminine plural inanimate",  # XXX
    "f inan pl or m anim pl": "feminine masculine animate inanimate plural",
    "f inan pl or m anim pl or f anim pl": "masculine animate feminine plural inanimate",  # XXX
    "m anim or f anim or m anim pl": "masculine animate feminine singular plural",
    "m anim or f anim or m anim pl or f anim pl": "masculine animate feminine singular plural",
    "n inan or n anim or m inan or m anim": "neuter inanimate animate masculine",
    "m anim pl or f anim pl or m anim or f anim": "masculine animate plural feminine singular",
    "m anim pl or f inan or f inan pl": "masculine animate plural feminine inanimate singular",  # XXX
    "m anim or n inan": "masculine animate neuter inanimate",  # XXX
    "n inan pl or m inan or m inan pl": "neuter inanimate plural masculine singular plural",  # XXX
    "n inan pl or f inan or f inan pl": "neuter inanimate plural feminine singular",  # XXX
    "f inan pl or m anim or m anim pl": "feminine inanimate plural masculine animate singular",  # XXX
    "f inan pl or m inan or m inan pl": "feminine inanimate plural masculine singular",  # XXX
    "n anim or n inan or n anim pl or n inan pl": "neuter animate inanimate singular plural",
    "n anim pl or n inan or n inan pl": "neuter animate plural inanimate singular",  # XXX
    "n inan or n inan pl or f inan or f inan pl": "neuter inanimate singular plural feminine",
    "n inan pl or n anim or n anim pl": "neuter inanimate plural animate singular",  # XXX
    "n anim or n inan": "neuter animate inanimate",
    "pers": "person",  # XXX check what this really is used for? personal?
    "npers": "impersonal",
    "f pers": "feminine person",
    "m pers": "masculine person",
    "f pers or f pers pl": "feminine person singular plural",
    "m pers or m pers pl": "masculine person singular plural",
    "m pers or f pers": "masculine person feminine",
    "f pers or m pers": "feminine person masculine",
    "m pers or n pers": "masculine person neuter",
    "f pers or n pers": "feminine person neuter",
    "m pers or m anim": "masculine person animate",
    "m pers or m inan": "masculine person inanimate",
    "f pers or f anim": "feminine person animate",
    "f pers or f inan": "feminine person inanimate",
    # "m pers or f": "masculine person feminine",
    "m pers or f": "masculine person feminine animate inanimate",  # XXX
    "m pers or n": "masculine person neuter animate inanimate",  # XXX
    "m inan or m pers": "masculine inanimate person",
    "m or m pers or f": "masculine inanimate animate person feminine",  # XXX
    "m anim or m pers": "masculine animate person",
    "f anim or f pers": "feminine animate person",
    "n anim or n pers": "neuter animate person",
    "vir": "virile",
    "nvir": "nonvirile",
    "anml": "animal-not-person",
    "f anml": "feminine animal-not-person",
    "m anml": "masculine animal-not-person",
    "f animal": "feminine animal-not-person",
    "m animal": "masculine animal-not-person",
    "m animal or f animal": "masculine animal-not-person feminine",
    "f animal or m animal": "feminine animal-not-person masculine",
    "m anim or f": "masculine animate feminine inanimate",
    "impf": "imperfective",
    "impf.": "imperfective",
    "pf": "perfective",
    "pf.": "perfective",
    "impf or impf": "imperfective",
    "impf or pf": "imperfective perfective",  # ought/Eng/Tr/Serbo-Croatian
    "pf or impf": "perfective imperfective",  # start/Tr(of an activity)/Russian
    "invariable": "invariable",
    "n.": "noun",
    "v.": "verb",
    "adj.": "adjective",
    "adv.": "adverb",
    "adversative": "",
    "?": "",
    "1.": "first-person",
    "2.": "second-person",
    "3.": "third-person",
    "1": "class-1",
    "1a": "class-1a",
    "2": "class-2",
    "2a": "class-2a",
    "3": "class-3",
    "4": "class-4",
    "5": "class-5",
    "6": "class-6",
    "7": "class-7",
    "8": "class-8",
    "9": "class-9",
    "9a": "class-9a",
    "10": "class-10",
    "10a": "class-10a",
    "11": "class-11",
    "12": "class-12",
    "13": "class-13",
    "14": "class-14",
    "15": "class-15",
    "16": "class-16",
    "17": "class-17",
    "18": "class-18",
    "1/2": "class-1 class-2",
    "3/4": "class-3 class-4",
    "5/6": "class-5 class-6",
    "7/8": "class-7 class-8",
    "9/10": "class-9 class-10",
    "15/17": "class-15 class-17",
    "class 1/2": "class-1 class-2",
    "class 3/4": "class-3 class-4",
    "class 5/6": "class-5 class-6",
    "class 7/8": "class-7 class-8",
    "class 9/10": "class-9 class-10",
    "class 15/17": "class-15 class-17",
    "1 or 2": "class-1 class-2",
    "1a or 2a": "class-1a class-2a",
    "1a or 2": "class-1a class-2",
    "3 or 4": "class-3 class-4",
    "5 or 6": "class-5 class-6",
    "7 or 8": "class-7 class-8",
    "9 or 10": "class-9 class-10",
    "9a or 10a": "class-9a class-10a",
    "15 or 17": "class-15 class-17",
    "9/10 or 1/2": "class-9 class-10 class-1 class-2",
    # two/Tr/Kikuyu
    "2 or 4 or 6 or 13": "class-2 class-4 class-6 class-13",
    "8 or 10": "class-8 class-10",  # two/Tr/Kikuyu
    "11 or 10": "class-11 class-10",  # sea/Eng/Tr/Zulu
    "11 or 10a": "class-11 class-10a",  # half/Ngazidja Comorian
    "10 or 11": "class-10 class-11",  # mushroom/Tr/Swahili
    "11 or 14": "class-11 class-14",  # country/Tr/Swahili
    "11 or 12": "class-11 class-12",  # theater/Tr/Swahili
    "11 or 6": "class-11 class-6",  # leaf/'Maore Comorian
    "9 or 6": "class-9 class-6",  # birthday,carrot/Tr/Rwanda-Rundi
    # The key names class 1, so the value must too (it used to say class-2).
    "1 or 6": "class-1 class-6",  # Zulu/Tr/Zulu
    "6 or 7": "class-6 class-7",  # spider/Eng/Tr/Lingala ???
    "15 or 6": "class-15 class-6",  # leg/Tr/Rwanda-Rundi
    "14 or 6": "class-14 class-6",  # rainbow/Tr/Chichewa
    "9 or 9": "?class-9",  # XXX bedsheet/Tr/Sotho
    "m1": "masculine declension-1",
    "f2": "feminine declension-2",
    "m2": "masculine declension-2",
    "f3": "feminine declension-3",
    "m3": "masculine declension-3",
    "f4": "feminine declension-4",
    "m4": "masculine declension-4",
    "f5": "feminine declension-5",
    "m5": "masculine declension-5",
    "[uncountable]": "uncountable",
    "is more colloquial": "colloquial",
    "(plural f)": "masculine singular feminine-plural",  # XXX chromicas/Galician
    "(plural m)": "feminine singular masculine-plural",  # XXX Genseric/Galician
    "m (plural f)": "masculine singular feminine-plural",  # XXX chromicas/Galician
    "f (plural m)": "feminine singular masculine-plural",  # XXX Genseric/Galician
    "2 or 3": "?class-2 class-3",  # XXX branch/Tr/Swahili
    "m or impf": "masculine imperfective",  # pour/Tr/Ukrainian
    "f or impf": "feminine imperfective",  # fuc* around/Tr/(s with many)/Czech
    "n or impf": "neuter imperfective",  # glom/Russian
    "f or pf": "feminine perfective",
    "m or pf": "masculine perfective",
    "n or pf": "neuter perfective",
    "m or m": "?masculine",  # Paul/Tr(male given name)/Urdu
    "f or c pl": "?feminine common-gender singular plural",  # mulberry/Tr/Zazaki
    "c pl or n": "?common-gender neuter singular plural",  # mouthpiece/Tr/Swedish
    "pf or pf": "?perfective",
    "sg or sg": "?singular",
    "pl or pl": "?plural",
    "c or impf": "?common-gender imperfective",
    "m inan or n": "masculine inanimate neuter",
    "m inan or f": "masculine inanimate feminine",
    "pl or pf": "?plural perfective",
    "m pl or pf": "masculine plural perfective",
    "f pl or pf": "feminine plural perfective",
    "n pl or pf": "neuter plural perfective",
    "f pl or impf": "feminine plural imperfective",
    "m pl or impf": "masculine plural imperfective",
    "n pl or impf": "neuter plural imperfective",
    "m or f or impf": "?masculine feminine imperfective",
    "pl or m or f or n": "?plural masculine feminine neuter",
    "no perfect or supine stem": "no-perfect no-supine",
    "f inan or m anim or f anim": "masculine feminine animate inanimate",  # XXX KJ Composite tags??
    "f inan or f inan pl or f anim or f anim pl": "feminine inanimate plural animate",  # XXX
    "m anim or f anim or m anim pl or f anim pl or f inan or f inan pl": "masculine animate feminine plural singular inanimate",  # XXX
    "defunct": "archaic",  # flugu/Norwegian Nynorsk
    "mfpl": "masculine feminine plural",  # extrajudiciaires/French
    "class 1": "class-1",
    "class 1a": "class-1a",
    "class 2": "class-2",
    "class 2a": "class-2a",
    "class 3": "class-3",
    "class 4": "class-4",
    "class 5": "class-5",
    "class 6": "class-6",
    "class 7": "class-7",
    "class 8": "class-8",
    "class 9": "class-9",
    "class 9 or 10": "class-9 class-10",
    "class 9a": "class-9a",
    "class 10": "class-10",
    # Keep the "a" suffix, as "10a" and "class 9a" do (was "class-10").
    "class 10a": "class-10a",
    "class 11": "class-11",
    "class 12": "class-12",
    "class 13": "class-13",
    "class 14": "class-14",
    "class 15": "class-15",
    "class 16": "class-16",
    "class 17": "class-17",
    "class 18": "class-18",
    "class m-wa": "class-1 class-2",
    "class m-mi": "class-3 class-4",
    "class ma": "class-5 class-6",
    "class ki-vi": "class-7 class-8",
    "class n": "class-9 class-10",
    "class n/n": "class-9 class-10",
    "class u": "class-11 class-12 class-14",
    "class ku": "class-15",
    "class pa": "class-16",
    "class mu": "class-18",
    "m-wa class": "class-1 class-2",
    "m-mi class": "class-3 class-4",
    "ma class": "class-5 class-6",
    "ki-vi class": "class-7 class-8",
    "n class": "class-9 class-10",
    "u class": "class-11 class-12 class-14",
    "ku class": "class-15",
    "pa class": "class-16",
    "mu class": "class-18",
    "m or f by sense": "masculine feminine by-personal-gender",
    "superlative dubious": "",
    # пьянчужка/Russian
    "m anim or f anim by sense": "masculine feminine by-personal-gender",
    "m pl or f pl by sense": "masculine feminine plural by-personal-gender",
    "m pers or f pers by sense": "masculine feminine personal by-personal-gender",
    "gender m": "masculine",  # nene/Abau
    "gender f": "feminine",  # just for completion's sake
    "gender mf": "masculine feminine",
    "class I": "class-i",
    "class II": "class-ii",
    "class III": "class-iii",
    "class IV": "class-iv",
    "class V": "class-v",
    "class VI": "class-vi",
    "class VII": "class-vii",
    "class VIII": "class-viii",
    "class IX": "class-ix",
    "class X": "class-x",
    "class XI": "class-xi",
    "class XII": "class-xii",
    "class XIII": "class-xiii",
}

412 

413# Languages that can have head-final numeric class indicators. They are mostly 

414# used in Bantu languages. We do not want to interpret them at the ends of 

415# words like "Number 11"/English. Also, some languages have something like 

416# "stress pattern 1" at the end of word head, which we also do not want to 

417# interpret as class-1. 

head_final_numeric_langs = {
    # Language names, listed alphabetically, whose word heads may end in a
    # numeric class indicator.
    "Bende", "Chichewa", "Chimwiini",
    "Dyirbal",  # Australian aboriginal, uses class-4 etc
    "Kamba", "Kikuyu", "Lingala", "Luganda",
    "Maore Comorian", "Masaba", "Mwali Comorian", "Mwani",
    "Ngazidja Comorian", "Northern Ndebele", "Nyankole",
    "Phuthi", "Proto-Bantu", "Rwanda-Rundi",
    "Shona", "Sotho", "Southern Ndebele", "Swahili", "Swazi",
    "Tsonga", "Tswana", "Tumbuka",
    "Xhosa", "Zulu", "ǃXóõ",
}

449 

450# Languages for which to consider head_final_bantu_map

# XXX should other Bantu languages be included here? Which ones use
# suffixes such as "m or wa"?
head_final_bantu_langs = {"Swahili"}

456 

head_final_bantu_map = {
    # These are only handled in parse_head_final_tags
    # and will generally be ignored elsewhere. These may contain spaces.
    # Swahili class indications.
    "m or wa": "class-1 class-2",
    "m or mi": "class-3 class-4",
    "ma": "class-5 class-6",
    "ki or vi": "class-7 class-8",
    "n": "class-9 class-10",
    "class u": "class-11 class-12 class-14",
    "u": "class-11 class-12 class-14",
    "ku": "class-15",
    "pa": "class-16",
    "mu": "class-18",
    "n or n": "class-9 class-10",  # Andromeda/Eng/Tr/Swahili etc
    "u or u": "class-11 class-14",  # wife/Eng/Tr/Swahili
    "class 1": "class-1",
    "class 1a": "class-1a",
    "class 2": "class-2",
    "class 2a": "class-2a",
    "class 3": "class-3",
    "class 4": "class-4",
    "class 4/none": "class-4 no-plural",
    "class 5": "class-5",
    "class 6": "class-6",
    "class 7": "class-7",
    "class 8": "class-8",
    "class 9": "class-9",
    "class 9/10": "class-9 class-10",
    "class 9/10/1/2": "class-9 class-10 class-1 class-2",
    "class 9/10c": "class-9 class-10",
    "class 9/c10": "class-9 class-10",
    "class IX/X": "class-9 class-10",
    "class 9a": "class-9a",
    "class 10": "class-10",
    "class 10/11": "class-10 class-11",
    # Keep the "a" suffix, as "class 9a" does (was "class-10").
    "class 10a": "class-10a",
    "class 11": "class-11",
    "class 11/12": "class-11 class-12",
    "class 11/10": "class-10 class-11",
    # The key says 10a, so the "a" suffix is kept (was "class-10 class-11").
    "class 11/10a": "class-11 class-10a",
    # The key names class 11, not class 10 (was "class-10 class-14").
    "class 11/14": "class-11 class-14",
    "class 12": "class-12",
    "class 13": "class-13",
    "class 14": "class-14",
    "class 15": "class-15",
    "class 16": "class-16",
    "class 17": "class-17",
    "class 18": "class-18",
    "class m-wa": "class-1 class-2",
    "class m/wa": "class-1 class-2",
    "class m-mi": "class-3 class-4",
    "class m/mi": "class-3 class-4",
    "class ma": "class-5 class-6",
    "class ki-vi": "class-7 class-8",
    "class ki/vi": "class-7 class-8",
    "class n": "class-9 class-10",
    "class n/n": "class-9 class-10",
    "class u/zi": "class-11 class-10",
    "class u/u": "class-11 class-12 class-14",
    "class ku": "class-15",
    "class pa": "class-16",
    "class mu": "class-18",
    "m-wa class": "class-1 class-2",
    "m-mi class": "class-3 class-4",
    "ma class": "class-5 class-6",
    "ki-vi class": "class-7 class-8",
    "n class": "class-9 class-10",
    "u class": "class-11 class-12 class-14",
    "ku class": "class-15",
    "pa class": "class-16",
    "mu class": "class-18",
}

530 

# Language names paired with head_final_semitic_map.
# NOTE(review): presumably the map is only consulted for these languages,
# mirroring head_final_bantu_langs -- confirm against the parsing code.
head_final_semitic_langs = {
    "Akkadian", "Amharic", "Arabic", "Aramaic",
    "Eblaite", "Hebrew", "Hijazi Arabic",
    "Maltese", "Moroccan Arabic",
    "Phoenician", "South Levantine Arabic",
    "Tigre", "Tigrinya", "Ugaritic",
}

547 

# Maps a head-final Roman-numeral marker (optionally followed by "q") to
# the tag "form-" plus the lowercased marker, e.g. "IIq" -> "form-iiq".
head_final_semitic_map = {
    numeral: "form-" + numeral.lower()
    for numeral in (
        "I", "II", "III", "IV", "V", "VI", "VII",
        "VIII", "IX", "X", "XI", "XII", "XIII",
        "Iq", "IIq", "IIIq", "IVq",
    )
}

567 

# Language names paired with head_final_other_map. Written as a set literal
# rather than set([...]) so no intermediate list is built; the contents are
# unchanged.
head_final_other_langs = {
    "Finnish",
    "French",
    "Lithuanian",
    "Arabic",
    "Armenian",
    "Zazaki",
    "Hebrew",
    "Hijazi Arabic",
    "Moroccan Arabic",
    "Nama",
    "Old Church Slavonic",
    "Gothic",
    "Old Irish",
    "Latin",
    "Scottish Gaelic",
    "Slovene",
    "Sorbian",
    "South Levantine Arabic",
    "Kajkavian",
    "Chakavian",
    "Croatian",  # Kajkavian and Chakavian are forms of Croatian
    "Sanskrit",
    "Ancient Greek",
    # XXX For dual??? see e.g. route/Tr(course or way)/Polish
    "Dyirbal",
    "Egyptian",
    "Maltese",
    "Maori",
    "Polish",
    "Portuguese",
    "Romanian",  # cache,acquaintance/Tr/Romanian
    "Ukrainian",
    "Ugaritic",
    "Russian",
    "Galician",
}

607 

head_final_other_map = {
    # Used in Finnish at the end of some word forms (in translations?)
    "in indicative or conditional mood": "in-indicative in-conditional",
    # marine/French Derived terms
    "f colloquial form of a feminine marin": "feminine colloquial",
    # Lithuanian stress pattern indicators, first written as
    # "stress pattern N" and then as "stress pattern: N".
    **{
        f"stress pattern{sep} {pattern}": f"stress-pattern-{pattern}"
        for sep in ("", ":")
        for pattern in ("1", "2", "3", "3a", "3b", "4")
    },
    # The entries below are specific to Arabic, Armenian, Zazaki, Hebrew,
    # Nama, Old Church Slavonic, Gothic, Old Irish, Latin, Scottish Gaelic,
    # Slovene, Sorbian, Kajkavian, Chakavian, (Croatian), Sanskrit and
    # Ancient Greek (generally languages with a dual number).
    "du": "dual",
    "du or pl": "dual plural",  # aka duoplural
    "m du": "masculine dual",
    "f du": "feminine dual",
    "n du": "neuter dual",
    "m du or f du": "masculine feminine dual",  # yellow/Tr/Zazaki
    "f du or m du": "feminine masculine dual",
    "n du or n pl": "neuter dual plural",
    "f du or f pl": "feminine dual plural",
    "m du or m pl": "masculine dual plural",
    "du or f du or n": "?",  # XXX guest/Tr/Zazaki
    "du or n or pf": "?",  # XXX how would this be expressed
    "du or n du": "neuter dual",  # bilberry/Tr/Zazaki
    "pl or pf": "?plural perfective",  # walk/Tr(to steal)/Russian
    "m or pf": "?masculine perfective",  # boom/Tr(make book)/Russian
    "n or n du": "neuter singular dual",
    # XXX clump/Tr/Portuguese
    "sg or m du": "singular feminine neuter masculine dual",
    "m du or f du or n du": "masculine dual feminine neuter",
    "du or m": "?dual masculine",
    "(plural f)": "singular plural feminine",  # XXX chromicas/Galician
    "(plural m)": "singular plural masculine",  # XXX Genseric/Galician
}

654 

655# Accepted uppercase tag values. As tags these are represented with words 

656# connected by hyphens. These are classified as dialect tags; if an uppercase

657# tag is not a dialect tag, then it should be listed separately in valid_tags.

658uppercase_tags = { 

659 "A Estierna", 

660 "AF", # ??? what does this mean 

661 "ALUPEC", 

662 "ASL gloss", # Used with sign language heads 

663 "Aargau", 

664 "Abagatan", 

665 "Absheron", 

666 "Abung/Kotabumi", 

667 "Abung/Sukadana", 

668 "Abzakh", 

669 "Acadian", 

670 "Achaemenid", 

671 "Achterhooks", 

672 "Adana", 

673 "Adyghe", 

674 "Aeolic", # Ancient Greek 

675 "Affectation", 

676 "Afi-Amanda", 

677 "Africa", 

678 "African-American Vernacular English", 

679 "Afrikaans", 

680 "Afyonkarahisar", 

681 "Agdam", 

682 "Ağrı", 

683 "Akhmimic", 

684 "Aknada", 

685 "Al-Andalus", 

686 "Ala-Laukaa", 

687 "Alak", 

688 "Alemannic", # Variant of German 

689 "Alemannic German", # Variant of German 

690 "Algherese", 

691 "Alles", 

692 "Alliancelles", 

693 "Alsace", 

694 "Alsatian", 

695 "Alviri", # Variant of Alviri-Vidari 

696 "Amecameca", 

697 "American continent", 

698 "Americanization", 

699 "Amerindish", 

700 "Amianan", 

701 "Amira", 

702 "Amrum", 

703 "Amur", 

704 "Anbarani", # Variant of Talysh 

705 "Ancient", 

706 "Ancient China", 

707 "Ancient Egyptian", 

708 "Ancient Greek", 

709 "Ancient Rome", 

710 "Ancient Roman", 

711 "Andalusia", 

712 "Anglian", 

713 "Anglicised", 

714 "Anglicism", 

715 "Anglism", 

716 "Anglo-Latin", 

717 "Anglo-Norman", 

718 "Angola", 

719 "Aniwa", 

720 "Anpezan", # Variant of Ladin 

721 "Antalya", 

722 "Antanosy", 

723 "Antilles", 

724 "Appalachia", 

725 "Appalachian", 

726 "Arabicized", 

727 "Aragon", 

728 "Aragón", 

729 "Aramaic", 

730 "Aran", 

731 "Aranese", 

732 "Arango", 

733 "Arawak", 

734 "Arbëresh", 

735 "Arcadocypriot", # Ancient Greek 

736 "Ardennes", 

737 "Argentina", 

738 "Arkhangelsk", 

739 "Armenia", 

740 "Aromanian", 

741 "Aruba", 

742 "Asalem", 

743 "Asalemi", # Variant of Talysh 

744 "Asante", 

745 "Ashkenazi Hebrew", 

746 "Asturias", 

747 "Atlantic Canada", 

748 "Atlapexco", 

749 "Attic", # Ancient greek 

750 "Aukštaitian", 

751 "Australia", 

752 "Australian", 

753 "Austria", 

754 "Austrian", 

755 "Auve", 

756 "Auvernhàs", # Dialect of Occitan 

757 "Avignon", 

758 "Ayer", 

759 "Ayt Ndhir", 

760 "Azerbaijani", 

761 "Azores", 

762 "Baan Nong Duu", 

763 "Babia", 

764 "Bacheve", 

765 "Badiot", # Variant of Ladin 

766 "Badiu", 

767 "Baghdad", 

768 "Bahamas", 

769 "Bahasa Baku", 

770 "Bahia", 

771 "Baku", 

772 "Balearic", 

773 "Balkar", 

774 "Baltic-Finnic", 

775 "Bamu", 

776 "Banatiski Gurbet", 

777 "Banawá", 

778 "Bangkok", 

779 "Bangladesh", # bhai/English 20241113 

780 "Banten", 

781 "Banyamasan", 

782 "Barbados", 

783 "Barda", 

784 "Bardez Catholic", 

785 "Barlavento", 

786 "Basel", 

787 "Bashkir", 

788 "Basque", 

789 "Batang", 

790 "Batangas", 

791 "Bavaria", 

792 "Bavarian", 

793 "Baxter Sagart", # a reconstruction of Old Chinese pronunciation 

794 "Beijing", 

795 "Belalau", 

796 "Belarusian", 

797 "Belgium", 

798 "Belize", 

799 "Bentheim", 

800 "Bering Straits", # Inupiaq language 

801 "Berlin", 

802 "Berlin-Brandenburg", 

803 "Bern", 

804 "Beru", 

805 "Bezhta", 

806 "Bharati braille", 

807 "Biblical Hebrew", 

808 "Biblical", 

809 "Bikol Legazpi", 

810 "Bikol Naga", 

811 "Bikol Tabaco", 

812 "Bilasuvar", 

813 "Bimenes", 

814 "Biscayan", 

815 "Bla-Brang", 

816 "Bo Sa-ngae", 

817 "Bodega", 

818 "Bogota", 

819 "Boharic", # XXX is this typo of Bohairic? fruit/Tr/part of plant/Coptic 

820 "Bohairic", 

821 "Bohemia", 

822 "Boholano", 

823 "Bokmål", # Variant of Norwegian 

824 "Bolivia", 

825 "Bologna", 

826 "Bolognese", 

827 "Bombay", 

828 "Borneo", 

829 "Boro", 

830 "Bosnia Croatia", 

831 "Bosnia", 

832 "Bosnian", 

833 "Bosnian Croatian", 

834 "Bosnian Serbian", 

835 "Boston", 

836 "Botswana", 

837 "Brabant", 

838 "Brabantian", 

839 "Braintree", # Place in UK? 

840 "Brazil", 

841 "Brazilian", 

842 "Bressan", 

843 "Brest", 

844 "Britain", 

845 "British", 

846 "British airforce", 

847 "British Army", 

848 "British Columbia", 

849 "British Isles", 

850 "British Royal Navy", 

851 "Brunei", 

852 "Bugey", 

853 "Bugurdži", 

854 "Bukovina", 

855 "Bulgaria", 

856 "Bulgarian", 

857 "Busan", 

858 "Bushehr", 

859 "Burdur", 

860 "Burgenland", 

861 "Bygdeå", 

862 "Byzantine", # Ancient Greek 

863 "Bzyb", 

864 "Béarn", 

865 "cabo Verde", 

866 "CJK tally marks", 

867 "Cabrales", 

868 "Caipira", 

869 "Caithness", 

870 "California", 

871 "Campello Monti", 

872 "Campidanese", # Variant of Sardinian 

873 "Canada", 

874 "Canadian", 

875 "Canadian English", 

876 "Canadian French", 

877 "Canadian Prairies", 

878 "Canado-American", 

879 "Canary Islands", 

880 "Cangas del Narcea", 

881 "Cantonese", # Chinese dialect/language 

882 "Cape Afrikaans", 

883 "Carakan", 

884 "Carcoforo", 

885 "Caribbean", 

886 "Carioca", 

887 "Carpi", 

888 "Castilian Spanish", 

889 "Castilian", 

890 "Catalan", 

891 "Catalan-speaking bilingual areas mostly", 

892 "Catalonia", 

893 "Catholic", 

894 "Cebu", 

895 "Cebuano", 

896 "Central America", 

897 "Central Apulia", 

898 "Central Asia", 

899 "Central Scots", 

900 "Central Sweden", 

901 "Central and Southern Italy", 

902 "Central", 

903 "Chakavian", 

904 "Changuena", 

905 "Changsha", 

906 "Changtai", 

907 "Chanthaburi", 

908 "Chazal", # Jewish historical sages 

909 "Chengdu", 

910 "Chiconamel", 

911 "Chicontepec", 

912 "Child US", 

913 "Chile", 

914 "China", 

915 "Chinese Character classification", 

916 "Cholula", 

917 "Chongqing", 

918 "Choral Doric", # Ancient Greek 

919 "Christian", 

920 "Chugoku", 

921 "Chūgoku", 

922 "Chumulu", 

923 "Church of England", 

924 "Cieszyn Silesia", 

925 "Cincinnati", 

926 "Cismontane", # Corsican dialect 

927 "Classical", # Variant of several languages, e.g., Greek, Nahuatl 

928 "Classical Attic", 

929 "Classical Chinese", 

930 "Classical Edessan", 

931 "Classical Indonesian", 

932 "Classical K'Iche", 

933 "Classical Latin", 

934 "Classical Persian", 

935 "Classical Sanskrit", 

936 "Classical Syriac", 

937 "Classical studies", 

938 "Clay", 

939 "Closed ultima", 

940 "Coastal Min", 

941 "Cockney", 

942 "Cois Fharraige", 

943 "Cois Fharraige", 

944 "Colombia", 

945 "Colunga", 

946 "Common accent", 

947 "Commonwealth", 

948 "Congo", 

949 "Congo-Kinshasa", 

950 "Connacht", 

951 "Connemara", 

952 "Contentin", 

953 "Continent", 

954 "Copenhagen", 

955 "Corinthian", # Ancient Greek 

956 "Cork", 

957 "Cornish", 

958 "Cornwall", 

959 "Counting rod", 

960 "Costa Rica", 

961 "Cotentin", 

962 "Crimea", 

963 "Croatia", 

964 "Croatian", 

965 "Cu'up", # Region in Indonesia (Rejang language) 

966 "Cuarto de los Valles", 

967 "Cuba", 

968 "Cuisnahuat", 

969 "Cumbria", 

970 "Cuoq", 

971 "Cusco", 

972 "Cypriot", 

973 "Cyprus", 

974 "Czech", 

975 "Czech Republic", 

976 "Čakavian", 

977 "DR Congo", 

978 "Dalmatia", 

979 "Dalinpu", 

980 "Dananshan Miao", 

981 "Dankyira", 

982 "Dari", 

983 "Dashtestan", 

984 "Dauphinois", 

985 "Daya", 

986 "Daytshmerish", 

987 "De'kwana", 

988 "Debri", 

989 "Deh Sarv", 

990 "Deirate", 

991 "Delhi", 

992 "Delhi Hindi", 

993 "Demotic", # Greek/Ancient Greek 

994 "Denizli", 

995 "Derbyshire", 

996 "Devon", 

997 "Digor", # Variant of Ossetian 

998 "Dingzhou", 

999 "Dissenter", 

1000 "Dithmarsisch", 

1001 "Diyarbakır", 

1002 "Dominican Republic", 

1003 "Dominican Republic", 

1004 "Dongmen", 

1005 "Doric", # Ancient Greek 

1006 "Drasi", # Region in India 

1007 "Draweno-Polabian", 

1008 "Drents", 

1009 "Dundee", 

1010 "Dungan", 

1011 "Durham", 

1012 "Dutch", 

1013 "Dêgê", 

1014 "Džáva", 

1015 "EU", 

1016 "Early Middle English", 

1017 "Early Modern Greek", 

1018 "Early", 

1019 "East Anglia", 

1020 "East Armenian", 

1021 "East Bengal", 

1022 "East Coast", 

1023 "East Frisian", 

1024 "East Midlands", 

1025 "East Slovakia", 

1026 "East", 

1027 "Eastern Armenian", 

1028 "Eastern Lombard", 

1029 "Eastern New England", 

1030 "Eastern Punjabi", 

1031 "Eastern Syriac", 

1032 "Eastern", 

1033 "Ecclesiastical", 

1034 "Ectasian", 

1035 "Ecuador", 

1036 "Ecuadorian Kichwa", 

1037 "Edirne", 

1038 "Egypt", 

1039 "Egyptian Arabic", # Variant of Arabic 

1040 "Egyptiot", 

1041 "Ekagongo", 

1042 "Ekavian", 

1043 "El Salvador", 

1044 "Elazığ", 

1045 "Elberfelder Bibel", 

1046 "Elean", # Ancient Greek 

1047 "England", 

1048 "English Midlands", 

1049 "English", 

1050 "Eonavian", 

1051 "Epic", 

1052 "Epigraphic Gandhari", 

1053 "Epirote", # Ancient Greek 

1054 "Erhua", # Northern Chinese dialectal feature 

1055 "Erzgebirgisch", 

1056 "Esham", 

1057 "Esperantized", 

1058 "Esperanto", 

1059 "Essex", # Region in UK 

1060 "Estonian", 

1061 "Estuary English", 

1062 "Europe", 

1063 "European", 

1064 "European Union", 

1065 "European ortography", 

1066 "Eurozone", 

1067 "Fante", 

1068 "Faroese", 

1069 "Fars", 

1070 "Fascian", # Variant of Ladin 

1071 "Fayyumic", # Variant of Coptic 

1072 "Fengkai", 

1073 "Finglish", # Finnish word taken from English / American Finnish dialect 

1074 "Finland", 

1075 "Fjolde", 

1076 "Flanders", 

1077 "Flemish", 

1078 "Florida", 

1079 "Fluminense", 

1080 "Fodom", # Variant of Ladin 

1081 "For transcription only", 

1082 "Formazza", 

1083 "Fountain", 

1084 "Fragoria vesca", 

1085 "France Quebec", 

1086 "France", 

1087 "Fredrikstad", 

1088 "French", 

1089 "Frenchified", 

1090 "Fribourg", 

1091 "Friulian", 

1092 "From Old Northern French", 

1093 "Föhr", 

1094 "Föhr-Amrum", 

1095 "Fuzhou", 

1096 "Gadabay", 

1097 "Gaellic", 

1098 "Galgolitic", 

1099 "Galicia", 

1100 "Galician", 

1101 "Galitzish", 

1102 "Galway", 

1103 "Gan", # Variant of Chinese 

1104 "Gangwon", # Dialect/region for Korean 

1105 "Gascon", # Dialect of Occitan 

1106 "Gascony", 

1107 "Gaspésie", 

1108 "Gaúcho", 

1109 "Gelders", 

1110 "General American", 

1111 "General Australian", 

1112 "General Brazilian", 

1113 "General Cebuano", 

1114 "General New Zealand", 

1115 "General South African", 

1116 "Genoa", 

1117 "Genoese", 

1118 "Genovese", 

1119 "Geordie", 

1120 "Georgia", 

1121 "German", 

1122 "German Low German", 

1123 "Germanic", 

1124 "Germany", 

1125 "Gheg", 

1126 "Gherdëina", # Variant of Ladin 

1127 "Gipuzkoan", 

1128 "Glarus", 

1129 "Goan Konkani", 

1130 "Goerdie", 

1131 "Goeree-Overflakkee", 

1132 "Gope", 

1133 "Gorj", 

1134 "Goth", 

1135 "Gothenburg", 

1136 "Gotland", 

1137 "Goud Saraswat", 

1138 "Grecian", 

1139 "Greco-Bohairic", 

1140 "Greco-Roman", 

1141 "Greek Catholic", 

1142 "Greek-type", # Used to characterize some Latin words e.g. nematodes/Latin 

1143 "Gressoney", 

1144 "Grischun", 

1145 "Grisons", 

1146 "Groningen", 

1147 "Gronings", 

1148 "Guadeloupean", 

1149 "Gualaca", 

1150 "Guatemala", 

1151 "Guangdong", 

1152 "Guangzhou", 

1153 "Guernsey", 

1154 "Gufin", 

1155 "Guichicovi", 

1156 "Guinea-Bissau", 

1157 "Guinée Conakry", 

1158 "Gulf Arabic", # Variant of Arabic Language 

1159 "Gurbet", 

1160 "Gurvari", 

1161 "Guyana", 

1162 "Gwichya", 

1163 "Gyeongsang", # Province in South Korea 

1164 "H-system", 

1165 "Ha", 

1166 "Hachijō", 

1167 "Hainanese", 

1168 "Haketia", 

1169 "Hakka", # Chinese dialect/language 

1170 "Halchighol", 

1171 "Hallig", 

1172 "Halligen", 

1173 "Hamburg", 

1174 "Hamgyong", # Region and former province in Korea 

1175 "Hangaza", 

1176 "Hanoi", 

1177 "Hanyuan", 

1178 "Harak", 

1179 "Harat", 

1180 "Harry Potter", 

1181 "Hawaii", 

1182 "Hawick", 

1183 "Hán tự", 

1184 "Hebei", # China 

1185 "Hejazi Arabic", # Variant of Arabic Language 

1186 "Hejazi", 

1187 "Helgoland", # Variant of North Frisian 

1188 "Heligoland", 

1189 "Heligolandic", 

1190 "Hellenizing School", 

1191 "Hevaha", 

1192 "Hianacoto", 

1193 "Hiberno-English", 

1194 "Hijazi", # Variant of Arabic 

1195 "Hijazi Arabic", # Variant of Arabic 

1196 "Hinduism", 

1197 "Hinglish", # babu/English 20241113 

1198 "Hokkien", # Chinese dialect/language 

1199 "Honduras", 

1200 "Hong Kong", 

1201 "Hongmaogang", 

1202 "Hong'an", 

1203 "Hoanya", 

1204 "Hometwoli", 

1205 "Hongfeng", 

1206 "Hosso", 

1207 "Hsinchu Hokkien", # Chinese dialect/language 

1208 "Hua", 

1209 "Huizhou", 

1210 "Hui'an", 

1211 "Hungarian Vend", 

1212 "Huế", 

1213 "Hyōgai", # Uncommon type of Kanji character 

1214 "Hà Nội", # Vietnamese dialect 

1215 "Hà Tĩnh", # Vietnamese dialect 

1216 "Hössjö", 

1217 "Hồ Chí Minh City", 

1218 "I Ching hexagram", 

1219 "I-I", # Used in some Dungan nouns; I have no idea what this means 

1220 "Ionic", # Ancient Greek 

1221 "IUPAC", 

1222 "Iberian", 

1223 "Ibero-Romance", 

1224 "Iceland", 

1225 "İçel", 

1226 "Ikavian", 

1227 "Ijekavian", 

1228 "Ijekavian/Ekavian", 

1229 "Ilir", 

1230 "In conjunct consonants", 

1231 "Inari", # Variant of Sami 

1232 "India", 

1233 "Indian English", 

1234 "Indo-Aryan linguistics", 

1235 "Indo-European studies", 

1236 "Indonesia", 

1237 "Inkhokwari", 

1238 "Inland Min", 

1239 "Inland Northern American", 

1240 "Inner Mongolia", 

1241 "Insular Scots", 

1242 "Insular", 

1243 "Interlingua", 

1244 "Internet", 

1245 "Inuvialuktun", 

1246 "Iran", 

1247 "Iranian", 

1248 "Iranian Persian", 

1249 "Iraq", 

1250 "Iraqi Hebrew", 

1251 "Ireland", 

1252 "Irish", 

1253 "Iron", # Variant of Ossetian 

1254 "Isfahan", 

1255 "Isparta", 

1256 "Israel", 

1257 "Issime", 

1258 "Istanbul", 

1259 "Italian Hebrew", 

1260 "Italy", 

1261 "Iyaric", 

1262 "Izalco", 

1263 "İzmit", 

1264 "Jabung", 

1265 "Jainism", 

1266 "Jakarta", 

1267 "Jalalabad", 

1268 "Jalilabad", 

1269 "Jalnguy", 

1270 "Jamaica", 

1271 "Jamaican", 

1272 "Jamaican creole", 

1273 "Japan", 

1274 "Japurá", 

1275 "Jarawara", 

1276 "Jazan", 

1277 "Jáva", 

1278 "Jehovah's Witnesses", 

1279 "Jèrriais", 

1280 "Jeolla", # Province in South Korea 

1281 "Jersey", 

1282 "Jewish Aramaic", 

1283 "Jewish Babylonian Aramaic", 

1284 "Jewish Palestinian Aramaic", 

1285 "Jewish", 

1286 "Jianghuai Mandarin", # Chinese dialect/language 

1287 "Jian'ou", # Chinese dialect 

1288 "Jicalapa", 

1289 "Jicarilla", # Variant of the Apache Language? 

1290 "Jilu Mandarin", # Dialect/Language in Chinese 

1291 "Jin", 

1292 "Jin Mandarin", # Chinese dialect/language 

1293 "Jinjiang Hokkien", # Chinese dialect/language 

1294 "Jinjiang", 

1295 "Johannesburg", 

1296 "Johor-Selangor", 

1297 "Johore", 

1298 "Judaism", 

1299 "Judeo-French", 

1300 "Kabul", 

1301 "Kabuli", 

1302 "Kadaru", 

1303 "Kagoshima", 

1304 "Kaipi", 

1305 "Kaiwaligau Ya", 

1306 "Kajkavian", 

1307 "Kalaw Kawaw Ya", 

1308 "Kalaw Lagaw Ya", 

1309 "Kalbajar", 

1310 "Kalderaš", 

1311 "Kalianda", 

1312 "Kaliarda", 

1313 "Kalix", 

1314 "Kaluga", 

1315 "Kamino", 

1316 "Kampong Ayer", 

1317 "Kamrupi", 

1318 "Kamviri", 

1319 "Kanchanaburi", 

1320 "Kandahar", 

1321 "Kansai", 

1322 "Kanto", 

1323 "Kaohsiung", 

1324 "Kaohsiung Hokkien", # Chinese dialect/language 

1325 "Karabakh", 

1326 "Karachay", 

1327 "Karanga", 

1328 "Karwari", 

1329 "Kasuweri", 

1330 "Katharevousa", 

1331 "Kautokeino", 

1332 "Kayseri", 

1333 "Kayu Agung", 

1334 "Kayu Agung Asli", 

1335 "Kayu Agung Pendatang", 

1336 "Kaw Kyaik", 

1337 "Kazakh", 

1338 "Kazerun", 

1339 "Kazym", 

1340 "Kedayan", 

1341 "Kent", 

1342 "Kentish", 

1343 "Kenya", 

1344 "Kernewek Kemmyn", 

1345 "Kernowek Standard", 

1346 "Kerry", 

1347 "Kfar Kama", # Region in Israel 

1348 "Khesht", 

1349 "Khojavend", 

1350 "Khorasan", 

1351 "Khoshar-Khota", 

1352 "Khun villages", 

1353 "Kiambu", 

1354 "Kidero", 

1355 "Kinmen Hokkien", 

1356 "Kinmen", 

1357 "Kinshasa", 

1358 "Kinyarwanda", 

1359 "Kirundi", 

1360 "Klang", 

1361 "Kobuk", # Inupiaq 

1362 "Koine", # Ancient Greek 

1363 "Konartakhteh", 

1364 "Kong Loi village", 

1365 "Kong Loi villages", 

1366 "Konya", 

1367 "Koryo-mar", 

1368 "Kosovo", 

1369 "Kosovo Arli", 

1370 "Kota Agung", 

1371 "Krui", 

1372 "Kulkalgau Ya", 

1373 "Kurdamir", 

1374 "Kuritiba", 

1375 "Kursk", 

1376 "Kuwait", 

1377 "Kuwaiti Gulf Arabic", # Variant of Arabic Language 

1378 "Kuzarg", 

1379 "Kyoto", 

1380 "Kyrgyz", 

1381 "Kyūshū", 

1382 "Kwantlada", 

1383 "Kölsch", 

1384 "LÚ", 

1385 "La Up village", 

1386 "Lamphun Province", 

1387 "Languedoc", 

1388 "Late Bohairic", 

1389 "Late Egyptian", 

1390 "Late Latin", 

1391 "Late Middle English", 

1392 "Late Old French", 

1393 "Late Old Frisian", 

1394 "Late West Saxon", 

1395 "Late", 

1396 "Later poetic Ancient Greek", # Ancient Greek 

1397 "Latin America", 

1398 "Latinate", 

1399 "Latinism", 

1400 "Latium", 

1401 "Latvian", 

1402 "Laval", 

1403 "Lavarone", 

1404 "Lebanese Arabic", # Variant of Arabic language 

1405 "Lebong", # Region in Indonesia/Sumatra? (Rejang language) 

1406 "Leet", # Leetspeak, an internet "slang" 

1407 "Legazpi", 

1408 "Leizhou Min", # Chinese dialect/language 

1409 "Lemosin", # Dialect of Occitan 

1410 "Lengadocian", # Dialect of Occitan 

1411 "Lesbian", # Ancient Greek 

1412 "Lesotho", 

1413 "Levantine Arabic", # Variant of Arabic language 

1414 "Lewis", 

1415 "Leyte", 

1416 "Lhasa", 

1417 "Liechtenstein", 

1418 "Limba Sarda Comuna", 

1419 "Limburg", 

1420 "Limburgish", 

1421 "Limousin", 

1422 "Limuru", 

1423 "Linnaeus", 

1424 "Lippisch", 

1425 "Lisan ud-Dawat", 

1426 "Listuguj", 

1427 "Literary affectation", 

1428 "Lithuania", 

1429 "Lithuanian", 

1430 "Litvish", 

1431 "Liverpudlian", 

1432 "Llanos", 

1433 "Locrian", # Ancient Greek 

1434 "Logudorese", # Variant of Sardinian 

1435 "Lojban", 

1436 "Loli", 

1437 "Lombardy", 

1438 "London", 

1439 "Longyan Min", # Variant of Chinese 

1440 "Lorraine", 

1441 "Louisiana", 

1442 "Lovara", 

1443 "Low Prussian", 

1444 "Low Sorbian", 

1445 "Lower Sorbian", 

1446 "Lubunyaca", 

1447 "Lukang Hokkien", 

1448 "Lukang", 

1449 "Luleå", 

1450 "Lunfardo", 

1451 "Luserna", 

1452 "Luxembourg", 

1453 "Luxembourgish", 

1454 "Lycopolitan", 

1455 "Lyon", 

1456 "Lyons", 

1457 "Lyric Ancient Greek", # Ancient Greek 

1458 "Lviv", 

1459 "Lövånger", 

1460 "Ḷḷena", 

1461 "Łowicz", 

1462 "M.O.D.", # Used as head form in Marshallese 

1463 "Maastrichtian", 

1464 "Macau", 

1465 "Macedonia", 

1466 "Macedonian", 

1467 "Macedonian Arli", 

1468 "Macedonian Džambazi", 

1469 "Mackem", 

1470 "Madeira", 

1471 "Maharashtra", 

1472 "Mahuizalco", 

1473 "Maiak", 

1474 "Maine", 

1475 "Mainland China", 

1476 "Malacatepec", 

1477 "Malak", 

1478 "Malayalam", 

1479 "Malaysia", 

1480 "Malaysia Hokkien", 

1481 "Malaysian English", 

1482 "Mallorca", 

1483 "Malta", 

1484 "Malyangapa", 

1485 # [ used in Kipchak entries e.g. {{head|qwm|noun|tr=aχ as}} {{tlb|qwm|Armeno-Kipchak}} 

1486 "Armeno-Kipchak", 

1487 "Armenian Kipchak", 

1488 "Mamluk-Kipchak", 

1489 "Mamluk", 

1490 # ] 

1491 "Mandalay Taishanese", 

1492 "Mandarin", # Dialect/Language in Chinese 

1493 "Mandi", 

1494 "Manglish", 

1495 "Manichaean", 

1496 "Manicoré", 

1497 "Manitoba Saulteux", 

1498 "Mantua", 

1499 "Manyika", 

1500 "Marathi", 

1501 "Martinican", 

1502 "Martinican Creole", 

1503 "Marwari", 

1504 "Mary-marry-merry distinction", 

1505 "Mary-marry-merry merger", 

1506 "Marxism", 

1507 "Masarm", 

1508 "Maharastri Prakrit", 

1509 "Mauritania", 

1510 "Mawakwa", 

1511 "Mayo", 

1512 "Mecayapan", # Variant of Nahuatl 

1513 "Mecklenburg-Vorpommern", 

1514 "Mecklenburgisch", 

1515 "Mecklenburgisch-Vorpommersch", 

1516 "Medan", 

1517 "Mediaeval", 

1518 "Medieval", 

1519 "Medieval Greek", 

1520 "Medieval Latin", 

1521 "Medio-Late Egyptian", 

1522 "Mehedinți", 

1523 "Meinong", 

1524 "Meixian", 

1525 "Melanesian", 

1526 "Melinting", 

1527 "Menggala/Tulang Bawang", 

1528 "Mercian", 

1529 "Merseyside", 

1530 "Mescaleiro", 

1531 "Mexica", 

1532 "Mexico", 

1533 "Mfom", 

1534 "Miaoli", 

1535 "Microsoft Azure", 

1536 "Mid Northern Scots", 

1537 "Mid Northern", 

1538 "Mid", 

1539 "Mid-Atlantic", 

1540 "Middle Ages", 

1541 "Middle Chinese", # Historical variant of Chinese 

1542 "Middle Cornish", 

1543 "Middle Egyptian", 

1544 "Middle", 

1545 "Midland American English", 

1546 "Midlands", 

1547 "Midlandsnormalen", 

1548 "Midwestern US", 

1549 "Milan", 

1550 "Milanese", 

1551 "Milpa Alta", 

1552 "Min", 

1553 "Min Bei", 

1554 "Min Dong", # Chinese dialect/language 

1555 "Min Nan", # Chinese dialect/language 

1556 "Minangkabauat", 

1557 "Minas Gerais", 

1558 "Mineiro", 

1559 "Mirandola", 

1560 "Mirandolese", 

1561 "Mistralian", 

1562 "Mizrahi Hebrew", 

1563 "Modena", 

1564 "Modern", 

1565 "Modern Armenian", 

1566 "Modern Israeli Hebrew", 

1567 "Modern Israeli", 

1568 "Modern Latin", 

1569 "Modern Polabian", 

1570 "Modern Turkish", 

1571 "Modi", # Variant/language based on Sanskrit 

1572 "Moghamo", 

1573 "Moldavia", 

1574 "Molet Kasu", 

1575 "Molet Mur", 

1576 "Monegasque", 

1577 "Mongo-Turkic", 

1578 "Montenegro", 

1579 "Montreal", 

1580 "Mooring", # Variant of North Frisian 

1581 "Moravia", 

1582 "Mormonism", 

1583 "Moroccan", # Variant of Arabic 

1584 "Moroccan Arabic", # Variant of Arabic 

1585 "Morocco", 

1586 "Moscow", 

1587 "Moselle Franconian", 

1588 "Mosetén", 

1589 "Mount Currie", 

1590 "Mozambique", 

1591 "Moçambique", 

1592 "Mpakwithi", 

1593 "Muğla", 

1594 "Multicultural London English", 

1595 "Munster", 

1596 "Muping", 

1597 "Murang'a", 

1598 "Mushuau Innu", 

1599 "Muslim", 

1600 "Münsterland", 

1601 "Münsterländisch", 

1602 "Mycenaean", # Variant of Greek 

1603 "Nahua", 

1604 "Nahuatl", 

1605 "Nakhchivan", 

1606 "Namibia", 

1607 "Nanchuan", 

1608 "Nanchang", 

1609 "Nan'an", 

1610 "Nao Klao", # dialect 

1611 "Naples", 

1612 "Navajo", 

1613 "Navarre", 

1614 "Navarrese", 

1615 "Navarro-Lapurdian", 

1616 "Navy", 

1617 "Nazism", 

1618 "Ndia", 

1619 "Neo-Latin", 

1620 "Nepal", 

1621 "Netherlands", 

1622 "Nevada", 

1623 "New Age", 

1624 "New England", 

1625 "New Jersey", 

1626 "New Latin", 

1627 "New Sanskrit", 

1628 "New South Wales", # State of Australia 

1629 "New York City", 

1630 "New York", 

1631 "New Zealand", 

1632 "Newfoundland", 

1633 "Nicaragua", 

1634 "Niçard", 

1635 "Nidwalden", 

1636 "Nigeria", 

1637 "Niğde", 

1638 "Ningbo", 

1639 "Nizhegorod", 

1640 "Nomen sacrum", # Used in Gothic form names 

1641 "Non-Oxford", 

1642 "Nordestino", 

1643 "Nordic", 

1644 "Norfolk", 

1645 "Normandy", 

1646 "Norse", 

1647 "North Afar", 

1648 "North America", 

1649 "North American", 

1650 "North Brazil", 

1651 "North East England", 

1652 "North Eastern US", 

1653 "North German", 

1654 "North Korea", 

1655 "North Levantine", 

1656 "North Levantine Arabic", # Variant of Arabic 

1657 "North Northern Scots", 

1658 "North Northern", 

1659 "North Northern", 

1660 "North Wales", 

1661 "North and East of the Netherlands", 

1662 "North", 

1663 "Northeast Brazil", 

1664 "Northeastern Brazil", 

1665 "Northeastern", 

1666 "Northern California", 

1667 "Northern Catalan", 

1668 "Northern Crimea", 

1669 "Northern England", 

1670 "Northern English", 

1671 "Northern Germany", 

1672 "Northern Ireland", 

1673 "Northern Italy", 

1674 "Northern Mandarin", # Chinese dialect/language 

1675 "Northern Manx", 

1676 "Northern Middle English", 

1677 "Northern Puebla", 

1678 "Northern Scots", 

1679 "Northern UK", 

1680 "Northern US", 

1681 "Northern Yiddish", 

1682 "Northern Zazaki", 

1683 "Northern", 

1684 "Northamptonshire", 

1685 "Northumbria", 

1686 "Northwestern", 

1687 "Northwestern Argentina", 

1688 "Novgorod", 

1689 "Nde", 

1690 "Nembe", 

1691 "Nfom", 

1692 "Ngan'gimerri", 

1693 "Ngan'gikurunggurr", 

1694 "Ngie", 

1695 "Ngoko", 

1696 "Nghệ An", # Vietnamese dialect 

1697 "Nkim", 

1698 "Nkojo", 

1699 "Nkum", 

1700 "Norse", 

1701 "Nselle", 

1702 "Nsimbwa", 

1703 "Nta", 

1704 "Ntuzu", 

1705 "Nuorese", 

1706 "Nyeri", 

1707 "Nynorak", 

1708 "Nynorsk", # Variant of Norwegian 

1709 "Nyungkal", 

1710 "Nürnbergisch", 

1711 "Occitania", 

1712 "Old Attic", # Ancient Greek 

1713 "Old Bohairic", 

1714 "Old Chamorro", 

1715 "Old Chinese", # Historical variant of Chinese 

1716 "Old Coptic", 

1717 "Old East Church Slavonic", 

1718 "Old Egyptian", 

1719 "Old English", 

1720 "Old Latin", 

1721 "Old Lithuanian", 

1722 "Old Norse", 

1723 "Old Northern French", 

1724 "Old Polabian", 

1725 "Old Tagalog", 

1726 "Oliti", 

1727 "Olles", 

1728 "Ombos", 

1729 "Ontario", 

1730 "Ooldea", 

1731 "Orcadian", 

1732 "Ordubad", 

1733 "Orkney", 

1734 "Ormulum", 

1735 "Oryol", 

1736 "Oslo", 

1737 "Ottomans", 

1738 "Oxford", # Variant of British English 

1739 "Pa Pae village", 

1740 "Paderbornish", 

1741 "Paderbornisch", 

1742 "Pahang", 

1743 "Pak Kret District", 

1744 "Pakistan", 

1745 "Palacios de Sil", 

1746 "Palatine", 

1747 "Palestinian", 

1748 "Pali", # Sanskrit 

1749 "Panama", 

1750 "Pangin", 

1751 "Papua", 

1752 "Papua New Guinea", 

1753 "Papuanese", 

1754 "Paraguay", 

1755 "Paraná", # State in Brazil 

1756 "Paris", 

1757 "Parisian", 

1758 "Parres", 

1759 "Parts of south Jeolla", 

1760 "Paulistano", 

1761 "Payang", # Region in Indonesia (Rejang language) 

1762 "Pays de Bray", 

1763 "Pays de Caux", 

1764 "Paḷḷuezu", 

1765 "Peking", 

1766 "Pembrokeshire", 

1767 "Penang Hokkien", 

1768 "Penang", 

1769 "Peng'im", 

1770 "Penghu Hokkien", 

1771 "Pennsylvania", 

1772 "Periphrastic conjugations", 

1773 "Perm", 

1774 "Persian Gulf", 

1775 "Persianized", 

1776 "Perso-Arabic", 

1777 "Peru", 

1778 "Peshawar", 

1779 "Phnom Penh", 

1780 "Philadelphia", 

1781 "Philippine", 

1782 "Philippines", 

1783 "Piacenza", 

1784 "Picardy", 

1785 "Pinghua", # Chinese dialect/language 

1786 "Pinyin", 

1787 "Pirupiru", 

1788 "Pite", # Variant of Sami 

1789 "Piteå", 

1790 "Plautdietsch", 

1791 "Polari", 

1792 "Polish", 

1793 "Portugal", 

1794 "Portugal", 

1795 "Possesse", 

1796 "Poylish", 

1797 "Poznań", 

1798 "Praenominal", # Type of abbreviation 

1799 "Pre-Hebrew", 

1800 "Prokem", 

1801 "Protestant", 

1802 "Proto-Slavic", 

1803 # [ used in Reconstruction:Latin entries, e.g. {{la-verb|4|*sufferiō|*sufferīv|*suffert}} {{lb|la|Proto-Romance}} 

1804 "Proto-Balkan-Romance", 

1805 "Proto-Ibero-Romance", 

1806 "Proto-Italo-Western-Romance", 

1807 "Proto-Gallo-Romance", 

1808 "Proto-Romance", 

1809 "Proto-Western-Romance", 

1810 # ] 

1811 "Provençal", 

1812 "Provençau", # Dialect of Occitan 

1813 "Pskov", 

1814 "Pu No", # dialect 

1815 "Pubian", 

1816 "Puebla", 

1817 "Puerto Rico", 

1818 "Pulaar", 

1819 "Pular", 

1820 "Puter", 

1821 "Puxian Min", # Chinese language/dialect 

1822 "Valdés", 

1823 "Vallander", 

1824 "Varendra", 

1825 "Vegliot", 

1826 "Vest Recklinghausen", 

1827 "Villacidayo", 

1828 "Qazakh", 

1829 "Quakerism", 

1830 "Quanzhou", 

1831 "Quebec", 

1832 "Quebec City", 

1833 "Quetta", 

1834 "Quirós", 

1835 "Quốc ngữ", 

1836 "Raguileo Alphabet", 

1837 "Ragusan", 

1838 "Rai Kaili", 

1839 "Ranau", 

1840 "Rastafari", 

1841 "Rastafarian", 

1842 "Ratak", 

1843 "Received Pronunciation", 

1844 "Recueil scientifique ou littéraire", 

1845 "Reggio Emilia", 

1846 "Reina-Valera version", 

1847 "Renshou", 

1848 "Revived Late Cornish", 

1849 "Revived Middle Cornish", 

1850 "Revived", 

1851 "Rhine Franconian", # Variant of German 

1852 "Rhineland", 

1853 "Rhodesia", 

1854 "Riau", 

1855 "Riau-Lingga", 

1856 "Rigveda", 

1857 "Riksmål", 

1858 "Rimella", 

1859 "Ring", 

1860 "Rio Grande De Sul", 

1861 "Rio de Janeiro", 

1862 "Río de la Plata", 

1863 "Rioplatense", 

1864 "Ripuarian", 

1865 "Ritsu", 

1866 "Rogaland", 

1867 "Roman Catholic", 

1868 "Roman Empire", 

1869 "Romanian", 

1870 "Romungro", 

1871 "Rouen", 

1872 "Rubī-Safaia", 

1873 "Ruhrgebiet", 

1874 "Rumantsch Grischun", 

1875 "Rumy", 

1876 "Rundi", 

1877 "Rungu", 

1878 "Russia", 

1879 "Russian", 

1880 "Russianism", 

1881 "Rwanda", 

1882 "Rwanda-Rundi", 

1883 "Rālik", 

1884 "Rāṛha", 

1885 "SK Standard", 

1886 "SW England", 

1887 "Saarve", 

1888 "Sagada", 

1889 "Sahidic", 

1890 "Saint Ouën", 

1891 "Saint Petersburg", 

1892 "Sakayamuni", 

1893 "Sakhalin", 

1894 "Salaca", 

1895 "Salas", 

1896 "Sallans", 

1897 "Salyan", 

1898 "Sami", 

1899 "San Juan Quiahije", 

1900 "Sanskrit", 

1901 "Sanskritized", 

1902 "Santiago", 

1903 "Sanxia Hokkien", 

1904 "São Vicente", 

1905 "Sappada", 

1906 "Sapper-Ricke", 

1907 "Sark", 

1908 "Sauerland", 

1909 "Sauerländisch", 

1910 "Sauris", 

1911 "Savoie", 

1912 "Savoyard", 

1913 "Sawndip", 

1914 "Sayisi", # Variant of Chipewyan language? 

1915 "Schleswig-Holstein", 

1916 "Schwyz", 

1917 "Scientific Latin", 

1918 "Scotland", 

1919 "Scottish", 

1920 "Scouse", 

1921 "Seoul", 

1922 "Sepečides", 

1923 "Sepoe", 

1924 "Serbia", 

1925 "Serbian", 

1926 "Serbo-Croatian", 

1927 "Servia", 

1928 "Sesivi", 

1929 "Sette Comuni", 

1930 "Seville", 

1931 "Shandong", 

1932 "Shanghai", 

1933 "Shanghainese Wu", 

1934 "Shapsug", 

1935 "Shavian", 

1936 "Sheffield", 

1937 "Sheng", 

1938 "Shephardi Hebrew", 

1939 "Sheshatshiu Innu", 

1940 "Shetland", 

1941 "Shetlandic", 

1942 "Shia", 

1943 "Shidong", 

1944 "Shikoku", 

1945 "Shin", 

1946 "Shiraz", 

1947 "Shropshire", 

1948 "Shubi", 

1949 "Shuri-Naha", 

1950 "Shuryshkar", 

1951 "Siba", 

1952 "Sibe", 

1953 "Sichuan", 

1954 "Sichuanese", 

1955 "Sikh", 

1956 "Sikhism", 

1957 "Silesian", 

1958 "Simplified", 

1959 "Singapore English", 

1960 "Singapore", 

1961 "Singlish", 

1962 "Sino-Korean", 

1963 "Sino-Japanese", 

1964 "Sisiame", 

1965 "Sistani", 

1966 "Sixian", 

1967 "Skellefteå", 

1968 "Skiri", 

1969 "Skolt", # Variant of Sami 

1970 "Slovak", 

1971 "Slovene", 

1972 "Slovincian", 

1973 "Smolensk", 

1974 "Sobrescobiu", 

1975 "Sofia Erli", 

1976 "Soikkola", 

1977 "Solothurn", 

1978 "Somiedu", 

1979 "Sori", 

1980 "Sotavento", 

1981 "Souletin", 

1982 "South Afar", 

1983 "South Africa", 

1984 "South African", 

1985 "South America", 

1986 "South American English", 

1987 "South Asia", 

1988 "South Azerbaijani", 

1989 "South Brazil", 

1990 "South German", 

1991 "South Korea", 

1992 "South Levantine", 

1993 "South Levantine Arabic", 

1994 "South Northern Scots", 

1995 "South Scots", 

1996 "South Wales", 

1997 "South", 

1998 "Southeastern", 

1999 "Southern Africa", 

2000 "Southern American English", 

2001 "Southern Brazil", 

2002 "Southern England", 

2003 "Southern Italy", 

2004 "Southern Manx", 

2005 "Southern Middle English", 

2006 "Southern Quechua", 

2007 "Southern Scotland", 

2008 "Southern Scots", 

2009 "Southern Spain", 

2010 "Southern US", 

2011 "Southern Yiddish", 

2012 "Southern Zazaki", 

2013 "Southern", 

2014 "Southwestern", 

2015 "Southwestern Mandarin", # Chinese dialect/language 

2016 "Space Force", 

2017 "Spain", 

2018 "Spanish", 

2019 "Sremski Gurbet", 

2020 "Sri Lanka", 

2021 "St. Gallen", 

2022 "Standard Cornish", 

2023 "Standard Chinese", # Standard spoken Chinese, Standard Northern Mandarin in linguistics 

2024 "Standard East Norwegian", 

2025 "Standard German of Switzerland", 

2026 "Standard German", 

2027 "Standard Hlai", 

2028 "Standard Sicilian", 

2029 "Standard Tagalog", 

2030 "Standard Zhuang", 

2031 "Stavanger", 

2032 "Stellingwerfs", 

2033 "Stokoe", # Used in sign language letter entries to indicate Latin letter 

2034 "Suizhou", 

2035 "Sukai", 

2036 "Sukau", 

2037 "Sundanese", 

2038 "Sungkai", 

2039 "Sunni", 

2040 "Surgut", 

2041 "Surigaonon", 

2042 "Surinam", 

2043 "Suriname", 

2044 "Surmiran", 

2045 "Sursilvan", 

2046 "Suðuroy", 

2047 "Sutsilvan", 

2048 "Suzhou", 

2049 "Sweden", 

2050 "Swindon", # Place in UK? 

2051 "Swiss German", 

2052 "Swiss", 

2053 "Switzerland", 

2054 "Syllabics", # Used in word head with Plains Cree, e.g. tânisi/Plains Cree 

2055 "Sylt", # Variant of North Frisian 

2056 "Syrian Hebrew", 

2057 "São Paulo", 

2058 "São Vicente", 

2059 "Traditional Chinese Medicine", 

2060 "TV", 

2061 "Taberga", 

2062 "Tabriz", 

2063 "Taicheng", 

2064 "Tai Xuan Jing", 

2065 "Taichung Hokkien", 

2066 "Tainan", 

2067 "Taipei", 

2068 "Taishanese", 

2069 "Taishan", 

2070 "Taiwan", 

2071 "Taiwanese Min Nan", 

2072 "Taiwanese Hokkien", 

2073 "Taiwanese Mandarin", # Chinese dialect/language 

2074 "Taixuanjing tetragram", 

2075 "Taiyuan", 

2076 "Tajik", 

2077 "Talang Padang", 

2078 "Tally-marks", 

2079 "Talur", 

2080 "Tang-e Eram", 

2081 "Tankarana", 

2082 "Tantoyuca", 

2083 "Tao", 

2084 "Taraškievica", 

2085 "Tashelhit", # Variant of Berber 

2086 "Tasmania", 

2087 "Tasmanian", 

2088 "Tavastia", 

2089 "Tebera", 

2090 "Teesside", 

2091 "Tehran", 

2092 "Tehrani", 

2093 "Telugu-Kui", 

2094 "Temapache", 

2095 "Tenerife", 

2096 "Teochew", 

2097 "Teotepeque", 

2098 "Tepetzintla", 

2099 "Terre-Neuve-et-Labrador", 

2100 "Tessin", 

2101 "Texas", 

2102 "Texcoco", 

2103 "Textbibel", 

2104 "Tgdaya", 

2105 "Thailand", 

2106 "Thanh Chương", 

2107 "The Hague", 

2108 "Thessalian", # Ancient Greek 

2109 "Thung Luang village", 

2110 "Thung Luang", 

2111 "Thurgau", 

2112 "Thuringian-Upper Saxon", 

2113 "Tianjin", 

2114 "Tiberian Hebrew", 

2115 "Timau", 

2116 "Timor-Leste", 

2117 "Tlaxcala", 

2118 "Tlyadal", 

2119 "Toaripi", 

2120 "Tokat", 

2121 "Tokyo", 

2122 "Tongyang", 

2123 "Tongzi", 

2124 "Torlakian", 

2125 "Tosk", 

2126 "Toulouse", 

2127 "Traditional", 

2128 "Tragic Ancient Greek", # Ancient Greek 

2129 "Trakai-Vilnius", 

2130 "Translingual", 

2131 "Transoxianan", 

2132 "Transylvania", 

2133 "Trat", 

2134 "Tredici Comuni", 

2135 "Trentino", 

2136 "Trinidad and Tobago", 

2137 "Truku", 

2138 "Tsimihety", 

2139 "Tulamni", 

2140 "Turkmen", 

2141 "Tuscany", 

2142 "Twente", 

2143 "Twents", 

2144 "Twi", # Dialect of the Akan language 

2145 "Tyneside", 

2146 "Uganda", 

2147 "UK with /ʊ/", 

2148 "UK", 

2149 "Ulu", 

2150 "UPA", 

2151 "Upper Silesia", 

2152 "Upper Sorbian", 

2153 "Urama", 

2154 "Urdu", 

2155 "US with /u/", 

2156 "US", 

2157 "US-Inland North", 

2158 "US-merged", 

2159 "Ukraine", 

2160 "Ukrainish", 

2161 "Ukraynish", 

2162 "Ulaanbaatar", 

2163 "Ulster Scots", 

2164 "Ulster", 

2165 "Ultramontane", # Corsican dialect 

2166 "Umeå", 

2167 "Unified", 

2168 "Unix", 

2169 "Unquachog", # Dialect of Quiripi 

2170 "Upper RP Triphthong Smoothing", 

2171 "Uri", 

2172 "Urkers", 

2173 "Ursari", 

2174 "Urtijëi", 

2175 "Uruguay", 

2176 "Urumqi", 

2177 "Utara", # Region in Indonesia (Rejang language) 

2178 "Uutände", 

2179 "Uyghurjin", 

2180 "Vaiśeṣika", 

2181 "Valais", 

2182 "Valencia", 

2183 "Valencian", 

2184 "Vallander", 

2185 "Vancouver", 

2186 "Vancouver Island", 

2187 "Vaṅga", 

2188 "Vedic", 

2189 "Veluws", 

2190 "Venezuela", 

2191 "Verona", 

2192 "Vidari", # Variant of Alviri-Vidari 

2193 "Vietnam", 

2194 "Vinh", 

2195 "Vinza", 

2196 "Virginia", 

2197 "Vivaro-Alpin", 

2198 "Vivaro-Alpine", 

2199 "Volapük Nulik", 

2200 "Volapük Rigik", 

2201 "Vosges", 

2202 "Vulgata", 

2203 "Västergötland", 

2204 "WW2 air pilots' usage", 

2205 "Wade-Giles", 

2206 "Wadikali", 

2207 "Walapai", 

2208 "Wales", 

2209 "Wallonia", 

2210 "Wamwan", 

2211 "Wardak", 

2212 "Waterford", 

2213 "Way Lima", 

2214 "Waxiang", # Variant of Chinese? 

2215 "Wazirwola", 

2216 "Wearside", 

2217 "Weirate", 

2218 "Welche", 

2219 "Welsh English", 

2220 "Wenzhou", # Chinese dialect/language 

2221 "Wenzhou Wu", # Chinese dialect/language 

2222 "West Armenian", 

2223 "West Bengal", 

2224 "Benglish", # vai/English 20241112 

2225 "West Cork", 

2226 "West Country", 

2227 "West Java", 

2228 "West Kerry", 

2229 "West Midlands", 

2230 "West Muskerry", 

2231 "West Pomeranian", 

2232 "West Saxon", 

2233 "West Sumatra", 

2234 "West", 

2235 "Western Armenian", 

2236 "Western Lombard", 

2237 "Western Punjabi", 

2238 "Western Quebec", 

2239 "Western Rumelia", 

2240 "Western Syriac", 

2241 "Western", 

2242 "Westminster system", 

2243 "Westmünsterland", 

2244 "Westphalia", 

2245 "Westphalian", 

2246 "Westpfälzisch", 

2247 "Westwestphalian", 

2248 "Wiedingharde", 

2249 "Windesi", 

2250 "Witzapan", 

2251 "Wolverhampton", # Place in UK? 

2252 "Wood", 

2253 "World War I", 

2254 "Wrangelsholm", 

2255 "Written Form", 

2256 "Wu", # Chinese dialect/language 

2257 "Wuhan", 

2258 "Wuvulu", 

2259 "Xiamen", 

2260 "Xiamen-Hokkien", 

2261 "Xiang", 

2262 "Xilitla", 

2263 "YIVO", 

2264 "Yagaria", 

2265 "Yahualica", 

2266 "Yajurveda chanting", 

2267 "Yaman", 

2268 "Yanbian", 

2269 "Yanhe", 

2270 "Yao'an", 

2271 "Yardliyawara", 

2272 "Yardymli", 

2273 "Yaut", 

2274 "Yawelmani", 

2275 "Yañalif", 

2276 "Ye'kwana", 

2277 "Yemen", 

2278 "Yemenite Hebrew", 

2279 "Yichang", 

2280 "Yiddish-influenced", 

2281 "Yilan", 

2282 "Yilan Hokkien", 

2283 "Yindjilandji", 

2284 "Yintyingka", 

2285 "Ylä-Laukaa", 

2286 "Yongshan", 

2287 "Yorkshire", 

2288 "Yozgat", 

2289 "Yukjin", 

2290 "Yukon", 

2291 "Yulparija", 

2292 "Yunnan", 

2293 "Zacatianguis", 

2294 "Zamboanga", 

2295 "Zangilan", 

2296 "Zaqatala", 

2297 "Zezuru", 

2298 "Zhengzhang", 

2299 "Zhangzhou", 

2300 "Zhangzhou Hokkien", 

2301 "Zhangpu", 

2302 "Zimbabwe", 

2303 "Zinacantán", 

2304 "Zurich", 

2305 "Zêkog", 

2306 "Överkalix", 

2307 "al-Andalus", # historically Muslim-ruled area of the Iberian Peninsula 

2308 "bureaucratese", 

2309 "central and northeastern Switzerland", 

2310 "continental Normandy", 

2311 "feudal Britain", 

2312 "parts of South Africa", 

2313 "outside Northumbria", 

2314 "post-Augustan", 

2315 "post-Classical", 

2316 "post-Homeric", 

2317 "pre-Classical", 

2318 "regionally African American Vernacular", 

2319 "southern Moselle Franconian", 

2320 "northernmost Moselle Franconian", 

2321 "west Sweden", 

2322 "most of Moselle Franconian", 

2323 "Southern Germany", 

2324 "southern Germany", 

2325 "Northwest German", # anfangen/German 

2326 "Ruhrdeutsch", # Haus/German 

2327 "Berlinisch", # Haus/German 

2328 "18th ct.", # Haus/German 

2329 "south-western German", # Maus/German 

2330 "Upper German", # schneien/German 

2331 # paste from placenames relating to Chinese dialectal synonyms 

2332 "Tianmen", 

2333 "Gaoming", 

2334 "Xining", 

2335 "Dali", 

2336 "Huicheng-Bendihua", 

2337 "Ganzhou", 

2338 "Luoyang", 

2339 "Lingui", 

2340 "Changting", 

2341 "Lütian", 

2342 "Jiamusi", 

2343 "Heshan", 

2344 "Neipu", 

2345 "Sanjia", 

2346 "Fuyang", 

2347 "Baihe", 

2348 "Changchun", 

2349 "Linfen", 

2350 "Jinzhou", 

2351 "Chongming", 

2352 "Dandong", 

2353 "Qingxi", 

2354 "Shexian", 

2355 "Mengzi", 

2356 "Tonghua", 

2357 "Zhengzhou", 

2358 "Qingping", 

2359 "Haikou", 

2360 "Zunyi", 

2361 "Zhangjiakou", 

2362 "Yangchun", 

2363 "Guiyang", 

2364 "Southern-Pinghua", 

2365 "Ninghua", 

2366 "Dazhou", 

2367 "Zhuhai", 

2368 "Shuangfeng", 

2369 "Tangkou", 

2370 "Hailar", 

2371 "Nanchong", 

2372 "Lianyungang", 

2373 "Kuala-Lumpur", 

2374 "Wengyuan", 

2375 "Hsinchu-County", 

2376 "Ningdu", 

2377 "Lunbei", 

2378 "Wuping", 

2379 "Tingzi", 

2380 "Zhaotong", 

2381 "Liuzhou", 

2382 "Yantai", 

2383 "Shenzhen", 

2384 "Doumen", 

2385 "Leizhou", 

2386 "Zhongshan", 

2387 "Changzhi", 

2388 "Lianjiang", 

2389 "Xinhui", 

2390 "Lishi", 

2391 "Baisha", 

2392 "Xihe", 

2393 "Hangzhou", 

2394 "Tong'an", 

2395 "Baoji", 

2396 "Hanzhong", 

2397 "Yanqian", 

2398 "Xi'an", 

2399 "Cangzhou", 

2400 "Zhao'an", 

2401 "Xinyang", 

2402 "Jieyang", 

2403 "Xiangyang", 

2404 "Huazhou", 

2405 "Niujiang", 

2406 "Xichang", 

2407 "Sabah", 

2408 "Danyang", 

2409 "Lianshui", 

2410 "Qianshan", 

2411 "Jining", 

2412 "Zhudong", 

2413 "Conghua", 

2414 "Huiyang", 

2415 "Chikan", 

2416 "Yangxi", 

2417 "Pingshan", 

2418 "Anqing", 

2419 "Xiuzhuan", 

2420 "Qingdao", 

2421 "Erenhot", 

2422 "Pingtung", 

2423 "Hefei", 

2424 "Manila", 

2425 "Chifeng", 

2426 "Qionglin", 

2427 "Nantong", 

2428 "Yangyuan", 

2429 "Zengcheng", 

2430 "Lijin", 

2431 "Dunhuang", 

2432 "Kam-Tin-Weitou", 

2433 "Nanlang-Heshui", 

2434 "Lichuan", 

2435 "Jiexi", 

2436 "Dongshi", 

2437 "Xindong", 

2438 "Linzhou", 

2439 "Qionghai", 

2440 "Shangqiu", 

2441 "Wuhu", 

2442 "Shijiao", 

2443 "Linhe", 

2444 "Shunde", 

2445 "Wenchang", 

2446 "Kaiping", 

2447 "Shijiazhuang", 

2448 "Yinchuan", 

2449 "Mingcheng", 

2450 "Xinyi", 

2451 "Dongguan", 

2452 "Tonggu", 

2453 "Tianshui", 

2454 "Guangfu", 

2455 "Jixi", 

2456 "Yangjiang", 

2457 "Shatou", 

2458 "Suide", 

2459 "Nanjing", 

2460 "Foshan", 

2461 "Dalian", 

2462 "Liannan", 

2463 "Baicheng", 

2464 "Datong", 

2465 "Yunlin", 

2466 "Shenyang", 

2467 "Nanhai", 

2468 "Dabu", 

2469 "Shajing", 

2470 "Chaozhou", 

2471 "Hami", 

2472 "Pingxiang", 

2473 "Shiqi", 

2474 "Sanshui", 

2475 "Baoding", 

2476 "Johor-Bahru", 

2477 "Tangshan", 

2478 "Harbin", 

2479 "Yudu", 

2480 "Dianbai", 

2481 "Gaozhou", 

2482 "Heihe", 

2483 "Hulunbuir", 

2484 "Jinan", 

2485 "Kunming", 

2486 "Changde", 

2487 "Enping", 

2488 "Shatoujiao", 

2489 "Hailu", 

2490 "Chengde", 

2491 "Zigong", 

2492 "Zhucheng", 

2493 "Guilin", 

2494 "Panlong", 

2495 "Wanrong", 

2496 "Huadu", 

2497 "Bao'an", 

2498 "Qiqihar", 

2499 "Jinhua", 

2500 "Xinzhou", 

2501 "Lanzhou", 

2502 "Huashan", 

2503 "Loudi", 

2504 "Shalang", 

2505 "Yayao", 

2506 "Dayu", 

2507 "Senai", 

2508 "Hohhot", 

2509 "Nanning", 

2510 "Raoping", 

2511 "Sandu", 

2512 "Yuanyang", 

2513 "Handan", 

2514 "Jiangmen", 

2515 "Panyu", 

2516 "Xin'an", 

2517 "Sihe", 

2518 "Xuzhou", 

2519 "Lingbao", 

2520 "Luchuan", 

2521 "Mengshan", 

2522 "Taichung", 

2523 "Qianpai", 

2524 "Yangzhou", 

2525 "Liping", 

2526 "Ürümqi", 

2527 "Bijie", 

2528 "Cretan", # Ancient Greek 

2529 "Crimean Latin", 

2530 "Imperial Aramaic", 

2531 "Jewish Literary Aramaic", 

2532 "Katharevoussa", 

2533 "San Pedro Amuzgos", 

2534 "Ajaccino", 

2535 "Alupec", # Nonstandard lower-case of ALUPEC, just in case it pops up again. 

2536 "Ancient Cretan", 

2537 "Arbërëshë Albanian", 

2538 "Arbërëshë", 

2539 "Arebica", 

2540 "Arvanitika", 

2541 "Assyrian Neo Aramaic", 

2542 "Babylonian", 

2543 "Fogo", 

2544 "Bau-Jagoi", 

2545 "Bikol Daet", 

2546 "Bikol Partido", 

2547 "Bima", 

2548 "Sumbawa", 

2549 "Boeotian", # Ancient Greek 

2550 "Bokmal", 

2551 "Book Pahlavi", # Book Pahlavi, pseudoscience/English/translations/ 

2552 "Bádiu", 

2553 "Bökingharde", 

2554 "Cajun French", 

2555 "Campidanese Sardinian", 

2556 "Canka Quechua", 

2557 "Central Mahuatlán Zapotec", 

2558 "Central Yup'ik", 

2559 "Chu Nom", 

2560 "Chữ Nôm", 

2561 "Classical Huasteca Nahuatl", 

2562 "Classical Ottoman Turkish", 

2563 "Colloquial Finnish", 

2564 "Common Cornish", 

2565 "Dimli", 

2566 "Early Modern Korean", 

2567 "East Slovak Romani", 

2568 "Ekiti", 

2569 "Fadicca", 

2570 "Franconian", 

2571 "Galilean Aramaic", 

2572 "Gallurese Sardinian", 

2573 "Goesharde", 

2574 "Mooring", 

2575 "Grenadian", 

2576 "Guerrero", 

2577 "Hadrami Arabic", 

2578 "Hague dialect", 

2579 "Hawick Scots", 

2580 "High Saxonian", 

2581 "High Sorbian", 

2582 "Hill", # Hill Mari, Meadow Mari, dandruff/English 

2583 "Meadow", 

2584 "Hochpreußisch", 

2585 "Hoisanese", 

2586 "Huallaga", 

2587 "Inuvialuk", 

2588 "Isthmus", 

2589 "Jewish Babylonian", 

2590 "Jewish Northeastern Neo-Aramaic", 

2591 "Judeo-Malayalam", 

2592 "Kagwahiv", 

2593 "Kaigani", 

2594 "Kaili", 

2595 "Kativiri", 

2596 "Kelantan-Pattani Malay", 

2597 "Kihnu subdialect", 

2598 "Kirmancki", 

2599 "Kirmanjki", 

2600 "Komi-Yazva", 

2601 "Krama", 

2602 "Kyushu", 

2603 "Kölnisch", 

2604 "Laconian", # Ancient Greek 

2605 "Late Ottoman Turkish", 

2606 "Levantine, North", 

2607 "Levantine, South", 

2608 "Levantine", 

2609 "Logudorese Sardinian", 

2610 "Lower Rhine Alsatian", 

2611 "Maio", 

2612 "Maore", 

2613 "Masali", 

2614 "Massett", 

2615 "Mennonite Plautdietsch", 

2616 "Min nan", 

2617 "Minnan", 

2618 "Moldavian", 

2619 "Moldovan Cyrillic", 

2620 "Mon Pali", 

2621 "Sylt", 

2622 "México Otomi", 

2623 "Narkamaŭka", 

2624 "New Low Saxon", 

2625 "North Korean", 

2626 "Northern Peubla", 

2627 "Oberlausitzisch", 

2628 "Old Zazaki", 

2629 "Olo'ik'yana", 

2630 "Onan", 

2631 "Palermitan", 

2632 "Palestine", 

2633 "Regional German", 

2634 "Salentino", 

2635 "San Miguel El Grande", 

2636 "San'ani Arabic", 

2637 "Santo Antão", 

2638 "Sarawak Malay", 

2639 "Saterland", 

2640 "Selice Romani", 

2641 "Sierra Norte", 

2642 "Singkil", 

2643 "Skitegate", 

2644 "South Korean", 

2645 "Standard Indonesian", 

2646 "Standard", 

2647 "Swabian German", 

2648 "São Nicolau", 

2649 "Tabarchino", 

2650 "Tarashkevitsa", 

2651 "Tataltepec Coastal Chatino", 

2652 "Terengganu Malay", 

2653 "Town Frisian", 

2654 "Tuscan dialect", 

2655 "UEY", # Uyghur, wash/English 

2656 "USY", # Uyghur ^ 

2657 "Upper Rhine Alsatian", 

2658 "Volhynian German", 

2659 "Waiwaş Quechua", 

2660 "Wanka Quechua", 

2661 "Zuberoan", 

2662 "Setesdal", # Norwegian 

2663 "Telemark", # Norwegian 

2664 "San'ani Yemeni Arabic", 

2665 "Krobo", # wawa/Adangme 

2666 "Afar", # afoofa/Afar 

2667 "Saru", # Ainu/ecioka 

2668 "Old Albanian", 

2669 # [ used in Ashokan Prakrit entries, e.g. {{inc-ash-noun|g=f}} {{tlb|inc-ash|Delhi-Meerut|Delhi-Topra|... 

2670 # see https://en.wiktionary.org/wiki/Module:labels/data/lang/inc-ash 

2671 # and https://en.wiktionary.org/wiki/Module:inc-ash/dial/data 

2672 "Shahbazgarhi", 

2673 "Mansehra", 

2674 "Kanadahar", 

2675 "Ranigat", 

2676 "Kalsi", 

2677 "Delhi-Topra", 

2678 "Delhi-Meerut", 

2679 "Rampurva", 

2680 "Lauriya-Nandangarh", 

2681 "Lauriya-Araraj", 

2682 "Lumbini", 

2683 "Nigali-Sagar", 

2684 "Sarnath", 

2685 "Rupnath", 

2686 "Bairat", 

2687 "Sanchi", 

2688 "Allahabad-Kosambi", 

2689 "Sahasram", 

2690 "Gujarra", 

2691 "Barabar", 

2692 "Calcutta-Bairat", 

2693 "Dhauli", 

2694 "Jaugada", 

2695 "Girnar", 

2696 "Sopara", 

2697 "Yerragudi", 

2698 "Siddapura", 

2699 "Brahmagiri", 

2700 "Maski", 

2701 "Barabar Hill", 

2702 "Barabar Caves", 

2703 "Bhabru", 

2704 "Kaushambi", 

2705 "Khalsi", 

2706 "Kosambi", 

2707 "Lauria-Nandangarh", 

2708 "Lauria-Araraj", 

2709 "Mathia", 

2710 "Radhia", 

2711 "Rummindei", 

2712 "Topra", 

2713 "Meerut", 

2714 # [ used in Proto-Uralic entries e.g. 

2715 # {{head|urj-pro|noun}} {{tlb|urj-pro|Finno-Permic}} 

2716 "Finno-Permic", 

2717 "Finno-Volgaic", 

2718 # [ used in Proto-Georgian-Zan/Proto-Kartvelian entries e.g. 

2719 # {{head|ccs-pro|noun}} {{tlb|ccs-pro|Fähnrich-Sarǯvelaʒe}} 

2720 "Čikobava", 

2721 "Klimov", 

2722 "Fähnrich-Sarǯvelaʒe", 

2723 "Fähnrich", 

2724 "Fähnrich-Sarǯvelaʒe 2000", 

2725 "Fähnrich 2007", 

2726 # Chinese pronunciation table stuff 

2727 "Yongchun", 

2728 "SP", 

2729 "Palladius", 

2730 "PFS", 

2731 "Hanyu Pinyin", 

2732 "IUPAC", # International Union of Pure and Applied Chemistry 

2733} 

2734 

2735 

2736# General mapping for linguistic tags. Value is a string of space-separated 

2737# tags, or list of alternative sets of tags. Alternative forms in the same 

2738# category can all be listed in the same string (e.g., multiple genders). 

2739# XXX should analyze imperfect vs. imperfective - are they just used in 

2740# different languages, or is there an actual difference in meaning? 

2741xlat_tags_map: dict[str, str | list[str]] = { 

2742 "sg": "singular", 

2743 "pl": "plural", 

2744 "sg.": "singular", 

2745 "pl.": "plural", 

2746 "sg. and pl.": "singular plural", 

2747 "sg and pl": "singular plural", 

2748 "m/f": "masculine feminine", 

2749 "no pl": "no-plural", 

2750 "pl. only": "plural-only plural", 

2751 "pl ordinaux": "usually plural", 

2752 "m.": "masculine", 

2753 "male": "masculine", 

2754 "f.": "feminine", 

2755 "fem.": "feminine", 

2756 "female": "feminine", 

2757 "indef.": "indefinite", 

2758 "gen.": "genitive", 

2759 "pres.": "present", 

2760 "subj.": "subjunctive", 

2761 "impf.": "imperfective", 

2762 "pf.": "perfective", 

2763 "trans.": "transitive", 

2764 "unc": "uncountable", 

2765 "abbreviated": "abbreviation", 

2766 "abbreviation as": "abbreviation", 

2767 "diminutives": "diminutive", 

2768 "Diminutive": "diminutive", 

2769 "Diminutives": "diminutive", 

2770 "†-tari": "-tari", 

2771 "†-nari": "-nari", 

2772 "♂♀": "masculine feminine", 

2773 "♂": "masculine", 

2774 "♀": "feminine", 

2775 "cangjie input": "cangjie-input", 

2776 "RP": "Received-Pronunciation", 

2777 "BR": "Brazil", 

2778 "Brasil": "Brazil", 

2779 "Brazilian Portuguese": "Brazil", 

2780 "FR": "France", 

2781 "IT": "Italy", 

2782 "CAN": "Canada", 

2783 "AU": "Australia", 

2784 "AU&NZ": "Australia New-Zealand", 

2785 "AUS": "Australia", 

2786 "Austr.": "Australian", 

2787 "AusE": "Australia", 

2788 "Aus": "Australia", 

2789 "NSW": "New-South-Wales", 

2790 "LKA": "Sri-Lanka", 

2791 "RU": "Russia", 

2792 "SA": "South-Africa", 

2793 "[AU]": "Australia", 

2794 "NYC": "New-York-City", 

2795 "CA": "Canada", 

2796 "AT": "Austria", 

2797 "GA": "General-American", 

2798 "NV": "Navajo", 

2799 "UK male": "UK", 

2800 "UK female": "UK", 

2801 "GB": "UK", 

2802 "EN": "UK", 

2803 "IN": "India", 

2804 "PRC": "China", 

2805 "BG": "Bulgaria", 

2806 "DE": "Germany", 

2807 "IE": "Ireland", 

2808 "NL": "Netherlands", 

2809 "NZ": "New-Zealand", 

2810 "PT": "Portugal", 

2811 "BOL": "Bolivia", 

2812 "U.S.A.": "US", 

2813 "U.S.": "US", 

2814 "[US]": "US", 

2815 "Americanisation": "Americanization", 

2816 "Saint Ouen": "Saint-Ouën", 

2817 "Déné syllabary": "Déné-syllabary", 

2818 "Kayah Li": "Kayah-Li", 

2819 "Hanifi Rohingya": "Hanifi-Rohingya", 

2820 "Ol Chiki": "Ol-Chiki", 

2821 "Old Persian": "Old-Persian", 

2822 "Tai Tham": "Tai-Tham", 

2823 "Warang Citi": "Warang-Citi", 

2824 "UK & Aus": "UK Australia", 

2825 "US & HK": "US Hong-Kong", 

2826 "Britian": "Britain", 

2827 "coastal Min": "Coastal-Min", 

2828 "Telugu-Kui language": "Telugu-Kui", 

2829 "SK Standard/Seoul": "SK-Standard Seoul", 

2830 "Devanagri": "Devanagari error-misspelling", 

2831 "Standard Seoul": "SK-Standard Seoul", 

2832 "Association canadienne de normalisation": "Canada", 

2833 "esp.": "especially", 

2834 "northwestern": "Northwestern", 

2835 "northeastern": "Northeastern", 

2836 "southwestern": "Southwestern", 

2837 "southeastern": "Southeastern", 

2838 "northern": "Northern", 

2839 "southern": "Southern", 

2840 "western": "Western", 

2841 "eastern": "Eastern", 

2842 "westernmost": "Western", 

2843 "west": "West", 

2844 "Mecayapán": "Mecayapan", 

2845 "Andalucia": "Andalusia", 

2846 "Andalusian": "Andalusia", 

2847 "Andalucía": "Andalusia", 

2848 "Mooring and Föhr-Amrum": "Mooring Föhr-Amrum", 

2849 "Föhr-Amrum & Mooring": "Föhr-Amrum Mooring", 

2850 "Nazi slur against Churchill": "Nazism slur", 

2851 "religious slur": "slur", 

2852 "euphemistic Nazi term": "Nazism euphemistic", 

2853 "United States": "US", 

2854 "Québec": "Quebec", 

2855 "Classic Persian": "Classical-Persian", 

2856 "Sette Communi": "Sette-Comuni", 

2857 "Vivaro-alpine": "Vivaro-Alpine", 

2858 "Mooring and Hallig": "Mooring Hallig", 

2859 "Zürich": "Zurich", 

2860 "Somiedo": "Somiedu", 

2861 "Uk": "UK", 

2862 "US/UK": "US UK", # XXX leave separate 

2863 "USA": "US", 

2864 "México": "Mexico", 

2865 "Latinamerica": "Latin-America", 

2866 "Lat. Amer.": "Latin-America", 

2867 "LAm": "Latin-America", 

2868 "Monégasque": "Monegasque", 

2869 "Audio": "", 

2870 "orig. US": "", 

2871 "poetical": "poetic", 

2872 "Noun": "noun", 

2873 "Adjective": "adjective", 

2874 "Verb": "verb", 

2875 "Poetic": "poetic", 

2876 "Poetic.": "poetic", 

2877 "Informal.": "informal", 

2878 "slightly more formal": "formal", 

2879 "Used in formal contexts": "formal", 

2880 "Dialectal use only": "dialectal", 

2881 "Generally avoided unless the cause is emphasized": "rare emphatic", 

2882 "Colloquial.": "colloquial", 

2883 "Antiquated.": "dated", 

2884 "Archaic": "archaic", 

2885 "religious/archaic": "archaic", 

2886 "Causative": "causative", 

2887 "Passive": "passive", 

2888 "Stative": "stative", 

2889 "Applicative": "applicative", 

2890 "Colloquial": "colloquial", 

2891 "Epic verse": "poetic", 

2892 "Nominative plural - rare": "nominative plural rare", 

2893 "Nonstandard but common": "nonstandard common", 

2894 "Slang": "slang", 

2895 "Slang-Latin America": "slang Latin-America", 

2896 "TCM": "Traditional-Chinese-Medicine", 

2897 "slangy": "slang", 

2898 "backslang": "slang", 

2899 "butcher's slang": "slang jargon", 

2900 "archiac": "archaic error-misspelling", 

2901 "archaic except in fixed expressions": "archaic", 

2902 "nonstandard form": "nonstandard", 

2903 "singular form": "singular", 

2904 "plural form": "plural", 

2905 "nonstandard form of": "nonstandard alt-of", 

2906 "main verb": "base-form", 

2907 "standard form of": "standard alt-of", 

2908 "nonstandard stylistic suffix": "nonstandard dialectal suffix", 

2909 "honorific form": "honorific", 

2910 "possessed form": "possessed-form", 

2911 "obligatorily possessed": "possessed-form", 

2912 "obligatory possessive": "possessed-form", 

2913 "obligatory possession": "possessed-form", 

2914 "possessive only": "possessive", 

2915 "obligational": "obligative", 

2916 "indicated possession by preceding noun": "possessed-form", 

2917 "unpossessed form": "unpossessed-form", 

2918 "Dialectal": "dialectal", 

2919 "Dialect": "", 

2920 "dialectal form": "dialectal", 

2921 "dialectal term": "dialectal", 

2922 "dialectal Mandarin": "dialectal Mandarin", 

2923 "Dialect:": "", 

2924 "regiolectal": "dialectal", 

2925 "archaic or regiolectal": "archaic dialectal", 

2926 "archaic or regional": "archaic dialectal", 

2927 "Archaic or obsolete": "archaic", 

2928 "Canada: Ontario": "Ontario", 

2929 "Canada: British Columbia": "British-Columbia", 

2930 "GenAm": "General-American", 

2931 "Greco-Bohairic Pronunciation": "Greco-Bohairic", 

2932 "Greco-Bohairic pronunciation": "Greco-Bohairic", 

2933 "Vallader": "Vallander", 

2934 "Conservative RP": "Received-Pronunciation", 

2935 "Received Prononunciation": "Received-Pronunciation", 

2936 "North American also": "North-American", 

2937 "Cois Fharraige also": "Cois-Fharraige", 

2938 "Sawndip forms": "Sawndip", 

2939 "Sawndip form": "Sawndip", 

2940 "old orthography": "archaic", 

2941 "Maine accent": "Maine", 

2942 "Bosnia Serbia": "Bosnian-Serbian", 

2943 "MLE": "Multicultural-London-English", 

2944 "AAVE": "African-American-Vernacular-English", 

2945 "Early ME": "Early-Middle-English", 

2946 "Northern ME": "Northern-Middle-English", 

2947 "Southern ME": "Southern-Middle-English", 

2948 "Late ME": "Late-Middle-English", 

2949 "Spanish given name": "Spanish proper-noun", 

2950 "Taichung & Tainan Hokkien": "Taichung-Hokkien Tainan", 

2951 "St. Petersburg or dated": "Saint-Petersburg dated", 

2952 "Irregular reading": "irregular-pronunciation", 

2953 "irreg. adv.": "irregular adverbial", 

2954 "Argentina and Uruguay": "Argentina Uruguay", 

2955 "Argentina Uruguay": "Argentina Uruguay", 

2956 "Quanzhou & Xiamen Hokkien": "Quanzhou Xiamen-Hokkien", 

2957 "Xiamen & Zhangzhou Hokkien": "Xiamen-Hokkien Zhangzhou-Hokkien", 

2958 "Southern US folk speech": "Southern-US dialectal", 

2959 "Main dialectal variations": "dialectal", 

2960 "Many eastern and northern dialects": "dialectal", 

2961 "many dialects": "dialectal", 

2962 "some dialects of": "dialectal", 

2963 "now sometimes by conflation with etymology 1 under standard German influence": "sometimes", 

2964 "see below": "", 

2965 "unstressed form": "unstressed", 

2966 "mute of": "unstressed form-of", 

2967 "for some speakers": "uncommon", 

2968 'when "do" is unstressed and the next word starts with /j/': "unstressed-before-j", 

2969 "before a vowel": "before-vowel", 

2970 "before vowel": "before-vowel", 

2971 "before vowels": "before-vowel", 

2972 "pre-vocalic": "before-vowel", 

2973 "used before vowels and lenited fh-": "before-vowel before-lenited-fh", 

2974 "used before vowels": "before-vowel", 

2975 "used before the past tense": "before-past", 

2976 "used a verb in imperfect subjunctive": "with-imperfect with-subjunctive", 

2977 "the Eurozone": "Eurozone", 

2978 "Phoneme": "phoneme", 

2979 "Vowel": "phoneme", 

2980 "Consonant": "phoneme", 

2981 "Name of letter": "name", 

2982 "nation's name": "name", 

2983 "proprietary name": "name", 

2984 "Vulgar": "vulgar", 

2985 "strong language": "vulgar", 

2986 "Very Strong Swear word": "vulgar", 

2987 "Spoken": "colloquial", 

2988 "spoken": "colloquial", 

2989 "written": "literary", 

2990 "Syllable initial": "syllable-initial", 

2991 "Syllable final": "syllable-final", 

2992 "internet": "Internet", 

2993 "online": "Internet", 

2994 "instant messaging": "Internet", 

2995 "text messaging": "Internet", 

2996 "cot-caught merged": "cot-caught-merger", 

2997 "cot–caught merged": "cot-caught-merger", 

2998 "cot-caught merger": "cot-caught-merger", 

2999 "cot–caught merger": "cot-caught-merger", 

3000 "pin-pen merger": "pin-pen-merger", 

3001 "pin–pen merger": "pin-pen-merger", 

3002 "prefix before comparative forms": "prefix with-comparative", 

3003 "countable and uncountable": "countable uncountable", 

3004 "masculine and feminine plural": "masculine feminine plural", 

3005 "definite singular and plural": "definite singular plural", 

3006 "definite or plural": ["definite", "plural"], 

3007 "plural or definite attributive": [ 

3008 "plural attributive", 

3009 "definite singular attributive", 

3010 ], 

3011 "plural and definite singular attributive": [ 

3012 "plural attributive", 

3013 "definite singular attributive", 

3014 ], 

3015 "oblique and nominative feminine singular": "oblique nominative feminine singular", 

3016 "feminine and neuter plural": "feminine neuter plural", 

3017 "feminine and neuter": "feminine neuter", 

3018 "masculine and feminine": "masculine feminine", 

3019 "masculine and neuter": "masculine neuter", 

3020 "masculine and plural": "masculine plural", 

3021 "female and neuter": "feminine neuter", 

3022 "the third person": "third-person", 

3023 "(at least) nominative/objective/reflexive cases": "nominative objective", 

3024 "singular and plural": "singular plural", 

3025 "plural and weak singular": ["plural", "weak singular"], 

3026 "dative-directional": "dative directional", 

3027 "preterite and supine": "preterite supine", 

3028 "genitive and dative": "genitive dative", 

3029 "genitive and plural": "genitive plural", 

3030 "genitive plural": "genitive plural", 

3031 "dative and accusative": "dative accusative", 

3032 "accusative/illative": "accusative illative", 

3033 "accusative and ablative": "accusative ablative", 

3034 "dative and accusative singular": "dative accusative singular", 

3035 "no nominative": "no-nominative", 

3036 "simple past": "past", 

3037 "past —": "no-past", 

3038 "simple future": "future", 

3039 "simple present": "present", 

3040 "simple past and past participle": ["past", "past participle"], 

3041 "simple past tense and past participle": ["past", "past participle"], 

3042 "taking a past participle": "with-past-participle", 

3043 "literary or in compounds": "literary in-compounds", 

3044 "certain compounds": "in-compounds idiomatic", 

3045 "participial adjective": "participle adjective error-misspelling", 

3046 "literary or archaic": "literary archaic", 

3047 "literaly or archaic": "literary archaic error-misspelling", 

3048 "literary or dialectal": "literary dialectal", 

3049 "dated or dialectal": "dated dialectal", 

3050 "dialectal or colloquial": "dialectal colloquial", 

3051 "dialectal or obsolete": "dialectal obsolete", 

3052 # XXX what is this? "with verb in simple tense": "with-simple", 

3053 "in simple past tense": "past", 

3054 "for most verbs": "usually", 

3055 "in general": "usually", 

3056 "in variation": "in-variation", 

3057 "genitive/dative": "genitive dative", 

3058 "dative/locative": "dative locative", 

3059 "dative/locative/partitive": "dative locative partitive", 

3060 "dative/partitive": "dative partitive", 

3061 "genitive/dative/prepositional": "genitive dative prepositional", 

3062 "dative/instrumental": "dative instrumental", 

3063 "dative/instrumental/prepositional": "dative instrumental prepositional", 

3064 "genitive/prepositional": "genitive prepositional", 

3065 "genitive/dative/locative": "genitive dative locative", 

3066 "genitive/dative/ablative": "genitive dative ablative", 

3067 "dative/ablative/locative": "dative ablative locative", 

3068 "ablative/vocative": "ablative vocative", 

3069 "ablative/locative": "ablative locative", 

3070 "ablative/instrumental": "ablative instrumental", 

3071 "dative/ablative": "dative ablative", 

3072 "genitive/instrumental/locative": "genitive instrumental locative", 

3073 "genitive/dative/locative/vocative": "genitive dative locative vocative", 

3074 "genitive/dative/instrumental": "genitive dative instrumental", 

3075 "genitive/dative/instrumental/prepositional": "genitive dative instrumental prepositional", 

3076 "prepositional masculine / neuter singular": [ 

3077 "prepositional masculine", 

3078 "neuter singular", 

3079 ], 

3080 "+ prepositional case": "with-prepositional", 

3081 "+prepositional": "with-prepositional", 

3082 "+ por": "with-por", 

3083 "Radical": "radical", 

3084 "Kangxi radical": "radical", 

3085 "accusative/instrumental": "accusative instrumental", 

3086 "dative/adverbial case": "dative adverbial", 

3087 "dative/genitive": "dative genitive", 

3088 "dative/genitive/instrumental": "dative genitive instrumental", 

3089 "dative/accusative": "dative accusative", 

3090 "dative/accusative/locative": "dative accusative locative", 

3091 "genitive/accusative/prepositional": "genitive accusative prepositional", 

3092 "genitive/accusative/vocative": "genitive accusative vocative", 

3093 "genitive/dative/accusative": "genitive dative accusative", 

3094 "genitive/animate accusative": ["genitive", "animate accusative"], 

3095 "genitive/accusative animate/prepositional": [ 

3096 "genitive prepositional", 

3097 "accusative animate", 

3098 ], 

3099 "accusative plural and genitive plural": "accusative genitive plural", 

3100 "hidden-n declension": "hidden-n", 

3101 "declension pattern of": "declension-pattern-of", 

3102 "first/declension-2 adjective": "declension-1 declension-2 adjective", 

3103 "first/declension-2 participle": "declension-1 declension-2 participle", 

3104 "class 9/10": "class-9 class-10", 

3105 "class 5/6": "class-5 class-6", 

3106 "class 3/4": "class-3 class-4", 

3107 "class 7/8": "class-7 class-8", 

3108 "class 1/2": "class-1 class-2", 

3109 "class 11/10": "class-11 class-10", 

3110 "class 11/12": "class-11 class-12", 

3111 "nc 1/2": "class-1 class-2", 

3112 "nc 3/4": "class-3 class-4", 

3113 "nc 5/6": "class-5 class-6", 

3114 "nc 7/8": "class-7 class-8", 

3115 "nc 9/10": "class-9 class-10", 

3116 "nc 1": "class-1", 

3117 "nc 2": "class-2", 

3118 "nc 3": "class-3", 

3119 "nc 4": "class-4", 

3120 "nc 5": "class-5", 

3121 "nc 6": "class-6", 

3122 "nc 7": "class-7", 

3123 "nc 8": "class-8", 

3124 "nc 9": "class-9", 

3125 "nc 10": "class-10", 

3126 "nc 11": "class-11", 

3127 "nc 12": "class-12", 

3128 "nc 13": "class-13", 

3129 "nc 14": "class-14", 

3130 "nc 15": "class-15", 

3131 "nc 16": "class-16", 

3132 "nc 17": "class-17", 

3133 "nc 18": "class-18", 

3134 "cl. 2 to cl. 11 and cl. 16 to cl. 18": "class-2 class-3 class-4 class-5 class-6 class-7 class-8 class-9 class-10 class-11 class-16 class-17 class-18", 

3135 "refl": "reflexive", 

3136 "coll.": "colloquial", 

3137 "colloq.": "colloquial", 

3138 "colloq": "colloquial", 

3139 "collo.": "colloquial", 

3140 "collective when uncountable": "countable uncountable collective", 

3141 "coloquial": "colloquial", 

3142 "more colloquial": "colloquial", 

3143 "used colloquially and jokingly": "colloquial humorous", 

3144 "used adverbially": "adverbial", 

3145 "adverbially": "adverbial", 

3146 "intr.": "intransitive", 

3147 "tr.": "transitive", 

3148 "trans": "transitive", 

3149 "intransitive use": "intransitive", 

3150 "intransitive senses": "intransitive", 

3151 "intr. impers.": "intransitive impersonal", 

3152 "abbrev.": "abbreviation", 

3153 "Abbreviation": "abbreviation", 

3154 "Hiragana": "hiragana", 

3155 "Katakana": "katakana", 

3156 "synon. but common": "synonym common", 

3157 "common hyperhyms": "common hypernym", 

3158 "much more common": "common", 

3159 "common gender": "common-gender", 

3160 "incorrectly": "proscribed", 

3161 "incorrect": "proscribed", 

3162 "a hyponymic term": "hyponym", 

3163 "a hypernymic term": "hypernym", 

3164 "transitively": "transitive", 

3165 "intransitively": "intransitive", 

3166 "transitiv": "transitive", 

3167 "intransitiv": "intransitive", 

3168 "nominalized adjective": "noun-from-adj", 

3169 "adjectivized noun": "adjectival", 

3170 "adv.": "adverb", 

3171 "infomal": "informal error-misspelling", 

3172 "informally": "informal", 

3173 "formally": "formal", 

3174 "very formal": "formal", 

3175 "unmarked form": "unstressed", 

3176 "marked form": "stressed", 

3177 "inifnitive": "infinitive error-misspelling", 

3178 "inf.": "informal", 

3179 "inf": "infinitive", # darovať/Slovak 

3180 "unformal": "informal", 

3181 "unpolite": "impolite", 

3182 "fairly polite": "polite", 

3183 "postnominal": "postpositional", 

3184 "first/second declension": "declension-1 declension-2", 

3185 "first/second-declension": "declension-1 declension-2", 

3186 "first/declension-2 suffix": "declension-1 declension-2 suffix", 

3187 "first/declension-2 numeral plural only": "declension-1 declension-2 numeral plural-only plural", 

3188 "with gendered nouns": "with-gendered-noun", 

3189 "possessive (with noun)": "possessive with-noun", 

3190 "possessive (without noun)": "possessive without-noun", 

3191 "without a main word": "without-noun", 

3192 "informal 1st possessive": "informal first-person possessive", 

3193 "informal augmentations": "informal augmented", 

3194 "informal alternatives": "informal", 

3195 "strumental/locative/lative form": "instrumental locative lative", 

3196 "instrumental/locative/lative form": "instrumental locative lative", 

3197 "reflexive/dative/accusative form": "reflexive dative accusative", 

3198 "reflexive/accusative/dative form": "reflexive accusative dative", 

3199 "third-person/impersonal": "third-person impersonal", 

3200 "impersonal/third-person": "impersonal third-person", 

3201 "lative form": "lative", 

3202 "reflexive form": "reflexive", 

3203 "reflexive for": "reflexive form-of", 

3204 "passive for": "passive form-of", 

3205 "dative form": "dative", 

3206 "accusative form": "accusative", 

3207 "formal or literary": ["formal", "literary"], 

3208 "formal or plural": ["formal", "plural"], 

3209 "formal and written": "formal literary", 

3210 "addressing kings and queens": "formal deferential", 

3211 "adressing kings and queens": "formal deferential", 

3212 "impolite 2nd possessive": "informal second-person possessive", 

3213 "casual": "informal", 

3214 "fast speech": "informal", 

3215 "strong personal": "strong personal pronoun", 

3216 "weak personal": "weak personal pronoun", 

3217 "persent participle": "present participle", 

3218 "with adjective or adjective-phrase complement": "with-adjective", 

3219 "with accusative or dative": "with-accusative with-dative", 

3220 "with accusative or genitive": "with-accusative with-genitive", 

3221 "with accusative or ablative": "with-accusative with-ablative", 

3222 "genitive or accusative": ["genitive accusative"], 

3223 "genitive of personal pronoun": "genitive personal pronoun", 

3224 "nominative and accusative definite singular": "nominative accusative definite singular", 

3225 "not generally used in the plural": "singular-normally", 

3226 "+ genitive": "with-genitive", 

3227 "+ genitive possessive suffix or elative": "with-genitive with-possessive-suffix with-elative", 

3228 "+ genitive-accusative": "with-genitive", 

3229 "genitive + ~": "with-genitive postpositional", 

3230 "+ partitive or (less common) possessive suffix": "with-partitive with-possessive-suffix", 

3231 "+ allative": "with-allative", 

3232 "[an (about) + accusative]": "with-an with-accusative", 

3233 "less common": "uncommon", 

3234 "less frequently": "uncommon", 

3235 "no perfect or supine stem": "no-perfect no-supine", 

3236 "no present participle": "no-present-participle", 

3237 "no past participle": "no-past-participle", 

3238 "past participle (obsolete except in adjectival use)": "obsolete past participle", 

3239 "short past participle": "past participle short-form", 

3240 "short past adverbial perfective participle": "past adverbial perfective participle short-form", 

3241 "short past adverbial imperfective participle": "past adverbial imperfective participle short-form", 

3242 "short masculine": "masculine short-form", 

3243 "short feminine": "feminine short-form", 

3244 "short neuter": "neuter short-form", 

3245 "short plural": "plural short-form", 

3246 "short singular": "singular short-form", 

3247 "long past participle": "past participle long-form", 

3248 "of the past participle": "past participle", 

3249 "past participle n": "past participle neuter", 

3250 "past participle c": "past participle common-gender", 

3251 "past participle f": "past participle feminine", 

3252 "past participle m": "past participle masculine", 

3253 "past participle pl": "past participle plural", 

3254 "of the present participle": "present participle", 

3255 "adverbial locative noun in the pa, ku, or mu locative classes": "adverbial locative", 

3256 "comparative -": "no-comparative", 

3257 "superlative -": "no-superlative", 

3258 "comparative form only": "comparative-only", 

3259 "1 declension": "declension-1", 

3260 "4 declension": "declension-4", 

3261 "feminine ? declension": "feminine", 

3262 "masculine ? declension": "masculine", 

3263 "1st declension": "declension-1", 

3264 "2nd declension": "declension-2", 

3265 "3rd declension": "declension-3", 

3266 "4th declension": "declension-4", 

3267 "5th declension": "declension-5", 

3268 "6th declension": "declension-6", 

3269 "2nd-person": "second-person", 

3270 "1st-person": "first-person", 

3271 "3rd-person": "third-person", 

3272 "1st person": "first-person", 

3273 "2nd person": "second-person", 

3274 "3rd person": "third-person", 

3275 "1st actor trigger": "actor-i", 

3276 "2nd actor trigger": "actor-ii", 

3277 "3rd actor trigger": "actor-iii", 

3278 "4th actor trigger": "actor-iv", 

3279 "object trigger": "objective", 

3280 "1st object trigger": "objective actor-i", 

3281 "2nd object trigger": "objective actor-ii", 

3282 "3rd object trigger": "objective actor-iii", 

3283 "4th object trigger": "objective actor-iv", 

3284 "potential mood": "potential", 

3285 "causative mood": "causative", 

3286 "comitative trigger": "comitative", 

3287 "1st comitative trigger": "comitative actor-i", 

3288 "2nd comitative trigger": "comitative actor-ii", 

3289 "3rd comitative trigger": "comitative actor-iii", 

3290 "4th comitative trigger": "comitative actor-iv", 

3291 "locative trigger": "locative", 

3292 "thematic trigger": "thematic", 

3293 "benefactive trigger": "benefactive", 

3294 "instrument trigger": "instrumental", 

3295 "1st instrument trigger": "instrumental actor-i", 

3296 "2nd instrument trigger": "instrumental actor-ii", 

3297 "3rd instrument trigger": "instrumental actor-iii", 

3298 "4th instrument trigger": "instrumental actor-iv", 

3299 "1st": "first-person", 

3300 "2nd": "second-person", 

3301 "3rd": "third-person", 

3302 "plural inv": "plural invariable", 

3303 "plural not attested": "no-plural", 

3304 "no plural forms": "no-plural", 

3305 "not translated": "not-translated", 

3306 "not mutable": "not-mutable", 

3307 "used only predicatively": "predicative", 

3308 "only in predicative position": "predicative", 

3309 "only predicative": "predicative", 

3310 "only among women": "", 

3311 "predicate-only": "predicative error-misspelling", # eleng/Luxembourgish 

3312 "predicative only": "predicative", 

3313 "predicatively": "predicative", 

3314 "in attributive use": "attributive", 

3315 "(attributive)": "attributive", 

3316 "(predicative)": "predicative", 

3317 "(uncountable)": "uncountable", 

3318 "(as a measure)": "", 

3319 "only in attributive use": "attributive", 

3320 "present tense": "present", 

3321 "past tense": "past", 

3322 "feminine counterpart": "feminine", 

3323 "feminine form": "feminine", 

3324 "masculine counterpart": "masculine", 

3325 "masculine form": "masculine", 

3326 "neuter form": "neuter", 

3327 "passive counterpart": "passive", 

3328 "active counterpart": "active", 

3329 "attested mostly in the passive": "passive-mostly", 

3330 "basic stem form": "stem", 

3331 "no supine stem": "no-supine", 

3332 "no perfect stem": "no-perfect", 

3333 "construct state": "construct", 

3334 "construct form": "construct", 

3335 "phonemic reduplicative": "reduplication", 

3336 "reduplicated": "reduplication", 

3337 "neutrally formal": "polite", 

3338 "objective case": "objective", 

3339 "first person": "first-person", 

3340 "second person": "second-person", 

3341 "third person": "third-person", 

3342 "nominative case": "nominative", 

3343 "genitive case": "genitive", 

3344 "genitive 1": "genitive", 

3345 "genitive 2": "genitive", 

3346 "genitive 3": "genitive", 

3347 "dative case": "dative", 

3348 "dative 1": "dative", 

3349 "dative 2": "dative", 

3350 "dative 3": "dative", 

3351 "accusative 1": "accusative", 

3352 "accusative 2": "accusative", 

3353 "accusative 3": "accusative", 

3354 "accusative case": "accusative", 

3355 "ergative cases": "ergative", 

3356 "absolutive case": "absolutive", 

3357 "ablative case": "ablative", 

3358 "genitive unattested": "no-genitive", 

3359 "genitive -": "no-genitive", 

3360 "nominative plural -": "no-nominative-plural", 

3361 "colloquially also feminine": "colloquial feminine", 

3362 "colloquial or pejorative": "colloquial pejorative", 

3363 "colloquial or dialectal": "colloquial dialectal", 

3364 "pejorative or racial slur": "pejorative slur", 

3365 "pejoratively": "pejorative", 

3366 "pej.": "pejorative", 

3367 "racial slur": "slur", 

3368 "in some dialects": "dialectal", 

3369 "in other dialects": "dialectal", 

3370 "dialects": "dialectal", 

3371 "pejorativ": "pejorative error-misspelling", 

3372 "idionomic": "idiomatic error-misspelling", 

3373 "idiom": "idiomatic", 

3374 "humorously self-deprecating": "humorous self-depreciating", 

3375 "self-depeciatory": "self-depreciating", 

3376 "rare/awkward": "rare", 

3377 "rare/archaic": "archaic", 

3378 "archaic or Scotland": "archaic Scotland", 

3379 "extremely rare": "rare", 

3380 "now quite rare": "rare", 

3381 "rarefied": "rare", 

3382 "rarely": "rare", 

3383 "rarer form": "rare", 

3384 "relatively rare": "rare", 

3385 "personified": "person", 

3386 "person or animal": "person animal-not-person", 

3387 "found only in the imperfective tenses": "no-perfect", 

3388 "imperfekt": "imperfect error-misspelling", 

3389 "imperf. aspect": "imperfect", 

3390 "complete": "completive", 

3391 "perfective 1": "perfect", 

3392 "perfective 2": "perfect", 

3393 "in counterfactual conditionals": "conditional counterfactual", 

3394 "improbable of counterfactual": "usually counterfactual", 

3395 "third plural indicative": "third-person plural indicative", 

3396 "defective verb": "defective", 

3397 "+ active 3rd infinitive in elative": "with-infinitive-iii-elative", 

3398 "+ active 3rd infinitive in illative": "with-infinitive-iii-illative", 

3399 "+ third infinitive in illative": "with-infinitive-iii-illative", 

3400 "+ verb in 3rd infinitive abessive": "with-infinitive-iii-abessive", 

3401 "+ verb in third infinitive illative or adverb": "with-infinitive-iii with-illative with-adverb", 

3402 "+ partitive + 3rd person singular": "with-partitive", 

3403 "3rd possessive": "third-person possessive", 

3404 "active voice": "active", 

3405 "+ infinitive": "with-infinitive", 

3406 "+ first infinitive": "with-infinitive-i", 

3407 "transitive + first infinitive": "transitive with-infinitive-i", 

3408 "transitive + kV": "transitive with-kV", # gǀkxʻâã/ǃXóõ 

3409 "+ a + infinitive": "with-a with-infinitive", 

3410 "+ indicative mood": "with-indicative", 

3411 "+ conditional mood": "with-conditional", 

3412 "+nominative": "with-nominative", 

3413 "+ nominative": "with-nominative", 

3414 "plus genitive": "with-genitive", 

3415 "+ genetive": "with-genitive error-misspelling", 

3416 "+genitive": "with-genitive", 

3417 "+ genitive case": "with-genitive", 

3418 "genitive +": "with-genitive", 

3419 "nominative +": "with-nominative", 

3420 "genitive or possessive suffix +": "with-genitive with-possessive-suffix", 

3421 "with genitive case": "with-genitive", 

3422 "with genitive": "with-genitive", 

3423 "+dative": "with-dative", 

3424 "+ dative case": "with-dative", 

3425 "dative case +": "with-dative", 

3426 "+ dative": "with-dative", 

3427 "+ historic dative": "with-dative historic", 

3428 "only with adjectives": "with-adjective", 

3429 "plus dative": "with-dative", 

3430 "plus dative case": "with-dative", 

3431 "with dative": "with-dative", 

3432 "with the dative": "with-dative", 

3433 "with dative case": "with-dative", 

3434 "+ accusative": "with-accusative", 

3435 "+ accusative case": "with-accusative", 

3436 "+accusative": "with-accusative", 

3437 "with accusative case": "with-accusative", 

3438 "with the accusative": "with-accusative", 

3439 "with accusative": "with-accusative", 

3440 "plus accusative": "with-accusative", 

3441 "takes accusative": "with-accusative", 

3442 "takes accusative object": "with-accusative", 

3443 "governs the accusative": "with-accusative", 

3444 "governs the genitive": "with-genitive", 

3445 "governs the dative": "with-dative", 

3446 "takes dative": "with-dative", 

3447 "takes dative case": "with-dative", 

3448 "zhuyin": "Bopomofo", 

3449 "Zhuyin": "Bopomofo", 

3450 "East Midland": "East Midlands", 

3451 "Yorkshire & East Midlands": "Yorkshire East-Midlands", 

3452 "+ partitive": "with-partitive", 

3453 "+ partitive + vastaan": "with-partitive", 

3454 "+partitive": "with-partitive", 

3455 "with partitive case": "with-partitive", 

3456 "plus partitive": "with-partitive", 

3457 "with partitive": "with-partitive", 

3458 "+ablative": "with-ablative", 

3459 "+ ablative": "with-ablative", 

3460 "with ablative case": "with-ablative", 

3461 "plus ablative": "with-ablative", 

3462 "with ablative": "with-ablative", 

3463 "+ subjunctive": "with-subjunctive", 

3464 "+subjunctive": "with-subjunctive", 

3465 "plus subjunctive": "with-subjunctive", 

3466 "with subjunctive": "with-subjunctive", 

3467 "with subjunctives": "with-subjunctive", 

3468 "+ subordinate clause": "with-subordinate-clause", 

3469 "+ instrumental": "with-instrumental", 

3470 "+instrumental": "with-instrumental", 

3471 "+ instrumental case": "with-instrumental", 

3472 "with instrumental case": "with-instrumental", 

3473 "with instrumental": "with-instrumental", 

3474 "plus instrumental": "with-instrumental", 

3475 "with instrumental or genitive case": "with-instrumental with-genitive", 

3476 "with instrumental or dative case": "with-instrumental with-dative", 

3477 "+ locative": "with-locative", 

3478 "+ locative case": "with-locative", 

3479 "with locative": "with-locative", 

3480 "+ illative": "with-illative", 

3481 "intransitive + illative": "intransitive with-illative", 

3482 "intransitive + elative": "intransitive with-elative", 

3483 "intransitive + inessive or adessive": "intransitive with-inessive with-adessive", 

3484 "intransitive + inessive": "intransitive with-inessive", 

3485 "intransitive + adessive": "intransitive with-adessive", 

3486 "intransitive + translative": "intransitive with-translative", 

3487 "intransitive + partitive or transitive + accusative": "intransitive with-partitive transitive with-accusative", 

3488 "transitive + partitive": "transitive with-partitive", 

3489 "transitive + partitive + essive": "transitive with-partitive with-essive", 

3490 "transitive + elative + kiinni": "transitive with-elative", 

3491 "transitive (+ yllään) + partitive": "transitive with-partitive", 

3492 "transitive + accusative": "transitive with-accusative", 

3493 "transitive + elative": "transitive with-elative", 

3494 "transitive or reflexive": "transitive reflexive", 

3495 "illative + 3rd-person singular": "with-illative with-third-person-singular", 

3496 "partitive + 3rd-person singular": "with-partitive with-third-person-singular", 

3497 "+ translative": "with-translative", 

3498 "+ negative adjective in translative": "with-translative with-negative-adj", 

3499 "with negation": "with-negation", 

3500 "with negated verb": "with-negation", 

3501 "when negated": "with-negation", 

3502 "usu. in negative": "usually with-negation", 

3503 "predicate of copula": "copulative", 

3504 "copular verb": "copulative", 

3505 "copula": "copulative", # náina/Phalura 

3506 "+ adessive": "with-adessive", 

3507 "+ adessive or illative": "with-adessive with-illative", 

3508 "+absolutive": "with-absolutive", 

3509 "+ absolutive": "with-absolutive", 

3510 "with absolutive case": "with-absolutive", 

3511 "with absolutive": "with-absolutive", 

3512 "+ absolutive case": "with-absolutive", 

3513 "plus absolutive": "with-absolutive", 

3514 "take nouns in absolute case": "with-absolute", 

3515 "takes nouns in absolute case": "with-absolute", 

3516 "takes absolute case": "with-absolute", 

3517 "+elative": "with-elative", 

3518 "+ elative": "with-elative", 

3519 "elative +": "with-elative", 

3520 "elative case": "elative", 

3521 "+ [elative]": "with-elative", 

3522 "with elative case": "with-elative", 

3523 "with elative": "with-elative", 

3524 "plus elative": "with-elative", 

3525 "+ essive": "with-essive", 

3526 "+ comparative": "with-comparative", 

3527 "+objective": "with-objective", 

3528 "+ objective": "with-objective", 

3529 "with objective case": "with-objective", 

3530 "with objective": "with-objective", 

3531 "plus objective": "with-objective", 

3532 "sublative case": "sublative", 

3533 "terminative case": "terminative", 

3534 "+ present form": "with-present", 

3535 "+ noun phrase] + subjunctive (verb)": "with-noun-phrase with-subjunctive", 

3536 "with noun phrase": "with-noun-phrase", 

3537 "+ [nounphrase] + subjunctive": "with-noun-phrase with-subjunctive", 

3538 "+ number": "with-number", 

3539 "with number": "with-number", 

3540 "optative mood +": "with-optative", 

3541 "not used in plural form": "no-plural", 

3542 "in plural the singular form is used": "singular-only", 

3543 "indecl": "indeclinable", 

3544 "all forms unconjugated": "indeclinable", 

3545 "not declined": "indeclinable", 

3546 "not declinable": "indeclinable", 

3547 "undeclinable": "indeclinable", 

3548 "inconjugable": "indeclinable error-misspelling", 

3549 "indeclinable?": "indeclinable", 

3550 "no inflections": "indeclinable", 

3551 "not often used": "rare", 

3552 "interrogative adverb": "interrogative adverb", 

3553 "perfect tense": "perfect", 

3554 "intensive": "emphatic", 

3555 "intensifier": "emphatic", 

3556 "changed conjunct form": "conjunct", 

3557 "biblical hebrew pausal form": "pausal Biblical", 

3558 "bible": "Biblical", 

3559 "Bibilical": "Biblical", 

3560 "emphatic form": "emphatic", 

3561 "emphatic form of": "emphatic form-of", 

3562 "emphatically": "emphatic", 

3563 "emphatical": "emphatic", 

3564 "standard form": "standard", 

3565 "augmented form": "augmented", 

3566 "active form": "active", 

3567 "passive form": "passive", 

3568 "pre-1989 IPA": "pre-1989-IPA", 

3569 "mutated form": "mutated", 

3570 "auxiliary verb": "auxiliary", 

3571 "modal auxiliary verb": "auxiliary modal", 

3572 "transitive verb": "transitive", 

3573 "tr and intr": "transitive intransitive", 

3574 "intransitive verb": "intransitive", 

3575 "transitive or intransitive": "transitive intransitive", 

3576 "male equivalent": "masculine", 

3577 "in compounds": "in-compounds", 

3578 "in combination": "in-compounds", 

3579 "attribute": "attributive", 

3580 "in the past subjunctive": "with-past with-subjunctive", 

3581 "in conditional": "with-conditional", 

3582 "use the subjunctive tense of the verb that follows": "with-subjunctive", 

3583 "kyūjitai form": "kyūjitai", 

3584 "kyūjitai kanji": "kyūjitai", 

3585 "shinjitai form": "shinjitai", 

3586 "shinjitai kanji": "shinjitai", 

3587 "grade 1 “Kyōiku” kanji": "grade-1-kanji", 

3588 "grade 2 “Kyōiku” kanji": "grade-2-kanji", 

3589 "grade 3 “Kyōiku” kanji": "grade-3-kanji", 

3590 "grade 4 “Kyōiku” kanji": "grade-4-kanji", 

3591 "grade 5 “Kyōiku” kanji": "grade-5-kanji", 

3592 "grade 6 “Kyōiku” kanji": "grade-6-kanji", 

3593 "uncommon “Hyōgai” kanji": "uncommon Hyōgai", 

3594 "dialectical": "dialectal", 

3595 "dialectal or archaic": "dialectal archaic", 

3596 "dialectal or poetic": "dialectal poetic", 

3597 "dialect": "dialectal", 

3598 "obsolescent": "possibly obsolete", 

3599 "obsolete outside dialects": "obsolete dialectal", 

3600 "antiquated": "dated", 

3601 "dated or regional": "dated regional", 

3602 "dated or archaic": "archaic", 

3603 "common and polite term": "polite", 

3604 "most common but potentially demeaning term": "possibly derogatory", 

3605 "highly academic": "literary", 

3606 "highly irregular": "irregular", 

3607 "academic": "literary", 

3608 "learned": "literary", 

3609 "archaic ortography": "archaic", 

3610 "archaic elsewhere": "dialectal", 

3611 "derog.": "derogatory", 

3612 "derogative": "derogatory", 

3613 "derogatively": "derogatory", 

3614 "disparaging": "derogatory", 

3615 "disparagingly": "derogatory", # feic/Irish 

3616 "deprecative": "derogatory", 

3617 "collective sense": "collective", 

3618 "very rare": "rare", 

3619 "very informal": "informal", 

3620 "less formal": "informal", 

3621 "very archaic": "archaic", 

3622 "outdated": "archaic", 

3623 "historiographic": "historical", 

3624 "with a + inf.": "with-a with-infinitive", 

3625 "with di + inf.": "with-di with-infinitive", 

3626 "with che + subj.": "with-che with-subjunctive", 

3627 "with inf.": "with-infinitive", 

3628 "with infinitive": "with-infinitive", 

3629 "with following infinitive": "with-infinitive", 

3630 "followed by an infinitive": "with-infinitive", 

3631 "zu-infinitive": "infinitive infinitive-zu", 

3632 "zu infinitive": "infinitive infinitive-zu", 

3633 "da-infinitive": "infinitive infinitive-da", 

3634 "Use the future tense": "with-future", 

3635 # XXX re-enable "~ се": "with-ce", 

3636 "strong/mixed": "strong mixed", 

3637 "strong/weak/mixed": "strong weak mixed", 

3638 "weak/mixed": "weak mixed", 

3639 "weak verb": "weak", 

3640 "Weak conjugation": "weak", 

3641 "Strong conjugation": "strong", 

3642 "no auxiliary": "no-auxiliary", 

3643 "masculine/feminine": "masculine feminine", 

3644 "masculine/neuter": "masculine neuter", 

3645 "present/future": "present future", 

3646 "present/perfect": "present perfect", 

3647 "present/preterite": "present preterite", 

3648 "future/present": "present future", 

3649 "present/aoriest": "present aorist error-misspelling", 

3650 "superlative degree": "superlative", 

3651 "sup.": "superlative", 

3652 "comparative degree": "comparative", 

3653 "comp.": "comparative", 

3654 "comparatives": "comparative", 

3655 "positive degree": "positive", 

3656 "pos.": "positive", 

3657 "positive outcome": "positive", 

3658 "negative outcome": "negative", 

3659 "equative degree": "equative", 

3660 "indicative and subjunctive": "indicative subjunctive", 

3661 "indicative/subjunctive": "indicative subjunctive", 

3662 "second/third-person": "second-person third-person", 

3663 "singular/plural": "singular plural", 

3664 "in the singular": "singular", 

3665 "in singular": "singular", 

3666 "in plural": "plural", 

3667 "dual/plural": "dual plural", 

3668 "collective or in the plural": "collective in-plural", 

3669 "in the plural": "in-plural", 

3670 "(with savrtsobi)": "with-savrtsobi", 

3671 "plural and definite singular": ["plural", "definite singular"], 

3672 "feminine singular & neuter plural": ["feminine singular", "neuter plural"], 

3673 "partitive/illative": "partitive illative", 

3674 "oblique/nominative": "oblique nominative", 

3675 "nominative/vocative/dative/strong genitive": [ 

3676 "nominative vocative dative", 

3677 "strong genitive", 

3678 ], 

3679 "non-attributive": "predicative", 

3680 "not predicative": "attributive", 

3681 "attributive use": "attributive", 

3682 "nominative/vocative/instrumental": "nominative vocative instrumental", 

3683 "nominative/vocative/strong genitive/dative": [ 

3684 "nominative vocative dative", 

3685 "strong genitive", 

3686 ], 

3687 "nominative/vocative/dative": "nominative vocative dative", 

3688 "accusative/genitive/partitive/illative": "accusative genitive partitive illative", 

3689 "nominative/vocative/accusative/genitive": "nominative vocative accusative genitive", 

3690 "accusative/genitive/locative": "accusative locative genitive", 

3691 "accusative/genitive/dative/instrumental": "accusative genitive dative instrumental", 

3692 "accusative/genitive/dative": "accusative genitive dative", 

3693 "accusative/genitive": "accusative genitive", 

3694 "masculine/feminine/neuter": "masculine feminine neuter", 

3695 "feminine/neuter/masculine": "masculine feminine neuter", 

3696 "feminine/neuter": "feminine neuter", 

3697 "present participle and present tense": ["present participle", "present"], 

3698 "present participle and gerund": ["present participle", "gerund"], 

3699 "past indicative and past participle": "past indicative participle", 

3700 "all-gender": "", 

3701 "gender unknown": "", 

3702 "all-case": "", 

3703 "accusative/dative": "accusative dative", 

3704 "accusative-singular": "accusative singular", 

3705 "accusative-genitive": "accusative genitive", 

3706 "dative/locative/instrumental": "dative locative instrumental", 

3707 "dative/vocative": "dative vocative", 

3708 "dative/vocative/locative": "dative vocative locative", 

3709 "dative/prepositional": "dative prepositional", 

3710 "dative/prepositional/vocative": "dative prepositional vocative", 

3711 "prepositional/vocative": "prepositional vocative", 

3712 "prepositional/locative": "prepositional locative", 

3713 "dative and ablative": "dative ablative", 

3714 "nominative/vocative/dative and strong genitive": [ 

3715 "nominative vocative dative", 

3716 "strong genitive", 

3717 ], 

3718 "nominative/vocative/accusative": "nominative vocative accusative", 

3719 "nominative/vocative": "nominative vocative", 

3720 "nominative/oblique": "nominative oblique", 

3721 "nominative/locative": "nominative locative", 

3722 "nominative/instrumental": "nominative instrumental", 

3723 "nominative/genitive/dative/accusative": "nominative genitive dative accusative", 

3724 "nominative/genitive/dative": "nominative genitive dative", 

3725 "nominative/genitive/accusative/vocative": "nominative genitive accusative vocative", 

3726 "nominative/genitive/accusative": "nominative genitive accusative", 

3727 "nominative/dative": "nominative dative", 

3728 "nominative/accusative/vocative/instrumental": "nominative accusative vocative instrumental", 

3729 "nominative/accusative/vocative": "nominative accusative vocative", 

3730 "nominative/accusative/nominative/accusative": "nominative accusative", 

3731 "nominative/accusative/nominative": "nominative accusative", 

3732 "nominative/accusative/locative": "nominative accusative locative", 

3733 "nominative/accusative/genitive/dative": "nominative accusative genitive dative", 

3734 "nominative/accusative/genitive": "nominative accusative genitive", 

3735 "nominative/accusative/dative": "nominative accusative dative", 

3736 "nominative/accusative": "nominative accusative", 

3737 "perfective/imperfective": "perfective imperfective", 

3738 "imperfective/perfective": "imperfective perfective", 

3739 "neg. perfective": "perfective negative", 

3740 "neg. continuous": "continuative negative", 

3741 "negative form": "negative", 

3742 "negating particle": "negative particle", 

3743 "negation": "negative", 

3744 "continuous": "continuative", 

3745 "continuously": "continuative", 

3746 "animate/inanimate": "animate inanimate", 

3747 "animate or inanimate": "animate inanimate", 

3748 "locative/vocative": "locative vocative", 

3749 "prospective/agentive": "prospective agentive", 

3750 "genitive/accusative": "genitive accusative", 

3751 "singular/duoplural": "singular dual plural", 

3752 "duoplural": "dual plural", 

3753 "1st/3rd": "first-person third-person", 

3754 "first/second-person": "first-person second-person", 

3755 "first/second/third-person": "first-person second-person third-person", 

3756 "first/third/third-person": "first-person third-person", 

3757 "first-/third-person": "first-person third-person", 

3758 "first/second/second-person": "first-person second-person", 

3759 "first/third-person": "first-person third-person", 

3760 "first-person/second-person": "first-person second-person", 

3761 "first-person/third-person": "first-person third-person", 

3762 "first-person singular/third-person singular": "first-person third-person singular", 

3763 "first-person singular/third-person plural": [ 

3764 "first-person singular", 

3765 "third-person plural", 

3766 ], 

3767 "affirmative/negative": "affirmative negative", 

3768 "first-, second-, third-person singular subjunctive present": "first-person second-person third-person singular subjunctive present", 

3769 "first-, second- and third-person singular present indicative": "first-person second-person third-person singular present indicative", 

3770 "first- and third-person": "first-person third-person", 

3771 "female equivalent": "feminine", 

3772 "direct/oblique/vocative": "direct oblique vocative", 

3773 "definite/plural": "definite plural", 

3774 "singular definite and plural": ["singular definite", "plural"], 

3775 "agent noun": "agent", 

3776 "agent noun of": "agent form-of", 

3777 "Principle verb suffix": "agent suffix noun-from-verb", 

3778 "third active infinitive": "infinitive-iii active", 

3779 "third passive infinitive": "infinitive-iii passive", 

3780 "British spelling": "UK", 

3781 "American spelling": "US", 

3782 "IUPAC spelling": "IUPAC", 

3783 "Roman spelling": "romanization", 

3784 "Perso-Arabic spelling": "Perso-Arabic", 

3785 "Arabic/Persian": "Arabic Persian", 

3786 "Arabic spelling": "Arabic", 

3787 "Urdu spelling": "Urdu", 

3788 "Urdu spelling of": "Urdu alt-of", 

3789 "Hindi spelling": "Hindi", 

3790 "Jawi spelling": "Jawi", 

3791 "Mongolian spelling": "Mongolian", 

3792 "Shahmukhi spelling": "Shahmukhi", 

3793 "Rumi spelling": "Rumi", 

3794 "Gurmukhi spelling": "Gurmukhi", 

3795 "Hebrew spelling": "Hebrew", 

3796 "Hebrew Script": "Hebrew", 

3797 "Hebrew alphabet": "Hebrew", 

3798 "Baybayin spelling": "Baybayin", 

3799 "Tai-Tham spelling": "Tai-Tham", 

3800 "Greek spelling": "Greek", 

3801 "Thai spelling": "Thai", 

3802 "Newa spelling": "Newa", 

3803 "Devanagari spelling": "Devanagari", 

3804 "Javanese spelling": "Javanese", 

3805 "Gujarati spelling": "Gujarati", 

3806 "Cham spelling": "Cham", 

3807 "eye dialect": "pronunciation-spelling", 

3808 "feminist or eye dialect": "pronunciation-spelling", 

3809 "enclitic and proclitic": "enclitic proclitic", 

3810 "Enclitic contractions": "enclitic contraction", 

3811 "Proclitic contractions": "proclitic contraction", 

3812 "enclitic form": "enclitic", 

3813 "Devanagari script form of": "alt-of Devanagari", 

3814 "Hebrew script": "Hebrew", 

3815 "Mongolian script": "Mongolian", 

3816 "Bengali script": "Bengali", 

3817 "script": "character", 

3818 "letters": "letter", 

3819 "digits": "digit", 

3820 "characters": "character", 

3821 "symbols": "symbol", 

3822 "tetragrams": "symbol", 

3823 "letter names": "letter-name", 

3824 "Cyrillic-script": "Cyrillic", 

3825 "Latin-script": "Latin", 

3826 "Latin alphabet": "Latin", 

3827 "obsolete form of": "alt-of obsolete", 

3828 "former word": "obsolete", 

3829 "obs.": "obsolete", 

3830 "etymological spelling": "nonstandard", 

3831 "(Dialectological)": "dialectal", 

3832 "dialectal or nonstandard": "dialectal", 

3833 "(hence past tense)": "past", 

3834 "(ablative case)": "ablative", 

3835 "(genitive case)": "genitive", 

3836 "(suffix conjugation)": "suffix", 

3837 "(prefix conjugation)": "prefix", 

3838 "(nós)": "with-nos", 

3839 "(eu)": "with-eu", 

3840 "(vós)": "with-vós", 

3841 "(vos)": "with-vos", 

3842 "(voseo)": "with-voseo", 

3843 "voseo": "with-voseo", 

3844 "(tu)": "with-tu", 

3845 "(tú)": "with-tú", 

3846 "(eles)": "with-eles", 

3847 "(elas)": "with-elas", 

3848 "(vocês)": "with-vocês", 

3849 "(usted)": "with-usted", 

3850 "(ustedes)": "with-ustedes", 

3851 "(yo)": "with-yo", 

3852 "(ele, ela, also used with tu and você?)": "with-ele with-ela with-tu with-você", 

3853 "(eles and elas, also used with vocês and others)": "with-eles with-elas with-vocês with-others", 

3854 "(eles, elas, also used with vocês)": "with-eles with-elas with-vocês", 

3855 "(você)": "with-você", 

3856 "(hiri)": "with-hiri", 

3857 "(hura)": "with-hura", 

3858 "(zuek)": "with-zuek", 

3859 "(vós, sometimes used with vocês)": "with-vós with-vocês", 

3860 "(gij)": "with-gij", 

3861 "(tu, sometimes used with você)": "with-tu with-você", 

3862 "(\u00e9l, ella, also used with usted)": "with-él with-ella with-usted", 

3863 "(ellos, ellas, also used with ustedes)": "with-ellos with-ellas with-ustedes", 

3864 "(nosotros, nosotras)": "with-nosotros with-nosotras", 

3865 "(vosotros, vosotras)": "with-vosotros with-vosotras", 

3866 "(vosotros or vosotras)": "with-vosotros with-vosotras", 

3867 "(ele and ela, also used with você and others)": "with-ele with-ela with-você with-others", 

3868 "(ele, ela, also used with tu and você)": "with-ele with-ela with-tu with-você", 

3869 "former reform[s] only": "", 

3870 "no conj.": "", # XXX conjunctive/conjugation/indeclinable? dot/Latvian 

3871 "no construct forms": "no-construct-forms", 

3872 "no nominative plural": "no-nominative-plural", 

3873 "no supine": "no-supine", 

3874 "no perfect": "no-perfect", 

3875 "no perfective": "no-perfect", 

3876 "no genitive": "no-genitive", 

3877 "no superlative": "no-superlative", 

3878 "no sup.": "no-superlative", 

3879 "no comparative": "no-comparative", 

3880 "no comp.": "no-comparative", 

3881 "no singulative": "no-singulative", 

3882 "no plural": "no-plural", 

3883 "no singular": "plural-only plural", 

3884 "not comparable": "not-comparable", 

3885 "incomparable": "not-comparable", 

3886 "not generally comparable": "usually not-comparable", 

3887 "plurale tantum": "plural-only plural", 

3888 "plurare tantum": "plural-only plural", 

3889 "pluralia tantum": "plural-only plural", 

3890 "singulare tantum": "singular-only singular", 

3891 "normally plural": "plural-normally", 

3892 "used mostly in plural form": "plural-normally", 

3893 "used mostly in the plural form": "plural-normally", 

3894 "most often in the plural": "plural-normally", 

3895 "used especially in the plural form": "plural-normally", 

3896 "usually in the plural": "plural-normally", 

3897 "now usually in the plural": "plural-normally", 

3898 "suffixed pronoun": "suffix pronoun", 

3899 "possessive suffix": "possessive suffix", 

3900 "possessive determiner": "possessive determiner", 

3901 "pronominal state": "pronominal-state", 

3902 "nominal state": "nominal-state", 

3903 "form i": "form-i", 

3904 "form ii": "form-ii", 

3905 "form iii": "form-iii", 

3906 "form iv": "form-iv", 

3907 "form v": "form-v", 

3908 "form vi": "form-vi", 

3909 "form vii": "form-vii", 

3910 "form viii": "form-viii", 

3911 "form ix": "form-ix", 

3912 "form x": "form-x", 

3913 "form xi": "form-xi", 

3914 "form xii": "form-xii", 

3915 "form xiii": "form-xiii", 

3916 "form iq": "form-iq", 

3917 "form iiq": "form-iiq", 

3918 "form iiiq": "form-iiiq", 

3919 "form ivq": "form-ivq", 

3920 "form I": "form-i", 

3921 "form-I": "form-i", 

3922 "form II": "form-ii", 

3923 "form-II": "form-ii", 

3924 "form III": "form-iii", 

3925 "form-III": "form-iii", 

3926 "form IV": "form-iv", 

3927 "form-IV": "form-iv", 

3928 "form V": "form-v", 

3929 "form-V": "form-v", 

3930 "form VI": "form-vi", 

3931 "form-VI": "form-vi", 

3932 "form VII": "form-vii", 

3933 "form-VII": "form-vii", 

3934 "form VIII": "form-viii", 

3935 "form-VIII": "form-viii", 

3936 "form IX": "form-ix", 

3937 "form-IX": "form-ix", 

3938 "form X": "form-x", 

3939 "form-X": "form-x", 

3940 "form XI": "form-xi", 

3941 "form-XI": "form-xi", 

3942 "form XII": "form-xii", 

3943 "form-XII": "form-xii", 

3944 "form XIII": "form-xiii", 

3945 "form-XIII": "form-xiii", 

3946 "form Iq": "form-iq", 

3947 "form IIq": "form-iiq", 

3948 "form IIIq": "form-iiiq", 

3949 "form IVq": "form-ivq", 

3950 "class 1": "class-1", 

3951 "class 1a": "class-1a", 

3952 "class 2": "class-2", 

3953 "class 2a": "class-2a", 

3954 "class 3": "class-3", 

3955 "class 4": "class-4", 

3956 "class 5": "class-5", 

3957 "class 6": "class-6", 

3958 "class 7": "class-7", 

3959 "class 8": "class-8", 

3960 "class 9": "class-9", 

3961 "class 9a": "class-9a", 

3962 "class 10": "class-10", 

3963 "class 10a": "class-10", 

3964 "class 11": "class-11", 

3965 "class 12": "class-12", 

3966 "class 13": "class-13", 

3967 "class 14": "class-14", 

3968 "class 15": "class-15", 

3969 "class 16": "class-16", 

3970 "class 17": "class-17", 

3971 "class 18": "class-18", 

3972 "m-wa class": "class-1 class-2", 

3973 "m-mi class": "class-3 class-4", 

3974 "ma class": "class-5 class-6", 

3975 "ki-vi class": "class-7 class-8", 

3976 "n class": "class-9 class-10", 

3977 "u class": "class-11 class-12 class-14", 

3978 "ku class": "class-15", 

3979 "pa class": "class-16", 

3980 # "ku class": "class-17", # XXX how to distinguish from class-15? 

3981 "mu class": "class-18", 

3982 "first declension": "declension-1", 

3983 "second declension": "declension-2", 

3984 "third declension": "declension-3", 

3985 "fourth declension": "declension-4", 

3986 "fifth declension": "declension-5", 

3987 "first-declension": "declension-1", 

3988 "second-declension": "declension-2", 

3989 "third-declension": "declension-3", 

3990 "fourth-declension": "declension-4", 

3991 "fifth-declension": "declension-5", 

3992 "1st conj.": "conjugation-1", 

3993 "2nd conj.": "conjugation-2", 

3994 "3rd conj.": "conjugation-3", 

3995 "4th conj.": "conjugation-4", 

3996 "5th conj.": "conjugation-5", 

3997 "6th conj.": "conjugation-6", 

3998 "7th conj.": "conjugation-7", 

3999 "first conjugation": "conjugation-1", 

4000 "second conjugation": "conjugation-2", 

4001 "third conjugation": "conjugation-3", 

4002 "fourth conjugation": "conjugation-4", 

4003 "fifth conjugation": "conjugation-5", 

4004 "sixth conjugation": "conjugation-6", 

4005 "seventh conjugation": "conjugation-7", 

4006 "stress pattern 1": "stress-pattern-1", 

4007 "stress pattern 2": "stress-pattern-2", 

4008 "stress pattern 3": "stress-pattern-3", 

4009 "stress pattern 3a": "stress-pattern-3a", 

4010 "stress pattern 3b": "stress-pattern-3b", 

4011 "stress pattern 4": "stress-pattern-4", 

4012 "preposition stressed": "stressed-preposition", 

4013 "tone I": "tone-1", 

4014 "tone II": "tone-2", 

4015 "type p": "type-p", 

4016 "type P": "type-p", 

4017 "type u": "type-u", 

4018 "type U": "type-u", 

4019 "type up": "type-up", 

4020 "type UP": "type-up", 

4021 "type a": "type-a", 

4022 "type A": "type-a", 

4023 "type ua": "type-ua", 

4024 "type UA": "type-ua", 

4025 "form of": "form-of", 

4026 "ordinal form of": "ordinal form-of", 

4027 "ordinal form of the number": "ordinal form-of", 

4028 "ordinal of": "ordinal form-of", 

4029 "ordinal number corresponding to the cardinal number": "ordinal form-of", 

4030 "ordinal form of the cardinal number": "ordinal form-of", 

4031 "the ordinal number": "ordinal alt-of", 

4032 "used in the form": "used-in-the-form", 

4033 "upper case": "uppercase", 

4034 "upper-case": "uppercase", 

4035 "lower case": "lowercase", 

4036 "lower-case": "lowercase", 

4037 "mixed case": "mixedcase", 

4038 "mixed-case": "mixedcase", 

4039 "capital": "uppercase", 

4040 "verb form i": "verb-form-i", 

4041 "verb form ii": "verb-form-ii", 

4042 "pi'el construction": "construction-pi'el", 

4043 "pa'el construction": "construction-pa'el", 

4044 "pa'al construction": "construction-pa'al", 

4045 "hif'il construction": "construction-hif'il", 

4046 "hitpa'el construction": "construction-hitpa'el", 

4047 "hitpu'al construction": "construction-hitpu'al", 

4048 "pu'al construction": "construction-pu'al", 

4049 "nif'al construction": "construction-nif'al", 

4050 "huf'al construction": "construction-huf'al", 

4051 "peal construction": "construction-peal", 

4052 "verbal noun": "noun-from-verb", 

4053 "Verbal derivations": "verb", 

4054 "abstract noun": "abstract-noun", 

4055 "concrete verb": "concrete", 

4056 "concrete verbs": "concrete", 

4057 "genitive singular as substantive": "genitive singular substantive", 

4058 "female names": "feminine proper-noun", 

4059 "proper name": "proper-noun", 

4060 "proper noun": "proper-noun", 

4061 "proper nouns": "proper-noun", 

4062 "usually in the": "usually", 

4063 "usually in the negative": "usually with-negation", 

4064 "non-scientific usage": "non-scientific", 

4065 "krama inggil": "honorific", 

4066 "krama andhap": "humble", 

4067 "krama-ngoko": "informal", 

4068 "ngoko": "informal", 

4069 "McCune–Reischauer": "McCune-Reischauer", # Dash type differs 

4070 "gender indeterminate": "gender-neutral", 

4071 "singular only": "singular-only singular", 

4072 "not used in plural": "singular-only singular", 

4073 "singularonly": "singular-only singular", 

4074 "plural only": "plural plural-only", 

4075 "imperative only": "imperative-only", 

4076 "Imperative form of of": "imperative form-of", # ba/Middle English 

4077 "in general sense": "broadly", 

4078 "by extension": "broadly", 

4079 "by metonymy": "metonymically", 

4080 "metonymic": "metonymically", 

4081 "by synecdoche": "synecdoche", 

4082 "by semantic narrowing": "narrowly", 

4083 "by semantic widening": "broadly", 

4084 "strict sense": "strict-sense", 

4085 "baby talk": "baby-talk", 

4086 "middle infinitive": "middle-infinitive", 

4087 "first infinitive": "infinitive-i", 

4088 "third-person form of the long first infinitive of": "third-person infinitive-i-long form-of", 

4089 "second infinitive": "infinitive-ii", 

4090 "second active infinitive": "infinitive-ii active", 

4091 "second passive infinitive": "infinitive-ii passive", 

4092 "third infinitive": "infinitive-iii", 

4093 "fourth infinitive": "infinitive-iv", 

4094 "fifth infinitive": "infinitive-v", 

4095 "subjunctive I": "subjunctive-i", 

4096 "subjunctive II": "subjunctive-ii", 

4097 "morse code": "morse-code", 

4098 "with odd-syllable stems": "with-odd-syllable-stems", 

4099 "Brazilian ortography": "Brazilian", 

4100 "European ortography": "European", 

4101 "contracted dem-form": "contracted-dem-form", 

4102 "contractions": "contraction", 

4103 "Yale cen": "Yale", 

4104 "subjective pronoun": "subjective pronoun", 

4105 "subject": "subjective", 

4106 "subject form": "subjective", 

4107 "‘subject form’": "subjective", # tw.t/Egyptian 

4108 # "object": "objective", # XXX problems with "An object of ..." form_of 

4109 "possessive pronoun": "possessive pronoun without-noun", 

4110 "demostrative": "demonstrative", # eeteeṇú/Phalura 

4111 "revised jeon": "revised-jeon", 

4112 "form used before": "archaic", 

4113 "front vowel harmony variant": "front-vowel", 

4114 "romanization of": "alt-of romanization", 

4115 "romanisation of": "alt-of romanization", 

4116 "archaic spelling of": "alt-of archaic", 

4117 "obsolete typography of": "alt-of obsolete", 

4118 "obsolete spelling of": "alt-of obsolete", 

4119 "rare spelling of": "alt-of rare", 

4120 "superseded spelling of": "alt-of archaic", 

4121 "pronunciation spelling of": "alt-of pronunciation-spelling", 

4122 "pronunciation spelling": "pronunciation-spelling", 

4123 "eye dialect spelling of": "alt-of pronunciation-spelling", 

4124 "alternative or obsolete spelling of": "alt-of obsolete alternative", 

4125 "obsolete and rare": "obsolete rare", 

4126 "Canadian spelling": "Canada", 

4127 "name of the": "alt-of name", # E.g. .. letter | Latin-script letter 

4128 "alternative name of": "alt-of alternative name", 

4129 "alternative name for": "alt-of alternative name", 

4130 "nonstandard spelling of": "alt-of nonstandard", 

4131 "US standard spelling of": "alt-of US standard", 

4132 "US spelling of": "alt-of US", 

4133 "alternative typography of": "alt-of alternative", 

4134 "polytonic spelling of": "alt-of polytonic", 

4135 "variant of": "alt-of alternative", 

4136 "uncommon spelling of": "alt-of uncommon", 

4137 "alternative typographic spelling of": "alt-of alternative", 

4138 "especially in typeface names": "typography", 

4139 "alternative spelling": "alternative", 

4140 "alternative reading": "alternative", # 鹿児島/Japanese 

4141 "alternative spelling of": "alt-of alternative", 

4142 "alternative form": "alternative", 

4143 "alternative form of": "alt-of alternative", 

4144 "alternative term for": "alt-of alternative", 

4145 "alternative stem of": "alt-of stem alternative", 

4146 "alternative letter-case form of": "alt-of", 

4147 "medieval spelling of": "alt-of obsolete", 

4148 "post-1930s Cyrillic spelling of": "alt-of standard Cyrillic", 

4149 "pre-1918 spelling of": "alt-of dated", 

4150 "pre-1945 period": "dated", 

4151 "Plural pre-1990": "dated plural", 

4152 "Plural pre-1990 reformed spelling": "plural", 

4153 "unreformed spelling": "nonstandard", 

4154 "Switzerland and Liechtenstein standard spelling of": "alt-of Switzerland Liechtenstein standard", 

4155 "form removed with the spelling reform of 2012; superseded by": "alt-of dated", 

4156 "excessive spelling of": "alt-of excessive", 

4157 "exaggerated degree of": "alt-of exaggerated", 

4158 "defective spelling of": "alt-of misspelling", 

4159 "verbal noun of": "noun-from-verb form-of", 

4160 "alternative verbal noun of": "form-of alternative noun-from-verb", 

4161 "alternative conjugation of": "alt-of alternative", 

4162 "abbreviation of": "alt-of abbreviation", 

4163 "short for": "alt-of abbreviation", 

4164 "short form": "short-form", 

4165 "eclipsed form of": "alt-of abbreviation eclipsis", 

4166 "apocopic form of": "alt-of abbreviation apocopic", 

4167 "apocope": "apocopic", 

4168 "truncated apocopic form": "apocopic", 

4169 "apocopic form": "apocopic abbreviation", 

4170 "apocopated": "apocopic abbreviation", 

4171 "apocopate": "apocopic abbreviation", 

4172 "h-prothesized form of": "alt-of prothesis-h", 

4173 "acronym of": "alt-of abbreviation acronym", 

4174 "acronym": "abbreviation acronym", 

4175 "initialism of": "alt-of abbreviation initialism", 

4176 "contraction of": "alt-of abbreviation contraction", 

4177 "IUPAC 3-letter abbreviation for": "alt-of abbreviation IUPAC", 

4178 "IUPAC 3-letter abbreviation of": "alt-of abbreviation IUPAC", 

4179 "IUPAC 2-letter abbreviation of": "alt-of abbreviation IUPAC", 

4180 "IUPAC 2-letter abbreviation for": "alt-of abbreviation IUPAC", 

4181 "IUPAC 1-letter abbreviation of": "alt-of abbreviation IUPAC", 

4182 "IUPAC 1-letter abbreviation for": "alt-of abbreviation IUPAC", 

4183 "IUPAC name": "IUPAC", 

4184 "symbol for": "alt-of symbol", 

4185 "praenominal abbreviation of": "alt-of abbreviation praenominal", 

4186 "ellipsis of": "alt-of ellipsis abbreviation", 

4187 "clipping of": "alt-of clipping abbreviation", 

4188 "X-system spelling of": "alt-of X-system", 

4189 "H-system spelling of": "alt-of H-system", 

4190 "Pinyin transcription of": "alt-of Pinyin", 

4191 "Rōmaji transcription of": "alt-of Rōmaji", 

4192 "romaji": "Rōmaji", 

4193 "rōmaji": "Rōmaji", 

4194 "visual rendering of Morse code for": "alt-of visual-rendering morse-code", 

4195 "soft mutation of": "form-of mutation-soft", 

4196 "causes soft mutation": "triggers-mutation-soft", 

4197 "non-Oxford British English standard spelling of": "alt-of nonstandard UK", 

4198 "Nil standard spelling of": "alt-of UK standard", 

4199 "nasal mutation of": "form-of mutation-nasal", 

4200 "nasal mutation": "mutation-nasal", 

4201 "triggers nasalization": "triggers-mutation-nasal", 

4202 "triggers nasal mutation": "triggers-mutation-nasal", 

4203 "triggers no mutation": "triggers-no-mutation", 

4204 "mixed mutation of": "form-of mutation-mixed", 

4205 "mixed mutation": "mutation-mixed", 

4206 "aspirate mutation of": "form-of mutation-aspirate", 

4207 "aspirate mutation": "mutation-aspirate", 

4208 "British misspelling": "misspelling British", 

4209 "misspelling of": "alt-of misspelling", 

4210 "deliberate misspelling of": "alt-of misspelling deliberate", 

4211 "common misspelling of": "alt-of misspelling", 

4212 "misconstruction of": "alt-of misconstruction", 

4213 "misconstructed": "misconstruction", 

4214 "ungrammatical": "misconstruction", 

4215 "Latin spelling of": "alt-of romanization", 

4216 "Latn": "Latin", 

4217 "Late Anglo-Norman spelling of": "alt-of Anglo-Norman", 

4218 "Jawi spelling of": "alt-of Jawi", 

4219 "Hanja form of": "alt-of hanja", 

4220 "Hanja form? of": "alt-of hanja", 

4221 "Hanja": "hanja", 

4222 "Hán Nôm": "Hán-Nôm", 

4223 "Hán tự form of": "alt-of Hán-tự", 

4224 "Newa Spelling": "Newa", 

4225 "Glagolitic spelling of": "alt-of Glagolitic", 

4226 "front vowel variant of": "alt-of front-vowel", 

4227 "front-vowel variant of": "alt-of front-vowel", 

4228 "euphemistic spelling of": "alt-of euphemistic", 

4229 "euphemistic reading of": "alt-of euphemistic", 

4230 "euphemism": "euphemistic", 

4231 "transliterated Russian pet forms": "transliteration Russian", 

4232 "Transliteration": "transliteration", 

4233 "transliteration needed": "", 

4234 "Cyrillic spelling of": "alt-of Cyrillic", 

4235 "Cyrillic spelling": "Cyrillic", 

4236 "Latin spelling": "romanization", 

4237 "British standard spellingh of": "alt-of UK standard", 

4238 "British and Canada standard spelling of": "alt-of UK Canada standard", 

4239 "Britain and Ireland standard spelling of": "alt-of Britain Ireland standard", 

4240 "Britain and New Zealand standard spelling of": "alt-of Britain New-Zealand standard", 

4241 "Britain and Canada spelling of": "alt-of Britain Canada", 

4242 "Baybayin spelling of": "alt-of Baybayin", 

4243 "Arabic spelling of": "alt-of Arabic", 

4244 "Arabic (Eastern)": "Arabic-Indic", 

4245 "Eastern Arabic": "Arabic-Indic", 

4246 "Arabic (Western)": "Arabic", 

4247 "Formerly standard spelling of": "alt-of archaic", 

4248 "informal spelling of": "alt-of informal", 

4249 "Yañalif spelling of": "alt-of Yañalif", 

4250 "traditional orthography spelling of": "alt-of traditional", 

4251 "traditional and simplified": "traditional simplified", 

4252 "Taraškievica spelling of": "alt-of Taraškievica", 

4253 "Post-1930s Cyrillic spelling of": "alt-of Cyrillic", 

4254 "Britain spelling of": "alt-of Britain", 

4255 "linguistically informed spelling of": "alt-of literary", 

4256 "Chinese spelling of": "alt-of China", 

4257 "Mongolian spelling of": "alt-of Mongolian", 

4258 "Leet spelling of": "alt-of Leet Internet", 

4259 "leetspeak": "Leet Internet", 

4260 "bulletin board system slang": "slang Internet", 

4261 "combining form of": "in-compounds form-of", 

4262 "combining form": "in-compounds", 

4263 "compound form": "in-compounds", 

4264 "compound of": "compound-of", 

4265 "compound of gerund of": "compound-of", 

4266 "compound of imperative (noi form) of": "compound-of", 

4267 "compound of imperative (tu form) of": "compound-of", 

4268 "compound of imperative (vo form) of": "compound-of", 

4269 "compound of imperative (voi form) of": "compound-of", 

4270 "compound of imperative of": "compound-of", 

4271 "compound of indicative present of": "compound-of", 

4272 "compound of masculine plural past participle of": "compound-of", 

4273 "compound of past participle of": "compound-of", 

4274 "compound of present indicative of": "compound-of", 

4275 "compound of plural past participle of": "compound-of", 

4276 "compound of second-person singular imperative of": "compound-of", 

4277 "compound of the gerund of": "compound-of", 

4278 "compound of the imperfect": "compound-of", 

4279 "compound of the infinitive": "compound-of", 

4280 "synonym of": "synonym synonym-of", 

4281 "same as": "synonym synonym-of", 

4282 "topicalized form of": "topicalized form-of", 

4283 "inflected form of": "form-of", 

4284 "inflected forms": "inflected", 

4285 "lenited form of": "lenition form-of", 

4286 "triggers lenition": "triggers-lenition", 

4287 "triggers lenition of a following consonant-initial noun": "triggers-lenition", 

4288 "triggers eclipsis": "triggers-eclipsis", 

4289 "triggers h-prothesis": "triggers-h-prothesis", 

4290 "causes aspirate mutation": "triggers-mutation-aspirate", 

4291 "triggers aspiration": "triggers-mutation-aspirate", 

4292 "triggers mixed mutation": "triggers-mutation-mixed", 

4293 # XXX Could be more accurate 

4294 "triggers mixed mutation except of forms of bod": "triggers-mutation-mixed", 

4295 "humurous": "humorous error-misspelling", 

4296 "humourous": "humorous", 

4297 "sarcasm": "sarcastic", 

4298 "ecclesiastic or ironic": "Ecclesiastical ironic", 

4299 "figuratively or literally": "figuratively literally", 

4300 "figuratively and literary": "figuratively literary", 

4301 "figuative": "figuratively", 

4302 "humorously": "humorous", 

4303 "jocular": "humorous", 

4304 "humorous or euphemistic": "humorous euphemistic", 

4305 "may sound impolite": "possibly impolite", 

4306 "northern dialects": "dialectal", 

4307 "dialectism": "dialectal", 

4308 "archaic or loosely": "archaic broadly", 

4309 "archaic or poetic": "archaic poetic", 

4310 "archeic or poetic": "archaic poetic", 

4311 "archaic or phrasal": "archaic idiomatic", 

4312 "archaic or dialectal": "archaic dialectal", 

4313 "archaic or literary": "archaic literary", 

4314 "archaic or Britain": "archaic Britain", 

4315 "archaic or nonstandard": "archaic nonstandard", 

4316 "most dialects": "dialectal", 

4317 "most dialects of Ripuarian": "dialectal", 

4318 "some dialects": "dialectal", 

4319 "some compounds": "idiomatic in-compounds", 

4320 "as a modifier in compound words": "in-compounds", 

4321 "used in compound adjectives": "in-compounds adjective", 

4322 "used attributively": "attributive", 

4323 "used predicatively": "predicative", 

4324 "used substatively": "substantive", 

4325 "substantival use of the verbal voice": "noun-from-verb", 

4326 "in ancient phrases": "idiomatic", 

4327 "unofficial spelling": "nonstandard", 

4328 "rare nonstandard spellings": "rare nonstandard", 

4329 "as rare alternative form": "rare", 

4330 "nonstandard spellings": "nonstandard", 

4331 "capitalised": "capitalized", 

4332 "always capitalized": "capitalized", 

4333 "sometimes not capitalized": "usually capitalized", 

4334 "sometimes capitalized": "sometimes capitalized", 

4335 "Sometimes capitalized": "sometimes capitalized", 

4336 "rhetorical question": "rhetoric", 

4337 "old-fashioned": "dated", 

4338 "rarely used": "rare", 

4339 "partially supplied": "", 

4340 "partially supplanted": "", 

4341 "present tense seldom used": "present-rare", 

4342 "often in place of present tense": "present often", 

4343 "conjugated non-suppletively in the present tense": "irregular", 

4344 "now rare": "archaic", 

4345 "in the past tense": "past", 

4346 "fixed expressions": "idiomatic", 

4347 "formulaic": "idiomatic", 

4348 "several set phrases": "idiomatic", 

4349 "now colloquial": "colloquial", 

4350 "now colloquial and nonstandard": "colloquial nonstandard", 

4351 "colloquial or Min Nan": "colloquial Min-Nan", 

4352 "colloquial or jargon": "colloquial jargon", 

4353 "Wiktionary and WMF jargon": "jargon Internet", 

4354 "colloquially": "colloquial", 

4355 "fossil word": "archaic", 

4356 "brusque": "impolite", 

4357 "verbs": "verb", 

4358 "prepositions": "prepositional", 

4359 "postpositions": "postpositional", 

4360 "postposition": "postpositional", 

4361 "interjections": "interjection", 

4362 "Abbreviations": "abbreviation", 

4363 "abbreviations": "abbreviation", 

4364 "variants": "variant", 

4365 "Ordinal": "ordinal", 

4366 "ordinals": "ordinal", 

4367 "local use": "regional", 

4368 "more generally": "broadly", 

4369 "loosely": "broadly", 

4370 "broad sense": "broadly", 

4371 "hypocoristic": "familiar", 

4372 "familiar or childish": "familiar childish", 

4373 "to a male": "addressee-masculine", 

4374 "to a man": "addressee-masculine", 

4375 "to a female": "addressee-feminine", 

4376 "to a woman": "addressee-feminine", 

4377 "hyperbolic": "excessive", 

4378 "18th century": "obsolete", 

4379 "9th century": "obsolete", 

4380 "17th century": "obsolete", 

4381 "10th century": "obsolete", 

4382 "16th century": "obsolete", 

4383 "14th century": "obsolete", 

4384 "12th century": "obsolete", 

4385 "post-classical": "obsolete", 

4386 "early 20th century": "archaic", 

4387 "20th century": "dated", 

4388 "mid-20th century": "dated", 

4389 "mid-19th century": "obsolete", 

4390 "before 20th century": "obsolete", 

4391 "19th to 20th century": "archaic", 

4392 "15th century": "obsolete", 

4393 "11th century": "obsolete", 

4394 "until early 20th century": "obsolete", 

4395 "since the 16th century": "dated", 

4396 "late 16th century": "obsolete", 

4397 "late 14th century": "obsolete", 

4398 "in usage until 20th century": "obsolete", 

4399 "in the 17th century": "obsolete", 

4400 "in the 16 th century": "obsolete", 

4401 "in Scots until the seventeenth century": "obsolete", 

4402 "in 10th century": "obsolete", 

4403 "early 17th century": "obsolete", 

4404 "chiefly 18th century": "obsolete", 

4405 "chiefly 12th century": "obsolete", 

4406 "before 16th century": "obsolete", 

4407 "attested in the 16th century": "obsolete", 

4408 "5th century": "obsolete", 

4409 "19th to early 20th century": "obsolete", 

4410 "19th-mid 20th century": "obsolete", 

4411 "19 the century": "obsolete", 

4412 "19th-early 20th century": "obsolete", 

4413 "19th century": "obsolete", 

4414 "1776-19th century": "obsolete", 

4415 "15th-16th century": "obsolete", 

4416 "Medieval and Early Modern Greek regional": "Medieval-Greek Early-Modern-Greek dialectal", 

4417 "collectively": "collective", 

4418 "collective or singulative": "collective singulative", 

4419 "used formally in Spain": "Spain", 

4420 "Spain's Canary Islands": "Canary-Islands", 

4421 "Sanskritised": "Sanskritized", 

4422 "Arabicised": "Arabicized", 

4423 "Perú": "Peru", 

4424 "Singapore/Malaysia": "Singapore Malaysia", 

4425 "nouns": "noun", 

4426 "phrases": "phrase", 

4427 "with the particle lai": "with-lai", 

4428 "adjectives": "adjective", 

4429 "related adjective": "adjective", 

4430 "adj": "adjective", 

4431 "adj.": "adjective", 

4432 "adv": "adverb", 

4433 "adverbs": "adverb", 

4434 "augmentatives": "augmentative", 

4435 "pejoratives": "pejorative", 

4436 "perjorative": "pejorative error-misspelling", 

4437 "pejorative or colloquial": "pejorative colloquial", 

4438 "non-standard since 2012": "nonstandard", 

4439 "colloquialism": "colloquial", 

4440 "non-standard since 1917": "nonstandard", 

4441 "conditional mood": "conditional", 

4442 "figurative": "figuratively", 

4443 "compound words": "compound", 

4444 "form of address": "term-of-address", 

4445 "term of address": "term-of-address", 

4446 "as a term of address": "term-of-address", 

4447 "direct address": "term-of-address", 

4448 "face-to-face address term": "term-of-address", 

4449 "address": "term-of-address", 

4450 "endearingly": "endearing", 

4451 "elliptically": "ellipsis", 

4452 "elegant": "formal", # Elegant or Formal Thai 

4453 "nonce word": "nonce-word", 

4454 "neologism or slang": "neologism slang", 

4455 "attributively": "attributive", 

4456 "poetic term": "poetic", 

4457 "poetic meter": "poetic", 

4458 "in certain phrases": "in-certain-phrases", 

4459 "deprecated template usage": "", 

4460 "deprecated": "proscribed", 

4461 "diacritical mark": "diacritic", 

4462 "inflection of": "form-of", 

4463 "mainland China": "Mainland-China", 

4464 "spelling in China": "China", 

4465 "rhyming slang": "slang", 

4466 "prison slang": "slang", 

4467 "criminal slang": "slang", 

4468 "fandom slang": "slang lifestyle", 

4469 "furry fandom": "slang lifestyle", 

4470 "manga fandom slang": "slang manga", 

4471 "real estate slang": "slang real-estate", 

4472 "gay slang": "slang LGBT", 

4473 "urban slang": "slang urbanism", 

4474 "lolspeak": "humorous Internet", 

4475 "Usenet": "Internet", 

4476 "one-termination adjective": "one-termination", 

4477 "two-termination adjective": "two-termination", 

4478 "three-termination adjective": "three-termination", 

4479 "one-termination participle": "one-termination participle", 

4480 "two-termination participle": "two-termination participle", 

4481 "three-termination particple": "three-termination participle", 

4482 "semelefactive": "semelfactive error-misspelling", 

4483 "invariant": "invariable", 

4484 "followed by to": "with-to", 

4485 "taking a to-infinitive": "with-to with-infinitive", 

4486 "with bare infinitive": "with-infinitive", 

4487 "direct object": "direct-object", 

4488 "indirect object": "indirect-object", 

4489 "transitive with of": "transitive-with-of", 

4490 "with of": "with-of", 

4491 "with on": "with-on", 

4492 "with down": "with-down", 

4493 "with up": "with-up", 

4494 "with a personal pronoun": "with-personal-pronoun", 

4495 "with an indirect object": "with-indirect-object", 

4496 "with comparatives": "with-comparative", 

4497 "with definite article": "with-definite-article", 

4498 'with "the"': "with-definite-article", 

4499 "etc.": "usually", 

4500 "regardless of gender": "gender-neutral", 

4501 "gender-neutral (or multigendered)": "gender-neutral", 

4502 "ditransitive for the second object": "ditransitive", 

4503 "double transitive": "ditransitive", 

4504 "transitive or ditransitive": "transitive ditransitive", 

4505 "number": "numeral", 

4506 "numerals": "numeral", 

4507 "Tally marks": "Tally-marks numeral", 

4508 "+ 3rd-pers.": "with-third-person", 

4509 "Historical": "historical", 

4510 "hist.": "historical", 

4511 "antiquity": "historical", 

4512 "ideophone": "ideophonic", 

4513 "Alsatian (Low Alemannic German)": "Alsatian Alemannic", 

4514 "all sects": "", 

4515 "adessive + 3rd person singular + ~": "with-adessive with-third-person-singular postpositional", 

4516 "inessive + 3rd person singular + ~": "with-inessive with-third-person-singular postpositional", 

4517 "~ (olemassa)": "with-olemassa", 

4518 "3rd person singular": "third-person singular", 

4519 "+ genitive + 3rd person singular + passive present participle": "with-genitive with-third-person-singular with-passive-present-participle", 

4520 "genitive + 3rd-pers. singular + 1st infinitive": "with-genitive with-third-person-singular with-infinitive-i", 

4521 "+ direct object in accusative + 3rd infinitive in illative": "transitive with-accusative with-infinitive-iii-illative", 

4522 "+ direct object in accusative + past participle in translative or partitive": "transitive with-accusative with-past-participle-translative with-past-participle-partitive", 

4523 "+ past participle in translative or partitive": "with-past-participle-translative with-past-participle-partitive", 

4524 "active past part. taitanut": "", 

4525 "+ passive past participle in translative": "with-passive-past-participle-translative", 

4526 "+ passive past participle in partitive": "with-passive-past-participle-partitive", 

4527 "+ active past participle in translative": "with-past-participle-translative", 

4528 "+ adjective in ablative or allative": "with-adjective with-ablative with-allative", 

4529 "in indicative or conditional mood": "in-indicative in-conditional", 

4530 "in negative sentences": "with-negation", 

4531 "in negative clauses": "with-negation", 

4532 "using Raguileo Alphabet": "Raguileo-Alphabet", 

4533 "using Raguileo alphabet": "Raguileo-Alphabet", 

4534 "using Raguileo and Unified Alphabet": "Raguileo-Alphabet Unified", 

4535 "transliterated": "transliteration", 

4536 "though not derogative": "", 

4537 "women generally don't accept to be called this way": "offensive", 

4538 "transitive sense": "transitive", 

4539 "in intransitive meaning": "intransitive", 

4540 "initial change reduplication": "reduplication", 

4541 "initial change reduplication with syncope": "reduplication syncope", 

4542 "initial change with syncope": "syncope", 

4543 "syncopated": "syncope", 

4544 "reduplication with syncope": "reduplication syncope", 

4545 "introducing subjunctive hortative": "subjunctive hortative", 

4546 "nominative and vocative plural animate": "nominative vocative plural animate", 

4547 "with diaeresis to indicate disyllabilicity": "", 

4548 "aphaeretic variant": "variant", 

4549 "mediopassive voice": "mediopassive", 

4550 "ALL": "", 

4551 "archaic or hypercorrect": "archaic hypercorrect", 

4552 "as a diacritic": "diacritic", 

4553 "as a gerund": "gerund", 

4554 "as a calque": "calque", 

4555 "pseudoarchaic": "dated", 

4556 "surnames": "surname", 

4557 "all countable senses": "countable", 

4558 "attributive form of pyjamas": "attributive", 

4559 "ordinal form": "ordinal", 

4560 "ordinal form of twelve": "ordinal", 

4561 "conjugative of": "conjugative-of", 

4562 "correlative of": "correlative-of", 

4563 "modern nonstandard spellings": "modern nonstandard", 

4564 "non-standard": "nonstandard", 

4565 "non-standard form of": "nonstandard alt-of", 

4566 "nonanimate": "inanimate", 

4567 "nominalized verb": "noun-from-verb", 

4568 "nominalized": "noun-from-verb", # XXX could this be from noun/adj 

4569 "n-v": "verb-from-noun", 

4570 "v-n": "noun-from-verb", 

4571 "n-n": "noun-from-noun", 

4572 "v-v": "verb-from-verb", 

4573 "uses -j- as interfix": "interfix-j", 

4574 "eulogistic": "poetic", # XXX not really, implies praise 

4575 "prev": "previous", 

4576 "normal usage": "", # In some Russian words with two heads 

4577 "professional usage": "", # In some Russian words with two heads 

4578 "?? missing information.": "", 

4579 "unknown comparative": "", 

4580 "unknown accent pattern": "", 

4581 "?? conj.": "", 

4582 "pres. ??": "", 

4583 "past ??": "", 

4584 "see usage notes": "", 

4585 "no known Cyrillic variant": "", 

4586 "no first-person singular present": "no-first-person-singular-present", 

4587 "no first-person singular preterite": "no-first-person-singular-preterite", 

4588 "no third-person singular past historic": "no-third-person-singular-past-historic", 

4589 "‘dependent’": "dependent", # sn/Egyptian 

4590 "‘independent’": "independent", # ntf/Egyptian 

4591 "eum": "hangeul", # Apparently synonym for the Korean alphabet 

4592 "classifiers": "classifier", 

4593 "discourse particle": "discourse particle", 

4594 "discourse": "discourse", # hum/Phalura 

4595 "numeral tones": "numeral-tones", 

4596 "alphabetic tones": "alphabetic-tones", 

4597 "class A infixed pronoun": "infix pronoun class-A", 

4598 "class B infixed pronoun": "infix pronoun class-B", 

4599 "class C infixed pronoun": "infix pronoun class-C", 

4600 "class B & C infixed pronoun": "infix pronoun class-B class-C", 

4601 "class I": "class-i", 

4602 "class II": "class-ii", 

4603 "class III": "class-iii", 

4604 "class IV": "class-iv", 

4605 "class V": "class-v", 

4606 "class VI": "class-vi", 

4607 "class VII": "class-vii", 

4608 "class VIII": "class-viii", 

4609 "class IX": "class-ix", 

4610 "class X": "class-x", 

4611 "class XI": "class-xi", 

4612 "class XII": "class-xii", 

4613 "class XIII": "class-xiii", 

4614 "class N": "class-n", 

4615 "class a-i": "class-a-i", 

4616 "to multiple people": "addressee-plural", 

4617 "to one person": "addressee-singular", 

4618 "actor focus": "actor-focus", 

4619 "indirect actor trigger": "actor-indirect", 

4620 "usually feminine": "feminine-usually", 

4621 "but usually feminine": "feminine-usually", 

4622 "usually masculine": "masculine-usually", 

4623 "but usually masculine": "masculine-usually", 

4624 "but rarely feminine": "masculine-usually", 

4625 "but rarely masculine": "feminine-usually", 

4626 "requires negation": "with-negation", 

4627 "inalienable–class I agreement": "inalienable class-i", 

4628 "inalienable–class II agreement": "inalienable class-ii", 

4629 "inalienable–class III agreement": "inalienable class-iii", 

4630 "no first-person singular past historic": "no-first-person-singular-past-historic", 

4631 "no definite forms": "no-definite", 

4632 "no definite form": "no-definite", 

4633 "no diminutive": "no-diminutive", 

4634 "no second-person singular imperative": "no-second-person-singular-imperative", 

4635 "no simple past": "no-past", 

4636 "no feminine form": "no-feminine", 

4637 "no infinitive": "no-infinitive", 

4638 "no longer productive": "idiomatic", 

4639 "no past tense": "no-past", 

4640 "no third-person singular present": "no-third-person-singular-present", 

4641 "nominalized adjective following adjective declension": "noun-from-adj", 

4642 # XXX this could be more accurate 

4643 "truncative except after q and r": "truncative", # Greenlandic 

4644 "of masculine singular": "masculine singular nominative", 

4645 "of masculine plural": "masculine plural nominative", 

4646 "of feminine singular": "feminine singular nominative", 

4647 "of feminine plural": "feminine plural nominative", 

4648 "officialese": "bureaucratese", 

4649 "+ optionally: adjective in accusative case + neuter noun in accusative case": "definite neuter with-accusative", 

4650 "non-emphatic": "unemphatic", 

4651 "not productive": "idiomatic", 

4652 "passive with different sense": "passive", 

4653 "active with different sense": "active", 

4654 "+ von": "with-von", # außerhalb/German 

4655 "Symbol:": "symbol", 

4656 "a reflexive": "reflexive", 

4657 "active/stative": "active stative", 

4658 "always postpostive": "postpositional", 

4659 "postpositive": "postpositional", 

4660 "defininte plural": "definite plural", # aigg/Westrobothnian 

4661 "determinative of": "determinative-of", 

4662 "lenites": "lenition", 

4663 "followed by indirect relative": "with-indirect-relative", 

4664 "inflected like": "inflected-like", 

4665 "locational noun": "locative", 

4666 "mass noun": "uncountable", 

4667 "negated": "past participle negative", # fera/Westrobothnian 

4668 "neutral": "gender-neutral", # countryman/English 

4669 "never clause-initial": "not-clause-initial", 

4670 "primarily": "", 

4671 "mostly": "", 

4672 "now": "", 

4673 "chiefly": "", 

4674 "only": "", 

4675 "somewhat": "", 

4676 "definite articulation": "definite", # boatsi/Aromanian 

4677 "p-past": "passive past", 

4678 "p‑past": "passive past", # Fancy unicode dash περπατάω/Greek 

4679 "ppp": "passive perfect participle", 

4680 "plural:": "plural", 

4681 "synonyms:": "synonym", 

4682 "quantified:": "quantified", 

4683 "sentence case": "sentence-case", 

4684 "set phrase from Classical Chinese": "idiomatic Classical-Chinese", 

4685 "the plural of": "plural-of", 

4686 "plural of": "plural-of", 

4687 "the reflexive case of": "reflexive-of", 

4688 "the reflexive form of": "reflexive-of", 

4689 "unipersonal": "", # Too rare to track 

4690 "used only after prepositions": "after-preposition", 

4691 "appended after imperfective form": "in-compounds with-imperfect", 

4692 "universal or indefinite": "universal indefinite", 

4693 "el/ea": "third-person singular", # o/Romanian/Verb 

4694 "ele/ei": "third-person plural", # vor/Romanian/Verb 

4695 "vestre": "slang", # type of backslang in Argentine and Uruguayan Spanish 

4696 "onomatopoeia": "onomatopoeic", 

4697 "ITERATIVE": "iterative", 

4698 "OPTATIVE": "optative", 

4699 "IMPERFECTIVE": "imperfective", 

4700 "PERFECTIVE": "perfective", 

4701 "(FIXME)": "error-fixme", 

4702 "Conversive": "conversive", 

4703 "Cholula and Milpa Alta": "Cholula Milpa-Alta", 

4704 "Surnames": "surname", 

4705 "metaphorically": "metaphoric", 

4706 "hypothetic": "hypothetical", 

4707 "Kinmen and Penghu Hokkien": "Kinmen-Hokkien Penghu-Hokkien", 

4708 "“Jinmeiyō” kanji used for names": "Jinmeiyō", 

4709 "by suppletion": "suppletive", 

4710 "only some senses": "", # Could use a tag; "limited-senses"? hero/English 

4711 "nautical sense": "nautical", # Without this, there's error-unknown and 

4712 # the topic tags include "transportation". pay out/English 

4713 "otherwise nonstandard": "nonstandard", # weep/English 

4714 "nonhuman": "non-human", # himself/English, talking about "it" 

4715 "both": "", # XXX "both" should trigger the tag to the next two forms! walrus/English 

4716 "pseudo-Latin": "hypercorrect", # platypus/English 

4717 "pseudo-Latinate": "hypercorrect", # Simplex/German 

4718 "archaic or informal": "archaic informal", # while/English 

4719 "more common in": "common", # tread water/English 

4720 "all": "", # XXX same as "both", "all" should extend tags the following forms 

4721 "less commonly": "uncommon", # avid/English 

4722 "muscle": "anatomy", # depressor/English 

4723 "optionally with an article": "with-article", # Mosambik/German 

4724 "genitive (des)": "genitive", # ordentlicher Professor/German, Lieber/German 

4725 "prenominally without an article": "without-article before-noun", # Mama/German 

4726 "usually in": "regional", # Vergnügungspark/German 

4727 "older ending": "archaic", # Fritz/German 

4728 "only in some regional vernaculars": "regional", # umhauen/German 

4729 "mostly only when written": "literary", # Magnet/German 

4730 "rarer": "rare", # verbleichen/German 

4731 "southern Germany": "Southern-Germany", # Holzscheit/German 

4732 "alternatively in the meaning": "uncommon", # abbondare/Italian 

4733 # XXX "for-subsense" or similar needs a tag or parsing 

4734 "alternatively in": "regional", # Holzscheit/German 

4735 "nonstandard but common": "nonstandard common", # Gedanke/German 

4736 "colloquial or archaic": ["colloquial", "archaic"], # Undorn/German 

4737 "predominant when spoken": "colloquial", # Gnom/German 

4738 "with a numeral": "with-numeral", # Radlermaß/German 

4739 "not with a numeral": "without-numeral", # Radlermaß/German 

4740 "alternatively when": "", # Radlermaß/German, 

4741 "traditional/standard": "archaic standard", # flecthen/German 

4742 "only in some senses": "uncommon", # hero/English 

4743 "prescribed, more frequent": "", # offenbaren/German These distinctions are minor 

4744 "less frequent but not uncommon": "", # offenbaren/German 

4745 "predominant": "", # März/German: "normal" 

4746 "common but sometimes considered nonstandard": "common", # gebären/German 

4747 "more standard": "standard", # Lump/German 

4748 "more common in general usage": "common", # Lump/German 

4749 "rare outside": "regional", # Park/German 

4750 "nonstandard, rather rare": "nonstandard rare", # Lexikon/German 

4751 "prescribed": "literary", # brauchen/German 

4752 "always used in speech": "common", # brauchen/German 

4753 "common in writing": "common", # brauchen/German 

4754 "when issues of different sorts are involved": "different-sort", # Wahnsinnsding/German 

4755 "when issues of the same sort are involved": "same-sort", # Wahnsinnsding/German 

4756 "elevated": "honorific", # Land/German 

4757 "original but now less common": "archaic", # winken/German 

4758 "standard but rare in the vernacular": "literary", # fechten/German 

4759 "mostly found in": "regional", # Ehrenschutz/German 

4760 "unofficial": "colloquial", # kørsel/Danish, although fixed, one user did a lot of this in Danish. 

4761 "common in": "regional", # tread water/English 

4762 "careful style": "formal", # valutarsi/Italian 

4763 "less popular": "uncommon", # rivedere/Italian 

4764 "also when intransitive": "intransitive", # risuonare/Italian 

4765 "popular": "common", # sciogliere/Italian 

4766 "high-style": "formal", # riesumare/Italian 

4767 "more common": "common", # compiersi/Italian 

4768 "Latinate pronunciation": "hypercorrect", # perorare/Italian 

4769 "medio-passive voice": "mediopassive", # afrohet/Albanian 

4770 # ~ "comparative of": "comparative-of", # miður/Icelandic 

4771 "subst.": "noun", 

4772 "Persic": "Persian", 

4773 "defunct": "archaic", # flugu/Norwegian 

4774 "used in definite form": "", # dyrerike/Norwegian Nynorsk 

4775 "used in definite singular form": "", # nettet/Norwegian Nynorsk 

4776 "reciprocative": "reciprocal", # konyugön/Volapük 

4777 "mfpl": "masculine feminine plural", # extrajudiciaires/French 

4778 "Internet slang": "Internet", # troll/many languages 

4779 "combined with se": "reflexive", # tecnificarse/Spanish 

4780 "combined with me": "object-first-person object-singular", # tergiver/Spanish 

4781 "combined with te": "object-second-person object-singular", # tergiver/Spanish 

4782 "combined with le": "object-third-person object-singular dative", # tergiver/Spanish 

4783 "combined with nos": "object-first-person object-plural", # tergiver/Spanish 

4784 "combined with os": "object-second-person object-plural", # tergiver/Spanish 

4785 "combined with les": "object-third-person object-plural dative", # tergiver/Spanish 

4786 "combined with lo": "object-third-person object-singular object-masculine accusative", 

4787 "combined with la": "object-third-person object-singular object-feminine accusative", 

4788 "combined with los": "object-third-person object-plural object-masculine accusative", 

4789 "combined with las": "object-third-person object-plural object-feminine accusative", 

4790 "class m-wa": "class-1 class-2", 

4791 "class m-mi": "class-3 class-4", 

4792 "class ma": "class-5 class-6", 

4793 "class ki-vi": "class-7 class-8", 

4794 "class n": "class-9 class-10", 

4795 "class n/n": "class-9 class-10", 

4796 "class u": "class-11 class-12 class-14", 

4797 "class ku": "class-15", 

4798 "class pa": "class-16", 

4799 "class mu": "class-18", 

4800 "predicate marker": "predicative", 

4801 # riannettere/Italian 

4802 "ditto": "", 

4803 # Dungan tone markers 

4804 "I-I": "", 

4805 "I-II": "", 

4806 "I-I-III": "", 

4807 "I-I-II": "", 

4808 "I-II-I": "", 

4809 "I-III": "", 

4810 "I-III-I": "", 

4811 "I-I-I": "", 

4812 "I-II-II": "", 

4813 "I-I-II-I": "", 

4814 "I-III-I-I": "", 

4815 # Mapuzugun/Mapudungun 

4816 "Raguileo spelling": "Raguileo-Alphabet", 

4817 "no predicative form": "no-predicative-form", # diamanten/German 

4818 "Dialectal or colloquial": "colloquial", 

4819 "Rare except in very formal contexts": "rare formal", 

4820 "alternative in würde normally preferred": "", 

4821 "sometimes derogatory": "sometimes derogatory", 

4822 # gratis/Swedish 

4823 "not inflected": "indeclinable", 

4824 "Sparsely attested near 1500": "archaic rare", 

4825 "Tajik spelling": "Tajik Cyrillic", 

4826} 

4827 

# Whole-description rewrites.  This table is consulted with the complete
# description string, before that string is split by comma.  A key must
# therefore equal the entire description: keys may themselves contain commas
# and semicolons, so they can never match just one comma- or
# semicolon-separated part of a description.
xlat_descs_map = {
    # --- Descriptions rewritten to tags ---
    "with there, or dialectally it, as dummy subject": "with-dummy-subject",
    (
        "+ location in inessive, adessive + vehicle in elative, "
        "often with pois"
    ): "with-inessive with-adessive with-elative",
    "+ accusative +, Genitive": "with-accusative with-genitive",
    "with genitive, instrumental or dative case": (
        "with-genitive with-instrumental with-dative"
    ),
    "+ illative, allative, (verbs) 3rd infinitive in illative": (
        "with-illative with-allative with-infinitive-iii-illative"
    ),
    "(inessive or adessive) + 3rd-pers. sg. + an adverb": (
        "with-inessive with-adessive with-third-person-singular with-adverb"
    ),
    "+ partitive for agent, + allative for target": (
        "with-partitive with-allative"
    ),
    "+ infinitive; in indicative or conditional mood": (
        "with-infinitive with-indicative with-conditional"
    ),
    # The replacement below still contains commas on purpose; it is a
    # description that gets split by comma afterwards.
    (
        "transitive, auxiliary + first infinitive, "
        "active past part. taitanut or tainnut"
    ): "transitive, auxiliary, with-infinitive-i",
    # XXX very incomplete
    (
        "elative + 3rd person singular + noun/adjective in nominative "
        "or partitive or personal + translative"
    ): "with-elative with-third-person-singular",
    "group theory, of a group, semigroup, etc.": "group theory",
    (
        "Triggers lenition of b, c, f, g, m, p, s. "
        "Triggers eclipsis of d, t."
    ): "triggers-lenition triggers-eclipsis",
    # XXX this could be more precise
    (
        "‘his’ and ‘its’ trigger lenition; "
        "‘her’ triggers /h/-prothesis; "
        "‘their’ triggers eclipsis"
    ): "triggers-lenition triggers-h-prothesis triggers-eclipsis",
    "for = elative; for verbs action noun in elative": (
        "with-action-noun-in-elative"
    ),
    # --- Descriptions mapped to the empty string ---
    # de/Danish
    (
        "as a personal pronoun, it has the forms dem in the oblique case "
        "and deres in the genitive; as a determiner, it is uninflected"
    ): "",
    # spinifer/Latin
    "nominative masculine singular in -er; two different stems": "",
    "^(???) please indicate transitivity!": "",
    "^(???) please provide spelling!": "",
    "please provide plural": "",
    "please provide feminine": "",
    "please provide feminine plural": "",
    "the passive, with different sense": "",
    "the active, with different sense": "",
    # --- Single-word descriptions ---
    "m": "masculine",
    "f": "feminine",
    "classic": "",
}

4862 

# Words that are interpreted as tags when they appear at the beginning of a
# linkage.  Keys are the words as written; values are the resulting tag(s),
# space-separated when there is more than one.
linkage_beginning_tags = {
    # Entries whose value differs from the key (plus "factive", kept here so
    # the original key order is preserved).
    "factitive/causative": "factitive causative",
    "factive/causative": "factive causative",
    "factive": "factive",
    "factitive": "factive",  # Not sure if same or different as factive
    # Every remaining word maps to itself.
    **{
        word: word
        for word in (
            "causative",
            "reflexive",
            "frequentative",
            "optative",
            "affirmative",
            "cohortative",
            "applicative",
            "stative",
            "passive",
            "adjective",
            "verb",
            "noun",
            "adverb",
        )
    },
}

4883 

# Tags that allow an implicit form-of (tags followed by "of").  For
# parse_alt_or_inflection_of() to interpret a gloss as a form_of, the form
# must contain at least one of the tags below.  Entries are grouped by
# initial letter.
form_of_tags = {
    # a
    "abessive", "ablative", "absolutive", "accusative", "adessive",
    "adjectival", "adverbial", "affirmative", "agentive", "allative",
    "aorist", "applicative", "attributive", "augmentative", "augmented",
    # b
    "benefactive",
    # c
    "causal-final", "causative", "collective", "comitative", "comparative",
    "conditional", "conditional-i", "conditional-ii", "connegative",
    "construct", "contemplative", "counterfactual",
    # d
    "dative", "debitive", "declension-1", "declension-2", "declension-3",
    "definite", "delative", "demonstrative", "desiderative", "diminutive",
    "distal", "dual", "durative",
    # e
    "elative", "endearing", "equative", "ergative", "essive",
    # f
    "feminine", "first-person",
    "form-i", "form-ii", "form-iii", "form-iiiq", "form-iiq", "form-iq",
    "form-iv", "form-ivq", "form-ix", "form-v", "form-vi", "form-vii",
    "form-viii", "form-x", "form-xi", "form-xii", "form-xiii",
    "fourth-person", "frequentative", "future",
    # g
    "gender-neutral", "genitive", "gerund",
    # h
    "hortative",
    # i
    "illative", "imperative", "imperfect", "imperfective", "impersonal",
    "in-compounds", "inclusive", "indefinite", "inessive",
    "infinitive", "infinitive-i", "infinitive-ii", "infinitive-iii",
    "infinitive-iv", "infinitive-v",
    "instructive", "instrumental", "interrogative", "iterative",
    # j
    "jussive",
    # l
    "lative", "locative",
    # m
    "masculine", "mediopassive", "middle-infinitive",
    "mutation-aspirate", "mutation-mixed", "mutation-nasal", "mutation-soft",
    # n
    "negative", "neuter", "nominal", "nominative", "non-past",
    # o
    # Not listed here: 2084 objective - beware of "An object of ..."
    # (e.g., song/English)
    "oblique", "offensive", "optative", "ordinal",
    # p
    "participle", "partitive", "passive", "past", "paucal", "perfect",
    "perfective", "pluperfect", "plural", "polite", "possessive",
    "potential", "predicative", "prepositional", "present", "preterite",
    "prolative", "pronominal", "prospective", "proximal",
    # q
    "quotative",
    # r
    "reflexive",
    # s
    "second-person", "singular", "singulative", "stative", "stressed",
    "subjective", "subjunctive", "subjunctive-i", "subjunctive-ii",
    "sublative", "superessive", "superlative", "supine",
    # t
    "terminative", "third-person", "transgressive", "translative",
    # u
    "unstressed",
    # v
    "vocative",
}

5041 

# Tags that allow an implicit alt-of (tags followed by "of").  For
# parse_alt_or_inflection_of() to interpret a gloss as an alt_of, the form
# must contain at least one of the tags below.
alt_of_tags = {
    "abbreviation", "capitalized", "colloquial", "contracted",
    "dialectal", "historic", "hypercorrect", "initialism",
    "literary", "lowercase", "misconstruction", "nonstandard",
    "obsolete", "proscribed", "standard", "uppercase",
    "unabbreviation",  # jku/Finnish
}

5064 

# Valid tag categories / attributes.  Each category maps to its sort
# precedence; categories with larger values are put first.  The comment
# above each entry gives example tags or a short description.
tag_categories = {
    # definite, indefinite, proximal, distal
    "referent": 500,
    # comparative, superlative
    "degree": 400,
    # Semantic gender (often also implies class)
    "gender": 390,
    # first-person, second-person, third-person, impersonal,
    # fourth-person, inclusive, exclusive
    "person": 380,
    # Object number/gender/class/definiteness/person
    "object": 375,
    # Grammatical case (also direct-object, indirect-object)
    "case": 370,
    # Singular, plural, dual, paucal, ...
    "number": 360,
    # (disabled) "addressee": Something related to addressee
    # possessive, possessed-form, unpossessed-form, alienable, inalienable
    "possession": 350,
    # active, passive, middle
    "voice": 200,
    # present, past, imperfect, perfect, future, pluperfect
    "tense": 190,
    # Aspect of verbs (perfective, imperfective, habitual, ...)
    "aspect": 180,
    # cohortative, commissive, conditional, conjunctive, declarative,
    # hortative, imperative, indicative, interrogative, jussive, optative,
    # potential, prohibitive, subjunctive.
    # Note that interrogative is also used for, e.g., pronouns.
    "mood": 170,
    # infinitive, participle, ...
    "non-finite": 160,
    # positive, negative, connegative
    "polarity": 150,
    # Specifies part-of-speech
    "pos": 50,
    # person, animate, inanimate, (virile, nonvirile?), countable,
    # uncountable
    "category": 40,
    # intransitive, transitive, ditransitive, ambitransitive
    "transitivity": 35,
    # (disabled) "participants": reflexive, reciprocal
    # dialectal, formal, informal, slang, vulgar
    "register": 30,
    # Typically uppercase tags specifying dialectal variations, region,
    # language, who standardized, or time period when used
    "dialect": 25,
    # Inflection class (Bantu languages, Japanese, etc)
    "class": 20,
    # Triggers something (e.g., mutation) in some context
    "trigger": 15,
    # gradation or qualifier
    "gradation": 15,
    # Specifies derivation (agent, noun-from-verb, noun-from-adj,
    # noun-from-noun, verb-from-noun, ...)
    "derivation": 13,
    # Provides a modified form (e.g., abbreviation, mutation)
    "mod": 10,
    # Specifies pragmatics (e.g., stressed/unstressed)
    "pragmatic": 10,
    # Describes some phonetic aspect
    "phonetic": 10,
    # Describes some lexical/typographic aspect
    "lexical": 10,
    # Co-occurs with something
    "with": 10,
    # Word position or order
    "order": 10,
    # Provides some detail
    "detail": 5,
    # Provides version of word in given script in forms; sometimes also
    # used as tag for language/country
    "script": 5,
    # lots of miscellaneous/uncategorized stuff
    "misc": 1,
    # error tags
    "error": 0,
    # Only used internally
    "unknown": -1,
    # Only used internally
    "dummy": -2,
    # Only used internally (this category never expands cell)
    "dummy2": -3,
}

5119 

5120# Set of all valid tags 

5121# Note that this is extended below. 

5122valid_tags = { 

5123 "Adlam": "script", # Script 

5124 "Amharic": "script", # Script (at least for numberals) 

5125 "Arabic": "script", # Also script 

5126 "Arabic-Indic": "script", # Also script 

5127 "Armenian": "script", # Also script 

5128 "Assamese": "script", # Also script (India) 

5129 "Balinese": "script", # Also script 

5130 "Baybayin": "script", # Also script 

5131 "Bengali": "script", # Also script (India) 

5132 "Brahmi": "script", # Script (India, historic) 

5133 "Burmese": "script", # Script 

5134 "Chakma": "script", # Script (India/Burma?) 

5135 "Cham": "script", # Script (Austronesian - Vietnam/Cambodia) 

5136 "Chinese": "script", # Also script 

5137 "CJK": "script", # CJK variant, e.g., Vietnamese Chữ Hán / Chữ Nôm 

5138 "Cyrillic": "script", # Script 

5139 "Devanagari": "script", # Script 

5140 "Déné-syllabary": "script", # Script for Canadian Indian languages? 

5141 "Egyptian": "script", # Also script (hieroglyph) 

5142 "Ethiopic": "script", # Script 

5143 "Glagolitic": "script", # Script 

5144 "Gothic": "script", # Script 

5145 "Greek": "script", # Also script 

5146 "Gujarati": "script", # Script (Indo-Arabic) 

5147 "Gurmukhi": "script", # Script (Indo-Arabic) 

5148 "Gwoyeu-Romatsyh": "script", # latin alphabet for Chinese from the 1920s 

5149 "Hanifi-Rohingya": "script", # Script (Perso-Arabic) 

5150 "Hebrew": "script", # also Script (for Aramaic) 

5151 "Hindi": "script", # Script (at least for numberals, e.g. 80 

5152 "Javanese": "script", # Also script (Indonesia) 

5153 "Jawi": "script", # Script (Malay and several other languages) 

5154 "Jurchen": "script", # Script? 

5155 "Kannada": "script", # Script (at least for numerals, Hindu-Arabic?) 

5156 "Kayah-Li": "script", # Script (Sino-Tibetan) 

5157 "Khmer": "script", # Script 

5158 "Khudawadi": "script", # Script (Sindhi language, India) 

5159 "Lanna": "script", # Script (Thailand) 

5160 "Lao": "script", # Script (Lao langage in Laos) 

5161 "Latin": "script", # Script 

5162 "Lepcha": "script", # Script (Himalayas?) 

5163 "Limbu": "script", # Script (Limbu language in Central Himalayas) 

5164 "Meitei": "script", # Script (used with Meitei language in India) 

5165 "Mongolian": "script", # Also script 

5166 "Myanmar": "script", # Also script 

5167 "N'Ko": "script", # Script 

5168 "Newa": "script", # Script (Newa Spelling) ??? निर्वाचन/Newar/Noun 

5169 "Odia": "script", # Script (at least for numerals) 

5170 "Ol-Chiki": "script", # Script (Austroasiatic language in India) 

5171 "Old-Persian": "script", # Script 

5172 "Oriya": "script", # Script (Hindu-Arabic?) 

5173 "Osmanya": "script", # Script (Somalia) 

5174 "POJ": "script", # Latin alphabet based orthography for Min Nan (Peh-ōe-jī) 

5175 "Persian": "script", # Also script 

5176 "Phofsit-Daibuun": "script", # A way of writing latin alphabet Taiwanese 

5177 "Roman": "script", # Script 

5178 "Rumi": "script", # Script (modern Malay/Indonesian) 

5179 "Saurashtra": "script", # Script (Surashtra language in Tamil Nadu) 

5180 "Shahmukhi": "script", # Script (used by Punjabi Muslims for Punjabi lang) 

5181 "Sharada": "script", # Script (India for Sanskrit and Kashmiri; historic) 

5182 "Sinhalese": "script", # Script (Sri Lanka) 

5183 "Syriac": "script", # Also script (for Aramaic) 

5184 "Tai-Tham": "script", # Script (Northern Thai?) 

5185 "Takri": "script", # Script (mostly historic, used in Himachal Pradesh) 

5186 "Tamil": "script", # Also script 

5187 "Telugu": "script", # Also script (India) 

5188 "Thai": "script", # Script 

5189 "Tibetan": "script", # Script 

5190 "Tirhuta": "script", # Script (historical: Maithili, Sanskrit) 

5191 "Warang-Citi": "script", # Script (Ho language, East India) 

5192 "Bopomofo": "script", # Mandarin phonetic symbols script 

5193 "Hán-Nôm": "detail", # Vietnamese Latin spelling with diacritics? 

5194 "IPA": "detail", 

5195 "pre-1989-IPA": "detail", 

5196 "Sinological-IPA": "detail", 

5197 "X-system": "detail", # Esperanto circumflex accent encoding method 

5198 "Foochow-Romanized": "detail", # latin script for Fuzhou Eastern Min 

5199 "Phak-fa-su": "detail", # latin alphabet used by missionaries for Hakka (PFS) 

5200 "Hakka-Romanization-System": "detail", # Taiwanese Hakka Romanization System 

5201 "Kienning-Colloquial-Romanized": "detail", # missionary romanization system for the Kienning Dialect of Northern Min 

5202 "Latinxua-Sin-Wenz": "detail", 

5203 "Tai-lo": "detail", # romanization system for Taiwanese Hokkien 

5204 "Tongyong-Pinyin": "detail", # Taiwanese romanization from 2002 to 2008 

5205 "Jyutping": "detail", # used in Cantonese 

5206 "McCune-Reischauer": "detail", # Used in Korean 

5207 "Hagfa-Pinyim": "detail", 

5208 "Rōmaji": "detail", # Used in Okinawan, Japanese? for Latin characters 

5209 "Yale": "detail", # used in Cantonese 

5210 "Guangdong-Romanization": "detail", # way of romanizing Cantonese, Teochew, Hakka and Hainanese 

5211 "Wiktionary-specific": "detail", # denotes the use of Wiktionary specific conventions in spelling etc. 

5212 "internet-slang": "misc", 

5213 "Jinmeiyō": "misc", # Type of Kanji used for names 

5214 "-i": "class", # Japanese inflection type 

5215 "-na": "class", # Japanese inflection type 

5216 "-nari": "class", # Japanese inflection type 

5217 "-tari": "class", # Japanese inflection type 

5218 "abbreviation": "mod", 

5219 "abessive": "case", # Case 

5220 "ablative": "case", # Case 

5221 "absolute": "case", # Case, Bashkir, Swedish [absolute reflexive] 

5222 "absolutive": "case", # Case (patient or experience of action) 

5223 "abstract": "misc", 

5224 "abstract-noun": "misc", 

5225 "accent/glottal": "misc", 

5226 "accent-paradigm": "detail", 

5227 "accusative": "case", # Case for object in many languages 

5228 "acronym": "mod", # abbreviation formed by the initial letters of other words 

5229 "active": "voice", 

5230 "actor-focus": "misc", # Tagalog 

5231 "actor-indirect": "misc", # Tagalog 

5232 "actor-i": "misc", # Ilocano verbs 

5233 "actor-ii": "misc", 

5234 "actor-iii": "misc", 

5235 "actor-iv": "misc", 

5236 "additive": "misc", # Greenlandic: adds suffix after last letter of stem 

5237 "addressee-feminine": "misc", 

5238 "addressee-masculine": "misc", 

5239 "addressee-plural": "misc", 

5240 "addressee-singular": "misc", 

5241 "adessive": "case", # Case 

5242 "adjectival": "misc", 

5243 "adjective": "pos", 

5244 "adjective-declension": "class", 

5245 "admirative": "mood", # Verb form in Albanian 

5246 "adnominal": "misc", 

5247 "adverb": "pos", 

5248 "adverbial": "misc", # XXX is this same as adverb? 

5249 "adverbial-manner": "misc", # Manner of action adverbial 

5250 "affirmative": "misc", # Used for adjectives, interjections, pronouns 

5251 "affix": "pos", 

5252 "after-preposition": "misc", # Word used only after preposition nich/Lower Sorbian 

5253 "agent": "misc", 

5254 "agentive": "case", # Case indicating agent 

5255 "alienable": "possession", # Alienable possession; Choctaw, Ojibwe, Navajo, Tokelauan etc 

5256 "allative": "case", # Case 

5257 "allative-i": "case", 

5258 "allative-ii": "case", 

5259 "allative-iii": "case", 

5260 "allative-iv": "case", 

5261 "allative-v": "case", 

5262 "alphabetic-tones": "misc", 

5263 "already-form": "tense", # e.g. hojiwa/Swahili 

5264 "also": "misc", 

5265 "alt-of": "misc", 

5266 "alternative": "misc", 

5267 "ambitransitive": "transitivity", 

5268 "analytic": "misc", 

5269 "anaphorically": "misc", 

5270 "animate": "category", 

5271 "animal-not-person": "misc", # Refers to animal (e.g., Russian anml suffix) 

5272 "anterior": "tense", # French seems to have "past anterior" tense 

5273 "aorist": "tense", # Verb form (perfective past) E.g., Latin, Macedonian 

5274 "aorist-ii": "tense", # Albanian 

5275 "apocopic": "misc", # Omission of last vowel (+ following consonants) 

5276 "applicative": "mood", # Verb form 

5277 "approximative": "case", # Noun form (case?), e.g., марксизм/Komi-Zyrian 

5278 "archaic": "dialect", 

5279 "article": "detail", 

5280 "assertive": "mood", # Verb form (e.g., Korean) 

5281 "associative": "case", # Case (e.g., Quechua) 

5282 "ateji": "misc", 

5283 "attributive": "case", # Adjective attributive-only form/use 

5284 "augmentative": "misc", # Indicates large size, intensity, seniority 

5285 "augmented": "misc", 

5286 "autonomous": "person", # nigh/Irish; verb form for subjectless clauses 

5287 "auxiliary": "detail", 

5288 "baby-talk": "misc", 

5289 "base-form": "misc", # Base form of the word (e.g., with misspellings of forms) 

5290 "before-lenited-fh": "misc", # Next word starts with lenited fh (Irish) 

5291 "before-past": "misc", # Used before the past tense (Irish) 

5292 "before-vowel": "misc", # next words starts with vowel (in pronunciation) 

5293 "after-vowel": "misc", # -nən/Azerbaijani 

5294 "before-consonant": "misc", # oh-/Choctaw 

5295 "after-consonant": "misc", # -nən/Azerbaijani 

5296 "after-consonant-except-l": "misc", 

5297 "after-l-consonant": "misc", 

5298 "before-s": "misc", 

5299 "before-front-vowel": "misc", 

5300 "before-back-vowel": "misc", 

5301 "benefactive": "case", # Case (beneficiary of an action) 

5302 "broadly": "misc", 

5303 "būdinys": "misc", 

5304 "calque": "misc", 

5305 "cangjie-input": "detail", # Used in Chinese characters 

5306 "canonical": "misc", # Used to mark the canonical word form from the head tag 

5307 "capitalized": "misc", 

5308 "cardinal": "misc", 

5309 "caritive": "case", # Case (lack or absence of something), марксизм/Komi-Zyrian 

5310 "catenative": "misc", 

5311 "causal-final": "misc", 

5312 "causative": "aspect", # Verb aspect (e.g., Japanese); Cause/Reason (Korean) 

5313 "character": "pos", 

5314 "childish": "misc", 

5315 "circumstantial": "mood", # Verb form, e.g., patjaṉi 

5316 "circumposition": "misc", 

5317 "class": "detail", # Used as a head prefix in San Juan Quajihe Chatino (class 68 etc) 

5318 "class-1": "class", # Inflectional classes (e.g., Bantu languages), cf. gender 

5319 "class-10": "class", 

5320 "class-10a": "class", 

5321 "class-11": "class", 

5322 "class-12": "class", 

5323 "class-13": "class", 

5324 "class-14": "class", 

5325 "class-15": "class", 

5326 "class-16": "class", 

5327 "class-17": "class", 

5328 "class-18": "class", 

5329 "class-1a": "class", 

5330 "class-2": "class", 

5331 "class-2a": "class", 

5332 "class-3": "class", 

5333 "class-4": "class", 

5334 "class-5": "class", 

5335 "class-6": "class", 

5336 "class-7": "class", 

5337 "class-8": "class", 

5338 "class-9": "class", 

5339 "class-9a": "class", 

5340 "class-A": "class", # e.g., Old Irish affixed pronoun classes 

5341 "class-B": "class", 

5342 "class-C": "class", 

5343 "class-i": "class", # Choctaw 

5344 "class-ii": "class", 

5345 "class-iii": "class", 

5346 "class-iv": "class", 

5347 "class-v": "class", 

5348 "class-vi": "class", 

5349 "class-vii": "class", 

5350 "class-viii": "class", 

5351 "class-ix": "class", 

5352 "class-x": "class", 

5353 "class-xi": "class", 

5354 "class-xii": "class", 

5355 "class-xiii": "class", 

5356 "class-n": "class", # Chickasaw 

5357 "class-a-i": "class", # Akkadian 

5358 "classifier": "detail", 

5359 "clipping": "misc", 

5360 "clitic": "misc", 

5361 "coactive": "mood", # Verbs in Guaraní 

5362 "cohortative": "mood", # Verb form: plea, imploring, wish, intent, command, purpose 

5363 "collective": "number", # plural interpreted collectively 

5364 "colloquial": "register", 

5365 "combined-form": "misc", # e.g. Spanish combining forms 

5366 "comitative": "case", # Case 

5367 "common": "misc", # XXX where is this used, should this be removed? 

5368 "common-gender": "gender", # Gender in Swedish, Danish 

5369 "comparable": "category", 

5370 "comparative": "degree", # Comparison of adjectives/adverbs 

5371 "comparative-only": "misc", # Only comparative used 

5372 "completive": "aspect", 

5373 "composition": "detail", # Used in Chinese characters 

5374 "compound": "misc", # Compound words 

5375 "compound-of": "misc", 

5376 "concessive": "mood", # Verb form 

5377 "conclusive": "mood", # Verb form (e.g., Bulgarian) 

5378 "concrete": "misc", # Slavic verbs; also used to describe nouns 

5379 "conditional": "mood", # Verb mood 

5380 "conditional-i": "mood", # Verb mood (German) 

5381 "conditional-ii": "mood", # Verb mood (German) 

5382 "conjugation-type": "detail", # Used to indicate form really is conjugation class 

5383 "conjugation-1": "class", 

5384 "conjugation-2": "class", 

5385 "conjugation-3": "class", 

5386 "conjugation-4": "class", 

5387 "conjugation-5": "class", 

5388 "conjugation-6": "class", 

5389 "conjugation-7": "class", 

5390 "conjugative": "misc", # Verb form, e.g., উঘাল/Assamese 

5391 "conjugative-of": "detail", # Korean 

5392 "conjunct": "misc", # Verb form, e.g., gikaa/Ojibwe 

5393 "conjunct-incorporating": "misc", 

5394 "conjunct-non-incorporating": "misc", 

5395 "conjunctive": "mood", # Verb mood (doubt: wish, emotion, possibility, obligation) 

5396 "conjunctive-1": "mood", # e.g. saprast/Latvian 

5397 "conjunctive-2": "mood", 

5398 "conjunction": "misc", # Used in Phalura conjunctions, relative pronouns 

5399 "connective": "misc", # Group of verb forms in Korean 

5400 "connegative": "polarity", # Indicates verb form that goes with negative 

5401 "consecutive": "aspect", # Verb form, e.g., થૂંકવું/Gujarati, noun form марксизм 

5402 "construct": "misc", # Apparently like definite/indefinite (e.g., Arabic) 

5403 "construction-hif'il": "misc", # Subject is cause; active voice 

5404 "construction-hitpa'el": "misc", # middle voice? 

5405 "construction-hitpu'al": "misc", # XXX Same as hitpa'el? 

5406 "construction-huf'al": "misc", # Subject is cause; passive voice 

5407 "construction-nif'al": "misc", # Neutral about subject's role; middle voice 

5408 "construction-pa'al": "misc", # Neutral about subject's role; active voice 

5409 "construction-pa'el": "misc", 

5410 "construction-peal": "misc", # Aramaic, Classical Syriac 

5411 "construction-pi'el": "misc", # Subject is agent; active voice 

5412 "construction-pu'al": "misc", # Subject is agent; passive voice 

5413 "contemplative": "mood", 

5414 "contemporary": "misc", 

5415 "contingent": "mood", # Verb form, উঘাল/Assamese 

5416 "continuative": "aspect", # Verb aspect (actions still happening; e.g., Japanese) 

5417 "contracted": "misc", # Is this the same as contraction? -> not exactly, see ἐρωτάω/Greek 

5418 "contracted-dem-form": "misc", 

5419 "contraction": "mod", 

5420 "contrastive": "mood", # Apparently connective verb form in Korean 

5421 "converb": "misc", # Verb form or special converb word 

5422 "converb-i": "misc", # e.g., խածնել/Armenian 

5423 "converb-ii": "misc", 

5424 "conversive": "mood", # Verb form/type, at least in Swahili, reverse meaning? 

5425 "coordinating": "misc", 

5426 "copulative": "misc", 

5427 "correlative-of": "detail", 

5428 "cot-caught-merger": "misc", 

5429 "count-form": "misc", # Nominal form in Belarusian 

5430 "countable": "category", 

5431 "counter": "detail", 

5432 "counterfactual": "mood", 

5433 "dated": "dialect", 

5434 "dative": "case", # Case in many languages 

5435 "debitive": "misc", # need or obligation (XXX is this same as "obligative" ???) 

5436 "declension-1": "class", 

5437 "declension-2": "class", 

5438 "declension-3": "class", 

5439 "declension-4": "class", 

5440 "declension-5": "class", 

5441 "declension-6": "class", 

5442 "declension-pattern-of": "detail", 

5443 "declinable": "misc", 

5444 "defective": "misc", 

5445 "deferential": "register", # Addressing someone of higher status 

5446 "definite": "referent", 

5447 "definition": "misc", 

5448 "definitive": "misc", # XXX is this used same as "definite": "misc", opposite indefinite? 

5449 "deictically": "misc", 

5450 "delative": "case", # Case 

5451 "deliberate": "misc", 

5452 "demonstrative": "misc", # Type of pronoun 

5453 "demonym": "misc", 

5454 "dependent": "tense", # περπατάω/Greek/Verb (tense?); Egyptian 

5455 "deponent": "misc", # Having passive form with active meaning 

5456 "derogatory": "register", 

5457 "desiderative": "mood", # Verb mood 

5458 "destinative": "case", # Case, marks destination/something destined (e.g. Hindi) 

5459 "determinate": "misc", # Polish verbs (similar to "concrete" in Russian?) 

5460 "determinative-of": "detail", # Korean 

5461 "determiner": "misc", # Indicates determiner; Korean determiner verb forms? 

5462 "deuterotonic": "misc", # e.g., dofuissim/Old Irish 

5463 "diacritic": "misc", 

5464 "dialectal": "misc", 

5465 "digit": "misc", 

5466 "diminutive": "misc", 

5467 "diptote": "class", # Noun having two cases (e.g., Arabic) 

5468 "direct": "aspect", # Apparently verb form (e.g., Hindi, Punjabi) 

5469 "direct-object": "case", # Case for direct object? 

5470 "directional": "case", # Case?, e.g., тэр/Mongolian 

5471 "directive": "case", # Case (locative/nearness), e.g. Basque, Sumerian, Turkic 

5472 "disapproving": "misc", 

5473 "discourse": "misc", # At least some Ancient Greek particles 

5474 "disjunctive": "misc", 

5475 "distal": "referent", # Demonstrative referent is far, cf. proximal, obviative 

5476 "distributive": "number", # Case in Quechua? (is this case or e.g. determiner?) 

5477 "ditransitive": "transitivity", 

5478 "dual": "number", # two in number, cf. singular, trial, plural 

5479 "dubitative": "mood", # Verb form (e.g., Bulgarian) 

5480 "dummy-ignore-skipped": "dummy", # Causes "-" entries to be ignored 

5481 "dummy-ignored-text-cell": "dummy2", # Cell has text but ignored 

5482 "dummy-mood": "dummy", # Used in inflection table parsing, never in data 

5483 "dummy-skip-this": "dummy", # Kludge in parsing, form skipped 

5484 "dummy-tense": "dummy", # Used in inflection table parsing, never in data 

5485 "dummy-object-concord": "dummy", # Used to transform personal pronouns, 

5486 # numbers and gender tags into object- form. 

5487 # This must only be used in the case where the verb has ONLY object 

5488 # concord present in it, because it changes all (listed) subject 

5489 # concord tags (like "first-person" or "plural") into object concord 

5490 # tags (like "object-first-person" and "object-plural"). 

5491 "dummy-remove-this-cell": "dummy2", # পো/Assamese attempt to make this work 

5492 # Use this to get rid of unnecessary cells by propagating: for example 

5493 # if there's a "Notes" header and a text cell beneath it, using the 

5494 # header to give the text cell this tag will nuke it. 

5495 "dummy-reset-headers": "dummy", 

5496 "dummy-use-as-rowtags": "dummy", 

5497 "dummy-use-as-coltags": "dummy", 

5498 "dummy-store-hdrspan": "dummy", 

5499 "dummy-load-stored-hdrspans": "dummy", 

5500 "dummy-reset-stored-hdrspans": "dummy", 

5501 "dummy-section-header": "dummy", # When tables are split up into tables 

5502 # within a template so that the main header (like "Infinitives" in the 

5503 # new Swahili verb tables) is separated from the section it is a header 

5504 # of, use this to force a section header that is active until it is 

5505 # replaced by something else down the line. 

5506 "dummy-reset-section-header": "dummy", # Explicitly remove the saved 

5507 # tags in TableContext.section_header; you can also call dummy-section- 

5508 # header with an otherwise empty tag list, but this is needed when you 

5509 # need to have tags too. 

5510 "durative": "aspect", # Verb form XXX same as continuative? 

5511 "eclipsis": "misc", 

5512 "egressive": "case", # Case? e.g., дворец/Komi-Zyrian 

5513 "elative": "case", # Case 

5514 "ellipsis": "misc", 

5515 "emphatic": "misc", 

5516 "empty-gloss": "misc", # Gloss was present but is empty after cleanup 

5517 "enclitic": "misc", 

5518 "endearing": "misc", # XXX Is this different from diminutive? 

5519 "epic": "misc", 

5520 "epicene": "misc", 

5521 "equative": "case", # Case (indicates something is like something else) 

5522 "ergative": "misc", 

5523 "error-fixme": "error", # "(FIXME)" recognized in Wiktionary 

5524 "error-lua-exec": "error", # Lua error occurred 

5525 "error-lua-timeout": "error", # Lua code execution timed out 

5526 "error-unknown-tag": "error", # Tag not recognized 

5527 "error-misspelling": "error", # Misspelling was recognized in Wiktionary 

5528 "error-exponential-tagsets": "error", 

5529 "error-unrecognized-form": "error", # Word head or table hdr unrecognized 

5530 "especially": "misc", 

5531 "essive": "case", # Case 

5532 "essive-formal": "case", # Hungarian case 

5533 "essive-instructive": "case", # Hungarian case 

5534 "essive-modal": "case", # Hungarian case 

5535 "ethnic": "misc", 

5536 "eumhun": "misc", 

5537 "euphemistic": "misc", 

5538 "evidential": "mood", # Verb form (e.g., Azerbaijani) 

5539 "exaggerated": "misc", 

5540 "excessive": "misc", 

5541 "exclusive": "person", # inclusive vs. exclusive first-person; case in Quechua 

5542 "exessive": "case", # Case (transition away from state) 

5543 "expectative": "mood", # Verb form, e.g., ϯϩⲉ/Coptic 

5544 "expletive": "misc", 

5545 "expressively": "misc", 

5546 "extended": "misc", # At least in some Bulgarian forms, e.g. -лив 

5547 "extinct": "misc", # Used for taxonomic entries, indicates species is extinct 

5548 "factitive": "misc", # Not sure if same or different as factive 

5549 "factive": "mood", # Verb mood, assumed to be true 

5550 "familiar": "register", # Formality/politeness degree of verbs etc 

5551 "feminine": "gender", # Grammatical gender, masculine, neuter, common, class-* etc. 

5552 "feminine-usually": "gender", # m/f, but usually feminine 

5553 "figuratively": "misc", 

5554 "finite-form": "misc", # General category for finite verb forms 

5555 "first-person": "person", 

5556 "focalising": "mood", # Verb form, e.g., ϯϩⲉ/Coptic 

5557 "form-i": "misc", 

5558 "form-ii": "misc", 

5559 "form-iii": "misc", 

5560 "form-iiiq": "misc", 

5561 "form-iiq": "misc", 

5562 "form-iq": "misc", 

5563 "form-iv": "misc", 

5564 "form-ivq": "misc", 

5565 "form-ix": "misc", 

5566 "form-of": "misc", 

5567 "form-v": "misc", 

5568 "form-vi": "misc", 

5569 "form-vii": "misc", 

5570 "form-viii": "misc", 

5571 "form-x": "misc", 

5572 "form-xi": "misc", 

5573 "form-xii": "misc", 

5574 "form-xiii": "misc", 

5575 "formal": "register", # Formality/politeness degree of verbs etc 

5576 "four-corner": "detail", # Used in Chinese characters 

5577 "fourth-person": "person", 

5578 "frequentative": "misc", 

5579 "front-vowel": "misc", 

5580 "front-vowel-harmony": "misc", # -nən/Azerbaijani 

5581 "back-vowel-harmony": "misc", # -nən/Azerbaijani 

5582 "rounded-harmony": "misc", 

5583 "unrounded-harmony": "misc", 

5584 "fusioning": "misc", # Greenlandic suffixes 

5585 "future": "tense", # Verb tense 

5586 "future-near": "tense", # immediate future ba/Zulu 

5587 "future-remote": "tense", # remote future ba/Zulu 

5588 "future-perfect": "tense", # future anteriore ripromettersi/Italian 

5589 "future-i": "tense", # Verb tense (German, e.g., vertippen) 

5590 "future-ii": "tense", # Verb tense (German) 

5591 "gender-neutral": "gender", 

5592 "general": "misc", # In general temporal participle, e.g., talamaq/Azerbaijani 

5593 "general-mood": "mood", # e.g. hojiwa/Swahili 

5594 "genitive": "case", 

5595 "gerund": "non-finite", 

5596 "gnomic": "mood", # e.g. hojiwa/Swahili 

5597 "goal": "mood", # Verb form, e.g., উঘাল/Assamese 

5598 "grade-1-kanji": "misc", 

5599 "grade-2-kanji": "misc", 

5600 "grade-3-kanji": "misc", 

5601 "grade-4-kanji": "misc", 

5602 "grade-5-kanji": "misc", 

5603 "grade-6-kanji": "misc", 

5604 "habitual": "aspect", # Verb aspect 

5605 "half-participle": "non-finite", # e.g. važiuoti/Lithuanian/Verb 

5606 "hangeul": "script", # Korean script 

5607 "hanja": "script", # Han character script (Chinese characters) to write Korean 

5608 "hard": "misc", # sladek/Slovene 

5609 "hellenism": "misc", 

5610 "hidden-n": "class", # Mongolian declension 

5611 "hiragana": "script", # Japanese syllabic spelling for native words 

5612 "historic": "tense", # Grammatical tense/mood for retelling past events 

5613 "historical": "misc", # Relating to history 

5614 "honorific": "register", # Formality/politeness degree of verbs etc 

5615 "hortative": "mood", # Verb mood 

5616 "humble": "register", 

5617 "humorous": "register", 

5618 "hypernym": "misc", 

5619 "hypercorrect": "misc", 

5620 "hyponym": "misc", 

5621 "hypothetical": "mood", # Verb mood (e.g., Japanese) 

5622 "ideophonic": "misc", 

5623 "idiomatic": "misc", 

5624 "if-not-form": "mood", # e.g. hojiwa/Swahili 

5625 "if-when-form": "mood", # e.g. hojiwa/Swahili 

5626 "illative": "case", # Case 

5627 "imperative": "mood", # Mood 

5628 "imperative-only": "misc", 

5629 "imperfect": "tense", # Past tense in various languages 

5630 "imperfect-se": "misc", # Spanish se/ra distinction 

5631 "imperfective": "aspect", # Verb aspect (action not completed) 

5632 "impersonal": "person", # Verb form, e.g., Portuguese impersonal infinitive 

5633 "impolite": "register", # Politeness degree of verbs etc 

5634 "imitating": "misc", # imitating X 

5635 "in-certain-phrases": "misc", 

5636 "in-compounds": "misc", 

5637 "in-plural": "misc", 

5638 "in-indicative": "misc", 

5639 "in-conditional": "misc", 

5640 "in-variation": "misc", # E.g. crush,WiFi,lhama,tsunami/Portuguese, 

5641 "inalienable": "possession", # Inalienable possession: body parts etc; Choctaw, Ojibwe.. 

5642 "inanimate": "category", 

5643 "including": "misc", 

5644 "includes-article": "misc", # Word form includes article 

5645 "inclusive": "person", # inclusive vs. exclusive first-person 

5646 "indeclinable": "class", 

5647 "indefinite": "referent", 

5648 "independent": "misc", # Verb form, e.g., gikaa/Ojibwe 

5649 "indeterminate": "misc", # Polish verbs (similar to "abstract" in Russian) 

5650 "indicative": "mood", # Indicative mood 

5651 "indirect": "aspect", # Verb form, e.g., بونا/ 

5652 "indirect-object": "case", # Case for indirect object 

5653 "inessive": "case", # Case 

5654 "inferential": "mood", # Verb form (w/ aorist), e.g. -ekalmak/Turkish 

5655 "infinitive": "non-finite", # Verb form 

5656 "infinitive-aorist": "non-finite", # e.g. περπατάω/Greek non-finite form 

5657 "infinitive-da": "non-finite", # Estonian: indicative active negative imperfect / indicative active pluperfect / imperative active present (non-2sg) / active perfect (hypothetical action - general action) 

5658 "infinitive-i": "non-finite", # Finnish 

5659 "infinitive-i-long": "non-finite", # Finnish 

5660 "infinitive-ii": "non-finite", # Finnish 

5661 "infinitive-iii": "non-finite", # Finnish 

5662 "infinitive-iv": "non-finite", # Finnish 

5663 "infinitive-ma": "non-finite", # Estonian: positive imperfect, quotative (has happened, is happening, or will happen) / Moksha 

5664 "infinitive-mda": "non-finite", # Moksha 

5665 "infinitive-v": "non-finite", # Finnish 

5666 "infinitive-zu": "non-finite", # German 

5667 "infix": "pos", 

5668 "inferred": "mood", 

5669 "inflected": "misc", # Marks inflected form, contrast to uninflected (e.g., Dutch) 

5670 "inflected-like": "misc", # seleen/Limburgish 

5671 "informal": "register", # Formality/politeness degree of verbs etc 

5672 "initialism": "misc", 

5673 "injunctive": "mood", # Verb form, e.g., पुस्नु/Nepali 

5674 "instructive": "case", # Case 

5675 "instrumental": "case", # Case 

5676 "iterative": "misc", 

5677 "intensifier": "misc", # In participle of intensification, e.g., talamaq 

5678 "intentive": "mood", # Verb form, e.g., patjaṉi 

5679 "interfix-j": "misc", # Greenlandic: adds -j- after long vowel 

5680 "interjection": "misc", 

5681 "interrogative": "mood", 

5682 "intransitive": "transitivity", 

5683 "invariable": "misc", 

5684 "invertive": "case", # Case? (e.g., Сотрэш/Adyghe) 

5685 "involuntary": "mood", # Verb form, e.g., khitan/Indonesian 

5686 "ionic": "misc", # XXX ??? 

5687 "ironic": "misc", 

5688 "irrealis": "mood", # Verb form, e.g., たたかう/Japanese 

5689 "irregular": "misc", # Word has irregular inflection 

5690 "irregular-pronunciation": "misc", # Kanji or similar pronunciation irregular 

5691 "italics": "misc", # Used in head form to indicate italic character variant 

5692 "iō-variant": "misc", # e.g. horior/Latin, interiicio/Latin 

5693 "jargon": "register", 

5694 "jussive": "mood", # Verb mood for orders, commanding, exhorting (subjunctively) 

5695 "kanji": "misc", # Used in word head for some Japanese symbols 

5696 "katakana": "script", # Japanese syllabic spelling for foreign words 

5697 "krama": "register", # Javanese register (polite form) 

5698 "krama-ngoko": "register", # Javanese register (neutral, without polite) 

5699 "kyūjitai": "detail", # Traditional Japanese Kanji (before 1947) 

5700 "l-participle": "non-finite", # dati/Proto-Slavic 

5701 "lative": "case", # Case, e.g., тіл/Khakas 

5702 "lenition": "misc", 

5703 "letter": "misc", 

5704 "letter-name": "misc", 

5705 "limitative": "mood", # Verb form, e.g., ϯϩⲉ/Coptic 

5706 "literally": "misc", 

5707 "literary": "misc", 

5708 "locative": "case", 

5709 "locative-qualitative": "case", 

5710 "long-form": "misc", # Verb forms, отъпоустити/Old Church Slavonic; long past participle e.g. anexar/Portuguese 

5711 "lowercase": "misc", 

5712 "main-clause": "misc", # e.g., omzagen/Dutch 

5713 "mainly": "misc", 

5714 "majestic": "register", # Referring to kings, queens, presidents, God 

5715 "masculine": "gender", # Grammatical gender, see feminine, neuter, common, class-* etc. 

5716 "masculine-usually": "gender", # m/f, but usually masculine 

5717 "material": "misc", 

5718 "matronymic": "misc", 

5719 "medial": "misc", 

5720 "mediopassive": "voice", 

5721 "meliorative": "misc", # XXX See essere/Italian/Noun word head 

5722 "metaphoric": "misc", 

5723 "metonymically": "misc", 

5724 "metrically": "misc", # Used in Sanskrit word heads 

5725 "mi-form": "misc", # Malagasy verbs 

5726 "middle": "voice", # At least middle voice (cf. active, passive) 

5727 "middle-infinitive": "non-finite", 

5728 "mildly": "misc", 

5729 "misconstruction": "misc", # Used for e.g. incorrect Latin plurals 

5730 "misspelling": "misc", 

5731 "mixed": "misc", 

5732 "mixedcase": "misc", 

5733 "mnemonic": "misc", 

5734 "modal": "misc", 

5735 "modern": "misc", 

5736 "modified": "misc", # Noun form, e.g., dikko/Sidamo (similar to person?) 

5737 "monopersonal": "misc", 

5738 "morpheme": "misc", 

5739 "morse-code": "misc", 

5740 "motive-form": "mood", # Verb form for Korean (e.g., 조사하다) 

5741 "multiplicative": "case", # adverbial case in Finnish 

5742 "multiword-construction": "misc", # complex tenses in French/English conjugation 

5743 "mutated": "misc", 

5744 "mutation": "misc", 

5745 "mutation-aspirate": "misc", 

5746 "mutation-mixed": "misc", 

5747 "mutation-nasal": "misc", 

5748 "mutation-radical": "misc", # "radical" in mutation tables, e.g. hun/Welsh 

5749 "mutation-soft": "misc", # At least Welsh 

5750 "name": "misc", 

5751 "narrowly": "misc", 

5752 "natural": "misc", 

5753 "necessitative": "mood", # Verb form in some languages 

5754 "negated-with": "misc", # Indicates how word is negated, e.g., ϣⲗⲏⲗ/Coptic 

5755 "negative": "polarity", # Indicates negation of meaning (nominal or verbal) 

5756 "neologism": "misc", 

5757 "neuter": "gender", # Gender, cf. masculine, feminine, common-gender etc. 

5758 "next": "misc", # Next value in sequence (number, letter, etc.) 

5759 "no-absolute": "misc", # No absolute form; femri/Icelandic 

5760 "no-auxiliary": "misc", # No auxiliary needed for verb (?); lavarsi/Italian 

5761 "no-comparative": "misc", # The word has no comparative form 

5762 "no-construct-forms": "misc", # The word has no construct forms 

5763 "no-definite": "misc", # Danish "no definite forms" 

5764 "no-diminutive": "misc", # No diminutive form (goeste/West Flemish) 

5765 "no-feminine": "misc", # No feminine form (ácimo/Spanish) 

5766 "no-first-person-singular-past-historic": "misc", # Italian 

5767 "no-first-person-singular-present": "misc", # Spanish (only third person?) 

5768 "no-first-person-singular-preterite": "misc", # Spanish (only third person?) 

5769 "no-genitive": "misc", # The word has no genitive form 

5770 "no-gloss": "misc", # This sense has no glosses 

5771 "no-gradation": "gradation", # No consonant gradation 

5772 "no-imperfective": "misc", # No imperfective form (исходить/Russian) 

5773 "no-infinitive": "misc", # No infinitive form (måste/Swedish) 

5774 "no-nominative": "misc", # The word has no nominative form (from this base) 

5775 "no-nominative-plural": "misc", # The word has no nominative plural 

5776 "no-past": "misc", # No simple past form 

5777 "no-past-participle": "misc", # The word has no past participle 

5778 "no-perfect": "misc", # The word has no perfect/perfective aspect/form 

5779 "no-plural": "misc", # The word has no plural form (= singular only) 

5780 "no-possessor": "misc", # No possessor in possessive hajallan/Finnish 

5781 "no-present-participle": "misc", # The word has no present participle 

5782 "no-second-person-singular-imperative": "misc", # No imperative 

5783 "no-singulative": "misc", # no singulative form 

5784 "no-short-form": "misc", # no short forms (Russian) 

5785 "no-superlative": "misc", # The word has no superlative form 

5786 "no-supine": "misc", # The word has no supine form 

5787 "no-third-person-singular-past-historic": "misc", # Italian 

5788 "no-third-person-singular-present": "misc", # mittagessen/German 

5789 "nominal": "pos", 

5790 "nominal-state": "misc", 

5791 "nominative": "case", 

5792 "nomino-accusative": "misc", # 𒀀𒄿𒅖/Hittite XXX same as nominative/accusative??? 

5793 "non-aspectual": "aspect", # E.g., भूलना/Hindi 

5794 "non-durative": "misc", # non-durative sentence, e.g., ϣⲗⲏⲗ/Coptic 

5795 "non-numeral": "misc", # Assamese noun forms 

5796 "non-past": "tense", # Verb tense (e.g., Korean) 

5797 "non-prospective": "misc", # e.g. götürmek/Turkish 

5798 "non-scientific": "misc", 

5799 "non-subject": "misc", # ishno'/Chickasaw 

5800 "nonce-word": "misc", 

5801 "nondeferential": "misc", 

5802 "nonstandard": "dialect", 

5803 "nonvirile": "category", 

5804 "not-clause-initial": "misc", 

5805 "not-comparable": "category", 

5806 "not-mutable": "misc", 

5807 "not-translated": "misc", 

5808 "not-yet-form": "tense", # e.g. hojiwa/Swahili 

5809 "noun": "pos", 

5810 "noun-from-adj": "derivation", 

5811 "noun-from-noun": "derivation", # Greenlandic: suffix derives nominal from nominal 

5812 "noun-from-verb": "derivation", # Greenlandic: suffix derives nominal from verb 

5813 "numeral": "pos", # Numeral part-of-speech; also Assamese noun forms 

5814 "numeral-tones": "misc", 

5815 "obligative": "mood", # Verb form (e.g., Azerbaijani) 

5816 "object-concord": "misc", # Verb form includes object-based inflection 

5817 "object-first-person": "object", # Swahili object concords, Spanish combined-form 

5818 "object-second-person": "object", 

5819 "object-third-person": "object", 

5820 "object-singular": "object", 

5821 "object-plural": "object", 

5822 "object-definite": "object", # Object is definite, e.g. fut/Hungarian 

5823 "object-indefinite": "object", # Object is indefinite 

5824 "object-class-1": "object", # Swahili object class for object concord 

5825 "object-class-2": "object", 

5826 "object-class-3": "object", 

5827 "object-class-4": "object", 

5828 "object-class-5": "object", 

5829 "object-class-6": "object", 

5830 "object-class-7": "object", 

5831 "object-class-8": "object", 

5832 "object-class-9": "object", 

5833 "object-class-10": "object", 

5834 "object-class-11": "object", 

5835 "object-class-12": "object", 

5836 "object-class-13": "object", 

5837 "object-class-14": "object", 

5838 "object-class-15": "object", 

5839 "object-class-16": "object", 

5840 "object-class-17": "object", 

5841 "object-class-18": "object", 

5842 "object-masculine": "object", # Pashto verbs 

5843 "object-feminine": "object", 

5844 "objective": "case", # Case, used as an object 

5845 "oblique": "case", # Apparently like case form (e.g., Hindi) 

5846 "obsolete": "dialect", 

5847 "obviative": "referent", # Referent is not the most salient one, cf. proximal, distal 

5848 "offensive": "register", 

5849 "often": "misc", 

5850 "one-termination": "misc", 

5851 "onomatopoeic": "misc", 

5852 "oppositive": "misc", # expresses contrariety 

5853 "optative": "misc", 

5854 "ordinal": "misc", 

5855 "parasynonym": "misc", 

5856 "parenthetic": "misc", 

5857 "participle": "non-finite", 

5858 "participle-1": "non-finite", # e.g. saprast/Latvian/Verb 

5859 "participle-2": "non-finite", 

5860 "participle-3": "non-finite", 

5861 "participle-4": "non-finite", 

5862 "particle": "pos", 

5863 "partitive": "case", # Case 

5864 "passive": "voice", 

5865 "passive-mostly": "misc", # Attested mostly in the passive 

5866 "past": "tense", 

5867 "past-future": "tense", # Future in the past 

5868 "past-recent": "tense", 

5869 "past-remote": "tense", 

5870 "patronymic": "misc", 

5871 "paucal": "number", # cf. singular, plural, dual, trial 

5872 "pausal": "misc", # Relates to prosody/pronunciation? 

5873 "pejorative": "misc", 

5874 "perfect": "tense", # Tense/verb form, e.g., in Finnish 

5875 "perfect-i": "tense", # E.g., talamaq/Azerbaijani 

5876 "perfect-ii": "tense", # E.g., talamaq/Azerbaijani 

5877 "perfective": "aspect", # Verb aspect 

5878 "person": "category", 

5879 "personal": "misc", # Type of pronoun; Verb form (e.g., Portuguese personal infinitive) 

5880 "phoneme": "misc", 

5881 "phrasal": "misc", 

5882 "phrase": "misc", 

5883 "physical": "misc", 

5884 "pin-pen-merger": "misc", 

5885 "place": "misc", 

5886 "pluperfect": "tense", # Tense/verb form 

5887 "pluperfect-i": "tense", # воштыны'/Udmurt 

5888 "pluperfect-ii": "tense", 

5889 "plural": "number", # Number, cf. singular, dual, trial 

5890 "plural-of": "detail", # Plural form of something 

5891 "plural-of-variety": "misc", # Plural indicating different kinds of things (Arabic) 

5892 "plural-only": "misc", # Word only manifested in plural in this sense 

5893 "plural-normally": "misc", # Usually plural, but singular may be possible 

5894 "poetic": "misc", 

5895 "polite": "register", # Politeness degree of verbs etc 

5896 "polytonic": "misc", 

5897 "positive": "degree", # opposite of negative (usually unattested); degree 

5898 "possessed-form": "misc", # Marks object that is possessed, cf. possessed 

5899 "possessive": "possession", # Possession (marks who possesses) 

5900 "possessed-single": "possession", # Possessive with single possessed 

5901 "possessed-many": "possession", # Possessive with multiple possessed 

5902 "possessed-two": "possession", # Two possessed, Mansi 

5903 "possessed-masculine": "possession", # Possessive with masculine possessed 

5904 "possessed-feminine": "possession", # Possessive with feminine possessed 

5905 "possessed-common": "possession", # Possessive with common-g possessed 

5906 "possessed-neuter": "possession", # Possessive with neuter possessed 

5907 "possibly": "misc", 

5908 "postpositional": "misc", 

5909 "potential": "mood", # Verb mood 

5910 "praenominal": "misc", 

5911 "precursive": "mood", # Verb form, e.g. ϯϩⲉ/Coptic 

5912 "predicative": "case", # Adjective predicate-only form/use 

5913 "prefix": "pos", 

5914 "preparative": "aspect", # Verb form, e.g., ᠵᡠᠸᡝᡩᡝᠮᠪᡳ/Manchu 

5915 "prepositional": "misc", 

5916 "present": "tense", # Verb tense 

5917 "present-rare": "misc", # Present tense is rare 

5918 "presumptive": "mood", # Verb mood, e.g., गरजना/Hindi 

5919 "preterite": "tense", # Verb tense (action in the past, similar to simple past) 

5920 "preterite-present": "tense", # word where present&preterite forms look opposite 

5921 "preterite-perfect": "tense", # trapassato remoto ripromettersi/Italian 

5922 "preterite-i": "tense", # воштыны/Udmurt 

5923 "preterite-ii": "tense", 

5924 "pretonic": "misc", # Precedes stressed syllable 

5925 "previous": "misc", # Previous value in sequence (number, letter, etc.) 

5926 "proclitic": "misc", 

5927 "progressive": "aspect", # Verb form, e.g., પચવું/Gujarati 

5928 "prohibitive": "mood", # Verb form (negative imperative), e.g., Old Armenian 

5929 "prolative": "case", 

5930 "pronominal": "misc", 

5931 "pronominal-state": "misc", 

5932 "pronoun": "pos", 

5933 "pronoun-included": "misc", 

5934 "pronunciation-spelling": "misc", 

5935 "proper-noun": "pos", 

5936 "proscribed": "misc", 

5937 "prosecutive": "case", # Case (move along a surface or way); Greenlandic -nnguaq 

5938 "prospective": "misc", # E.g., götürmek/Turkish 

5939 "prothesis": "misc", 

5940 "prothesis-h": "misc", 

5941 "prothesis-t": "misc", 

5942 "prototonic": "misc", # E.g., dofuissim/Old Irish 

5943 "proximal": "referent", # Demonstrative referent is near, cf. distal, obviative 

5944 "purposive": "mood", # Verb form, e.g., patjaṉi 

5945 "quadral": "misc", 

5946 "quantified": "misc", # bat/Jamaican Creole (head form) 

5947 "quotative": "mood", # Verb mood (marks quoted speech keeping orig person/tense) 

5948 "radical": "detail", # Used in Chinese characters 

5949 "radical+strokes": "detail", # Used in Chinese characters 

5950 "rare": "misc", 

5951 "realis": "mood", # Verb form, e.g., たたかう/Japanese 

5952 "reason": "mood", # Verb form, e.g., উঘাল/Assamese 

5953 "recently": "misc", # Used in Recently complete, e.g., {ligpit,magbukid}/Tagalog 

5954 "reciprocal": "misc", # Mutual action (broad sense reflexive) 

5955 "reconstruction": "misc", # This word/sense is a reconstruction for a dead language 

5956 "reduced": "misc", # de/Central Franconian (XXX merge with e.g. clipping?) 

5957 "reduplication": "misc", 

5958 "reflexive": "misc", 

5959 "reflexive-of": "detail", # Reflexive form of something 

5960 "regional": "misc", 

5961 "relational": "misc", 

5962 "relative": "person", # At least gp/Egyptian, nigh/Irish verb forms; conjunctions 

5963 "renarrative": "mood", # Verb form (e.g. Bulgarian) 

5964 "replacive": "misc", # Greenlandic suffixes 

5965 "reported": "mood", # Verb forms for reported speech 

5966 "resultative": "misc", # participle in Armenian (state resulting from action) 

5967 "retronym": "misc", 

5968 "revised": "misc", # Used in many Korean words, is this same as revised-jeon? 

5969 "revised-jeon": "misc", 

5970 "rhetoric": "misc", 

5971 "romanization": "detail", # Latin character version of other script 

5972 "root": "misc", 

5973 "sarcastic": "misc", 

5974 "second-person": "person", 

5975 "second-person-semantically": "person", # semantically second person 

5976 "secular": "misc", # Contrast with Ecclesiastical, Tham, etc 

5977 "self-depreciating": "misc", # Expression is self-depreciating 

5978 "semelfactive": "misc", 

5979 "sentence-case": "misc", # дь/Yakut 

5980 "sentence-final": "misc", # Korean verb forms (broad category) 

5981 "separable": "misc", # Used for separable verbs, e.g. omzagen/Dutch 

5982 "separative": "case", # e.g. keulemmaksi/Finnish 

5983 "sequence": "misc", 

5984 "sequential": "misc", 

5985 "shinjitai": "misc", # Simplified Japanese Kanji (after 1947) 

5986 "short-form": "misc", # Verb forms, отъпоустити/Old Church Slavonic; Portuguese short past participle e.g. anexar/Portuguese 

5987 "si-perfective": "misc", 

5988 "simplified": "misc", 

5989 "simultaneous": "misc", # simultaneous converb, e.g. խածնել/Armenian 

5990 "singular": "number", # Number, cf. plural, dual, trial, paucal 

5991 "singular-normally": "misc", 

5992 "singular-only": "misc", 

5993 "singulative": "misc", # Individuation of a collective or mass noun, like number 

5994 "situative": "case", # expressing location of things in comparison with one another 

5995 "slang": "register", 

5996 "slur": "misc", 

5997 "sociative": "case", # Case?, e.g., மரம்/Tamil 

5998 "soft": "misc", # najslajši/slovene 

5999 "sometimes": "misc", 

6000 "special": "misc", # Adverbial verb form in Lithuanian 

6001 "specific": "misc", # In specific temporal participle, e.g., talamaq 

6002 "specifically": "misc", 

6003 "standalone": "misc", # Without a main word (e.g., pronoun/determiner senses) 

6004 "standard": "misc", 

6005 "stative": "misc", 

6006 "stem": "misc", # Stem rather than full forms 

6007 "stem-primary": "misc", # Primary stem, e.g., दुनु/Nepali 

6008 "stem-secondary": "misc", # Secondary stem, e.g., दुनु/Nepali 

6009 "stress-pattern-1": "misc", 

6010 "stress-pattern-2": "misc", 

6011 "stress-pattern-3": "misc", 

6012 "stress-pattern-3a": "misc", 

6013 "stress-pattern-3b": "misc", 

6014 "stress-pattern-4": "misc", 

6015 "stressed": "misc", # Marked/full form, cf. unstressed 

6016 "stressed-preposition": "misc", 

6017 "strict-sense": "misc", 

6018 "strokes": "misc", 

6019 "strong": "misc", # strong form / strong inflection class 

6020 "subjective": "case", # Case, used as a subject; subject form 

6021 "subjunctive": "mood", # Subjunctive mood 

6022 "subjunctive-i": "mood", # Subjunctive i mood (German) 

6023 "subjunctive-ii": "mood", # Subjunctive ii mood (German) 

6024 "sublative": "case", 

6025 "subordinate-clause": "misc", # e.g., ϣⲗⲏⲗ/Coptic 

6026 "subordinating": "misc", 

6027 "subscript": "script", # Variant of certain characters 

6028 "substantive": "misc", 

6029 "subsuntive": "misc", # Verbs in Guaraní 

6030 "suffix": "pos", 

6031 "superessive": "case", # Case, e.g., Hungarian 

6032 "superlative": "degree", # Comparison of adjectives/adverbs 

6033 "superplural": "number", # Very many (rare, e.g. Barngarla (Australian)) 

6034 "superscript": "script", # Variant of certain characters 

6035 "supine": "non-finite", # Various non-finite forms in several languages 

6036 "suppletive": "misc", 

6037 "surname": "misc", 

6038 "suru": "class", # Japanese verb inflection type 

6039 "syllable-final": "misc", 

6040 "syllable-initial": "misc", 

6041 "symbol": "misc", 

6042 "syncope": "misc", 

6043 "synecdoche": "misc", 

6044 "synonym": "misc", 

6045 "synonym-of": "misc", 

6046 "table-tags": "detail", # Tags from inflection table, for all entries 

6047 "inflection-template": "detail", # Name of top-level template 

6048 "taboo": "misc", 

6049 "tafa-form": "misc", # Malagasy verbs 

6050 "temporal": "misc", # relating to time/tense, e.g., talamaq; Finnish adverbials 

6051 "term-of-address": "misc", 

6052 "terminative": "aspect", # Verb aspect/mood (e.g., Japanese); also case in Quechua? 

6053 "thematic": "misc", 

6054 "third-person": "person", 

6055 "three-termination": "misc", 

6056 "tone-1": "misc", 

6057 "tone-2": "misc", 

6058 "topicalized": "misc", 

6059 "toponymic": "misc", 

6060 "traditional": "misc", 

6061 "transcription": "misc", 

6062 "transgressive": "non-finite", # Verb form XXX non-finite/mood/tense? 

6063 "transitive": "transitivity", 

6064 "transitive-with-of": "misc", 

6065 "translation-hub": "misc", # Predictable compound term with translations, no gloss 

6066 "translative": "case", 

6067 "translingual": "misc", 

6068 "transliteration": "misc", 

6069 "trial": "number", # Number, cf. singular, dual, plural 

6070 "trigger-actor": "trigger", # Actor trigger, e.g., magtinda/Tagalog 

6071 "trigger-benefactive": "trigger", # Benefactive trigger 

6072 "trigger-causative": "trigger", # Causative trigger 

6073 "trigger-instrument": "trigger", # Instrument trigger 

6074 "trigger-locative": "trigger", # Locative trigger 

6075 "trigger-measurement": "trigger", # Measurement trigger, e.g., rumupok/Tagalog 

6076 "trigger-object": "trigger", # Object trigger 

6077 "trigger-referential": "trigger", # Referential trigger 

6078 "triggers-eclipsis": "trigger", # Irish 

6079 "triggers-h-prothesis": "trigger", # Irish 

6080 "triggers-lenition": "trigger", # Irish 

6081 "triggers-mutation-aspirate": "trigger", # Welsh 

6082 "triggers-mutation-mixed": "trigger", # Welsh 

6083 "triggers-mutation-nasal": "trigger", # Old Irish 

6084 "triggers-mutation-soft": "trigger", # Welsh 

6085 "triggers-no-mutation": "trigger", # Irish 

6086 "triptote": "class", # Noun having three cases (e.g., Arabic) 

6087 # ~ "triptote-a": "class", # "singular triptote in ـَة (-a)" جاذب/Arabic/Adj 

6088 "truncative": "misc", # Greenlandic: suffix attaches to last vowel, removing stuff 

6089 "two-termination": "misc", 

6090 "type-a": "class", 

6091 "type-b": "class", 

6092 "type-p": "class", 

6093 "type-u": "class", 

6094 "type-ua": "class", 

6095 "type-up": "class", 

6096 "unabbreviated": "mod", 

6097 "unaugmented": "misc", 

6098 "uncommon": "misc", 

6099 "uncountable": "category", 

6100 "unemphatic": "misc", 

6101 "uninflected": "misc", # uninflected form (e.g., Dutch), cf. inflected 

6102 "universal": "misc", # universally known (καθεμία/Greek) 

6103 # Arabic seems to use "unknown" for theoretical forms not attested 

6104 "unknown": "misc", # Apparently verb form, e.g., जाँच्नु/Nepali 

6105 "unmodified": "misc", # Noun form, e.g., dikko/Sidamo (similar to person?) 

6106 "unpossessed-form": "possession", # Not possessed (often omitted) 

6107 "unspecified": "misc", # селен/Macedonian uses this like proximal/distal 

6108 "unstressed": "misc", # Unstressed (unmarked, weaker) form 

6109 "unstressed-before-j": "misc", # unstressed when next word starts with /j/ 

6110 "uppercase": "misc", 

6111 "used-in-the-form": "misc", 

6112 "usually": "misc", 

6113 "usually-without-article": "misc", 

6114 "utterance-medial": "misc", 

6115 "variant": "misc", 

6116 "vav-consecutive": "misc", 

6117 "vernacular": "register", 

6118 "verb": "pos", 

6119 "verb-completement": "misc", # Used in some Chinese words (merged verb+complement?) 

6120 "verb-form-da": "misc", # Estonian da-form XXX is this same as infinitive-da? 

6121 "verb-form-des": "misc", # Estonian des-form 

6122 "verb-form-i": "misc", 

6123 "verb-form-ii": "misc", 

6124 "verb-from-noun": "derivation", # Forms verbs from nominals 

6125 "verb-object": "misc", # Used in some Chinese words (verb+object in same entry?) 

6126 "verb-from-verb": "derivation", # Suffix modifies verbs producing verbs 

6127 "vigesimal": "misc", 

6128 "virile": "category", 

6129 "visual-rendering": "misc", 

6130 "voa-form": "misc", # Malagasy verbs 

6131 "vocative": "case", # Case? used for addressee 

6132 "volitive": "mood", # Verb form ? XXX is this same as volitional? 

6133 "volitional": "mood", # Verb mood (e.g., Japanese: suggests, urges, initiates act) 

6134 "vos-form": "register", # Spanish verb forms used with "vos" 

6135 "vulgar": "register", 

6136 "weak": "misc", 

6137 "with-a": "with", 

6138 "with-ablative": "with", 

6139 "with-absolute": "with", 

6140 "with-absolutive": "with", 

6141 "with-accusative": "with", 

6142 "with-action-noun-in-elative": "with", 

6143 "with-adessive": "with", 

6144 "with-adjective": "with", 

6145 "with-adverb": "with", 

6146 "with-allative": "with", 

6147 "with-an": "with", 

6148 "with-avec": "with", 

6149 "with-ce": "with", 

6150 "with-che": "with", 

6151 "with-comparative": "with", 

6152 "with-con": "with", 

6153 "with-conditional": "with", 

6154 "with-da": "with", 

6155 "with-dative": "with", 

6156 "with-de": "with", 

6157 "with-definite-article": "with", 

6158 "with-di": "with", 

6159 "with-down": "with", 

6160 "with-ela": "with", 

6161 "with-elas": "with", 

6162 "with-elative": "with", 

6163 "with-ele": "with", 

6164 "with-eles": "with", 

6165 "with-ella": "with", 

6166 "with-ellas": "with", 

6167 "with-ellos": "with", 

6168 "with-en": "with", 

6169 "with-essive": "with", 

6170 "with-eu": "with", 

6171 "with-infinitive-i": "with", 

6172 "with-future": "with", 

6173 "with-for": "with", 

6174 "with-gendered-noun": "with", 

6175 "with-genitive": "with", 

6176 "with-gij": "with", 

6177 "with-hiri": "with", 

6178 "with-hura": "with", 

6179 "with-illative": "with", 

6180 "with-imperfect": "with", 

6181 "with-in": "with", 

6182 "with-indicative": "with", 

6183 "with-indirect-object": "with", 

6184 "with-indirect-relative": "with", 

6185 "with-inessive": "with", 

6186 "with-infinitive": "with", 

6187 "with-instrumental": "with", 

6188 "with-it-dialectally": "with", 

6189 "with-järgi": "with", 

6190 "with-kala": "with", 

6191 "with-kV": "with", # gǀkxʻâã/ǃXóõ 

6192 "with-lai": "with", 

6193 "with-locative": "with", 

6194 "with-meel": "with", 

6195 "with-negation": "with", 

6196 "with-negative-adj": "with", 

6197 "with-nominative": "with", 

6198 "with-nos": "with", 

6199 "with-nosotras": "with", 

6200 "with-nosotros": "with", 

6201 "with-noun": "with", 

6202 "with-noun-phrase": "with", 

6203 "with-number": "with", 

6204 "with-objective": "with", 

6205 "with-odd-syllable-stems": "with", 

6206 "with-of": "with", 

6207 "with-olemassa": "with", # Finnish 

6208 "with-on": "with", 

6209 "with-optative": "with", 

6210 "with-others": "with", 

6211 "with-partitive": "with", 

6212 "with-passive-present-participle": "with", 

6213 "with-passive-past-participle-partitive": "with", 

6214 "with-passive-past-participle-translative": "with", 

6215 "with-past": "with", 

6216 "with-past-participle": "with", 

6217 "with-past-participle-translative": "with", 

6218 "with-past-participle-partitive": "with", 

6219 "with-per": "with", 

6220 "with-personal-pronoun": "with", 

6221 "with-por": "with", 

6222 "with-positive-imperative": "with", 

6223 "with-possessive-suffix": "with", 

6224 "with-pour": "with", 

6225 "with-prepositional": "with", 

6226 "with-present": "with", 

6227 "with-savrtsobi": "with", 

6228 "with-su": "with", 

6229 "with-subjunctive": "with", 

6230 "with-subordinate-clause": "with", 

6231 "with-sur": "with", 

6232 "with-dummy-subject": "with", 

6233 "with-there": "with", 

6234 "with-third-person": "with", 

6235 "with-third-person-singular": "with", 

6236 "with-infinitive-iii": "with", 

6237 "with-infinitive-iii-abessive": "with", 

6238 "with-infinitive-iii-elative": "with", 

6239 "with-infinitive-iii-illative": "with", 

6240 "with-to": "with", 

6241 "with-translative": "with", 

6242 "with-tu": "with", 

6243 "with-tú": "with", 

6244 "with-up": "with", 

6245 "with-usted": "with", 

6246 "with-ustedes": "with", 

6247 "with-você": "with", 

6248 "with-vocês": "with", 

6249 "with-von": "with", 

6250 "with-vos": "with", 

6251 "with-voseo": "with", 

6252 "with-vosotras": "with", 

6253 "with-vosotros": "with", 

6254 "with-välja": "with", 

6255 "with-vós": "with", 

6256 "with-yo": "with", 

6257 "with-zuek": "with", 

6258 "with-à": "with", 

6259 "with-él": "with", 

6260 "without-article": "misc", # E.g., grüun/Cimbrian 

6261 "without-noun": "misc", 

6262 "æ-tensing": "misc", 

6263 "има": "misc", # Distinguishes certain verb forms in Macedonian 

6264 "non-human": "misc", # XXX is there already a tag for this? himself/English - KJ 

6265 "human-person": "misc", 

6266 "with-article": "with", # Mosambik/German 

6267 "before-noun": "misc", # Mama/German 

6268 "with-numeral": "with", # Radlermaß/German 

6269 "without-numeral": "misc", # Radlermaß/German 

6270 "same-sort": "number", # Wahnsinnsding/German 

6271 "different-sort": "number", # Wahnsinnsding/German 

6272 "sigmatic": "mood", # adiuvo/Latin 

6273 "dummy-column": "dummy", # in חֲתוּלָתִי‎/Hebrew, Isolated forms 

6274 "be-prefix": "misc", # laikytis/Lithuanian, multi-use prefix... 

6275 "Japanese": "script", # also script, 弧/translingual, stroke count stuff 

6276 "privative": "mood", # afrohet/Albanian 

6277 # ~ "comparative-of": "degree", # miður/Icelandic 

6278 "xemxin-assimilation": "misc", # lil/Maltese 

6279 "qamrin-unassimilation": "misc", 

6280 "with-conjunction": "with", # thathar/Scottish Gaelic 

6281 "with-pronoun": "with", # thathar/Scottish Gaelic 

6282 "unabbreviation": "mod", # jku/Finnish 

6283 "long-construct": "misc", # a ذو الحجة/Arabic 

6284 "actor-secondary": "aspect", # Tagalog thing 

6285 "inferior": "degree", # madali/Tagalog 

6286 "superior": "degree", 

6287 "equal": "degree", 

6288 "l-case": "case", # ufuy/Afar 

6289 "k-case": "case", # ufuy/Afar 

6290 "t-case": "case", # ufuy/Afar 

6291 "h-case": "case", # ufuy/Afar 

6292 "with-postposition": "with", # ufuy/Afar 

6293 # icfide/Afar 

6294 "immediate-future": "tense", 

6295 "potential-i": "mood", 

6296 "potential-ii": "mood", 

6297 "n-affirmative": "misc", 

6298 "v-affirmative": "misc", 

6299 "conjunctive-i": "mood", 

6300 "conjunctive-ii": "mood", 

6301 "consultative": "mood", 

6302 "h-converb": "non-finite", 

6303 "i-form": "non-finite", 

6304 "k-converb": "non-finite", 

6305 "innuh-converb": "non-finite", 

6306 "innuk-converb": "non-finite", 

6307 "v-focus": "non-finite", 

6308 "n-focus": "non-finite", 

6309 # qunxa/Afar 

6310 "indicative-i": "mood", 

6311 "indicative-ii": "mood", 

6312 "duoplural": "number", # niteel/Navajo 

6313 "indefinite-person": "person", 

6314 "spatial-person": "person", 

6315 "middle-voice": "voice", # अवति/Sanskrit 

6316 "inversion": "case", # დაწერს/Georgian 

6317 "full-form": "misc", # ichwane/Zulu, "full" and "basic" forms 

6318 "basic-form": "misc", 

6319 "possessive-substantive": "possession", # explicit possessives without possessed: father's computer -> that's father's 

6320 "unmutated": "misc", # glad/Breton 

6321 "mutation-hard": "misc", 

6322 "confirmative": "tense", # сэрээх/Mongolian, past tense + evidentiality 

6323 # also 'resultative', but that's already used 

6324 "with-ergative": "with", # a ہاوُن/Kashmiri 

6325 "with-determiner": "with", # idealistesch/Luxembourgish 

6326 "without-determiner": "misc", 

6327 "with-head": "with", 

6328 "consequential": "mood", # erakutsi/Basque 

6329 "past-i": "tense", # eh/Albanian 

6330 "past-ii": "tense", 

6331 "focus": "detail", # magwahil/Tagalog, trigger-focus 

6332 "sound-plural": "class", 

6333 "ar-infl-in": "class", # Decomposing Arabic inflectional paradigms, سحلية/Arabic,تحو/Arabic 

6334 "ar-infl-ah": "class", # a قناة السويس/Arabic حماة/Arabic 

6335 "ar-infl-an-maksura": "class", # a مدى/Arabic 

6336 "ar-infl-an-alef": "class", # a سنا/Arabic 

6337 "ar-infl-awna": "class", 

6338 "ar-infl-a": "class", # a رمية/Arabic # "singular triptote in ـَة (-a)" جاذب/Arabic/Adj 

6339 "broken-form": "class", # Arabic broken-plural and broken-paucal 

6340 "sound-form": "class", # Arabic sound-feminine-plural sound-masculine-paucal etc. 

6341 "substantive-case": "case", # ананас/Chechen 

6342 "comparative-case": "case", # ананас/Chechen 

6343 "representative": "case", # a ئانا/Uyghur 

6344 "similitude": "case", # Uyghur 

6345 "v1": "misc", # verb-first, verb-second: these have a common term V1 and V2 

6346 "v2": "misc", # tèlle/Limburgish 

6347 "v3": "misc", 

6348 "intimate": "register", # ਪਾਉਣਾ/Punjabi 

6349 "accusative-i": "case", # ань/Komi-Zyrian 

6350 "accusative-ii": "case", # ань/Komi-Zyrian 

6351 "prolative-i": "case", # ань/Komi-Zyrian 

6352 "prolative-ii": "case", # ань/Komi-Zyrian 

6353 "ingressive": "aspect", # hāi/Namuyi 

6354 "experiential": "mood", # hāi/Namuyi 

6355 "premeditated": "mood", # hāi/Namuyi 

6356 "andative": "case", # motion away from something, nyanyi/Warlpiri 

6357 "nomic": "misc", # Warlpiri, no idea what it means. 

6358 "distant-imperfect-er": "tense", # être/Lorrain 

6359 "distant-imperfect-stab": "tense", # être/Lorrain 

6360 "near-imperfect": "tense", 

6361 "proximative": "case", # mahkwa/Fox, contrasted with obviative 

6362 "perlative": "case", # arnaq/Yup'ik 

6363 "gerund-temporal": "non-finite", # тодыны/Udmurt 

6364 "genitive-i": "case", # நத்தை/tamil 

6365 "genitive-ii": "case", 

6366 "locative-i": "case", 

6367 "locative-ii": "case", 

6368 "locative-iii": "case", 

6369 "locative-iv": "case", 

6370 "locative-v": "case", 

6371 "sociative-i": "case", 

6372 "sociative-ii": "case", 

6373 "gerund-i": "non-finite", # பிடி/Tamil 

6374 "gerund-ii": "non-finite", 

6375 "gerund-iii": "non-finite", 

6376 "effective": "aspect", 

6377 "affective": "voice", 

6378 "gerund-iv": "non-finite", # тодыны/Udmurt 

6379 "unwitnessed": "mood", # bolmak/Turkmen 

6380 "approximative-i": "case", # sugu/Veps 

6381 "approximative-ii": "case", # sugu/Veps 

6382 "terminative-i": "case", # sugu/Veps 

6383 "terminative-ii": "case", # sugu/Veps 

6384 "terminative-iii": "case", # sugu/Veps 

6385 "additive-i": "case", # sugu/Veps 

6386 "additive-ii": "case", # sugu/Veps 

6387 "suihortative": "mood", # ಹುಟ್ಟು/Kannada 

6388 "cohortative-i": "mood", # ಹುಟ್ಟು/Kannada 

6389 "cohortative-ii": "mood", # ಹುಟ್ಟು/Kannada 

6390 # цӏехуьл/Lezgi 

6391 "adelative": "case", 

6392 "addirective": "case", 

6393 "postessive": "case", 

6394 "postelative": "case", 

6395 "postdirective": "case", 

6396 "subessive": "case", 

6397 "subelative": "case", 

6398 "subdirective": "case", 

6399 "inelative": "case", 

6400 "superelative": "case", 

6401 "superdirective": "case", 

6402 "quantitative": "misc", # "how much" interrogative zenbat/Basque 

6403 # a ګړندی/Pashto 

6404 "oblique-i": "case", 

6405 "oblique-ii": "case", 

6406 "after-th": "misc", # wenyn/Cornish 

6407 # https://en.wiktionary.org/wiki/Appendix:Persian_ez%C3%A2fe 

6408 "ezafe": "misc", # izofa, ezâfé, райҳон/Tajik 

6409 "tri-plural": "number", # aaombiniili'/Chickasaw 

6410 "repeated": "misc", # coymaq/Crimean Tatar 

6411 "tu-derivative": "non-finite", # pawjō/Proto-Italic 

6412 "s-derivative": "non-finite", 

6413 # birciqqo/Sidamo 

6414 # In Sidamo, nouns have a form when they're modified by 

6415 # other words in an NP, and a form when they're not. 

6416 "with-modifier": "misc", 

6417 "without-modifier": "misc", 

6418 "inchoative": "aspect", 

6419 "series-i-verb-argument": "misc", # küm-/Maquiritari 

6420 "series-ii-verb-argument": "misc", 

6421 "patient-like": "misc", 

6422 "agent-like": "misc", 

6423 "object-dual": "number", 

6424 "object-exclusive": "person", 

6425 "ablative-i": "case", # хӏайван/Avar 

6426 "ablative-ii": "case", 

6427 "ablative-iii": "case", 

6428 "ablative-iv": "case", 

6429 "ablative-v": "case", 

6430 "translative-i": "case", 

6431 "translative-ii": "case", 

6432 "translative-iii": "case", 

6433 "translative-iv": "case", 

6434 "translative-v": "case", 

6435 "patient": "misc", 

6436 "conjectural": "mood", # 노타/Middle Korean 

6437 "adjective-from-verb": "derivation", 

6438 "anaphoric": "misc", # tꜣj/Egyptian 

6439 "distant-past": "tense", # Maquiritari, Mapudungun 

6440 "transitional-past": "tense", # тұту/Kazakh 

6441 "free-state": "misc", # aɣemmar/Tarifit 

6442 "proximal-to-speaker": "misc", # nꜣyw/Egyptian/38 

6443 "proximal-to-topic": "misc", 

6444 "by-personal-gender": "gender", # Italian has started to use 

6445 # "feminine or masculine, by sense" to mean "depending on the 

6446 # gender of the person". Bataglia/Italian 

6447 "toneless-final-syllable-variant": "misc", # zh-pron template stuff 

6448 # 食物/Chinese 

6449 "no-predicative-form": "misc", # diamanten/German 

6450 "feminine-plural": "gender", # Galician with different gender dep. on num. 

6451 "masculine-plural": "gender", 

6452 "collocation": "misc", 

6453 "comeronym": "misc", 

6454 # https://en.wiktionary.org/wiki/Template:vi-readings 

6455 "han-viet-reading": "misc", 

6456 "nom-reading": "misc", 

6457 "Traditional-Chinese": "script", 

6458 "Simplified-Chinese": "script", 

6459 "Second-Round-Simplified-Chinese": "script", 

6460 "Guangzhou-Cantonese": "script", 

6461 # "zh-pron" template 

6462 "phonetic": "misc", 

6463 # https://en.wiktionary.org/wiki/Template:ka-decl-noun 

6464 # some useful general "position" tags 

6465 # Because these postpositions don't seem to have any good 

6466 # single-word graecolatin terminology used for them 

6467 "on-position": "misc", 

6468 "near-position": "misc", 

6469 "in-position": "misc", 

6470 "like-position": "misc", 

6471 "for-position": "misc", 

6472 "towards-position": "misc", 

6473 "from-position": "misc", 

6474 "of-position": "misc", 

6475 "in-relation-to-position": "misc", 

6476 "since-position": "misc", 

6477 "together-with-position": "misc", 

6478 "up-to-position": "misc", 

6479 # "zh-dial" template 

6480 "Written-vernacular-Chinese": "script", 

6481 "Northeastern-Mandarin": "script", 

6482 "Jiaoliao-Mandarin": "script", 

6483 "Central-Plains-Mandarin": "script", 

6484 "Lanyin-Mandarin": "script", 

6485} 

6486 

# Import-time sanity check: every key of valid_tags must be a string and
# every value must be a category known to tag_categories.
for k, v in valid_tags.items():
    assert isinstance(k, str)
    if v in tag_categories:
        continue
    # Print the offending entry before the assertion below fails.
    print(
        "valid_tags[{!r}]={!r} - {!r} not in tag_categories!".format(k, v, v)
    )
    assert v in tag_categories

6496 

# Report (without failing) each form_of_tags entry that is not a key of
# valid_tags.
for tag in form_of_tags - set(valid_tags):
    print("tags.py:form_of_tags contains invalid tag {}".format(tag))

6499 

# Add a hyphenated variant of every uppercase tag to valid_tags.
for tag in uppercase_tags:
    # Each run of whitespace in the tag becomes a single hyphen.
    hyphenated = re.sub(r"\s+", "-", tag)
    if hyphenated in valid_tags:
        # Name the clashing tag before the assertion below fails.
        print(
            "DUPLICATE TAG: {} (from uppercase tag {!r})".format(
                hyphenated, tag
            )
        )
    assert hyphenated not in valid_tags
    # Might as well, while we're here: add the hyphenated location tag.
    valid_tags[hyphenated] = "dialect"

6511 

6512 

6513# Don't move this without notifying me, so that I can change an import in 

6514# the kaikki.org regen code 

def sort_tags(
    tags: list[str] | tuple[str, ...] | set[str],
) -> tuple[str, ...]:
    """Return the distinct tags in presentation order as a tuple.

    Each tag is ranked by the ``tag_categories`` value of the category that
    ``valid_tags`` assigns to it; higher ranks come first.  Among tags of
    equal rank, shorter tags come before longer ones, and tags that still
    tie are ordered alphabetically so the result never depends on set
    iteration order (which varies between runs under hash randomization).

    Args:
        tags: A list, tuple or set of tag strings.  Duplicates are removed.

    Returns:
        A tuple containing every distinct tag exactly once.
    """
    assert isinstance(tags, (list, tuple, set))

    def presentation_key(tag: str) -> tuple[float, str]:
        # Tags missing from valid_tags are looked up under the category
        # name "unknown"; categories missing from tag_categories rank 0.
        rank = tag_categories.get(valid_tags.get(tag, "unknown"), 0)
        # The length penalty puts shorter tags first within a rank.
        # NOTE(review): presumably ranks are integers, so the penalty
        # (< 1 for tags under 1000 characters) never crosses ranks - confirm.
        score = rank - len(tag) / 1000
        # Negate the score so that an ascending sort yields the highest
        # score first while the tag itself breaks ties in ascending order.
        return (-score, tag)

    return tuple(sorted(set(tags), key=presentation_key))

6528 )