Coverage for src/wiktextract/extractor/en/unsupported_titles.py: 100%

1 statements  

« prev     ^ index     » next       coverage.py v7.6.4, created at 2024-10-25 10:11 +0000

1# This file defines how titles beginning with "Unsupported titles/" are 

2# handled 

3# 

4# Copyright (c) 2020 Tatu Ylonen. See file LICENSE and https://ylonen.org 

5 

# Lookup table for pages whose real title cannot be used directly as a page
# name and is therefore filed under the "Unsupported titles/" prefix.
#
# Each key is a descriptive name (presumably the part of the page title that
# follows "Unsupported titles/" -- verify against the caller) and each value
# is the actual title text that the descriptive name stands for.
#
# Entries whose value is wrapped in square brackets (e.g. "[Cifrão]") are
# placeholders: the proper symbol is not written here, see the inline notes.
unsupported_title_map: dict[str, str] = {
    "Ancient Greek dish": "λοπαδο­τεμαχο­σελαχο­γαλεο­κρανιο­λειψανο­δριμυ­ποτριμματο­σιλφιο­καραβο­μελιτο­κατακεχυμενο­κιχλε­πικοσσυφο­φαττο­περιστερα­λεκτρυο­νοπτο­κεφαλλιο­κιγκλο­πελειο­λαγῳο­σιραιο­βαφητραγανοπτερύγων",
    "Australian Aboriginal Flag emoticon": "[-o-]",
    "Australian Aboriginal Flag emoticon alternative": "[-0-]",
    "C sharp": "C#",
    "C through N to K": "C|N>K",
    "Colon": ":",
    "Colon capital P": ":P",
    "Colon capital thorn": ":Þ",
    "Colon equals": ":=",
    "Colon hyphen left paren": ":-(",
    "Colon hyphen right paren": ":-)",
    "Colon left paren": ":(",
    "Colon right paren": ":)",
    "Colon slash": ":/",
    "Curly brackets": "{}",
    "Double colon": "::",
    "Double period": "..",
    "Enclosing colons": ": :",
    "Enclosing less than greater than": "< >",
    "Enclosing low lines": "_ _",
    "Enclosing number signs": "# #",
    "Enclosing vertical lines": "| |",
    "Equal greater than": "=>",
    "Equal less than": "=<",
    "Full stop": ".",
    "Greater than": ">",
    "Greater than equal": ">=",
    # The key spells out ">", "_", "<"; the value previously ended in "="
    # instead of "<", which did not match the described title.
    "Greater than low line less than": ">_<",
    "HTML comment": "<!-- -->",
    "HTML start tag end tag": "< > </ >",
    "Hyphen greater than": "->",
    "Hyphen vertical line vertical line hyphen": "-||-",
    "Left curly bracket": "{",
    "Left square bracket": "[",
    "Less than": "<",
    "Less than equal": "<=",
    "Less than greater than": "<>",
    "Less than hyphen": "<-",
    "Less than slash three": "</3",
    "Less than three": "<3",
    "Less than trailing slash greater than": "< />",
    "Low line": "_",
    "Low line interfix": "-_-",
    "MeToo": "#MeToo",
    "Number sign": "#",
    "Ogham space": " ",
    "Period slash period": "./.",
    "Replacement character": "�",
    "Right curly bracket": "}",
    "Right square bracket": "]",
    "S:t": "S:t",
    "S:ta": "S:ta",
    "Space": " ",
    "Square bracketed ellipsis": "[...]",
    "Square brackets": "[ ]",
    "Thai name of Bangkok": "กรุงเทพมหานคร อมรรัตนโกสินทร์ มหินทรายุธยา มหาดิลกภพ นพรัตนราชธานีบูรีรมย์ อุดมราชนิเวศน์มหาสถาน อมรพิมานอวตารสถิต สักกะทัตติยวิษณุกรรมประสิทธิ์",
    "Vertical line": "|",
    "c:a": "c:a",
    "eq space": "eq #",
    "g tag": "<g>",
    "hr space": "hr #",
    "n:a": "n:a",
    "n:o": "n:o",
    "n:r": "n:r",
    "s:a": "s:a",
    "st:a": "st:a",
    "v:a": "v:a",
    "n:s": "n:s",
    "о slash dot": "o/.",
    "hr number sign": "hr #",
    "eq number sign": "eq #",
    "Colon small p": ":p",
    "Cifrão": "[Cifrão]",  # Should be dollar sign with two vertical lines
    "Old Israeli shekel": "[Old Israeli shekel]",  # Should be the symbol
    "Colon three": ":3",
    "Amp": "&amp;",
    "Colon lowercase thorn": ":þ",
    "Colon left curly bracket": ":{",
    ":≠": ":≠",
}