|
# Auto-generated by Tools/scripts/generate_re_casefix.py.

# Maps the code point of a lowercase character to the code points of the
# *other* lowercase characters that have the same uppercase form.
#
# Layout:
#   * key   -- int code point of a lowercase character;
#   * value -- tuple of int code points, never containing the key itself.
# Keys are listed in ascending code point order and the table is symmetric:
# if B appears in the tuple for A, then A appears in the tuple for B.
#
# Each entry is preceded by a comment giving the Unicode character names
# ("KEY NAME: OTHER NAME, ...") and followed by the characters themselves.
# Some paired characters render with the same glyph (for example
# 0x0390 / 0x1fd3), so the hexadecimal code points and the character names
# are authoritative, not the rendered glyphs.
_EXTRA_CASES = {
    # LATIN SMALL LETTER I: LATIN SMALL LETTER DOTLESS I
    0x0069: (0x0131,), # 'i': 'ı'
    # LATIN SMALL LETTER S: LATIN SMALL LETTER LONG S
    0x0073: (0x017f,), # 's': 'ſ'
    # MICRO SIGN: GREEK SMALL LETTER MU
    0x00b5: (0x03bc,), # 'µ': 'μ'
    # LATIN SMALL LETTER DOTLESS I: LATIN SMALL LETTER I
    0x0131: (0x0069,), # 'ı': 'i'
    # LATIN SMALL LETTER LONG S: LATIN SMALL LETTER S
    0x017f: (0x0073,), # 'ſ': 's'
    # COMBINING GREEK YPOGEGRAMMENI: GREEK SMALL LETTER IOTA, GREEK PROSGEGRAMMENI
    0x0345: (0x03b9, 0x1fbe), # '\u0345': 'ιι'
    # GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS: GREEK SMALL LETTER IOTA WITH DIALYTIKA AND OXIA
    0x0390: (0x1fd3,), # 'ΐ': 'ΐ'
    # GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS: GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND OXIA
    0x03b0: (0x1fe3,), # 'ΰ': 'ΰ'
    # GREEK SMALL LETTER BETA: GREEK BETA SYMBOL
    0x03b2: (0x03d0,), # 'β': 'ϐ'
    # GREEK SMALL LETTER EPSILON: GREEK LUNATE EPSILON SYMBOL
    0x03b5: (0x03f5,), # 'ε': 'ϵ'
    # GREEK SMALL LETTER THETA: GREEK THETA SYMBOL
    0x03b8: (0x03d1,), # 'θ': 'ϑ'
    # GREEK SMALL LETTER IOTA: COMBINING GREEK YPOGEGRAMMENI, GREEK PROSGEGRAMMENI
    0x03b9: (0x0345, 0x1fbe), # 'ι': '\u0345ι'
    # GREEK SMALL LETTER KAPPA: GREEK KAPPA SYMBOL
    0x03ba: (0x03f0,), # 'κ': 'ϰ'
    # GREEK SMALL LETTER MU: MICRO SIGN
    0x03bc: (0x00b5,), # 'μ': 'µ'
    # GREEK SMALL LETTER PI: GREEK PI SYMBOL
    0x03c0: (0x03d6,), # 'π': 'ϖ'
    # GREEK SMALL LETTER RHO: GREEK RHO SYMBOL
    0x03c1: (0x03f1,), # 'ρ': 'ϱ'
    # GREEK SMALL LETTER FINAL SIGMA: GREEK SMALL LETTER SIGMA
    0x03c2: (0x03c3,), # 'ς': 'σ'
    # GREEK SMALL LETTER SIGMA: GREEK SMALL LETTER FINAL SIGMA
    0x03c3: (0x03c2,), # 'σ': 'ς'
    # GREEK SMALL LETTER PHI: GREEK PHI SYMBOL
    0x03c6: (0x03d5,), # 'φ': 'ϕ'
    # GREEK BETA SYMBOL: GREEK SMALL LETTER BETA
    0x03d0: (0x03b2,), # 'ϐ': 'β'
    # GREEK THETA SYMBOL: GREEK SMALL LETTER THETA
    0x03d1: (0x03b8,), # 'ϑ': 'θ'
    # GREEK PHI SYMBOL: GREEK SMALL LETTER PHI
    0x03d5: (0x03c6,), # 'ϕ': 'φ'
    # GREEK PI SYMBOL: GREEK SMALL LETTER PI
    0x03d6: (0x03c0,), # 'ϖ': 'π'
    # GREEK KAPPA SYMBOL: GREEK SMALL LETTER KAPPA
    0x03f0: (0x03ba,), # 'ϰ': 'κ'
    # GREEK RHO SYMBOL: GREEK SMALL LETTER RHO
    0x03f1: (0x03c1,), # 'ϱ': 'ρ'
    # GREEK LUNATE EPSILON SYMBOL: GREEK SMALL LETTER EPSILON
    0x03f5: (0x03b5,), # 'ϵ': 'ε'
    # CYRILLIC SMALL LETTER VE: CYRILLIC SMALL LETTER ROUNDED VE
    0x0432: (0x1c80,), # 'в': 'ᲀ'
    # CYRILLIC SMALL LETTER DE: CYRILLIC SMALL LETTER LONG-LEGGED DE
    0x0434: (0x1c81,), # 'д': 'ᲁ'
    # CYRILLIC SMALL LETTER O: CYRILLIC SMALL LETTER NARROW O
    0x043e: (0x1c82,), # 'о': 'ᲂ'
    # CYRILLIC SMALL LETTER ES: CYRILLIC SMALL LETTER WIDE ES
    0x0441: (0x1c83,), # 'с': 'ᲃ'
    # CYRILLIC SMALL LETTER TE: CYRILLIC SMALL LETTER TALL TE, CYRILLIC SMALL LETTER THREE-LEGGED TE
    0x0442: (0x1c84, 0x1c85), # 'т': 'ᲄᲅ'
    # CYRILLIC SMALL LETTER HARD SIGN: CYRILLIC SMALL LETTER TALL HARD SIGN
    0x044a: (0x1c86,), # 'ъ': 'ᲆ'
    # CYRILLIC SMALL LETTER YAT: CYRILLIC SMALL LETTER TALL YAT
    0x0463: (0x1c87,), # 'ѣ': 'ᲇ'
    # CYRILLIC SMALL LETTER ROUNDED VE: CYRILLIC SMALL LETTER VE
    0x1c80: (0x0432,), # 'ᲀ': 'в'
    # CYRILLIC SMALL LETTER LONG-LEGGED DE: CYRILLIC SMALL LETTER DE
    0x1c81: (0x0434,), # 'ᲁ': 'д'
    # CYRILLIC SMALL LETTER NARROW O: CYRILLIC SMALL LETTER O
    0x1c82: (0x043e,), # 'ᲂ': 'о'
    # CYRILLIC SMALL LETTER WIDE ES: CYRILLIC SMALL LETTER ES
    0x1c83: (0x0441,), # 'ᲃ': 'с'
    # CYRILLIC SMALL LETTER TALL TE: CYRILLIC SMALL LETTER TE, CYRILLIC SMALL LETTER THREE-LEGGED TE
    0x1c84: (0x0442, 0x1c85), # 'ᲄ': 'тᲅ'
    # CYRILLIC SMALL LETTER THREE-LEGGED TE: CYRILLIC SMALL LETTER TE, CYRILLIC SMALL LETTER TALL TE
    0x1c85: (0x0442, 0x1c84), # 'ᲅ': 'тᲄ'
    # CYRILLIC SMALL LETTER TALL HARD SIGN: CYRILLIC SMALL LETTER HARD SIGN
    0x1c86: (0x044a,), # 'ᲆ': 'ъ'
    # CYRILLIC SMALL LETTER TALL YAT: CYRILLIC SMALL LETTER YAT
    0x1c87: (0x0463,), # 'ᲇ': 'ѣ'
    # CYRILLIC SMALL LETTER UNBLENDED UK: CYRILLIC SMALL LETTER MONOGRAPH UK
    0x1c88: (0xa64b,), # 'ᲈ': 'ꙋ'
    # LATIN SMALL LETTER S WITH DOT ABOVE: LATIN SMALL LETTER LONG S WITH DOT ABOVE
    0x1e61: (0x1e9b,), # 'ṡ': 'ẛ'
    # LATIN SMALL LETTER LONG S WITH DOT ABOVE: LATIN SMALL LETTER S WITH DOT ABOVE
    0x1e9b: (0x1e61,), # 'ẛ': 'ṡ'
    # GREEK PROSGEGRAMMENI: COMBINING GREEK YPOGEGRAMMENI, GREEK SMALL LETTER IOTA
    0x1fbe: (0x0345, 0x03b9), # 'ι': '\u0345ι'
    # GREEK SMALL LETTER IOTA WITH DIALYTIKA AND OXIA: GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS
    0x1fd3: (0x0390,), # 'ΐ': 'ΐ'
    # GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND OXIA: GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS
    0x1fe3: (0x03b0,), # 'ΰ': 'ΰ'
    # CYRILLIC SMALL LETTER MONOGRAPH UK: CYRILLIC SMALL LETTER UNBLENDED UK
    0xa64b: (0x1c88,), # 'ꙋ': 'ᲈ'
    # LATIN SMALL LIGATURE LONG S T: LATIN SMALL LIGATURE ST
    0xfb05: (0xfb06,), # 'ſt': 'st'
    # LATIN SMALL LIGATURE ST: LATIN SMALL LIGATURE LONG S T
    0xfb06: (0xfb05,), # 'st': 'ſt'
}
0 commit comments