[TASK] Extract displayCond functionality from FormEngine to new class
[Packages/TYPO3.CMS.git] / t3lib / unidata / Translit.txt
1
2 # Latin (iso-8859-1)
3
4 00A1; 0021;             INVERTED EXCLAMATION MARK => !
5 00A2; 0063 0065 006E 0074;      CENT SIGN => cent
6 00A3; 0070 006F 0075 006E 0064; POUND SIGN => pound
7 00A5; 0079 0065 006E;   YEN SIGN => yen
8 00A6; 007C;             BROKEN BAR => |
9 00AB; 003C 003C;        LEFT-POINTING DOUBLE ANGLE QUOTATION MARK => <<
10 00A9; 0028 0063 0029;   COPYRIGHT SIGN => (c)
11 00AE; 0028 0052 0029;   REGISTERED SIGN => (R)
12 00B1; 002B 002F 002D;   PLUS-MINUS SIGN => +/-
13 00B5; 0075;             MICRO SIGN => u (American style)
14 00B7; 002A;             MIDDLE DOT => *
15 00BB; 003E 003E;        RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK => >>
16 00BF; 003F;             INVERTED QUESTION MARK => ?
17 00C4; 0041 0045;        LATIN CAPITAL LETTER A WITH DIAERESIS => AE (German)
18 00C5; 0041 0041;        LATIN CAPITAL LETTER A WITH RING ABOVE => AA (Danish)
19 00C6; 0041 0045;        LATIN CAPITAL LETTER AE => AE (Danish)
20 00D0; 0044;             LATIN CAPITAL LETTER ETH => D (Icelandic)
21 00D6; 004F 0045;        LATIN CAPITAL LETTER O WITH DIAERESIS => OE (German)
22 00D7; 0078;             MULTIPLICATION SIGN => x
23 00D8; 004F 0045;        LATIN CAPITAL LETTER O WITH STROKE => OE (Danish)
24 00DC; 0055 0045;        LATIN CAPITAL LETTER U WITH DIAERESIS => UE (German)
25 00DE; 0054 0048;        LATIN CAPITAL LETTER THORN => TH (Icelandic)
26 00E4; 0061 0065;        LATIN SMALL LETTER A WITH DIAERESIS => ae (German)
27 00E5; 0061 0061;        LATIN SMALL LETTER A WITH RING ABOVE => aa (Danish)
28 00DF; 0073 0073;        LATIN SMALL LETTER SHARP S => ss (German)
29 00E6; 0061 0065;        LATIN SMALL LETTER AE => ae (Danish)
30 00F0; 0064;             LATIN SMALL LETTER ETH => d (Icelandic)
31 00F6; 006F 0065;        LATIN SMALL LETTER O WITH DIAERESIS => oe (German)
32 00F7; 002F;             DIVISION SIGN => /
33 00F8; 006F 0065;        LATIN SMALL LETTER O WITH STROKE => oe (Danish)
34 00FC; 0075 0065;        LATIN SMALL LETTER U WITH DIAERESIS => ue (German)
35 00FE; 0074 0068;        LATIN SMALL LETTER THORN => th (Icelandic)
36
37 # more Latin (windows-1252, windows-1254, windows-1257)
38
39 # Uncomment the following 8 lines if you want to double Latvian "long" letters
40 # in URLs (non-typical but worked this way prior to TYPO3 4.0)
41 #0100; 0041 0041;       LATIN CAPITAL LETTER A WITH MACRON => AA (Latvian)
42 #0101; 0061 0061;       LATIN SMALL LETTER A WITH MACRON => aa (Latvian)
43 #0112; 0045 0045;       LATIN CAPITAL LETTER E WITH MACRON => EE (Latvian)
44 #0113; 0065 0065;       LATIN SMALL LETTER E WITH MACRON => ee (Latvian)
45 #012A; 0049 0049;       LATIN CAPITAL LETTER I WITH MACRON => II (Latvian)
46 #012B; 0069 0069;       LATIN SMALL LETTER I WITH MACRON => ii (Latvian)
47 #016A; 0055 0055;       LATIN CAPITAL LETTER U WITH MACRON => UU (Latvian)
48 #016B; 0075 0075;       LATIN SMALL LETTER U WITH MACRON => uu (Latvian)
49
50 014C; 004F 004F;        LATIN CAPITAL LETTER O WITH MACRON => OO
51 014D; 006F 006F;        LATIN SMALL LETTER O WITH MACRON => oo
52 0131; 0069;             LATIN SMALL LETTER DOTLESS I => i (Turkish)
53 0152; 004F 0045;        LATIN CAPITAL LETTER OE => OE
54 0153; 006F 0065;        LATIN SMALL LETTER OE => oe
55 0192; 0066;             LATIN SMALL LETTER F WITH HOOK => f
56 02BC; 0027;             MODIFIER LETTER APOSTROPHE => '
57 02CA; 0027;             MODIFIER LETTER ACUTE ACCENT => '
58 2010; 002D;             HYPHEN => -
59 2011; 002D;             NON-BREAKING HYPHEN => -
60 2012; 002D;             FIGURE DASH => -
61 2013; 002D;             EN DASH => -
62 2014; 002D;             EM DASH => -
63 2015; 002D;             HORIZONTAL BAR => -
64 2018; 0060;             LEFT SINGLE QUOTATION MARK => `
65 2019; 0027;             RIGHT SINGLE QUOTATION MARK => '
66 201C; 0022;             LEFT DOUBLE QUOTATION MARK => "
67 201D; 0022;             RIGHT DOUBLE QUOTATION MARK => "
68 201E; 0022;             DOUBLE LOW-9 QUOTATION MARK => "
69 2022; 002A;             BULLET => *
70 2039; 003C;             SINGLE LEFT-POINTING ANGLE QUOTATION MARK => <
71 203A; 003E;             SINGLE RIGHT-POINTING ANGLE QUOTATION MARK => >
72 2044; 002F;             FRACTION SLASH => /
73 20A0; 0045 0055 0052;   EURO-CURRENCY SIGN => EUR
74 20AC; 0045 0055 0052;   EURO SIGN => EUR
75 2122; 0028 0054 004D 0029;              TRADE MARK SIGN => (TM)
76
77 # Greek transliteration
78
79 0370; 0048;                     GREEK CAPITAL LETTER HETA => H
80 0371; 0068;                     GREEK SMALL LETTER HETA => h
81 0374; 0027;                     GREEK UPPER NUMERAL SIGN => '
82 0375; 002C;                     GREEK LOWER NUMERAL SIGN => ,
83 037E; 003F;                     GREEK QUESTION MARK => ?
84 0384; 0027;                     GREEK TONOS => '
85 #0385;                          GREEK DIALYTIKA TONOS
86 0386; 0041;                     GREEK CAPITAL LETTER ALPHA WITH TONOS => A
87 0387; 002A;                     GREEK ANO TELEIA => *
88 0388; 0045;                     GREEK CAPITAL LETTER EPSILON WITH TONOS => E
89 0389; 0049;                     GREEK CAPITAL LETTER ETA WITH TONOS => I
90 038A; 0049;                     GREEK CAPITAL LETTER IOTA WITH TONOS => I
91 038C; 004F;                     GREEK CAPITAL LETTER OMICRON WITH TONOS => O
92 038E; 0059;                     GREEK CAPITAL LETTER UPSILON WITH TONOS => Y
93 038F; 004F;                     GREEK CAPITAL LETTER OMEGA WITH TONOS => O
94 0390; 0069;                     GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS => i
95 0391; 0041;                     GREEK CAPITAL LETTER ALPHA => A
96 0392; 0042;                     GREEK CAPITAL LETTER BETA => B (possibly V)
97 0393; 0047;                     GREEK CAPITAL LETTER GAMMA => G
98 0394; 0044;                     GREEK CAPITAL LETTER DELTA => D
99 0395; 0045;                     GREEK CAPITAL LETTER EPSILON => E
100 0396; 005A;                     GREEK CAPITAL LETTER ZETA => Z
101 0397; 0049;                     GREEK CAPITAL LETTER ETA => I
102 0398; 0054 0048;        GREEK CAPITAL LETTER THETA => TH
103 0399; 0049;                     GREEK CAPITAL LETTER IOTA => I
104 039A; 004B;                     GREEK CAPITAL LETTER KAPPA => K
105 039B; 004C;                     GREEK CAPITAL LETTER LAMDA => L
106 039C; 004D;                     GREEK CAPITAL LETTER MU => M
107 039D; 004E;                     GREEK CAPITAL LETTER NU => N
108 039E; 0058;                     GREEK CAPITAL LETTER XI => X (possibly KS 004B 0053)
109 039F; 004F;                     GREEK CAPITAL LETTER OMICRON => O
110 03A0; 0050;                     GREEK CAPITAL LETTER PI => P
111 03A1; 0052;                     GREEK CAPITAL LETTER RHO => R
112 03A3; 0053;                     GREEK CAPITAL LETTER SIGMA => S
113 03A4; 0054;                     GREEK CAPITAL LETTER TAU => T
114 03A5; 0059;                     GREEK CAPITAL LETTER UPSILON => Y
115 03A6; 0046;                     GREEK CAPITAL LETTER PHI => F
116 03A7; 0043 0048;        GREEK CAPITAL LETTER CHI => CH (possibly KH 0058 0048)
117 03A8; 0050 0053;        GREEK CAPITAL LETTER PSI => PS
118 03A9; 004F;                     GREEK CAPITAL LETTER OMEGA => O
119 03AA; 0049;                     GREEK CAPITAL LETTER IOTA WITH DIALYTIKA => I
120 03AB; 0059;                     GREEK CAPITAL LETTER UPSILON WITH DIALYTIKA => Y
121 03AC; 0061;                     GREEK SMALL LETTER ALPHA WITH TONOS => a
122 03AD; 0065;                     GREEK SMALL LETTER EPSILON WITH TONOS => e
123 03AE; 0069;                     GREEK SMALL LETTER ETA WITH TONOS => i
124 03AF; 0069;                     GREEK SMALL LETTER IOTA WITH TONOS => i
125
126 03B0; 0079;                     GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS => y
127 03B1; 0061;                     GREEK SMALL LETTER ALPHA => a
128 03B2; 0062;                     GREEK SMALL LETTER BETA => b
129 03B3; 0067;                     GREEK SMALL LETTER GAMMA => g
130 03B4; 0064;                     GREEK SMALL LETTER DELTA => d
131 03B5; 0065;                     GREEK SMALL LETTER EPSILON => e
132 03B6; 007A;                     GREEK SMALL LETTER ZETA => z
133 03B7; 0069;                     GREEK SMALL LETTER ETA => i
134 03B8; 0074 0068;        GREEK SMALL LETTER THETA => th
135 03B9; 0069;                     GREEK SMALL LETTER IOTA => i
136 03BA; 006B;                     GREEK SMALL LETTER KAPPA => k
137 03BB; 006C;                     GREEK SMALL LETTER LAMDA => l
138 03BC; 006D;                     GREEK SMALL LETTER MU => m
139 03BD; 006E;                     GREEK SMALL LETTER NU => n
140 03BE; 0078;                     GREEK SMALL LETTER XI => x (possibly ks: 006B 0073)
141 03BF; 006F;                     GREEK SMALL LETTER OMICRON => o
142 03C0; 0070;                     GREEK SMALL LETTER PI => p
143 03C1; 0072;                     GREEK SMALL LETTER RHO => r
144 03C2; 0073;                     GREEK SMALL LETTER FINAL SIGMA => s
145 03C3; 0073;                     GREEK SMALL LETTER SIGMA => s
146 03C4; 0074;                     GREEK SMALL LETTER TAU => t
147 03C5; 0079;                     GREEK SMALL LETTER UPSILON => y
148 03C6; 0066;                     GREEK SMALL LETTER PHI => f
149 03C7; 0063 0068;        GREEK SMALL LETTER CHI => ch (possibly kh: 006B 0068)
150 03C8; 0070 0073;        GREEK SMALL LETTER PSI => ps
151 03C9; 006F;                     GREEK SMALL LETTER OMEGA => o
152 03CA; 0069;                     GREEK SMALL LETTER IOTA WITH DIALYTIKA => i
153 03CB; 0079;                     GREEK SMALL LETTER UPSILON WITH DIALYTIKA => y
154 03CC; 006F;                     GREEK SMALL LETTER OMICRON WITH TONOS => o
155 03CD; 0079;                     GREEK SMALL LETTER UPSILON WITH TONOS => y
156 03CE; 006F;                     GREEK SMALL LETTER OMEGA WITH TONOS => o
157
158 # Cyrillic (Russian transliteration: modified GOST)
159
160 0401; 004A 004F;                CYRILLIC CAPITAL LETTER IO => JO
161 #0402; ;                        CYRILLIC CAPITAL LETTER DJE
162 #0403; ;                        CYRILLIC CAPITAL LETTER GJE
163 0404; 004A 0045;                CYRILLIC CAPITAL LETTER UKRAINIAN IE => JE
164 #0405; ;                        CYRILLIC CAPITAL LETTER DZE
165 0406; 0049;                     CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I => I
166 0407; 004A 0049;                CYRILLIC CAPITAL LETTER YI => JI
167 #0408; ;                        CYRILLIC CAPITAL LETTER JE ?? J
168 #0409; ;                        CYRILLIC CAPITAL LETTER LJE ?? LJ
169 #040A; ;                        CYRILLIC CAPITAL LETTER NJE ??  NJ
170 #040B; ;                        CYRILLIC CAPITAL LETTER TSHE ?? TSH
171 #040C; ;                        CYRILLIC CAPITAL LETTER KJE ?? KJ KY
172 040E; 0055;                     CYRILLIC CAPITAL LETTER SHORT U => U (Belorussian)
173 #040F; ;                        CYRILLIC CAPITAL LETTER DZHE ?? DZH
174 0410; 0041;                     CYRILLIC CAPITAL LETTER A => A
175 0411; 0042;                     CYRILLIC CAPITAL LETTER BE => B
176 0412; 0056;                     CYRILLIC CAPITAL LETTER VE => V
177 0413; 0047;                     CYRILLIC CAPITAL LETTER GHE => G
178 0414; 0044;                     CYRILLIC CAPITAL LETTER DE => D
179 0415; 0045;                     CYRILLIC CAPITAL LETTER IE => E
180 0416; 005A 0048;                CYRILLIC CAPITAL LETTER ZHE => ZH
181 0417; 005A;                     CYRILLIC CAPITAL LETTER ZE => Z
182 0418; 0049;                     CYRILLIC CAPITAL LETTER I => I
183 0419; 0049;                     CYRILLIC CAPITAL LETTER SHORT I => I (GOST has J)
184 041A; 004B;                     CYRILLIC CAPITAL LETTER KA => K
185 041B; 004C;                     CYRILLIC CAPITAL LETTER EL => L
186 041C; 004D;                     CYRILLIC CAPITAL LETTER EM => M
187 041D; 004E;                     CYRILLIC CAPITAL LETTER EN => N
188 041E; 004F;                     CYRILLIC CAPITAL LETTER O => O
189 041F; 0050;                     CYRILLIC CAPITAL LETTER PE => P
190 0420; 0052;                     CYRILLIC CAPITAL LETTER ER => R
191 0421; 0053;                     CYRILLIC CAPITAL LETTER ES => S
192 0422; 0054;                     CYRILLIC CAPITAL LETTER TE => T
193 0423; 0055;                     CYRILLIC CAPITAL LETTER U => U
194 0424; 0046;                     CYRILLIC CAPITAL LETTER EF => F
195 0425; 004B 0048;                CYRILLIC CAPITAL LETTER HA => KH
196 0426; 0043;                     CYRILLIC CAPITAL LETTER TSE => C
197 0427; 0043 0048;                CYRILLIC CAPITAL LETTER CHE => CH
198 0428; 0053 0048;                CYRILLIC CAPITAL LETTER SHA => SH
199 0429; 0053 0048 0043 0048;      CYRILLIC CAPITAL LETTER SHCHA => SHCH (GOST has SHH)
200 042A; ;                         CYRILLIC CAPITAL LETTER HARD SIGN => omit (GOST has ")
201 042B; 0059;                     CYRILLIC CAPITAL LETTER YERU => Y
202 042C; ;                         CYRILLIC CAPITAL LETTER SOFT SIGN => omit (GOST has ')
203 042D; 0045 0048;                CYRILLIC CAPITAL LETTER E => EH
204 042E; 004A 0055;                CYRILLIC CAPITAL LETTER YU => JU
205 042F; 004A 0041;                CYRILLIC CAPITAL LETTER YA => JA
206
207 0430; 0061;                     CYRILLIC SMALL LETTER A => a
208 0431; 0062;                     CYRILLIC SMALL LETTER BE => b
209 0432; 0076;                     CYRILLIC SMALL LETTER VE => v
210 0433; 0067;                     CYRILLIC SMALL LETTER GHE => g
211 0434; 0064;                     CYRILLIC SMALL LETTER DE => d
212 0435; 0065;                     CYRILLIC SMALL LETTER IE => e
213 0436; 007A 0068;                CYRILLIC SMALL LETTER ZHE => zh
214 0437; 007A;                     CYRILLIC SMALL LETTER ZE => z
215 0438; 0069;                     CYRILLIC SMALL LETTER I => i
216 0439; 0069;                     CYRILLIC SMALL LETTER SHORT I => i (GOST has j)
217 043A; 006B;                     CYRILLIC SMALL LETTER KA => k
218 043B; 006C;                     CYRILLIC SMALL LETTER EL => l
219 043C; 006D;                     CYRILLIC SMALL LETTER EM => m
220 043D; 006E;                     CYRILLIC SMALL LETTER EN => n
221 043E; 006F;                     CYRILLIC SMALL LETTER O => o
222 043F; 0070;                     CYRILLIC SMALL LETTER PE => p
223 0440; 0072;                     CYRILLIC SMALL LETTER ER => r
224 0441; 0073;                     CYRILLIC SMALL LETTER ES => s
225 0442; 0074;                     CYRILLIC SMALL LETTER TE => t
226 0443; 0075;                     CYRILLIC SMALL LETTER U => u
227 0444; 0066;                     CYRILLIC SMALL LETTER EF => f
228 0445; 006B 0068;                CYRILLIC SMALL LETTER HA => kh
229 0446; 0063;                     CYRILLIC SMALL LETTER TSE => c
230 0447; 0063 0068;                CYRILLIC SMALL LETTER CHE => ch
231 0448; 0073 0068;                CYRILLIC SMALL LETTER SHA => sh
232 0449; 0073 0068 0063 0068;      CYRILLIC SMALL LETTER SHCHA => shch (GOST has shh)
233 044A; ;                         CYRILLIC SMALL LETTER HARD SIGN => omit (GOST has ")
234 044B; 0079;                     CYRILLIC SMALL LETTER YERU => y
235 044C; ;                         CYRILLIC SMALL LETTER SOFT SIGN => omit (GOST has ')
236 044D; 0065 0068;                CYRILLIC SMALL LETTER E => eh
237 044E; 006A 0075;                CYRILLIC SMALL LETTER YU => ju
238 044F; 006A 0061;                CYRILLIC SMALL LETTER YA => ja
239 0451; 006A 006F;                CYRILLIC SMALL LETTER IO => jo
240 #0452; ;                        CYRILLIC SMALL LETTER DJE => dj dy ??
241 #0453; ;                        CYRILLIC SMALL LETTER GJE => gj gy ??
242 0454; 006A 0065;                CYRILLIC SMALL LETTER UKRAINIAN IE => je
243 #0455; ;                        CYRILLIC SMALL LETTER DZE => dz ??
244 0456; 0069;                     CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I => i
245 0457; 006A 0069;                CYRILLIC SMALL LETTER YI => ji
246 #0458; ;                        CYRILLIC SMALL LETTER JE ?? j y
247 #0459; ;                        CYRILLIC SMALL LETTER LJE ?? lj ly
248 #045A; ;                        CYRILLIC SMALL LETTER NJE ?? nj ny
249 #045B; ;                        CYRILLIC SMALL LETTER TSHE => ??? tsh ch (Serbocroatian)
250 #045C; ;                        CYRILLIC SMALL LETTER KJE
251 045E; 0075;                     CYRILLIC SMALL LETTER SHORT U => u (Belorussian)
252 #045F; ;                        CYRILLIC SMALL LETTER DZHE ???
253
254 0490; 0047 0047;                CYRILLIC CAPITAL LETTER GHE WITH UPTURN => GG (Belorussian, Ukrainian)
255 0491; 0067 0067;                CYRILLIC SMALL LETTER GHE WITH UPTURN => gg (Belorussian, Ukrainian)
256
257 # Hebrew
258
259 #05B0; ;                HEBREW POINT SHEVA ??? win1255
260 #05B1; ;                HEBREW POINT HATAF SEGOL ??? win1255
261 #05B2; ;                HEBREW POINT HATAF PATAH ??? win1255
262 #05B3; ;                HEBREW POINT HATAF QAMATS ??? win1255
263 #05B4; ;                HEBREW POINT HIRIQ ??? win1255
264 #05B5; ;                HEBREW POINT TSERE ??? win1255
265 #05B6; ;                HEBREW POINT SEGOL ??? win1255
266 #05B7; ;                HEBREW POINT PATAH ??? win1255
267 #05B8; ;                HEBREW POINT QAMATS ??? win1255
268 #05B9; ;                HEBREW POINT HOLAM ??? win1255
269 #05BB; ;                HEBREW POINT QUBUTS ??? win1255
270 #05BC; ;                HEBREW POINT DAGESH OR MAPIQ ??? win1255
271 #05BD; ;                HEBREW POINT METEG ??? win1255
272 #05BE; ;                HEBREW PUNCTUATION MAQAF ??? win1255
273 #05BF; ;                HEBREW POINT RAFE ??? win1255
274 #05C0; ;                HEBREW PUNCTUATION PASEQ ??? win1255
275 #05C1; ;                HEBREW POINT SHIN DOT ??? win1255
276 #05C2; ;                HEBREW POINT SIN DOT ??? win1255
277 05D0; 0061;             HEBREW LETTER ALEF => a
278 05D1; 0062;             HEBREW LETTER BET => b
279 05D2; 0067;             HEBREW LETTER GIMEL => g
280 05D3; 0064;             HEBREW LETTER DALET => d
281 05D4; 0068 0061;        HEBREW LETTER HEI => ha
282 05D5; 006F;             HEBREW LETTER VAV => o
283 05D6; 007A;             HEBREW LETTER ZAYIN => z
284 05D7; 0068;             HEBREW LETTER HET => h
285 05D8; 0074;             HEBREW LETTER TET => t
286 05D9; 0069;             HEBREW LETTER YOD => i
287 05DA; 006B 0068;        HEBREW LETTER FINAL KAF HAF => kh
288 05DB; 006B;             HEBREW LETTER KAF HAF => k
289 05DC; 006C;             HEBREW LETTER LAMED => l
290 05DD; 006D;             HEBREW LETTER FINAL MEM => m
291 05DE; 006D;             HEBREW LETTER MEM => m
292 05DF; 006E;             HEBREW LETTER FINAL NUN => n
293 05E0; 006E;             HEBREW LETTER NUN => n
294 05E1; 0073;             HEBREW LETTER SAMEKH => s
295 05E2; 0061;             HEBREW LETTER AYIN => a
296 05E3; 0066;             HEBREW LETTER FINAL PE => f
297 05E4; 0066;             HEBREW LETTER PE => f
298 05E5; 0074 007A;        HEBREW LETTER FINAL TSADI => tz
299 05E6; 0074 007A;        HEBREW LETTER TSADI => tz
300 05E7; 006B;             HEBREW LETTER QOF => k
301 05E8; 0072;             HEBREW LETTER RESH => r
302 05E9; 0073 0068;        HEBREW LETTER SHIN => sh
303 05EA; 0074;             HEBREW LETTER TAV => t
304 05F0; 0076;             HEBREW LIGATURE YIDDISH DOUBLE VAV => v
305 #05F1; ;                HEBREW LIGATURE YIDDISH VAV YOD ??? win1255
306 #05F2; ;                HEBREW LIGATURE YIDDISH DOUBLE YOD ??? win1255
307 #05F3; ;                HEBREW PUNCTUATION GERESH ??? win1255
308 #05F4; ;                HEBREW PUNCTUATION GERSHAYIM ??? win1255
309
310 #20AA; 004E 0049 0053;          NEW SHEQEL SIGN => NIS