summaryrefslogtreecommitdiffstats
path: root/tools/encoding/macCentEuro.txt
blob: e6507d63f2cd965f09e6c1f78026e8a739d82124 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
#=======================================================================
#   FTP file name:  CENTEURO.TXT
#
#   Contents:       Map (external version) from Mac OS Central European
#                   character set to Unicode 2.1
#
#   Copyright:      (c) 1995-1999 by Apple Computer, Inc., all rights
#                   reserved.
#
#   Contact:        charsets@apple.com
#
#   Changes:
#
#       b02  1999-Sep-22    Update contact e-mail address. Matches
#                           internal utom<b1>, ufrm<b1>, and Text
#                           Encoding Converter version 1.5.
#       n05  1998-Feb-05    Update header comments to new format; no
#                           mapping changes.  Matches internal utom<n3>,
#                           ufrm<n13>, and Text Encoding Converter
#                           version 1.3.
#       n03  1995-Apr-15    First version (after fixing some typos).
#                           Matches internal ufrm<n5>.
#
# Standard header:
# ----------------
#
#   Apple, the Apple logo, and Macintosh are trademarks of Apple
#   Computer, Inc., registered in the United States and other countries.
#   Unicode is a trademark of Unicode Inc. For the sake of brevity,
#   throughout this document, "Macintosh" can be used to refer to
#   Macintosh computers and "Unicode" can be used to refer to the
#   Unicode standard.
#
#   Apple makes no warranty or representation, either express or
#   implied, with respect to these tables, their quality, accuracy, or
#   fitness for a particular purpose. In no event will Apple be liable
#   for direct, indirect, special, incidental, or consequential damages 
#   resulting from any defect or inaccuracy in this document or the
#   accompanying tables.
#
#   These mapping tables and character lists are subject to change.
#   The latest tables should be available from the following:
#
#   <ftp://ftp.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#   <ftp://dev.apple.com/devworld/Technical_Documentation/Misc._Standards/>
#
#   For general information about Mac OS encodings and these mapping
#   tables, see the file "README.TXT".
#
# Format:
# -------
#
#   Three tab-separated columns;
#   '#' begins a comment which continues to the end of the line.
#     Column #1 is the Mac OS Central European code (in hex as 0xNN)
#     Column #2 is the corresponding Unicode (in hex as 0xNNNN)
#     Column #3 is a comment containing the Unicode name
#
#   The entries are in Mac OS Central European code order.
#
#   Control character mappings are not shown in this table, following
#   the conventions of the standard UTC mapping tables. However, the
#   Mac OS Central European character set uses the standard control
#   characters at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Central European:
# ---------------------------------
#
#   This character set is intended to cover the following languages:
#
#   Polish, Czech, Slovak, Hungarian, Estonian, Latvian, Lithuanian
#
#   These are written in Latin script, but using a different set of
#   of accented characters than Mac OS Roman. The Mac OS Central
#   European character set also includes a number of characters
#   needed for the Mac OS user interface and localization (e.g.
#   ellipsis, bullet, copyright sign), several typographic
#   punctuation symbols, math symbols, etc. However, it has a
#   smaller set of punctuation and symbols than Mac OS Roman. All of
#   the characters in Mac OS Central European that are also in the
#   Mac OS Roman character set are at the same code point in both
#   character sets; this improves application compatibility.
#
#   Note: This does not have the same letter repertoire as ISO
#   8859-2 (Latin-2); each has some accented letters that the other
#   does not have.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# Details of mapping changes in each version:
# -------------------------------------------
#
##################

0x20	0x0020	# SPACE
0x21	0x0021	# EXCLAMATION MARK
0x22	0x0022	# QUOTATION MARK
0x23	0x0023	# NUMBER SIGN
0x24	0x0024	# DOLLAR SIGN
0x25	0x0025	# PERCENT SIGN
0x26	0x0026	# AMPERSAND
0x27	0x0027	# APOSTROPHE
0x28	0x0028	# LEFT PARENTHESIS
0x29	0x0029	# RIGHT PARENTHESIS
0x2A	0x002A	# ASTERISK
0x2B	0x002B	# PLUS SIGN
0x2C	0x002C	# COMMA
0x2D	0x002D	# HYPHEN-MINUS
0x2E	0x002E	# FULL STOP
0x2F	0x002F	# SOLIDUS
0x30	0x0030	# DIGIT ZERO
0x31	0x0031	# DIGIT ONE
0x32	0x0032	# DIGIT TWO
0x33	0x0033	# DIGIT THREE
0x34	0x0034	# DIGIT FOUR
0x35	0x0035	# DIGIT FIVE
0x36	0x0036	# DIGIT SIX
0x37	0x0037	# DIGIT SEVEN
0x38	0x0038	# DIGIT EIGHT
0x39	0x0039	# DIGIT NINE
0x3A	0x003A	# COLON
0x3B	0x003B	# SEMICOLON
0x3C	0x003C	# LESS-THAN SIGN
0x3D	0x003D	# EQUALS SIGN
0x3E	0x003E	# GREATER-THAN SIGN
0x3F	0x003F	# QUESTION MARK
0x40	0x0040	# COMMERCIAL AT
0x41	0x0041	# LATIN CAPITAL LETTER A
0x42	0x0042	# LATIN CAPITAL LETTER B
0x43	0x0043	# LATIN CAPITAL LETTER C
0x44	0x0044	# LATIN CAPITAL LETTER D
0x45	0x0045	# LATIN CAPITAL LETTER E
0x46	0x0046	# LATIN CAPITAL LETTER F
0x47	0x0047	# LATIN CAPITAL LETTER G
0x48	0x0048	# LATIN CAPITAL LETTER H
0x49	0x0049	# LATIN CAPITAL LETTER I
0x4A	0x004A	# LATIN CAPITAL LETTER J
0x4B	0x004B	# LATIN CAPITAL LETTER K
0x4C	0x004C	# LATIN CAPITAL LETTER L
0x4D	0x004D	# LATIN CAPITAL LETTER M
0x4E	0x004E	# LATIN CAPITAL LETTER N
0x4F	0x004F	# LATIN CAPITAL LETTER O
0x50	0x0050	# LATIN CAPITAL LETTER P
0x51	0x0051	# LATIN CAPITAL LETTER Q
0x52	0x0052	# LATIN CAPITAL LETTER R
0x53	0x0053	# LATIN CAPITAL LETTER S
0x54	0x0054	# LATIN CAPITAL LETTER T
0x55	0x0055	# LATIN CAPITAL LETTER U
0x56	0x0056	# LATIN CAPITAL LETTER V
0x57	0x0057	# LATIN CAPITAL LETTER W
0x58	0x0058	# LATIN CAPITAL LETTER X
0x59	0x0059	# LATIN CAPITAL LETTER Y
0x5A	0x005A	# LATIN CAPITAL LETTER Z
0x5B	0x005B	# LEFT SQUARE BRACKET
0x5C	0x005C	# REVERSE SOLIDUS
0x5D	0x005D	# RIGHT SQUARE BRACKET
0x5E	0x005E	# CIRCUMFLEX ACCENT
0x5F	0x005F	# LOW LINE
0x60	0x0060	# GRAVE ACCENT
0x61	0x0061	# LATIN SMALL LETTER A
0x62	0x0062	# LATIN SMALL LETTER B
0x63	0x0063	# LATIN SMALL LETTER C
0x64	0x0064	# LATIN SMALL LETTER D
0x65	0x0065	# LATIN SMALL LETTER E
0x66	0x0066	# LATIN SMALL LETTER F
0x67	0x0067	# LATIN SMALL LETTER G
0x68	0x0068	# LATIN SMALL LETTER H
0x69	0x0069	# LATIN SMALL LETTER I
0x6A	0x006A	# LATIN SMALL LETTER J
0x6B	0x006B	# LATIN SMALL LETTER K
0x6C	0x006C	# LATIN SMALL LETTER L
0x6D	0x006D	# LATIN SMALL LETTER M
0x6E	0x006E	# LATIN SMALL LETTER N
0x6F	0x006F	# LATIN SMALL LETTER O
0x70	0x0070	# LATIN SMALL LETTER P
0x71	0x0071	# LATIN SMALL LETTER Q
0x72	0x0072	# LATIN SMALL LETTER R
0x73	0x0073	# LATIN SMALL LETTER S
0x74	0x0074	# LATIN SMALL LETTER T
0x75	0x0075	# LATIN SMALL LETTER U
0x76	0x0076	# LATIN SMALL LETTER V
0x77	0x0077	# LATIN SMALL LETTER W
0x78	0x0078	# LATIN SMALL LETTER X
0x79	0x0079	# LATIN SMALL LETTER Y
0x7A	0x007A	# LATIN SMALL LETTER Z
0x7B	0x007B	# LEFT CURLY BRACKET
0x7C	0x007C	# VERTICAL LINE
0x7D	0x007D	# RIGHT CURLY BRACKET
0x7E	0x007E	# TILDE
#
0x80	0x00C4	# LATIN CAPITAL LETTER A WITH DIAERESIS
0x81	0x0100	# LATIN CAPITAL LETTER A WITH MACRON
0x82	0x0101	# LATIN SMALL LETTER A WITH MACRON
0x83	0x00C9	# LATIN CAPITAL LETTER E WITH ACUTE
0x84	0x0104	# LATIN CAPITAL LETTER A WITH OGONEK
0x85	0x00D6	# LATIN CAPITAL LETTER O WITH DIAERESIS
0x86	0x00DC	# LATIN CAPITAL LETTER U WITH DIAERESIS
0x87	0x00E1	# LATIN SMALL LETTER A WITH ACUTE
0x88	0x0105	# LATIN SMALL LETTER A WITH OGONEK
0x89	0x010C	# LATIN CAPITAL LETTER C WITH CARON
0x8A	0x00E4	# LATIN SMALL LETTER A WITH DIAERESIS
0x8B	0x010D	# LATIN SMALL LETTER C WITH CARON
0x8C	0x0106	# LATIN CAPITAL LETTER C WITH ACUTE
0x8D	0x0107	# LATIN SMALL LETTER C WITH ACUTE
0x8E	0x00E9	# LATIN SMALL LETTER E WITH ACUTE
0x8F	0x0179	# LATIN CAPITAL LETTER Z WITH ACUTE
0x90	0x017A	# LATIN SMALL LETTER Z WITH ACUTE
0x91	0x010E	# LATIN CAPITAL LETTER D WITH CARON
0x92	0x00ED	# LATIN SMALL LETTER I WITH ACUTE
0x93	0x010F	# LATIN SMALL LETTER D WITH CARON
0x94	0x0112	# LATIN CAPITAL LETTER E WITH MACRON
0x95	0x0113	# LATIN SMALL LETTER E WITH MACRON
0x96	0x0116	# LATIN CAPITAL LETTER E WITH DOT ABOVE
0x97	0x00F3	# LATIN SMALL LETTER O WITH ACUTE
0x98	0x0117	# LATIN SMALL LETTER E WITH DOT ABOVE
0x99	0x00F4	# LATIN SMALL LETTER O WITH CIRCUMFLEX
0x9A	0x00F6	# LATIN SMALL LETTER O WITH DIAERESIS
0x9B	0x00F5	# LATIN SMALL LETTER O WITH TILDE
0x9C	0x00FA	# LATIN SMALL LETTER U WITH ACUTE
0x9D	0x011A	# LATIN CAPITAL LETTER E WITH CARON
0x9E	0x011B	# LATIN SMALL LETTER E WITH CARON
0x9F	0x00FC	# LATIN SMALL LETTER U WITH DIAERESIS
0xA0	0x2020	# DAGGER
0xA1	0x00B0	# DEGREE SIGN
0xA2	0x0118	# LATIN CAPITAL LETTER E WITH OGONEK
0xA3	0x00A3	# POUND SIGN
0xA4	0x00A7	# SECTION SIGN
0xA5	0x2022	# BULLET
0xA6	0x00B6	# PILCROW SIGN
0xA7	0x00DF	# LATIN SMALL LETTER SHARP S
0xA8	0x00AE	# REGISTERED SIGN
0xA9	0x00A9	# COPYRIGHT SIGN
0xAA	0x2122	# TRADE MARK SIGN
0xAB	0x0119	# LATIN SMALL LETTER E WITH OGONEK
0xAC	0x00A8	# DIAERESIS
0xAD	0x2260	# NOT EQUAL TO
0xAE	0x0123	# LATIN SMALL LETTER G WITH CEDILLA
0xAF	0x012E	# LATIN CAPITAL LETTER I WITH OGONEK
0xB0	0x012F	# LATIN SMALL LETTER I WITH OGONEK
0xB1	0x012A	# LATIN CAPITAL LETTER I WITH MACRON
0xB2	0x2264	# LESS-THAN OR EQUAL TO
0xB3	0x2265	# GREATER-THAN OR EQUAL TO
0xB4	0x012B	# LATIN SMALL LETTER I WITH MACRON
0xB5	0x0136	# LATIN CAPITAL LETTER K WITH CEDILLA
0xB6	0x2202	# PARTIAL DIFFERENTIAL
0xB7	0x2211	# N-ARY SUMMATION
0xB8	0x0142	# LATIN SMALL LETTER L WITH STROKE
0xB9	0x013B	# LATIN CAPITAL LETTER L WITH CEDILLA
0xBA	0x013C	# LATIN SMALL LETTER L WITH CEDILLA
0xBB	0x013D	# LATIN CAPITAL LETTER L WITH CARON
0xBC	0x013E	# LATIN SMALL LETTER L WITH CARON
0xBD	0x0139	# LATIN CAPITAL LETTER L WITH ACUTE
0xBE	0x013A	# LATIN SMALL LETTER L WITH ACUTE
0xBF	0x0145	# LATIN CAPITAL LETTER N WITH CEDILLA
0xC0	0x0146	# LATIN SMALL LETTER N WITH CEDILLA
0xC1	0x0143	# LATIN CAPITAL LETTER N WITH ACUTE
0xC2	0x00AC	# NOT SIGN
0xC3	0x221A	# SQUARE ROOT
0xC4	0x0144	# LATIN SMALL LETTER N WITH ACUTE
0xC5	0x0147	# LATIN CAPITAL LETTER N WITH CARON
0xC6	0x2206	# INCREMENT
0xC7	0x00AB	# LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
0xC8	0x00BB	# RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
0xC9	0x2026	# HORIZONTAL ELLIPSIS
0xCA	0x00A0	# NO-BREAK SPACE
0xCB	0x0148	# LATIN SMALL LETTER N WITH CARON
0xCC	0x0150	# LATIN CAPITAL LETTER O WITH DOUBLE ACUTE
0xCD	0x00D5	# LATIN CAPITAL LETTER O WITH TILDE
0xCE	0x0151	# LATIN SMALL LETTER O WITH DOUBLE ACUTE
0xCF	0x014C	# LATIN CAPITAL LETTER O WITH MACRON
0xD0	0x2013	# EN DASH
0xD1	0x2014	# EM DASH
0xD2	0x201C	# LEFT DOUBLE QUOTATION MARK
0xD3	0x201D	# RIGHT DOUBLE QUOTATION MARK
0xD4	0x2018	# LEFT SINGLE QUOTATION MARK
0xD5	0x2019	# RIGHT SINGLE QUOTATION MARK
0xD6	0x00F7	# DIVISION SIGN
0xD7	0x25CA	# LOZENGE
0xD8	0x014D	# LATIN SMALL LETTER O WITH MACRON
0xD9	0x0154	# LATIN CAPITAL LETTER R WITH ACUTE
0xDA	0x0155	# LATIN SMALL LETTER R WITH ACUTE
0xDB	0x0158	# LATIN CAPITAL LETTER R WITH CARON
0xDC	0x2039	# SINGLE LEFT-POINTING ANGLE QUOTATION MARK
0xDD	0x203A	# SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
0xDE	0x0159	# LATIN SMALL LETTER R WITH CARON
0xDF	0x0156	# LATIN CAPITAL LETTER R WITH CEDILLA
0xE0	0x0157	# LATIN SMALL LETTER R WITH CEDILLA
0xE1	0x0160	# LATIN CAPITAL LETTER S WITH CARON
0xE2	0x201A	# SINGLE LOW-9 QUOTATION MARK
0xE3	0x201E	# DOUBLE LOW-9 QUOTATION MARK
0xE4	0x0161	# LATIN SMALL LETTER S WITH CARON
0xE5	0x015A	# LATIN CAPITAL LETTER S WITH ACUTE
0xE6	0x015B	# LATIN SMALL LETTER S WITH ACUTE
0xE7	0x00C1	# LATIN CAPITAL LETTER A WITH ACUTE
0xE8	0x0164	# LATIN CAPITAL LETTER T WITH CARON
0xE9	0x0165	# LATIN SMALL LETTER T WITH CARON
0xEA	0x00CD	# LATIN CAPITAL LETTER I WITH ACUTE
0xEB	0x017D	# LATIN CAPITAL LETTER Z WITH CARON
0xEC	0x017E	# LATIN SMALL LETTER Z WITH CARON
0xED	0x016A	# LATIN CAPITAL LETTER U WITH MACRON
0xEE	0x00D3	# LATIN CAPITAL LETTER O WITH ACUTE
0xEF	0x00D4	# LATIN CAPITAL LETTER O WITH CIRCUMFLEX
0xF0	0x016B	# LATIN SMALL LETTER U WITH MACRON
0xF1	0x016E	# LATIN CAPITAL LETTER U WITH RING ABOVE
0xF2	0x00DA	# LATIN CAPITAL LETTER U WITH ACUTE
0xF3	0x016F	# LATIN SMALL LETTER U WITH RING ABOVE
0xF4	0x0170	# LATIN CAPITAL LETTER U WITH DOUBLE ACUTE
0xF5	0x0171	# LATIN SMALL LETTER U WITH DOUBLE ACUTE
0xF6	0x0172	# LATIN CAPITAL LETTER U WITH OGONEK
0xF7	0x0173	# LATIN SMALL LETTER U WITH OGONEK
0xF8	0x00DD	# LATIN CAPITAL LETTER Y WITH ACUTE
0xF9	0x00FD	# LATIN SMALL LETTER Y WITH ACUTE
0xFA	0x0137	# LATIN SMALL LETTER K WITH CEDILLA
0xFB	0x017B	# LATIN CAPITAL LETTER Z WITH DOT ABOVE
0xFC	0x0141	# LATIN CAPITAL LETTER L WITH STROKE
0xFD	0x017C	# LATIN SMALL LETTER Z WITH DOT ABOVE
0xFE	0x0122	# LATIN CAPITAL LETTER G WITH CEDILLA
0xFF	0x02C7	# CARON