source: trunk/include/encodings/cp1252.h@ 201

Last change on this file since 201 was 147, checked in by umoeller, 23 years ago

Misc updates for Unicode.

  • Property svn:eol-style set to CRLF
  • Property svn:keywords set to Author Date Id Revision
File size: 11.7 KB
Line 
1
2/*
3 *@@sourcefile cp1252.h:
4 * encoding translation for CP1252 to Unicode.
5 *
6 * Note: From my checking, 1252 is exactly the
7 * same as 1004, except for codepoint 0xAF.
8 *
9 *@@added V0.9.9 (2001-02-10) [umoeller]
10 */
11
12XWPENCODINGMAP G_cp1252[] =
13{
// Lookup data for translating cp1252 byte values to Unicode code points.
//
// The initializer is a flat list of value pairs, one pair per row:
//      <cp1252 code>, <Unicode code point>, // <Unicode character name>
// Rows run from 0x00 through 0xFF in ascending cp1252 order.
//
// Rows tagged #UNDEFINED (0x81, 0x8D, 0x8F, 0x90 and 0x9D) carry 0xffff
// in the Unicode column.
// NOTE(review): presumably readers of this table treat 0xffff as
// "no mapping" -- confirm against the code that consumes it.
//
// NOTE(review): XWPENCODINGMAP is declared elsewhere; the flat pair layout
// assumes its first two members are the codepage value and the Unicode
// value, in that order -- confirm against its declaration.
//
// The banner below appears to be carried over from the mapping file this
// table was generated from; its "Format" lines describe a tab-separated
// layout with '#' comments, not the comma-separated C rows used here.
14//
15// Name: cp1252 to Unicode table
16// Unicode version: 2.0
17// Table version: 2.01
18// Table format: Format A
19// Date: 04/15/98
20//
21// Contact: cpxlate@microsoft.com
22//
23// General notes: none
24//
25// Format: Three tab-separated columns
26// Column #1 is the cp1252 code (in hex)
27// Column #2 is the Unicode (in hex as 0xXXXX)
28// Column #3 is the Unicode name (follows a comment sign, '#')
29//
30// The entries are in cp1252 order
31//
32 0x00, 0x0000, // NULL
33 0x01, 0x0001, // START OF HEADING
34 0x02, 0x0002, // START OF TEXT
35 0x03, 0x0003, // END OF TEXT
36 0x04, 0x0004, // END OF TRANSMISSION
37 0x05, 0x0005, // ENQUIRY
38 0x06, 0x0006, // ACKNOWLEDGE
39 0x07, 0x0007, // BELL
40 0x08, 0x0008, // BACKSPACE
41 0x09, 0x0009, // HORIZONTAL TABULATION
42 0x0A, 0x000A, // LINE FEED
43 0x0B, 0x000B, // VERTICAL TABULATION
44 0x0C, 0x000C, // FORM FEED
45 0x0D, 0x000D, // CARRIAGE RETURN
46 0x0E, 0x000E, // SHIFT OUT
47 0x0F, 0x000F, // SHIFT IN
48 0x10, 0x0010, // DATA LINK ESCAPE
49 0x11, 0x0011, // DEVICE CONTROL ONE
50 0x12, 0x0012, // DEVICE CONTROL TWO
51 0x13, 0x0013, // DEVICE CONTROL THREE
52 0x14, 0x0014, // DEVICE CONTROL FOUR
53 0x15, 0x0015, // NEGATIVE ACKNOWLEDGE
54 0x16, 0x0016, // SYNCHRONOUS IDLE
55 0x17, 0x0017, // END OF TRANSMISSION BLOCK
56 0x18, 0x0018, // CANCEL
57 0x19, 0x0019, // END OF MEDIUM
58 0x1A, 0x001A, // SUBSTITUTE
59 0x1B, 0x001B, // ESCAPE
60 0x1C, 0x001C, // FILE SEPARATOR
61 0x1D, 0x001D, // GROUP SEPARATOR
62 0x1E, 0x001E, // RECORD SEPARATOR
63 0x1F, 0x001F, // UNIT SEPARATOR
64 0x20, 0x0020, // SPACE
65 0x21, 0x0021, // EXCLAMATION MARK
66 0x22, 0x0022, // QUOTATION MARK
67 0x23, 0x0023, // NUMBER SIGN
68 0x24, 0x0024, // DOLLAR SIGN
69 0x25, 0x0025, // PERCENT SIGN
70 0x26, 0x0026, // AMPERSAND
71 0x27, 0x0027, // APOSTROPHE
72 0x28, 0x0028, // LEFT PARENTHESIS
73 0x29, 0x0029, // RIGHT PARENTHESIS
74 0x2A, 0x002A, // ASTERISK
75 0x2B, 0x002B, // PLUS SIGN
76 0x2C, 0x002C, // COMMA
77 0x2D, 0x002D, // HYPHEN-MINUS
78 0x2E, 0x002E, // FULL STOP
79 0x2F, 0x002F, // SOLIDUS
80 0x30, 0x0030, // DIGIT ZERO
81 0x31, 0x0031, // DIGIT ONE
82 0x32, 0x0032, // DIGIT TWO
83 0x33, 0x0033, // DIGIT THREE
84 0x34, 0x0034, // DIGIT FOUR
85 0x35, 0x0035, // DIGIT FIVE
86 0x36, 0x0036, // DIGIT SIX
87 0x37, 0x0037, // DIGIT SEVEN
88 0x38, 0x0038, // DIGIT EIGHT
89 0x39, 0x0039, // DIGIT NINE
90 0x3A, 0x003A, // COLON
91 0x3B, 0x003B, // SEMICOLON
92 0x3C, 0x003C, // LESS-THAN SIGN
93 0x3D, 0x003D, // EQUALS SIGN
94 0x3E, 0x003E, // GREATER-THAN SIGN
95 0x3F, 0x003F, // QUESTION MARK
96 0x40, 0x0040, // COMMERCIAL AT
97 0x41, 0x0041, // LATIN CAPITAL LETTER A
98 0x42, 0x0042, // LATIN CAPITAL LETTER B
99 0x43, 0x0043, // LATIN CAPITAL LETTER C
100 0x44, 0x0044, // LATIN CAPITAL LETTER D
101 0x45, 0x0045, // LATIN CAPITAL LETTER E
102 0x46, 0x0046, // LATIN CAPITAL LETTER F
103 0x47, 0x0047, // LATIN CAPITAL LETTER G
104 0x48, 0x0048, // LATIN CAPITAL LETTER H
105 0x49, 0x0049, // LATIN CAPITAL LETTER I
106 0x4A, 0x004A, // LATIN CAPITAL LETTER J
107 0x4B, 0x004B, // LATIN CAPITAL LETTER K
108 0x4C, 0x004C, // LATIN CAPITAL LETTER L
109 0x4D, 0x004D, // LATIN CAPITAL LETTER M
110 0x4E, 0x004E, // LATIN CAPITAL LETTER N
111 0x4F, 0x004F, // LATIN CAPITAL LETTER O
112 0x50, 0x0050, // LATIN CAPITAL LETTER P
113 0x51, 0x0051, // LATIN CAPITAL LETTER Q
114 0x52, 0x0052, // LATIN CAPITAL LETTER R
115 0x53, 0x0053, // LATIN CAPITAL LETTER S
116 0x54, 0x0054, // LATIN CAPITAL LETTER T
117 0x55, 0x0055, // LATIN CAPITAL LETTER U
118 0x56, 0x0056, // LATIN CAPITAL LETTER V
119 0x57, 0x0057, // LATIN CAPITAL LETTER W
120 0x58, 0x0058, // LATIN CAPITAL LETTER X
121 0x59, 0x0059, // LATIN CAPITAL LETTER Y
122 0x5A, 0x005A, // LATIN CAPITAL LETTER Z
123 0x5B, 0x005B, // LEFT SQUARE BRACKET
124 0x5C, 0x005C, // REVERSE SOLIDUS
125 0x5D, 0x005D, // RIGHT SQUARE BRACKET
126 0x5E, 0x005E, // CIRCUMFLEX ACCENT
127 0x5F, 0x005F, // LOW LINE
128 0x60, 0x0060, // GRAVE ACCENT
129 0x61, 0x0061, // LATIN SMALL LETTER A
130 0x62, 0x0062, // LATIN SMALL LETTER B
131 0x63, 0x0063, // LATIN SMALL LETTER C
132 0x64, 0x0064, // LATIN SMALL LETTER D
133 0x65, 0x0065, // LATIN SMALL LETTER E
134 0x66, 0x0066, // LATIN SMALL LETTER F
135 0x67, 0x0067, // LATIN SMALL LETTER G
136 0x68, 0x0068, // LATIN SMALL LETTER H
137 0x69, 0x0069, // LATIN SMALL LETTER I
138 0x6A, 0x006A, // LATIN SMALL LETTER J
139 0x6B, 0x006B, // LATIN SMALL LETTER K
140 0x6C, 0x006C, // LATIN SMALL LETTER L
141 0x6D, 0x006D, // LATIN SMALL LETTER M
142 0x6E, 0x006E, // LATIN SMALL LETTER N
143 0x6F, 0x006F, // LATIN SMALL LETTER O
144 0x70, 0x0070, // LATIN SMALL LETTER P
145 0x71, 0x0071, // LATIN SMALL LETTER Q
146 0x72, 0x0072, // LATIN SMALL LETTER R
147 0x73, 0x0073, // LATIN SMALL LETTER S
148 0x74, 0x0074, // LATIN SMALL LETTER T
149 0x75, 0x0075, // LATIN SMALL LETTER U
150 0x76, 0x0076, // LATIN SMALL LETTER V
151 0x77, 0x0077, // LATIN SMALL LETTER W
152 0x78, 0x0078, // LATIN SMALL LETTER X
153 0x79, 0x0079, // LATIN SMALL LETTER Y
154 0x7A, 0x007A, // LATIN SMALL LETTER Z
155 0x7B, 0x007B, // LEFT CURLY BRACKET
156 0x7C, 0x007C, // VERTICAL LINE
157 0x7D, 0x007D, // RIGHT CURLY BRACKET
158 0x7E, 0x007E, // TILDE
159 0x7F, 0x007F, // DELETE
160 0x80, 0x20AC, // EURO SIGN
161 0x81, 0xffff, // #UNDEFINED
162 0x82, 0x201A, // SINGLE LOW-9 QUOTATION MARK
163 0x83, 0x0192, // LATIN SMALL LETTER F WITH HOOK
164 0x84, 0x201E, // DOUBLE LOW-9 QUOTATION MARK
165 0x85, 0x2026, // HORIZONTAL ELLIPSIS
166 0x86, 0x2020, // DAGGER
167 0x87, 0x2021, // DOUBLE DAGGER
168 0x88, 0x02C6, // MODIFIER LETTER CIRCUMFLEX ACCENT
169 0x89, 0x2030, // PER MILLE SIGN
170 0x8A, 0x0160, // LATIN CAPITAL LETTER S WITH CARON
171 0x8B, 0x2039, // SINGLE LEFT-POINTING ANGLE QUOTATION MARK
172 0x8C, 0x0152, // LATIN CAPITAL LIGATURE OE
173 0x8D, 0xffff, // #UNDEFINED
174 0x8E, 0x017D, // LATIN CAPITAL LETTER Z WITH CARON
175 0x8F, 0xffff, // #UNDEFINED
176 0x90, 0xffff, // #UNDEFINED
177 0x91, 0x2018, // LEFT SINGLE QUOTATION MARK
178 0x92, 0x2019, // RIGHT SINGLE QUOTATION MARK
179 0x93, 0x201C, // LEFT DOUBLE QUOTATION MARK
180 0x94, 0x201D, // RIGHT DOUBLE QUOTATION MARK
181 0x95, 0x2022, // BULLET
182 0x96, 0x2013, // EN DASH
183 0x97, 0x2014, // EM DASH
184 0x98, 0x02DC, // SMALL TILDE
185 0x99, 0x2122, // TRADE MARK SIGN
186 0x9A, 0x0161, // LATIN SMALL LETTER S WITH CARON
187 0x9B, 0x203A, // SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
188 0x9C, 0x0153, // LATIN SMALL LIGATURE OE
189 0x9D, 0xffff, // #UNDEFINED
190 0x9E, 0x017E, // LATIN SMALL LETTER Z WITH CARON
191 0x9F, 0x0178, // LATIN CAPITAL LETTER Y WITH DIAERESIS
192 0xA0, 0x00A0, // NO-BREAK SPACE
193 0xA1, 0x00A1, // INVERTED EXCLAMATION MARK
194 0xA2, 0x00A2, // CENT SIGN
195 0xA3, 0x00A3, // POUND SIGN
196 0xA4, 0x00A4, // CURRENCY SIGN
197 0xA5, 0x00A5, // YEN SIGN
198 0xA6, 0x00A6, // BROKEN BAR
199 0xA7, 0x00A7, // SECTION SIGN
200 0xA8, 0x00A8, // DIAERESIS
201 0xA9, 0x00A9, // COPYRIGHT SIGN
202 0xAA, 0x00AA, // FEMININE ORDINAL INDICATOR
203 0xAB, 0x00AB, // LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
204 0xAC, 0x00AC, // NOT SIGN
205 0xAD, 0x00AD, // SOFT HYPHEN
206 0xAE, 0x00AE, // REGISTERED SIGN
207 0xAF, 0x00AF, // MACRON
208 0xB0, 0x00B0, // DEGREE SIGN
209 0xB1, 0x00B1, // PLUS-MINUS SIGN
210 0xB2, 0x00B2, // SUPERSCRIPT TWO
211 0xB3, 0x00B3, // SUPERSCRIPT THREE
212 0xB4, 0x00B4, // ACUTE ACCENT
213 0xB5, 0x00B5, // MICRO SIGN
214 0xB6, 0x00B6, // PILCROW SIGN
215 0xB7, 0x00B7, // MIDDLE DOT
216 0xB8, 0x00B8, // CEDILLA
217 0xB9, 0x00B9, // SUPERSCRIPT ONE
218 0xBA, 0x00BA, // MASCULINE ORDINAL INDICATOR
219 0xBB, 0x00BB, // RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
220 0xBC, 0x00BC, // VULGAR FRACTION ONE QUARTER
221 0xBD, 0x00BD, // VULGAR FRACTION ONE HALF
222 0xBE, 0x00BE, // VULGAR FRACTION THREE QUARTERS
223 0xBF, 0x00BF, // INVERTED QUESTION MARK
224 0xC0, 0x00C0, // LATIN CAPITAL LETTER A WITH GRAVE
225 0xC1, 0x00C1, // LATIN CAPITAL LETTER A WITH ACUTE
226 0xC2, 0x00C2, // LATIN CAPITAL LETTER A WITH CIRCUMFLEX
227 0xC3, 0x00C3, // LATIN CAPITAL LETTER A WITH TILDE
228 0xC4, 0x00C4, // LATIN CAPITAL LETTER A WITH DIAERESIS
229 0xC5, 0x00C5, // LATIN CAPITAL LETTER A WITH RING ABOVE
230 0xC6, 0x00C6, // LATIN CAPITAL LETTER AE
231 0xC7, 0x00C7, // LATIN CAPITAL LETTER C WITH CEDILLA
232 0xC8, 0x00C8, // LATIN CAPITAL LETTER E WITH GRAVE
233 0xC9, 0x00C9, // LATIN CAPITAL LETTER E WITH ACUTE
234 0xCA, 0x00CA, // LATIN CAPITAL LETTER E WITH CIRCUMFLEX
235 0xCB, 0x00CB, // LATIN CAPITAL LETTER E WITH DIAERESIS
236 0xCC, 0x00CC, // LATIN CAPITAL LETTER I WITH GRAVE
237 0xCD, 0x00CD, // LATIN CAPITAL LETTER I WITH ACUTE
238 0xCE, 0x00CE, // LATIN CAPITAL LETTER I WITH CIRCUMFLEX
239 0xCF, 0x00CF, // LATIN CAPITAL LETTER I WITH DIAERESIS
240 0xD0, 0x00D0, // LATIN CAPITAL LETTER ETH
241 0xD1, 0x00D1, // LATIN CAPITAL LETTER N WITH TILDE
242 0xD2, 0x00D2, // LATIN CAPITAL LETTER O WITH GRAVE
243 0xD3, 0x00D3, // LATIN CAPITAL LETTER O WITH ACUTE
244 0xD4, 0x00D4, // LATIN CAPITAL LETTER O WITH CIRCUMFLEX
245 0xD5, 0x00D5, // LATIN CAPITAL LETTER O WITH TILDE
246 0xD6, 0x00D6, // LATIN CAPITAL LETTER O WITH DIAERESIS
247 0xD7, 0x00D7, // MULTIPLICATION SIGN
248 0xD8, 0x00D8, // LATIN CAPITAL LETTER O WITH STROKE
249 0xD9, 0x00D9, // LATIN CAPITAL LETTER U WITH GRAVE
250 0xDA, 0x00DA, // LATIN CAPITAL LETTER U WITH ACUTE
251 0xDB, 0x00DB, // LATIN CAPITAL LETTER U WITH CIRCUMFLEX
252 0xDC, 0x00DC, // LATIN CAPITAL LETTER U WITH DIAERESIS
253 0xDD, 0x00DD, // LATIN CAPITAL LETTER Y WITH ACUTE
254 0xDE, 0x00DE, // LATIN CAPITAL LETTER THORN
255 0xDF, 0x00DF, // LATIN SMALL LETTER SHARP S
256 0xE0, 0x00E0, // LATIN SMALL LETTER A WITH GRAVE
257 0xE1, 0x00E1, // LATIN SMALL LETTER A WITH ACUTE
258 0xE2, 0x00E2, // LATIN SMALL LETTER A WITH CIRCUMFLEX
259 0xE3, 0x00E3, // LATIN SMALL LETTER A WITH TILDE
260 0xE4, 0x00E4, // LATIN SMALL LETTER A WITH DIAERESIS
261 0xE5, 0x00E5, // LATIN SMALL LETTER A WITH RING ABOVE
262 0xE6, 0x00E6, // LATIN SMALL LETTER AE
263 0xE7, 0x00E7, // LATIN SMALL LETTER C WITH CEDILLA
264 0xE8, 0x00E8, // LATIN SMALL LETTER E WITH GRAVE
265 0xE9, 0x00E9, // LATIN SMALL LETTER E WITH ACUTE
266 0xEA, 0x00EA, // LATIN SMALL LETTER E WITH CIRCUMFLEX
267 0xEB, 0x00EB, // LATIN SMALL LETTER E WITH DIAERESIS
268 0xEC, 0x00EC, // LATIN SMALL LETTER I WITH GRAVE
269 0xED, 0x00ED, // LATIN SMALL LETTER I WITH ACUTE
270 0xEE, 0x00EE, // LATIN SMALL LETTER I WITH CIRCUMFLEX
271 0xEF, 0x00EF, // LATIN SMALL LETTER I WITH DIAERESIS
272 0xF0, 0x00F0, // LATIN SMALL LETTER ETH
273 0xF1, 0x00F1, // LATIN SMALL LETTER N WITH TILDE
274 0xF2, 0x00F2, // LATIN SMALL LETTER O WITH GRAVE
275 0xF3, 0x00F3, // LATIN SMALL LETTER O WITH ACUTE
276 0xF4, 0x00F4, // LATIN SMALL LETTER O WITH CIRCUMFLEX
277 0xF5, 0x00F5, // LATIN SMALL LETTER O WITH TILDE
278 0xF6, 0x00F6, // LATIN SMALL LETTER O WITH DIAERESIS
279 0xF7, 0x00F7, // DIVISION SIGN
280 0xF8, 0x00F8, // LATIN SMALL LETTER O WITH STROKE
281 0xF9, 0x00F9, // LATIN SMALL LETTER U WITH GRAVE
282 0xFA, 0x00FA, // LATIN SMALL LETTER U WITH ACUTE
283 0xFB, 0x00FB, // LATIN SMALL LETTER U WITH CIRCUMFLEX
284 0xFC, 0x00FC, // LATIN SMALL LETTER U WITH DIAERESIS
285 0xFD, 0x00FD, // LATIN SMALL LETTER Y WITH ACUTE
286 0xFE, 0x00FE, // LATIN SMALL LETTER THORN
287 0xFF, 0x00FF // LATIN SMALL LETTER Y WITH DIAERESIS
288};
289
Note: See TracBrowser for help on using the repository browser.