forked from wine-mirror/wine
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathunicode-defaults
202 lines (192 loc) · 10.2 KB
/
unicode-defaults
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
# Default Unicode mappings
#
# Copyright 2000 Alexandre Julliard
#
# This library is free software; you can redistribute it and/or
# modify it under the terms of the GNU Lesser General Public
# License as published by the Free Software Foundation; either
# version 2.1 of the License, or (at your option) any later version.
#
# This library is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
# Lesser General Public License for more details.
#
# You should have received a copy of the GNU Lesser General Public
# License along with this library; if not, write to the Free Software
# Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
#
# NOTES:
#
# This file contains default mappings for Unicode chars that aren't
# defined directly in the code page file. It is used by the cpmap.pl
# tool to build codepage tables.
#
# The first column defines equivalence sets; if any character in the set
# is defined in the codepage file, all others in the set will map to the
# same value.
#
# The second column specifies the default char to map the whole set to,
# if no characters in the set are defined by the codepage file.
#
# Characters that have an explicit decomposition in the UnicodeData.txt
# file (for instance 00c0 LATIN CAPITAL LETTER A WITH GRAVE -> 0041 0300)
# are handled automatically and do not have to be defined here. They can
# still be defined if necessary to override the unicode decomposition.
#
# letters
00a2,20a1 'c' # CENT SIGN, COLON SIGN
00a3,20a4 'L' # POUND SIGN, LIRA SIGN
00a5 'Y' # YEN SIGN
00a6 '|' # BROKEN BAR
00a9 'c' # COPYRIGHT SIGN
00ae 'r' # REGISTERED SIGN
00b5,03bc 'u' # MICRO SIGN, GREEK SMALL LETTER MU
00c6 'A' # LATIN CAPITAL LETTER AE
00d0,0110,0189 'D' # LATIN CAPITAL LETTER ETH/D WITH STROKE/AFRICAN D
00d7 'x' # MULTIPLICATION SIGN
00d8,2205 'O' # LATIN CAPITAL LETTER O WITH STROKE, EMPTY SET
00df,03b2 none # LATIN SMALL LETTER SHARP S, GREEK SMALL LETTER BETA
00e6 'a' # LATIN SMALL LETTER AE
00f0 'd' # LATIN SMALL LETTER ETH
00f8 'o' # LATIN SMALL LETTER O WITH STROKE
0111 'd' # LATIN SMALL LETTER D WITH STROKE
0126 'H' # LATIN CAPITAL LETTER H WITH STROKE
0127 'h' # LATIN SMALL LETTER H WITH STROKE
0131 'i' # LATIN SMALL LETTER DOTLESS I
0141 'L' # LATIN CAPITAL LETTER L WITH STROKE
0142 'l' # LATIN SMALL LETTER L WITH STROKE
0152 'O' # LATIN CAPITAL LIGATURE OE
0153 'o' # LATIN SMALL LIGATURE OE
0166 'T' # LATIN CAPITAL LETTER T WITH STROKE
0167 't' # LATIN SMALL LETTER T WITH STROKE
0180 'b' # LATIN SMALL LETTER B WITH STROKE
0190 'E' # LATIN CAPITAL LETTER OPEN E
0191 'F' # LATIN CAPITAL LETTER F WITH HOOK
0192 'f' # LATIN SMALL LETTER F WITH HOOK
0197 'I' # LATIN CAPITAL LETTER I WITH STROKE
019a 'l' # LATIN SMALL LETTER L WITH BAR
019f 'O' # LATIN CAPITAL LETTER O WITH MIDDLE TILDE
01ab 't' # LATIN SMALL LETTER T WITH PALATAL HOOK
01ae 'T' # LATIN CAPITAL LETTER T WITH RETROFLEX HOOK
01b6 'z' # LATIN SMALL LETTER Z WITH STROKE
0391 'A' # GREEK CAPITAL LETTER ALPHA
0392 'B' # GREEK CAPITAL LETTER BETA
0395 'E' # GREEK CAPITAL LETTER EPSILON
0396 'Z' # GREEK CAPITAL LETTER ZETA
0397 'H' # GREEK CAPITAL LETTER ETA
0399 'I' # GREEK CAPITAL LETTER IOTA
039a 'K' # GREEK CAPITAL LETTER KAPPA
039c 'M' # GREEK CAPITAL LETTER MU
039d 'N' # GREEK CAPITAL LETTER NU
039f 'O' # GREEK CAPITAL LETTER OMICRON
03a1 'P' # GREEK CAPITAL LETTER RHO
03a4 'T' # GREEK CAPITAL LETTER TAU
03a5 'Y' # GREEK CAPITAL LETTER UPSILON
03a7 'X' # GREEK CAPITAL LETTER CHI
01e4 'G' # LATIN CAPITAL LETTER G WITH STROKE
01e5 'g' # LATIN SMALL LETTER G WITH STROKE
0261 'g' # LATIN SMALL LETTER SCRIPT G
2118 'P' # SCRIPT CAPITAL P
212e 'e' # ESTIMATED SYMBOL
# accents
00a8,0308 '"' # DIAERESIS
00af,02c9,0304 2014 # MACRON -> EM DASH
00b4,02b9,02ca,0301,2032 ''' # ACUTE ACCENT, PRIME
00b8,0327 ',' # CEDILLA
02ba,02dd,030b,2033 '"' # DOUBLE ACUTE ACCENT, DOUBLE PRIME
02c4,2303 '^' # UP ARROWHEAD
02c6,0302 '^' # CIRCUMFLEX ACCENT
02c7,030c 'v' # CARON, COMBINING CARON
02c8 ''' # MODIFIER LETTER VERTICAL LINE
02cb,0300 '`' # GRAVE ACCENT
02cd,0331,0332 '_' # MODIFIER LETTER LOW MACRON, COMBINING MACRON BELOW, COMBINING LOW LINE
02d8,0306 none # BREVE
02d9,0307 none # DOT ABOVE
02da,030a,2070,2218 00b0 # RING ABOVE, SUPERSCRIPT ZERO, RING OPERATOR -> DEGREE SIGN
02db,0328 none # OGONEK
02dc,0303 '~' # SMALL TILDE
0305,203e 00af # OVERLINE -> MACRON
030e '"' # COMBINING DOUBLE VERTICAL LINE ABOVE
0333 '_' # COMBINING DOUBLE LOW LINE
# mathematical symbols
00b1,2213 none # PLUS-MINUS SIGN, MINUS-OR-PLUS SIGN
2044,2215 '/' # FRACTION/DIVISION SLASH
2216 '\' # SET MINUS
2217 '*' # ASTERISK OPERATOR
221a 'V' # SQUARE ROOT
221f 'L' # RIGHT ANGLE
2223 '|' # DIVIDES
2229 'n' # INTERSECTION
2236 ':' # RATIO
2248 02DC # ALMOST EQUAL TO -> SMALL TILDE
2261,2263 '=' # IDENTICAL TO, STRICTLY EQUIVALENT TO
226a 00ab # MUCH LESS-THAN -> LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
226b 00bb # MUCH GREATER-THAN -> RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
22c5 00b7 # DOT OPERATOR -> MIDDLE DOT
# misc symbols
00a1 '!' # INVERTED EXCLAMATION MARK
00ab,300a '<' # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK, LEFT DOUBLE ANGLE BRACKET
00ad '-' # SOFT HYPHEN
00bb,300b '>' # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK, RIGHT DOUBLE ANGLE BRACKET
01c0 2502 # LATIN LETTER DENTAL CLICK -> BOX DRAWINGS LIGHT VERTICAL
01c3 '!' # LATIN LETTER RETROFLEX CLICK
02bb 2018 # MODIFIER LETTER TURNED COMMA -> LEFT SINGLE QUOTATION MARK
02bc,2019 ''' # RIGHT SINGLE QUOTATION MARK
2010,2011,2212 '-' # HYPHEN, NON-BREAKING HYPHEN, MINUS SIGN
2013,2014,2015 '-' # EN DASH, EM DASH, HORIZONTAL BAR
2018,201b,2035 '`' # LEFT SINGLE QUOTATION MARK, SINGLE HIGH-REVERSED-9 QUOTATION MARK, REVERSED PRIME
201a ',' # SINGLE LOW-9 QUOTATION MARK
201c,301d '"' # LEFT DOUBLE QUOTATION MARK, REVERSED DOUBLE PRIME QUOTATION MARK
201d,301e '"' # RIGHT DOUBLE QUOTATION MARK, DOUBLE PRIME QUOTATION MARK
201e,301f ',' # DOUBLE LOW-9 QUOTATION MARK, LOW DOUBLE PRIME QUOTATION MARK
2022,2219 none # BULLET, BULLET OPERATOR
2039,3008 '<' # SINGLE LEFT-POINTING ANGLE QUOTATION MARK, LEFT ANGLE BRACKET
203a,3009 '>' # SINGLE RIGHT-POINTING ANGLE QUOTATION MARK, RIGHT ANGLE BRACKET
203c '!' # DOUBLE EXCLAMATION MARK
2190 2039 # LEFTWARDS ARROW -> SINGLE LEFT-POINTING ANGLE QUOTATION MARK
2191 02c6 # UPWARDS ARROW -> MODIFIER LETTER CIRCUMFLEX ACCENT
2192 203a # RIGHTWARDS ARROW -> SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
2193 02c7 # DOWNWARDS ARROW -> CARON
2194 '-' # LEFT RIGHT ARROW
2195 '|' # UP DOWN ARROW
223c '~' # TILDE OPERATOR
301a '[' # LEFT WHITE SQUARE BRACKET
301b ']' # RIGHT WHITE SQUARE BRACKET
fe49,fe4a,fe4b,fe4c 203e # DASHED/CENTRELINE/WAVY/DOUBLE WAVY OVERLINE -> OVERLINE
fe4d,fe4e,fe4f '_' # DASHED/CENTRELINE/WAVY LOW LINE
# box drawing chars
2500,2501 '-' # BOX DRAWINGS LIGHT/HEAVY HORIZONTAL
2502,2503 '|' # BOX DRAWINGS LIGHT/HEAVY VERTICAL
2504,2505 '-' # BOX DRAWINGS LIGHT/HEAVY TRIPLE DASH HORIZONTAL
2506,2507 00a6 # BOX DRAWINGS LIGHT/HEAVY TRIPLE DASH VERTICAL -> BROKEN BAR
2508,2509 '-' # BOX DRAWINGS LIGHT/HEAVY QUADRUPLE DASH HORIZONTAL
250a,250b 00a6 # BOX DRAWINGS LIGHT/HEAVY QUADRUPLE DASH VERTICAL -> BROKEN BAR
250c,250d,250e,250f '+' # BOX DRAWINGS LIGHT/HEAVY DOWN AND RIGHT
2510,2511,2512,2513 00ac # BOX DRAWINGS LIGHT/HEAVY DOWN AND LEFT -> NOT SIGN
2514,2515,2516,2517 'L' # BOX DRAWINGS LIGHT/HEAVY UP AND RIGHT
2518,2519,251a,251b '+' # BOX DRAWINGS LIGHT/HEAVY UP AND LEFT
251c,251d,251e,251f,2520,2521,2522,2523 '+' # BOX DRAWINGS LIGHT/HEAVY VERTICAL AND RIGHT
2524,2525,2526,2527,2528,2529,252a,252b '+' # BOX DRAWINGS LIGHT/HEAVY VERTICAL AND LEFT
252c,252d,252e,252f,2530,2531,2532,2533 'T' # BOX DRAWINGS LIGHT/HEAVY DOWN AND HORIZONTAL
2534,2535,2536,2537,2538,2539,253a,253b '+' # BOX DRAWINGS LIGHT/HEAVY UP AND HORIZONTAL
253c,253d,253e,253f,2540,2541,2542,2543,2544,2545,2546,2547,2548,2549,254a,254b '+' # BOX DRAWINGS LIGHT/HEAVY VERTICAL AND HORIZONTAL
254c,254d '-' # BOX DRAWINGS LIGHT/HEAVY DOUBLE DASH HORIZONTAL
254e,254f 00a6 # BOX DRAWINGS LIGHT/HEAVY DOUBLE DASH VERTICAL -> BROKEN BAR
2550 '=' # BOX DRAWINGS DOUBLE HORIZONTAL
2551 '|' # BOX DRAWINGS DOUBLE VERTICAL
2552,2553,2554 '+' # BOX DRAWINGS DOWN AND RIGHT
2555,2556,2557 00ac # BOX DRAWINGS DOWN AND LEFT -> NOT SIGN
2558,2559,255a 'L' # BOX DRAWINGS UP AND RIGHT
255b,255c,255d '+' # BOX DRAWINGS UP AND LEFT
255e,255f,2560 '+' # BOX DRAWINGS VERTICAL AND RIGHT
2561,2562,2563 '+' # BOX DRAWINGS VERTICAL AND LEFT
2564,2565,2566 'T' # BOX DRAWINGS DOWN AND HORIZONTAL
2567,2568,2569 '+' # BOX DRAWINGS UP AND HORIZONTAL
256a,256b,256c '+' # BOX DRAWINGS VERTICAL AND HORIZONTAL
2571 '/' # BOX DRAWINGS LIGHT DIAGONAL UPPER RIGHT TO LOWER LEFT
2572 '\' # BOX DRAWINGS LIGHT DIAGONAL UPPER LEFT TO LOWER RIGHT
2573 'X' # BOX DRAWINGS LIGHT DIAGONAL CROSS
2574,2576,2578,257a,257c,257e '-' # BOX DRAWINGS LIGHT/HEAVY LEFT/RIGHT
2575,2577,2579,257b,257d,257f '|' # BOX DRAWINGS LIGHT/HEAVY UP/DOWN
25cb,25ef 'O' # WHITE/LARGE CIRCLE