8148
|
1 |
"
|
|
2 |
COPYRIGHT (c) 2004 by eXept Software AG
|
|
3 |
All Rights Reserved
|
|
4 |
|
|
5 |
This software is furnished under a license and may be used
|
|
6 |
only in accordance with the terms of that license and with the
|
|
7 |
inclusion of the above copyright notice. This software may not
|
|
8 |
be provided or otherwise made available to, or used by, any
|
|
9 |
other person. No title to or ownership of the software is
|
|
10 |
hereby transferred.
|
|
11 |
"
|
|
12 |
|
8081
|
13 |
"{ Package: 'stx:libbasic' }"
|
|
14 |
|
|
15 |
"{ NameSpace: CharacterEncoderImplementations }"
|
|
16 |
|
|
17 |
"Class definition: MS_Cyrillic is the encoder/decoder for the CP1251 (Microsoft Cyrillic)
 code page. It is a SingleByteEncoder subclass which declares no instance variables,
 no class variables and no pool dictionaries of its own."
SingleByteEncoder subclass:#MS_Cyrillic
|
|
18 |
instanceVariableNames:''
|
|
19 |
classVariableNames:''
|
|
20 |
poolDictionaries:''
|
|
21 |
category:'Collections-Text-Encodings'
|
|
22 |
!
|
|
23 |
|
8148
|
24 |
!MS_Cyrillic class methodsFor:'documentation'!
|
|
25 |
|
|
26 |
copyright
|
|
27 |
"
|
|
28 |
COPYRIGHT (c) 2004 by eXept Software AG
|
|
29 |
All Rights Reserved
|
|
30 |
|
|
31 |
This software is furnished under a license and may be used
|
|
32 |
only in accordance with the terms of that license and with the
|
|
33 |
inclusion of the above copyright notice. This software may not
|
|
34 |
be provided or otherwise made available to, or used by, any
|
|
35 |
other person. No title to or ownership of the software is
|
|
36 |
hereby transferred.
|
|
37 |
"
|
8813
|
38 |
!
|
|
39 |
|
|
40 |
documentation
|
|
41 |
"
|
|
42 |
CP1251 / Microsoft Cyrillic
|
|
43 |
|
|
44 |
[see with:]
|
|
45 |
CharacterEncoderImplementations::MS_Cyrillic showCharacterSet
|
|
46 |
|
|
47 |
[author:]
|
|
48 |
Claus Gittinger
|
|
49 |
"
|
8148
|
50 |
! !
|
8081
|
51 |
|
|
52 |
!MS_Cyrillic class methodsFor:'mapping'!
|
|
53 |
|
|
54 |
mapFileURL2_relativePathName
"Answer 'CP1251', the name of the character-map file for this encoding.
 NOTE(review): presumably this is resolved relative to a charmap base URL
 by the code generator (see the 'self generateCode' hint below) - confirm
 against the superclass."
|
|
55 |
^ 'CP1251'
|
8813
|
56 |
|
|
57 |
"
|
|
58 |
self generateCode
|
|
59 |
"
|
8081
|
60 |
!
|
|
61 |
|
|
62 |
mapping
|
|
63 |
"
|
|
64 |
# From: http://std.dkuug.dk/i18n/charmaps/CP1251
|
|
65 |
|
|
66 |
<code_set_name> CP1251
|
|
67 |
<comment_char> %
|
|
68 |
<escape_char> /
|
|
69 |
% version: 1.0
|
|
70 |
% repertoiremap: mnemonic,ds
|
|
71 |
% source: UNICODE 1.0
|
|
72 |
|
|
73 |
% alias MS-CYRL
|
|
74 |
CHARMAP
|
|
75 |
<NU> /x00 <U0000> NULL (NUL)
|
|
76 |
<SH> /x01 <U0001> START OF HEADING (SOH)
|
|
77 |
<SX> /x02 <U0002> START OF TEXT (STX)
|
|
78 |
<EX> /x03 <U0003> END OF TEXT (ETX)
|
|
79 |
<ET> /x04 <U0004> END OF TRANSMISSION (EOT)
|
|
80 |
<EQ> /x05 <U0005> ENQUIRY (ENQ)
|
|
81 |
<AK> /x06 <U0006> ACKNOWLEDGE (ACK)
|
|
82 |
<BL> /x07 <U0007> BELL (BEL)
|
|
83 |
<BS> /x08 <U0008> BACKSPACE (BS)
|
|
84 |
<HT> /x09 <U0009> CHARACTER TABULATION (HT)
|
|
85 |
<LF> /x0A <U000A> LINE FEED (LF)
|
|
86 |
<VT> /x0B <U000B> LINE TABULATION (VT)
|
|
87 |
<FF> /x0C <U000C> FORM FEED (FF)
|
|
88 |
<CR> /x0D <U000D> CARRIAGE RETURN (CR)
|
|
89 |
<SO> /x0E <U000E> SHIFT OUT (SO)
|
|
90 |
<SI> /x0F <U000F> SHIFT IN (SI)
|
|
91 |
<DL> /x10 <U0010> DATALINK ESCAPE (DLE)
|
|
92 |
<D1> /x11 <U0011> DEVICE CONTROL ONE (DC1)
|
|
93 |
<D2> /x12 <U0012> DEVICE CONTROL TWO (DC2)
|
|
94 |
<D3> /x13 <U0013> DEVICE CONTROL THREE (DC3)
|
|
95 |
<D4> /x14 <U0014> DEVICE CONTROL FOUR (DC4)
|
|
96 |
<NK> /x15 <U0015> NEGATIVE ACKNOWLEDGE (NAK)
|
|
97 |
<SY> /x16 <U0016> SYNCHRONOUS IDLE (SYN)
|
|
98 |
<EB> /x17 <U0017> END OF TRANSMISSION BLOCK (ETB)
|
|
99 |
<CN> /x18 <U0018> CANCEL (CAN)
|
|
100 |
<EM> /x19 <U0019> END OF MEDIUM (EM)
|
|
101 |
<SB> /x1A <U001A> SUBSTITUTE (SUB)
|
|
102 |
<EC> /x1B <U001B> ESCAPE (ESC)
|
|
103 |
<FS> /x1C <U001C> FILE SEPARATOR (IS4)
|
|
104 |
<GS> /x1D <U001D> GROUP SEPARATOR (IS3)
|
|
105 |
<RS> /x1E <U001E> RECORD SEPARATOR (IS2)
|
|
106 |
<US> /x1F <U001F> UNIT SEPARATOR (IS1)
|
|
107 |
<SP> /x20 <U0020> SPACE
|
|
108 |
<!!> /x21 <U0021> EXCLAMATION MARK
|
|
109 |
<'> /x22 <U0022> QUOTATION MARK
|
|
110 |
<Nb> /x23 <U0023> NUMBER SIGN
|
|
111 |
<DO> /x24 <U0024> DOLLAR SIGN
|
|
112 |
<%> /x25 <U0025> PERCENT SIGN
|
|
113 |
<&> /x26 <U0026> AMPERSAND
|
|
114 |
<'> /x27 <U0027> APOSTROPHE
|
|
115 |
<(> /x28 <U0028> LEFT PARENTHESIS
|
|
116 |
<)> /x29 <U0029> RIGHT PARENTHESIS
|
|
117 |
<*> /x2A <U002A> ASTERISK
|
|
118 |
<+> /x2B <U002B> PLUS SIGN
|
|
119 |
<,> /x2C <U002C> COMMA
|
|
120 |
<-> /x2D <U002D> HYPHEN-MINUS
|
|
121 |
<.> /x2E <U002E> FULL STOP
|
|
122 |
<//> /x2F <U002F> SOLIDUS
|
|
123 |
<0> /x30 <U0030> DIGIT ZERO
|
|
124 |
<1> /x31 <U0031> DIGIT ONE
|
|
125 |
<2> /x32 <U0032> DIGIT TWO
|
|
126 |
<3> /x33 <U0033> DIGIT THREE
|
|
127 |
<4> /x34 <U0034> DIGIT FOUR
|
|
128 |
<5> /x35 <U0035> DIGIT FIVE
|
|
129 |
<6> /x36 <U0036> DIGIT SIX
|
|
130 |
<7> /x37 <U0037> DIGIT SEVEN
|
|
131 |
<8> /x38 <U0038> DIGIT EIGHT
|
|
132 |
<9> /x39 <U0039> DIGIT NINE
|
|
133 |
<:> /x3A <U003A> COLON
|
|
134 |
<;> /x3B <U003B> SEMICOLON
|
|
135 |
<<> /x3C <U003C> LESS-THAN SIGN
|
|
136 |
<=> /x3D <U003D> EQUALS SIGN
|
|
137 |
</>> /x3E <U003E> GREATER-THAN SIGN
|
|
138 |
<?> /x3F <U003F> QUESTION MARK
|
|
139 |
<At> /x40 <U0040> COMMERCIAL AT
|
|
140 |
<A> /x41 <U0041> LATIN CAPITAL LETTER A
|
|
141 |
<B> /x42 <U0042> LATIN CAPITAL LETTER B
|
|
142 |
<C> /x43 <U0043> LATIN CAPITAL LETTER C
|
|
143 |
<D> /x44 <U0044> LATIN CAPITAL LETTER D
|
|
144 |
<E> /x45 <U0045> LATIN CAPITAL LETTER E
|
|
145 |
<F> /x46 <U0046> LATIN CAPITAL LETTER F
|
|
146 |
<G> /x47 <U0047> LATIN CAPITAL LETTER G
|
|
147 |
<H> /x48 <U0048> LATIN CAPITAL LETTER H
|
|
148 |
<I> /x49 <U0049> LATIN CAPITAL LETTER I
|
|
149 |
<J> /x4A <U004A> LATIN CAPITAL LETTER J
|
|
150 |
<K> /x4B <U004B> LATIN CAPITAL LETTER K
|
|
151 |
<L> /x4C <U004C> LATIN CAPITAL LETTER L
|
|
152 |
<M> /x4D <U004D> LATIN CAPITAL LETTER M
|
|
153 |
<N> /x4E <U004E> LATIN CAPITAL LETTER N
|
|
154 |
<O> /x4F <U004F> LATIN CAPITAL LETTER O
|
|
155 |
<P> /x50 <U0050> LATIN CAPITAL LETTER P
|
|
156 |
<Q> /x51 <U0051> LATIN CAPITAL LETTER Q
|
|
157 |
<R> /x52 <U0052> LATIN CAPITAL LETTER R
|
|
158 |
<S> /x53 <U0053> LATIN CAPITAL LETTER S
|
|
159 |
<T> /x54 <U0054> LATIN CAPITAL LETTER T
|
|
160 |
<U> /x55 <U0055> LATIN CAPITAL LETTER U
|
|
161 |
<V> /x56 <U0056> LATIN CAPITAL LETTER V
|
|
162 |
<W> /x57 <U0057> LATIN CAPITAL LETTER W
|
|
163 |
<X> /x58 <U0058> LATIN CAPITAL LETTER X
|
|
164 |
<Y> /x59 <U0059> LATIN CAPITAL LETTER Y
|
|
165 |
<Z> /x5A <U005A> LATIN CAPITAL LETTER Z
|
|
166 |
<<(> /x5B <U005B> LEFT SQUARE BRACKET
|
|
167 |
<////> /x5C <U005C> REVERSE SOLIDUS
|
|
168 |
<)/>> /x5D <U005D> RIGHT SQUARE BRACKET
|
|
169 |
<'/>> /x5E <U005E> CIRCUMFLEX ACCENT
|
|
170 |
<_> /x5F <U005F> LOW LINE
|
|
171 |
<'!!> /x60 <U0060> GRAVE ACCENT
|
|
172 |
<a> /x61 <U0061> LATIN SMALL LETTER A
|
|
173 |
<b> /x62 <U0062> LATIN SMALL LETTER B
|
|
174 |
<c> /x63 <U0063> LATIN SMALL LETTER C
|
|
175 |
<d> /x64 <U0064> LATIN SMALL LETTER D
|
|
176 |
<e> /x65 <U0065> LATIN SMALL LETTER E
|
|
177 |
<f> /x66 <U0066> LATIN SMALL LETTER F
|
|
178 |
<g> /x67 <U0067> LATIN SMALL LETTER G
|
|
179 |
<h> /x68 <U0068> LATIN SMALL LETTER H
|
|
180 |
<i> /x69 <U0069> LATIN SMALL LETTER I
|
|
181 |
<j> /x6A <U006A> LATIN SMALL LETTER J
|
|
182 |
<k> /x6B <U006B> LATIN SMALL LETTER K
|
|
183 |
<l> /x6C <U006C> LATIN SMALL LETTER L
|
|
184 |
<m> /x6D <U006D> LATIN SMALL LETTER M
|
|
185 |
<n> /x6E <U006E> LATIN SMALL LETTER N
|
|
186 |
<o> /x6F <U006F> LATIN SMALL LETTER O
|
|
187 |
<p> /x70 <U0070> LATIN SMALL LETTER P
|
|
188 |
<q> /x71 <U0071> LATIN SMALL LETTER Q
|
|
189 |
<r> /x72 <U0072> LATIN SMALL LETTER R
|
|
190 |
<s> /x73 <U0073> LATIN SMALL LETTER S
|
|
191 |
<t> /x74 <U0074> LATIN SMALL LETTER T
|
|
192 |
<u> /x75 <U0075> LATIN SMALL LETTER U
|
|
193 |
<v> /x76 <U0076> LATIN SMALL LETTER V
|
|
194 |
<w> /x77 <U0077> LATIN SMALL LETTER W
|
|
195 |
<x> /x78 <U0078> LATIN SMALL LETTER X
|
|
196 |
<y> /x79 <U0079> LATIN SMALL LETTER Y
|
|
197 |
<z> /x7A <U007A> LATIN SMALL LETTER Z
|
|
198 |
<(!!> /x7B <U007B> LEFT CURLY BRACKET
|
|
199 |
<!!!!> /x7C <U007C> VERTICAL LINE
|
|
200 |
<!!)> /x7D <U007D> RIGHT CURLY BRACKET
|
|
201 |
<'?> /x7E <U007E> TILDE
|
|
202 |
<DT> /x7F <U007F> DELETE (DEL)
|
|
203 |
<D%> /x80 <U0402> CYRILLIC CAPITAL LETTER DJE (Serbocroatian)
|
|
204 |
<G%> /x81 <U0403> CYRILLIC CAPITAL LETTER GJE
|
|
205 |
<.9> /x82 <U201A> SINGLE LOW-9 QUOTATION MARK
|
|
206 |
<g%> /x83 <U0453> CYRILLIC SMALL LETTER GJE
|
|
207 |
<:9> /x84 <U201E> DOUBLE LOW-9 QUOTATION MARK
|
|
208 |
<.3> /x85 <U2026> HORIZONTAL ELLIPSIS
|
|
209 |
<//-> /x86 <U2020> DAGGER
|
|
210 |
<//=> /x87 <U2021> DOUBLE DAGGER
|
|
211 |
<%0> /x89 <U2030> PER MILLE SIGN
|
|
212 |
<LJ> /x8A <U0409> CYRILLIC CAPITAL LETTER LJE
|
|
213 |
<<1> /x8B <U2039> SINGLE LEFT-POINTING ANGLE QUOTATION MARK
|
|
214 |
<NJ> /x8C <U040A> CYRILLIC CAPITAL LETTER NJE
|
|
215 |
<KJ> /x8D <U040C> CYRILLIC CAPITAL LETTER KJE
|
|
216 |
<Ts> /x8E <U040B> CYRILLIC CAPITAL LETTER TSHE (Serbocroatian)
|
|
217 |
<DZ> /x8F <U040F> CYRILLIC CAPITAL LETTER DZHE
|
|
218 |
<d%> /x90 <U0452> CYRILLIC SMALL LETTER DJE (Serbocroatian)
|
|
219 |
<'6> /x91 <U2018> LEFT SINGLE QUOTATION MARK
|
|
220 |
<'9> /x92 <U2019> RIGHT SINGLE QUOTATION MARK
|
|
221 |
<'6> /x93 <U201C> LEFT DOUBLE QUOTATION MARK
|
|
222 |
<'9> /x94 <U201D> RIGHT DOUBLE QUOTATION MARK
|
|
223 |
<sb> /x95 <U2022> BULLET
|
|
224 |
<-N> /x96 <U2013> EN DASH
|
|
225 |
<-M> /x97 <U2014> EM DASH
|
|
226 |
<TM> /x99 <U2122> TRADE MARK SIGN
|
|
227 |
<lj> /x9A <U0459> CYRILLIC SMALL LETTER LJE
|
|
228 |
</>1> /x9B <U203A> SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
|
|
229 |
<nj> /x9C <U045A> CYRILLIC SMALL LETTER NJE
|
|
230 |
<kj> /x9D <U045C> CYRILLIC SMALL LETTER KJE
|
|
231 |
<ts> /x9E <U045B> CYRILLIC SMALL LETTER TSHE (Serbocroatian)
|
|
232 |
<dz> /x9F <U045F> CYRILLIC SMALL LETTER DZHE
|
|
233 |
<NS> /xA0 <U00A0> NO-BREAK SPACE
|
|
234 |
<V%> /xA1 <U040E> CYRILLIC CAPITAL LETTER SHORT U (Byelorussian)
|
|
235 |
<v%> /xA2 <U045E> CYRILLIC SMALL LETTER SHORT U (Byelorussian)
|
|
236 |
<J%> /xA3 <U0408> CYRILLIC CAPITAL LETTER JE
|
|
237 |
<Cu> /xA4 <U00A4> CURRENCY SIGN
|
|
238 |
<G3> /xA5 <U0490> CYRILLIC CAPITAL LETTER GHE WITH UPTURN
|
|
239 |
<BB> /xA6 <U00A6> BROKEN BAR
|
|
240 |
<SE> /xA7 <U00A7> SECTION SIGN
|
|
241 |
<IO> /xA8 <U0401> CYRILLIC CAPITAL LETTER IO
|
|
242 |
<Co> /xA9 <U00A9> COPYRIGHT SIGN
|
|
243 |
<IE> /xAA <U0404> CYRILLIC CAPITAL LETTER UKRAINIAN IE
|
|
244 |
<<<> /xAB <U00AB> LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
|
|
245 |
<NO> /xAC <U00AC> NOT SIGN
|
|
246 |
<--> /xAD <U00AD> SOFT HYPHEN
|
|
247 |
<Rg> /xAE <U00AE> REGISTERED SIGN
|
|
248 |
<YI> /xAF <U0407> CYRILLIC CAPITAL LETTER YI (Ukrainian)
|
|
249 |
<DG> /xB0 <U00B0> DEGREE SIGN
|
|
250 |
<+-> /xB1 <U00B1> PLUS-MINUS SIGN
|
|
251 |
<II> /xB2 <U0406> CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
|
|
252 |
<ii> /xB3 <U0456> CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
|
|
253 |
<g3> /xB4 <U0491> CYRILLIC SMALL LETTER GHE WITH UPTURN
|
|
254 |
<My> /xB5 <U00B5> MICRO SIGN
|
|
255 |
<PI> /xB6 <U00B6> PILCROW SIGN
|
|
256 |
<.M> /xB7 <U00B7> MIDDLE DOT
|
|
257 |
<io> /xB8 <U0451> CYRILLIC SMALL LETTER IO
|
|
258 |
<N0> /xB9 <U2116> NUMERO SIGN
|
|
259 |
<ie> /xBA <U0454> CYRILLIC SMALL LETTER UKRAINIAN IE
|
|
260 |
</>/>> /xBB <U00BB> RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
|
|
261 |
<j%> /xBC <U0458> CYRILLIC SMALL LETTER JE
|
|
262 |
<DS> /xBD <U0405> CYRILLIC CAPITAL LETTER DZE
|
|
263 |
<ds> /xBE <U0455> CYRILLIC SMALL LETTER DZE
|
|
264 |
<yi> /xBF <U0457> CYRILLIC SMALL LETTER YI (Ukrainian)
|
|
265 |
<A=> /xC0 <U0410> CYRILLIC CAPITAL LETTER A
|
|
266 |
<B=> /xC1 <U0411> CYRILLIC CAPITAL LETTER BE
|
|
267 |
<V=> /xC2 <U0412> CYRILLIC CAPITAL LETTER VE
|
|
268 |
<G=> /xC3 <U0413> CYRILLIC CAPITAL LETTER GHE
|
|
269 |
<D=> /xC4 <U0414> CYRILLIC CAPITAL LETTER DE
|
|
270 |
<E=> /xC5 <U0415> CYRILLIC CAPITAL LETTER IE
|
|
271 |
<Z%> /xC6 <U0416> CYRILLIC CAPITAL LETTER ZHE
|
|
272 |
<Z=> /xC7 <U0417> CYRILLIC CAPITAL LETTER ZE
|
|
273 |
<I=> /xC8 <U0418> CYRILLIC CAPITAL LETTER I
|
|
274 |
<J=> /xC9 <U0419> CYRILLIC CAPITAL LETTER SHORT I
|
|
275 |
<K=> /xCA <U041A> CYRILLIC CAPITAL LETTER KA
|
|
276 |
<L=> /xCB <U041B> CYRILLIC CAPITAL LETTER EL
|
|
277 |
<M=> /xCC <U041C> CYRILLIC CAPITAL LETTER EM
|
|
278 |
<N=> /xCD <U041D> CYRILLIC CAPITAL LETTER EN
|
|
279 |
<O=> /xCE <U041E> CYRILLIC CAPITAL LETTER O
|
|
280 |
<P=> /xCF <U041F> CYRILLIC CAPITAL LETTER PE
|
|
281 |
<R=> /xD0 <U0420> CYRILLIC CAPITAL LETTER ER
|
|
282 |
<S=> /xD1 <U0421> CYRILLIC CAPITAL LETTER ES
|
|
283 |
<T=> /xD2 <U0422> CYRILLIC CAPITAL LETTER TE
|
|
284 |
<U=> /xD3 <U0423> CYRILLIC CAPITAL LETTER U
|
|
285 |
<F=> /xD4 <U0424> CYRILLIC CAPITAL LETTER EF
|
|
286 |
<H=> /xD5 <U0425> CYRILLIC CAPITAL LETTER HA
|
|
287 |
<C=> /xD6 <U0426> CYRILLIC CAPITAL LETTER TSE
|
|
288 |
<C%> /xD7 <U0427> CYRILLIC CAPITAL LETTER CHE
|
|
289 |
<S%> /xD8 <U0428> CYRILLIC CAPITAL LETTER SHA
|
|
290 |
<Sc> /xD9 <U0429> CYRILLIC CAPITAL LETTER SHCHA
|
|
291 |
<='> /xDA <U042A> CYRILLIC CAPITAL LETTER HARD SIGN
|
|
292 |
<Y=> /xDB <U042B> CYRILLIC CAPITAL LETTER YERU
|
|
293 |
<%'> /xDC <U042C> CYRILLIC CAPITAL LETTER SOFT SIGN
|
|
294 |
<JE> /xDD <U042D> CYRILLIC CAPITAL LETTER E
|
|
295 |
<JU> /xDE <U042E> CYRILLIC CAPITAL LETTER YU
|
|
296 |
<JA> /xDF <U042F> CYRILLIC CAPITAL LETTER YA
|
|
297 |
<a=> /xE0 <U0430> CYRILLIC SMALL LETTER A
|
|
298 |
<b=> /xE1 <U0431> CYRILLIC SMALL LETTER BE
|
|
299 |
<v=> /xE2 <U0432> CYRILLIC SMALL LETTER VE
|
|
300 |
<g=> /xE3 <U0433> CYRILLIC SMALL LETTER GHE
|
|
301 |
<d=> /xE4 <U0434> CYRILLIC SMALL LETTER DE
|
|
302 |
<e=> /xE5 <U0435> CYRILLIC SMALL LETTER IE
|
|
303 |
<z%> /xE6 <U0436> CYRILLIC SMALL LETTER ZHE
|
|
304 |
<z=> /xE7 <U0437> CYRILLIC SMALL LETTER ZE
|
|
305 |
<i=> /xE8 <U0438> CYRILLIC SMALL LETTER I
|
|
306 |
<j=> /xE9 <U0439> CYRILLIC SMALL LETTER SHORT I
|
|
307 |
<k=> /xEA <U043A> CYRILLIC SMALL LETTER KA
|
|
308 |
<l=> /xEB <U043B> CYRILLIC SMALL LETTER EL
|
|
309 |
<m=> /xEC <U043C> CYRILLIC SMALL LETTER EM
|
|
310 |
<n=> /xED <U043D> CYRILLIC SMALL LETTER EN
|
|
311 |
<o=> /xEE <U043E> CYRILLIC SMALL LETTER O
|
|
312 |
<p=> /xEF <U043F> CYRILLIC SMALL LETTER PE
|
|
313 |
<r=> /xF0 <U0440> CYRILLIC SMALL LETTER ER
|
|
314 |
<s=> /xF1 <U0441> CYRILLIC SMALL LETTER ES
|
|
315 |
<t=> /xF2 <U0442> CYRILLIC SMALL LETTER TE
|
|
316 |
<u=> /xF3 <U0443> CYRILLIC SMALL LETTER U
|
|
317 |
<f=> /xF4 <U0444> CYRILLIC SMALL LETTER EF
|
|
318 |
<h=> /xF5 <U0445> CYRILLIC SMALL LETTER HA
|
|
319 |
<c=> /xF6 <U0446> CYRILLIC SMALL LETTER TSE
|
|
320 |
<c%> /xF7 <U0447> CYRILLIC SMALL LETTER CHE
|
|
321 |
<s%> /xF8 <U0448> CYRILLIC SMALL LETTER SHA
|
|
322 |
<sc> /xF9 <U0449> CYRILLIC SMALL LETTER SHCHA
|
|
323 |
<='> /xFA <U044A> CYRILLIC SMALL LETTER HARD SIGN
|
|
324 |
<y=> /xFB <U044B> CYRILLIC SMALL LETTER YERU
|
|
325 |
<%'> /xFC <U044C> CYRILLIC SMALL LETTER SOFT SIGN
|
|
326 |
<je> /xFD <U044D> CYRILLIC SMALL LETTER E
|
|
327 |
<ju> /xFE <U044E> CYRILLIC SMALL LETTER YU
|
|
328 |
<ja> /xFF <U044F> CYRILLIC SMALL LETTER YA
|
|
329 |
END CHARMAP
|
|
330 |
|
|
331 |
"
|
|
332 |
! !
|
|
333 |
|
8813
|
334 |
!MS_Cyrillic methodsFor:'encoding & decoding'!
|
|
335 |
|
|
336 |
decode:codeArg
    "Originally produced by generateCode.
     Translate a single CP1251 byte value into its unicode code point.
     Values up to 16r7F are answered unchanged. Values 16r80..16rFF are
     looked up in the literal table below, in which a 0 entry marks a byte
     that has no assignment. Unassigned bytes and anything above 16rFF are
     answered via #decodingError.
     NOTE(review): Microsoft's published CP1251 table assigns 16r88 to the
     EURO SIGN (U+20AC); this table marks 16r88 as invalid - confirm
     whether that is intended."

    |byte "{ Class: SmallInteger }" codePoint|

    byte := codeArg.
    byte <= 16r7F ifTrue:[ ^ byte ].
    byte <= 16rFF ifFalse:[ ^ self decodingError ].

    "table index 1 corresponds to byte 16r80"
    codePoint := #(
       "16r0080"    16r0402 " CYRILLIC CAPITAL LETTER DJE (Serbocroatian) "
       "16r0081"    16r0403 " CYRILLIC CAPITAL LETTER GJE "
       "16r0082"    16r201A " SINGLE LOW-9 QUOTATION MARK "
       "16r0083"    16r0453 " CYRILLIC SMALL LETTER GJE "
       "16r0084"    16r201E " DOUBLE LOW-9 QUOTATION MARK "
       "16r0085"    16r2026 " HORIZONTAL ELLIPSIS "
       "16r0086"    16r2020 " DAGGER "
       "16r0087"    16r2021 " DOUBLE DAGGER "
       "16r0088"    16r0000 " invalid "
       "16r0089"    16r2030 " PER MILLE SIGN "
       "16r008A"    16r0409 " CYRILLIC CAPITAL LETTER LJE "
       "16r008B"    16r2039 " SINGLE LEFT-POINTING ANGLE QUOTATION MARK "
       "16r008C"    16r040A " CYRILLIC CAPITAL LETTER NJE "
       "16r008D"    16r040C " CYRILLIC CAPITAL LETTER KJE "
       "16r008E"    16r040B " CYRILLIC CAPITAL LETTER TSHE (Serbocroatian) "
       "16r008F"    16r040F " CYRILLIC CAPITAL LETTER DZHE "
       "16r0090"    16r0452 " CYRILLIC SMALL LETTER DJE (Serbocroatian) "
       "16r0091"    16r2018 " LEFT SINGLE QUOTATION MARK "
       "16r0092"    16r2019 " RIGHT SINGLE QUOTATION MARK "
       "16r0093"    16r201C " LEFT DOUBLE QUOTATION MARK "
       "16r0094"    16r201D " RIGHT DOUBLE QUOTATION MARK "
       "16r0095"    16r2022 " BULLET "
       "16r0096"    16r2013 " EN DASH "
       "16r0097"    16r2014 " EM DASH "
       "16r0098"    16r0000 " invalid "
       "16r0099"    16r2122 " TRADE MARK SIGN "
       "16r009A"    16r0459 " CYRILLIC SMALL LETTER LJE "
       "16r009B"    16r203A " SINGLE RIGHT-POINTING ANGLE QUOTATION MARK "
       "16r009C"    16r045A " CYRILLIC SMALL LETTER NJE "
       "16r009D"    16r045C " CYRILLIC SMALL LETTER KJE "
       "16r009E"    16r045B " CYRILLIC SMALL LETTER TSHE (Serbocroatian) "
       "16r009F"    16r045F " CYRILLIC SMALL LETTER DZHE "
       "16r00A0"    16r00A0 " NO-BREAK SPACE "
       "16r00A1"    16r040E " CYRILLIC CAPITAL LETTER SHORT U (Byelorussian) "
       "16r00A2"    16r045E " CYRILLIC SMALL LETTER SHORT U (Byelorussian) "
       "16r00A3"    16r0408 " CYRILLIC CAPITAL LETTER JE "
       "16r00A4"    16r00A4 " CURRENCY SIGN "
       "16r00A5"    16r0490 " CYRILLIC CAPITAL LETTER GHE WITH UPTURN "
       "16r00A6"    16r00A6 " BROKEN BAR "
       "16r00A7"    16r00A7 " SECTION SIGN "
       "16r00A8"    16r0401 " CYRILLIC CAPITAL LETTER IO "
       "16r00A9"    16r00A9 " COPYRIGHT SIGN "
       "16r00AA"    16r0404 " CYRILLIC CAPITAL LETTER UKRAINIAN IE "
       "16r00AB"    16r00AB " LEFT-POINTING DOUBLE ANGLE QUOTATION MARK "
       "16r00AC"    16r00AC " NOT SIGN "
       "16r00AD"    16r00AD " SOFT HYPHEN "
       "16r00AE"    16r00AE " REGISTERED SIGN "
       "16r00AF"    16r0407 " CYRILLIC CAPITAL LETTER YI (Ukrainian) "
       "16r00B0"    16r00B0 " DEGREE SIGN "
       "16r00B1"    16r00B1 " PLUS-MINUS SIGN "
       "16r00B2"    16r0406 " CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I "
       "16r00B3"    16r0456 " CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I "
       "16r00B4"    16r0491 " CYRILLIC SMALL LETTER GHE WITH UPTURN "
       "16r00B5"    16r00B5 " MICRO SIGN "
       "16r00B6"    16r00B6 " PILCROW SIGN "
       "16r00B7"    16r00B7 " MIDDLE DOT "
       "16r00B8"    16r0451 " CYRILLIC SMALL LETTER IO "
       "16r00B9"    16r2116 " NUMERO SIGN "
       "16r00BA"    16r0454 " CYRILLIC SMALL LETTER UKRAINIAN IE "
       "16r00BB"    16r00BB " RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK "
       "16r00BC"    16r0458 " CYRILLIC SMALL LETTER JE "
       "16r00BD"    16r0405 " CYRILLIC CAPITAL LETTER DZE "
       "16r00BE"    16r0455 " CYRILLIC SMALL LETTER DZE "
       "16r00BF"    16r0457 " CYRILLIC SMALL LETTER YI (Ukrainian) "
       "16r00C0"    16r0410 " CYRILLIC CAPITAL LETTER A "
       "16r00C1"    16r0411 " CYRILLIC CAPITAL LETTER BE "
       "16r00C2"    16r0412 " CYRILLIC CAPITAL LETTER VE "
       "16r00C3"    16r0413 " CYRILLIC CAPITAL LETTER GHE "
       "16r00C4"    16r0414 " CYRILLIC CAPITAL LETTER DE "
       "16r00C5"    16r0415 " CYRILLIC CAPITAL LETTER IE "
       "16r00C6"    16r0416 " CYRILLIC CAPITAL LETTER ZHE "
       "16r00C7"    16r0417 " CYRILLIC CAPITAL LETTER ZE "
       "16r00C8"    16r0418 " CYRILLIC CAPITAL LETTER I "
       "16r00C9"    16r0419 " CYRILLIC CAPITAL LETTER SHORT I "
       "16r00CA"    16r041A " CYRILLIC CAPITAL LETTER KA "
       "16r00CB"    16r041B " CYRILLIC CAPITAL LETTER EL "
       "16r00CC"    16r041C " CYRILLIC CAPITAL LETTER EM "
       "16r00CD"    16r041D " CYRILLIC CAPITAL LETTER EN "
       "16r00CE"    16r041E " CYRILLIC CAPITAL LETTER O "
       "16r00CF"    16r041F " CYRILLIC CAPITAL LETTER PE "
       "16r00D0"    16r0420 " CYRILLIC CAPITAL LETTER ER "
       "16r00D1"    16r0421 " CYRILLIC CAPITAL LETTER ES "
       "16r00D2"    16r0422 " CYRILLIC CAPITAL LETTER TE "
       "16r00D3"    16r0423 " CYRILLIC CAPITAL LETTER U "
       "16r00D4"    16r0424 " CYRILLIC CAPITAL LETTER EF "
       "16r00D5"    16r0425 " CYRILLIC CAPITAL LETTER HA "
       "16r00D6"    16r0426 " CYRILLIC CAPITAL LETTER TSE "
       "16r00D7"    16r0427 " CYRILLIC CAPITAL LETTER CHE "
       "16r00D8"    16r0428 " CYRILLIC CAPITAL LETTER SHA "
       "16r00D9"    16r0429 " CYRILLIC CAPITAL LETTER SHCHA "
       "16r00DA"    16r042A " CYRILLIC CAPITAL LETTER HARD SIGN "
       "16r00DB"    16r042B " CYRILLIC CAPITAL LETTER YERU "
       "16r00DC"    16r042C " CYRILLIC CAPITAL LETTER SOFT SIGN "
       "16r00DD"    16r042D " CYRILLIC CAPITAL LETTER E "
       "16r00DE"    16r042E " CYRILLIC CAPITAL LETTER YU "
       "16r00DF"    16r042F " CYRILLIC CAPITAL LETTER YA "
       "16r00E0"    16r0430 " CYRILLIC SMALL LETTER A "
       "16r00E1"    16r0431 " CYRILLIC SMALL LETTER BE "
       "16r00E2"    16r0432 " CYRILLIC SMALL LETTER VE "
       "16r00E3"    16r0433 " CYRILLIC SMALL LETTER GHE "
       "16r00E4"    16r0434 " CYRILLIC SMALL LETTER DE "
       "16r00E5"    16r0435 " CYRILLIC SMALL LETTER IE "
       "16r00E6"    16r0436 " CYRILLIC SMALL LETTER ZHE "
       "16r00E7"    16r0437 " CYRILLIC SMALL LETTER ZE "
       "16r00E8"    16r0438 " CYRILLIC SMALL LETTER I "
       "16r00E9"    16r0439 " CYRILLIC SMALL LETTER SHORT I "
       "16r00EA"    16r043A " CYRILLIC SMALL LETTER KA "
       "16r00EB"    16r043B " CYRILLIC SMALL LETTER EL "
       "16r00EC"    16r043C " CYRILLIC SMALL LETTER EM "
       "16r00ED"    16r043D " CYRILLIC SMALL LETTER EN "
       "16r00EE"    16r043E " CYRILLIC SMALL LETTER O "
       "16r00EF"    16r043F " CYRILLIC SMALL LETTER PE "
       "16r00F0"    16r0440 " CYRILLIC SMALL LETTER ER "
       "16r00F1"    16r0441 " CYRILLIC SMALL LETTER ES "
       "16r00F2"    16r0442 " CYRILLIC SMALL LETTER TE "
       "16r00F3"    16r0443 " CYRILLIC SMALL LETTER U "
       "16r00F4"    16r0444 " CYRILLIC SMALL LETTER EF "
       "16r00F5"    16r0445 " CYRILLIC SMALL LETTER HA "
       "16r00F6"    16r0446 " CYRILLIC SMALL LETTER TSE "
       "16r00F7"    16r0447 " CYRILLIC SMALL LETTER CHE "
       "16r00F8"    16r0448 " CYRILLIC SMALL LETTER SHA "
       "16r00F9"    16r0449 " CYRILLIC SMALL LETTER SHCHA "
       "16r00FA"    16r044A " CYRILLIC SMALL LETTER HARD SIGN "
       "16r00FB"    16r044B " CYRILLIC SMALL LETTER YERU "
       "16r00FC"    16r044C " CYRILLIC SMALL LETTER SOFT SIGN "
       "16r00FD"    16r044D " CYRILLIC SMALL LETTER E "
       "16r00FE"    16r044E " CYRILLIC SMALL LETTER YU "
       "16r00FF"    16r044F " CYRILLIC SMALL LETTER YA "
       ) at:(byte - 16r7F).

    codePoint == 0 ifTrue:[ ^ self decodingError ].
    ^ codePoint
|
|
482 |
!
|
|
483 |
|
|
484 |
encode:unicodeArg
    "Originally generated by generateCode; the NUMERO SIGN branch was
     corrected by hand (see below).
     Encode from unicode into my encoding.

     Answers the CP1251 byte value (0..16rFF) for the unicode code point
     unicodeArg. Code points up to 16r7F are answered unchanged. Everything
     else is looked up range by range in literal byte tables, in which a 0
     entry marks a code point that has no CP1251 representation.
     Unrepresentable code points are answered via #encodingError.

     Fix: 16r2116 (NUMERO SIGN) used to be answered as 16r2116 itself,
     which is not a byte value; decode: maps 16rB9 to 16r2116, so the
     inverse mapping must answer 16rB9.
     NOTE(review): re-running generateCode may reintroduce the old branch
     unless the generator handles a single non-identity mapping correctly
     - confirm."

    |unicode "{ Class: SmallInteger }"|

    unicode := unicodeArg.
    unicode <= 16r7F ifTrue:[ ^ unicode ].
    unicode > 16r2122 ifTrue:[
        ^ self encodingError.
    ].
    "16r80..16r9F have no representation"
    unicode <= 16r9F ifTrue:[
        ^ self encodingError
    ].
    unicode <= 16r491 ifTrue:[
        unicode <= 16rBB ifTrue:[
            [
                |t|
                "table index 1 corresponds to code point 16rA0"
                t := #[
                   "16r00A0"    16rA0 " NO-BREAK SPACE "
                   "16r00A1"    16r00 " invalid "
                   "16r00A2"    16r00 " invalid "
                   "16r00A3"    16r00 " invalid "
                   "16r00A4"    16rA4 " CURRENCY SIGN "
                   "16r00A5"    16r00 " invalid "
                   "16r00A6"    16rA6 " BROKEN BAR "
                   "16r00A7"    16rA7 " SECTION SIGN "
                   "16r00A8"    16r00 " invalid "
                   "16r00A9"    16rA9 " COPYRIGHT SIGN "
                   "16r00AA"    16r00 " invalid "
                   "16r00AB"    16rAB " LEFT-POINTING DOUBLE ANGLE QUOTATION MARK "
                   "16r00AC"    16rAC " NOT SIGN "
                   "16r00AD"    16rAD " SOFT HYPHEN "
                   "16r00AE"    16rAE " REGISTERED SIGN "
                   "16r00AF"    16r00 " invalid "
                   "16r00B0"    16rB0 " DEGREE SIGN "
                   "16r00B1"    16rB1 " PLUS-MINUS SIGN "
                   "16r00B2"    16r00 " invalid "
                   "16r00B3"    16r00 " invalid "
                   "16r00B4"    16r00 " invalid "
                   "16r00B5"    16rB5 " MICRO SIGN "
                   "16r00B6"    16rB6 " PILCROW SIGN "
                   "16r00B7"    16rB7 " MIDDLE DOT "
                   "16r00B8"    16r00 " invalid "
                   "16r00B9"    16r00 " invalid "
                   "16r00BA"    16r00 " invalid "
                   "16r00BB"    16rBB " RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK "
                   ] at:(unicode - 16r9F).
                t == 0 ifFalse:[^ t].
                ^ self encodingError
            ] value.
        ].
        "16rBC..16r400 have no representation"
        unicode <= 16r400 ifTrue:[
            ^ self encodingError
        ].
        unicode <= 16r45F ifTrue:[
            [
                |t|
                "table index 1 corresponds to code point 16r401"
                t := #[
                   "16r0401"    16rA8 " CYRILLIC CAPITAL LETTER IO "
                   "16r0402"    16r80 " CYRILLIC CAPITAL LETTER DJE (Serbocroatian) "
                   "16r0403"    16r81 " CYRILLIC CAPITAL LETTER GJE "
                   "16r0404"    16rAA " CYRILLIC CAPITAL LETTER UKRAINIAN IE "
                   "16r0405"    16rBD " CYRILLIC CAPITAL LETTER DZE "
                   "16r0406"    16rB2 " CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I "
                   "16r0407"    16rAF " CYRILLIC CAPITAL LETTER YI (Ukrainian) "
                   "16r0408"    16rA3 " CYRILLIC CAPITAL LETTER JE "
                   "16r0409"    16r8A " CYRILLIC CAPITAL LETTER LJE "
                   "16r040A"    16r8C " CYRILLIC CAPITAL LETTER NJE "
                   "16r040B"    16r8E " CYRILLIC CAPITAL LETTER TSHE (Serbocroatian) "
                   "16r040C"    16r8D " CYRILLIC CAPITAL LETTER KJE "
                   "16r040D"    16r00 " invalid "
                   "16r040E"    16rA1 " CYRILLIC CAPITAL LETTER SHORT U (Byelorussian) "
                   "16r040F"    16r8F " CYRILLIC CAPITAL LETTER DZHE "
                   "16r0410"    16rC0 " CYRILLIC CAPITAL LETTER A "
                   "16r0411"    16rC1 " CYRILLIC CAPITAL LETTER BE "
                   "16r0412"    16rC2 " CYRILLIC CAPITAL LETTER VE "
                   "16r0413"    16rC3 " CYRILLIC CAPITAL LETTER GHE "
                   "16r0414"    16rC4 " CYRILLIC CAPITAL LETTER DE "
                   "16r0415"    16rC5 " CYRILLIC CAPITAL LETTER IE "
                   "16r0416"    16rC6 " CYRILLIC CAPITAL LETTER ZHE "
                   "16r0417"    16rC7 " CYRILLIC CAPITAL LETTER ZE "
                   "16r0418"    16rC8 " CYRILLIC CAPITAL LETTER I "
                   "16r0419"    16rC9 " CYRILLIC CAPITAL LETTER SHORT I "
                   "16r041A"    16rCA " CYRILLIC CAPITAL LETTER KA "
                   "16r041B"    16rCB " CYRILLIC CAPITAL LETTER EL "
                   "16r041C"    16rCC " CYRILLIC CAPITAL LETTER EM "
                   "16r041D"    16rCD " CYRILLIC CAPITAL LETTER EN "
                   "16r041E"    16rCE " CYRILLIC CAPITAL LETTER O "
                   "16r041F"    16rCF " CYRILLIC CAPITAL LETTER PE "
                   "16r0420"    16rD0 " CYRILLIC CAPITAL LETTER ER "
                   "16r0421"    16rD1 " CYRILLIC CAPITAL LETTER ES "
                   "16r0422"    16rD2 " CYRILLIC CAPITAL LETTER TE "
                   "16r0423"    16rD3 " CYRILLIC CAPITAL LETTER U "
                   "16r0424"    16rD4 " CYRILLIC CAPITAL LETTER EF "
                   "16r0425"    16rD5 " CYRILLIC CAPITAL LETTER HA "
                   "16r0426"    16rD6 " CYRILLIC CAPITAL LETTER TSE "
                   "16r0427"    16rD7 " CYRILLIC CAPITAL LETTER CHE "
                   "16r0428"    16rD8 " CYRILLIC CAPITAL LETTER SHA "
                   "16r0429"    16rD9 " CYRILLIC CAPITAL LETTER SHCHA "
                   "16r042A"    16rDA " CYRILLIC CAPITAL LETTER HARD SIGN "
                   "16r042B"    16rDB " CYRILLIC CAPITAL LETTER YERU "
                   "16r042C"    16rDC " CYRILLIC CAPITAL LETTER SOFT SIGN "
                   "16r042D"    16rDD " CYRILLIC CAPITAL LETTER E "
                   "16r042E"    16rDE " CYRILLIC CAPITAL LETTER YU "
                   "16r042F"    16rDF " CYRILLIC CAPITAL LETTER YA "
                   "16r0430"    16rE0 " CYRILLIC SMALL LETTER A "
                   "16r0431"    16rE1 " CYRILLIC SMALL LETTER BE "
                   "16r0432"    16rE2 " CYRILLIC SMALL LETTER VE "
                   "16r0433"    16rE3 " CYRILLIC SMALL LETTER GHE "
                   "16r0434"    16rE4 " CYRILLIC SMALL LETTER DE "
                   "16r0435"    16rE5 " CYRILLIC SMALL LETTER IE "
                   "16r0436"    16rE6 " CYRILLIC SMALL LETTER ZHE "
                   "16r0437"    16rE7 " CYRILLIC SMALL LETTER ZE "
                   "16r0438"    16rE8 " CYRILLIC SMALL LETTER I "
                   "16r0439"    16rE9 " CYRILLIC SMALL LETTER SHORT I "
                   "16r043A"    16rEA " CYRILLIC SMALL LETTER KA "
                   "16r043B"    16rEB " CYRILLIC SMALL LETTER EL "
                   "16r043C"    16rEC " CYRILLIC SMALL LETTER EM "
                   "16r043D"    16rED " CYRILLIC SMALL LETTER EN "
                   "16r043E"    16rEE " CYRILLIC SMALL LETTER O "
                   "16r043F"    16rEF " CYRILLIC SMALL LETTER PE "
                   "16r0440"    16rF0 " CYRILLIC SMALL LETTER ER "
                   "16r0441"    16rF1 " CYRILLIC SMALL LETTER ES "
                   "16r0442"    16rF2 " CYRILLIC SMALL LETTER TE "
                   "16r0443"    16rF3 " CYRILLIC SMALL LETTER U "
                   "16r0444"    16rF4 " CYRILLIC SMALL LETTER EF "
                   "16r0445"    16rF5 " CYRILLIC SMALL LETTER HA "
                   "16r0446"    16rF6 " CYRILLIC SMALL LETTER TSE "
                   "16r0447"    16rF7 " CYRILLIC SMALL LETTER CHE "
                   "16r0448"    16rF8 " CYRILLIC SMALL LETTER SHA "
                   "16r0449"    16rF9 " CYRILLIC SMALL LETTER SHCHA "
                   "16r044A"    16rFA " CYRILLIC SMALL LETTER HARD SIGN "
                   "16r044B"    16rFB " CYRILLIC SMALL LETTER YERU "
                   "16r044C"    16rFC " CYRILLIC SMALL LETTER SOFT SIGN "
                   "16r044D"    16rFD " CYRILLIC SMALL LETTER E "
                   "16r044E"    16rFE " CYRILLIC SMALL LETTER YU "
                   "16r044F"    16rFF " CYRILLIC SMALL LETTER YA "
                   "16r0450"    16r00 " invalid "
                   "16r0451"    16rB8 " CYRILLIC SMALL LETTER IO "
                   "16r0452"    16r90 " CYRILLIC SMALL LETTER DJE (Serbocroatian) "
                   "16r0453"    16r83 " CYRILLIC SMALL LETTER GJE "
                   "16r0454"    16rBA " CYRILLIC SMALL LETTER UKRAINIAN IE "
                   "16r0455"    16rBE " CYRILLIC SMALL LETTER DZE "
                   "16r0456"    16rB3 " CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I "
                   "16r0457"    16rBF " CYRILLIC SMALL LETTER YI (Ukrainian) "
                   "16r0458"    16rBC " CYRILLIC SMALL LETTER JE "
                   "16r0459"    16r9A " CYRILLIC SMALL LETTER LJE "
                   "16r045A"    16r9C " CYRILLIC SMALL LETTER NJE "
                   "16r045B"    16r9E " CYRILLIC SMALL LETTER TSHE (Serbocroatian) "
                   "16r045C"    16r9D " CYRILLIC SMALL LETTER KJE "
                   "16r045D"    16r00 " invalid "
                   "16r045E"    16rA2 " CYRILLIC SMALL LETTER SHORT U (Byelorussian) "
                   "16r045F"    16r9F " CYRILLIC SMALL LETTER DZHE "
                   ] at:(unicode - 16r400).
                t == 0 ifFalse:[^ t].
                ^ self encodingError
            ] value.
        ].
        "16r460..16r48F have no representation"
        unicode <= 16r48F ifTrue:[
            ^ self encodingError
        ].
        "only 16r490 and 16r491 remain in this range"
        ^ #[
           "16r0490"    16rA5 " CYRILLIC CAPITAL LETTER GHE WITH UPTURN "
           "16r0491"    16rB4 " CYRILLIC SMALL LETTER GHE WITH UPTURN "
           ] at:(unicode - 16r48F).
    ].
    "16r492..16r2012 have no representation"
    unicode <= 16r2012 ifTrue:[
        ^ self encodingError
    ].
    unicode <= 16r203A ifTrue:[
        [
            |t|
            "table index 1 corresponds to code point 16r2013"
            t := #[
               "16r2013"    16r96 " EN DASH "
               "16r2014"    16r97 " EM DASH "
               "16r2015"    16r00 " invalid "
               "16r2016"    16r00 " invalid "
               "16r2017"    16r00 " invalid "
               "16r2018"    16r91 " LEFT SINGLE QUOTATION MARK "
               "16r2019"    16r92 " RIGHT SINGLE QUOTATION MARK "
               "16r201A"    16r82 " SINGLE LOW-9 QUOTATION MARK "
               "16r201B"    16r00 " invalid "
               "16r201C"    16r93 " LEFT DOUBLE QUOTATION MARK "
               "16r201D"    16r94 " RIGHT DOUBLE QUOTATION MARK "
               "16r201E"    16r84 " DOUBLE LOW-9 QUOTATION MARK "
               "16r201F"    16r00 " invalid "
               "16r2020"    16r86 " DAGGER "
               "16r2021"    16r87 " DOUBLE DAGGER "
               "16r2022"    16r95 " BULLET "
               "16r2023"    16r00 " invalid "
               "16r2024"    16r00 " invalid "
               "16r2025"    16r00 " invalid "
               "16r2026"    16r85 " HORIZONTAL ELLIPSIS "
               "16r2027"    16r00 " invalid "
               "16r2028"    16r00 " invalid "
               "16r2029"    16r00 " invalid "
               "16r202A"    16r00 " invalid "
               "16r202B"    16r00 " invalid "
               "16r202C"    16r00 " invalid "
               "16r202D"    16r00 " invalid "
               "16r202E"    16r00 " invalid "
               "16r202F"    16r00 " invalid "
               "16r2030"    16r89 " PER MILLE SIGN "
               "16r2031"    16r00 " invalid "
               "16r2032"    16r00 " invalid "
               "16r2033"    16r00 " invalid "
               "16r2034"    16r00 " invalid "
               "16r2035"    16r00 " invalid "
               "16r2036"    16r00 " invalid "
               "16r2037"    16r00 " invalid "
               "16r2038"    16r00 " invalid "
               "16r2039"    16r8B " SINGLE LEFT-POINTING ANGLE QUOTATION MARK "
               "16r203A"    16r9B " SINGLE RIGHT-POINTING ANGLE QUOTATION MARK "
               ] at:(unicode - 16r2012).
            t == 0 ifFalse:[^ t].
            ^ self encodingError
        ] value.
    ].
    "16r203B..16r2115 have no representation"
    unicode <= 16r2115 ifTrue:[
        ^ self encodingError
    ].
    "inverse of decode: 16rB9 -> 16r2116; must answer the byte, not the code point"
    unicode == 16r2116 ifTrue:[
        ^ "16r2116" 16r00B9 " NUMERO SIGN "
    ].
    "16r2117..16r2121 have no representation"
    unicode <= 16r2121 ifTrue:[
        ^ self encodingError
    ].
    "only 16r2122 is left at this point"
    ^ "16r2122" 16r0099 " TRADE MARK SIGN "
|
|
716 |
! !
|
|
717 |
|
8081
|
718 |
!MS_Cyrillic class methodsFor:'documentation'!
|
|
719 |
|
|
720 |
version
"Answer the CVS header keyword string recorded for this source file
 (file path, revision number, check-in date and author)."
|
8813
|
721 |
^ '$Header: /cvs/stx/stx/libbasic/CharacterEncoderImplementations__MS_Cyrillic.st,v 1.4 2005-03-31 18:48:53 cg Exp $'
|
8081
|
722 |
! !
|