CharacterEncoderImplementations__MS_CP1252.st
author Claus Gittinger <cg@exept.de>
Tue, 09 Jul 2019 20:55:17 +0200
changeset 24417 03b083548da2
parent 23334 cb5a5878342b
permissions -rw-r--r--
#REFACTORING by exept class: Smalltalk class changed: #recursiveInstallAutoloadedClassesFrom:rememberIn:maxLevels:noAutoload:packageTop:showSplashInLevels: Transcript showCR:(... bindWith:...) -> Transcript showCR:... with:...
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
22586
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
     1
"{ Encoding: utf8 }"
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
     2
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
     3
"
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
     4
 COPYRIGHT (c) 2004 by eXept Software AG
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
     5
              All Rights Reserved
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
     6
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
     7
 This software is furnished under a license and may be used
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
     8
 only in accordance with the terms of that license and with the
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
     9
 inclusion of the above copyright notice.   This software may not
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    10
 be provided or otherwise made available to, or used by, any
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    11
 other person.  No title to or ownership of the software is
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    12
 hereby transferred.
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    13
"
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    14
"{ Package: 'stx:libbasic' }"
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    15
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    16
"{ NameSpace: CharacterEncoderImplementations }"
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    17
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    18
SingleByteEncoder subclass:#MS_CP1252
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    19
	instanceVariableNames:''
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    20
	classVariableNames:''
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    21
	poolDictionaries:''
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    22
	category:'Collections-Text-Encodings'
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    23
!
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    24
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    25
!MS_CP1252 class methodsFor:'documentation'!
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    26
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    27
copyright
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    28
"
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    29
 COPYRIGHT (c) 2004 by eXept Software AG
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    30
              All Rights Reserved
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    31
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    32
 This software is furnished under a license and may be used
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    33
 only in accordance with the terms of that license and with the
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    34
 inclusion of the above copyright notice.   This software may not
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    35
 be provided or otherwise made available to, or used by, any
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    36
 other person.  No title to or ownership of the software is
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    37
 hereby transferred.
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    38
"
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    39
!
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    40
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    41
documentation
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    42
"
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    43
    Microsoft CP1252 is based on iso8859-1. 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    44
    Codepoints 0x80–0x9F which are control characters
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    45
    in iso8859 are mapped to special windows characters.
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    46
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    47
    This is similar to MS_ANSI,
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    48
    but will always return single byte chars
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    49
    (in contrast to MS_ANSI)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    50
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    51
    [see with:]
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    52
        CharacterEncoderImplementations::MS_Ansi showCharacterSet
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    53
        CharacterEncoderImplementations::MS_CP1252 showCharacterSet
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    54
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    55
    [author:]
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    56
        Claus Gittinger
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    57
"
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    58
! !
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    59
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    60
!MS_CP1252 class methodsFor:'mapping'!
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    61
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    62
mapFileURL2_relativePathName
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    63
    ^ 'CP1252'
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    64
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    65
    "
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    66
     self generateCode
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    67
    "
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    68
!
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    69
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    70
mapping
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    71
"
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    72
# From: http://std.dkuug.dk/i18n/charmaps/CP1252
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    73
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    74
<code_set_name> CP1252
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    75
<comment_char> %
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    76
<escape_char> /
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    77
% version: 1.0
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    78
% repertoiremap: mnemonic,ds
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    79
%  source: UNICODE 1.0
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    80
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    81
% alias MS-ANSI
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    82
CHARMAP
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    83
<NU>                   /x00   <U0000> NULL (NUL)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    84
<SH>                   /x01   <U0001> START OF HEADING (SOH)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    85
<SX>                   /x02   <U0002> START OF TEXT (STX)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    86
<EX>                   /x03   <U0003> END OF TEXT (ETX)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    87
<ET>                   /x04   <U0004> END OF TRANSMISSION (EOT)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    88
<EQ>                   /x05   <U0005> ENQUIRY (ENQ)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    89
<AK>                   /x06   <U0006> ACKNOWLEDGE (ACK)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    90
<BL>                   /x07   <U0007> BELL (BEL)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    91
<BS>                   /x08   <U0008> BACKSPACE (BS)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    92
<HT>                   /x09   <U0009> CHARACTER TABULATION (HT)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    93
<LF>                   /x0A   <U000A> LINE FEED (LF)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    94
<VT>                   /x0B   <U000B> LINE TABULATION (VT)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    95
<FF>                   /x0C   <U000C> FORM FEED (FF)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    96
<CR>                   /x0D   <U000D> CARRIAGE RETURN (CR)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    97
<SO>                   /x0E   <U000E> SHIFT OUT (SO)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    98
<SI>                   /x0F   <U000F> SHIFT IN (SI)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    99
<DL>                   /x10   <U0010> DATALINK ESCAPE (DLE)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   100
<D1>                   /x11   <U0011> DEVICE CONTROL ONE (DC1)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   101
<D2>                   /x12   <U0012> DEVICE CONTROL TWO (DC2)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   102
<D3>                   /x13   <U0013> DEVICE CONTROL THREE (DC3)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   103
<D4>                   /x14   <U0014> DEVICE CONTROL FOUR (DC4)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   104
<NK>                   /x15   <U0015> NEGATIVE ACKNOWLEDGE (NAK)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   105
<SY>                   /x16   <U0016> SYNCHRONOUS IDLE (SYN)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   106
<EB>                   /x17   <U0017> END OF TRANSMISSION BLOCK (ETB)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   107
<CN>                   /x18   <U0018> CANCEL (CAN)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   108
<EM>                   /x19   <U0019> END OF MEDIUM (EM)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   109
<SB>                   /x1A   <U001A> SUBSTITUTE (SUB)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   110
<EC>                   /x1B   <U001B> ESCAPE (ESC)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   111
<FS>                   /x1C   <U001C> FILE SEPARATOR (IS4)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   112
<GS>                   /x1D   <U001D> GROUP SEPARATOR (IS3)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   113
<RS>                   /x1E   <U001E> RECORD SEPARATOR (IS2)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   114
<US>                   /x1F   <U001F> UNIT SEPARATOR (IS1)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   115
<SP>                   /x20   <U0020> SPACE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   116
<!!>                    /x21   <U0021> EXCLAMATION MARK
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   117
<'>                    /x22   <U0022> QUOTATION MARK
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   118
<Nb>                   /x23   <U0023> NUMBER SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   119
<DO>                   /x24   <U0024> DOLLAR SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   120
<%>                    /x25   <U0025> PERCENT SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   121
<&>                    /x26   <U0026> AMPERSAND
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   122
<'>                    /x27   <U0027> APOSTROPHE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   123
<(>                    /x28   <U0028> LEFT PARENTHESIS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   124
<)>                    /x29   <U0029> RIGHT PARENTHESIS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   125
<*>                    /x2A   <U002A> ASTERISK
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   126
<+>                    /x2B   <U002B> PLUS SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   127
<,>                    /x2C   <U002C> COMMA
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   128
<->                    /x2D   <U002D> HYPHEN-MINUS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   129
<.>                    /x2E   <U002E> FULL STOP
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   130
<//>                   /x2F   <U002F> SOLIDUS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   131
<0>                    /x30   <U0030> DIGIT ZERO
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   132
<1>                    /x31   <U0031> DIGIT ONE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   133
<2>                    /x32   <U0032> DIGIT TWO
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   134
<3>                    /x33   <U0033> DIGIT THREE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   135
<4>                    /x34   <U0034> DIGIT FOUR
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   136
<5>                    /x35   <U0035> DIGIT FIVE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   137
<6>                    /x36   <U0036> DIGIT SIX
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   138
<7>                    /x37   <U0037> DIGIT SEVEN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   139
<8>                    /x38   <U0038> DIGIT EIGHT
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   140
<9>                    /x39   <U0039> DIGIT NINE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   141
<:>                    /x3A   <U003A> COLON
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   142
<;>                    /x3B   <U003B> SEMICOLON
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   143
<<>                    /x3C   <U003C> LESS-THAN SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   144
<=>                    /x3D   <U003D> EQUALS SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   145
</>>                   /x3E   <U003E> GREATER-THAN SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   146
<?>                    /x3F   <U003F> QUESTION MARK
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   147
<At>                   /x40   <U0040> COMMERCIAL AT
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   148
<A>                    /x41   <U0041> LATIN CAPITAL LETTER A
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   149
<B>                    /x42   <U0042> LATIN CAPITAL LETTER B
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   150
<C>                    /x43   <U0043> LATIN CAPITAL LETTER C
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   151
<D>                    /x44   <U0044> LATIN CAPITAL LETTER D
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   152
<E>                    /x45   <U0045> LATIN CAPITAL LETTER E
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   153
<F>                    /x46   <U0046> LATIN CAPITAL LETTER F
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   154
<G>                    /x47   <U0047> LATIN CAPITAL LETTER G
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   155
<H>                    /x48   <U0048> LATIN CAPITAL LETTER H
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   156
<I>                    /x49   <U0049> LATIN CAPITAL LETTER I
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   157
<J>                    /x4A   <U004A> LATIN CAPITAL LETTER J
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   158
<K>                    /x4B   <U004B> LATIN CAPITAL LETTER K
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   159
<L>                    /x4C   <U004C> LATIN CAPITAL LETTER L
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   160
<M>                    /x4D   <U004D> LATIN CAPITAL LETTER M
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   161
<N>                    /x4E   <U004E> LATIN CAPITAL LETTER N
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   162
<O>                    /x4F   <U004F> LATIN CAPITAL LETTER O
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   163
<P>                    /x50   <U0050> LATIN CAPITAL LETTER P
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   164
<Q>                    /x51   <U0051> LATIN CAPITAL LETTER Q
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   165
<R>                    /x52   <U0052> LATIN CAPITAL LETTER R
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   166
<S>                    /x53   <U0053> LATIN CAPITAL LETTER S
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   167
<T>                    /x54   <U0054> LATIN CAPITAL LETTER T
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   168
<U>                    /x55   <U0055> LATIN CAPITAL LETTER U
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   169
<V>                    /x56   <U0056> LATIN CAPITAL LETTER V
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   170
<W>                    /x57   <U0057> LATIN CAPITAL LETTER W
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   171
<X>                    /x58   <U0058> LATIN CAPITAL LETTER X
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   172
<Y>                    /x59   <U0059> LATIN CAPITAL LETTER Y
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   173
<Z>                    /x5A   <U005A> LATIN CAPITAL LETTER Z
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   174
<<(>                   /x5B   <U005B> LEFT SQUARE BRACKET
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   175
<////>                 /x5C   <U005C> REVERSE SOLIDUS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   176
<)/>>                  /x5D   <U005D> RIGHT SQUARE BRACKET
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   177
<'/>>                  /x5E   <U005E> CIRCUMFLEX ACCENT
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   178
<_>                    /x5F   <U005F> LOW LINE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   179
<'!!>                   /x60   <U0060> GRAVE ACCENT
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   180
<a>                    /x61   <U0061> LATIN SMALL LETTER A
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   181
<b>                    /x62   <U0062> LATIN SMALL LETTER B
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   182
<c>                    /x63   <U0063> LATIN SMALL LETTER C
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   183
<d>                    /x64   <U0064> LATIN SMALL LETTER D
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   184
<e>                    /x65   <U0065> LATIN SMALL LETTER E
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   185
<f>                    /x66   <U0066> LATIN SMALL LETTER F
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   186
<g>                    /x67   <U0067> LATIN SMALL LETTER G
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   187
<h>                    /x68   <U0068> LATIN SMALL LETTER H
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   188
<i>                    /x69   <U0069> LATIN SMALL LETTER I
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   189
<j>                    /x6A   <U006A> LATIN SMALL LETTER J
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   190
<k>                    /x6B   <U006B> LATIN SMALL LETTER K
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   191
<l>                    /x6C   <U006C> LATIN SMALL LETTER L
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   192
<m>                    /x6D   <U006D> LATIN SMALL LETTER M
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   193
<n>                    /x6E   <U006E> LATIN SMALL LETTER N
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   194
<o>                    /x6F   <U006F> LATIN SMALL LETTER O
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   195
<p>                    /x70   <U0070> LATIN SMALL LETTER P
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   196
<q>                    /x71   <U0071> LATIN SMALL LETTER Q
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   197
<r>                    /x72   <U0072> LATIN SMALL LETTER R
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   198
<s>                    /x73   <U0073> LATIN SMALL LETTER S
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   199
<t>                    /x74   <U0074> LATIN SMALL LETTER T
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   200
<u>                    /x75   <U0075> LATIN SMALL LETTER U
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   201
<v>                    /x76   <U0076> LATIN SMALL LETTER V
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   202
<w>                    /x77   <U0077> LATIN SMALL LETTER W
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   203
<x>                    /x78   <U0078> LATIN SMALL LETTER X
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   204
<y>                    /x79   <U0079> LATIN SMALL LETTER Y
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   205
<z>                    /x7A   <U007A> LATIN SMALL LETTER Z
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   206
<(!!>                   /x7B   <U007B> LEFT CURLY BRACKET
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   207
<!!!!>                   /x7C   <U007C> VERTICAL LINE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   208
<!!)>                   /x7D   <U007D> RIGHT CURLY BRACKET
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   209
<'?>                   /x7E   <U007E> TILDE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   210
<DT>                   /x7F   <U007F> DELETE (DEL)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   211
<.9>                   /x82   <U201A> SINGLE LOW-9 QUOTATION MARK
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   212
<f2>                   /x83   <U0192> LATIN SMALL LETTER F WITH HOOK
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   213
<:9>                   /x84   <U201E> DOUBLE LOW-9 QUOTATION MARK
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   214
<.3>                   /x85   <U2026> HORIZONTAL ELLIPSIS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   215
<//->                  /x86   <U2020> DAGGER
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   216
<//=>                  /x87   <U2021> DOUBLE DAGGER
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   217
<1/>>                  /x88   <U02C6> MODIFIER LETTER CIRCUMFLEX ACCENT
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   218
<%0>                   /x89   <U2030> PER MILLE SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   219
<S<>                   /x8A   <U0160> LATIN CAPITAL LETTER S WITH CARON
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   220
<<1>                   /x8B   <U2039> SINGLE LEFT-POINTING ANGLE QUOTATION MARK
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   221
<OE>                   /x8C   <U0152> LATIN CAPITAL LIGATURE OE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   222
<'6>                   /x91   <U2018> LEFT SINGLE QUOTATION MARK
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   223
<'9>                   /x92   <U2019> RIGHT SINGLE QUOTATION MARK
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   224
<'6>                   /x93   <U201C> LEFT DOUBLE QUOTATION MARK
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   225
<'9>                   /x94   <U201D> RIGHT DOUBLE QUOTATION MARK
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   226
<sb>                   /x95   <U2022> BULLET
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   227
<-N>                   /x96   <U2013> EN DASH
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   228
<-M>                   /x97   <U2014> EM DASH
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   229
<1?>                   /x98   <U02DC> SMALL TILDE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   230
<TM>                   /x99   <U2122> TRADE MARK SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   231
<s<>                   /x9A   <U0161> LATIN SMALL LETTER S WITH CARON
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   232
</>1>                  /x9B   <U203A> SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   233
<oe>                   /x9C   <U0153> LATIN SMALL LIGATURE OE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   234
<Y:>                   /x9F   <U0178> LATIN CAPITAL LETTER Y WITH DIAERESIS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   235
<NS>                   /xA0   <U00A0> NO-BREAK SPACE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   236
<!!I>                   /xA1   <U00A1> INVERTED EXCLAMATION MARK
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   237
<Ct>                   /xA2   <U00A2> CENT SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   238
<Pd>                   /xA3   <U00A3> POUND SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   239
<Cu>                   /xA4   <U00A4> CURRENCY SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   240
<Ye>                   /xA5   <U00A5> YEN SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   241
<BB>                   /xA6   <U00A6> BROKEN BAR
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   242
<SE>                   /xA7   <U00A7> SECTION SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   243
<':>                   /xA8   <U00A8> DIAERESIS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   244
<Co>                   /xA9   <U00A9> COPYRIGHT SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   245
<-a>                   /xAA   <U00AA> FEMININE ORDINAL INDICATOR
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   246
<<<>                   /xAB   <U00AB> LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   247
<NO>                   /xAC   <U00AC> NOT SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   248
<-->                   /xAD   <U00AD> SOFT HYPHEN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   249
<Rg>                   /xAE   <U00AE> REGISTERED SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   250
<'m>                   /xAF   <U00AF> MACRON
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   251
<DG>                   /xB0   <U00B0> DEGREE SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   252
<+->                   /xB1   <U00B1> PLUS-MINUS SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   253
<2S>                   /xB2   <U00B2> SUPERSCRIPT TWO
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   254
<3S>                   /xB3   <U00B3> SUPERSCRIPT THREE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   255
<''>                   /xB4   <U00B4> ACUTE ACCENT
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   256
<My>                   /xB5   <U00B5> MICRO SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   257
<PI>                   /xB6   <U00B6> PILCROW SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   258
<.M>                   /xB7   <U00B7> MIDDLE DOT
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   259
<',>                   /xB8   <U00B8> CEDILLA
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   260
<1S>                   /xB9   <U00B9> SUPERSCRIPT ONE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   261
<-o>                   /xBA   <U00BA> MASCULINE ORDINAL INDICATOR
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   262
</>/>>                 /xBB   <U00BB> RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   263
<14>                   /xBC   <U00BC> VULGAR FRACTION ONE QUARTER
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   264
<12>                   /xBD   <U00BD> VULGAR FRACTION ONE HALF
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   265
<34>                   /xBE   <U00BE> VULGAR FRACTION THREE QUARTERS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   266
<?I>                   /xBF   <U00BF> INVERTED QUESTION MARK
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   267
<A!!>                   /xC0   <U00C0> LATIN CAPITAL LETTER A WITH GRAVE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   268
<A'>                   /xC1   <U00C1> LATIN CAPITAL LETTER A WITH ACUTE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   269
<A/>>                  /xC2   <U00C2> LATIN CAPITAL LETTER A WITH CIRCUMFLEX
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   270
<A?>                   /xC3   <U00C3> LATIN CAPITAL LETTER A WITH TILDE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   271
<A:>                   /xC4   <U00C4> LATIN CAPITAL LETTER A WITH DIAERESIS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   272
<AA>                   /xC5   <U00C5> LATIN CAPITAL LETTER A WITH RING ABOVE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   273
<AE>                   /xC6   <U00C6> LATIN CAPITAL LETTER AE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   274
<C,>                   /xC7   <U00C7> LATIN CAPITAL LETTER C WITH CEDILLA
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   275
<E!!>                   /xC8   <U00C8> LATIN CAPITAL LETTER E WITH GRAVE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   276
<E'>                   /xC9   <U00C9> LATIN CAPITAL LETTER E WITH ACUTE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   277
<E/>>                  /xCA   <U00CA> LATIN CAPITAL LETTER E WITH CIRCUMFLEX
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   278
<E:>                   /xCB   <U00CB> LATIN CAPITAL LETTER E WITH DIAERESIS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   279
<I!!>                   /xCC   <U00CC> LATIN CAPITAL LETTER I WITH GRAVE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   280
<I'>                   /xCD   <U00CD> LATIN CAPITAL LETTER I WITH ACUTE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   281
<I/>>                  /xCE   <U00CE> LATIN CAPITAL LETTER I WITH CIRCUMFLEX
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   282
<I:>                   /xCF   <U00CF> LATIN CAPITAL LETTER I WITH DIAERESIS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   283
<D->                   /xD0   <U00D0> LATIN CAPITAL LETTER ETH (Icelandic)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   284
<N?>                   /xD1   <U00D1> LATIN CAPITAL LETTER N WITH TILDE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   285
<O!!>                   /xD2   <U00D2> LATIN CAPITAL LETTER O WITH GRAVE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   286
<O'>                   /xD3   <U00D3> LATIN CAPITAL LETTER O WITH ACUTE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   287
<O/>>                  /xD4   <U00D4> LATIN CAPITAL LETTER O WITH CIRCUMFLEX
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   288
<O?>                   /xD5   <U00D5> LATIN CAPITAL LETTER O WITH TILDE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   289
<O:>                   /xD6   <U00D6> LATIN CAPITAL LETTER O WITH DIAERESIS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   290
<*X>                   /xD7   <U00D7> MULTIPLICATION SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   291
<O//>                  /xD8   <U00D8> LATIN CAPITAL LETTER O WITH STROKE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   292
<U!!>                   /xD9   <U00D9> LATIN CAPITAL LETTER U WITH GRAVE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   293
<U'>                   /xDA   <U00DA> LATIN CAPITAL LETTER U WITH ACUTE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   294
<U/>>                  /xDB   <U00DB> LATIN CAPITAL LETTER U WITH CIRCUMFLEX
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   295
<U:>                   /xDC   <U00DC> LATIN CAPITAL LETTER U WITH DIAERESIS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   296
<Y'>                   /xDD   <U00DD> LATIN CAPITAL LETTER Y WITH ACUTE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   297
<TH>                   /xDE   <U00DE> LATIN CAPITAL LETTER THORN (Icelandic)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   298
<ss>                   /xDF   <U00DF> LATIN SMALL LETTER SHARP S (German)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   299
<a!!>                   /xE0   <U00E0> LATIN SMALL LETTER A WITH GRAVE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   300
<a'>                   /xE1   <U00E1> LATIN SMALL LETTER A WITH ACUTE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   301
<a/>>                  /xE2   <U00E2> LATIN SMALL LETTER A WITH CIRCUMFLEX
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   302
<a?>                   /xE3   <U00E3> LATIN SMALL LETTER A WITH TILDE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   303
<a:>                   /xE4   <U00E4> LATIN SMALL LETTER A WITH DIAERESIS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   304
<aa>                   /xE5   <U00E5> LATIN SMALL LETTER A WITH RING ABOVE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   305
<ae>                   /xE6   <U00E6> LATIN SMALL LETTER AE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   306
<c,>                   /xE7   <U00E7> LATIN SMALL LETTER C WITH CEDILLA
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   307
<e!!>                   /xE8   <U00E8> LATIN SMALL LETTER E WITH GRAVE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   308
<e'>                   /xE9   <U00E9> LATIN SMALL LETTER E WITH ACUTE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   309
<e/>>                  /xEA   <U00EA> LATIN SMALL LETTER E WITH CIRCUMFLEX
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   310
<e:>                   /xEB   <U00EB> LATIN SMALL LETTER E WITH DIAERESIS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   311
<i!!>                   /xEC   <U00EC> LATIN SMALL LETTER I WITH GRAVE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   312
<i'>                   /xED   <U00ED> LATIN SMALL LETTER I WITH ACUTE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   313
<i/>>                  /xEE   <U00EE> LATIN SMALL LETTER I WITH CIRCUMFLEX
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   314
<i:>                   /xEF   <U00EF> LATIN SMALL LETTER I WITH DIAERESIS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   315
<d->                   /xF0   <U00F0> LATIN SMALL LETTER ETH (Icelandic)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   316
<n?>                   /xF1   <U00F1> LATIN SMALL LETTER N WITH TILDE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   317
<o!!>                   /xF2   <U00F2> LATIN SMALL LETTER O WITH GRAVE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   318
<o'>                   /xF3   <U00F3> LATIN SMALL LETTER O WITH ACUTE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   319
<o/>>                  /xF4   <U00F4> LATIN SMALL LETTER O WITH CIRCUMFLEX
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   320
<o?>                   /xF5   <U00F5> LATIN SMALL LETTER O WITH TILDE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   321
<o:>                   /xF6   <U00F6> LATIN SMALL LETTER O WITH DIAERESIS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   322
<-:>                   /xF7   <U00F7> DIVISION SIGN
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   323
<o//>                  /xF8   <U00F8> LATIN SMALL LETTER O WITH STROKE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   324
<u!!>                   /xF9   <U00F9> LATIN SMALL LETTER U WITH GRAVE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   325
<u'>                   /xFA   <U00FA> LATIN SMALL LETTER U WITH ACUTE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   326
<u/>>                  /xFB   <U00FB> LATIN SMALL LETTER U WITH CIRCUMFLEX
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   327
<u:>                   /xFC   <U00FC> LATIN SMALL LETTER U WITH DIAERESIS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   328
<y'>                   /xFD   <U00FD> LATIN SMALL LETTER Y WITH ACUTE
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   329
<th>                   /xFE   <U00FE> LATIN SMALL LETTER THORN (Icelandic)
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   330
<y:>                   /xFF   <U00FF> LATIN SMALL LETTER Y WITH DIAERESIS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   331
END CHARMAP
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   332
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   333
"
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   334
! !
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   335
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   336
!MS_CP1252 class methodsFor:'queries'!
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   337
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   338
maxCode
22588
f52044b2de85 #FEATURE by cg
Claus Gittinger <cg@exept.de>
parents: 22586
diff changeset
   339
    ^ 255 
22586
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   340
!
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   341
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   342
minCode
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   343
    ^ 0 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   344
! !
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   345
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   346
!MS_CP1252 methodsFor:'encoding & decoding'!
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   347
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   348
decode:codeArg
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   349
    |code "{ Class: SmallInteger }" t|
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   350
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   351
    code := codeArg.
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   352
    code <= 16r7F ifTrue:[ ^ code ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   353
    code >= 16rA0 ifTrue:[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   354
        code > 16rFF ifTrue:[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   355
            ^ 16rFF.
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   356
        ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   357
        ^ codeArg.
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   358
    ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   359
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   360
    "similar to 8859-1 with different chars in the 8x..9x area"
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   361
    "we map CP1252 chars to unicode chars"
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   362
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   363
    t := #(
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   364
       "16r0080"    16r20AC " EURO character " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   365
       "16r0081"    16r0000 " invalid " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   366
       "16r0082"    16r201A " SINGLE LOW-9 QUOTATION MARK " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   367
       "16r0083"    16r0192 " LATIN SMALL LETTER F WITH HOOK " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   368
       "16r0084"    16r201E " DOUBLE LOW-9 QUOTATION MARK " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   369
       "16r0085"    16r2026 " HORIZONTAL ELLIPSIS " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   370
       "16r0086"    16r2020 " DAGGER " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   371
       "16r0087"    16r2021 " DOUBLE DAGGER " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   372
       "16r0088"    16r02C6 " MODIFIER LETTER CIRCUMFLEX ACCENT " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   373
       "16r0089"    16r2030 " PER MILLE SIGN " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   374
       "16r008A"    16r0160 " LATIN CAPITAL LETTER S WITH CARON " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   375
       "16r008B"    16r2039 " SINGLE LEFT-POINTING ANGLE QUOTATION MARK " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   376
       "16r008C"    16r0152 " LATIN CAPITAL LIGATURE OE " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   377
       "16r008D"    16r0000 " invalid " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   378
       "16r008E"    16r017D " LATIN CAPITAL Z WITH INVERSE CARON" 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   379
       "16r008F"    16r0000 " invalid " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   380
       "16r0090"    16r0000 " invalid " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   381
       "16r0091"    16r2018 " LEFT SINGLE QUOTATION MARK " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   382
       "16r0092"    16r2019 " RIGHT SINGLE QUOTATION MARK " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   383
       "16r0093"    16r201C " LEFT DOUBLE QUOTATION MARK " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   384
       "16r0094"    16r201D " RIGHT DOUBLE QUOTATION MARK " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   385
       "16r0095"    16r2022 " BULLET " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   386
       "16r0096"    16r2013 " EN DASH " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   387
       "16r0097"    16r2014 " EM DASH " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   388
       "16r0098"    16r02DC " SMALL TILDE " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   389
       "16r0099"    16r2122 " TRADE MARK SIGN " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   390
       "16r009A"    16r0161 " LATIN SMALL LETTER S WITH CARON " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   391
       "16r009B"    16r203A " SINGLE RIGHT-POINTING ANGLE QUOTATION MARK " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   392
       "16r009C"    16r0153 " LATIN SMALL LIGATURE OE " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   393
       "16r009D"    16r0000 " invalid " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   394
       "16r009E"    16r017E " LATIN SMALL LETTER Z WITH INVERSE CARON " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   395
       "16r009F"    16r0178 " LATIN CAPITAL LETTER Y WITH DIAERESIS " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   396
       ) at:(code - 16r7F).
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   397
    t == 0 ifFalse:[^ t].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   398
    ^ self decodingError.
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   399
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   400
    "Modified (format): / 12-07-2012 / 14:06:56 / cg"
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   401
!
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   402
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   403
decodeString:anEncodedStringOrByteCollection
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   404
    "given a string in my encoding, return a unicode-string for it"
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   405
23334
cb5a5878342b #BUGFIX by cg
Claus Gittinger <cg@exept.de>
parents: 22588
diff changeset
   406
    |outStream myCode code size "{ Class:SmallInteger }"|
22586
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   407
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   408
    size := anEncodedStringOrByteCollection size.
23334
cb5a5878342b #BUGFIX by cg
Claus Gittinger <cg@exept.de>
parents: 22588
diff changeset
   409
    outStream := CharacterWriteStream new:size.
22586
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   410
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   411
    1 to:size do:[:idx |
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   412
        code := (anEncodedStringOrByteCollection at:idx) codePoint.
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   413
        myCode := self decode:code.
23334
cb5a5878342b #BUGFIX by cg
Claus Gittinger <cg@exept.de>
parents: 22588
diff changeset
   414
        outStream nextPut:(Character codePoint:myCode).
22586
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   415
    ].
23334
cb5a5878342b #BUGFIX by cg
Claus Gittinger <cg@exept.de>
parents: 22588
diff changeset
   416
    ^ outStream contents
22586
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   417
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   418
    "
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   419
     CharacterEncoderImplementations::MS_CP1252 decodeString:'hello'
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   420
    "
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   421
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   422
    "Created: / 16-01-2018 / 19:54:02 / stefan"
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   423
    "Modified (format): / 17-01-2018 / 16:30:59 / stefan"
23334
cb5a5878342b #BUGFIX by cg
Claus Gittinger <cg@exept.de>
parents: 22588
diff changeset
   424
    "Modified: / 14-09-2018 / 14:24:18 / Claus Gittinger"
22586
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   425
!
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   426
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   427
encode:unicodeArg
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   428
    |unicode "{ Class: SmallInteger }" t
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   429
     replacementForInvalid|
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   430
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   431
    "we map unicode chars to CP1252 where a mapping exists.
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   432
     If no mapping exists, we encode it as 0xFF"
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   433
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   434
    replacementForInvalid := 16r7F.
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   435
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   436
    unicode := unicodeArg.
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   437
    unicode > 16r2122 ifTrue:[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   438
        ^ replacementForInvalid.
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   439
    ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   440
    unicode <= 16rFF ifTrue:[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   441
        ^ unicode
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   442
    ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   443
    unicode <= 16r2DC ifTrue:[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   444
        unicode <= 16r192 ifTrue:[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   445
            unicode <= 16r178 ifTrue:[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   446
                unicode <= 16r161 ifTrue:[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   447
                    t := #[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   448
                       "16r0152"    16r8C " LATIN CAPITAL LIGATURE OE " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   449
                       "16r0153"    16r9C " LATIN SMALL LIGATURE OE " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   450
                       "16r0154"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   451
                       "16r0155"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   452
                       "16r0156"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   453
                       "16r0157"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   454
                       "16r0158"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   455
                       "16r0159"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   456
                       "16r015A"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   457
                       "16r015B"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   458
                       "16r015C"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   459
                       "16r015D"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   460
                       "16r015E"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   461
                       "16r015F"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   462
                       "16r0160"    16r8A " LATIN CAPITAL LETTER S WITH CARON " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   463
                       "16r0161"    16r9A " LATIN SMALL LETTER S WITH CARON " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   464
                       ] at:(unicode - 16r151).
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   465
                    t == 0 ifFalse:[^ t].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   466
                    ^ unicode
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   467
                ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   468
                unicode <= 16r177 ifTrue:[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   469
                    ^ replacementForInvalid
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   470
                ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   471
                ^  "16r0178" 16r009F " LATIN CAPITAL LETTER Y WITH DIAERESIS " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   472
            ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   473
            unicode <= 16r191 ifTrue:[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   474
                ^ replacementForInvalid
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   475
            ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   476
            ^  "16r0192" 16r0083 " LATIN SMALL LETTER F WITH HOOK " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   477
        ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   478
        unicode <= 16r2C5 ifTrue:[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   479
            ^ replacementForInvalid
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   480
        ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   481
        unicode == 16r2C6 ifTrue:[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   482
            ^  "16r02C6" 16r0088 " MODIFIER LETTER CIRCUMFLEX ACCENT " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   483
        ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   484
        unicode <= 16r2DB ifTrue:[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   485
            ^ replacementForInvalid
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   486
        ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   487
        ^  "16r02DC" 16r0098 " SMALL TILDE " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   488
    ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   489
    unicode <= 16r2012 ifTrue:[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   490
        ^ replacementForInvalid
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   491
    ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   492
    unicode <= 16r203A ifTrue:[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   493
        t := #(
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   494
           "16r2013"    16r96"  EN DASH " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   495
           "16r2014"    16r97"  EM DASH " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   496
           "16r2015"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   497
           "16r2016"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   498
           "16r2017"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   499
           "16r2018"    16r91 " LEFT SINGLE QUOTATION MARK " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   500
           "16r2019"    16r92 " RIGHT SINGLE QUOTATION MARK " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   501
           "16r201A"    16r82 " SINGLE LOW-9 QUOTATION MARK " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   502
           "16r201B"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   503
           "16r201C"    16r93 " LEFT DOUBLE QUOTATION MARK " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   504
           "16r201D"    16r94 " RIGHT DOUBLE QUOTATION MARK " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   505
           "16r201E"    16r84 " DOUBLE LOW-9 QUOTATION MARK " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   506
           "16r201F"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   507
           "16r2020"    16r86 " DAGGER " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   508
           "16r2021"    16r87 " DOUBLE DAGGER " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   509
           "16r2022"    16r95 " BULLET " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   510
           "16r2023"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   511
           "16r2024"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   512
           "16r2025"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   513
           "16r2026"    16r85 " HORIZONTAL ELLIPSIS " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   514
           "16r2027"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   515
           "16r2028"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   516
           "16r2029"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   517
           "16r202A"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   518
           "16r202B"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   519
           "16r202C"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   520
           "16r202D"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   521
           "16r202E"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   522
           "16r202F"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   523
           "16r2030"    16r89 " PER MILLE SIGN " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   524
           "16r2031"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   525
           "16r2032"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   526
           "16r2033"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   527
           "16r2034"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   528
           "16r2035"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   529
           "16r2036"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   530
           "16r2037"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   531
           "16r2038"    16r00 " keep unicode " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   532
           "16r2039"    16r8B " SINGLE LEFT-POINTING ANGLE QUOTATION MARK " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   533
           "16r203A"    16r9B " SINGLE RIGHT-POINTING ANGLE QUOTATION MARK " 
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   534
           ) at:(unicode - 16r2012).
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   535
        t == 0 ifFalse:[^ t].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   536
        ^ replacementForInvalid
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   537
    ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   538
    unicode = 16r20AC ifTrue:[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   539
        ^ 16r0080 " EURO character "
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   540
    ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   541
    unicode <= 16r2121 ifTrue:[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   542
        ^ replacementForInvalid
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   543
    ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   544
    ^  "16r2122" 16r0099 " TRADE MARK SIGN "
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   545
!
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   546
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   547
encodeString:aStringOrUnicodeString
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   548
    "redefined to speedup simple 8 bit strings"
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   549
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   550
    |newString myCode bits size "{ Class:SmallInteger }"|
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   551
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   552
    "/ all between 0 and 7F ?
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   553
    (aStringOrUnicodeString containsNon7BitAscii) ifFalse:[
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   554
         ^ aStringOrUnicodeString asSingleByteString.
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   555
    ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   556
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   557
    size := aStringOrUnicodeString size.
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   558
    newString := String new:size.
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   559
    bits := newString bitsPerCharacter.
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   560
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   561
    1 to:size do:[:idx |
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   562
        myCode := self encode:((aStringOrUnicodeString at:idx) codePoint).
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   563
        newString at:idx put:(Character codePoint:myCode).
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   564
    ].
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   565
    ^ newString
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   566
! !
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   567
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   568
!MS_CP1252 class methodsFor:'documentation'!
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   569
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   570
version
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   571
    ^ '$Header$'
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   572
!
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   573
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   574
version_CVS
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   575
    ^ '$Header$'
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   576
! !
41099578373e initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   577