CharacterEncoderImplementations__TwoByteEncoder.st
author Claus Gittinger <cg@exept.de>
Tue, 09 Jul 2019 20:55:17 +0200
changeset 24417 03b083548da2
parent 22479 833b8c85dbda
permissions -rw-r--r--
#REFACTORING by exept class: Smalltalk class changed: #recursiveInstallAutoloadedClassesFrom:rememberIn:maxLevels:noAutoload:packageTop:showSplashInLevels: Transcript showCR:(... bindWith:...) -> Transcript showCR:... with:...
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
22428
b4f17397e9c3 #BUGFIX by cg
Claus Gittinger <cg@exept.de>
parents: 21306
diff changeset
     1
"{ Encoding: utf8 }"
b4f17397e9c3 #BUGFIX by cg
Claus Gittinger <cg@exept.de>
parents: 21306
diff changeset
     2
8148
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
     3
"
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
     4
 COPYRIGHT (c) 2004 by eXept Software AG
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
     5
              All Rights Reserved
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
     6
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
     7
 This software is furnished under a license and may be used
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
     8
 only in accordance with the terms of that license and with the
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
     9
 inclusion of the above copyright notice.   This software may not
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    10
 be provided or otherwise made available to, or used by, any
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    11
 other person.  No title to or ownership of the software is
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    12
 hereby transferred.
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    13
"
8079
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    14
"{ Package: 'stx:libbasic' }"
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    15
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    16
"{ NameSpace: CharacterEncoderImplementations }"
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    17
22479
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    18
FixedBytesEncoder subclass:#TwoByteEncoder
8079
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    19
	instanceVariableNames:''
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    20
	classVariableNames:''
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    21
	poolDictionaries:''
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    22
	category:'Collections-Text-Encodings'
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    23
!
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    24
8148
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    25
!TwoByteEncoder class methodsFor:'documentation'!
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    26
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    27
copyright
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    28
"
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    29
 COPYRIGHT (c) 2004 by eXept Software AG
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    30
              All Rights Reserved
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    31
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    32
 This software is furnished under a license and may be used
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    33
 only in accordance with the terms of that license and with the
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    34
 inclusion of the above copyright notice.   This software may not
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    35
 be provided or otherwise made available to, or used by, any
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    36
 other person.  No title to or ownership of the software is
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    37
 hereby transferred.
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    38
"
21306
8ed77ba2521a #DOCUMENTATION by cg
Claus Gittinger <cg@exept.de>
parents: 21141
diff changeset
    39
!
8ed77ba2521a #DOCUMENTATION by cg
Claus Gittinger <cg@exept.de>
parents: 21141
diff changeset
    40
8ed77ba2521a #DOCUMENTATION by cg
Claus Gittinger <cg@exept.de>
parents: 21141
diff changeset
    41
documentation
8ed77ba2521a #DOCUMENTATION by cg
Claus Gittinger <cg@exept.de>
parents: 21141
diff changeset
    42
"
8ed77ba2521a #DOCUMENTATION by cg
Claus Gittinger <cg@exept.de>
parents: 21141
diff changeset
    43
    abstract superclass of all two-byte encoders
8ed77ba2521a #DOCUMENTATION by cg
Claus Gittinger <cg@exept.de>
parents: 21141
diff changeset
    44
"
8148
dbf64e3142d9 *** empty log message ***
Claus Gittinger <cg@exept.de>
parents: 8134
diff changeset
    45
! !
8079
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    46
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    47
!TwoByteEncoder class methodsFor:'queries'!
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    48
21306
8ed77ba2521a #DOCUMENTATION by cg
Claus Gittinger <cg@exept.de>
parents: 21141
diff changeset
    49
isAbstract
8ed77ba2521a #DOCUMENTATION by cg
Claus Gittinger <cg@exept.de>
parents: 21141
diff changeset
    50
    "Return if this class is an abstract class.
8ed77ba2521a #DOCUMENTATION by cg
Claus Gittinger <cg@exept.de>
parents: 21141
diff changeset
    51
     True is returned here; false for subclasses.
8ed77ba2521a #DOCUMENTATION by cg
Claus Gittinger <cg@exept.de>
parents: 21141
diff changeset
    52
     Abstract subclasses must redefine this again."
8ed77ba2521a #DOCUMENTATION by cg
Claus Gittinger <cg@exept.de>
parents: 21141
diff changeset
    53
8ed77ba2521a #DOCUMENTATION by cg
Claus Gittinger <cg@exept.de>
parents: 21141
diff changeset
    54
    ^ self == CharacterEncoderImplementations::TwoByteEncoder
8ed77ba2521a #DOCUMENTATION by cg
Claus Gittinger <cg@exept.de>
parents: 21141
diff changeset
    55
!
8ed77ba2521a #DOCUMENTATION by cg
Claus Gittinger <cg@exept.de>
parents: 21141
diff changeset
    56
8079
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    57
maxCode
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    58
    ^ 16rFFFF 
22479
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    59
! !
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    60
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    61
!TwoByteEncoder methodsFor:'encoding & decoding'!
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    62
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    63
encodeString:aUnicodeString
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    64
    "given a string in unicode, return a string in my encoding for it"
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    65
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    66
    |newString myCode stringSize "{ Class: SmallInteger }"|
8079
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    67
22479
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    68
    stringSize := aUnicodeString size.
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    69
    newString := self newString:stringSize.
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    70
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    71
    1 to:stringSize do:[:idx |
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    72
        myCode := self encode:((aUnicodeString at:idx) codePoint).
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    73
        newString at:idx put:(Character codePoint:myCode).
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    74
    ].
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    75
    ^ newString
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    76
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    77
    "Created: / 17-01-2018 / 16:33:52 / stefan"
8079
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    78
! !
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
    79
11995
e8df4cb7d6bb changed #characterSize:
fm
parents: 8148
diff changeset
    80
!TwoByteEncoder methodsFor:'queries'!
e8df4cb7d6bb changed #characterSize:
fm
parents: 8148
diff changeset
    81
22428
b4f17397e9c3 #BUGFIX by cg
Claus Gittinger <cg@exept.de>
parents: 21306
diff changeset
    82
characterSize:charOrCodePoint
21141
7781e9897d93 #DOCUMENTATION by cg
Claus Gittinger <cg@exept.de>
parents: 19827
diff changeset
    83
    "return the number of bytes required to encode codePoint"
11995
e8df4cb7d6bb changed #characterSize:
fm
parents: 8148
diff changeset
    84
22479
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    85
    ^ 2
11995
e8df4cb7d6bb changed #characterSize:
fm
parents: 8148
diff changeset
    86
e8df4cb7d6bb changed #characterSize:
fm
parents: 8148
diff changeset
    87
    "Created: / 15-06-2005 / 15:12:01 / janfrog"
22479
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    88
    "Modified (format): / 16-01-2018 / 22:32:03 / stefan"
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    89
!
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    90
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    91
newString:size
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    92
    ^ TwoByteString new:size.
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    93
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    94
    "Created: / 17-01-2018 / 16:36:56 / stefan"
11995
e8df4cb7d6bb changed #characterSize:
fm
parents: 8148
diff changeset
    95
! !
e8df4cb7d6bb changed #characterSize:
fm
parents: 8148
diff changeset
    96
12434
Claus Gittinger <cg@exept.de>
parents: 11995
diff changeset
    97
!TwoByteEncoder methodsFor:'stream support'!
Claus Gittinger <cg@exept.de>
parents: 11995
diff changeset
    98
22479
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
    99
encodeCharacter:aUnicodeCharacterOrCodePoint on:aStream
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   100
    "given a character in unicode, encode it onto aStream.
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   101
     Subclasses can redefine this to avoid allocating many new string instances."
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   102
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   103
    aStream nextPutInt16:(self encode:aUnicodeCharacterOrCodePoint codePoint) MSB:false.
12434
Claus Gittinger <cg@exept.de>
parents: 11995
diff changeset
   104
22479
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   105
    "
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   106
      CharacterEncoderImplementations::ISO8859_10 new encodeCharacter:260 on:Transcript
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   107
      CharacterEncoderImplementations::ISO8859_10 new encodeCharacter:$Ą  on:Transcript
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   108
    "
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   109
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   110
    "Created: / 17-01-2018 / 16:41:09 / stefan"
12434
Claus Gittinger <cg@exept.de>
parents: 11995
diff changeset
   111
!
Claus Gittinger <cg@exept.de>
parents: 11995
diff changeset
   112
22479
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   113
readNextCharacterFrom:aStream
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   114
    | codePoint |
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   115
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   116
    codePoint := aStream nextUnsignedInt16MSB:false.
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   117
    ^ codePoint isNil 
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   118
        ifTrue: [nil]
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   119
        ifFalse: [Character codePoint:codePoint]
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   120
833b8c85dbda #REFACTORING by stefan
Stefan Vogel <sv@exept.de>
parents: 22428
diff changeset
   121
    "Modified: / 16-01-2018 / 22:30:36 / stefan"
12434
Claus Gittinger <cg@exept.de>
parents: 11995
diff changeset
   122
! !
Claus Gittinger <cg@exept.de>
parents: 11995
diff changeset
   123
8079
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   124
!TwoByteEncoder class methodsFor:'documentation'!
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   125
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   126
version
19215
b20035967455 #REFACTORING
Claus Gittinger <cg@exept.de>
parents: 12434
diff changeset
   127
    ^ '$Header$'
12434
Claus Gittinger <cg@exept.de>
parents: 11995
diff changeset
   128
!
Claus Gittinger <cg@exept.de>
parents: 11995
diff changeset
   129
Claus Gittinger <cg@exept.de>
parents: 11995
diff changeset
   130
version_CVS
19215
b20035967455 #REFACTORING
Claus Gittinger <cg@exept.de>
parents: 12434
diff changeset
   131
    ^ '$Header$'
8079
0c51c515c6b6 initial checkin
Claus Gittinger <cg@exept.de>
parents:
diff changeset
   132
! !
19215
b20035967455 #REFACTORING
Claus Gittinger <cg@exept.de>
parents: 12434
diff changeset
   133