#DOCUMENTATION by cg
class: CharacterEncoder class
comment/format in:
#mapFileURL1_relativePathName
#mapFileURL2_relativePathName
#mappingURL1
#mappingURL2
changed: #initializeEncoderClassesByName
--- a/CharacterEncoder.st Wed Apr 26 16:01:39 2017 +0200
+++ b/CharacterEncoder.st Wed Apr 26 16:02:26 2017 +0200
@@ -1,3 +1,5 @@
+"{ Encoding: utf8 }"
+
"
COPYRIGHT (c) 2004 by eXept Software AG
All Rights Reserved
@@ -565,144 +567,146 @@
EncoderClassesByName := Dictionary new.
EncoderClassesByName at:#'unicode' put:(ud := Dictionary new:237).
- ud at:#'fontspecific' put:NullEncoder.
+ ud at:#'fontspecific' put:NullEncoder.
ud at:#'adobe-fontspecific' put:NullEncoder.
- ud at:#'ms-oem' put:NullEncoder.
- ud at:#'ms-default' put:NullEncoder.
+ ud at:#'ms-oem' put:NullEncoder.
+ ud at:#'ms-default' put:NullEncoder.
- "/ className decoded-name array-of-encodingNames
+ "/ className decoded-name array-of-encodingNames
#(
- (ASCII unicode ( ascii 'us-ascii' 'iso-ir-6' 'ibm-367' 'ms-cp367' 'cp367' 'iso646-us' 'ibm-cp367' 'ansi_x3.4-1968' ))
+ (ASCII unicode ( ascii 'us-ascii' 'iso-ir-6' 'ibm-367' 'ms-cp367' 'cp367' 'iso646-us' 'ibm-cp367' 'ansi_x3.4-1968' ))
- (BIG5 unicode ( big5 ))
+ (BIG5 unicode ( big5 ))
- (CNS11643 unicode ( 'cns11643' ))
+ (CNS11643 unicode ( 'cns11643' ))
- (CP437 unicode ( 'cp437' 'cp-437' 'ibm-437' 'ms-cp437' 'microsoft-cp437' 'ibm-cp437' ))
+ (CP437 unicode ( 'cp437' 'cp-437' 'ibm-437' 'ms-cp437' 'microsoft-cp437' 'ibm-cp437' ))
- (EBCDIC unicode ( 'ebcdic' ))
+ (EBCDIC unicode ( 'ebcdic' ))
"/ (GB2313_1980 unicode ( 'gb2313' 'gb2313-1980' ))
- (GB2312_1980_0 unicode ( 'gb2312' 'gb2312.1980' 'gb2312.1980-0'))
+ (GB2312_1980_0 unicode ( 'gb2312' 'gb2312.1980' 'gb2312.1980-0'))
- (HANGUL unicode ( 'hangul' ))
+ (HANGUL unicode ( 'hangul' ))
- (ISO10646_1 unicode ( unicode 'iso10646_1' 'iso10646-1' 'iso-10646-1' ))
+ (ISO10646_1 unicode ( unicode 'iso10646_1' 'iso10646-1' 'iso-10646-1' ))
- (ISO10646_to_UTF8 unicode ( utf8 'utf-8' ))
- (ISO10646_to_UTF16BE unicode ( utf16b utf16be 'utf-16b' 'utf-16be' ))
- (ISO10646_to_UTF16LE unicode ( utf16l utf16le 'utf-16e' 'utf-16le' ))
+ (ISO10646_to_UTF8 unicode ( utf8 'utf-8' ))
+ (ISO10646_to_UTF16BE unicode ( utf16b utf16be 'utf-16b' 'utf-16be' ))
+ (ISO10646_to_UTF16LE unicode ( utf16l utf16le 'utf-16l' 'utf-16e' 'utf-16le' )) "/ 'utf-16l' parallels 'utf-16b'; 'utf-16e' (apparent typo) kept for compatibility
- (ISO10646_to_UTF8_MAC unicode ( 'utf8-mac' 'utf-8-mac' ))
- (ISO10646_to_XMLUTF8 unicode ( 'utf8-XML' ))
+ (ISO10646_to_UTF8_MAC unicode ( 'utf8-mac' 'utf-8-mac' ))
+ (ISO10646_to_XMLUTF8 unicode ( 'utf8-XML' ))
- (ISO8859_1 unicode ( 'iso8859_1' 'iso8859-1' 'iso-8859-1' 'latin-1' 'latin1' 'iso-ir-100' 'ibm-819' 'ms-cp819' 'ibm-cp819' 'iso8859'))
+ (ISO8859_1 unicode ( 'iso8859_1' 'iso8859-1' 'iso-8859-1' 'latin-1' 'latin1' 'iso-ir-100' 'ibm-819' 'ms-cp819' 'ibm-cp819' 'iso8859'))
- (ISO8859_2 unicode ( 'iso8859_2' 'iso8859-2' 'iso-8859-2' 'latin2' 'latin-2' 'iso-ir-101'))
+ (ISO8859_2 unicode ( 'iso8859_2' 'iso8859-2' 'iso-8859-2' 'latin2' 'latin-2' 'iso-ir-101'))
- (ISO8859_3 unicode ( 'iso8859_3' 'iso8859-3' 'iso-8859-3' 'latin3' 'latin-3' 'iso-ir-109'))
+ (ISO8859_3 unicode ( 'iso8859_3' 'iso8859-3' 'iso-8859-3' 'latin3' 'latin-3' 'iso-ir-109'))
- (ISO8859_4 unicode ( 'iso8859_4' 'iso8859-4' 'iso-8859-4' 'latin4' 'latin-4' 'iso-ir-110'))
+ (ISO8859_4 unicode ( 'iso8859_4' 'iso8859-4' 'iso-8859-4' 'latin4' 'latin-4' 'iso-ir-110'))
- (ISO8859_5 unicode ( 'iso8859_5' 'iso8859-5' 'iso-8859-5' 'cyrillic' 'iso-ir-144' ))
+ (ISO8859_5 unicode ( 'iso8859_5' 'iso8859-5' 'iso-8859-5' 'cyrillic' 'iso-ir-144' ))
- (ISO8859_6 unicode ( 'iso8859_6' 'iso8859-6' 'iso-8859-6' 'arabic' 'asmo-708' 'ecma-114' 'iso-ir-127' ))
+ (ISO8859_6 unicode ( 'iso8859_6' 'iso8859-6' 'iso-8859-6' 'arabic' 'asmo-708' 'ecma-114' 'iso-ir-127' ))
- (ISO8859_7 unicode ( 'iso8859_7' 'iso8859-7' 'iso-8859-7' 'greek' 'iso-ir-126' 'ecma-118'))
+ (ISO8859_7 unicode ( 'iso8859_7' 'iso8859-7' 'iso-8859-7' 'greek' 'iso-ir-126' 'ecma-118'))
- (ISO8859_8 unicode ( 'iso8859_8' 'iso8859-8' 'iso-8859-8' 'hebrew' 'iso-ir-138' ))
+ (ISO8859_8 unicode ( 'iso8859_8' 'iso8859-8' 'iso-8859-8' 'hebrew' 'iso-ir-138' ))
- (ISO8859_9 unicode ( 'iso8859_9' 'iso8859-9' 'iso-8859-9' 'latin5' 'latin-5' 'iso-ir-148'))
+ (ISO8859_9 unicode ( 'iso8859_9' 'iso8859-9' 'iso-8859-9' 'latin5' 'latin-5' 'iso-ir-148'))
- (ISO8859_10 unicode ( 'iso8859_10' 'iso8859-10' 'iso-8859-10' 'latin6' 'latin-6' 'iso-ir-157'))
+ (ISO8859_10 unicode ( 'iso8859_10' 'iso8859-10' 'iso-8859-10' 'latin6' 'latin-6' 'iso-ir-157'))
- (ISO8859_11 unicode ( 'iso8859_11' 'iso8859-11' 'iso-8859-11' 'thai' ))
+ (ISO8859_11 unicode ( 'iso8859_11' 'iso8859-11' 'iso-8859-11' 'thai' ))
- (ISO8859_13 unicode ( 'iso8859_13' 'iso8859-13' 'iso-8859-13' 'latin7' 'latin-7' ))
+ (ISO8859_13 unicode ( 'iso8859_13' 'iso8859-13' 'iso-8859-13' 'latin7' 'latin-7' ))
- (ISO8859_14 unicode ( 'iso8859_14' 'iso8859-14' 'iso-8859-14' 'latin8' 'latin-8' 'latin-celtic' ))
+ (ISO8859_14 unicode ( 'iso8859_14' 'iso8859-14' 'iso-8859-14' 'latin8' 'latin-8' 'latin-celtic' ))
- (ISO8859_15 unicode ( 'iso8859_15' 'iso8859-15' 'iso-8859-15' 'latin9' 'latin-9' 'iso-ir-203'))
+ (ISO8859_15 unicode ( 'iso8859_15' 'iso8859-15' 'iso-8859-15' 'latin9' 'latin-9' 'iso-ir-203'))
- (ISO8859_16 unicode ( 'iso8859_16' 'iso8859-16' 'iso-8859-16' 'latin10' 'latin-10' ))
+ (ISO8859_16 unicode ( 'iso8859_16' 'iso8859-16' 'iso-8859-16' 'latin10' 'latin-10' ))
- (JIS0201 unicode ( 'jis0201' #'jisx0201.1976-0'))
+ (JIS0201 unicode ( 'jis0201' #'jisx0201.1976-0'))
- (JIS0208 unicode ( jis0208 'jisx0208' 'jisx0208.1983-0' 'jisx0208.1990-0'))
+ (JIS0208 unicode ( jis0208 'jisx0208' 'jisx0208.1983-0' 'jisx0208.1990-0'))
- (JIS0208_to_JIS7 jis0208 ( jis7 'jis-7' 'x-jis7' 'x-iso2022-jp' 'iso2022-jp'))
+ (JIS0208_to_JIS7 jis0208 ( jis7 'jis-7' 'x-jis7' 'x-iso2022-jp' 'iso2022-jp'))
- (JIS0208_to_EUC jis0208 ( euc #'x-euc-jp' ))
+ (JIS0208_to_EUC jis0208 ( euc #'x-euc-jp' ))
- (JIS0208_to_SJIS jis0208 ( 'sjis' 'shiftjis' 'x-sjis' #'x-shift-jis' #'shift-jis'))
+ (JIS0208_to_SJIS jis0208 ( 'sjis' 'shiftjis' 'x-sjis' #'x-shift-jis' #'shift-jis'))
- (JIS0212 unicode ( 'jis0212' ))
+ (JIS0212 unicode ( 'jis0212' ))
- (JOHAB unicode ( 'johab' ))
+ (JOHAB unicode ( 'johab' ))
- (KOI7 unicode ( 'koi7' ))
+ (KOI7 unicode ( 'koi7' ))
- (KOI8_R unicode ( #'koi8-r' 'cp878' ))
+ (KOI8_R unicode ( #'koi8-r' 'cp878' ))
- (KOI8_U unicode ( #'koi8-u' ))
+ (KOI8_U unicode ( #'koi8-u' ))
- (KSC5601 unicode ( #'ksc5601' ))
+ (KSC5601 unicode ( #'ksc5601' ))
- (MAC_Arabic unicode ( #'mac-arabic' 'macarabic' ))
+ (MAC_Arabic unicode ( #'mac-arabic' 'macarabic' ))
- (MAC_CentralEuropean unicode ( #'mac-centraleuropean' #'mac-centraleurope' 'maccentraleurope' 'maccentraleuropean' ))
+ (MAC_CentralEuropean unicode ( #'mac-centraleuropean' #'mac-centraleurope' 'maccentraleurope' 'maccentraleuropean' ))
- (MAC_Croatian unicode ( #'mac-croatian' 'maccroatian'))
+ (MAC_Croatian unicode ( #'mac-croatian' 'maccroatian'))
- (MAC_Cyrillic unicode ( #'mac-cyrillic' 'maccyrillic' ))
+ (MAC_Cyrillic unicode ( #'mac-cyrillic' 'maccyrillic' ))
- (MAC_Dingbats unicode ( #'mac-dingbats' 'macdingbats' 'macdingbat'))
+ (MAC_Dingbats unicode ( #'mac-dingbats' 'macdingbats' 'macdingbat'))
- (MAC_Farsi unicode ( #'mac-farsi' 'macfarsi' ))
+ (MAC_Farsi unicode ( #'mac-farsi' 'macfarsi' ))
- (MAC_Greek unicode ( #'mac-greek' #'macgreek' ))
+ (MAC_Greek unicode ( #'mac-greek' #'macgreek' ))
- (MAC_Hebrew unicode ( #'mac-hebrew' #'machebrew' ))
+ (MAC_Hebrew unicode ( #'mac-hebrew' #'machebrew' ))
- (MAC_Iceland unicode ( #'mac-iceland' #'maciceland' ))
+ (MAC_Iceland unicode ( #'mac-iceland' #'maciceland' ))
- (MAC_Japanese unicode ( #'mac-japanese' #'macjapanese' ))
+ (MAC_Japanese unicode ( #'mac-japanese' #'macjapanese' ))
- (MAC_Korean unicode ( #'mac-korean' #'mackorean' ))
+ (MAC_Korean unicode ( #'mac-korean' #'mackorean' ))
- (MAC_Roman unicode ( #'mac-roman' #'macroman' 'macintosh' 'cp10000' ))
+ (MAC_Roman unicode ( #'mac-roman' #'macroman' 'macintosh' 'cp10000' ))
- (MAC_Romanian unicode ( #'mac-romanian' #'macromanian' ))
+ (MAC_Romanian unicode ( #'mac-romanian' #'macromanian' ))
- (MAC_Symbol unicode ( #'mac-symbol' #'macsymbol' ))
+ (MAC_Symbol unicode ( #'mac-symbol' #'macsymbol' ))
- (MAC_Thai unicode ( #'mac-thai' #'macthai' ))
+ (MAC_Thai unicode ( #'mac-thai' #'macthai' ))
- (MAC_Turkish unicode ( #'mac-turkish' #'macturkish' ))
+ (MAC_Turkish unicode ( #'mac-turkish' #'macturkish' ))
- (MS_Ansi unicode ( #'ms-ansi' 'ms-cp1252' 'microsoft-cp1252' 'cp1252' 'microsoft-ansi' 'windows-1252' 'windows-latin1'))
+ (MS_Ansi unicode ( #'ms-ansi' 'ms-cp1252' 'microsoft-cp1252' 'cp1252' 'microsoft-ansi' 'windows-1252' 'windows-latin1'))
- (MS_Arabic unicode ( 'ms-arabic' 'ms-cp1256' 'microsoft-cp1256' 'cp1256' 'microsoft-arabic' 'windows-1256' ))
+ (MS_Arabic unicode ( 'ms-arabic' 'ms-cp1256' 'microsoft-cp1256' 'cp1256' 'microsoft-arabic' 'windows-1256' ))
- (MS_Baltic unicode ( 'ms-baltic' 'ms-cp1257' 'microsoft-cp1257' 'cp1257' 'microsoft-baltic' 'windows-1257' ))
+ (MS_Baltic unicode ( 'ms-baltic' 'ms-cp1257' 'microsoft-cp1257' 'cp1257' 'microsoft-baltic' 'windows-1257' ))
- (MS_Cyrillic unicode ( 'ms-cyrillic' 'ms-cp1251' 'microsoft-cp1251' 'cp1251' 'microsoft-cyrillic' 'windows-1251' ))
+ (MS_Cyrillic unicode ( 'ms-cyrillic' 'ms-cp1251' 'microsoft-cp1251' 'cp1251' 'microsoft-cyrillic' 'windows-1251' ))
- (MS_EastEuropean unicode ( 'ms-easteuropean' 'ms-ee' 'cp1250' 'ms-cp1250' 'microsoft-cp1250' 'microsoft-easteuropean' 'windows-1250' ))
+ (MS_EastEuropean unicode ( 'ms-easteuropean' 'ms-ee' 'cp1250' 'ms-cp1250' 'microsoft-cp1250' 'microsoft-easteuropean' 'windows-1250' ))
- (MS_Greek unicode ( 'ms-greek' 'ms-cp1253' 'microsoft-cp1253' 'cp1253' 'microsoft-greek' 'windows-1253' ))
+ (MS_Greek unicode ( 'ms-greek' 'ms-cp1253' 'microsoft-cp1253' 'cp1253' 'microsoft-greek' 'windows-1253' ))
- (MS_Hebrew unicode ( 'ms-hebrew' 'ms-cp1255' 'microsoft-cp1255' 'cp1255' 'microsoft-hebrew' 'windows-1255' ))
+ (MS_Hebrew unicode ( 'ms-hebrew' 'ms-cp1255' 'microsoft-cp1255' 'cp1255' 'microsoft-hebrew' 'windows-1255' ))
"/ (MS_Symbol unicode ( 'ms-symbol' 'microsoft-symbol' ))
- (MS_Turkish unicode ( 'ms-turkish' 'ms-cp1254' 'microsoft-cp1254' 'cp1254' 'microsoft-turkish' 'windows-1254' ))
+ (MS_Turkish unicode ( 'ms-turkish' 'ms-cp1254' 'microsoft-cp1254' 'cp1254' 'microsoft-turkish' 'windows-1254' ))
- (NEXT unicode ( 'next' 'nextstep' ))
+ (NEXT unicode ( 'next' 'nextstep' ))
(ISO10646_to_SGML unicode ( 'sgml' ))
(ISO10646_to_JavaText unicode ( 'java' 'javaText' ))
+
+ (AdobeStandard unicode ( 'Adobe Standard' 'AdobeStandard' 'Adobe' 'adobe-standard' ))
) triplesDo:[:className :decodesTo :encodesTo |
|decodesToDict|
@@ -911,20 +915,18 @@
!
mapFileURL1_relativePathName
- "raise an error: must be redefined in concrete subclass(es)"
+ "answers nil here (no error is raised); must be redefined in concrete subclass(es)"
^ nil
!
mapFileURL2_relativePathName
- "raise an error: must be redefined in concrete subclass(es)"
+ "answers nil here (no error is raised); must be redefined in concrete subclass(es)"
^ nil
!
mappingURL1
- "raise an error: must be redefined in concrete subclass(es)"
-
|rel|
rel := self mapFileURL1_relativePathName.
@@ -935,8 +937,6 @@
!
mappingURL2
- "raise an error: must be redefined in concrete subclass(es)"
-
|rel|
rel := self mapFileURL2_relativePathName.