#DOCUMENTATION by cg
author Claus Gittinger <cg@exept.de>
Wed, 26 Apr 2017 16:02:26 +0200
changeset 21711 2020534180c5
parent 21710 285f6431ad4a
child 21712 bbdbb633670b
#DOCUMENTATION by cg class: CharacterEncoder class comment/format in: #mapFileURL1_relativePathName #mapFileURL2_relativePathName #mappingURL1 #mappingURL2 changed: #initializeEncoderClassesByName
CharacterEncoder.st
--- a/CharacterEncoder.st	Wed Apr 26 16:01:39 2017 +0200
+++ b/CharacterEncoder.st	Wed Apr 26 16:02:26 2017 +0200
@@ -1,3 +1,5 @@
+"{ Encoding: utf8 }"
+
 "
  COPYRIGHT (c) 2004 by eXept Software AG
               All Rights Reserved
@@ -565,144 +567,146 @@
     EncoderClassesByName := Dictionary new.
 
     EncoderClassesByName at:#'unicode' put:(ud := Dictionary new:237).
-    ud at:#'fontspecific' put:NullEncoder.    
+    ud at:#'fontspecific'       put:NullEncoder.    
     ud at:#'adobe-fontspecific' put:NullEncoder.    
-    ud at:#'ms-oem' put:NullEncoder.    
-    ud at:#'ms-default' put:NullEncoder.    
+    ud at:#'ms-oem'             put:NullEncoder.    
+    ud at:#'ms-default'         put:NullEncoder.    
 
-    "/ className        decoded-name    array-of-encodingNames
+    "/ className            decoded-name    array-of-encodingNames
     #(
-        (ASCII              unicode     ( ascii 'us-ascii' 'iso-ir-6' 'ibm-367' 'ms-cp367' 'cp367'  'iso646-us' 'ibm-cp367' 'ansi_x3.4-1968' ))
+        (ASCII                  unicode     ( ascii 'us-ascii' 'iso-ir-6' 'ibm-367' 'ms-cp367' 'cp367'  'iso646-us' 'ibm-cp367' 'ansi_x3.4-1968' ))
 
-        (BIG5               unicode     ( big5 ))
+        (BIG5                   unicode     ( big5 ))
 
-        (CNS11643           unicode     ( 'cns11643' ))
+        (CNS11643               unicode     ( 'cns11643' ))
 
-        (CP437              unicode     ( 'cp437'  'cp-437' 'ibm-437' 'ms-cp437' 'microsoft-cp437' 'ibm-cp437' ))
+        (CP437                  unicode     ( 'cp437'  'cp-437' 'ibm-437' 'ms-cp437' 'microsoft-cp437' 'ibm-cp437' ))
 
-        (EBCDIC             unicode     ( 'ebcdic' ))
+        (EBCDIC                 unicode     ( 'ebcdic' ))
 
 "/        (GB2313_1980        unicode     ( 'gb2313' 'gb2313-1980' ))
 
-        (GB2312_1980_0      unicode     ( 'gb2312' 'gb2312.1980' 'gb2312.1980-0'))
+        (GB2312_1980_0          unicode     ( 'gb2312' 'gb2312.1980' 'gb2312.1980-0'))
 
-        (HANGUL             unicode     ( 'hangul' ))
+        (HANGUL                 unicode     ( 'hangul' ))
 
-        (ISO10646_1         unicode     ( unicode 'iso10646_1' 'iso10646-1' 'iso-10646-1' ))
+        (ISO10646_1             unicode     ( unicode 'iso10646_1' 'iso10646-1' 'iso-10646-1' ))
 
-        (ISO10646_to_UTF8     unicode   ( utf8 'utf-8' ))
-        (ISO10646_to_UTF16BE  unicode   ( utf16b utf16be 'utf-16b' 'utf-16be' ))
-        (ISO10646_to_UTF16LE  unicode   ( utf16l utf16le 'utf-16e' 'utf-16le' ))
+        (ISO10646_to_UTF8       unicode   ( utf8 'utf-8' ))
+        (ISO10646_to_UTF16BE    unicode   ( utf16b utf16be 'utf-16b' 'utf-16be' ))
+        (ISO10646_to_UTF16LE    unicode   ( utf16l utf16le 'utf-16e' 'utf-16le' ))
 
-        (ISO10646_to_UTF8_MAC unicode   ( 'utf8-mac' 'utf-8-mac' ))
-        (ISO10646_to_XMLUTF8  unicode   ( 'utf8-XML' ))
+        (ISO10646_to_UTF8_MAC   unicode   ( 'utf8-mac' 'utf-8-mac' ))
+        (ISO10646_to_XMLUTF8    unicode   ( 'utf8-XML' ))
 
-        (ISO8859_1          unicode     ( 'iso8859_1' 'iso8859-1' 'iso-8859-1' 'latin-1' 'latin1' 'iso-ir-100' 'ibm-819' 'ms-cp819' 'ibm-cp819' 'iso8859'))
+        (ISO8859_1              unicode     ( 'iso8859_1' 'iso8859-1' 'iso-8859-1' 'latin-1' 'latin1' 'iso-ir-100' 'ibm-819' 'ms-cp819' 'ibm-cp819' 'iso8859'))
 
-        (ISO8859_2          unicode     ( 'iso8859_2' 'iso8859-2' 'iso-8859-2' 'latin2' 'latin-2' 'iso-ir-101'))
+        (ISO8859_2              unicode     ( 'iso8859_2' 'iso8859-2' 'iso-8859-2' 'latin2' 'latin-2' 'iso-ir-101'))
 
-        (ISO8859_3          unicode     ( 'iso8859_3' 'iso8859-3' 'iso-8859-3' 'latin3' 'latin-3' 'iso-ir-109'))
+        (ISO8859_3              unicode     ( 'iso8859_3' 'iso8859-3' 'iso-8859-3' 'latin3' 'latin-3' 'iso-ir-109'))
 
-        (ISO8859_4          unicode     ( 'iso8859_4' 'iso8859-4' 'iso-8859-4' 'latin4' 'latin-4' 'iso-ir-110'))
+        (ISO8859_4              unicode     ( 'iso8859_4' 'iso8859-4' 'iso-8859-4' 'latin4' 'latin-4' 'iso-ir-110'))
 
-        (ISO8859_5          unicode     ( 'iso8859_5' 'iso8859-5' 'iso-8859-5' 'cyrillic' 'iso-ir-144' ))
+        (ISO8859_5              unicode     ( 'iso8859_5' 'iso8859-5' 'iso-8859-5' 'cyrillic' 'iso-ir-144' ))
 
-        (ISO8859_6          unicode     ( 'iso8859_6' 'iso8859-6' 'iso-8859-6' 'arabic' 'asmo-708' 'ecma-114' 'iso-ir-127' ))
+        (ISO8859_6              unicode     ( 'iso8859_6' 'iso8859-6' 'iso-8859-6' 'arabic' 'asmo-708' 'ecma-114' 'iso-ir-127' ))
 
-        (ISO8859_7          unicode     ( 'iso8859_7' 'iso8859-7' 'iso-8859-7' 'greek' 'iso-ir-126' 'ecma-118'))
+        (ISO8859_7              unicode     ( 'iso8859_7' 'iso8859-7' 'iso-8859-7' 'greek' 'iso-ir-126' 'ecma-118'))
 
-        (ISO8859_8          unicode     ( 'iso8859_8' 'iso8859-8' 'iso-8859-8' 'hebrew' 'iso-ir-138' ))
+        (ISO8859_8              unicode     ( 'iso8859_8' 'iso8859-8' 'iso-8859-8' 'hebrew' 'iso-ir-138' ))
 
-        (ISO8859_9          unicode     ( 'iso8859_9' 'iso8859-9' 'iso-8859-9' 'latin5' 'latin-5' 'iso-ir-148'))
+        (ISO8859_9              unicode     ( 'iso8859_9' 'iso8859-9' 'iso-8859-9' 'latin5' 'latin-5' 'iso-ir-148'))
 
-        (ISO8859_10         unicode     ( 'iso8859_10' 'iso8859-10' 'iso-8859-10' 'latin6' 'latin-6' 'iso-ir-157'))
+        (ISO8859_10             unicode     ( 'iso8859_10' 'iso8859-10' 'iso-8859-10' 'latin6' 'latin-6' 'iso-ir-157'))
 
-        (ISO8859_11         unicode     ( 'iso8859_11' 'iso8859-11' 'iso-8859-11' 'thai' ))
+        (ISO8859_11             unicode     ( 'iso8859_11' 'iso8859-11' 'iso-8859-11' 'thai' ))
 
-        (ISO8859_13         unicode     ( 'iso8859_13' 'iso8859-13' 'iso-8859-13' 'latin7' 'latin-7' ))
+        (ISO8859_13             unicode     ( 'iso8859_13' 'iso8859-13' 'iso-8859-13' 'latin7' 'latin-7' ))
 
-        (ISO8859_14         unicode     ( 'iso8859_14' 'iso8859-14' 'iso-8859-14' 'latin8' 'latin-8' 'latin-celtic' ))
+        (ISO8859_14             unicode     ( 'iso8859_14' 'iso8859-14' 'iso-8859-14' 'latin8' 'latin-8' 'latin-celtic' ))
 
-        (ISO8859_15         unicode     ( 'iso8859_15' 'iso8859-15' 'iso-8859-15' 'latin9' 'latin-9' 'iso-ir-203'))
+        (ISO8859_15             unicode     ( 'iso8859_15' 'iso8859-15' 'iso-8859-15' 'latin9' 'latin-9' 'iso-ir-203'))
 
-        (ISO8859_16         unicode     ( 'iso8859_16' 'iso8859-16' 'iso-8859-16' 'latin10' 'latin-10' ))
+        (ISO8859_16             unicode     ( 'iso8859_16' 'iso8859-16' 'iso-8859-16' 'latin10' 'latin-10' ))
 
-        (JIS0201            unicode     ( 'jis0201' #'jisx0201.1976-0'))
+        (JIS0201                unicode     ( 'jis0201' #'jisx0201.1976-0'))
 
-        (JIS0208            unicode     ( jis0208 'jisx0208' 'jisx0208.1983-0' 'jisx0208.1990-0'))
+        (JIS0208                unicode     ( jis0208 'jisx0208' 'jisx0208.1983-0' 'jisx0208.1990-0'))
 
-        (JIS0208_to_JIS7    jis0208     ( jis7 'jis-7' 'x-jis7' 'x-iso2022-jp' 'iso2022-jp'))
+        (JIS0208_to_JIS7        jis0208     ( jis7 'jis-7' 'x-jis7' 'x-iso2022-jp' 'iso2022-jp'))
 
-        (JIS0208_to_EUC     jis0208     ( euc #'x-euc-jp' ))
+        (JIS0208_to_EUC         jis0208     ( euc #'x-euc-jp' ))
 
-        (JIS0208_to_SJIS    jis0208     ( 'sjis' 'shiftjis' 'x-sjis' #'x-shift-jis' #'shift-jis'))
+        (JIS0208_to_SJIS        jis0208     ( 'sjis' 'shiftjis' 'x-sjis' #'x-shift-jis' #'shift-jis'))
 
-        (JIS0212            unicode     ( 'jis0212' ))
+        (JIS0212                unicode     ( 'jis0212' ))
 
-        (JOHAB              unicode     ( 'johab' ))
+        (JOHAB                  unicode     ( 'johab' ))
 
-        (KOI7               unicode     ( 'koi7' ))
+        (KOI7                   unicode     ( 'koi7' ))
 
-        (KOI8_R             unicode     ( #'koi8-r' 'cp878' ))
+        (KOI8_R                 unicode     ( #'koi8-r' 'cp878' ))
 
-        (KOI8_U             unicode     ( #'koi8-u' ))
+        (KOI8_U                 unicode     ( #'koi8-u' ))
 
-        (KSC5601            unicode     ( #'ksc5601' ))
+        (KSC5601                unicode     ( #'ksc5601' ))
 
-        (MAC_Arabic         unicode     ( #'mac-arabic' 'macarabic' ))
+        (MAC_Arabic             unicode     ( #'mac-arabic' 'macarabic' ))
 
-        (MAC_CentralEuropean unicode    ( #'mac-centraleuropean' #'mac-centraleurope' 'maccentraleurope' 'maccentraleuropean' ))
+        (MAC_CentralEuropean    unicode    ( #'mac-centraleuropean' #'mac-centraleurope' 'maccentraleurope' 'maccentraleuropean' ))
 
-        (MAC_Croatian       unicode     ( #'mac-croatian' 'maccroatian'))
+        (MAC_Croatian           unicode     ( #'mac-croatian' 'maccroatian'))
 
-        (MAC_Cyrillic       unicode     ( #'mac-cyrillic' 'maccyrillic' ))
+        (MAC_Cyrillic           unicode     ( #'mac-cyrillic' 'maccyrillic' ))
 
-        (MAC_Dingbats       unicode     ( #'mac-dingbats'  'macdingbats'  'macdingbat'))
+        (MAC_Dingbats           unicode     ( #'mac-dingbats'  'macdingbats'  'macdingbat'))
 
-        (MAC_Farsi          unicode     ( #'mac-farsi' 'macfarsi' ))
+        (MAC_Farsi              unicode     ( #'mac-farsi' 'macfarsi' ))
 
-        (MAC_Greek          unicode     ( #'mac-greek' #'macgreek' ))
+        (MAC_Greek              unicode     ( #'mac-greek' #'macgreek' ))
 
-        (MAC_Hebrew         unicode     ( #'mac-hebrew' #'machebrew'  ))
+        (MAC_Hebrew             unicode     ( #'mac-hebrew' #'machebrew'  ))
 
-        (MAC_Iceland        unicode     ( #'mac-iceland' #'maciceland'  ))
+        (MAC_Iceland            unicode     ( #'mac-iceland' #'maciceland'  ))
 
-        (MAC_Japanese       unicode     ( #'mac-japanese' #'macjapanese'  ))
+        (MAC_Japanese           unicode     ( #'mac-japanese' #'macjapanese'  ))
 
-        (MAC_Korean         unicode     ( #'mac-korean' #'mackorean'  ))
+        (MAC_Korean             unicode     ( #'mac-korean' #'mackorean'  ))
 
-        (MAC_Roman          unicode     ( #'mac-roman' #'macroman' 'macintosh' 'cp10000' ))
+        (MAC_Roman              unicode     ( #'mac-roman' #'macroman' 'macintosh' 'cp10000' ))
 
-        (MAC_Romanian       unicode     ( #'mac-romanian' #'macromanian'  ))
+        (MAC_Romanian           unicode     ( #'mac-romanian' #'macromanian'  ))
 
-        (MAC_Symbol         unicode     ( #'mac-symbol' #'macsymbol'  ))
+        (MAC_Symbol             unicode     ( #'mac-symbol' #'macsymbol'  ))
 
-        (MAC_Thai           unicode     ( #'mac-thai' #'macthai'  ))
+        (MAC_Thai               unicode     ( #'mac-thai' #'macthai'  ))
 
-        (MAC_Turkish        unicode     ( #'mac-turkish' #'macturkish'  ))
+        (MAC_Turkish            unicode     ( #'mac-turkish' #'macturkish'  ))
 
-        (MS_Ansi            unicode     ( #'ms-ansi' 'ms-cp1252' 'microsoft-cp1252' 'cp1252' 'microsoft-ansi' 'windows-1252' 'windows-latin1'))
+        (MS_Ansi                unicode     ( #'ms-ansi' 'ms-cp1252' 'microsoft-cp1252' 'cp1252' 'microsoft-ansi' 'windows-1252' 'windows-latin1'))
 
-        (MS_Arabic          unicode     ( 'ms-arabic' 'ms-cp1256' 'microsoft-cp1256' 'cp1256'  'microsoft-arabic' 'windows-1256'  ))
+        (MS_Arabic              unicode     ( 'ms-arabic' 'ms-cp1256' 'microsoft-cp1256' 'cp1256'  'microsoft-arabic' 'windows-1256'  ))
 
-        (MS_Baltic          unicode     ( 'ms-baltic' 'ms-cp1257' 'microsoft-cp1257' 'cp1257' 'microsoft-baltic' 'windows-1257'  ))
+        (MS_Baltic              unicode     ( 'ms-baltic' 'ms-cp1257' 'microsoft-cp1257' 'cp1257' 'microsoft-baltic' 'windows-1257'  ))
 
-        (MS_Cyrillic        unicode     ( 'ms-cyrillic' 'ms-cp1251' 'microsoft-cp1251' 'cp1251' 'microsoft-cyrillic' 'windows-1251'  ))
+        (MS_Cyrillic            unicode     ( 'ms-cyrillic' 'ms-cp1251' 'microsoft-cp1251' 'cp1251' 'microsoft-cyrillic' 'windows-1251'  ))
 
-        (MS_EastEuropean    unicode     ( 'ms-easteuropean' 'ms-ee' 'cp1250' 'ms-cp1250' 'microsoft-cp1250' 'microsoft-easteuropean' 'windows-1250'  ))
+        (MS_EastEuropean        unicode     ( 'ms-easteuropean' 'ms-ee' 'cp1250' 'ms-cp1250' 'microsoft-cp1250' 'microsoft-easteuropean' 'windows-1250'  ))
 
-        (MS_Greek           unicode     ( 'ms-greek' 'ms-cp1253' 'microsoft-cp1253' 'cp1253' 'microsoft-greek' 'windows-1253' ))
+        (MS_Greek               unicode     ( 'ms-greek' 'ms-cp1253' 'microsoft-cp1253' 'cp1253' 'microsoft-greek' 'windows-1253' ))
 
-        (MS_Hebrew          unicode     ( 'ms-hebrew' 'ms-cp1255' 'microsoft-cp1255' 'cp1255' 'microsoft-hebrew' 'windows-1255' ))
+        (MS_Hebrew              unicode     ( 'ms-hebrew' 'ms-cp1255' 'microsoft-cp1255' 'cp1255' 'microsoft-hebrew' 'windows-1255' ))
 
 "/        (MS_Symbol           unicode     ( 'ms-symbol' 'microsoft-symbol'  ))
 
-        (MS_Turkish         unicode     ( 'ms-turkish' 'ms-cp1254' 'microsoft-cp1254' 'cp1254' 'microsoft-turkish' 'windows-1254'  ))
+        (MS_Turkish             unicode     ( 'ms-turkish' 'ms-cp1254' 'microsoft-cp1254' 'cp1254' 'microsoft-turkish' 'windows-1254'  ))
 
-        (NEXT               unicode     ( 'next' 'nextstep'  ))
+        (NEXT                   unicode     ( 'next' 'nextstep'  ))
 
         (ISO10646_to_SGML       unicode     ( 'sgml' ))
         (ISO10646_to_JavaText   unicode     ( 'java' 'javaText' ))
+
+        (AdobeStandard          unicode     ( 'Adobe Standard' 'AdobeStandard' 'Adobe' 'adobe-standard' ))
     ) triplesDo:[:className :decodesTo :encodesTo |
         |decodesToDict|
 
@@ -911,20 +915,18 @@
 !
 
 mapFileURL1_relativePathName
-    "raise an error: must be redefined in concrete subclass(es)"
+    "must be redefined in concrete subclass(es)"
     
     ^ nil
 !
 
 mapFileURL2_relativePathName
-    "raise an error: must be redefined in concrete subclass(es)"
+    "must be redefined in concrete subclass(es)"
     
     ^ nil
 !
 
 mappingURL1
-    "raise an error: must be redefined in concrete subclass(es)"
-    
     |rel|
 
     rel := self mapFileURL1_relativePathName.
@@ -935,8 +937,6 @@
 !
 
 mappingURL2
-    "raise an error: must be redefined in concrete subclass(es)"
-    
     |rel|
 
     rel := self mapFileURL2_relativePathName.