CharacterEncoderImplementations__MAC_CentralEuropean.st
author Claus Gittinger <cg@exept.de>
Tue, 09 Jul 2019 20:55:17 +0200
changeset 24417 03b083548da2
parent 8148 dbf64e3142d9
child 17711 39faaaf888b4
permissions -rw-r--r--
#REFACTORING by exept class: Smalltalk class changed: #recursiveInstallAutoloadedClassesFrom:rememberIn:maxLevels:noAutoload:packageTop:showSplashInLevels: Transcript showCR:(... bindWith:...) -> Transcript showCR:... with:...

"
 COPYRIGHT (c) 2004 by eXept Software AG
              All Rights Reserved

 This software is furnished under a license and may be used
 only in accordance with the terms of that license and with the
 inclusion of the above copyright notice.   This software may not
 be provided or otherwise made available to, or used by, any
 other person.  No title to or ownership of the software is
 hereby transferred.
"

"{ Package: 'stx:libbasic' }"

"{ NameSpace: CharacterEncoderImplementations }"

"Encoder class for the Mac OS Central European single-byte character set.
 The class declares no instance, class or pool variables of its own;
 the code table is kept as text in the class-side #mapping method, and
 the name of the vendor file it was taken from is answered by the
 class-side #mapFileURL1_relativePathName method.
 NOTE(review): all encode/decode behavior is presumably inherited from
 SingleByteEncoder - that superclass is not part of this file, confirm there."
SingleByteEncoder subclass:#MAC_CentralEuropean
	instanceVariableNames:''
	classVariableNames:''
	poolDictionaries:''
	category:'Collections-Text-Encodings'
!

!MAC_CentralEuropean class methodsFor:'documentation'!

copyright
"
 COPYRIGHT (c) 2004 by eXept Software AG
              All Rights Reserved

 This software is furnished under a license and may be used
 only in accordance with the terms of that license and with the
 inclusion of the above copyright notice.   This software may not
 be provided or otherwise made available to, or used by, any
 other person.  No title to or ownership of the software is
 hereby transferred.
"

    "Comment-only method: there are no statements, the legal notice above
     is the whole content. It is the same text as the notice at the top
     of this source file.
     NOTE(review): keep the notice as the FIRST comment of this method and
     do not reword it - tools presumably read it from there; confirm
     before restructuring."
! !

!MAC_CentralEuropean class methodsFor:'mapping'!

mapFileURL1_relativePathName
    "Answer the relative path name (a String) of the vendor mapping file
     which describes this encoding: Apple's CENTEURO.TXT.
     The 'From:' line at the top of the table in #mapping gives the full
     location as http://www.unicode.org/Public/MAPPINGS/ followed by this path.
     NOTE(review): the base URL this path is resolved against is not
     defined in this class - presumably supplied by the caller or a
     superclass; confirm there."

    ^ 'VENDORS/APPLE/CENTEURO.TXT'
!

mapping
"
# From: http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/CENTEURO.TXT

#=======================================================================
#   File name:  CENTEURO.TXT
#
#   Contents:   Map (external version) from Mac OS Central European
#               character set to Unicode 2.1 through Unicode 3.2.
#
#   Copyright:  (c) 1995-2002 by Apple Computer, Inc., all rights
#               reserved.
#
#   Contact:    charsets@apple.com
#
#   Changes:
#
#      b3,c1 2002-Dec-19    Update URLs. Matches internal utom<b1>.
#       b02  1999-Sep-22    Update contact e-mail address. Matches
#                           internal utom<b1>, ufrm<b1>, and Text
#                           Encoding Converter version 1.5.
#       n05  1998-Feb-05    Update header comments to new format; no
#                           mapping changes. Matches internal utom<n3>,
#                           ufrm<n13>, and Text Encoding Converter
#                           version 1.3.
#       n03  1995-Apr-15    First version (after fixing some typos).
#                           Matches internal ufrm<n5>.
#
# Standard header:
# ----------------
#
#   Apple, the Apple logo, and Macintosh are trademarks of Apple
#   Computer, Inc., registered in the United States and other countries.
#   Unicode is a trademark of Unicode Inc. For the sake of brevity,
#   throughout this document, 'Macintosh' can be used to refer to
#   Macintosh computers and 'Unicode' can be used to refer to the
#   Unicode standard.
#
#   Apple makes no warranty or representation, either express or
#   implied, with respect to these tables, their quality, accuracy, or
#   fitness for a particular purpose. In no event will Apple be liable
#   for direct, indirect, special, incidental, or consequential damages 
#   resulting from any defect or inaccuracy in this document or the
#   accompanying tables.
#
#   These mapping tables and character lists are subject to change.
#   The latest tables should be available from the following:
#
#   <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
#   For general information about Mac OS encodings and these mapping
#   tables, see the file 'README.TXT'.
#
# Format:
# -------
#
#   Three tab-separated columns;
#   '#' begins a comment which continues to the end of the line.
#     Column #1 is the Mac OS Central European code (in hex as 0xNN)
#     Column #2 is the corresponding Unicode (in hex as 0xNNNN)
#     Column #3 is a comment containing the Unicode name
#
#   The entries are in Mac OS Central European code order.
#
#   Control character mappings are not shown in this table, following
#   the conventions of the standard UTC mapping tables. However, the
#   Mac OS Central European character set uses the standard control
#   characters at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Central European:
# ---------------------------------
#
#   This character set is intended to cover the following languages:
#
#   Polish, Czech, Slovak, Hungarian, Estonian, Latvian, Lithuanian
#
#   These are written in Latin script, but using a different set of
#   of accented characters than Mac OS Roman. The Mac OS Central
#   European character set also includes a number of characters
#   needed for the Mac OS user interface and localization (e.g.
#   ellipsis, bullet, copyright sign), several typographic
#   punctuation symbols, math symbols, etc. However, it has a
#   smaller set of punctuation and symbols than Mac OS Roman. All of
#   the characters in Mac OS Central European that are also in the
#   Mac OS Roman character set are at the same code point in both
#   character sets; this improves application compatibility.
#
#   Note: This does not have the same letter repertoire as ISO
#   8859-2 (Latin-2); each has some accented letters that the other
#   does not have.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# Details of mapping changes in each version:
# -------------------------------------------
#
##################

0x20    0x0020  # SPACE
0x21    0x0021  # EXCLAMATION MARK
0x22    0x0022  # QUOTATION MARK
0x23    0x0023  # NUMBER SIGN
0x24    0x0024  # DOLLAR SIGN
0x25    0x0025  # PERCENT SIGN
0x26    0x0026  # AMPERSAND
0x27    0x0027  # APOSTROPHE
0x28    0x0028  # LEFT PARENTHESIS
0x29    0x0029  # RIGHT PARENTHESIS
0x2A    0x002A  # ASTERISK
0x2B    0x002B  # PLUS SIGN
0x2C    0x002C  # COMMA
0x2D    0x002D  # HYPHEN-MINUS
0x2E    0x002E  # FULL STOP
0x2F    0x002F  # SOLIDUS
0x30    0x0030  # DIGIT ZERO
0x31    0x0031  # DIGIT ONE
0x32    0x0032  # DIGIT TWO
0x33    0x0033  # DIGIT THREE
0x34    0x0034  # DIGIT FOUR
0x35    0x0035  # DIGIT FIVE
0x36    0x0036  # DIGIT SIX
0x37    0x0037  # DIGIT SEVEN
0x38    0x0038  # DIGIT EIGHT
0x39    0x0039  # DIGIT NINE
0x3A    0x003A  # COLON
0x3B    0x003B  # SEMICOLON
0x3C    0x003C  # LESS-THAN SIGN
0x3D    0x003D  # EQUALS SIGN
0x3E    0x003E  # GREATER-THAN SIGN
0x3F    0x003F  # QUESTION MARK
0x40    0x0040  # COMMERCIAL AT
0x41    0x0041  # LATIN CAPITAL LETTER A
0x42    0x0042  # LATIN CAPITAL LETTER B
0x43    0x0043  # LATIN CAPITAL LETTER C
0x44    0x0044  # LATIN CAPITAL LETTER D
0x45    0x0045  # LATIN CAPITAL LETTER E
0x46    0x0046  # LATIN CAPITAL LETTER F
0x47    0x0047  # LATIN CAPITAL LETTER G
0x48    0x0048  # LATIN CAPITAL LETTER H
0x49    0x0049  # LATIN CAPITAL LETTER I
0x4A    0x004A  # LATIN CAPITAL LETTER J
0x4B    0x004B  # LATIN CAPITAL LETTER K
0x4C    0x004C  # LATIN CAPITAL LETTER L
0x4D    0x004D  # LATIN CAPITAL LETTER M
0x4E    0x004E  # LATIN CAPITAL LETTER N
0x4F    0x004F  # LATIN CAPITAL LETTER O
0x50    0x0050  # LATIN CAPITAL LETTER P
0x51    0x0051  # LATIN CAPITAL LETTER Q
0x52    0x0052  # LATIN CAPITAL LETTER R
0x53    0x0053  # LATIN CAPITAL LETTER S
0x54    0x0054  # LATIN CAPITAL LETTER T
0x55    0x0055  # LATIN CAPITAL LETTER U
0x56    0x0056  # LATIN CAPITAL LETTER V
0x57    0x0057  # LATIN CAPITAL LETTER W
0x58    0x0058  # LATIN CAPITAL LETTER X
0x59    0x0059  # LATIN CAPITAL LETTER Y
0x5A    0x005A  # LATIN CAPITAL LETTER Z
0x5B    0x005B  # LEFT SQUARE BRACKET
0x5C    0x005C  # REVERSE SOLIDUS
0x5D    0x005D  # RIGHT SQUARE BRACKET
0x5E    0x005E  # CIRCUMFLEX ACCENT
0x5F    0x005F  # LOW LINE
0x60    0x0060  # GRAVE ACCENT
0x61    0x0061  # LATIN SMALL LETTER A
0x62    0x0062  # LATIN SMALL LETTER B
0x63    0x0063  # LATIN SMALL LETTER C
0x64    0x0064  # LATIN SMALL LETTER D
0x65    0x0065  # LATIN SMALL LETTER E
0x66    0x0066  # LATIN SMALL LETTER F
0x67    0x0067  # LATIN SMALL LETTER G
0x68    0x0068  # LATIN SMALL LETTER H
0x69    0x0069  # LATIN SMALL LETTER I
0x6A    0x006A  # LATIN SMALL LETTER J
0x6B    0x006B  # LATIN SMALL LETTER K
0x6C    0x006C  # LATIN SMALL LETTER L
0x6D    0x006D  # LATIN SMALL LETTER M
0x6E    0x006E  # LATIN SMALL LETTER N
0x6F    0x006F  # LATIN SMALL LETTER O
0x70    0x0070  # LATIN SMALL LETTER P
0x71    0x0071  # LATIN SMALL LETTER Q
0x72    0x0072  # LATIN SMALL LETTER R
0x73    0x0073  # LATIN SMALL LETTER S
0x74    0x0074  # LATIN SMALL LETTER T
0x75    0x0075  # LATIN SMALL LETTER U
0x76    0x0076  # LATIN SMALL LETTER V
0x77    0x0077  # LATIN SMALL LETTER W
0x78    0x0078  # LATIN SMALL LETTER X
0x79    0x0079  # LATIN SMALL LETTER Y
0x7A    0x007A  # LATIN SMALL LETTER Z
0x7B    0x007B  # LEFT CURLY BRACKET
0x7C    0x007C  # VERTICAL LINE
0x7D    0x007D  # RIGHT CURLY BRACKET
0x7E    0x007E  # TILDE
#
0x80    0x00C4  # LATIN CAPITAL LETTER A WITH DIAERESIS
0x81    0x0100  # LATIN CAPITAL LETTER A WITH MACRON
0x82    0x0101  # LATIN SMALL LETTER A WITH MACRON
0x83    0x00C9  # LATIN CAPITAL LETTER E WITH ACUTE
0x84    0x0104  # LATIN CAPITAL LETTER A WITH OGONEK
0x85    0x00D6  # LATIN CAPITAL LETTER O WITH DIAERESIS
0x86    0x00DC  # LATIN CAPITAL LETTER U WITH DIAERESIS
0x87    0x00E1  # LATIN SMALL LETTER A WITH ACUTE
0x88    0x0105  # LATIN SMALL LETTER A WITH OGONEK
0x89    0x010C  # LATIN CAPITAL LETTER C WITH CARON
0x8A    0x00E4  # LATIN SMALL LETTER A WITH DIAERESIS
0x8B    0x010D  # LATIN SMALL LETTER C WITH CARON
0x8C    0x0106  # LATIN CAPITAL LETTER C WITH ACUTE
0x8D    0x0107  # LATIN SMALL LETTER C WITH ACUTE
0x8E    0x00E9  # LATIN SMALL LETTER E WITH ACUTE
0x8F    0x0179  # LATIN CAPITAL LETTER Z WITH ACUTE
0x90    0x017A  # LATIN SMALL LETTER Z WITH ACUTE
0x91    0x010E  # LATIN CAPITAL LETTER D WITH CARON
0x92    0x00ED  # LATIN SMALL LETTER I WITH ACUTE
0x93    0x010F  # LATIN SMALL LETTER D WITH CARON
0x94    0x0112  # LATIN CAPITAL LETTER E WITH MACRON
0x95    0x0113  # LATIN SMALL LETTER E WITH MACRON
0x96    0x0116  # LATIN CAPITAL LETTER E WITH DOT ABOVE
0x97    0x00F3  # LATIN SMALL LETTER O WITH ACUTE
0x98    0x0117  # LATIN SMALL LETTER E WITH DOT ABOVE
0x99    0x00F4  # LATIN SMALL LETTER O WITH CIRCUMFLEX
0x9A    0x00F6  # LATIN SMALL LETTER O WITH DIAERESIS
0x9B    0x00F5  # LATIN SMALL LETTER O WITH TILDE
0x9C    0x00FA  # LATIN SMALL LETTER U WITH ACUTE
0x9D    0x011A  # LATIN CAPITAL LETTER E WITH CARON
0x9E    0x011B  # LATIN SMALL LETTER E WITH CARON
0x9F    0x00FC  # LATIN SMALL LETTER U WITH DIAERESIS
0xA0    0x2020  # DAGGER
0xA1    0x00B0  # DEGREE SIGN
0xA2    0x0118  # LATIN CAPITAL LETTER E WITH OGONEK
0xA3    0x00A3  # POUND SIGN
0xA4    0x00A7  # SECTION SIGN
0xA5    0x2022  # BULLET
0xA6    0x00B6  # PILCROW SIGN
0xA7    0x00DF  # LATIN SMALL LETTER SHARP S
0xA8    0x00AE  # REGISTERED SIGN
0xA9    0x00A9  # COPYRIGHT SIGN
0xAA    0x2122  # TRADE MARK SIGN
0xAB    0x0119  # LATIN SMALL LETTER E WITH OGONEK
0xAC    0x00A8  # DIAERESIS
0xAD    0x2260  # NOT EQUAL TO
0xAE    0x0123  # LATIN SMALL LETTER G WITH CEDILLA
0xAF    0x012E  # LATIN CAPITAL LETTER I WITH OGONEK
0xB0    0x012F  # LATIN SMALL LETTER I WITH OGONEK
0xB1    0x012A  # LATIN CAPITAL LETTER I WITH MACRON
0xB2    0x2264  # LESS-THAN OR EQUAL TO
0xB3    0x2265  # GREATER-THAN OR EQUAL TO
0xB4    0x012B  # LATIN SMALL LETTER I WITH MACRON
0xB5    0x0136  # LATIN CAPITAL LETTER K WITH CEDILLA
0xB6    0x2202  # PARTIAL DIFFERENTIAL
0xB7    0x2211  # N-ARY SUMMATION
0xB8    0x0142  # LATIN SMALL LETTER L WITH STROKE
0xB9    0x013B  # LATIN CAPITAL LETTER L WITH CEDILLA
0xBA    0x013C  # LATIN SMALL LETTER L WITH CEDILLA
0xBB    0x013D  # LATIN CAPITAL LETTER L WITH CARON
0xBC    0x013E  # LATIN SMALL LETTER L WITH CARON
0xBD    0x0139  # LATIN CAPITAL LETTER L WITH ACUTE
0xBE    0x013A  # LATIN SMALL LETTER L WITH ACUTE
0xBF    0x0145  # LATIN CAPITAL LETTER N WITH CEDILLA
0xC0    0x0146  # LATIN SMALL LETTER N WITH CEDILLA
0xC1    0x0143  # LATIN CAPITAL LETTER N WITH ACUTE
0xC2    0x00AC  # NOT SIGN
0xC3    0x221A  # SQUARE ROOT
0xC4    0x0144  # LATIN SMALL LETTER N WITH ACUTE
0xC5    0x0147  # LATIN CAPITAL LETTER N WITH CARON
0xC6    0x2206  # INCREMENT
0xC7    0x00AB  # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
0xC8    0x00BB  # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
0xC9    0x2026  # HORIZONTAL ELLIPSIS
0xCA    0x00A0  # NO-BREAK SPACE
0xCB    0x0148  # LATIN SMALL LETTER N WITH CARON
0xCC    0x0150  # LATIN CAPITAL LETTER O WITH DOUBLE ACUTE
0xCD    0x00D5  # LATIN CAPITAL LETTER O WITH TILDE
0xCE    0x0151  # LATIN SMALL LETTER O WITH DOUBLE ACUTE
0xCF    0x014C  # LATIN CAPITAL LETTER O WITH MACRON
0xD0    0x2013  # EN DASH
0xD1    0x2014  # EM DASH
0xD2    0x201C  # LEFT DOUBLE QUOTATION MARK
0xD3    0x201D  # RIGHT DOUBLE QUOTATION MARK
0xD4    0x2018  # LEFT SINGLE QUOTATION MARK
0xD5    0x2019  # RIGHT SINGLE QUOTATION MARK
0xD6    0x00F7  # DIVISION SIGN
0xD7    0x25CA  # LOZENGE
0xD8    0x014D  # LATIN SMALL LETTER O WITH MACRON
0xD9    0x0154  # LATIN CAPITAL LETTER R WITH ACUTE
0xDA    0x0155  # LATIN SMALL LETTER R WITH ACUTE
0xDB    0x0158  # LATIN CAPITAL LETTER R WITH CARON
0xDC    0x2039  # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
0xDD    0x203A  # SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
0xDE    0x0159  # LATIN SMALL LETTER R WITH CARON
0xDF    0x0156  # LATIN CAPITAL LETTER R WITH CEDILLA
0xE0    0x0157  # LATIN SMALL LETTER R WITH CEDILLA
0xE1    0x0160  # LATIN CAPITAL LETTER S WITH CARON
0xE2    0x201A  # SINGLE LOW-9 QUOTATION MARK
0xE3    0x201E  # DOUBLE LOW-9 QUOTATION MARK
0xE4    0x0161  # LATIN SMALL LETTER S WITH CARON
0xE5    0x015A  # LATIN CAPITAL LETTER S WITH ACUTE
0xE6    0x015B  # LATIN SMALL LETTER S WITH ACUTE
0xE7    0x00C1  # LATIN CAPITAL LETTER A WITH ACUTE
0xE8    0x0164  # LATIN CAPITAL LETTER T WITH CARON
0xE9    0x0165  # LATIN SMALL LETTER T WITH CARON
0xEA    0x00CD  # LATIN CAPITAL LETTER I WITH ACUTE
0xEB    0x017D  # LATIN CAPITAL LETTER Z WITH CARON
0xEC    0x017E  # LATIN SMALL LETTER Z WITH CARON
0xED    0x016A  # LATIN CAPITAL LETTER U WITH MACRON
0xEE    0x00D3  # LATIN CAPITAL LETTER O WITH ACUTE
0xEF    0x00D4  # LATIN CAPITAL LETTER O WITH CIRCUMFLEX
0xF0    0x016B  # LATIN SMALL LETTER U WITH MACRON
0xF1    0x016E  # LATIN CAPITAL LETTER U WITH RING ABOVE
0xF2    0x00DA  # LATIN CAPITAL LETTER U WITH ACUTE
0xF3    0x016F  # LATIN SMALL LETTER U WITH RING ABOVE
0xF4    0x0170  # LATIN CAPITAL LETTER U WITH DOUBLE ACUTE
0xF5    0x0171  # LATIN SMALL LETTER U WITH DOUBLE ACUTE
0xF6    0x0172  # LATIN CAPITAL LETTER U WITH OGONEK
0xF7    0x0173  # LATIN SMALL LETTER U WITH OGONEK
0xF8    0x00DD  # LATIN CAPITAL LETTER Y WITH ACUTE
0xF9    0x00FD  # LATIN SMALL LETTER Y WITH ACUTE
0xFA    0x0137  # LATIN SMALL LETTER K WITH CEDILLA
0xFB    0x017B  # LATIN CAPITAL LETTER Z WITH DOT ABOVE
0xFC    0x0141  # LATIN CAPITAL LETTER L WITH STROKE
0xFD    0x017C  # LATIN SMALL LETTER Z WITH DOT ABOVE
0xFE    0x0122  # LATIN CAPITAL LETTER G WITH CEDILLA
0xFF    0x02C7  # CARON

"

    "Maintenance notes (not part of the Apple table above):

     - This method contains no statements; its whole content is the
       comment above, which reproduces the vendor file CENTEURO.TXT.
     - Each data row reads: Mac OS Central European byte (0xNN),
       Unicode code point (0xNNNN), then a '#' comment with the
       Unicode character name.
     - Rows exist for 0x20-0x7E and 0x80-0xFF only. The bytes 0x00-0x1F
       and 0x7F are deliberately absent; per the header of the table
       they are the standard control characters.
     - 0x20-0x7E map to the identical Unicode values (ASCII); only the
       upper half 0x80-0xFF carries encoding-specific assignments.
     - Double quote characters must not appear inside the table text,
       because they would terminate the Smalltalk comment; the vendor
       header is therefore written with single quotes here.
     - NOTE(review): how and when this table is consumed is not visible
       in this file. Presumably it is read from the FIRST comment of this
       method, so keep the table first and byte-exact - confirm against
       SingleByteEncoder / the encoder code generator before changing it."
! !

!MAC_CentralEuropean class methodsFor:'documentation'!

version
    "Answer the revision identification string of this source file.
     The literal is a $Header$ style keyword string, here naming file
     revision 1.3 of 2004-03-09.
     NOTE(review): keyword strings of this form are presumably rewritten
     by the source code management system on checkin - do not edit the
     literal by hand; confirm with the repository setup."

    ^ '$Header: /cvs/stx/stx/libbasic/CharacterEncoderImplementations__MAC_CentralEuropean.st,v 1.3 2004-03-09 21:57:41 cg Exp $'
! !