CharacterEncoderImplementations__MAC_CentralEuropean.st
author Claus Gittinger <cg@exept.de>
Fri, 05 Mar 2004 18:28:27 +0100
changeset 8081 b468050174a9
child 8114 05274a80fcc4
permissions -rw-r--r--
initial checkin

"{ Encoding: utf8 }"

"{ Package: 'stx:libbasic' }"

"{ NameSpace: CharacterEncoderImplementations }"

SingleByteEncoder subclass:#MAC_CentralEuropean
	instanceVariableNames:''
	classVariableNames:''
	poolDictionaries:''
	category:'Collections-Text-Encodings'
!


!MAC_CentralEuropean class methodsFor:'mapping'!

mapFileURL1_relativePathName
    ^ 'VENDORS/APPLE/CENTEURO.TXT'
!

mapping
"
# From: http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/CENTEURO.TXT

#=======================================================================
#   File name:  CENTEURO.TXT
#
#   Contents:   Map (external version) from Mac OS Central European
#               character set to Unicode 2.1 through Unicode 3.2.
#
#   Copyright:  (c) 1995-2002 by Apple Computer, Inc., all rights
#               reserved.
#
#   Contact:    charsets@apple.com
#
#   Changes:
#
#      b3,c1 2002-Dec-19    Update URLs. Matches internal utom<b1>.
#       b02  1999-Sep-22    Update contact e-mail address. Matches
#                           internal utom<b1>, ufrm<b1>, and Text
#                           Encoding Converter version 1.5.
#       n05  1998-Feb-05    Update header comments to new format; no
#                           mapping changes. Matches internal utom<n3>,
#                           ufrm<n13>, and Text Encoding Converter
#                           version 1.3.
#       n03  1995-Apr-15    First version (after fixing some typos).
#                           Matches internal ufrm<n5>.
#
# Standard header:
# ----------------
#
#   Apple, the Apple logo, and Macintosh are trademarks of Apple
#   Computer, Inc., registered in the United States and other countries.
#   Unicode is a trademark of Unicode Inc. For the sake of brevity,
#   throughout this document, 'Macintosh' can be used to refer to
#   Macintosh computers and 'Unicode' can be used to refer to the
#   Unicode standard.
#
#   Apple makes no warranty or representation, either express or
#   implied, with respect to these tables, their quality, accuracy, or
#   fitness for a particular purpose. In no event will Apple be liable
#   for direct, indirect, special, incidental, or consequential damages 
#   resulting from any defect or inaccuracy in this document or the
#   accompanying tables.
#
#   These mapping tables and character lists are subject to change.
#   The latest tables should be available from the following:
#
#   <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
#   For general information about Mac OS encodings and these mapping
#   tables, see the file 'README.TXT'.
#
# Format:
# -------
#
#   Three tab-separated columns;
#   '#' begins a comment which continues to the end of the line.
#     Column #1 is the Mac OS Central European code (in hex as 0xNN)
#     Column #2 is the corresponding Unicode (in hex as 0xNNNN)
#     Column #3 is a comment containing the Unicode name
#
#   The entries are in Mac OS Central European code order.
#
#   Control character mappings are not shown in this table, following
#   the conventions of the standard UTC mapping tables. However, the
#   Mac OS Central European character set uses the standard control
#   characters at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Central European:
# ---------------------------------
#
#   This character set is intended to cover the following languages:
#
#   Polish, Czech, Slovak, Hungarian, Estonian, Latvian, Lithuanian
#
#   These are written in Latin script, but using a different set of
#   of accented characters than Mac OS Roman. The Mac OS Central
#   European character set also includes a number of characters
#   needed for the Mac OS user interface and localization (e.g.
#   ellipsis, bullet, copyright sign), several typographic
#   punctuation symbols, math symbols, etc. However, it has a
#   smaller set of punctuation and symbols than Mac OS Roman. All of
#   the characters in Mac OS Central European that are also in the
#   Mac OS Roman character set are at the same code point in both
#   character sets; this improves application compatibility.
#
#   Note: This does not have the same letter repertoire as ISO
#   8859-2 (Latin-2); each has some accented letters that the other
#   does not have.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# Details of mapping changes in each version:
# -------------------------------------------
#
##################

0x20    0x0020  # SPACE
0x21    0x0021  # EXCLAMATION MARK
0x22    0x0022  # QUOTATION MARK
0x23    0x0023  # NUMBER SIGN
0x24    0x0024  # DOLLAR SIGN
0x25    0x0025  # PERCENT SIGN
0x26    0x0026  # AMPERSAND
0x27    0x0027  # APOSTROPHE
0x28    0x0028  # LEFT PARENTHESIS
0x29    0x0029  # RIGHT PARENTHESIS
0x2A    0x002A  # ASTERISK
0x2B    0x002B  # PLUS SIGN
0x2C    0x002C  # COMMA
0x2D    0x002D  # HYPHEN-MINUS
0x2E    0x002E  # FULL STOP
0x2F    0x002F  # SOLIDUS
0x30    0x0030  # DIGIT ZERO
0x31    0x0031  # DIGIT ONE
0x32    0x0032  # DIGIT TWO
0x33    0x0033  # DIGIT THREE
0x34    0x0034  # DIGIT FOUR
0x35    0x0035  # DIGIT FIVE
0x36    0x0036  # DIGIT SIX
0x37    0x0037  # DIGIT SEVEN
0x38    0x0038  # DIGIT EIGHT
0x39    0x0039  # DIGIT NINE
0x3A    0x003A  # COLON
0x3B    0x003B  # SEMICOLON
0x3C    0x003C  # LESS-THAN SIGN
0x3D    0x003D  # EQUALS SIGN
0x3E    0x003E  # GREATER-THAN SIGN
0x3F    0x003F  # QUESTION MARK
0x40    0x0040  # COMMERCIAL AT
0x41    0x0041  # LATIN CAPITAL LETTER A
0x42    0x0042  # LATIN CAPITAL LETTER B
0x43    0x0043  # LATIN CAPITAL LETTER C
0x44    0x0044  # LATIN CAPITAL LETTER D
0x45    0x0045  # LATIN CAPITAL LETTER E
0x46    0x0046  # LATIN CAPITAL LETTER F
0x47    0x0047  # LATIN CAPITAL LETTER G
0x48    0x0048  # LATIN CAPITAL LETTER H
0x49    0x0049  # LATIN CAPITAL LETTER I
0x4A    0x004A  # LATIN CAPITAL LETTER J
0x4B    0x004B  # LATIN CAPITAL LETTER K
0x4C    0x004C  # LATIN CAPITAL LETTER L
0x4D    0x004D  # LATIN CAPITAL LETTER M
0x4E    0x004E  # LATIN CAPITAL LETTER N
0x4F    0x004F  # LATIN CAPITAL LETTER O
0x50    0x0050  # LATIN CAPITAL LETTER P
0x51    0x0051  # LATIN CAPITAL LETTER Q
0x52    0x0052  # LATIN CAPITAL LETTER R
0x53    0x0053  # LATIN CAPITAL LETTER S
0x54    0x0054  # LATIN CAPITAL LETTER T
0x55    0x0055  # LATIN CAPITAL LETTER U
0x56    0x0056  # LATIN CAPITAL LETTER V
0x57    0x0057  # LATIN CAPITAL LETTER W
0x58    0x0058  # LATIN CAPITAL LETTER X
0x59    0x0059  # LATIN CAPITAL LETTER Y
0x5A    0x005A  # LATIN CAPITAL LETTER Z
0x5B    0x005B  # LEFT SQUARE BRACKET
0x5C    0x005C  # REVERSE SOLIDUS
0x5D    0x005D  # RIGHT SQUARE BRACKET
0x5E    0x005E  # CIRCUMFLEX ACCENT
0x5F    0x005F  # LOW LINE
0x60    0x0060  # GRAVE ACCENT
0x61    0x0061  # LATIN SMALL LETTER A
0x62    0x0062  # LATIN SMALL LETTER B
0x63    0x0063  # LATIN SMALL LETTER C
0x64    0x0064  # LATIN SMALL LETTER D
0x65    0x0065  # LATIN SMALL LETTER E
0x66    0x0066  # LATIN SMALL LETTER F
0x67    0x0067  # LATIN SMALL LETTER G
0x68    0x0068  # LATIN SMALL LETTER H
0x69    0x0069  # LATIN SMALL LETTER I
0x6A    0x006A  # LATIN SMALL LETTER J
0x6B    0x006B  # LATIN SMALL LETTER K
0x6C    0x006C  # LATIN SMALL LETTER L
0x6D    0x006D  # LATIN SMALL LETTER M
0x6E    0x006E  # LATIN SMALL LETTER N
0x6F    0x006F  # LATIN SMALL LETTER O
0x70    0x0070  # LATIN SMALL LETTER P
0x71    0x0071  # LATIN SMALL LETTER Q
0x72    0x0072  # LATIN SMALL LETTER R
0x73    0x0073  # LATIN SMALL LETTER S
0x74    0x0074  # LATIN SMALL LETTER T
0x75    0x0075  # LATIN SMALL LETTER U
0x76    0x0076  # LATIN SMALL LETTER V
0x77    0x0077  # LATIN SMALL LETTER W
0x78    0x0078  # LATIN SMALL LETTER X
0x79    0x0079  # LATIN SMALL LETTER Y
0x7A    0x007A  # LATIN SMALL LETTER Z
0x7B    0x007B  # LEFT CURLY BRACKET
0x7C    0x007C  # VERTICAL LINE
0x7D    0x007D  # RIGHT CURLY BRACKET
0x7E    0x007E  # TILDE
#
0x80    0x00C4  # LATIN CAPITAL LETTER A WITH DIAERESIS
0x81    0x0100  # LATIN CAPITAL LETTER A WITH MACRON
0x82    0x0101  # LATIN SMALL LETTER A WITH MACRON
0x83    0x00C9  # LATIN CAPITAL LETTER E WITH ACUTE
0x84    0x0104  # LATIN CAPITAL LETTER A WITH OGONEK
0x85    0x00D6  # LATIN CAPITAL LETTER O WITH DIAERESIS
0x86    0x00DC  # LATIN CAPITAL LETTER U WITH DIAERESIS
0x87    0x00E1  # LATIN SMALL LETTER A WITH ACUTE
0x88    0x0105  # LATIN SMALL LETTER A WITH OGONEK
0x89    0x010C  # LATIN CAPITAL LETTER C WITH CARON
0x8A    0x00E4  # LATIN SMALL LETTER A WITH DIAERESIS
0x8B    0x010D  # LATIN SMALL LETTER C WITH CARON
0x8C    0x0106  # LATIN CAPITAL LETTER C WITH ACUTE
0x8D    0x0107  # LATIN SMALL LETTER C WITH ACUTE
0x8E    0x00E9  # LATIN SMALL LETTER E WITH ACUTE
0x8F    0x0179  # LATIN CAPITAL LETTER Z WITH ACUTE
0x90    0x017A  # LATIN SMALL LETTER Z WITH ACUTE
0x91    0x010E  # LATIN CAPITAL LETTER D WITH CARON
0x92    0x00ED  # LATIN SMALL LETTER I WITH ACUTE
0x93    0x010F  # LATIN SMALL LETTER D WITH CARON
0x94    0x0112  # LATIN CAPITAL LETTER E WITH MACRON
0x95    0x0113  # LATIN SMALL LETTER E WITH MACRON
0x96    0x0116  # LATIN CAPITAL LETTER E WITH DOT ABOVE
0x97    0x00F3  # LATIN SMALL LETTER O WITH ACUTE
0x98    0x0117  # LATIN SMALL LETTER E WITH DOT ABOVE
0x99    0x00F4  # LATIN SMALL LETTER O WITH CIRCUMFLEX
0x9A    0x00F6  # LATIN SMALL LETTER O WITH DIAERESIS
0x9B    0x00F5  # LATIN SMALL LETTER O WITH TILDE
0x9C    0x00FA  # LATIN SMALL LETTER U WITH ACUTE
0x9D    0x011A  # LATIN CAPITAL LETTER E WITH CARON
0x9E    0x011B  # LATIN SMALL LETTER E WITH CARON
0x9F    0x00FC  # LATIN SMALL LETTER U WITH DIAERESIS
0xA0    0x2020  # DAGGER
0xA1    0x00B0  # DEGREE SIGN
0xA2    0x0118  # LATIN CAPITAL LETTER E WITH OGONEK
0xA3    0x00A3  # POUND SIGN
0xA4    0x00A7  # SECTION SIGN
0xA5    0x2022  # BULLET
0xA6    0x00B6  # PILCROW SIGN
0xA7    0x00DF  # LATIN SMALL LETTER SHARP S
0xA8    0x00AE  # REGISTERED SIGN
0xA9    0x00A9  # COPYRIGHT SIGN
0xAA    0x2122  # TRADE MARK SIGN
0xAB    0x0119  # LATIN SMALL LETTER E WITH OGONEK
0xAC    0x00A8  # DIAERESIS
0xAD    0x2260  # NOT EQUAL TO
0xAE    0x0123  # LATIN SMALL LETTER G WITH CEDILLA
0xAF    0x012E  # LATIN CAPITAL LETTER I WITH OGONEK
0xB0    0x012F  # LATIN SMALL LETTER I WITH OGONEK
0xB1    0x012A  # LATIN CAPITAL LETTER I WITH MACRON
0xB2    0x2264  # LESS-THAN OR EQUAL TO
0xB3    0x2265  # GREATER-THAN OR EQUAL TO
0xB4    0x012B  # LATIN SMALL LETTER I WITH MACRON
0xB5    0x0136  # LATIN CAPITAL LETTER K WITH CEDILLA
0xB6    0x2202  # PARTIAL DIFFERENTIAL
0xB7    0x2211  # N-ARY SUMMATION
0xB8    0x0142  # LATIN SMALL LETTER L WITH STROKE
0xB9    0x013B  # LATIN CAPITAL LETTER L WITH CEDILLA
0xBA    0x013C  # LATIN SMALL LETTER L WITH CEDILLA
0xBB    0x013D  # LATIN CAPITAL LETTER L WITH CARON
0xBC    0x013E  # LATIN SMALL LETTER L WITH CARON
0xBD    0x0139  # LATIN CAPITAL LETTER L WITH ACUTE
0xBE    0x013A  # LATIN SMALL LETTER L WITH ACUTE
0xBF    0x0145  # LATIN CAPITAL LETTER N WITH CEDILLA
0xC0    0x0146  # LATIN SMALL LETTER N WITH CEDILLA
0xC1    0x0143  # LATIN CAPITAL LETTER N WITH ACUTE
0xC2    0x00AC  # NOT SIGN
0xC3    0x221A  # SQUARE ROOT
0xC4    0x0144  # LATIN SMALL LETTER N WITH ACUTE
0xC5    0x0147  # LATIN CAPITAL LETTER N WITH CARON
0xC6    0x2206  # INCREMENT
0xC7    0x00AB  # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
0xC8    0x00BB  # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
0xC9    0x2026  # HORIZONTAL ELLIPSIS
0xCA    0x00A0  # NO-BREAK SPACE
0xCB    0x0148  # LATIN SMALL LETTER N WITH CARON
0xCC    0x0150  # LATIN CAPITAL LETTER O WITH DOUBLE ACUTE
0xCD    0x00D5  # LATIN CAPITAL LETTER O WITH TILDE
0xCE    0x0151  # LATIN SMALL LETTER O WITH DOUBLE ACUTE
0xCF    0x014C  # LATIN CAPITAL LETTER O WITH MACRON
0xD0    0x2013  # EN DASH
0xD1    0x2014  # EM DASH
0xD2    0x201C  # LEFT DOUBLE QUOTATION MARK
0xD3    0x201D  # RIGHT DOUBLE QUOTATION MARK
0xD4    0x2018  # LEFT SINGLE QUOTATION MARK
0xD5    0x2019  # RIGHT SINGLE QUOTATION MARK
0xD6    0x00F7  # DIVISION SIGN
0xD7    0x25CA  # LOZENGE
0xD8    0x014D  # LATIN SMALL LETTER O WITH MACRON
0xD9    0x0154  # LATIN CAPITAL LETTER R WITH ACUTE
0xDA    0x0155  # LATIN SMALL LETTER R WITH ACUTE
0xDB    0x0158  # LATIN CAPITAL LETTER R WITH CARON
0xDC    0x2039  # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
0xDD    0x203A  # SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
0xDE    0x0159  # LATIN SMALL LETTER R WITH CARON
0xDF    0x0156  # LATIN CAPITAL LETTER R WITH CEDILLA
0xE0    0x0157  # LATIN SMALL LETTER R WITH CEDILLA
0xE1    0x0160  # LATIN CAPITAL LETTER S WITH CARON
0xE2    0x201A  # SINGLE LOW-9 QUOTATION MARK
0xE3    0x201E  # DOUBLE LOW-9 QUOTATION MARK
0xE4    0x0161  # LATIN SMALL LETTER S WITH CARON
0xE5    0x015A  # LATIN CAPITAL LETTER S WITH ACUTE
0xE6    0x015B  # LATIN SMALL LETTER S WITH ACUTE
0xE7    0x00C1  # LATIN CAPITAL LETTER A WITH ACUTE
0xE8    0x0164  # LATIN CAPITAL LETTER T WITH CARON
0xE9    0x0165  # LATIN SMALL LETTER T WITH CARON
0xEA    0x00CD  # LATIN CAPITAL LETTER I WITH ACUTE
0xEB    0x017D  # LATIN CAPITAL LETTER Z WITH CARON
0xEC    0x017E  # LATIN SMALL LETTER Z WITH CARON
0xED    0x016A  # LATIN CAPITAL LETTER U WITH MACRON
0xEE    0x00D3  # LATIN CAPITAL LETTER O WITH ACUTE
0xEF    0x00D4  # LATIN CAPITAL LETTER O WITH CIRCUMFLEX
0xF0    0x016B  # LATIN SMALL LETTER U WITH MACRON
0xF1    0x016E  # LATIN CAPITAL LETTER U WITH RING ABOVE
0xF2    0x00DA  # LATIN CAPITAL LETTER U WITH ACUTE
0xF3    0x016F  # LATIN SMALL LETTER U WITH RING ABOVE
0xF4    0x0170  # LATIN CAPITAL LETTER U WITH DOUBLE ACUTE
0xF5    0x0171  # LATIN SMALL LETTER U WITH DOUBLE ACUTE
0xF6    0x0172  # LATIN CAPITAL LETTER U WITH OGONEK
0xF7    0x0173  # LATIN SMALL LETTER U WITH OGONEK
0xF8    0x00DD  # LATIN CAPITAL LETTER Y WITH ACUTE
0xF9    0x00FD  # LATIN SMALL LETTER Y WITH ACUTE
0xFA    0x0137  # LATIN SMALL LETTER K WITH CEDILLA
0xFB    0x017B  # LATIN CAPITAL LETTER Z WITH DOT ABOVE
0xFC    0x0141  # LATIN CAPITAL LETTER L WITH STROKE
0xFD    0x017C  # LATIN SMALL LETTER Z WITH DOT ABOVE
0xFE    0x0122  # LATIN CAPITAL LETTER G WITH CEDILLA
0xFF    0x02C7  # CARON

"
! !

!MAC_CentralEuropean class methodsFor:'queries'!

namesOfEncoding
    ^ #( #'mac-centraleuropean' #'mac-centraleurope' 'maccentraleurope' 'maccentraleuropean' )
! !

!MAC_CentralEuropean class methodsFor:'documentation'!

version
    ^ '$Header: /cvs/stx/stx/libbasic/CharacterEncoderImplementations__MAC_CentralEuropean.st,v 1.1 2004-03-05 17:19:00 cg Exp $'
! !