diff options
Diffstat (limited to 'tools/encoding/macTurkish.txt')
-rw-r--r-- | tools/encoding/macTurkish.txt | 119 |
1 files changed, 82 insertions, 37 deletions
diff --git a/tools/encoding/macTurkish.txt b/tools/encoding/macTurkish.txt index 6daa774..7b143e0 100644 --- a/tools/encoding/macTurkish.txt +++ b/tools/encoding/macTurkish.txt @@ -1,11 +1,28 @@ +#======================================================================= +# FTP file name: TURKISH.TXT # -# Name: MacOS_Turkish [to Unicode] -# Unicode versions: 1.1, 2.0 -# Table version: 0.2 (from internal ufrm version <4>) -# Date: 15 April 1995 -# Author: Peter Edberg <edberg1@applelink.apple.com> +# Contents: Map (external version) from Mac OS Turkish +# character set to Unicode 2.1 # -# Copyright (c) 1995 Apple Computer, Inc. All Rights reserved. +# Copyright: (c) 1995-1999 by Apple Computer, Inc., all rights +# reserved. +# +# Contact: charsets@apple.com +# +# Changes: +# +# b02 1999-Sep-22 Update contact e-mail address. Matches +# internal utom<b1>, ufrm<b1>, and Text +# Encoding Converter version 1.5. +# n05 1998-Feb-05 Minor update to header comments +# n03 1997-Dec-14 Update to match internal utom<n5>, ufrm<n15>: +# Change standard mapping for 0xBD from U+2126 +# to its canonical decomposition, U+03A9. +# n02 1995-Apr-15 First version (after fixing some typos). +# Matches internal ufrm<n4>. +# +# Standard header: +# ---------------- # # Apple, the Apple logo, and Macintosh are trademarks of Apple # Computer, Inc., registered in the United States and other countries. @@ -17,49 +34,77 @@ # Apple makes no warranty or representation, either express or # implied, with respect to these tables, their quality, accuracy, or # fitness for a particular purpose. In no event will Apple be liable -# for direct, indirect, special, incidental, or consequential damages +# for direct, indirect, special, incidental, or consequential damages # resulting from any defect or inaccuracy in this document or the # accompanying tables. # -# These mapping tables and character lists are preliminary and -# subject to change. Updated tables will be available from the -# Unicode Inc. 
ftp site (unicode.org), the Apple Computer ftp site -# (ftp.info.apple.com), the Apple Computer World-Wide Web pages -# (http://www.info.apple.com), and possibly on diskette from APDA -# (Apple's mail-order distribution service for developers). +# These mapping tables and character lists are subject to change. +# The latest tables should be available from the following: +# +# <ftp://ftp.unicode.org/Public/MAPPINGS/VENDORS/APPLE/> +# <ftp://dev.apple.com/devworld/Technical_Documentation/Misc._Standards/> # -# Format: -# ------- +# For general information about Mac OS encodings and these mapping +# tables, see the file "README.TXT". +# +# Format: +# ------- # # Three tab-separated columns; # '#' begins a comment which continues to the end of the line. -# Column #1 is the MacOS Turkish code (in hex as 0xNN) -# Column #2 is the Unicode (in hex as 0xNNNN) -# Column #3 is the Unicode name (follows a comment sign, '#') +# Column #1 is the Mac OS Turkish code (in hex as 0xNN) +# Column #2 is the corresponding Unicode (in hex as 0xNNNN) +# Column #3 is a comment containing the Unicode name +# +# The entries are in Mac OS Turkish code order. +# +# Two of these mappings require the use of a corporate character. +# See the file "CORPCHAR.TXT" and notes below. +# +# Control character mappings are not shown in this table, following +# the conventions of the standard UTC mapping tables. However, the +# Mac OS Turkish character set uses the standard control characters at +# 0x00-0x1F and 0x7F. +# +# Notes on Mac OS Turkish: +# ------------------------ # -# The entries are in MacOS Turkish code order. +# Mac OS Turkish is used for Turkish. +# +# The Mac OS Turkish encoding shares the script code smRoman +# (0) with the Mac OS Roman encoding. To determine if the Turkish +# encoding is being used, you must also check if the system region +# code is 24, verTurkey. +# +# This character set is a variant of standard Mac OS Roman. 
It adds +# upper & lower G with breve, upper & lower S with cedilla, upper I +# with dot, and moves the dotless lower i from its position at 0xF5 +# in standard Mac OS Roman to a position at 0xDD here (leaving the +# 0xF5 code point undefined in Mac OS Turkish). This gives a total +# of 7 code point differences from standard Mac OS Roman. +# +# Unicode mapping issues and notes: +# --------------------------------- +# +# The following corporate zone Unicode characters are used in this +# mapping: +# +# 0xF8A0 undefined1, used to map the single undefined code point +# in Mac OS Turkish and Greek (to obtain roundtrip +# fidelity for all code points). +# 0xF8FF Apple logo # -# Two of these mappings requires the use of a corporate character: -# for the Apple logo character, and for the one undefined code -# point. See the file "MacOS-CorpCharList". # NOTE: The graphic image associated with the Apple logo character # is not authorized for use without permission of Apple, and # unauthorized use might constitute trademark infringement. # -# Notes on MacOS Turkish: -# ----------------------- +# Details of mapping changes in each version: +# ------------------------------------------- # -# The MacOS Turkish encoding shares the script code smRoman -# (0) with the standard MacOS Roman encoding. To determine if -# the Turkish encoding is being used, you must also check if the -# system region code is 24, verTurkey. +# Changes from version n02 to version n03: # -# This character set is a variant of standard MacOS Roman. It adds -# upper & lower G with breve, upper & lower S with cedilla, upper I -# with dot, and moves the dotless lower i from its position at 0xF5 -# in standard MacOS Roman to a position at 0xDD here (leaving the -# 0xF5 code point undefined in MacTurkish). This gives a total of 7 -# code point differences from standard MacOS Roman. +# - Change mapping of 0xBD from U+2126 to its canonical +# decomposition, U+03A9. 
# ################## @@ -205,7 +250,7 @@ 0xAB 0x00B4 # ACUTE ACCENT 0xAC 0x00A8 # DIAERESIS 0xAD 0x2260 # NOT EQUAL TO -0xAE 0x00C6 # LATIN CAPITAL LIGATURE AE +0xAE 0x00C6 # LATIN CAPITAL LETTER AE 0xAF 0x00D8 # LATIN CAPITAL LETTER O WITH STROKE 0xB0 0x221E # INFINITY 0xB1 0x00B1 # PLUS-MINUS SIGN @@ -220,8 +265,8 @@ 0xBA 0x222B # INTEGRAL 0xBB 0x00AA # FEMININE ORDINAL INDICATOR 0xBC 0x00BA # MASCULINE ORDINAL INDICATOR -0xBD 0x2126 # OHM SIGN -0xBE 0x00E6 # LATIN SMALL LIGATURE AE +0xBD 0x03A9 # GREEK CAPITAL LETTER OMEGA +0xBE 0x00E6 # LATIN SMALL LETTER AE 0xBF 0x00F8 # LATIN SMALL LETTER O WITH STROKE 0xC0 0x00BF # INVERTED QUESTION MARK 0xC1 0x00A1 # INVERTED EXCLAMATION MARK |