/share/i18n/csmapper/APPLE/SYMBOL%UCS.src

https://bitbucket.org/freebsd/freebsd-head/ · Unknown · 321 lines · 318 code · 3 blank · 0 comment · 0 complexity · 8b2c3baaf3ef42bd5482ed2e6d2ca010 MD5 · raw file

  1. # $FreeBSD$
  2. TYPE ROWCOL
  3. NAME SYMBOL/UCS
  4. SRC_ZONE 0x00-0xFF
  5. OOB_MODE ILSEQ
  6. DST_ILSEQ 0xFFFE
  7. DST_UNIT_BITS 16
  8. BEGIN_MAP
  9. #=======================================================================
  10. # File name: SYMBOL.TXT
  11. #
  12. # Contents: Map (external version) from Mac OS Symbol
  13. # character set to Unicode 4.0 and later.
  14. #
  15. # Copyright: (c) 1994-2002, 2005 by Apple Computer, Inc., all rights
  16. # reserved.
  17. #
  18. # Contact: charsets@apple.com
  19. #
  20. # Changes:
  21. #
  22. # c02 2005-Apr-05 Change mappings for 0xBD, 0xE0. Update
  23. # header comments. Matches internal xml <c1.2>
  24. # and Text Encoding Converter 2.0.
  25. # b4,c1 2002-Dec-19 Update mappings for encoded glyph fragments
  26. # 0xBE, 0xE6-EF, 0xF4, 0xF6-FE to use new
  27. # Unicode 3.2 characters instead of sequences
  28. # involving corporate-use characters. Update
  29. # URLs, notes. Matches internal utom<b4>.
  30. # b03 1999-Sep-22 Update contact e-mail address. Matches
  31. # internal utom<b3>, ufrm<b3>, and Text
  32. # Encoding Converter version 1.5.
  33. # b02 1998-Aug-18 Encoding changed for Mac OS 8.5; add new
  34. # mapping from 0xA0 to EURO SIGN. Matches
  35. # internal utom<b3>, ufrm<b3>.
  36. # n05 1998-Feb-05 Update to match internal utom<n5>, ufrm<n15>
  37. # and Text Encoding Converter version 1.3:
  38. # Use standard Unicodes plus transcoding hints
  39. # instead of single corporate characters, also
  40. # change mappings for 0xE1 & 0xF1 from U+2329
  41. # & U+232A to their canonical decompositions;
  42. # see details below. Also update header
  43. # comments to new format.
  44. # n03 1995-Apr-15 First version (after fixing some typos).
  45. # Matches internal ufrm<n4>.
  46. #
  47. # Standard header:
  48. # ----------------
  49. #
  50. # Apple, the Apple logo, and Macintosh are trademarks of Apple
  51. # Computer, Inc., registered in the United States and other countries.
  52. # Unicode is a trademark of Unicode Inc. For the sake of brevity,
  53. # throughout this document, "Macintosh" can be used to refer to
  54. # Macintosh computers and "Unicode" can be used to refer to the
  55. # Unicode standard.
  56. #
  57. # Apple Computer, Inc. ("Apple") makes no warranty or representation,
  58. # either express or implied, with respect to this document and the
  59. # included data, its quality, accuracy, or fitness for a particular
  60. # purpose. In no event will Apple be liable for direct, indirect,
  61. # special, incidental, or consequential damages resulting from any
  62. # defect or inaccuracy in this document or the included data.
  63. #
  64. # These mapping tables and character lists are subject to change.
  65. # The latest tables should be available from the following:
  66. #
  67. # <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
  68. #
  69. # For general information about Mac OS encodings and these mapping
  70. # tables, see the file "README.TXT".
  71. #
  72. # Format:
  73. # -------
  74. #
  75. # Three tab-separated columns;
  76. # '#' begins a comment which continues to the end of the line.
  77. # Column #1 is the Mac OS Symbol code (in hex as 0xNN)
  78. # Column #2 is the corresponding Unicode or Unicode sequence
  79. # (in hex as 0xNNNN or 0xNNNN+0xNNNN).
  80. # Column #3 is a comment containing the Unicode name.
  81. # In some cases an additional comment follows the Unicode name.
  82. #
  83. # The entries are in Mac OS Symbol code order.
  84. #
  85. # Some of these mappings require the use of corporate characters.
  86. # See the file "CORPCHAR.TXT" and notes below.
  87. #
  88. # Control character mappings are not shown in this table, following
  89. # the conventions of the standard UTC mapping tables. However, the
  90. # Mac OS Symbol character set uses the standard control characters
  91. # at 0x00-0x1F and 0x7F.
  92. #
  93. # Notes on Mac OS Symbol:
  94. # -----------------------
  95. #
  96. # This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
  97. # environments, it is only supported directly in programming
  98. # interfaces for QuickDraw Text, the Script Manager, and related
  99. # Text Utilities. For other purposes it is supported via transcoding
  100. # to and from Unicode.
  101. #
  102. # The Mac OS Symbol encoding shares the script code smRoman
  103. # (0) with the Mac OS Roman encoding. To determine if the Symbol
  104. # encoding is being used, you must check if the font name is
  105. # "Symbol".
  106. #
  107. # Before Mac OS 8.5, code point 0xA0 was unused. In Mac OS 8.5
  108. # and later versions, code point 0xA0 is EURO SIGN and maps to
  109. # U+20AC (the Symbol font is updated for Mac OS 8.5 to reflect
  110. # this).
  111. #
  112. # The layout of the Mac OS Symbol character set is identical to
  113. # the layout of the Adobe Symbol encoding vector, with the
  114. # addition of the Apple logo character at 0xF0.
  115. #
  116. # This character set encodes a number of glyph fragments. Some are
  117. # used as extenders: 0x60 is used to extend radical signs, 0xBD and
  118. # 0xBE are used to extend vertical and horizontal arrows, etc. In
  119. # addition, there are top, bottom, and center sections for
  120. # parentheses, brackets, integral signs, and other signs that may
  121. # extend vertically for 2 or more lines of normal text. As of
  122. # Unicode 3.2, most of these are now encoded in Unicode; a few are
  123. # not, so these are mapped using corporate-zone Unicode characters
  124. # (see below).
  125. #
  126. # In addition, Symbol separately encodes both serif and sans-serif
  127. # forms for copyright, trademark, and registered signs. Unicode
  128. # encodes only the abstract characters, so one set of these (the
  129. # sans-serif forms) is also mapped using corporate-zone Unicode
  130. # characters (see below).
  131. #
  132. # The following code points are unused, and are not shown here:
  133. # 0x80-0x9F, 0xFF.
  134. #
  135. # Unicode mapping issues and notes:
  136. # ---------------------------------
  137. #
  138. # The goals in the mappings provided here are:
  139. # - Ensure roundtrip mapping from every character in the Mac OS
  140. # Symbol character set to Unicode and back
  141. # - Use standard Unicode characters as much as possible, to
  142. # maximize interchangeability of the resulting Unicode text.
  143. # Whenever possible, avoid having content carried by private-use
  144. # characters.
  145. #
  146. # Some of the characters in the Mac OS Symbol character set do not
  147. # correspond to distinct, single Unicode characters. To map these
  148. # and satisfy both goals above, we employ various strategies.
  149. #
  150. # a) If possible, use private use characters in combination with
  151. # standard Unicode characters to mark variants of the standard
  152. # Unicode character.
  153. #
  154. # Apple has defined a block of 32 corporate characters as "transcoding
  155. # hints." These are used in combination with standard Unicode
  156. # characters to force them to be treated in a special way for mapping
  157. # to other encodings; they have no other effect. Sixteen of these
  158. # transcoding hints are "grouping hints" - they indicate that the next
  159. # 2-4 Unicode characters should be treated as a single entity for
  160. # transcoding. The other sixteen transcoding hints are "variant tags"
  161. # - they are like combining characters, and can follow a standard
  162. # Unicode character (or a sequence consisting of a base character and other
  163. # combining characters) to cause it to be treated in a special way for
  164. # transcoding. These always terminate a combining-character sequence.
  165. #
  166. # The transcoding hint used in this mapping table is the
  167. # variant tag 0xF87F. Since this is combined with standard Unicode
  168. # characters, some characters in the Mac OS Symbol character set map
  169. # to a sequence of two Unicodes instead of a single Unicode character.
  170. #
  171. # For example, the Mac OS Symbol character at 0xE2 is an alternate,
  172. # sans-serif form of the REGISTERED SIGN (the standard mapping is for
  173. # the abstract character at 0xD2, which here has a serif form). So 0xE2
  174. # is mapped to 0x00AE (REGISTERED SIGN) + 0xF87F (a variant tag).
  175. #
  176. # b) Otherwise, use private use characters by themselves to map
  177. # Mac OS Symbol characters which have no relationship to any standard
  178. # Unicode character.
  179. #
  180. # The following additional corporate zone Unicode characters are
  181. # used for this purpose here:
  182. #
  183. # 0xF8E5 radical extender
  184. # 0xF8FF Apple logo
  185. #
  186. # NOTE: The graphic image associated with the Apple logo character
  187. # is not authorized for use without permission of Apple, and
  188. # unauthorized use might constitute trademark infringement.
  189. #
  190. # Details of mapping changes in each version:
  191. # -------------------------------------------
  192. #
  193. # Changes from version c01 to version c02:
  194. #
  195. # - Update mapping for 0xBD from 0xF8E6 to 0x23D0 (use new Unicode
  196. # 4.0 char)
  197. # - Correct mapping for 0xE0 from 0x22C4 to 0x25CA
  198. #
  199. # Changes from version b02 to version b03/c01:
  200. #
  201. # - Update mappings for encoded glyph fragments 0xBE, 0xE6-EF, 0xF4,
  202. # 0xF6-FE to use new Unicode 3.2 characters instead of using either
  203. # single corporate-use characters (e.g. 0xBE was mapped to 0xF8E7) or
  204. # sequences combining a standard Unicode character with a transcoding
  205. # hint (e.g. 0xE6 was mapped to 0x0028+0xF870).
  206. #
  207. # Changes from version n05 to version b02:
  208. #
  209. # - Encoding changed for Mac OS 8.5; 0xA0 now maps to 0x20AC, EURO
  210. # SIGN. 0xA0 was unmapped in earlier versions.
  211. #
  212. # Changes from version n03 to version n05:
  213. #
  214. # - Change strict mapping for 0xE1 & 0xF1 from U+2329 & U+232A
  215. # to their canonical decompositions, U+3008 & U+3009.
  216. #
  217. # - Change mapping for the following to use standard Unicode +
  218. # transcoding hint, instead of single corporate-zone
  219. # character: 0xE2-0xE4, 0xE6-0xEE, 0xF4, 0xF6-0xFE.
  220. #
  221. ##################
  222. 0x00 - 0x7F = 0x0000 -
  223. 0xA0 = 0x20AC
  224. 0xA1 = 0x03D2
  225. 0xA2 = 0x2032
  226. 0xA3 = 0x2264
  227. 0xA4 = 0x2044
  228. 0xA5 = 0x221E
  229. 0xA6 = 0x0192
  230. 0xA7 = 0x2663
  231. 0xA8 = 0x2666
  232. 0xA9 = 0x2665
  233. 0xAA = 0x2660
  234. 0xAB = 0x2194
  235. 0xAC = 0x2190
  236. 0xAD = 0x2191
  237. 0xAE = 0x2192
  238. 0xAF = 0x2193
  239. 0xB0 = 0x00B0
  240. 0xB1 = 0x00B1
  241. 0xB2 = 0x2033
  242. 0xB3 = 0x2265
  243. 0xB4 = 0x00D7
  244. 0xB5 = 0x221D
  245. 0xB6 = 0x2202
  246. 0xB7 = 0x2022
  247. 0xB8 = 0x00F7
  248. 0xB9 = 0x2260
  249. 0xBA = 0x2261
  250. 0xBB = 0x2248
  251. 0xBC = 0x2026
  252. 0xBD = 0x23D0
  253. 0xBE = 0x23AF
  254. 0xBF = 0x21B5
  255. 0xC0 = 0x2135
  256. 0xC1 = 0x2111
  257. 0xC2 = 0x211C
  258. 0xC3 = 0x2118
  259. 0xC4 = 0x2297
  260. 0xC5 = 0x2295
  261. 0xC6 = 0x2205
  262. 0xC7 = 0x2229
  263. 0xC8 = 0x222A
  264. 0xC9 = 0x2283
  265. 0xCA = 0x2287
  266. 0xCB = 0x2284
  267. 0xCC = 0x2282
  268. 0xCD = 0x2286
  269. 0xCE = 0x2208
  270. 0xCF = 0x2209
  271. 0xD0 = 0x2220
  272. 0xD1 = 0x2207
  273. 0xD2 = 0x00AE
  274. 0xD3 = 0x00A9
  275. 0xD4 = 0x2122
  276. 0xD5 = 0x220F
  277. 0xD6 = 0x221A
  278. 0xD7 = 0x22C5
  279. 0xD8 = 0x00AC
  280. 0xD9 = 0x2227
  281. 0xDA = 0x2228
  282. 0xDB = 0x21D4
  283. 0xDC = 0x21D0
  284. 0xDD = 0x21D1
  285. 0xDE = 0x21D2
  286. 0xDF = 0x21D3
  287. 0xE0 = 0x25CA
  288. 0xE1 = 0x3008
  289. #0xE2 = 0x00AE+0xF87F
  290. #0xE3 = 0x00A9+0xF87F
  291. #0xE4 = 0x2122+0xF87F
  292. 0xE5 = 0x2211
  293. 0xE6 = 0x239B
  294. 0xE7 = 0x239C
  295. 0xE8 = 0x239D
  296. 0xE9 = 0x23A1
  297. 0xEA = 0x23A2
  298. 0xEB = 0x23A3
  299. 0xEC = 0x23A7
  300. 0xED = 0x23A8
  301. 0xEE = 0x23A9
  302. 0xEF = 0x23AA
  303. 0xF0 = 0xF8FF
  304. 0xF1 = 0x3009
  305. 0xF2 = 0x222B
  306. 0xF3 = 0x2320
  307. 0xF4 = 0x23AE
  308. 0xF5 = 0x2321
  309. 0xF6 = 0x239E
  310. 0xF7 = 0x239F
  311. 0xF8 = 0x23A0
  312. 0xF9 = 0x23A4
  313. 0xFA = 0x23A5
  314. 0xFB = 0x23A6
  315. 0xFC = 0x23AB
  316. 0xFD = 0x23AC
  317. 0xFE = 0x23AD
  318. END_MAP