Import locale tools and ressource files

This commit requires special steps, please checkout docs/UPDATING.

Tools:
 - gencat
 - locale
 - mkcsmapper
 - mkesdb
 - mklocale

Libs:
 - i18n_module
 - libintl

Ressources:
 - i18n
 - locale

Change-Id: I559d0399d8e98bcee15225cab786e43f31506207
This commit is contained in:
Lionel Sambuc 2016-06-20 18:30:51 +02:00
parent 733a844ac6
commit 36dcc4a4a9
1369 changed files with 623024 additions and 9 deletions

File diff suppressed because it is too large Load Diff

View File

@ -1126,6 +1126,7 @@
./usr/include/libelf.h minix-comp
./usr/include/libexec.h minix-comp
./usr/include/libgen.h minix-comp
./usr/include/libintl.h minix-comp
./usr/include/libutil.h minix-comp
./usr/include/limits.h minix-comp
./usr/include/link.h minix-comp
@ -1899,6 +1900,7 @@
./usr/lib/bc/libhgfs.a minix-comp bitcode
./usr/lib/bc/libiberty.a minix-comp bitcode,binutils
./usr/lib/bc/libinputdriver.a minix-comp bitcode
./usr/lib/bc/libintl.a minix-comp bitcode
./usr/lib/bc/libkvm.a minix-comp bitcode
./usr/lib/bc/libl.a minix-comp bitcode
./usr/lib/bc/liblua.a minix-comp bitcode
@ -1937,6 +1939,53 @@
./usr/lib/bc/libvirtio.a minix-comp bitcode
./usr/lib/bc/libvtreefs.a minix-comp bitcode
./usr/lib/bc/libz.a minix-comp bitcode
./usr/lib/i18n/bc minix-comp bitcode
./usr/lib/i18n/bc/libBIG5.a minix-comp bitcode
./usr/lib/i18n/bc/libDECHanyu.a minix-comp bitcode
./usr/lib/i18n/bc/libEUC.a minix-comp bitcode
./usr/lib/i18n/bc/libEUCTW.a minix-comp bitcode
./usr/lib/i18n/bc/libGBK2K.a minix-comp bitcode
./usr/lib/i18n/bc/libHZ.a minix-comp bitcode
./usr/lib/i18n/bc/libISO2022.a minix-comp bitcode
./usr/lib/i18n/bc/libJOHAB.a minix-comp bitcode
./usr/lib/i18n/bc/libMSKanji.a minix-comp bitcode
./usr/lib/i18n/bc/libUES.a minix-comp bitcode
./usr/lib/i18n/bc/libUTF1632.a minix-comp bitcode
./usr/lib/i18n/bc/libUTF7.a minix-comp bitcode
./usr/lib/i18n/bc/libUTF8.a minix-comp bitcode
./usr/lib/i18n/bc/libVIQR.a minix-comp bitcode
./usr/lib/i18n/bc/libZW.a minix-comp bitcode
./usr/lib/i18n/bc/libiconv_none.a minix-comp bitcode
./usr/lib/i18n/bc/libiconv_std.a minix-comp bitcode
./usr/lib/i18n/bc/libmapper_646.a minix-comp bitcode
./usr/lib/i18n/bc/libmapper_none.a minix-comp bitcode
./usr/lib/i18n/bc/libmapper_parallel.a minix-comp bitcode
./usr/lib/i18n/bc/libmapper_serial.a minix-comp bitcode
./usr/lib/i18n/bc/libmapper_std.a minix-comp bitcode
./usr/lib/i18n/bc/libmapper_zone.a minix-comp bitcode
./usr/lib/i18n/libBIG5.a minix-comp
./usr/lib/i18n/libDECHanyu.a minix-comp
./usr/lib/i18n/libEUC.a minix-comp
./usr/lib/i18n/libEUCTW.a minix-comp
./usr/lib/i18n/libGBK2K.a minix-comp
./usr/lib/i18n/libHZ.a minix-comp
./usr/lib/i18n/libISO2022.a minix-comp
./usr/lib/i18n/libJOHAB.a minix-comp
./usr/lib/i18n/libMSKanji.a minix-comp
./usr/lib/i18n/libUES.a minix-comp
./usr/lib/i18n/libUTF1632.a minix-comp
./usr/lib/i18n/libUTF7.a minix-comp
./usr/lib/i18n/libUTF8.a minix-comp
./usr/lib/i18n/libVIQR.a minix-comp
./usr/lib/i18n/libZW.a minix-comp
./usr/lib/i18n/libiconv_none.a minix-comp
./usr/lib/i18n/libiconv_std.a minix-comp
./usr/lib/i18n/libmapper_646.a minix-comp
./usr/lib/i18n/libmapper_none.a minix-comp
./usr/lib/i18n/libmapper_parallel.a minix-comp
./usr/lib/i18n/libmapper_serial.a minix-comp
./usr/lib/i18n/libmapper_std.a minix-comp
./usr/lib/i18n/libmapper_zone.a minix-comp
./usr/lib/libarchive.a minix-comp
./usr/lib/libarchive_pic.a minix-comp
./usr/lib/libasyn.a minix-comp
@ -1995,6 +2044,8 @@
./usr/lib/libgcov.a minix-comp gcc=45,!gcccmds
./usr/lib/libinputdriver.a minix-comp
./usr/lib/libinputdriver_pic.a minix-comp
./usr/lib/libintl.a minix-comp
./usr/lib/libintl_pic.a minix-comp
./usr/lib/libkvm.a minix-comp
./usr/lib/libkvm_pic.a minix-comp
./usr/lib/libl.a minix-comp

View File

@ -122,6 +122,7 @@
./usr/man/man1/fsplit.1 minix-man
./usr/man/man1/ftp.1 minix-man
./usr/man/man1/genassym.1 minix-man
./usr/man/man1/gencat.1 minix-man
./usr/man/man1/getopt.1 minix-man
./usr/man/man1/getopts.1 minix-man obsolete
./usr/man/man1/gprof.1 minix-man binutils
@ -187,6 +188,7 @@
./usr/man/man1/loadfont.1 minix-man
./usr/man/man1/loadkeys.1 minix-man
./usr/man/man1/local.1 minix-man obsolete
./usr/man/man1/locale.1 minix-man
./usr/man/man1/lock.1 minix-man
./usr/man/man1/logger.1 minix-man
./usr/man/man1/login.1 minix-man
@ -220,6 +222,7 @@
./usr/man/man1/mkdir.1 minix-man
./usr/man/man1/mkfifo.1 minix-man
./usr/man/man1/mkfs.mfs.1 minix-man
./usr/man/man1/mklocale.1 minix-man
./usr/man/man1/mkproto.1 minix-man
./usr/man/man1/mkstr.1 minix-man
./usr/man/man1/mktemp.1 minix-man
@ -1112,6 +1115,8 @@
./usr/man/man3/bcmp.3 minix-man
./usr/man/man3/bcopy.3 minix-man
./usr/man/man3/beep.3 minix-man
./usr/man/man3/bind_textdomain_codeset.3 minix-man
./usr/man/man3/bindtextdomain.3 minix-man
./usr/man/man3/bkgd.3 minix-man
./usr/man/man3/bkgdset.3 minix-man
./usr/man/man3/blacklist.3 minix-man
@ -1351,6 +1356,8 @@
./usr/man/man3/dbm_open.3 minix-man
./usr/man/man3/dbm_store.3 minix-man
./usr/man/man3/dbopen.3 minix-man
./usr/man/man3/dcgettext.3 minix-man
./usr/man/man3/dcngettext.3 minix-man
./usr/man/man3/def_prog_mode.3 minix-man
./usr/man/man3/def_shell_mode.3 minix-man
./usr/man/man3/define_key.3 minix-man
@ -1399,6 +1406,7 @@
./usr/man/man3/des_string_to_key.3 minix-man crypto
./usr/man/man3/des_xcbc_encrypt.3 minix-man crypto
./usr/man/man3/devname.3 minix-man
./usr/man/man3/dgettext.3 minix-man
./usr/man/man3/difftime.3 minix-man
./usr/man/man3/directory.3 minix-man
./usr/man/man3/dirfd.3 minix-man
@ -1406,6 +1414,7 @@
./usr/man/man3/div.3 minix-man
./usr/man/man3/dn_comp.3 minix-man
./usr/man/man3/dn_expand.3 minix-man
./usr/man/man3/dngettext.3 minix-man
./usr/man/man3/doupdate.3 minix-man
./usr/man/man3/dprintf.3 minix-man
./usr/man/man3/drand48.3 minix-man
@ -1866,6 +1875,7 @@
./usr/man/man3/getservent.3 minix-man
./usr/man/man3/getstr.3 minix-man
./usr/man/man3/getsubopt.3 minix-man
./usr/man/man3/gettext.3 minix-man
./usr/man/man3/gettmode.3 minix-man
./usr/man/man3/getttyent.3 minix-man
./usr/man/man3/getttynam.3 minix-man
@ -2300,6 +2310,7 @@
./usr/man/man3/nexttoward.3 minix-man
./usr/man/man3/nexttowardf.3 minix-man
./usr/man/man3/nftw.3 minix-man
./usr/man/man3/ngettext.3 minix-man
./usr/man/man3/nice.3 minix-man
./usr/man/man3/nl.3 minix-man
./usr/man/man3/nl_langinfo.3 minix-man
@ -2987,6 +2998,7 @@
./usr/man/man3/termcap.3 minix-man
./usr/man/man3/terminfo.3 minix-man
./usr/man/man3/termname.3 minix-man
./usr/man/man3/textdomain.3 minix-man
./usr/man/man3/tfind.3 minix-man
./usr/man/man3/tgamma.3 minix-man
./usr/man/man3/tgammaf.3 minix-man

View File

@ -1,3 +1,14 @@
20160702:
Some tools are required to generate the locale resources which are
embedded into libintl, which is why you need to run the following:
for t in gencat locale mkcsmapper mkesdb mklocale
do
make -C /usr/src/usr.bin/${t} all install
done
Then the usual "make build".
20150623:
In order to use the new Unix98 PTYs, and to ensure that the test set
continues to pass, please add the following line to your /etc/fstab:

View File

@ -1,5 +1,6 @@
/set type=dir uid=0 gid=0 mode=0755
./usr/lib/i18n/bc
./usr/tests/lib
./usr/tests/lib/csu
./usr/tests/lib/csu/bc

View File

@ -120,6 +120,7 @@
./usr/include/ufs/mfs
./usr/include/ufs/ufs
./usr/lib
./usr/lib/i18n
./usr/lib/bc
./usr/lib/cawf
./usr/lib/keymaps
@ -137,6 +138,7 @@
./usr/libdata/debug/usr/bin
./usr/libdata/debug/usr/games
./usr/libdata/debug/usr/lib
./usr/libdata/debug/usr/lib/i18n
./usr/libdata/debug/usr/libexec
./usr/libdata/debug/usr/mdec
./usr/libdata/debug/usr/sbin
@ -160,9 +162,9 @@
./usr/pkg/var/run
./usr/preserve
./usr/run
./usr/sbin
./usr/service
./usr/service/asr
./usr/sbin
./usr/share
./usr/share/atf
./usr/share/calendar
@ -190,6 +192,45 @@
./usr/share/examples/tmux
./usr/share/games
./usr/share/games/fortune
./usr/share/i18n
./usr/share/i18n/csmapper
./usr/share/i18n/csmapper/APPLE
./usr/share/i18n/csmapper/AST
./usr/share/i18n/csmapper/BIG5
./usr/share/i18n/csmapper/CBM
./usr/share/i18n/csmapper/CNS
./usr/share/i18n/csmapper/CP
./usr/share/i18n/csmapper/EBCDIC
./usr/share/i18n/csmapper/GB
./usr/share/i18n/csmapper/GEORGIAN
./usr/share/i18n/csmapper/ISO-8859
./usr/share/i18n/csmapper/ISO646
./usr/share/i18n/csmapper/JIS
./usr/share/i18n/csmapper/KAZAKH
./usr/share/i18n/csmapper/KOI
./usr/share/i18n/csmapper/KS
./usr/share/i18n/csmapper/MISC
./usr/share/i18n/csmapper/TCVN
./usr/share/i18n/esdb
./usr/share/i18n/esdb/APPLE
./usr/share/i18n/esdb/AST
./usr/share/i18n/esdb/BIG5
./usr/share/i18n/esdb/CBM
./usr/share/i18n/esdb/CP
./usr/share/i18n/esdb/DEC
./usr/share/i18n/esdb/EBCDIC
./usr/share/i18n/esdb/EUC
./usr/share/i18n/esdb/GB
./usr/share/i18n/esdb/GEORGIAN
./usr/share/i18n/esdb/ISO-2022
./usr/share/i18n/esdb/ISO-8859
./usr/share/i18n/esdb/ISO646
./usr/share/i18n/esdb/KAZAKH
./usr/share/i18n/esdb/KOI
./usr/share/i18n/esdb/MISC
./usr/share/i18n/esdb/TCVN
./usr/share/i18n/esdb/UTF
./usr/share/i18n/iconv
./usr/share/info
./usr/share/keymaps
./usr/share/kyua-atf-compat
@ -197,10 +238,415 @@
./usr/share/kyua-cli/misc
./usr/share/kyua-cli/store
./usr/share/legal
./usr/share/locale
./usr/share/locale/af_ZA.ISO8859-1
./usr/share/locale/af_ZA.ISO8859-1/LC_MESSAGES
./usr/share/locale/af_ZA.ISO8859-15
./usr/share/locale/af_ZA.ISO8859-15/LC_MESSAGES
./usr/share/locale/af_ZA.UTF-8
./usr/share/locale/af_ZA.UTF-8/LC_MESSAGES
./usr/share/locale/be
./usr/share/locale/be/LC_MESSAGES
./usr/share/locale/be_BY.CP1251
./usr/share/locale/be_BY.CP1251/LC_MESSAGES
./usr/share/locale/be_BY.ISO8859-5
./usr/share/locale/be_BY.ISO8859-5/LC_MESSAGES
./usr/share/locale/be_BY.UTF-8
./usr/share/locale/be_BY.UTF-8/LC_MESSAGES
./usr/share/locale/bg_BG.CP1251
./usr/share/locale/bg_BG.CP1251/LC_MESSAGES
./usr/share/locale/bg_BG.UTF-8
./usr/share/locale/bg_BG.UTF-8/LC_MESSAGES
./usr/share/locale/ca
./usr/share/locale/ca/LC_MESSAGES
./usr/share/locale/ca_ES.ISO8859-1
./usr/share/locale/ca_ES.ISO8859-1/LC_MESSAGES
./usr/share/locale/ca_ES.ISO8859-15
./usr/share/locale/ca_ES.ISO8859-15/LC_MESSAGES
./usr/share/locale/ca_ES.UTF-8
./usr/share/locale/ca_ES.UTF-8/LC_MESSAGES
./usr/share/locale/cs
./usr/share/locale/cs/LC_MESSAGES
./usr/share/locale/cs_CZ.ISO8859-2
./usr/share/locale/cs_CZ.ISO8859-2/LC_MESSAGES
./usr/share/locale/cs_CZ.UTF-8
./usr/share/locale/cs_CZ.UTF-8/LC_MESSAGES
./usr/share/locale/da
./usr/share/locale/da/LC_MESSAGES
./usr/share/locale/da_DK.ISO8859-1
./usr/share/locale/da_DK.ISO8859-1/LC_MESSAGES
./usr/share/locale/da_DK.ISO8859-15
./usr/share/locale/da_DK.ISO8859-15/LC_MESSAGES
./usr/share/locale/da_DK.UTF-8
./usr/share/locale/da_DK.UTF-8/LC_MESSAGES
./usr/share/locale/de
./usr/share/locale/de/LC_MESSAGES
./usr/share/locale/de_AT
./usr/share/locale/de_AT.ISO8859-1
./usr/share/locale/de_AT.ISO8859-1/LC_MESSAGES
./usr/share/locale/de_AT.ISO8859-15
./usr/share/locale/de_AT.ISO8859-15/LC_MESSAGES
./usr/share/locale/de_AT.UTF-8
./usr/share/locale/de_AT.UTF-8/LC_MESSAGES
./usr/share/locale/de_AT/LC_MESSAGES
./usr/share/locale/de_CH.ISO8859-1
./usr/share/locale/de_CH.ISO8859-1/LC_MESSAGES
./usr/share/locale/de_CH.ISO8859-15
./usr/share/locale/de_CH.ISO8859-15/LC_MESSAGES
./usr/share/locale/de_CH.UTF-8
./usr/share/locale/de_CH.UTF-8/LC_MESSAGES
./usr/share/locale/de_DE.ISO8859-1
./usr/share/locale/de_DE.ISO8859-1/LC_MESSAGES
./usr/share/locale/de_DE.ISO8859-15
./usr/share/locale/de_DE.ISO8859-15/LC_MESSAGES
./usr/share/locale/de_DE.UTF-8
./usr/share/locale/de_DE.UTF-8/LC_MESSAGES
./usr/share/locale/el
./usr/share/locale/el/LC_MESSAGES
./usr/share/locale/el_GR.ISO8859-7
./usr/share/locale/el_GR.ISO8859-7/LC_MESSAGES
./usr/share/locale/el_GR.UTF-8
./usr/share/locale/el_GR.UTF-8/LC_MESSAGES
./usr/share/locale/en@boldquot
./usr/share/locale/en@boldquot/LC_MESSAGES
./usr/share/locale/en@quot
./usr/share/locale/en@quot/LC_MESSAGES
./usr/share/locale/en_AU.ISO8859-1
./usr/share/locale/en_AU.ISO8859-1/LC_MESSAGES
./usr/share/locale/en_AU.ISO8859-15
./usr/share/locale/en_AU.ISO8859-15/LC_MESSAGES
./usr/share/locale/en_AU.UTF-8
./usr/share/locale/en_AU.UTF-8/LC_MESSAGES
./usr/share/locale/en_CA.ISO8859-1
./usr/share/locale/en_CA.ISO8859-1/LC_MESSAGES
./usr/share/locale/en_CA.ISO8859-15
./usr/share/locale/en_CA.ISO8859-15/LC_MESSAGES
./usr/share/locale/en_CA.UTF-8
./usr/share/locale/en_CA.UTF-8/LC_MESSAGES
./usr/share/locale/en_GB.ISO8859-1
./usr/share/locale/en_GB.ISO8859-1/LC_MESSAGES
./usr/share/locale/en_GB.ISO8859-15
./usr/share/locale/en_GB.ISO8859-15/LC_MESSAGES
./usr/share/locale/en_GB.UTF-8
./usr/share/locale/en_GB.UTF-8/LC_MESSAGES
./usr/share/locale/en_NZ.ISO8859-1
./usr/share/locale/en_NZ.ISO8859-1/LC_MESSAGES
./usr/share/locale/en_NZ.ISO8859-15
./usr/share/locale/en_NZ.ISO8859-15/LC_MESSAGES
./usr/share/locale/en_NZ.UTF-8
./usr/share/locale/en_NZ.UTF-8/LC_MESSAGES
./usr/share/locale/en_US.ISO8859-1
./usr/share/locale/en_US.ISO8859-1/LC_MESSAGES
./usr/share/locale/en_US.ISO8859-15
./usr/share/locale/en_US.ISO8859-15/LC_MESSAGES
./usr/share/locale/en_US.US-ASCII
./usr/share/locale/en_US.US-ASCII/LC_MESSAGES
./usr/share/locale/en_US.UTF-8
./usr/share/locale/en_US.UTF-8/LC_MESSAGES
./usr/share/locale/eo
./usr/share/locale/eo/LC_MESSAGES
./usr/share/locale/es
./usr/share/locale/es/LC_MESSAGES
./usr/share/locale/es_ES.ISO8859-1
./usr/share/locale/es_ES.ISO8859-1/LC_MESSAGES
./usr/share/locale/es_ES.ISO8859-15
./usr/share/locale/es_ES.ISO8859-15/LC_MESSAGES
./usr/share/locale/es_ES.UTF-8
./usr/share/locale/es_ES.UTF-8/LC_MESSAGES
./usr/share/locale/et
./usr/share/locale/et/LC_MESSAGES
./usr/share/locale/et_EE.ISO8859-15
./usr/share/locale/et_EE.ISO8859-15/LC_MESSAGES
./usr/share/locale/et_EE.UTF-8
./usr/share/locale/et_EE.UTF-8/LC_MESSAGES
./usr/share/locale/eu_ES.ISO8859-1
./usr/share/locale/eu_ES.ISO8859-1/LC_MESSAGES
./usr/share/locale/eu_ES.ISO8859-15
./usr/share/locale/eu_ES.ISO8859-15/LC_MESSAGES
./usr/share/locale/eu_ES.UTF-8
./usr/share/locale/eu_ES.UTF-8/LC_MESSAGES
./usr/share/locale/fi
./usr/share/locale/fi/LC_MESSAGES
./usr/share/locale/fi_FI.ISO8859-1
./usr/share/locale/fi_FI.ISO8859-1/LC_MESSAGES
./usr/share/locale/fi_FI.ISO8859-15
./usr/share/locale/fi_FI.ISO8859-15/LC_MESSAGES
./usr/share/locale/fi_FI.UTF-8
./usr/share/locale/fi_FI.UTF-8/LC_MESSAGES
./usr/share/locale/fr
./usr/share/locale/fr/LC_MESSAGES
./usr/share/locale/fr_BE.ISO8859-1
./usr/share/locale/fr_BE.ISO8859-1/LC_MESSAGES
./usr/share/locale/fr_BE.ISO8859-15
./usr/share/locale/fr_BE.ISO8859-15/LC_MESSAGES
./usr/share/locale/fr_BE.UTF-8
./usr/share/locale/fr_BE.UTF-8/LC_MESSAGES
./usr/share/locale/fr_CA.ISO8859-1
./usr/share/locale/fr_CA.ISO8859-1/LC_MESSAGES
./usr/share/locale/fr_CA.ISO8859-15
./usr/share/locale/fr_CA.ISO8859-15/LC_MESSAGES
./usr/share/locale/fr_CA.UTF-8
./usr/share/locale/fr_CA.UTF-8/LC_MESSAGES
./usr/share/locale/fr_CH.ISO8859-1
./usr/share/locale/fr_CH.ISO8859-1/LC_MESSAGES
./usr/share/locale/fr_CH.ISO8859-15
./usr/share/locale/fr_CH.ISO8859-15/LC_MESSAGES
./usr/share/locale/fr_CH.UTF-8
./usr/share/locale/fr_CH.UTF-8/LC_MESSAGES
./usr/share/locale/fr_FR.ISO8859-1
./usr/share/locale/fr_FR.ISO8859-1/LC_MESSAGES
./usr/share/locale/fr_FR.ISO8859-15
./usr/share/locale/fr_FR.ISO8859-15/LC_MESSAGES
./usr/share/locale/fr_FR.UTF-8
./usr/share/locale/fr_FR.UTF-8/LC_MESSAGES
./usr/share/locale/gl
./usr/share/locale/gl/LC_MESSAGES
./usr/share/locale/he
./usr/share/locale/he/LC_MESSAGES
./usr/share/locale/hr
./usr/share/locale/hr/LC_MESSAGES
./usr/share/locale/hr_HR.ISO8859-2
./usr/share/locale/hr_HR.ISO8859-2/LC_MESSAGES
./usr/share/locale/hr_HR.UTF-8
./usr/share/locale/hr_HR.UTF-8/LC_MESSAGES
./usr/share/locale/hu_HU.ISO8859-2
./usr/share/locale/hu_HU.ISO8859-2/LC_MESSAGES
./usr/share/locale/hu_HU.UTF-8
./usr/share/locale/hu_HU.UTF-8/LC_MESSAGES
./usr/share/locale/hy_AM.ARMSCII-8
./usr/share/locale/hy_AM.ARMSCII-8/LC_MESSAGES
./usr/share/locale/hy_AM.UTF-8
./usr/share/locale/hy_AM.UTF-8/LC_MESSAGES
./usr/share/locale/id
./usr/share/locale/id/LC_MESSAGES
./usr/share/locale/is_IS.ISO8859-1
./usr/share/locale/is_IS.ISO8859-1/LC_MESSAGES
./usr/share/locale/is_IS.ISO8859-15
./usr/share/locale/is_IS.ISO8859-15/LC_MESSAGES
./usr/share/locale/is_IS.UTF-8
./usr/share/locale/is_IS.UTF-8/LC_MESSAGES
./usr/share/locale/it
./usr/share/locale/it/LC_MESSAGES
./usr/share/locale/it_CH.ISO8859-1
./usr/share/locale/it_CH.ISO8859-1/LC_MESSAGES
./usr/share/locale/it_CH.ISO8859-15
./usr/share/locale/it_CH.ISO8859-15/LC_MESSAGES
./usr/share/locale/it_CH.UTF-8
./usr/share/locale/it_CH.UTF-8/LC_MESSAGES
./usr/share/locale/it_IT.ISO8859-1
./usr/share/locale/it_IT.ISO8859-1/LC_MESSAGES
./usr/share/locale/it_IT.ISO8859-15
./usr/share/locale/it_IT.ISO8859-15/LC_MESSAGES
./usr/share/locale/it_IT.UTF-8
./usr/share/locale/it_IT.UTF-8/LC_MESSAGES
./usr/share/locale/ja
./usr/share/locale/ja/LC_MESSAGES
./usr/share/locale/ja_JP.ISO-2022-JP
./usr/share/locale/ja_JP.ISO-2022-JP-2
./usr/share/locale/ja_JP.ISO-2022-JP-2/LC_MESSAGES
./usr/share/locale/ja_JP.ISO-2022-JP/LC_MESSAGES
./usr/share/locale/ja_JP.SJIS
./usr/share/locale/ja_JP.SJIS/LC_MESSAGES
./usr/share/locale/ja_JP.UTF-8
./usr/share/locale/ja_JP.UTF-8/LC_MESSAGES
./usr/share/locale/ja_JP.ct
./usr/share/locale/ja_JP.ct/LC_MESSAGES
./usr/share/locale/ja_JP.eucJP
./usr/share/locale/ja_JP.eucJP/LC_MESSAGES
./usr/share/locale/kk_KZ.PT154
./usr/share/locale/kk_KZ.PT154/LC_MESSAGES
./usr/share/locale/kk_KZ.UTF-8
./usr/share/locale/kk_KZ.UTF-8/LC_MESSAGES
./usr/share/locale/ko
./usr/share/locale/ko/LC_MESSAGES
./usr/share/locale/ko_KR.UTF-8
./usr/share/locale/ko_KR.UTF-8/LC_MESSAGES
./usr/share/locale/ko_KR.eucKR
./usr/share/locale/ko_KR.eucKR/LC_MESSAGES
./usr/share/locale/lt_LT.ISO8859-13
./usr/share/locale/lt_LT.ISO8859-13/LC_MESSAGES
./usr/share/locale/lt_LT.ISO8859-4
./usr/share/locale/lt_LT.ISO8859-4/LC_MESSAGES
./usr/share/locale/lt_LT.UTF-8
./usr/share/locale/lt_LT.UTF-8/LC_MESSAGES
./usr/share/locale/nb
./usr/share/locale/nb/LC_MESSAGES
./usr/share/locale/nb_NO.ISO8859-1
./usr/share/locale/nb_NO.ISO8859-1/LC_MESSAGES
./usr/share/locale/nb_NO.ISO8859-15
./usr/share/locale/nb_NO.ISO8859-15/LC_MESSAGES
./usr/share/locale/nb_NO.UTF-8
./usr/share/locale/nb_NO.UTF-8/LC_MESSAGES
./usr/share/locale/nn_NO.ISO8859-1
./usr/share/locale/nn_NO.ISO8859-1/LC_MESSAGES
./usr/share/locale/nn_NO.ISO8859-15
./usr/share/locale/nn_NO.ISO8859-15/LC_MESSAGES
./usr/share/locale/nn_NO.UTF-8
./usr/share/locale/nn_NO.UTF-8/LC_MESSAGES
./usr/share/locale/nl
./usr/share/locale/nl/LC_MESSAGES
./usr/share/locale/nl_BE.ISO8859-1
./usr/share/locale/nl_BE.ISO8859-1/LC_MESSAGES
./usr/share/locale/nl_BE.ISO8859-15
./usr/share/locale/nl_BE.ISO8859-15/LC_MESSAGES
./usr/share/locale/nl_BE.UTF-8
./usr/share/locale/nl_BE.UTF-8/LC_MESSAGES
./usr/share/locale/nl_NL.ISO8859-1
./usr/share/locale/nl_NL.ISO8859-1/LC_MESSAGES
./usr/share/locale/nl_NL.ISO8859-15
./usr/share/locale/nl_NL.ISO8859-15/LC_MESSAGES
./usr/share/locale/nl_NL.UTF-8
./usr/share/locale/nl_NL.UTF-8/LC_MESSAGES
./usr/share/locale/nn
./usr/share/locale/nn/LC_MESSAGES
./usr/share/locale/no
./usr/share/locale/no/LC_MESSAGES
./usr/share/locale/no@nynorsk
./usr/share/locale/no@nynorsk/LC_MESSAGES
./usr/share/locale/pl
./usr/share/locale/pl/LC_MESSAGES
./usr/share/locale/pl_PL.ISO8859-2
./usr/share/locale/pl_PL.ISO8859-2/LC_MESSAGES
./usr/share/locale/pl_PL.UTF-8
./usr/share/locale/pl_PL.UTF-8/LC_MESSAGES
./usr/share/locale/pt
./usr/share/locale/pt/LC_MESSAGES
./usr/share/locale/pt_BR
./usr/share/locale/pt_BR.ISO8859-1
./usr/share/locale/pt_BR.ISO8859-1/LC_MESSAGES
./usr/share/locale/pt_BR.UTF-8
./usr/share/locale/pt_BR.UTF-8/LC_MESSAGES
./usr/share/locale/pt_BR/LC_MESSAGES
./usr/share/locale/pt_PT.ISO8859-1
./usr/share/locale/pt_PT.ISO8859-1/LC_MESSAGES
./usr/share/locale/pt_PT.ISO8859-15
./usr/share/locale/pt_PT.ISO8859-15/LC_MESSAGES
./usr/share/locale/pt_PT.UTF-8
./usr/share/locale/pt_PT.UTF-8/LC_MESSAGES
./usr/share/locale/ro
./usr/share/locale/ro/LC_MESSAGES
./usr/share/locale/ro_RO.ISO8859-2
./usr/share/locale/ro_RO.ISO8859-2/LC_MESSAGES
./usr/share/locale/ro_RO.UTF-8
./usr/share/locale/ro_RO.UTF-8/LC_MESSAGES
./usr/share/locale/ru
./usr/share/locale/ru/LC_MESSAGES
./usr/share/locale/ru_BY.CP1251
./usr/share/locale/ru_BY.CP1251/LC_MESSAGES
./usr/share/locale/ru_BY.UTF-8
./usr/share/locale/ru_BY.UTF-8/LC_MESSAGES
./usr/share/locale/ru_RU.CP1251
./usr/share/locale/ru_RU.CP1251/LC_MESSAGES
./usr/share/locale/ru_RU.CP866
./usr/share/locale/ru_RU.CP866/LC_MESSAGES
./usr/share/locale/ru_RU.ISO8859-5
./usr/share/locale/ru_RU.ISO8859-5/LC_MESSAGES
./usr/share/locale/ru_RU.KOI8-R
./usr/share/locale/ru_RU.KOI8-R/LC_MESSAGES
./usr/share/locale/ru_RU.UTF-8
./usr/share/locale/ru_RU.UTF-8/LC_MESSAGES
./usr/share/locale/sk
./usr/share/locale/sk/LC_MESSAGES
./usr/share/locale/sk_SK.ISO8859-2
./usr/share/locale/sk_SK.ISO8859-2/LC_MESSAGES
./usr/share/locale/sk_SK.UTF-8
./usr/share/locale/sk_SK.UTF-8/LC_MESSAGES
./usr/share/locale/sl
./usr/share/locale/sl/LC_MESSAGES
./usr/share/locale/sl_SI.ISO8859-2
./usr/share/locale/sl_SI.ISO8859-2/LC_MESSAGES
./usr/share/locale/sl_SI.UTF-8
./usr/share/locale/sl_SI.UTF-8/LC_MESSAGES
./usr/share/locale/sr
./usr/share/locale/sr/LC_MESSAGES
./usr/share/locale/sr_Cyrl_ME.ISO8859-5
./usr/share/locale/sr_Cyrl_ME.ISO8859-5/LC_MESSAGES
./usr/share/locale/sr_Cyrl_ME.UTF-8
./usr/share/locale/sr_Cyrl_ME.UTF-8/LC_MESSAGES
./usr/share/locale/sr_Latn_ME.ISO8859-2
./usr/share/locale/sr_Latn_ME.ISO8859-2/LC_MESSAGES
./usr/share/locale/sr_Latn_ME.UTF-8
./usr/share/locale/sr_Cyrl_RS.ISO8859-5
./usr/share/locale/sr_Cyrl_RS.ISO8859-5/LC_MESSAGES
./usr/share/locale/sr_Cyrl_RS.UTF-8
./usr/share/locale/sr_Cyrl_RS.UTF-8/LC_MESSAGES
./usr/share/locale/sr_Latn_ME.UTF-8/LC_MESSAGES
./usr/share/locale/sr_Latn_RS.ISO8859-2
./usr/share/locale/sr_Latn_RS.ISO8859-2/LC_MESSAGES
./usr/share/locale/sr_Latn_RS.UTF-8
./usr/share/locale/sr_Latn_RS.UTF-8/LC_MESSAGES
./usr/share/locale/sv
./usr/share/locale/sv/LC_MESSAGES
./usr/share/locale/sv_SE.ISO8859-1
./usr/share/locale/sv_SE.ISO8859-1/LC_MESSAGES
./usr/share/locale/sv_SE.ISO8859-15
./usr/share/locale/sv_SE.ISO8859-15/LC_MESSAGES
./usr/share/locale/sv_SE.UTF-8
./usr/share/locale/sv_SE.UTF-8/LC_MESSAGES
./usr/share/locale/tr
./usr/share/locale/tr/LC_MESSAGES
./usr/share/locale/tr_TR.ISO8859-9
./usr/share/locale/tr_TR.ISO8859-9/LC_MESSAGES
./usr/share/locale/tr_TR.UTF-8
./usr/share/locale/tr_TR.UTF-8/LC_MESSAGES
./usr/share/locale/uk
./usr/share/locale/uk/LC_MESSAGES
./usr/share/locale/uk_UA.CP1251
./usr/share/locale/uk_UA.CP1251/LC_MESSAGES
./usr/share/locale/uk_UA.ISO8859-5
./usr/share/locale/uk_UA.ISO8859-5/LC_MESSAGES
./usr/share/locale/uk_UA.KOI8-U
./usr/share/locale/uk_UA.KOI8-U/LC_MESSAGES
./usr/share/locale/uk_UA.UTF-8
./usr/share/locale/uk_UA.UTF-8/LC_MESSAGES
./usr/share/locale/zh_CN
./usr/share/locale/zh_CN.GB18030
./usr/share/locale/zh_CN.GB18030/LC_MESSAGES
./usr/share/locale/zh_CN.UTF-8
./usr/share/locale/zh_CN.UTF-8/LC_MESSAGES
./usr/share/locale/zh_CN.eucCN
./usr/share/locale/zh_CN.eucCN/LC_MESSAGES
./usr/share/locale/zh_CN/LC_MESSAGES
./usr/share/locale/zh_HK.Big5hkscs
./usr/share/locale/zh_HK.Big5hkscs/LC_MESSAGES
./usr/share/locale/zh_HK.UTF-8
./usr/share/locale/zh_HK.UTF-8/LC_MESSAGES
./usr/share/locale/zh_TW
./usr/share/locale/zh_TW.Big5
./usr/share/locale/zh_TW.Big5/LC_MESSAGES
./usr/share/locale/zh_TW.UTF-8
./usr/share/locale/zh_TW.UTF-8/LC_MESSAGES
./usr/share/locale/zh_TW.eucTW
./usr/share/locale/zh_TW.eucTW/LC_MESSAGES
./usr/share/locale/zh_TW/LC_MESSAGES
./usr/share/lua
./usr/share/lua/5.3
./usr/share/misc
./usr/share/mk
./usr/share/nls
./usr/share/nls/C
./usr/share/nls/Pig
./usr/share/nls/ca
./usr/share/nls/cs
./usr/share/nls/de
./usr/share/nls/es
./usr/share/nls/es_ES.ISO8859-1
./usr/share/nls/fi
./usr/share/nls/fr
./usr/share/nls/gl_ES.ISO8859-1
./usr/share/nls/hu_HU.ISO8859-2
./usr/share/nls/ja_JP.SJIS
./usr/share/nls/ja_JP.UTF-8
./usr/share/nls/ja_JP.eucJP
./usr/share/nls/nl
./usr/share/nls/no
./usr/share/nls/pl
./usr/share/nls/pt_BR.ISO8859-1
./usr/share/nls/ru_RU.KOI8-R
./usr/share/nls/sk
./usr/share/nls/sv
./usr/share/nls/uk_UA.UTF-8
./usr/share/nls/zh_CN.UTF-8
./usr/share/nvi
./usr/share/nvi/catalog
./usr/share/terminfo

View File

@ -73,12 +73,12 @@ SUBDIR+= ../minix/lib/libmagicrt
# below will depend on versions from DESTDIR only.
#
#SUBDIR+= i18n_module
SUBDIR+= i18n_module
SUBDIR+= \
libbz2 \
libcrypt \
libkvm libm \
libintl libkvm libm \
libpci libprop \
libpuffs librmt \
libterminfo \

View File

@ -0,0 +1,5 @@
# $NetBSD: Makefile,v 1.2 2006/11/22 23:38:27 tnozaki Exp $
SRCS= citrus_big5.c citrus_prop.c
.include <bsd.lib.mk>

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2007/04/01 18:52:31 tnozaki Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2002/03/17 22:14:15 tshiozak Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2002/03/17 22:14:15 tshiozak Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>

View File

@ -0,0 +1,5 @@
# $NetBSD: Makefile,v 1.1 2003/03/25 18:26:54 tshiozak Exp $
SRCPRE=citrus_
#CFLAGS+=-g
.include <bsd.lib.mk>

View File

@ -0,0 +1,5 @@
# $NetBSD: Makefile,v 1.1 2006/11/22 23:38:27 tnozaki Exp $
SRCS= citrus_hz.c citrus_prop.c
.include <bsd.lib.mk>

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2002/03/17 22:14:16 tshiozak Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2006/10/18 17:54:55 tnozaki Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2002/03/17 22:14:16 tshiozak Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>

8
lib/i18n_module/Makefile Normal file
View File

@ -0,0 +1,8 @@
# $NetBSD: Makefile,v 1.8 2007/04/01 18:52:31 tnozaki Exp $
SUBDIR= BIG5 DECHanyu EUC EUCTW GBK2K HZ ISO2022 JOHAB MSKanji UES UTF1632 UTF8 UTF7 VIQR ZW
SUBDIR+=iconv_none iconv_std
SUBDIR+=mapper_646 mapper_none mapper_serial mapper_parallel mapper_std \
mapper_zone
.include <bsd.subdir.mk>

View File

@ -0,0 +1,28 @@
# $NetBSD: Makefile.inc,v 1.14 2012/08/23 21:21:15 joerg Exp $
NOLINT= # defined
NOPICINSTALL= # defined
NOPROFILE= # defined
NOCLANGERROR= # defined
.include <bsd.own.mk>
SHLIB_VERSION_FILE= ${NETBSDSRCDIR}/lib/i18n_module/shlib_version
.if defined(MLIBDIR)
LIBDIR= /usr/lib/${MLIBDIR}/i18n
SHLIBDIR= /usr/lib/${MLIBDIR}/i18n
SHLIBINSTALLDIR=/usr/lib/${MLIBDIR}/i18n
.else
LIBDIR= /usr/lib/i18n
SHLIBDIR= /usr/lib/i18n
SHLIBINSTALLDIR=/usr/lib/i18n
.endif
CPPFLAGS+= -I${NETBSDSRCDIR}/lib/libc/citrus
CPPFLAGS+= -DLOCALEMOD_MAJOR=${SHLIB_MAJOR}
CPPFLAGS+= -DLIBC_SCCS
BASENAME= ${.CURDIR:T}
LIB= ${BASENAME}
SRCS?= ${SRCPRE:tl}${BASENAME:tl}.c
.PATH: ${NETBSDSRCDIR}/lib/libc/citrus ${NETBSDSRCDIR}/lib/libc/citrus/modules

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2006/11/13 15:16:31 tnozaki Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2003/06/25 10:38:03 tshiozak Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>

View File

@ -0,0 +1,8 @@
# $NetBSD: Makefile,v 1.4 2011/06/20 06:52:36 mrg Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>
.if ${MACHINE_ARCH} == "vax" && defined(HAVE_GCC)
COPTS.citrus_utf7.c+= -O0
.endif

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2002/03/17 22:14:17 tshiozak Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2006/11/13 15:16:31 tnozaki Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2006/11/22 23:38:27 tnozaki Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2003/06/25 10:38:04 tshiozak Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2003/06/25 10:38:04 tshiozak Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2003/06/25 10:38:04 tshiozak Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2003/06/25 10:38:05 tshiozak Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2003/06/25 10:38:05 tshiozak Exp $
SRCS=citrus_mapper_serial.c
.include <bsd.lib.mk>

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2003/06/25 10:38:05 tshiozak Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2003/06/25 10:38:06 tshiozak Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>

View File

@ -0,0 +1,4 @@
# $NetBSD: Makefile,v 1.1 2003/06/25 10:38:06 tshiozak Exp $
SRCPRE=citrus_
.include <bsd.lib.mk>

View File

@ -0,0 +1,5 @@
# $NetBSD: shlib_version,v 1.6 2009/01/11 03:07:47 christos Exp $
# Remember to update distrib/sets/lists/base/shl.* when changing
#
major=5
minor=0

20
lib/libintl/Makefile Normal file
View File

@ -0,0 +1,20 @@
# $NetBSD: Makefile,v 1.6 2005/05/14 17:58:56 tshiozak Exp $
.include <bsd.own.mk>
LIB= intl
SRCS= gettext.c textdomain.c gettext_iconv.c gettext_dummy.c strhash.c \
sysdep.c plural_parser.c
INCS= libintl.h
INCSDIR=/usr/include
#CFLAGS+=-g
CPPFLAGS+=-I${.CURDIR} -I${.CURDIR}/../libc
MAN= gettext.3
MLINKS= gettext.3 dgettext.3 gettext.3 dcgettext.3 \
gettext.3 ngettext.3 gettext.3 dngettext.3 \
gettext.3 dcngettext.3 gettext.3 textdomain.3 \
gettext.3 bindtextdomain.3 gettext.3 bind_textdomain_codeset.3
.include <bsd.lib.mk>

407
lib/libintl/gettext.3 Normal file
View File

@ -0,0 +1,407 @@
.\" $NetBSD: gettext.3,v 1.12 2009/11/12 00:43:52 joerg Exp $
.\"
.\" Copyright (c) 2000 Citrus Project,
.\" All rights reserved.
.\"
.\" Redistribution and use in source and binary forms, with or without
.\" modification, are permitted provided that the following conditions
.\" are met:
.\" 1. Redistributions of source code must retain the above copyright
.\" notice, this list of conditions and the following disclaimer.
.\" 2. Redistributions in binary form must reproduce the above copyright
.\" notice, this list of conditions and the following disclaimer in the
.\" documentation and/or other materials provided with the distribution.
.\"
.\" THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
.\" ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
.\" IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
.\" ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
.\" FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
.\" DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
.\" OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
.\" HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
.\" LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
.\" OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
.\" SUCH DAMAGE.
.\"
.Dd November 10, 2004
.Dt GETTEXT 3
.Os
.Sh NAME
.Nm gettext ,
.Nm dgettext ,
.Nm ngettext ,
.Nm dngettext ,
.Nm textdomain ,
.Nm bindtextdomain ,
.Nm bind_textdomain_codeset ,
.Nm dcgettext ,
.Nm dcngettext
.Nd message handling functions
.Sh LIBRARY
.Lb libintl
.Sh SYNOPSIS
.In libintl.h
.Ft char *
.Fn gettext "const char *msgid"
.Ft char *
.Fn dgettext "const char *domainname" "const char *msgid"
.Ft char *
.Fn ngettext "const char *msgid1" "const char *msgid2" "unsigned long int n"
.Ft char *
.Fn dngettext "const char *domainname" "const char *msgid1" "const char *msgid2" "unsigned long int n"
.Ft char *
.Fn textdomain "const char *domainname"
.Ft char *
.Fn bindtextdomain "const char *domainname" "const char *dirname"
.Ft char *
.Fn bind_textdomain_codeset "const char *domainname" "const char *codeset"
.In libintl.h
.In locale.h
.Ft char *
.Fn dcgettext "const char *domainname" "const char *msgid" "int category"
.Ft char *
.Fn dcngettext "const char *domainname" "const char *msgid1" "const char *msgid2" "unsigned long int n" "int category"
.Sh DESCRIPTION
The
.Fn gettext ,
.Fn dgettext ,
and
.Fn dcgettext
functions attempt to retrieve a
target string based on the specified
.Fa msgid
argument within the context of a
specific domain and the current locale.
The length of strings returned by
.Fn gettext ,
.Fn dgettext ,
and
.Fn dcgettext
is undetermined until the function is
called.
The
.Fa msgid
argument is a nul-terminated string.
.Pp
The
.Fn ngettext ,
.Fn dngettext ,
and
.Fn dcngettext
functions are equivalent to
.Fn gettext ,
.Fn dgettext ,
and
.Fn dcgettext ,
respectively, except for the handling of
plural forms.
The
.Fn ngettext ,
.Fn dngettext ,
and
.Fn dcngettext
functions search for the
message string using the
.Fa msgid1
argument as the key, using the argument
.Fa n
to
determine the plural form.
If no message catalogs are found,
.Fa msgid1
is returned
if
.Fa n Li == 1 ,
otherwise
.Fa msgid2
is returned.
.Pp
The
.Dv LANGUAGE
environment variable is examined first to determine the message
catalogs to be used.
The value of the
.Dv LANGUAGE
environment variable is a list
of locale names separated by colon (:) character.
If the
.Dv LANGUAGE
environment
variable is defined, each locale name is tried in the specified order and if a
message catalog containing the requested message is found, the message is
returned.
If the
.Dv LANGUAGE
environment variable is defined but failed to locate
a message catalog, the
.Fa msgid
string will be returned.
.Pp
If the
.Dv LANGUAGE
environment variable is not defined,
.Dv LC_ALL ,
.Dv LC_xxx ,
and
.Dv LANG
environment variables are examined to locate the message catalog,
following the convention used by the
.Xr setlocale 3
function.
.Pp
The pathname used to locate the message catalog is
.Pa dirname/locale/category/domainname.mo ,
where dirname is the directory specified by
.Fn bindtextdomain ,
locale is a locale name determined by the definition of environment variables,
.Fa category
is
.Dv LC_MESSAGES
if
.Fn gettext ,
.Fn ngettext ,
.Fn dgettext ,
or
.Fn dngettext
is
called, otherwise
.Dv LC_xxx
where the name is the same as the locale category name
specified by the
.Fa category
argument of
.Fn dcgettext
or
.Fn dcngettext .
.Fa domainname
is the name of the domain specified by
.Fn textdomain
or the
.Fa domainname
argument of
.Fn dgettext ,
.Fn dngettext ,
.Fn dcgettext ,
or
.Fn dcngettext .
.Pp
For
.Fn gettext
and
.Fn ngettext ,
the domain used is set by the last valid call to
.Fn textdomain .
If a valid call to
.Fn textdomain
has not been made, the default
domain (called messages) is used.
.Pp
For
.Fn dgettext ,
.Fn dngettext ,
.Fn dcgettext ,
and
.Fn dcngettext ,
the domain used is
specified by the
.Fa domainname
argument.
The
.Fa domainname
argument is equivalent in
syntax and meaning to the
.Fa domainname
argument to
.Fn textdomain ,
except that the
selection of the domain is valid only for the duration of the
.Fn dgettext ,
.Fn dngettext ,
.Fn dcgettext ,
or
.Fn dcngettext
function call.
.Pp
The
.Fn dcgettext
and
.Fn dcngettext
functions require additional argument
.Fa category
for retrieving message string for other than
.Dv LC_MESSAGES
category.
Available value for the
.Fa category
argument are
.Dv LC_CTYPE ,
.Dv LC_COLLATE ,
.Dv LC_MESSAGES ,
.Dv LC_MONETARY ,
.Dv LC_NUMERIC ,
and
.Dv LC_TIME .
The call of
.Fn dcgettext "domainname" "msgid" "LC_MESSAGES"
is equivalent to
.Fn dgettext "domainname" "msgid" .
Note that
.Dv LC_ALL
must not be used.
.Pp
The
.Fn textdomain
function sets or queries the name of the current domain of the
active
.Dv LC_MESSAGES
locale category.
The
.Fa domainname
argument is a
nul-terminated string that can contain only the characters allowed in legal
filenames.
.Pp
The
.Fa domainname
argument is the unique name of a domain on the system.
If there
are multiple versions of the same domain on one system, namespace collisions
can be avoided by using
.Fn bindtextdomain .
If
.Fn textdomain
is not called, a
default domain is selected.
The setting of domain made by the last valid call
to
.Fn textdomain
remains valid across subsequent calls to
.Xr setlocale 3 ,
and
.Fn gettext .
.Pp
The
.Fa domainname
argument is applied to the currently active LC_MESSAGES locale.
.Pp
The current setting of the domain can be queried without affecting the current
state of the domain by calling
.Fn textdomain
with
.Fa domainname
set to the
.Dv NULL
pointer.
Calling
.Fn textdomain
with a
.Fa domainname
argument of a
.Dv NULL
string sets
the domain to the default domain
.Pq messages .
.Pp
The
.Fn bindtextdomain
function binds the path predicate for a message domain
.Fa domainname
to the value contained in dirname.
If
.Fa domainname
is a non-empty
string and has not been bound previously,
.Fn bindtextdomain
binds
.Fa domainname
with
.Fa dirname .
.Pp
If
.Fa domainname
is a non-empty string and has been bound previously,
.Fn bindtextdomain
replaces the old binding with dirname.
The dirname argument
can be an absolute pathname being resolved when
.Fn gettext ,
.Fn ngettext ,
.Fn dgettext ,
.Fn dngettext ,
.Fn dcgettext ,
or
.Fn dcngettext
are called.
If
.Fa domainname
is a
.Dv NULL
pointer or an empty string,
.Fn bindtextdomain
returns a
.Dv NULL
pointer.
If
.Fn bindtextdomain
is not called, implementation-defined default directory is used.
.Pp
The
.Fn bind_textdomain_codeset
function can be used to specify the output
.Fa codeset
for message catalogs for domain
.Fa domainname .
The
.Fa codeset
argument must
be a valid codeset name which can be used for the
.Xr iconv_open 3
function.
.Pp
If the
.Fa codeset
argument is the
.Dv NULL
pointer,
.Fn bind_textdomain_codeset
returns the currently selected
.Fa codeset
for the domain with the name
.Fa domainname .
It returns a
.Dv NULL
pointer if no
.Fa codeset
has yet been selected.
.Pp
The
.Fn bind_textdomain_codeset
function can be used several times.
If used multiple times, with the same
.Fa domainname
argument,
the later call overrides the
settings made by the earlier one.
.Pp
The
.Fn bind_textdomain_codeset
function returns a pointer to a string containing
the name of the selected
.Fa codeset .
.\".Sh "RETURN VALUES"
.\".Sh EXAMPLES
.Sh SEE ALSO
.Xr setlocale 3 ,
.Xr nls 7
.\".Sh STANDARDS
.Sh HISTORY
The functions are implemented by Citrus project,
based on the documentations for GNU gettext.
.Sh BUGS
.\" The text was ripped off from Annex C of
.\" .Dq LI18NUX 2000 Globalization Specification Version 1.0 .
.\" .Pp
.Fn bind_textdomain_codeset
does not work at this moment
.Pq it always fails .

1054
lib/libintl/gettext.c Normal file

File diff suppressed because it is too large Load Diff

View File

@ -0,0 +1,44 @@
/* $NetBSD: gettext_dummy.c,v 1.3 2007/09/25 08:16:08 junyoung Exp $ */
/*-
* Copyright (c) 2000 Citrus Project,
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
#include <sys/cdefs.h>
__RCSID("$NetBSD: gettext_dummy.c,v 1.3 2007/09/25 08:16:08 junyoung Exp $");
/*
* The symbol is referenced by gettext.m4 (autoconf m4 macro fragment
* that ships with GNU gettext), to check if libintl is GNU origin or not.
* Since we are trying to mimic GNU gettext, we supply the symbol just to
* make gettext.m4 happy.
*
* If we do not provide this symbol, as a result of gettext.m4, *.mo will be
* installed into /usr/lib/locale, not /usr/share/locale. It is not desirable.
*
* Yes, I understand this is a dirty hack. gettext.m4 is doing something
* very wrong here and I have no other choice.
*/
int _nl_msg_cat_cntr;

224
lib/libintl/gettext_iconv.c Normal file
View File

@ -0,0 +1,224 @@
/* $NetBSD: gettext_iconv.c,v 1.8 2009/02/18 13:08:22 yamt Exp $ */
/*-
* Copyright (c) 2004 Citrus Project,
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*
* $Citrus$
*/
#include <sys/types.h>
#include <sys/param.h>
#include <errno.h>
#include <iconv.h>
#include <libintl.h>
#include <langinfo.h>
#include <search.h>
#include <stdlib.h>
#include <string.h>
#include "libintl_local.h"
struct cache {
const char *c_origmsg;
const char *c_resultmsg;
};
static const struct cache *cache_find(const char *, struct domainbinding *);
static int cache_enter(const char *, const char *);
static int cache_cmp(const void *, const void *);
static void *cacheroot;
/* ARGSUSED1 */
static const struct cache *
cache_find(const char *msg, struct domainbinding *db)
{
struct cache key;
struct cache **c;
key.c_origmsg = msg;
c = tfind(&key, &cacheroot, cache_cmp);
return c ? *c : NULL;
}
static int
cache_enter(const char *origmsg, const char *resultmsg)
{
struct cache *c;
c = malloc(sizeof(*c));
if (c == NULL)
return -1;
c->c_origmsg = origmsg;
c->c_resultmsg = resultmsg;
if (tsearch(c, &cacheroot, cache_cmp) == NULL) {
free(c);
return -1;
}
return 0;
}
static int
cache_cmp(const void *va, const void *vb)
{
const struct cache *a = va;
const struct cache *b = vb;
int result;
if (a->c_origmsg > b->c_origmsg) {
result = 1;
} else if (a->c_origmsg < b->c_origmsg) {
result = -1;
} else {
result = 0;
}
return result;
}
#define GETTEXT_ICONV_MALLOC_CHUNK (16 * 1024)
const char *
__gettext_iconv(const char *origmsg, struct domainbinding *db)
{
const char *tocode;
const char *fromcode = db->mohandle.mo.mo_charset;
const struct cache *cache;
const char *result;
iconv_t cd;
const char *src;
char *dst;
size_t origlen;
size_t srclen;
size_t dstlen;
size_t nvalid;
int savederrno = errno;
/*
* static buffer for converted texts.
*
* note:
* we never free buffers once returned to callers.
* because of interface design of gettext, we can't know
* the lifetime of them.
*/
static char *buffer;
static size_t bufferlen;
/*
* don't convert message if *.mo doesn't specify codeset.
*/
if (fromcode == NULL)
return origmsg;
tocode = db->codeset;
if (tocode == NULL) {
/*
* codeset isn't specified explicitly by
* bind_textdomain_codeset().
* use current locale(LC_CTYPE)'s codeset.
*
* XXX maybe wrong; it can mismatch with
* environment variable setting.
*/
tocode = nl_langinfo(CODESET);
}
/*
* shortcut if possible.
* XXX should handle aliases
*/
if (!strcasecmp(tocode, fromcode))
return origmsg;
/* XXX LOCK */
/* XXX should detect change of tocode and purge caches? */
/*
* see if we have already converted this message.
*/
cache = cache_find(origmsg, db);
if (cache) {
result = cache->c_resultmsg;
goto out;
}
origlen = strlen(origmsg) + 1;
again:
cd = iconv_open(tocode, fromcode);
if (cd == (iconv_t)-1) {
result = origmsg;
goto out;
}
src = origmsg;
srclen = origlen;
dst = buffer;
dstlen = bufferlen;
nvalid = iconv(cd, &src, &srclen, &dst, &dstlen);
iconv_close(cd);
if (nvalid == (size_t)-1) {
/*
* try to allocate a new buffer.
*
* just give up if GETTEXT_ICONV_MALLOC_CHUNK was not enough.
*/
if (errno == E2BIG &&
bufferlen != GETTEXT_ICONV_MALLOC_CHUNK) {
buffer = malloc(GETTEXT_ICONV_MALLOC_CHUNK);
if (buffer) {
bufferlen = GETTEXT_ICONV_MALLOC_CHUNK;
goto again;
}
}
result = origmsg;
} else if (cache_enter(origmsg, buffer)) {
/*
* failed to enter cache. give up.
*/
result = origmsg;
} else {
size_t resultlen = dst - buffer;
result = buffer;
bufferlen -= resultlen;
buffer += resultlen;
}
out:
/* XXX UNLOCK */
errno = savederrno;
return result;
}

83
lib/libintl/libintl.h Normal file
View File

@ -0,0 +1,83 @@
/* $NetBSD: libintl.h,v 1.8 2015/06/08 15:04:20 christos Exp $ */
/*-
* Copyright (c) 2000 Citrus Project,
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
#ifndef _LIBINTL_H_
#define _LIBINTL_H_
#include <sys/cdefs.h>
#ifndef _LIBGETTEXT_H
/*
* Avoid defining these if the GNU gettext compatibility header includes
* us, since it re-defines those unconditionally and creates inline functions
* for some of them. This is horrible.
*/
#define pgettext_expr(msgctxt, msgid) pgettext((msgctxt), (msgid))
#define dpgettext_expr(domainname, msgctxt, msgid) \
dpgettext((domainname), (msgctxt), (msgid))
#define dcpgettext_expr(domainname, msgctxt, msgid, category) \
dcpgettext((domainname), (msgctxt), (msgid), (category))
#define npgettext_expr(msgctxt, msgid1, msgid2, n) \
npgettext((msgctxt), (msgid1), (msgid2), (n))
#define dnpgettext_expr(domainname, msgctxt, msgid1, n) \
dnpgettext((domainname), (msgctxt), (msgid1), (msgid2), (n))
#define dcnpgettext_expr(domainname, msgctxt, msgid1, msgid2, n, category) \
dcnpgettext((domainname), (msgctxt), (msgid1), (msgid2), (n), (category))
#endif
__BEGIN_DECLS
char *gettext(const char *) __format_arg(1);
char *dgettext(const char *, const char *) __format_arg(2);
char *dcgettext(const char *, const char *, int) __format_arg(2);
char *ngettext(const char *, const char *, unsigned long int)
__format_arg(1) __format_arg(2);
char *dngettext(const char *, const char *, const char *, unsigned long int)
__format_arg(2) __format_arg(3);
char *dcngettext(const char *, const char *, const char *, unsigned long int,
int) __format_arg(2) __format_arg(3);
const char *pgettext(const char *, const char *) __format_arg(2);
const char *dpgettext(const char *, const char *, const char *)
__format_arg(3);
const char *dcpgettext(const char *, const char *, const char *, int)
__format_arg(3);
const char *npgettext(const char *, const char *, const char *,
unsigned long int) __format_arg(2) __format_arg(3);
const char *dnpgettext(const char *, const char *, const char *,
const char *, unsigned long int) __format_arg(3)
__format_arg(4);
const char *dcnpgettext(const char *, const char *, const char *,
const char *, unsigned long int, int) __format_arg(3)
__format_arg(4);
char *textdomain(const char *);
char *bindtextdomain(const char *, const char *);
char *bind_textdomain_codeset(const char *, const char *);
__END_DECLS
#endif /* _LIBINTL_H_ */

148
lib/libintl/libintl_local.h Normal file
View File

@ -0,0 +1,148 @@
/* $NetBSD: libintl_local.h,v 1.12 2007/09/25 08:22:44 junyoung Exp $ */
/*-
* Copyright (c) 2000, 2001 Citrus Project,
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*
* $Citrus: xpg4dl/FreeBSD/lib/libintl/libintl_local.h,v 1.13 2001/09/27 15:18:45 yamt Exp $
*/
#define MO_MAGIC 0x950412de
#define MO_MAGIC_SWAPPED 0xde120495
#define MO_GET_REV_MAJOR(r) (((r) >> 16) & 0xFFFF)
#define MO_GET_REV_MINOR(r) ((r) & 0xFFFF)
#define MO_MAKE_REV(maj, min) (((maj) << 16) | (min))
#define GETTEXT_MMAP_MAX (1024 * 1024) /*XXX*/
#define DEFAULT_DOMAINNAME "messages"
/* *.mo file format */
struct mo {
uint32_t mo_magic; /* determines endian */
uint32_t mo_revision; /* file format revision: 0 */
uint32_t mo_nstring; /* N: number of strings */
uint32_t mo_otable; /* O: original text table offset */
uint32_t mo_ttable; /* T: translated text table offset */
uint32_t mo_hsize; /* S: size of hashing table */
uint32_t mo_hoffset; /* H: offset of hashing table */
/* rev 0.1 / 1.1 */
/* system dependent string support */
uint32_t mo_sysdep_nsegs; /* number of sysdep segments */
uint32_t mo_sysdep_segoff; /* offset of sysdep segment table */
uint32_t mo_sysdep_nstring; /* number of strings */
uint32_t mo_sysdep_otable; /* offset of original text table */
uint32_t mo_sysdep_ttable; /* offset of translated text table */
} __packed;
struct moentry {
uint32_t len; /* strlen(str), so region will be len + 1 */
uint32_t off; /* offset of \0-terminated string */
} __packed;
struct mosysdepsegentry {
uint32_t len; /* length of this part */
uint32_t ref; /* reference number of the sysdep string,
* concatenated just after this segment.
*/
} __packed;
#define MO_LASTSEG (0xFFFFFFFF)
struct mosysdepstr {
uint32_t off; /* offset of seed text */
struct mosysdepsegentry segs[1]; /* text segments */
} __packed;
/* libintl internal data format */
struct moentry_h {
size_t len; /* strlen(str), so region will be len + 1 */
char *off; /* offset of \0-terminated string */
};
struct mosysdepsegs_h {
const char *str;
size_t len;
};
struct mosysdepsegentry_h {
uint32_t len;
uint32_t ref;
};
struct mosysdepstr_h {
const char *off; /* offset of the base string */
char *expanded; /* expanded string */
size_t expanded_len; /* length of expanded string */
struct mosysdepsegentry_h segs[1]; /* text segments */
};
struct gettext_plural;
struct mo_h {
uint32_t mo_magic; /* determines endian */
uint32_t mo_revision; /* file format revision: 0 */
uint32_t mo_nstring; /* N: number of strings */
struct moentry_h *mo_otable; /* O: original text table offset */
struct moentry_h *mo_ttable; /* T: translated text table offset */
const char *mo_header;
struct gettext_plural *mo_plural;
unsigned long mo_nplurals;
char *mo_charset;
uint32_t mo_hsize; /* S: size of hashing table */
uint32_t *mo_htable; /* H: hashing table */
#define MO_HASH_SYSDEP_MASK 0x80000000 /* means sysdep entry */
uint32_t mo_flags;
#define MO_F_SYSDEP 0x00000001 /* enable sysdep string support */
/* system dependent string support */
uint32_t mo_sysdep_nsegs; /* number of sysdep segments */
uint32_t mo_sysdep_nstring; /* number of sysdep strings */
struct mosysdepsegs_h *mo_sysdep_segs; /* sysdep segment table */
struct mosysdepstr_h **mo_sysdep_otable; /* original text */
struct mosysdepstr_h **mo_sysdep_ttable; /* translated text */
};
struct mohandle {
void *addr; /* mmap'ed region */
size_t len;
struct mo_h mo; /* endian-flipped mo file header */
};
struct domainbinding {
struct domainbinding *next;
char domainname[PATH_MAX];
char path[PATH_MAX];
char *codeset;
struct mohandle mohandle;
};
extern struct domainbinding *__bindings;
extern char __current_domainname[PATH_MAX];
__BEGIN_DECLS
const char *__gettext_iconv(const char *, struct domainbinding *);
uint32_t __intl_string_hash(const char *);
const char *__intl_sysdep_get_string_by_tag(const char *, size_t *);
__END_DECLS

29
lib/libintl/pathnames.h Normal file
View File

@ -0,0 +1,29 @@
/* $NetBSD: pathnames.h,v 1.1.1.1 2000/10/31 10:45:04 itojun Exp $ */
/*-
* Copyright (c) 2000 Citrus Project,
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
#define _PATH_TEXTDOMAIN "/usr/share/locale"

1119
lib/libintl/plural_parser.c Normal file

File diff suppressed because it is too large Load Diff

View File

@ -0,0 +1,43 @@
/* $NetBSD: plural_parser.h,v 1.2 2007/09/25 08:19:09 junyoung Exp $ */
/*-
* Copyright (c) 2005 Citrus Project,
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*
*/
#ifndef PLURAL_PARSER_H_
#define PLURAL_PARSER_H_
struct gettext_plural;
__BEGIN_DECLS
int _gettext_parse_plural(struct gettext_plural **, unsigned long *,
const char *, size_t);
unsigned long _gettext_calculate_plural(const struct gettext_plural *,
unsigned long);
void _gettext_free_plural(struct gettext_plural *);
__END_DECLS
#endif

View File

@ -0,0 +1,5 @@
# $NetBSD: shlib_version,v 1.3 2015/05/29 12:27:03 christos Exp $
# Remember to update distrib/sets/lists/base/shl.* when changing
#
major=1
minor=1

60
lib/libintl/strhash.c Normal file
View File

@ -0,0 +1,60 @@
/* $NetBSD: strhash.c,v 1.3 2007/09/25 08:19:09 junyoung Exp $ */
/*-
* Copyright (c)2003, 2004 Citrus Project,
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
#include <sys/cdefs.h>
#if defined(LIBC_SCCS) && !defined(lint)
__RCSID("$NetBSD: strhash.c,v 1.3 2007/09/25 08:19:09 junyoung Exp $");
#endif /* LIBC_SCCS and not lint */
#include <sys/param.h>
#include <sys/types.h>
#include "libintl_local.h"
/*
* string hash function by P.J.Weinberger.
* this implementation is derived from src/lib/libc/citrus/citrus_db_hash.c.
*/
uint32_t
/*ARGSUSED*/
__intl_string_hash(const char *str)
{
const uint8_t *p;
uint32_t hash = 0, tmp;
for (p = (const uint8_t *)str; *p; p++) {
hash <<= 4;
hash += *p;
tmp = hash & 0xF0000000;
if (tmp != 0) {
hash ^= tmp;
hash ^= tmp >> 24;
}
}
return hash;
}

236
lib/libintl/sysdep.c Normal file
View File

@ -0,0 +1,236 @@
/* $NetBSD: sysdep.c,v 1.2 2005/04/27 09:50:26 yamt Exp $ */
/*-
* Copyright (c)2004 Citrus Project,
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
#include <sys/cdefs.h>
#if defined(LIBC_SCCS) && !defined(lint)
__RCSID("$NetBSD: sysdep.c,v 1.2 2005/04/27 09:50:26 yamt Exp $");
#endif /* LIBC_SCCS and not lint */
#include <sys/param.h>
#include <sys/types.h>
#include <inttypes.h>
#include <stdlib.h>
#include <string.h>
#include "libintl_local.h"
struct sysdep_pair
{
const char *tag;
const char *string;
size_t len;
};
#define T_(tag) { #tag, tag, sizeof (tag)-1 }
#define numof(a) (sizeof (a) / sizeof ((a)[0]))
const struct sysdep_pair sysdep_pair_table[] = {
/* this table must be sorted in the dictionary order. */
T_(PRIX16),
T_(PRIX32),
T_(PRIX64),
T_(PRIX8),
T_(PRIXFAST16),
T_(PRIXFAST32),
T_(PRIXFAST64),
T_(PRIXFAST8),
T_(PRIXLEAST16),
T_(PRIXLEAST32),
T_(PRIXLEAST64),
T_(PRIXLEAST8),
T_(PRIXMAX),
T_(PRIXPTR),
T_(PRId16),
T_(PRId32),
T_(PRId64),
T_(PRId8),
T_(PRIdFAST16),
T_(PRIdFAST32),
T_(PRIdFAST64),
T_(PRIdFAST8),
T_(PRIdLEAST16),
T_(PRIdLEAST32),
T_(PRIdLEAST64),
T_(PRIdLEAST8),
T_(PRIdMAX),
T_(PRIdPTR),
T_(PRIi16),
T_(PRIi32),
T_(PRIi64),
T_(PRIi8),
T_(PRIiFAST16),
T_(PRIiFAST32),
T_(PRIiFAST64),
T_(PRIiFAST8),
T_(PRIiLEAST16),
T_(PRIiLEAST32),
T_(PRIiLEAST64),
T_(PRIiLEAST8),
T_(PRIiMAX),
T_(PRIiPTR),
T_(PRIo16),
T_(PRIo32),
T_(PRIo64),
T_(PRIo8),
T_(PRIoFAST16),
T_(PRIoFAST32),
T_(PRIoFAST64),
T_(PRIoFAST8),
T_(PRIoLEAST16),
T_(PRIoLEAST32),
T_(PRIoLEAST64),
T_(PRIoLEAST8),
T_(PRIoMAX),
T_(PRIoPTR),
T_(PRIu16),
T_(PRIu32),
T_(PRIu64),
T_(PRIu8),
T_(PRIuFAST16),
T_(PRIuFAST32),
T_(PRIuFAST64),
T_(PRIuFAST8),
T_(PRIuLEAST16),
T_(PRIuLEAST32),
T_(PRIuLEAST64),
T_(PRIuLEAST8),
T_(PRIuMAX),
T_(PRIuPTR),
T_(PRIx16),
T_(PRIx32),
T_(PRIx64),
T_(PRIx8),
T_(PRIxFAST16),
T_(PRIxFAST32),
T_(PRIxFAST64),
T_(PRIxFAST8),
T_(PRIxLEAST16),
T_(PRIxLEAST32),
T_(PRIxLEAST64),
T_(PRIxLEAST8),
T_(PRIxMAX),
T_(PRIxPTR),
T_(SCNd16),
T_(SCNd32),
T_(SCNd64),
T_(SCNd8),
T_(SCNdFAST16),
T_(SCNdFAST32),
T_(SCNdFAST64),
T_(SCNdFAST8),
T_(SCNdLEAST16),
T_(SCNdLEAST32),
T_(SCNdLEAST64),
T_(SCNdLEAST8),
T_(SCNdMAX),
T_(SCNdPTR),
T_(SCNi16),
T_(SCNi32),
T_(SCNi64),
T_(SCNi8),
T_(SCNiFAST16),
T_(SCNiFAST32),
T_(SCNiFAST64),
T_(SCNiFAST8),
T_(SCNiLEAST16),
T_(SCNiLEAST32),
T_(SCNiLEAST64),
T_(SCNiLEAST8),
T_(SCNiMAX),
T_(SCNiPTR),
T_(SCNo16),
T_(SCNo32),
T_(SCNo64),
T_(SCNo8),
T_(SCNoFAST16),
T_(SCNoFAST32),
T_(SCNoFAST64),
T_(SCNoFAST8),
T_(SCNoLEAST16),
T_(SCNoLEAST32),
T_(SCNoLEAST64),
T_(SCNoLEAST8),
T_(SCNoMAX),
T_(SCNoPTR),
T_(SCNu16),
T_(SCNu32),
T_(SCNu64),
T_(SCNu8),
T_(SCNuFAST16),
T_(SCNuFAST32),
T_(SCNuFAST64),
T_(SCNuFAST8),
T_(SCNuLEAST16),
T_(SCNuLEAST32),
T_(SCNuLEAST64),
T_(SCNuLEAST8),
T_(SCNuMAX),
T_(SCNuPTR),
T_(SCNx16),
T_(SCNx32),
T_(SCNx64),
T_(SCNx8),
T_(SCNxFAST16),
T_(SCNxFAST32),
T_(SCNxFAST64),
T_(SCNxFAST8),
T_(SCNxLEAST16),
T_(SCNxLEAST32),
T_(SCNxLEAST64),
T_(SCNxLEAST8),
T_(SCNxMAX),
T_(SCNxPTR)
};
static int
cmp_sysdep_tag(const void *tag, const void *elem)
{
const struct sysdep_pair *pair = elem;
return strcmp(tag, pair->tag);
}
const char *
__intl_sysdep_get_string_by_tag(const char *tag, size_t *rlen)
{
const struct sysdep_pair *found;
found = bsearch(tag, sysdep_pair_table, numof(sysdep_pair_table),
sizeof(sysdep_pair_table[0]), &cmp_sysdep_tag);
if (found) {
if (rlen)
*rlen = found->len;
return found->string;
}
if (rlen)
*rlen = 0;
return "";
}

148
lib/libintl/textdomain.c Normal file
View File

@ -0,0 +1,148 @@
/* $NetBSD: textdomain.c,v 1.14 2015/05/29 12:26:28 christos Exp $ */
/*-
* Copyright (c) 2000, 2001 Citrus Project,
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
#include <sys/cdefs.h>
__RCSID("$NetBSD: textdomain.c,v 1.14 2015/05/29 12:26:28 christos Exp $");
#include <sys/param.h>
#include <stdio.h>
#include <string.h>
#include <stdlib.h>
#include <libintl.h>
#include "libintl_local.h"
#include "pathnames.h"
static struct domainbinding __default_binding = {
.path = { _PATH_TEXTDOMAIN },
.domainname = { DEFAULT_DOMAINNAME },
};
struct domainbinding *__bindings = &__default_binding;
char __current_domainname[PATH_MAX] = DEFAULT_DOMAINNAME;
static struct domainbinding *domainbinding_lookup(const char *, int);
/*
* set the default domainname for dcngettext() and friends.
*/
char *
textdomain(const char *domainname)
{
/* NULL pointer gives the current setting */
if (!domainname)
return __current_domainname;
/* empty string sets the value back to the default */
if (!*domainname) {
strlcpy(__current_domainname, DEFAULT_DOMAINNAME,
sizeof(__current_domainname));
} else {
strlcpy(__current_domainname, domainname,
sizeof(__current_domainname));
}
return __current_domainname;
}
char *
bindtextdomain(const char *domainname, const char *dirname)
{
struct domainbinding *p;
/* NULL pointer or empty string returns NULL with no operation */
if (!domainname || !*domainname)
return NULL;
if (dirname && (strlen(dirname) + 1 > sizeof(p->path)))
return NULL;
#if 0
/* disallow relative path */
if (dirname[0] != '/')
return NULL;
#endif
if (strlen(domainname) + 1 > sizeof(p->domainname))
return NULL;
p = domainbinding_lookup(domainname, (dirname != NULL));
if (!dirname) {
if (p)
return (p->path);
else
return (char *)__UNCONST(_PATH_TEXTDOMAIN);
}
strlcpy(p->path, dirname, sizeof(p->path));
p->mohandle.mo.mo_magic = 0; /* invalidate current mapping */
return (p->path);
}
char *
bind_textdomain_codeset(const char *domainname, const char *codeset)
{
struct domainbinding *p;
p = domainbinding_lookup(domainname, (codeset != NULL));
if (p == NULL)
return NULL;
if (codeset) {
free(p->codeset);
p->codeset = strdup(codeset);
}
return p->codeset;
}
/*
* lookup binding for the domainname
*/
static struct domainbinding *
domainbinding_lookup(const char *domainname, int alloc)
{
struct domainbinding *p;
for (p = __bindings; p; p = p->next)
if (strcmp(p->domainname, domainname) == 0)
break;
if (!p && alloc) {
p = (struct domainbinding *)malloc(sizeof(*p));
if (!p)
return NULL;
memset(p, 0, sizeof(*p));
p->next = __bindings;
strlcpy(p->domainname, domainname, sizeof(p->domainname));
__bindings = p;
}
return p;
}

5
share/i18n/Makefile Normal file
View File

@ -0,0 +1,5 @@
# $NetBSD: Makefile,v 1.1 2003/06/27 08:39:59 tshiozak Exp $
SUBDIR=csmapper esdb iconv
.include <bsd.subdir.mk>

View File

@ -0,0 +1,247 @@
# $NetBSD: CELTIC%UCS.src,v 1.1 2006/03/13 19:45:36 tnozaki Exp $
TYPE ROWCOL
NAME CELTIC/UCS
SRC_ZONE 0x00-0xFF
OOB_MODE ILSEQ
DST_ILSEQ 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: CELTIC.TXT
#
# Contents: Map (external version) from Mac OS Celtic
# character set to Unicode 2.1 and later
#
# Contacts: charsets@apple.com, everson@evertype.com
#
# Changes:
#
# c01 2005-Apr-01 First posted version. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Celtic code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Celtic code order.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Celtic character set uses the standard control characters
# at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Celtic (partly from Michael Everson):
# -----------------------------------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported via transcoding to and from
# Unicode.
#
# This character set was developed by Michael Everson of Everson
# Typography (everson@evertype.com) and was used for the Irish
# localizations of Mac OS 6.0.8 and 7.1, for the Welsh localization of
# Mac OS 7.1, and for several fonts that can be used on any version of
# Mac OS 7.1 or later. Note that while Apple authorized
# the Irish and Welsh localizations mentioned above, they were not
# systems which shipped with Apple hardware, and were not otherwise
# supported by Apple. Fonts conforming to the Mac OS Celtic character
# set are available from Everson Typography (http://www.evertype.com)
# and MEU Cymru (http://www.meucymru.co.uk). Information about the use
# of this character set is available at
# http://www.evertype.com/celtscript/celtcode.html.
#
# The Mac OS Celtic encoding shares the script code smRoman (0) with
# the standard Mac OS Roman encoding. To determine if the Celtic
# encoding is being used in Mac OS 7-9, you should also check if the
# system region code is 50, verIreland, or 79, verWales. Otherwise,
# you can check for particular fonts that conform to this encoding.
#
# This character set is a variant of standard Mac OS Roman, adding
# capital and small y with acute, grave, and circumflex, and capital
# and small w with acute, grave, circumflex and diaeresis. It has 14
# code point differences from standard Mac OS Roman (0xDE, 0xDF, 0xE2,
# 0xE3, 0xF6-0xFF).
#
# Before Mac OS 8.5, code point 0xDB was CURRENCY SIGN, and was
# mapped to U+00A4. In Mac OS 8.5 and later versions, code point
# 0xDB is changed to EURO SIGN and maps to U+20AC; the standard
# Apple fonts were updated for Mac OS 8.5 to reflect this. There is
# a "currency sign" variant of the Mac OS Celtic encoding that still
# maps 0xDB to U+00A4; this can be used for older fonts.
# Note: U+20AC is new with Unicode 2.1; for earlier Unicode
# versions, Mac OS Celtic 0xDB may be mapped to private-use
# character U+F8A0.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# Details of mapping changes in each version:
# -------------------------------------------
#
##################
0x00 - 0x7E = 0x0000 -
0x80 = 0x00C4
0x81 = 0x00C5
0x82 = 0x00C7
0x83 = 0x00C9
0x84 = 0x00D1
0x85 = 0x00D6
0x86 = 0x00DC
0x87 = 0x00E1
0x88 = 0x00E0
0x89 = 0x00E2
0x8A = 0x00E4
0x8B = 0x00E3
0x8C = 0x00E5
0x8D = 0x00E7
0x8E = 0x00E9
0x8F = 0x00E8
0x90 = 0x00EA
0x91 = 0x00EB
0x92 = 0x00ED
0x93 = 0x00EC
0x94 = 0x00EE
0x95 = 0x00EF
0x96 = 0x00F1
0x97 = 0x00F3
0x98 = 0x00F2
0x99 = 0x00F4
0x9A = 0x00F6
0x9B = 0x00F5
0x9C = 0x00FA
0x9D = 0x00F9
0x9E = 0x00FB
0x9F = 0x00FC
0xA0 = 0x2020
0xA1 = 0x00B0
0xA2 = 0x00A2
0xA3 = 0x00A3
0xA4 = 0x00A7
0xA5 = 0x2022
0xA6 = 0x00B6
0xA7 = 0x00DF
0xA8 = 0x00AE
0xA9 = 0x00A9
0xAA = 0x2122
0xAB = 0x00B4
0xAC = 0x00A8
0xAD = 0x2260
0xAE = 0x00C6
0xAF = 0x00D8
0xB0 = 0x221E
0xB1 = 0x00B1
0xB2 = 0x2264
0xB3 = 0x2265
0xB4 = 0x00A5
0xB5 = 0x00B5
0xB6 = 0x2202
0xB7 = 0x2211
0xB8 = 0x220F
0xB9 = 0x03C0
0xBA = 0x222B
0xBB = 0x00AA
0xBC = 0x00BA
0xBD = 0x03A9
0xBE = 0x00E6
0xBF = 0x00F8
0xC0 = 0x00BF
0xC1 = 0x00A1
0xC2 = 0x00AC
0xC3 = 0x221A
0xC4 = 0x0192
0xC5 = 0x2248
0xC6 = 0x2206
0xC7 = 0x00AB
0xC8 = 0x00BB
0xC9 = 0x2026
0xCA = 0x00A0
0xCB = 0x00C0
0xCC = 0x00C3
0xCD = 0x00D5
0xCE = 0x0152
0xCF = 0x0153
0xD0 = 0x2013
0xD1 = 0x2014
0xD2 = 0x201C
0xD3 = 0x201D
0xD4 = 0x2018
0xD5 = 0x2019
0xD6 = 0x00F7
0xD7 = 0x25CA
0xD8 = 0x00FF
0xD9 = 0x0178
0xDA = 0x2044
0xDB = 0x20AC
0xDC = 0x2039
0xDD = 0x203A
0xDE = 0x0176
0xDF = 0x0177
0xE0 = 0x2021
0xE1 = 0x00B7
0xE2 = 0x1EF2
0xE3 = 0x1EF3
0xE4 = 0x2030
0xE5 = 0x00C2
0xE6 = 0x00CA
0xE7 = 0x00C1
0xE8 = 0x00CB
0xE9 = 0x00C8
0xEA = 0x00CD
0xEB = 0x00CE
0xEC = 0x00CF
0xED = 0x00CC
0xEE = 0x00D3
0xEF = 0x00D4
0xF0 = 0x2663
0xF1 = 0x00D2
0xF2 = 0x00DA
0xF3 = 0x00DB
0xF4 = 0x00D9
0xF5 = 0x0131
0xF6 = 0x00DD
0xF7 = 0x00FD
0xF8 = 0x0174
0xF9 = 0x0175
0xFA = 0x1E84
0xFB = 0x1E85
0xFC = 0x1E80
0xFD = 0x1E81
0xFE = 0x1E82
0xFF = 0x1E83
END_MAP

View File

@ -0,0 +1,246 @@
# $NetBSD: CENTEURO%UCS.src,v 1.1 2006/03/13 19:45:36 tnozaki Exp $
TYPE ROWCOL
NAME CENTEURO/UCS
SRC_ZONE 0x00-0xFF
OOB_MODE ILSEQ
DST_ILSEQ 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: CENTEURO.TXT
#
# Contents: Map (external version) from Mac OS Central European
# character set to Unicode 2.1 and later.
#
# Copyright: (c) 1995-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c02 2005-Apr-04 Update header comments. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
# b3,c1 2002-Dec-19 Update URLs. Matches internal utom<b1>.
# b02 1999-Sep-22 Update contact e-mail address. Matches
# internal utom<b1>, ufrm<b1>, and Text
# Encoding Converter version 1.5.
# n05 1998-Feb-05 Update header comments to new format; no
# mapping changes. Matches internal utom<n3>,
# ufrm<n13>, and Text Encoding Converter
# version 1.3.
# n03 1995-Apr-15 First version (after fixing some typos).
# Matches internal ufrm<n5>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Central European code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Central European code order.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Central European character set uses the standard control
# characters at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Central European:
# ---------------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported directly in programming
# interfaces for QuickDraw Text, the Script Manager, and related
# Text Utilities. For other purposes it is supported via transcoding
# to and from Unicode.
#
# This character set is intended to cover the following languages:
#
# Polish, Czech, Slovak, Hungarian, Estonian, Latvian, Lithuanian
#
# These are written in Latin script, but using a different set of
# of accented characters than Mac OS Roman. The Mac OS Central
# European character set also includes a number of characters
# needed for the Mac OS user interface and localization (e.g.
# ellipsis, bullet, copyright sign), several typographic
# punctuation symbols, math symbols, etc. However, it has a
# smaller set of punctuation and symbols than Mac OS Roman. All of
# the characters in Mac OS Central European that are also in the
# Mac OS Roman character set are at the same code point in both
# character sets; this improves application compatibility.
#
# Note: This does not have the same letter repertoire as ISO
# 8859-2 (Latin-2); each has some accented letters that the other
# does not have.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# Details of mapping changes in each version:
# -------------------------------------------
#
##################
0x00 - 0x7F = 0x0000 -
0x80 = 0x00C4
0x81 = 0x0100
0x82 = 0x0101
0x83 = 0x00C9
0x84 = 0x0104
0x85 = 0x00D6
0x86 = 0x00DC
0x87 = 0x00E1
0x88 = 0x0105
0x89 = 0x010C
0x8A = 0x00E4
0x8B = 0x010D
0x8C = 0x0106
0x8D = 0x0107
0x8E = 0x00E9
0x8F = 0x0179
0x90 = 0x017A
0x91 = 0x010E
0x92 = 0x00ED
0x93 = 0x010F
0x94 = 0x0112
0x95 = 0x0113
0x96 = 0x0116
0x97 = 0x00F3
0x98 = 0x0117
0x99 = 0x00F4
0x9A = 0x00F6
0x9B = 0x00F5
0x9C = 0x00FA
0x9D = 0x011A
0x9E = 0x011B
0x9F = 0x00FC
0xA0 = 0x2020
0xA1 = 0x00B0
0xA2 = 0x0118
0xA3 = 0x00A3
0xA4 = 0x00A7
0xA5 = 0x2022
0xA6 = 0x00B6
0xA7 = 0x00DF
0xA8 = 0x00AE
0xA9 = 0x00A9
0xAA = 0x2122
0xAB = 0x0119
0xAC = 0x00A8
0xAD = 0x2260
0xAE = 0x0123
0xAF = 0x012E
0xB0 = 0x012F
0xB1 = 0x012A
0xB2 = 0x2264
0xB3 = 0x2265
0xB4 = 0x012B
0xB5 = 0x0136
0xB6 = 0x2202
0xB7 = 0x2211
0xB8 = 0x0142
0xB9 = 0x013B
0xBA = 0x013C
0xBB = 0x013D
0xBC = 0x013E
0xBD = 0x0139
0xBE = 0x013A
0xBF = 0x0145
0xC0 = 0x0146
0xC1 = 0x0143
0xC2 = 0x00AC
0xC3 = 0x221A
0xC4 = 0x0144
0xC5 = 0x0147
0xC6 = 0x2206
0xC7 = 0x00AB
0xC8 = 0x00BB
0xC9 = 0x2026
0xCA = 0x00A0
0xCB = 0x0148
0xCC = 0x0150
0xCD = 0x00D5
0xCE = 0x0151
0xCF = 0x014C
0xD0 = 0x2013
0xD1 = 0x2014
0xD2 = 0x201C
0xD3 = 0x201D
0xD4 = 0x2018
0xD5 = 0x2019
0xD6 = 0x00F7
0xD7 = 0x25CA
0xD8 = 0x014D
0xD9 = 0x0154
0xDA = 0x0155
0xDB = 0x0158
0xDC = 0x2039
0xDD = 0x203A
0xDE = 0x0159
0xDF = 0x0156
0xE0 = 0x0157
0xE1 = 0x0160
0xE2 = 0x201A
0xE3 = 0x201E
0xE4 = 0x0161
0xE5 = 0x015A
0xE6 = 0x015B
0xE7 = 0x00C1
0xE8 = 0x0164
0xE9 = 0x0165
0xEA = 0x00CD
0xEB = 0x017D
0xEC = 0x017E
0xED = 0x016A
0xEE = 0x00D3
0xEF = 0x00D4
0xF0 = 0x016B
0xF1 = 0x016E
0xF2 = 0x00DA
0xF3 = 0x016F
0xF4 = 0x0170
0xF5 = 0x0171
0xF6 = 0x0172
0xF7 = 0x0173
0xF8 = 0x00DD
0xF9 = 0x00FD
0xFA = 0x0137
0xFB = 0x017B
0xFC = 0x0141
0xFD = 0x017C
0xFE = 0x0122
0xFF = 0x02C7
END_MAP

View File

@ -0,0 +1,270 @@
# $NetBSD: CROATIAN%UCS.src,v 1.1 2006/03/13 19:45:36 tnozaki Exp $
TYPE ROWCOL
NAME CROATIAN/UCS
SRC_ZONE 0x00-0xFF
OOB_MODE ILSEQ
DST_ILSEQ 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: CROATIAN.TXT
#
# Contents: Map (external version) from Mac OS Croatian
# character set to Unicode 2.1 and later.
#
# Copyright: (c) 1995-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c02 2005-Apr-04 Update header comments. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
# b3,c1 2002-Dec-19 Update URLs, notes. Matches internal
# utom<b3>.
# b02 1999-Sep-22 Encoding changed for Mac OS 8.5; change
# mapping of 0xDB from CURRENCY SIGN to EURO
# SIGN. Update contact e-mail address. Matches
# internal utom<b2>, ufrm<b2>, and Text
# Encoding Converter version 1.5.
# n07 1998-Feb-05 Minor update to header comments
# n05 1997-Dec-14 Update to match internal utom<5>, ufrm<16>:
# Change standard mapping for 0xBD from U+2126
# to its canonical decomposition, U+03A9.
# n03 1995-Apr-15 First version (after fixing some typos).
# Matches internal ufrm<6>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Croatian code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Croatian code order.
#
# One of these mappings requires the use of a corporate character.
# See the file "CORPCHAR.TXT" and notes below.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Croatian character set uses the standard control characters
# at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Croatian:
# -------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported via transcoding to and from
# Unicode.
#
# Mac OS Croatian is used for Croatian and Slovene.
#
# The Mac OS Croatian encoding shares the script code smRoman
# (0) with the standard Mac OS Roman encoding. To determine if
# the Croatian encoding is being used, you must check if the
# system region code is 68, verCroatia (or 25, verYugoCroatian,
# only used in older systems).
#
# This character set is a variant of standard Mac OS Roman
# encoding, adding five accented letter case pairs to handle
# Croatian. It has 20 code point differences from standard
# Mac OS Roman, but only 10 differences in repertoire.
#
# Before Mac OS 8.5, code point 0xDB was CURRENCY SIGN, and was
# mapped to U+00A4. In Mac OS 8.5 and later versions, code point
# 0xDB is changed to EURO SIGN and maps to U+20AC; the standard
# Apple fonts are updated for Mac OS 8.5 to reflect this. There is
# a "currency sign" variant of the Mac OS Croatian encoding that
# still maps 0xDB to U+00A4; this can be used for older fonts.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# The following corporate zone Unicode character is used in this
# mapping:
#
# 0xF8FF Apple logo
#
# NOTE: The graphic image associated with the Apple logo character
# is not authorized for use without permission of Apple, and
# unauthorized use might constitute trademark infringement.
#
# Details of mapping changes in each version:
# -------------------------------------------
#
# Changes from version n07 to version b02:
#
# - Encoding changed for Mac OS 8.5; change mapping of 0xDB from
# CURRENCY SIGN (U+00A4) to EURO SIGN (U+20AC).
#
# Changes from version n03 to version n05:
#
# - Change mapping of 0xBD from U+2126 to its canonical
# decomposition, U+03A9.
#
##################
0x00 - 0x7E = 0x0000 -
0x80 = 0x00C4
0x81 = 0x00C5
0x82 = 0x00C7
0x83 = 0x00C9
0x84 = 0x00D1
0x85 = 0x00D6
0x86 = 0x00DC
0x87 = 0x00E1
0x88 = 0x00E0
0x89 = 0x00E2
0x8A = 0x00E4
0x8B = 0x00E3
0x8C = 0x00E5
0x8D = 0x00E7
0x8E = 0x00E9
0x8F = 0x00E8
0x90 = 0x00EA
0x91 = 0x00EB
0x92 = 0x00ED
0x93 = 0x00EC
0x94 = 0x00EE
0x95 = 0x00EF
0x96 = 0x00F1
0x97 = 0x00F3
0x98 = 0x00F2
0x99 = 0x00F4
0x9A = 0x00F6
0x9B = 0x00F5
0x9C = 0x00FA
0x9D = 0x00F9
0x9E = 0x00FB
0x9F = 0x00FC
0xA0 = 0x2020
0xA1 = 0x00B0
0xA2 = 0x00A2
0xA3 = 0x00A3
0xA4 = 0x00A7
0xA5 = 0x2022
0xA6 = 0x00B6
0xA7 = 0x00DF
0xA8 = 0x00AE
0xA9 = 0x0160
0xAA = 0x2122
0xAB = 0x00B4
0xAC = 0x00A8
0xAD = 0x2260
0xAE = 0x017D
0xAF = 0x00D8
0xB0 = 0x221E
0xB1 = 0x00B1
0xB2 = 0x2264
0xB3 = 0x2265
0xB4 = 0x2206
0xB5 = 0x00B5
0xB6 = 0x2202
0xB7 = 0x2211
0xB8 = 0x220F
0xB9 = 0x0161
0xBA = 0x222B
0xBB = 0x00AA
0xBC = 0x00BA
0xBD = 0x03A9
0xBE = 0x017E
0xBF = 0x00F8
0xC0 = 0x00BF
0xC1 = 0x00A1
0xC2 = 0x00AC
0xC3 = 0x221A
0xC4 = 0x0192
0xC5 = 0x2248
0xC6 = 0x0106
0xC7 = 0x00AB
0xC8 = 0x010C
0xC9 = 0x2026
0xCA = 0x00A0
0xCB = 0x00C0
0xCC = 0x00C3
0xCD = 0x00D5
0xCE = 0x0152
0xCF = 0x0153
0xD0 = 0x0110
0xD1 = 0x2014
0xD2 = 0x201C
0xD3 = 0x201D
0xD4 = 0x2018
0xD5 = 0x2019
0xD6 = 0x00F7
0xD7 = 0x25CA
0xD8 = 0xF8FF
0xD9 = 0x00A9
0xDA = 0x2044
0xDB = 0x20AC
0xDC = 0x2039
0xDD = 0x203A
0xDE = 0x00C6
0xDF = 0x00BB
0xE0 = 0x2013
0xE1 = 0x00B7
0xE2 = 0x201A
0xE3 = 0x201E
0xE4 = 0x2030
0xE5 = 0x00C2
0xE6 = 0x0107
0xE7 = 0x00C1
0xE8 = 0x010D
0xE9 = 0x00C8
0xEA = 0x00CD
0xEB = 0x00CE
0xEC = 0x00CF
0xED = 0x00CC
0xEE = 0x00D3
0xEF = 0x00D4
0xF0 = 0x0111
0xF1 = 0x00D2
0xF2 = 0x00DA
0xF3 = 0x00DB
0xF4 = 0x00D9
0xF5 = 0x0131
0xF6 = 0x02C6
0xF7 = 0x02DC
0xF8 = 0x00AF
0xF9 = 0x03C0
0xFA = 0x00CB
0xFB = 0x02DA
0xFC = 0x00B8
0xFD = 0x00CA
0xFE = 0x00E6
0xFF = 0x02C7
END_MAP

View File

@ -0,0 +1,271 @@
# $NetBSD: CYRILLIC%UCS.src,v 1.1 2006/03/13 19:45:36 tnozaki Exp $
TYPE ROWCOL
NAME CYRILLIC/UCS
SRC_ZONE 0x00-0xFF
OOB_MODE ILSEQ
DST_ILSEQ 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: CYRILLIC.TXT
#
# Contents: Map (external version) from Mac OS Cyrillic
# character set to Unicode 2.1 and later.
#
# Copyright: (c) 1995-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c03 2005-Apr-05 Update header comments. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
# b3,c1 2002-Dec-19 Update URLs, notes. Matches internal
# utom<b2>.
# b02 1999-Sep-22 Encoding changed for Mac OS 9.0 to merge
# with Mac OS Ukrainian and support EURO SIGN;
# Change mappings for 0xA2, 0xB6, and 0xFF.
# Update contact e-mail address. Matches
# internal utom<b2>, ufrm<b2>, and Text
# Encoding Converter version 1.5.
# n05 1998-Feb-05 Update header comments to new format; no
# mapping changes. Matches internal utom<n3>,
# ufrm<n13>, and Text Encoding Converter
# version 1.3.
# n03 1995-Apr-15 First version (after fixing some typos).
# Matches internal ufrm<n5>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Cyrillic code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Cyrillic code order.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Cyrillic character set uses the standard control characters
# at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Cyrillic:
# -------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported directly in programming
# interfaces for QuickDraw Text, the Script Manager, and related
# Text Utilities. For other purposes it is supported via transcoding
# to and from Unicode.
#
# This is the "Euro sign" version of Mac Cyrillic for Mac OS 9.0 and
# later. Before Mac OS 9.0, there were two separate Slavic Cyrillic
# encodings:
#
# 1. The Cyrillic currency sign variant (used for localized Russian
# and Bulgarian systems), which had the following:
# 0xA2 U+00A2 CENT SIGN
# 0xB6 U+2202 PARTIAL DIFFERENTIAL
# 0xFF U+00A4 CURRENCY SIGN
#
# 2. The Ukrainian currency sign variant (used for localized Ukrainian
# systems and the pre-9.0 Cyrillic Language Kit), which had the
# following:
# 0xA2 U+0490 CYRILLIC CAPITAL LETTER GHE WITH UPTURN
# 0xB6 U+0491 CYRILLIC SMALL LETTER GHE WITH UPTURN
# 0xFF U+00A4 CURRENCY SIGN
#
# This new Cyrillic Euro sign version is based on the old Ukrainian
# currency sign variant, with 0xFF changed to be EURO SIGN.
#
# The Mac OS Cyrillic encoding includes the Cyrillic letter repertoire
# of ISO 8859-5 (although not at the same code points). This covers
# most of the Slavic languages written in Cyrillic script.
#
# The Mac OS Cyrillic encoding also includes a number of characters
# needed for the Mac OS user interface and localization (e.g.
# ellipsis, bullet, copyright sign). All of the characters in Mac OS
# Cyrillic that are also in the Mac OS Roman encoding are at the
# same code point in both; this improves application compatibility.
#
# Note: There is a common Ukrainian glyph variation in which the glyph
# for CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I may or may not
# have a dot above.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# Details of mapping changes in each version:
# -------------------------------------------
#
# Changes from version n05 to version b02:
#
# - Encoding changed for Mac OS 9.0 to merge with Mac OS Ukrainian and
# support EURO SIGN. 0xA2 changed from U+00A2 to U+0490; 0xB6 changed
# from U+2202 to U+0491; 0xFF changed from U+00A4 to U+20AC.
#
##################
0x00 - 0x7E = 0x00 -
0x80 = 0x0410
0x81 = 0x0411
0x82 = 0x0412
0x83 = 0x0413
0x84 = 0x0414
0x85 = 0x0415
0x86 = 0x0416
0x87 = 0x0417
0x88 = 0x0418
0x89 = 0x0419
0x8A = 0x041A
0x8B = 0x041B
0x8C = 0x041C
0x8D = 0x041D
0x8E = 0x041E
0x8F = 0x041F
0x90 = 0x0420
0x91 = 0x0421
0x92 = 0x0422
0x93 = 0x0423
0x94 = 0x0424
0x95 = 0x0425
0x96 = 0x0426
0x97 = 0x0427
0x98 = 0x0428
0x99 = 0x0429
0x9A = 0x042A
0x9B = 0x042B
0x9C = 0x042C
0x9D = 0x042D
0x9E = 0x042E
0x9F = 0x042F
0xA0 = 0x2020
0xA1 = 0x00B0
0xA2 = 0x0490
0xA3 = 0x00A3
0xA4 = 0x00A7
0xA5 = 0x2022
0xA6 = 0x00B6
0xA7 = 0x0406
0xA8 = 0x00AE
0xA9 = 0x00A9
0xAA = 0x2122
0xAB = 0x0402
0xAC = 0x0452
0xAD = 0x2260
0xAE = 0x0403
0xAF = 0x0453
0xB0 = 0x221E
0xB1 = 0x00B1
0xB2 = 0x2264
0xB3 = 0x2265
0xB4 = 0x0456
0xB5 = 0x00B5
0xB6 = 0x0491
0xB7 = 0x0408
0xB8 = 0x0404
0xB9 = 0x0454
0xBA = 0x0407
0xBB = 0x0457
0xBC = 0x0409
0xBD = 0x0459
0xBE = 0x040A
0xBF = 0x045A
0xC0 = 0x0458
0xC1 = 0x0405
0xC2 = 0x00AC
0xC3 = 0x221A
0xC4 = 0x0192
0xC5 = 0x2248
0xC6 = 0x2206
0xC7 = 0x00AB
0xC8 = 0x00BB
0xC9 = 0x2026
0xCA = 0x00A0
0xCB = 0x040B
0xCC = 0x045B
0xCD = 0x040C
0xCE = 0x045C
0xCF = 0x0455
0xD0 = 0x2013
0xD1 = 0x2014
0xD2 = 0x201C
0xD3 = 0x201D
0xD4 = 0x2018
0xD5 = 0x2019
0xD6 = 0x00F7
0xD7 = 0x201E
0xD8 = 0x040E
0xD9 = 0x045E
0xDA = 0x040F
0xDB = 0x045F
0xDC = 0x2116
0xDD = 0x0401
0xDE = 0x0451
0xDF = 0x044F
0xE0 = 0x0430
0xE1 = 0x0431
0xE2 = 0x0432
0xE3 = 0x0433
0xE4 = 0x0434
0xE5 = 0x0435
0xE6 = 0x0436
0xE7 = 0x0437
0xE8 = 0x0438
0xE9 = 0x0439
0xEA = 0x043A
0xEB = 0x043B
0xEC = 0x043C
0xED = 0x043D
0xEE = 0x043E
0xEF = 0x043F
0xF0 = 0x0440
0xF1 = 0x0441
0xF2 = 0x0442
0xF3 = 0x0443
0xF4 = 0x0444
0xF5 = 0x0445
0xF6 = 0x0446
0xF7 = 0x0447
0xF8 = 0x0448
0xF9 = 0x0449
0xFA = 0x044A
0xFB = 0x044B
0xFC = 0x044C
0xFD = 0x044D
0xFE = 0x044E
0xFF = 0x20AC
END_MAP

View File

@ -0,0 +1,340 @@
# $NetBSD: DINGBATS%UCS.src,v 1.1 2006/03/13 19:45:36 tnozaki Exp $
TYPE ROWCOL
NAME DINGBATS/UCS
SRC_ZONE 0x00-0xFF
OOB_MODE ILSEQ
DST_ILSEQ 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: DINGBATS.TXT
#
# Contents: Map (external version) from Mac OS Dingbats
# character set to Unicode 3.2 and later.
#
# Copyright: (c) 1994-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c02 2005-Apr-05 Update header comments. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
# b3,c1 2002-Dec-19 Update mappings for 0x80-0x8D to use new
# Unicode 3.2 characters. Update URLs, notes.
# Matches internal utom<b2>.
# b02 1999-Sep-22 Update contact e-mail address. Matches
# internal utom<b1>, ufrm<b1>, and Text
# Encoding Converter version 1.5.
# n05 1998-Feb-05 Update to match internal utom<n4>, ufrm<n14>,
# and Text Encoding Converter version 1.3:
# Change all mappings to single corporate-zone
# Unicodes to either use standard Unicodes
# or standard Unicodes plus transcoding hints;
# see details below. Also update header
# comments to new format.
# n03 1995-Apr-15 First version (after fixing some typos).
# Matches internal ufrm<n4>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Dingbats code (in hex as 0xNN)
# Column #2 is the corresponding Unicode or Unicode sequence
# (in hex as 0xNNNN).
# Column #3 is a comment containing the Unicode name.
# In some cases an additional comment follows the Unicode name.
#
# The entries are in Mac OS Dingbats code order.
#
# Some of these mappings require the use of corporate characters.
# See the file "CORPCHAR.TXT" and notes below.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Dingbats character set uses the standard control characters
# at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Dingbats:
# -------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported directly in programming
# interfaces for QuickDraw Text, the Script Manager, and related
# Text Utilities. For other purposes it is supported via transcoding
# to and from Unicode.
#
# The Mac OS Dingbats encoding shares the script code smRoman
# (0) with the standard Mac OS Roman encoding. To determine if
# the Dingbats encoding is being used, you must check if the
# font name is "Zapf Dingbats".
#
# The layout of the Dingbats character set is identical to or
# a superset of the layout of the Adobe Zapf Dingbats encoding
# vector.
#
# The following code points are unused, and are not shown here:
# 0x8E-0xA0, 0xF0, 0xFF.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# Details of mapping changes in each version:
# -------------------------------------------
#
# Changes from version b02 to version b03/c01:
#
# - The mappings for the following Mac OS Dingbats characters
# were changed to use standard Unicode characters added for
# Unicode 3.2: 0x80-0x8D.
#
# Changes from version n03 to version n05:
#
# - The mappings for the following Mac OS Dingbats characters
# were changed from single corporate-zone Unicode characters
# to standard Unicode characters:
# 0x80-0x81, 0x84-0x87, 0x8A-0x8D.
#
# - The mappings for the following Mac OS Dingbats characters
# were changed from single corporate-zone Unicode characters
# to combinations of a standard Unicode and a transcoding hint:
# 0x82-0x83, 0x88-0x89.
#
##################
0x00 - 0x20 = 0x00 -
0x21 = 0x2701
0x22 = 0x2702
0x23 = 0x2703
0x24 = 0x2704
0x25 = 0x260E
0x26 = 0x2706
0x27 = 0x2707
0x28 = 0x2708
0x29 = 0x2709
0x2A = 0x261B
0x2B = 0x261E
0x2C = 0x270C
0x2D = 0x270D
0x2E = 0x270E
0x2F = 0x270F
0x30 = 0x2710
0x31 = 0x2711
0x32 = 0x2712
0x33 = 0x2713
0x34 = 0x2714
0x35 = 0x2715
0x36 = 0x2716
0x37 = 0x2717
0x38 = 0x2718
0x39 = 0x2719
0x3A = 0x271A
0x3B = 0x271B
0x3C = 0x271C
0x3D = 0x271D
0x3E = 0x271E
0x3F = 0x271F
0x40 = 0x2720
0x41 = 0x2721
0x42 = 0x2722
0x43 = 0x2723
0x44 = 0x2724
0x45 = 0x2725
0x46 = 0x2726
0x47 = 0x2727
0x48 = 0x2605
0x49 = 0x2729
0x4A = 0x272A
0x4B = 0x272B
0x4C = 0x272C
0x4D = 0x272D
0x4E = 0x272E
0x4F = 0x272F
0x50 = 0x2730
0x51 = 0x2731
0x52 = 0x2732
0x53 = 0x2733
0x54 = 0x2734
0x55 = 0x2735
0x56 = 0x2736
0x57 = 0x2737
0x58 = 0x2738
0x59 = 0x2739
0x5A = 0x273A
0x5B = 0x273B
0x5C = 0x273C
0x5D = 0x273D
0x5E = 0x273E
0x5F = 0x273F
0x60 = 0x2740
0x61 = 0x2741
0x62 = 0x2742
0x63 = 0x2743
0x64 = 0x2744
0x65 = 0x2745
0x66 = 0x2746
0x67 = 0x2747
0x68 = 0x2748
0x69 = 0x2749
0x6A = 0x274A
0x6B = 0x274B
0x6C = 0x25CF
0x6D = 0x274D
0x6E = 0x25A0
0x6F = 0x274F
0x70 = 0x2750
0x71 = 0x2751
0x72 = 0x2752
0x73 = 0x25B2
0x74 = 0x25BC
0x75 = 0x25C6
0x76 = 0x2756
0x77 = 0x25D7
0x78 = 0x2758
0x79 = 0x2759
0x7A = 0x275A
0x7B = 0x275B
0x7C = 0x275C
0x7D = 0x275D
0x7E = 0x275E
0x80 = 0x2768
0x81 = 0x2769
0x82 = 0x276A
0x83 = 0x276B
0x84 = 0x276C
0x85 = 0x276D
0x86 = 0x276E
0x87 = 0x276F
0x88 = 0x2770
0x89 = 0x2771
0x8A = 0x2772
0x8B = 0x2773
0x8C = 0x2774
0x8D = 0x2775
0xA1 = 0x2761
0xA2 = 0x2762
0xA3 = 0x2763
0xA4 = 0x2764
0xA5 = 0x2765
0xA6 = 0x2766
0xA7 = 0x2767
0xA8 = 0x2663
0xA9 = 0x2666
0xAA = 0x2665
0xAB = 0x2660
0xAC = 0x2460
0xAD = 0x2461
0xAE = 0x2462
0xAF = 0x2463
0xB0 = 0x2464
0xB1 = 0x2465
0xB2 = 0x2466
0xB3 = 0x2467
0xB4 = 0x2468
0xB5 = 0x2469
0xB6 = 0x2776
0xB7 = 0x2777
0xB8 = 0x2778
0xB9 = 0x2779
0xBA = 0x277A
0xBB = 0x277B
0xBC = 0x277C
0xBD = 0x277D
0xBE = 0x277E
0xBF = 0x277F
0xC0 = 0x2780
0xC1 = 0x2781
0xC2 = 0x2782
0xC3 = 0x2783
0xC4 = 0x2784
0xC5 = 0x2785
0xC6 = 0x2786
0xC7 = 0x2787
0xC8 = 0x2788
0xC9 = 0x2789
0xCA = 0x278A
0xCB = 0x278B
0xCC = 0x278C
0xCD = 0x278D
0xCE = 0x278E
0xCF = 0x278F
0xD0 = 0x2790
0xD1 = 0x2791
0xD2 = 0x2792
0xD3 = 0x2793
0xD4 = 0x2794
0xD5 = 0x2192
0xD6 = 0x2194
0xD7 = 0x2195
0xD8 = 0x2798
0xD9 = 0x2799
0xDA = 0x279A
0xDB = 0x279B
0xDC = 0x279C
0xDD = 0x279D
0xDE = 0x279E
0xDF = 0x279F
0xE0 = 0x27A0
0xE1 = 0x27A1
0xE2 = 0x27A2
0xE3 = 0x27A3
0xE4 = 0x27A4
0xE5 = 0x27A5
0xE6 = 0x27A6
0xE7 = 0x27A7
0xE8 = 0x27A8
0xE9 = 0x27A9
0xEA = 0x27AA
0xEB = 0x27AB
0xEC = 0x27AC
0xED = 0x27AD
0xEE = 0x27AE
0xEF = 0x27AF
0xF1 = 0x27B1
0xF2 = 0x27B2
0xF3 = 0x27B3
0xF4 = 0x27B4
0xF5 = 0x27B5
0xF6 = 0x27B6
0xF7 = 0x27B7
0xF8 = 0x27B8
0xF9 = 0x27B9
0xFA = 0x27BA
0xFB = 0x27BB
0xFC = 0x27BC
0xFD = 0x27BD
0xFE = 0x27BE
END_MAP

View File

@ -0,0 +1,256 @@
# $NetBSD: GAELIC%UCS.src,v 1.1 2006/03/13 19:45:36 tnozaki Exp $
TYPE ROWCOL
NAME GAELIC/UCS
SRC_ZONE 0x00-0xFF
OOB_MODE ILSEQ
DST_ILSEQ 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: GAELIC.TXT
#
# Contents: Map (external version) from Mac OS Celtic
# character set to Unicode 3.0 and later
#
# Contacts: charsets@apple.com, everson@evertype.com
#
# Changes:
#
# c01 2005-Apr-01 First posted version. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Gaelic code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Gaelic code order.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Gaelic character set uses the standard control characters
# at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Gaelic (partly from Michael Everson):
# -----------------------------------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported via transcoding to and from
# Unicode.
#
# This character set was developed by Michael Everson of Everson
# Typography (everson@evertype.com) and was used for fonts in his
# Celtic Utilities and CeltScript font packages for the Mac, as well
# as some fonts included with the Irish localizations of Mac OS 6.0.8
# and 7.1. Note that while Apple authorized this Irish localization,
# it was not a system which shipped with Apple hardware, and was not
# otherwise supported by Apple. Fonts conforming to the Mac OS Gaelic
# character set are available from Everson Typography
# (http://www.evertype.com/celtscript/). Information about the use of
# this character set is available at
# http://www.evertype.com/celtscript/celtcode.html.
#
# The Mac OS Gaelic encoding shares the script code smRoman (0) with
# the standard Mac OS Roman encoding. To determine if the Gaelic
# encoding is being used in Mac OS 7-9, you should also check if the
# system region code is 81. Otherwise, you can check for particular
# fonts that conform to this encoding (since in practice Gaelic fonts
# are used with the ordinary US or UK system versions).
#
# This character set is a variant of standard Mac OS Roman, adding
# capital and small y with acute, grave, and circumflex; capital and
# small w with acute, grave, circumflex and diaeresis; capital and
# small b, c, d, f, g, m, p, s, t with dot above; tironian et; small
# long r, small long s, and small long s with dot above. It has 36
# code point differences from standard Mac OS Roman.
#
# Before Mac OS 8.5, code point 0xDB was CURRENCY SIGN, and was
# mapped to U+00A4. In Mac OS 8.5 and later versions, code point
# 0xDB is changed to EURO SIGN and maps to U+20AC; the standard
# Apple fonts are updated for Mac OS 8.5 to reflect this. There is
# a "currency sign" variant of the Latin 8 Extended encoding that still
# maps 0xDB to U+00A4; this can be used for older fonts.
# Note: U+20AC is new with Unicode 2.1; for earlier Unicode
# versions, Latin 8 Extended 0xDB may be mapped to private-use
# character U+F8A0.
#
# Before Unicode 3.0, code point 0xE4 was PER MILLE SIGN, and was
# mapped to U+2030. Since August 1998, code point 0xE4 is changed
# to TIRONIAN SIGN ET and maps to U+204A. There is a "per mille
# sign" variant of the Mac OS Gaelic encoding that still
# maps 0xE4 to U+2030; this can be used for older fonts.
# Note: U+204A is new with Unicode 3.0; for earlier Unicode
# versions, Mac OS Gaelic was unified with AMPERSAND.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# Details of mapping changes in each version:
# -------------------------------------------
#
##################
0x00 - 0x7E = 0x00 -
0x80 = 0x00C4
0x81 = 0x00C5
0x82 = 0x00C7
0x83 = 0x00C9
0x84 = 0x00D1
0x85 = 0x00D6
0x86 = 0x00DC
0x87 = 0x00E1
0x88 = 0x00E0
0x89 = 0x00E2
0x8A = 0x00E4
0x8B = 0x00E3
0x8C = 0x00E5
0x8D = 0x00E7
0x8E = 0x00E9
0x8F = 0x00E8
0x90 = 0x00EA
0x91 = 0x00EB
0x92 = 0x00ED
0x93 = 0x00EC
0x94 = 0x00EE
0x95 = 0x00EF
0x96 = 0x00F1
0x97 = 0x00F3
0x98 = 0x00F2
0x99 = 0x00F4
0x9A = 0x00F6
0x9B = 0x00F5
0x9C = 0x00FA
0x9D = 0x00F9
0x9E = 0x00FB
0x9F = 0x00FC
0xA0 = 0x2020
0xA1 = 0x00B0
0xA2 = 0x00A2
0xA3 = 0x00A3
0xA4 = 0x00A7
0xA5 = 0x2022
0xA6 = 0x00B6
0xA7 = 0x00DF
0xA8 = 0x00AE
0xA9 = 0x00A9
0xAA = 0x2122
0xAB = 0x00B4
0xAC = 0x00A8
0xAD = 0x2260
0xAE = 0x00C6
0xAF = 0x00D8
0xB0 = 0x1E02
0xB1 = 0x00B1
0xB2 = 0x2264
0xB3 = 0x2265
0xB4 = 0x1E03
0xB5 = 0x010A
0xB6 = 0x010B
0xB7 = 0x1E0A
0xB8 = 0x1E0B
0xB9 = 0x1E1E
0xBA = 0x1E1F
0xBB = 0x0120
0xBC = 0x0121
0xBD = 0x1E40
0xBE = 0x00E6
0xBF = 0x00F8
0xC0 = 0x1E41
0xC1 = 0x1E56
0xC2 = 0x1E57
0xC3 = 0x027C
0xC4 = 0x0192
0xC5 = 0x017F
0xC6 = 0x1E60
0xC7 = 0x00AB
0xC8 = 0x00BB
0xC9 = 0x2026
0xCA = 0x00A0
0xCB = 0x00C0
0xCC = 0x00C3
0xCD = 0x00D5
0xCE = 0x0152
0xCF = 0x0153
0xD0 = 0x2013
0xD1 = 0x2014
0xD2 = 0x201C
0xD3 = 0x201D
0xD4 = 0x2018
0xD5 = 0x2019
0xD6 = 0x1E61
0xD7 = 0x1E9B
0xD8 = 0x00FF
0xD9 = 0x0178
0xDA = 0x1E6A
0xDB = 0x20AC
0xDC = 0x2039
0xDD = 0x203A
0xDE = 0x0176
0xDF = 0x0177
0xE0 = 0x1E6B
0xE1 = 0x00B7
0xE2 = 0x1EF2
0xE3 = 0x1EF3
0xE4 = 0x204A
0xE5 = 0x00C2
0xE6 = 0x00CA
0xE7 = 0x00C1
0xE8 = 0x00CB
0xE9 = 0x00C8
0xEA = 0x00CD
0xEB = 0x00CE
0xEC = 0x00CF
0xED = 0x00CC
0xEE = 0x00D3
0xEF = 0x00D4
0xF0 = 0x2663
0xF1 = 0x00D2
0xF2 = 0x00DA
0xF3 = 0x00DB
0xF4 = 0x00D9
0xF5 = 0x0131
0xF6 = 0x00DD
0xF7 = 0x00FD
0xF8 = 0x0174
0xF9 = 0x0175
0xFA = 0x1E84
0xFB = 0x1E85
0xFC = 0x1E80
0xFD = 0x1E81
0xFE = 0x1E82
0xFF = 0x1E83
END_MAP

View File

@ -0,0 +1,274 @@
# $NetBSD: GREEK%UCS.src,v 1.1 2006/03/13 19:45:36 tnozaki Exp $
TYPE ROWCOL
NAME GREEK/UCS
SRC_ZONE 0x00-0xFF
OOB_MODE ILSEQ
DST_ILSEQ 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: GREEK.TXT
#
# Contents: Map (external version) from Mac OS Greek
# character set to Unicode 2.1 and later.
#
# Copyright: (c) 1995-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c02 2005-Apr-05 Update header comments. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
# b3,c1 2002-Dec-19 Update to match changes in Mac OS Greek
# encoding for Mac OS 9.2.2 and later.
# Update URLs, notes. Matches internal
# utom<b3>.
# b02 1999-Sep-22 Update contact e-mail address. Matches
# internal utom<b1>, ufrm<b1>, and Text
# Encoding Converter version 1.5.
# n06 1998-Feb-05 Update to match internal utom<n4>, ufrm<n17>,
# and Text Encoding Converter versions 1.3:
# Change mapping for 0xAF from U+0387 to its
# canonical decomposition, U+00B7. Also
# update header comments to new format.
# n04 1995-Apr-15 First version (after fixing some typos).
# Matches internal ufrm<n7>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Greek code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Greek code order.
#
# One of these mappings requires the use of a corporate character.
# See the file "CORPCHAR.TXT" and notes below.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Greek character set uses the standard control characters at
# 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Greek:
# ----------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported via transcoding to and from
# Unicode.
#
# Although a Mac OS script code is defined for Greek (smGreek = 6),
# the Greek localized system does not currently use it (the font
# family IDs are in the Mac OS Roman range). To determine if the
# Greek encoding is being used when the script code is smRoman (0),
# you must check if the system region code is 20, verGreece.
#
# The Mac OS Greek encoding is a superset of the repertoire of
# ISO 8859-7 (although characters are not at the same code points),
# except that LEFT & RIGHT SINGLE QUOTATION MARK replace the
# MODIFIER LETTER REVERSED COMMA & APOSTROPHE (spacing versions of
# Greek rough & smooth breathing marks) that are in ISO 8859-7.
# The added characters in Mac OS Greek include more punctuation and
# symbols and several accented Latin letters.
#
# Before Mac OS 9.2.2, code point 0x9C was SOFT HYPHEN (U+00AD), and
# code point 0xFF was undefined. In Mac OS 9.2.2 and later versions,
# SOFT HYPHEN was moved to 0xFF, and code point 0x9C was changed to be
# EURO SIGN (U+20AC); the standard Apple fonts are updated for Mac OS
# 9.2.2 to reflect this. There is a "no Euro sign" variant of the Mac
# OS Greek encoding that uses the older mapping; this can be used for
# older fonts.
#
# This "no Euro sign" variant of Mac OS Greek was the character set
# used by Mac OS Greek systems before 9.2.2 except for system 6.0.7,
# which used a variant character set but was quickly replaced with
# Greek system 6.0.7.1 using the no Euro sign" character set
# documented here. Greek system 4.1 used a variant Greek set that had
# ISO 8859-7 in 0xA0-0xFF (with some holes filled in with DTP
# characters), and Mac OS Roman accented Roman letters in 0x80-0x9F.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# Details of mapping changes in each version:
# -------------------------------------------
#
# Changes from version b02 to version b03/c01:
#
# - The Mac OS Greek encoding changed for Mac OS 9.2.2 and later
# as follows:
# 0x9C, changed from 0x00AD SOFT HYPHEN to 0x20AC EURO SIGN
# 0xFF, changed from undefined to 0x00AD SOFT HYPHEN
#
# Changes from version n04 to version n06:
#
# - Change mapping of 0xAF from U+0387 to its canonical
# decomposition, U+00B7.
#
##################
0x00 - 0x7E = 0x00 -
0x80 = 0x00C4
0x81 = 0x00B9
0x82 = 0x00B2
0x83 = 0x00C9
0x84 = 0x00B3
0x85 = 0x00D6
0x86 = 0x00DC
0x87 = 0x0385
0x88 = 0x00E0
0x89 = 0x00E2
0x8A = 0x00E4
0x8B = 0x0384
0x8C = 0x00A8
0x8D = 0x00E7
0x8E = 0x00E9
0x8F = 0x00E8
0x90 = 0x00EA
0x91 = 0x00EB
0x92 = 0x00A3
0x93 = 0x2122
0x94 = 0x00EE
0x95 = 0x00EF
0x96 = 0x2022
0x97 = 0x00BD
0x98 = 0x2030
0x99 = 0x00F4
0x9A = 0x00F6
0x9B = 0x00A6
0x9C = 0x20AC
0x9D = 0x00F9
0x9E = 0x00FB
0x9F = 0x00FC
0xA0 = 0x2020
0xA1 = 0x0393
0xA2 = 0x0394
0xA3 = 0x0398
0xA4 = 0x039B
0xA5 = 0x039E
0xA6 = 0x03A0
0xA7 = 0x00DF
0xA8 = 0x00AE
0xA9 = 0x00A9
0xAA = 0x03A3
0xAB = 0x03AA
0xAC = 0x00A7
0xAD = 0x2260
0xAE = 0x00B0
0xAF = 0x00B7
0xB0 = 0x0391
0xB1 = 0x00B1
0xB2 = 0x2264
0xB3 = 0x2265
0xB4 = 0x00A5
0xB5 = 0x0392
0xB6 = 0x0395
0xB7 = 0x0396
0xB8 = 0x0397
0xB9 = 0x0399
0xBA = 0x039A
0xBB = 0x039C
0xBC = 0x03A6
0xBD = 0x03AB
0xBE = 0x03A8
0xBF = 0x03A9
0xC0 = 0x03AC
0xC1 = 0x039D
0xC2 = 0x00AC
0xC3 = 0x039F
0xC4 = 0x03A1
0xC5 = 0x2248
0xC6 = 0x03A4
0xC7 = 0x00AB
0xC8 = 0x00BB
0xC9 = 0x2026
0xCA = 0x00A0
0xCB = 0x03A5
0xCC = 0x03A7
0xCD = 0x0386
0xCE = 0x0388
0xCF = 0x0153
0xD0 = 0x2013
0xD1 = 0x2015
0xD2 = 0x201C
0xD3 = 0x201D
0xD4 = 0x2018
0xD5 = 0x2019
0xD6 = 0x00F7
0xD7 = 0x0389
0xD8 = 0x038A
0xD9 = 0x038C
0xDA = 0x038E
0xDB = 0x03AD
0xDC = 0x03AE
0xDD = 0x03AF
0xDE = 0x03CC
0xDF = 0x038F
0xE0 = 0x03CD
0xE1 = 0x03B1
0xE2 = 0x03B2
0xE3 = 0x03C8
0xE4 = 0x03B4
0xE5 = 0x03B5
0xE6 = 0x03C6
0xE7 = 0x03B3
0xE8 = 0x03B7
0xE9 = 0x03B9
0xEA = 0x03BE
0xEB = 0x03BA
0xEC = 0x03BB
0xED = 0x03BC
0xEE = 0x03BD
0xEF = 0x03BF
0xF0 = 0x03C0
0xF1 = 0x03CE
0xF2 = 0x03C1
0xF3 = 0x03C3
0xF4 = 0x03C4
0xF5 = 0x03B8
0xF6 = 0x03C9
0xF7 = 0x03C2
0xF8 = 0x03C7
0xF9 = 0x03C5
0xFA = 0x03B6
0xFB = 0x03CA
0xFC = 0x03CB
0xFD = 0x0390
0xFE = 0x03B0
0xFF = 0x00AD
END_MAP

View File

@ -0,0 +1,284 @@
# $NetBSD: ICELAND%UCS.src,v 1.1 2006/03/13 19:45:36 tnozaki Exp $
TYPE ROWCOL
NAME ICELAND/UCS
SRC_ZONE 0x00-0xFF
OOB_MODE ILSEQ
DST_ILSEQ 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#=======================================================================
# File name: ICELAND.TXT
#
# Contents: Map (external version) from Mac OS Icelandic
# character set to Unicode 2.1 and later.
#
# Copyright: (c) 1995-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c02 2005-Apr-05 Update header comments. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
# b3,c1 2002-Dec-19 Update URLs, notes. Matches internal
# utom<b3>.
# b02 1999-Sep-22 Encoding changed for Mac OS 8.5; change
# mapping of 0xDB from CURRENCY SIGN to EURO
# SIGN. Update contact e-mail address. Matches
# internal utom<b2>, ufrm<b2>, and Text
# Encoding Converter version 1.5.
# n06 1998-Feb-05 Minor update to header comments, add
# information on font variants
# n03 1997-Dec-14 Update to match internal utom<n4>, ufrm<n16>:
# Change standard mapping for 0xBD from U+2126
# to its canonical decomposition, U+03A9.
# n02 1995-Apr-15 First version (after fixing some typos).
# Matches internal ufrm<n5>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Icelandic code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Icelandic code order.
#
# One of these mappings requires the use of a corporate character.
# See the file "CORPCHAR.TXT" and notes below.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Icelandic character set uses the standard control characters
# at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Icelandic:
# --------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported via transcoding to and from
# Unicode.
#
# 1. General
#
# Mac OS Icelandic is used for Icelandic and Faroese.
#
# The Mac OS Icelandic encoding shares the script code smRoman
# (0) with the standard Mac OS Roman encoding. To determine if
# the Icelandic encoding is being used, you must also check if
# the system region code is 21, verIceland.
#
# This character set is a variant of standard Mac OS Roman,
# adding upper and lower eth, thorn, and Y acute. It has 6 code
# point differences from standard Mac OS Roman.
#
# Before Mac OS 8.5, code point 0xDB was CURRENCY SIGN, and was
# mapped to U+00A4. In Mac OS 8.5 and later versions, code point
# 0xDB is changed to EURO SIGN and maps to U+20AC; the standard
# Apple fonts are updated for Mac OS 8.5 to reflect this. There are
# "currency sign" variants of the Mac OS Icelandic encoding that
# still map 0xDB to U+00A4; these can be used for older fonts.
#
# 2. Font variants
#
# The table in this file gives the Unicode mappings for the standard
# Mac OS Icelandic encoding. This encoding is supported by the
# Icelandic versions of the fonts Chicago, Geneva, Monaco, and New
# York, and is the encoding supported by the text processing
# utilities. However, other TrueType fonts implement a slightly
# different encoding; the difference is only in two code points.
# For the standard variant, these are:
# 0xBB -> 0x00AA FEMININE ORDINAL INDICATOR
# 0xBC -> 0x00BA MASCULINE ORDINAL INDICATOR
#
# For the TrueType variant (used by the Icelandic versions of the
# fonts Courier, Helvetica, Palatino, and Times), these are:
# 0xBB -> 0xFB01 LATIN SMALL LIGATURE FI
# 0xBC -> 0xFB02 LATIN SMALL LIGATURE FL
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# The following corporate zone Unicode character is used in this
# mapping:
#
# 0xF8FF Apple logo
#
# NOTE: The graphic image associated with the Apple logo character
# is not authorized for use without permission of Apple, and
# unauthorized use might constitute trademark infringement.
#
# Details of mapping changes in each version:
# -------------------------------------------
#
# Changes from version n06 to version b02:
#
# - Encoding changed for Mac OS 8.5; change mapping of 0xDB from
# CURRENCY SIGN (U+00A4) to EURO SIGN (U+20AC).
#
# Changes from version n02 to version n03:
#
# - Change mapping of 0xBD from U+2126 to its canonical
# decomposition, U+03A9.
#
##################
0x00 - 0x7E = 0x0000 -
0x80 = 0x00C4
0x81 = 0x00C5
0x82 = 0x00C7
0x83 = 0x00C9
0x84 = 0x00D1
0x85 = 0x00D6
0x86 = 0x00DC
0x87 = 0x00E1
0x88 = 0x00E0
0x89 = 0x00E2
0x8A = 0x00E4
0x8B = 0x00E3
0x8C = 0x00E5
0x8D = 0x00E7
0x8E = 0x00E9
0x8F = 0x00E8
0x90 = 0x00EA
0x91 = 0x00EB
0x92 = 0x00ED
0x93 = 0x00EC
0x94 = 0x00EE
0x95 = 0x00EF
0x96 = 0x00F1
0x97 = 0x00F3
0x98 = 0x00F2
0x99 = 0x00F4
0x9A = 0x00F6
0x9B = 0x00F5
0x9C = 0x00FA
0x9D = 0x00F9
0x9E = 0x00FB
0x9F = 0x00FC
0xA0 = 0x00DD
0xA1 = 0x00B0
0xA2 = 0x00A2
0xA3 = 0x00A3
0xA4 = 0x00A7
0xA5 = 0x2022
0xA6 = 0x00B6
0xA7 = 0x00DF
0xA8 = 0x00AE
0xA9 = 0x00A9
0xAA = 0x2122
0xAB = 0x00B4
0xAC = 0x00A8
0xAD = 0x2260
0xAE = 0x00C6
0xAF = 0x00D8
0xB0 = 0x221E
0xB1 = 0x00B1
0xB2 = 0x2264
0xB3 = 0x2265
0xB4 = 0x00A5
0xB5 = 0x00B5
0xB6 = 0x2202
0xB7 = 0x2211
0xB8 = 0x220F
0xB9 = 0x03C0
0xBA = 0x222B
0xBB = 0x00AA
0xBC = 0x00BA
0xBD = 0x03A9
0xBE = 0x00E6
0xBF = 0x00F8
0xC0 = 0x00BF
0xC1 = 0x00A1
0xC2 = 0x00AC
0xC3 = 0x221A
0xC4 = 0x0192
0xC5 = 0x2248
0xC6 = 0x2206
0xC7 = 0x00AB
0xC8 = 0x00BB
0xC9 = 0x2026
0xCA = 0x00A0
0xCB = 0x00C0
0xCC = 0x00C3
0xCD = 0x00D5
0xCE = 0x0152
0xCF = 0x0153
0xD0 = 0x2013
0xD1 = 0x2014
0xD2 = 0x201C
0xD3 = 0x201D
0xD4 = 0x2018
0xD5 = 0x2019
0xD6 = 0x00F7
0xD7 = 0x25CA
0xD8 = 0x00FF
0xD9 = 0x0178
0xDA = 0x2044
0xDB = 0x20AC
0xDC = 0x00D0
0xDD = 0x00F0
0xDE = 0x00DE
0xDF = 0x00FE
0xE0 = 0x00FD
0xE1 = 0x00B7
0xE2 = 0x201A
0xE3 = 0x201E
0xE4 = 0x2030
0xE5 = 0x00C2
0xE6 = 0x00CA
0xE7 = 0x00C1
0xE8 = 0x00CB
0xE9 = 0x00C8
0xEA = 0x00CD
0xEB = 0x00CE
0xEC = 0x00CF
0xED = 0x00CC
0xEE = 0x00D3
0xEF = 0x00D4
0xF0 = 0xF8FF
0xF1 = 0x00D2
0xF2 = 0x00DA
0xF3 = 0x00DB
0xF4 = 0x00D9
0xF5 = 0x0131
0xF6 = 0x02C6
0xF7 = 0x02DC
0xF8 = 0x00AF
0xF9 = 0x02D8
0xFA = 0x02D9
0xFB = 0x02DA
0xFC = 0x00B8
0xFD = 0x02DD
0xFE = 0x02DB
0xFF = 0x02C7
END_MAP

View File

@ -0,0 +1,241 @@
# $NetBSD: INUIT%UCS.src,v 1.1 2006/03/13 19:45:36 tnozaki Exp $
TYPE ROWCOL
NAME INUIT/UCS
SRC_ZONE 0x00-0xFF
OOB_MODE ILSEQ
DST_ILSEQ 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: INUIT.TXT
#
# Contents: Map (external version) from Mac OS Inuit
# character set to Unicode 3.0 and later
#
# Contacts: charsets@apple.com, everson@evertype.com
#
# Changes:
#
# c01 2005-Apr-01 First posted version. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Inuit code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Inuit code order.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Inuit character set uses the standard control characters
# at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Inuit (partly from Michael Everson):
# ----------------------------------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported via transcoding to and from
# Unicode.
#
# This character set was developed by Michael Everson of Everson
# Typography (everson@evertype.com) and was used for the Inuktitut
# localizations of Mac OS, as well as for the Inuktitut utilities
# package from Everson Typography. Note that while Apple authorized
# the Inuktitut localization mentioned above, it was not shipped with
# Apple hardware, and was not otherwise supported by Apple. Fonts
# conforming to the Mac OS Inuit character set are available from
# Everson Typography (http://www.evertype.com/software/apple/).
# Information about the use of this character set is available at
# http://www.evertype.com/standards/iu/.
#
# The Mac OS Inuit character set shares the script code smEthiopic
# (28) with the Ethiopic encoding. To determine if the Inuktitut
# encoding is being used, you must also check if the system region
# code is 78, verNunavut.
#
# The Mac OS Inuit character set includes the full syllabic letter
# repertoire required for Inuktitut; it is a subset of the Unified
# Canadian Aboriginal Syllabics set encoded in Unicode. The encoding
# is InuitSCII, designed by Doug Hitch for the Government of the
# Northwest Territories.
#
# The Mac OS Inuit character set also includes a number of characters
# that were needed for the classic Mac OS user interface and
# localization (e.g. ellipsis, bullet, copyright sign). All of the
# characters in Mac OS Inuit that are also in the Mac OS Roman
# encoding are at the same code point in both; this improves
# application compatibility.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# Details of mapping changes in each version:
# -------------------------------------------
#
##################
0x00 - 0x7E = 0x0000 -
0x80 = 0x1403
0x81 = 0x1404
0x82 = 0x1405
0x83 = 0x1406
0x84 = 0x140A
0x85 = 0x140B
0x86 = 0x1431
0x87 = 0x1432
0x88 = 0x1433
0x89 = 0x1434
0x8A = 0x1438
0x8B = 0x1439
0x8C = 0x1449
0x8D = 0x144E
0x8E = 0x144F
0x8F = 0x1450
0x90 = 0x1451
0x91 = 0x1455
0x92 = 0x1456
0x93 = 0x1466
0x94 = 0x146D
0x95 = 0x146E
0x96 = 0x146F
0x97 = 0x1470
0x98 = 0x1472
0x99 = 0x1473
0x9A = 0x1483
0x9B = 0x148B
0x9C = 0x148C
0x9D = 0x148D
0x9E = 0x148E
0x9F = 0x1490
0xA0 = 0x1491
0xA1 = 0x00B0
0xA2 = 0x14A1
0xA3 = 0x14A5
0xA4 = 0x14A6
0xA5 = 0x2022
0xA6 = 0x00B6
0xA7 = 0x14A7
0xA8 = 0x00AE
0xA9 = 0x00A9
0xAA = 0x2122
0xAB = 0x14A8
0xAC = 0x14AA
0xAD = 0x14AB
0xAE = 0x14BB
0xAF = 0x14C2
0xB0 = 0x14C3
0xB1 = 0x14C4
0xB2 = 0x14C5
0xB3 = 0x14C7
0xB4 = 0x14C8
0xB5 = 0x14D0
0xB6 = 0x14EF
0xB7 = 0x14F0
0xB8 = 0x14F1
0xB9 = 0x14F2
0xBA = 0x14F4
0xBB = 0x14F5
0xBC = 0x1505
0xBD = 0x14D5
0xBE = 0x14D6
0xBF = 0x14D7
0xC0 = 0x14D8
0xC1 = 0x14DA
0xC2 = 0x14DB
0xC3 = 0x14EA
0xC4 = 0x1528
0xC5 = 0x1529
0xC6 = 0x152A
0xC7 = 0x152B
0xC8 = 0x152D
0xC9 = 0x2026
0xCA = 0x00A0
0xCB = 0x152E
0xCC = 0x153E
0xCD = 0x1555
0xCE = 0x1556
0xCF = 0x1557
0xD0 = 0x2013
0xD1 = 0x2014
0xD2 = 0x201C
0xD3 = 0x201D
0xD4 = 0x2018
0xD5 = 0x2019
0xD6 = 0x1558
0xD7 = 0x1559
0xD8 = 0x155A
0xD9 = 0x155D
0xDA = 0x1546
0xDB = 0x1547
0xDC = 0x1548
0xDD = 0x1549
0xDE = 0x154B
0xDF = 0x154C
0xE0 = 0x1550
0xE1 = 0x157F
0xE2 = 0x1580
0xE3 = 0x1581
0xE4 = 0x1582
0xE5 = 0x1583
0xE6 = 0x1584
0xE7 = 0x1585
0xE8 = 0x158F
0xE9 = 0x1590
0xEA = 0x1591
0xEB = 0x1592
0xEC = 0x1593
0xED = 0x1594
0xEE = 0x1595
0xEF = 0x1671
0xF0 = 0x1672
0xF1 = 0x1673
0xF2 = 0x1674
0xF3 = 0x1675
0xF4 = 0x1676
0xF5 = 0x1596
0xF6 = 0x15A0
0xF7 = 0x15A1
0xF8 = 0x15A2
0xF9 = 0x15A3
0xFA = 0x15A4
0xFB = 0x15A5
0xFC = 0x15A6
0xFD = 0x157C
0xFE = 0x0141
0xFF = 0x0142
END_MAP

View File

@ -0,0 +1,15 @@
# $NetBSD: MAC.part,v 1.1 2006/03/13 19:45:36 tnozaki Exp $
CELTIC
CENTEURO
CROATIAN
CYRILLIC
DINGBATS
GAELIC
GREEK
ICELAND
INUIT
ROMAN
ROMANIAN
THAI
TURKISH

View File

@ -0,0 +1,45 @@
# $NetBSD: Makefile.inc,v 1.2 2008/10/25 22:35:36 apb Exp $
.PATH: ${.CURDIR}/APPLE
SRCS_mapper.dir+= mapper.dir.APPLE
SRCS_charset.pivot+= charset.pivot.APPLE
CLEANFILES+= mapper.dir.APPLE charset.pivot.APPLE
PART_MAC!= ${TOOL_SED} '/^\#/d;/^$$/d;' ${.CURDIR}/APPLE/MAC.part
.for i in ${PART_MAC}
.if exists(${.CURDIR}/APPLE/$i%UCS.src)
FILES+= $i%UCS.mps
CLEANFILES+= $i%UCS.mps
FILESDIR_$i%UCS.mps= ${BINDIR}/APPLE
.endif
.if exists(${.CURDIR}/APPLE/UCS%$i.src)
FILES+= UCS%$i.mps
CLEANFILES+= UCS%$i.mps
FILESDIR_UCS%$i.mps= ${BINDIR}/APPLE
.endif
.endfor
mapper.dir.APPLE: ${.CURDIR}/APPLE/MAC.part
${_MKTARGET_CREATE}
( \
echo "# APPLE"; \
for i in ${PART_MAC}; do \
printf "%-32s%-32s%s\n" $$i/UCS mapper_std \
APPLE/$$i%UCS.mps; \
printf "%-32s%-32s%s\n" UCS/$$i mapper_std \
APPLE/UCS%$$i.mps; \
done; \
echo; \
) > ${.TARGET}
charset.pivot.APPLE: ${.CURDIR}/APPLE/MAC.part
${_MKTARGET_CREATE}
( \
echo "# APPLE"; \
for i in ${PART_MAC}; do \
printf "%-32s%-32s%d\n" $$i UCS 1; \
printf "%-32s%-32s%d\n" UCS $$i 1; \
done; \
echo; \
) > ${.TARGET}

View File

@ -0,0 +1,289 @@
# $NetBSD: ROMAN%UCS.src,v 1.1 2006/03/13 19:45:36 tnozaki Exp $
TYPE ROWCOL
NAME ROMAN/UCS
SRC_ZONE 0x00-0xFF
OOB_MODE ILSEQ
DST_ILSEQ 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: ROMAN.TXT
#
# Contents: Map (external version) from Mac OS Roman
# character set to Unicode 2.1 and later.
#
# Copyright: (c) 1994-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c02 2005-Apr-05 Update header comments. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
# b4,c1 2002-Dec-19 Update URLs, notes. Matches internal
# utom<b5>.
# b03 1999-Sep-22 Update contact e-mail address. Matches
# internal utom<b4>, ufrm<b3>, and Text
# Encoding Converter version 1.5.
# b02 1998-Aug-18 Encoding changed for Mac OS 8.5; change
# mapping of 0xDB from CURRENCY SIGN to
# EURO SIGN. Matches internal utom<b3>,
# ufrm<b3>.
# n08 1998-Feb-05 Minor update to header comments
# n06 1997-Dec-14 Add warning about future changes to 0xDB
# from CURRENCY SIGN to EURO SIGN. Clarify
# some header information
# n04 1997-Dec-01 Update to match internal utom<n3>, ufrm<n22>:
# Change standard mapping for 0xBD from U+2126
# to its canonical decomposition, U+03A9.
# n03 1995-Apr-15 First version (after fixing some typos).
# Matches internal ufrm<n9>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Roman code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Roman code order.
#
# One of these mappings requires the use of a corporate character.
# See the file "CORPCHAR.TXT" and notes below.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Roman character set uses the standard control characters at
# 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Roman:
# ----------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported directly in programming
# interfaces for QuickDraw Text, the Script Manager, and related
# Text Utilities. For other purposes it is supported via transcoding
# to and from Unicode.
#
# This character set is used for at least the following Mac OS
# localizations: U.S., British, Canadian French, French, Swiss
# French, German, Swiss German, Italian, Swiss Italian, Dutch,
# Swedish, Norwegian, Danish, Finnish, Spanish, Catalan,
# Portuguese, Brazilian, and the default International system.
#
# Variants of Mac OS Roman are used for Croatian, Icelandic,
# Turkish, Romanian, and other encodings. Separate mapping tables
# are available for these encodings.
#
# Before Mac OS 8.5, code point 0xDB was CURRENCY SIGN, and was
# mapped to U+00A4. In Mac OS 8.5 and later versions, code point
# 0xDB is changed to EURO SIGN and maps to U+20AC; the standard
# Apple fonts are updated for Mac OS 8.5 to reflect this. There is
# a "currency sign" variant of the Mac OS Roman encoding that still
# maps 0xDB to U+00A4; this can be used for older fonts.
#
# Before Mac OS 8.5, the ROM bitmap versions of the fonts Chicago,
# New York, Geneva, and Monaco did not implement the full Mac OS
# Roman character set; they only supported character codes up to
# 0xD8. The TrueType versions of these fonts have always implemented
# the full character set, as with the bitmap and TrueType versions
# of the other standard Roman fonts.
#
# In all Mac OS encodings, fonts such as Chicago which are used
# as "system" fonts (for menus, dialogs, etc.) have four glyphs
# at code points 0x11-0x14 for transient use by the Menu Manager.
# These glyphs are not intended as characters for use in normal
# text, and the associated code points are not generally
# interpreted as associated with these glyphs; they are usually
# interpreted (if at all) as the control codes DC1-DC4.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# The following corporate zone Unicode character is used in this
# mapping:
#
# 0xF8FF Apple logo
#
# NOTE: The graphic image associated with the Apple logo character
# is not authorized for use without permission of Apple, and
# unauthorized use might constitute trademark infringement.
#
# Details of mapping changes in each version:
# -------------------------------------------
#
# Changes from version n08 to version b02:
#
# - Encoding changed for Mac OS 8.5; change mapping of 0xDB from
# CURRENCY SIGN (U+00A4) to EURO SIGN (U+20AC).
#
# Changes from version n03 to version n04:
#
# - Change mapping of 0xBD from U+2126 to its canonical
# decomposition, U+03A9.
#
##################
0x00-0x7E = 0x00 -
0x80 = 0x00C4
0x81 = 0x00C5
0x82 = 0x00C7
0x83 = 0x00C9
0x84 = 0x00D1
0x85 = 0x00D6
0x86 = 0x00DC
0x87 = 0x00E1
0x88 = 0x00E0
0x89 = 0x00E2
0x8A = 0x00E4
0x8B = 0x00E3
0x8C = 0x00E5
0x8D = 0x00E7
0x8E = 0x00E9
0x8F = 0x00E8
0x90 = 0x00EA
0x91 = 0x00EB
0x92 = 0x00ED
0x93 = 0x00EC
0x94 = 0x00EE
0x95 = 0x00EF
0x96 = 0x00F1
0x97 = 0x00F3
0x98 = 0x00F2
0x99 = 0x00F4
0x9A = 0x00F6
0x9B = 0x00F5
0x9C = 0x00FA
0x9D = 0x00F9
0x9E = 0x00FB
0x9F = 0x00FC
0xA0 = 0x2020
0xA1 = 0x00B0
0xA2 = 0x00A2
0xA3 = 0x00A3
0xA4 = 0x00A7
0xA5 = 0x2022
0xA6 = 0x00B6
0xA7 = 0x00DF
0xA8 = 0x00AE
0xA9 = 0x00A9
0xAA = 0x2122
0xAB = 0x00B4
0xAC = 0x00A8
0xAD = 0x2260
0xAE = 0x00C6
0xAF = 0x00D8
0xB0 = 0x221E
0xB1 = 0x00B1
0xB2 = 0x2264
0xB3 = 0x2265
0xB4 = 0x00A5
0xB5 = 0x00B5
0xB6 = 0x2202
0xB7 = 0x2211
0xB8 = 0x220F
0xB9 = 0x03C0
0xBA = 0x222B
0xBB = 0x00AA
0xBC = 0x00BA
0xBD = 0x03A9
0xBE = 0x00E6
0xBF = 0x00F8
0xC0 = 0x00BF
0xC1 = 0x00A1
0xC2 = 0x00AC
0xC3 = 0x221A
0xC4 = 0x0192
0xC5 = 0x2248
0xC6 = 0x2206
0xC7 = 0x00AB
0xC8 = 0x00BB
0xC9 = 0x2026
0xCA = 0x00A0
0xCB = 0x00C0
0xCC = 0x00C3
0xCD = 0x00D5
0xCE = 0x0152
0xCF = 0x0153
0xD0 = 0x2013
0xD1 = 0x2014
0xD2 = 0x201C
0xD3 = 0x201D
0xD4 = 0x2018
0xD5 = 0x2019
0xD6 = 0x00F7
0xD7 = 0x25CA
0xD8 = 0x00FF
0xD9 = 0x0178
0xDA = 0x2044
0xDB = 0x20AC
0xDC = 0x2039
0xDD = 0x203A
0xDE = 0xFB01
0xDF = 0xFB02
0xE0 = 0x2021
0xE1 = 0x00B7
0xE2 = 0x201A
0xE3 = 0x201E
0xE4 = 0x2030
0xE5 = 0x00C2
0xE6 = 0x00CA
0xE7 = 0x00C1
0xE8 = 0x00CB
0xE9 = 0x00C8
0xEA = 0x00CD
0xEB = 0x00CE
0xEC = 0x00CF
0xED = 0x00CC
0xEE = 0x00D3
0xEF = 0x00D4
0xF0 = 0xF8FF
0xF1 = 0x00D2
0xF2 = 0x00DA
0xF3 = 0x00DB
0xF4 = 0x00D9
0xF5 = 0x0131
0xF6 = 0x02C6
0xF7 = 0x02DC
0xF8 = 0x00AF
0xF9 = 0x02D8
0xFA = 0x02D9
0xFB = 0x02DA
0xFC = 0x00B8
0xFD = 0x02DD
0xFE = 0x02DB
0xFF = 0x02C7
END_MAP

View File

@ -0,0 +1,284 @@
# $NetBSD: ROMANIAN%UCS.src,v 1.1 2006/03/13 19:45:36 tnozaki Exp $
TYPE ROWCOL
NAME ROMANIAN/UCS
SRC_ZONE 0x00-0xFF
OOB_MODE ILSEQ
DST_ILSEQ 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: ROMANIAN.TXT
#
# Contents: Map (external version) from Mac OS Romanian
# character set to Unicode 3.0 and later.
#
# Copyright: (c) 1995-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c02 2005-Apr-05 Update header comments. Matches internal xml
# <c1.2> and Text Encoding Converter 2.0.
# b3,c1 2002-Dec-19 Update mappings for 0xAF, 0xBF, 0xDE, 0xDF
# to use new composed characters added in
# Unicode 3.0. Update URLs, notes. Matches
# internal utom<b3>.
# b02 1999-Sep-22 Encoding changed for Mac OS 8.5; change
# mapping of 0xDB from CURRENCY SIGN to EURO
# SIGN. Update contact e-mail address. Matches
# internal utom<b2>, ufrm<b2>, and Text
# Encoding Converter version 1.5.
# n05 1998-Feb-05 Minor update to header comments
# n03 1997-Dec-14 Update to match internal utom<n5>, ufrm<n16>:
# Change standard mapping for 0xBD from U+2126
# to its canonical decomposition, U+03A9.
# Change mapping of 0xAF,0xBF,0xDE,0xDF from
# composed S/T WITH CEDILLA to S/T with
# COMBINING COMMA BELOW (to match our
# decomposition mappings).
# n02 1995-Apr-15 First version (after fixing some typos).
# Matches internal ufrm<n4>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Romanian code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Romanian code order.
#
# One of these mappings requires the use of a corporate character.
# See the file "CORPCHAR.TXT" and notes below.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Romanian character set uses the standard control characters at
# 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Romanian:
# -------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported via transcoding to and from
# Unicode.
#
# Mac OS Romanian is used only for Romanian.
#
# The Mac OS Romanian encoding shares the script code smRoman
# (0) with the standard Mac OS Roman encoding. To determine if
# the Romanian encoding is being used, you must also check if the
# system region code is 39, verRomania.
#
# This character set is a variant of standard Mac OS Roman, adding
# upper and lower A breve, S comma below, and T comma below. It
# has 6 code point differences from standard Mac OS Roman.
#
# Before Mac OS 8.5, code point 0xDB was CURRENCY SIGN, and was
# mapped to U+00A4. In Mac OS 8.5 and later versions, code point
# 0xDB is changed to EURO SIGN and maps to U+20AC; the standard
# Apple fonts are updated for Mac OS 8.5 to reflect this. There is
# a "currency sign" variant of the Mac OS Romanian encoding that
# still maps 0xDB to U+00A4; this can be used for older fonts.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# The following corporate zone Unicode character is used in this
# mapping:
#
# 0xF8FF Apple logo
#
# NOTE: The graphic image associated with the Apple logo character
# is not authorized for use without permission of Apple, and
# unauthorized use might constitute trademark infringement.
#
# Details of mapping changes in each version:
# -------------------------------------------
#
# Changes from version b02 to version b03/c01:
#
# - Update the mappings for 0xAF, 0xBF, 0xDE, 0xDF to use new
# composed Unicode characters 0x0218-0x021B added in Unicode 3.0;
# the previous mappings were to the equivalent decomposition
# sequences.
#
# Changes from version n05 to version b02:
#
# - Encoding changed for Mac OS 8.5; change mapping of 0xDB from
# CURRENCY SIGN (U+00A4) to EURO SIGN (U+20AC).
#
# Changes from version n02 to version n03:
#
# - Change mapping of 0xBD from U+2126 to its canonical
# decomposition, U+03A9.
# - Change mapping of 0xAF,0xBF,0xDE,0xDF from composed S or T
# WITH CEDILLA to S or T with COMBINING COMMA BELOW (to match
# our decomposition mappings).
#
##################
0x00 - 0x7E = 0x0000 -
0x80 = 0x00C4
0x81 = 0x00C5
0x82 = 0x00C7
0x83 = 0x00C9
0x84 = 0x00D1
0x85 = 0x00D6
0x86 = 0x00DC
0x87 = 0x00E1
0x88 = 0x00E0
0x89 = 0x00E2
0x8A = 0x00E4
0x8B = 0x00E3
0x8C = 0x00E5
0x8D = 0x00E7
0x8E = 0x00E9
0x8F = 0x00E8
0x90 = 0x00EA
0x91 = 0x00EB
0x92 = 0x00ED
0x93 = 0x00EC
0x94 = 0x00EE
0x95 = 0x00EF
0x96 = 0x00F1
0x97 = 0x00F3
0x98 = 0x00F2
0x99 = 0x00F4
0x9A = 0x00F6
0x9B = 0x00F5
0x9C = 0x00FA
0x9D = 0x00F9
0x9E = 0x00FB
0x9F = 0x00FC
0xA0 = 0x2020
0xA1 = 0x00B0
0xA2 = 0x00A2
0xA3 = 0x00A3
0xA4 = 0x00A7
0xA5 = 0x2022
0xA6 = 0x00B6
0xA7 = 0x00DF
0xA8 = 0x00AE
0xA9 = 0x00A9
0xAA = 0x2122
0xAB = 0x00B4
0xAC = 0x00A8
0xAD = 0x2260
0xAE = 0x0102
0xAF = 0x0218
0xB0 = 0x221E
0xB1 = 0x00B1
0xB2 = 0x2264
0xB3 = 0x2265
0xB4 = 0x00A5
0xB5 = 0x00B5
0xB6 = 0x2202
0xB7 = 0x2211
0xB8 = 0x220F
0xB9 = 0x03C0
0xBA = 0x222B
0xBB = 0x00AA
0xBC = 0x00BA
0xBD = 0x03A9
0xBE = 0x0103
0xBF = 0x0219
0xC0 = 0x00BF
0xC1 = 0x00A1
0xC2 = 0x00AC
0xC3 = 0x221A
0xC4 = 0x0192
0xC5 = 0x2248
0xC6 = 0x2206
0xC7 = 0x00AB
0xC8 = 0x00BB
0xC9 = 0x2026
0xCA = 0x00A0
0xCB = 0x00C0
0xCC = 0x00C3
0xCD = 0x00D5
0xCE = 0x0152
0xCF = 0x0153
0xD0 = 0x2013
0xD1 = 0x2014
0xD2 = 0x201C
0xD3 = 0x201D
0xD4 = 0x2018
0xD5 = 0x2019
0xD6 = 0x00F7
0xD7 = 0x25CA
0xD8 = 0x00FF
0xD9 = 0x0178
0xDA = 0x2044
0xDB = 0x20AC
0xDC = 0x2039
0xDD = 0x203A
0xDE = 0x021A
0xDF = 0x021B
0xE0 = 0x2021
0xE1 = 0x00B7
0xE2 = 0x201A
0xE3 = 0x201E
0xE4 = 0x2030
0xE5 = 0x00C2
0xE6 = 0x00CA
0xE7 = 0x00C1
0xE8 = 0x00CB
0xE9 = 0x00C8
0xEA = 0x00CD
0xEB = 0x00CE
0xEC = 0x00CF
0xED = 0x00CC
0xEE = 0x00D3
0xEF = 0x00D4
0xF0 = 0xF8FF
0xF1 = 0x00D2
0xF2 = 0x00DA
0xF3 = 0x00DB
0xF4 = 0x00D9
0xF5 = 0x0131
0xF6 = 0x02C6
0xF7 = 0x02DC
0xF8 = 0x00AF
0xF9 = 0x02D8
0xFA = 0x02D9
0xFB = 0x02DA
0xFC = 0x00B8
0xFD = 0x02DD
0xFE = 0x02DB
0xFF = 0x02C7
END_MAP

View File

@ -0,0 +1,301 @@
# $NetBSD: THAI%UCS.src,v 1.1 2006/03/13 19:45:36 tnozaki Exp $
TYPE ROWCOL
NAME THAI/UCS
SRC_ZONE 0x00-0xFF
OOB_MODE ILSEQ
DST_ILSEQ 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: THAI.TXT
#
# Contents: Map (external version) from Mac OS Thai
# character set to Unicode 3.2 and later.
#
# Copyright: (c) 1995-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c02 2005-Apr-05 Update header comments. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
# b3,c1 2002-Dec-19 Update mapping for 0xDB to use new Unicode
# 3.2 WORD JOINER instead of ZWNBSP (BOM).
# Update URLs. Matches internal utom<b3>.
# b02 1999-Sep-22 Update contact e-mail address. Matches
# internal utom<b1>, ufrm<b2>, and Text
# Encoding Converter version 1.5.
# n07 1998-Feb-05 Update to match internal utom<n5>, ufrm<n13>
# and Text Encoding Converter version 1.3:
# Use standard Unicodes plus transcoding hints
# instead of single corporate characters; see
# details below. Also update header comments
# to new format.
# n04 1995-Nov-17 First version (after fixing some typos).
# Matches internal ufrm<n6>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Thai code (in hex as 0xNN)
# Column #2 is the corresponding Unicode or Unicode sequence
# (in hex as 0xNNNN or 0xNNNN+0xNNNN).
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Thai code order.
#
# Some of these mappings require the use of corporate characters.
# See the file "CORPCHAR.TXT" and notes below.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Thai character set uses the standard control characters at
# 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Thai:
# ---------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported via transcoding to and from
# Unicode.
#
# Codes 0xA1-0xDA and 0xDF-0xFB are the character set from Thai
# standard TIS 620-2533, except that the following changes are
# made:
# 0xEE is TRADE MARK SIGN (instead of THAI CHARACTER YAMAKKAN)
# 0xFA is REGISTERED SIGN (instead of THAI CHARACTER ANGKHANKHU)
# 0xFB is COPYRIGHT SIGN (instead of THAI CHARACTER KHOMUT)
#
# Codes 0x80-0x82, 0x8D-0x8E, 0x91, 0x9D-0x9E, and 0xDB-0xDE are
# various additional punctuation marks (e.g. curly quotes,
# ellipsis), no-break space, and two special characters "word join"
# and "word break".
#
# Codes 0x83-0x8C, 0x8F, and 0x92-0x9C are for positional variants
# of the upper vowels, tone marks, and other signs at 0xD1,
# 0xD4-0xD7, and 0xE7-0xED. The positional variants would normally
# be considered presentation forms only and not characters. In most
# cases they are not typed directly; they are selected automatically
# at display time by the WorldScript software. However, using the
# Thai-DTP keyboard, the presentation forms can in fact be typed
# directly using dead keys. Thus they must be treated as real
# characters in the Mac OS Thai encoding. They are mapped using
# variant tags; see below.
#
# Several code points are undefined and unused (they cannot be
# typed using any of the Mac OS Thai keyboard layouts): 0x90, 0x9F,
# 0xFC-0xFE. These are not shown in the table below.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# The goals in the Apple mappings provided here are:
# - Ensure roundtrip mapping from every character in the Mac OS Thai
# character set to Unicode and back
# - Use standard Unicode characters as much as possible, to maximize
# interchangeability of the resulting Unicode text. Whenever possible,
# avoid having content carried by private-use characters.
#
# To satisfy both goals, we use private use characters to mark variants
# that are similar to a sequence of one or more standard Unicode
# characters.
#
# Apple has defined a block of 32 corporate characters as "transcoding
# hints." These are used in combination with standard Unicode characters
# to force them to be treated in a special way for mapping to other
# encodings; they have no other effect. Sixteen of these transcoding
# hints are "grouping hints" - they indicate that the next 2-4 Unicode
# characters should be treated as a single entity for transcoding. The
# other sixteen transcoding hints are "variant tags" - they are like
# combining characters, and can follow a standard Unicode (or a sequence
# consisting of a base character and other combining characters) to
# cause it to be treated in a special way for transcoding. These always
# terminate a combining-character sequence.
#
# The transcoding coding hints used in this mapping table are four
# variant tags in the range 0xF873-75. Since these are combined with
# standard Unicode characters, some characters in the Mac OS Thai
# character set map to a sequence of two Unicodes instead of a single
# Unicode character. For example, the Mac OS Thai character at 0x83 is a
# low-left positional variant of THAI CHARACTER MAI EK (the standard
# mapping is for the abstract character at 0xE8). So 0x83 is mapped to
# 0x0E48 (THAI CHARACTER MAI EK) + 0xF875 (a variant tag).
#
# Details of mapping changes in each version:
# -------------------------------------------
#
# Changes from version b02 to version b03/c01:
#
# - Update mapping for 0xDB to use new Unicode 3.2 character U+2060
# WORD JOINER instead of U+FEFF ZERO WIDTH NO-BREAK SPACE (BOM)
#
# Changes from version n04 to version n07:
#
# - Changed mappings of the positional variants to use standard
# Unicodes + transcoding hint, instead of using single corporate
# zone characters. This affected the mappings for the following:
# 0x83-08C, 0x8F, 0x92-0x9C
#
# - Just comment out unused code points in the table, instead
# of mapping them to U+FFFD.
#
##################
0x00 - 0x7E = 0x0000 -
0x80 = 0x00AB
0x81 = 0x00BB
0x82 = 0x2026
0x83 = 0x0E48
0x84 = 0x0E49
0x85 = 0x0E4A
0x86 = 0x0E4B
0x87 = 0x0E4C
0x88 = 0x0E48
0x89 = 0x0E49
0x8A = 0x0E4A
0x8B = 0x0E4B
0x8C = 0x0E4C
0x8D = 0x201C
0x8E = 0x201D
0x8F = 0x0E4D
0x91 = 0x2022
0x92 = 0x0E31
0x93 = 0x0E47
0x94 = 0x0E34
0x95 = 0x0E35
0x96 = 0x0E36
0x97 = 0x0E37
0x98 = 0x0E48
0x99 = 0x0E49
0x9A = 0x0E4A
0x9B = 0x0E4B
0x9C = 0x0E4C
0x9D = 0x2018
0x9E = 0x2019
0xA0 = 0x00A0
0xA1 = 0x0E01
0xA2 = 0x0E02
0xA3 = 0x0E03
0xA4 = 0x0E04
0xA5 = 0x0E05
0xA6 = 0x0E06
0xA7 = 0x0E07
0xA8 = 0x0E08
0xA9 = 0x0E09
0xAA = 0x0E0A
0xAB = 0x0E0B
0xAC = 0x0E0C
0xAD = 0x0E0D
0xAE = 0x0E0E
0xAF = 0x0E0F
0xB0 = 0x0E10
0xB1 = 0x0E11
0xB2 = 0x0E12
0xB3 = 0x0E13
0xB4 = 0x0E14
0xB5 = 0x0E15
0xB6 = 0x0E16
0xB7 = 0x0E17
0xB8 = 0x0E18
0xB9 = 0x0E19
0xBA = 0x0E1A
0xBB = 0x0E1B
0xBC = 0x0E1C
0xBD = 0x0E1D
0xBE = 0x0E1E
0xBF = 0x0E1F
0xC0 = 0x0E20
0xC1 = 0x0E21
0xC2 = 0x0E22
0xC3 = 0x0E23
0xC4 = 0x0E24
0xC5 = 0x0E25
0xC6 = 0x0E26
0xC7 = 0x0E27
0xC8 = 0x0E28
0xC9 = 0x0E29
0xCA = 0x0E2A
0xCB = 0x0E2B
0xCC = 0x0E2C
0xCD = 0x0E2D
0xCE = 0x0E2E
0xCF = 0x0E2F
0xD0 = 0x0E30
0xD1 = 0x0E31
0xD2 = 0x0E32
0xD3 = 0x0E33
0xD4 = 0x0E34
0xD5 = 0x0E35
0xD6 = 0x0E36
0xD7 = 0x0E37
0xD8 = 0x0E38
0xD9 = 0x0E39
0xDA = 0x0E3A
0xDB = 0x2060
0xDC = 0x200B
0xDD = 0x2013
0xDE = 0x2014
0xDF = 0x0E3F
0xE0 = 0x0E40
0xE1 = 0x0E41
0xE2 = 0x0E42
0xE3 = 0x0E43
0xE4 = 0x0E44
0xE5 = 0x0E45
0xE6 = 0x0E46
0xE7 = 0x0E47
0xE8 = 0x0E48
0xE9 = 0x0E49
0xEA = 0x0E4A
0xEB = 0x0E4B
0xEC = 0x0E4C
0xED = 0x0E4D
0xEE = 0x2122
0xEF = 0x0E4F
0xF0 = 0x0E50
0xF1 = 0x0E51
0xF2 = 0x0E52
0xF3 = 0x0E53
0xF4 = 0x0E54
0xF5 = 0x0E55
0xF6 = 0x0E56
0xF7 = 0x0E57
0xF8 = 0x0E58
0xF9 = 0x0E59
0xFA = 0x00AE
0xFB = 0x00A9
END_MAP

View File

@ -0,0 +1,260 @@
# $NetBSD: TURKISH%UCS.src,v 1.1 2006/03/13 19:45:36 tnozaki Exp $
TYPE ROWCOL
NAME TURKISH/UCS
SRC_ZONE 0x00-0xFF
OOB_MODE ILSEQ
DST_ILSEQ 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: TURKISH.TXT
#
# Contents: Map (external version) from Mac OS Turkish
# character set to Unicode 2.1 and later.
#
# Copyright: (c) 1995-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c02 2005-Apr-05 Update header comments. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
# b3,c1 2002-Dec-19 Update URLs, notes. Matches internal
# utom<b1>.
# b02 1999-Sep-22 Update contact e-mail address. Matches
# internal utom<b1>, ufrm<b1>, and Text
# Encoding Converter version 1.5.
# n05 1998-Feb-05 Minor update to header comments
# n03 1997-Dec-14 Update to match internal utom<n5>, ufrm<n15>:
# Change standard mapping for 0xBD from U+2126
# to its canonical decomposition, U+03A9.
# n02 1995-Apr-15 First version (after fixing some typos).
# Matches internal ufrm<n4>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Turkish code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Turkish code order.
#
# Two of these mappings requires the use of a corporate character.
# See the file "CORPCHAR.TXT" and notes below.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Turkish character set uses the standard control characters at
# 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Turkish:
# ------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported via transcoding to and from
# Unicode.
#
# Mac OS Turkish is used for Turkish.
#
# The Mac OS Turkish encoding shares the script code smRoman
# (0) with the Mac OS Roman encoding. To determine if the Turkish
# encoding is being used, you must also check if the system region
# code is 24, verTurkey.
#
# This character set is a variant of standard Mac OS Roman. It adds
# upper & lower G with breve, upper & lower S with cedilla, upper I
# with dot, and moves the dotless lower i from its position at 0xF5
# in standard Mac OS Roman to a position at 0xDD here (leaving the
# 0xF5 code point undefined in Mac OS Turkish). This gives a total
# of 7 code point differences from standard Mac OS Roman.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# The following corporate zone Unicode characters are used in this
# mapping:
#
# 0xF8A0 undefined1, used to map the single undefined code point
# in Mac OS Turkish (to obtain roundtrip fidelity for all
# code points).
# 0xF8FF Apple logo
#
# NOTE: The graphic image associated with the Apple logo character
# is not authorized for use without permission of Apple, and
# unauthorized use might constitute trademark infringement.
#
# Details of mapping changes in each version:
# -------------------------------------------
#
# Changes from version n02 to version n03:
#
# - Change mapping of 0xBD from U+2126 to its canonical
# decomposition, U+03A9.
#
##################
0x00 - 0x7E = 0x0000 -
0x80 = 0x00C4
0x81 = 0x00C5
0x82 = 0x00C7
0x83 = 0x00C9
0x84 = 0x00D1
0x85 = 0x00D6
0x86 = 0x00DC
0x87 = 0x00E1
0x88 = 0x00E0
0x89 = 0x00E2
0x8A = 0x00E4
0x8B = 0x00E3
0x8C = 0x00E5
0x8D = 0x00E7
0x8E = 0x00E9
0x8F = 0x00E8
0x90 = 0x00EA
0x91 = 0x00EB
0x92 = 0x00ED
0x93 = 0x00EC
0x94 = 0x00EE
0x95 = 0x00EF
0x96 = 0x00F1
0x97 = 0x00F3
0x98 = 0x00F2
0x99 = 0x00F4
0x9A = 0x00F6
0x9B = 0x00F5
0x9C = 0x00FA
0x9D = 0x00F9
0x9E = 0x00FB
0x9F = 0x00FC
0xA0 = 0x2020
0xA1 = 0x00B0
0xA2 = 0x00A2
0xA3 = 0x00A3
0xA4 = 0x00A7
0xA5 = 0x2022
0xA6 = 0x00B6
0xA7 = 0x00DF
0xA8 = 0x00AE
0xA9 = 0x00A9
0xAA = 0x2122
0xAB = 0x00B4
0xAC = 0x00A8
0xAD = 0x2260
0xAE = 0x00C6
0xAF = 0x00D8
0xB0 = 0x221E
0xB1 = 0x00B1
0xB2 = 0x2264
0xB3 = 0x2265
0xB4 = 0x00A5
0xB5 = 0x00B5
0xB6 = 0x2202
0xB7 = 0x2211
0xB8 = 0x220F
0xB9 = 0x03C0
0xBA = 0x222B
0xBB = 0x00AA
0xBC = 0x00BA
0xBD = 0x03A9
0xBE = 0x00E6
0xBF = 0x00F8
0xC0 = 0x00BF
0xC1 = 0x00A1
0xC2 = 0x00AC
0xC3 = 0x221A
0xC4 = 0x0192
0xC5 = 0x2248
0xC6 = 0x2206
0xC7 = 0x00AB
0xC8 = 0x00BB
0xC9 = 0x2026
0xCA = 0x00A0
0xCB = 0x00C0
0xCC = 0x00C3
0xCD = 0x00D5
0xCE = 0x0152
0xCF = 0x0153
0xD0 = 0x2013
0xD1 = 0x2014
0xD2 = 0x201C
0xD3 = 0x201D
0xD4 = 0x2018
0xD5 = 0x2019
0xD6 = 0x00F7
0xD7 = 0x25CA
0xD8 = 0x00FF
0xD9 = 0x0178
0xDA = 0x011E
0xDB = 0x011F
0xDC = 0x0130
0xDD = 0x0131
0xDE = 0x015E
0xDF = 0x015F
0xE0 = 0x2021
0xE1 = 0x00B7
0xE2 = 0x201A
0xE3 = 0x201E
0xE4 = 0x2030
0xE5 = 0x00C2
0xE6 = 0x00CA
0xE7 = 0x00C1
0xE8 = 0x00CB
0xE9 = 0x00C8
0xEA = 0x00CD
0xEB = 0x00CE
0xEC = 0x00CF
0xED = 0x00CC
0xEE = 0x00D3
0xEF = 0x00D4
0xF0 = 0xF8FF
0xF1 = 0x00D2
0xF2 = 0x00DA
0xF3 = 0x00DB
0xF4 = 0x00D9
0xF5 = 0xF8A0
0xF6 = 0x02C6
0xF7 = 0x02DC
0xF8 = 0x00AF
0xF9 = 0x02D8
0xFA = 0x02D9
0xFB = 0x02DA
0xFC = 0x00B8
0xFD = 0x02DD
0xFE = 0x02DB
0xFF = 0x02C7
END_MAP

View File

@ -0,0 +1,247 @@
# $NetBSD: UCS%CELTIC.src,v 1.2 2006/04/08 15:47:39 tnozaki Exp $
TYPE ROWCOL
NAME UCS/CELTIC
SRC_ZONE 0x0000-0x2663
OOB_MODE INVALID
DST_INVALID 0x100
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: CELTIC.TXT
#
# Contents: Map (external version) from Mac OS Celtic
# character set to Unicode 2.1 and later
#
# Contacts: charsets@apple.com, everson@evertype.com
#
# Changes:
#
# c01 2005-Apr-01 First posted version. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Celtic code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Celtic code order.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Celtic character set uses the standard control characters
# at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Celtic (partly from Michael Everson):
# -----------------------------------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported via transcoding to and from
# Unicode.
#
# This character set was developed by Michael Everson of Everson
# Typography (everson@evertype.com) and was used for the Irish
# localizations of Mac OS 6.0.8 and 7.1, for the Welsh localization of
# Mac OS 7.1, and for several fonts that can be used on any version of
# Mac OS 7.1 or later. Note that while Apple authorized
# the Irish and Welsh localizations mentioned above, they were not
# systems which shipped with Apple hardware, and were not otherwise
# supported by Apple. Fonts conforming to the Mac OS Celtic character
# set are available from Everson Typography (http://www.evertype.com)
# and MEU Cymru (http://www.meucymru.co.uk). Information about the use
# of this character set is available at
# http://www.evertype.com/celtscript/celtcode.html.
#
# The Mac OS Celtic encoding shares the script code smRoman (0) with
# the standard Mac OS Roman encoding. To determine if the Celtic
# encoding is being used in Mac OS 7-9, you should also check if the
# system region code is 50, verIreland, or 79, verWales. Otherwise,
# you can check for particular fonts that conform to this encoding.
#
# This character set is a variant of standard Mac OS Roman, adding
# capital and small y with acute, grave, and circumflex, and capital
# and small w with acute, grave, circumflex and diaeresis. It has 14
# code point differences from standard Mac OS Roman (0xDE, 0xDF, 0xE2,
# 0xE3, 0xF6-0xFF).
#
# Before Mac OS 8.5, code point 0xDB was CURRENCY SIGN, and was
# mapped to U+00A4. In Mac OS 8.5 and later versions, code point
# 0xDB is changed to EURO SIGN and maps to U+20AC; the standard
# Apple fonts were updated for Mac OS 8.5 to reflect this. There is
# a "currency sign" variant of the Mac OS Celtic encoding that still
# maps 0xDB to U+00A4; this can be used for older fonts.
# Note: U+20AC is new with Unicode 2.1; for earlier Unicode
# versions, Mac OS Celtic 0xDB may be mapped to private-use
# character U+F8A0.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# Details of mapping changes in each version:
# -------------------------------------------
#
##################
0x0000 - 0x007E = 0x00 -
0x00A0 = 0xCA
0x00A1 = 0xC1
0x00A2 = 0xA2
0x00A3 = 0xA3
0x00A5 = 0xB4
0x00A7 = 0xA4
0x00A8 = 0xAC
0x00A9 = 0xA9
0x00AA = 0xBB
0x00AB = 0xC7
0x00AC = 0xC2
0x00AE = 0xA8
0x00B0 = 0xA1
0x00B1 = 0xB1
0x00B4 = 0xAB
0x00B5 = 0xB5
0x00B6 = 0xA6
0x00B7 = 0xE1
0x00BA = 0xBC
0x00BB = 0xC8
0x00BF = 0xC0
0x00C0 = 0xCB
0x00C1 = 0xE7
0x00C2 = 0xE5
0x00C3 = 0xCC
0x00C4 = 0x80
0x00C5 = 0x81
0x00C6 = 0xAE
0x00C7 = 0x82
0x00C8 = 0xE9
0x00C9 = 0x83
0x00CA = 0xE6
0x00CB = 0xE8
0x00CC = 0xED
0x00CD = 0xEA
0x00CE = 0xEB
0x00CF = 0xEC
0x00D1 = 0x84
0x00D2 = 0xF1
0x00D3 = 0xEE
0x00D4 = 0xEF
0x00D5 = 0xCD
0x00D6 = 0x85
0x00D8 = 0xAF
0x00D9 = 0xF4
0x00DA = 0xF2
0x00DB = 0xF3
0x00DC = 0x86
0x00DD = 0xF6
0x00DF = 0xA7
0x00E0 = 0x88
0x00E1 = 0x87
0x00E2 = 0x89
0x00E3 = 0x8B
0x00E4 = 0x8A
0x00E5 = 0x8C
0x00E6 = 0xBE
0x00E7 = 0x8D
0x00E8 = 0x8F
0x00E9 = 0x8E
0x00EA = 0x90
0x00EB = 0x91
0x00EC = 0x93
0x00ED = 0x92
0x00EE = 0x94
0x00EF = 0x95
0x00F1 = 0x96
0x00F2 = 0x98
0x00F3 = 0x97
0x00F4 = 0x99
0x00F5 = 0x9B
0x00F6 = 0x9A
0x00F7 = 0xD6
0x00F8 = 0xBF
0x00F9 = 0x9D
0x00FA = 0x9C
0x00FB = 0x9E
0x00FC = 0x9F
0x00FD = 0xF7
0x00FF = 0xD8
0x0131 = 0xF5
0x0152 = 0xCE
0x0153 = 0xCF
0x0174 = 0xF8
0x0175 = 0xF9
0x0176 = 0xDE
0x0177 = 0xDF
0x0178 = 0xD9
0x0192 = 0xC4
0x03A9 = 0xBD
0x03C0 = 0xB9
0x1E80 = 0xFC
0x1E81 = 0xFD
0x1E82 = 0xFE
0x1E83 = 0xFF
0x1E84 = 0xFA
0x1E85 = 0xFB
0x1EF2 = 0xE2
0x1EF3 = 0xE3
0x2013 = 0xD0
0x2014 = 0xD1
0x2018 = 0xD4
0x2019 = 0xD5
0x201C = 0xD2
0x201D = 0xD3
0x2020 = 0xA0
0x2021 = 0xE0
0x2022 = 0xA5
0x2026 = 0xC9
0x2030 = 0xE4
0x2039 = 0xDC
0x203A = 0xDD
0x2044 = 0xDA
0x20AC = 0xDB
0x2122 = 0xAA
0x2202 = 0xB6
0x2206 = 0xC6
0x220F = 0xB8
0x2211 = 0xB7
0x221A = 0xC3
0x221E = 0xB0
0x222B = 0xBA
0x2248 = 0xC5
0x2260 = 0xAD
0x2264 = 0xB2
0x2265 = 0xB3
0x25CA = 0xD7
0x2663 = 0xF0
END_MAP

View File

@ -0,0 +1,246 @@
# $NetBSD: UCS%CENTEURO.src,v 1.2 2006/04/08 15:47:39 tnozaki Exp $
TYPE ROWCOL
NAME UCS/CENTEURO
SRC_ZONE 0x0000-0x25CA
OOB_MODE INVALID
DST_INVALID 0x100
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: CENTEURO.TXT
#
# Contents: Map (external version) from Mac OS Central European
# character set to Unicode 2.1 and later.
#
# Copyright: (c) 1995-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c02 2005-Apr-04 Update header comments. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
# b3,c1 2002-Dec-19 Update URLs. Matches internal utom<b1>.
# b02 1999-Sep-22 Update contact e-mail address. Matches
# internal utom<b1>, ufrm<b1>, and Text
# Encoding Converter version 1.5.
# n05 1998-Feb-05 Update header comments to new format; no
# mapping changes. Matches internal utom<n3>,
# ufrm<n13>, and Text Encoding Converter
# version 1.3.
# n03 1995-Apr-15 First version (after fixing some typos).
# Matches internal ufrm<n5>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Central European code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Central European code order.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Central European character set uses the standard control
# characters at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Central European:
# ---------------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported directly in programming
# interfaces for QuickDraw Text, the Script Manager, and related
# Text Utilities. For other purposes it is supported via transcoding
# to and from Unicode.
#
# This character set is intended to cover the following languages:
#
# Polish, Czech, Slovak, Hungarian, Estonian, Latvian, Lithuanian
#
# These are written in Latin script, but using a different set of
# of accented characters than Mac OS Roman. The Mac OS Central
# European character set also includes a number of characters
# needed for the Mac OS user interface and localization (e.g.
# ellipsis, bullet, copyright sign), several typographic
# punctuation symbols, math symbols, etc. However, it has a
# smaller set of punctuation and symbols than Mac OS Roman. All of
# the characters in Mac OS Central European that are also in the
# Mac OS Roman character set are at the same code point in both
# character sets; this improves application compatibility.
#
# Note: This does not have the same letter repertoire as ISO
# 8859-2 (Latin-2); each has some accented letters that the other
# does not have.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# Details of mapping changes in each version:
# -------------------------------------------
#
##################
0x0000 - 0x007F = 0x00 -
0x00A0 = 0xCA
0x00A3 = 0xA3
0x00A7 = 0xA4
0x00A8 = 0xAC
0x00A9 = 0xA9
0x00AB = 0xC7
0x00AC = 0xC2
0x00AE = 0xA8
0x00B0 = 0xA1
0x00B6 = 0xA6
0x00BB = 0xC8
0x00C1 = 0xE7
0x00C4 = 0x80
0x00C9 = 0x83
0x00CD = 0xEA
0x00D3 = 0xEE
0x00D4 = 0xEF
0x00D5 = 0xCD
0x00D6 = 0x85
0x00DA = 0xF2
0x00DC = 0x86
0x00DD = 0xF8
0x00DF = 0xA7
0x00E1 = 0x87
0x00E4 = 0x8A
0x00E9 = 0x8E
0x00ED = 0x92
0x00F3 = 0x97
0x00F4 = 0x99
0x00F5 = 0x9B
0x00F6 = 0x9A
0x00F7 = 0xD6
0x00FA = 0x9C
0x00FC = 0x9F
0x00FD = 0xF9
0x0100 = 0x81
0x0101 = 0x82
0x0104 = 0x84
0x0105 = 0x88
0x0106 = 0x8C
0x0107 = 0x8D
0x010C = 0x89
0x010D = 0x8B
0x010E = 0x91
0x010F = 0x93
0x0112 = 0x94
0x0113 = 0x95
0x0116 = 0x96
0x0117 = 0x98
0x0118 = 0xA2
0x0119 = 0xAB
0x011A = 0x9D
0x011B = 0x9E
0x0122 = 0xFE
0x0123 = 0xAE
0x012A = 0xB1
0x012B = 0xB4
0x012E = 0xAF
0x012F = 0xB0
0x0136 = 0xB5
0x0137 = 0xFA
0x0139 = 0xBD
0x013A = 0xBE
0x013B = 0xB9
0x013C = 0xBA
0x013D = 0xBB
0x013E = 0xBC
0x0141 = 0xFC
0x0142 = 0xB8
0x0143 = 0xC1
0x0144 = 0xC4
0x0145 = 0xBF
0x0146 = 0xC0
0x0147 = 0xC5
0x0148 = 0xCB
0x014C = 0xCF
0x014D = 0xD8
0x0150 = 0xCC
0x0151 = 0xCE
0x0154 = 0xD9
0x0155 = 0xDA
0x0156 = 0xDF
0x0157 = 0xE0
0x0158 = 0xDB
0x0159 = 0xDE
0x015A = 0xE5
0x015B = 0xE6
0x0160 = 0xE1
0x0161 = 0xE4
0x0164 = 0xE8
0x0165 = 0xE9
0x016A = 0xED
0x016B = 0xF0
0x016E = 0xF1
0x016F = 0xF3
0x0170 = 0xF4
0x0171 = 0xF5
0x0172 = 0xF6
0x0173 = 0xF7
0x0179 = 0x8F
0x017A = 0x90
0x017B = 0xFB
0x017C = 0xFD
0x017D = 0xEB
0x017E = 0xEC
0x02C7 = 0xFF
0x2013 = 0xD0
0x2014 = 0xD1
0x2018 = 0xD4
0x2019 = 0xD5
0x201A = 0xE2
0x201C = 0xD2
0x201D = 0xD3
0x201E = 0xE3
0x2020 = 0xA0
0x2022 = 0xA5
0x2026 = 0xC9
0x2039 = 0xDC
0x203A = 0xDD
0x2122 = 0xAA
0x2202 = 0xB6
0x2206 = 0xC6
0x2211 = 0xB7
0x221A = 0xC3
0x2260 = 0xAD
0x2264 = 0xB2
0x2265 = 0xB3
0x25CA = 0xD7
END_MAP

View File

@ -0,0 +1,270 @@
# $NetBSD: UCS%CROATIAN.src,v 1.2 2006/04/08 15:47:39 tnozaki Exp $
TYPE ROWCOL
NAME UCS/CROATIAN
SRC_ZONE 0x0000-0xF8FF
OOB_MODE INVALID
DST_INVALID 0x100
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: CROATIAN.TXT
#
# Contents: Map (external version) from Mac OS Croatian
# character set to Unicode 2.1 and later.
#
# Copyright: (c) 1995-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c02 2005-Apr-04 Update header comments. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
# b3,c1 2002-Dec-19 Update URLs, notes. Matches internal
# utom<b3>.
# b02 1999-Sep-22 Encoding changed for Mac OS 8.5; change
# mapping of 0xDB from CURRENCY SIGN to EURO
# SIGN. Update contact e-mail address. Matches
# internal utom<b2>, ufrm<b2>, and Text
# Encoding Converter version 1.5.
# n07 1998-Feb-05 Minor update to header comments
# n05 1997-Dec-14 Update to match internal utom<5>, ufrm<16>:
# Change standard mapping for 0xBD from U+2126
# to its canonical decomposition, U+03A9.
# n03 1995-Apr-15 First version (after fixing some typos).
# Matches internal ufrm<6>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Croatian code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Croatian code order.
#
# One of these mappings requires the use of a corporate character.
# See the file "CORPCHAR.TXT" and notes below.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Croatian character set uses the standard control characters
# at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Croatian:
# -------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported via transcoding to and from
# Unicode.
#
# Mac OS Croatian is used for Croatian and Slovene.
#
# The Mac OS Croatian encoding shares the script code smRoman
# (0) with the standard Mac OS Roman encoding. To determine if
# the Croatian encoding is being used, you must check if the
# system region code is 68, verCroatia (or 25, verYugoCroatian,
# only used in older systems).
#
# This character set is a variant of standard Mac OS Roman
# encoding, adding five accented letter case pairs to handle
# Croatian. It has 20 code point differences from standard
# Mac OS Roman, but only 10 differences in repertoire.
#
# Before Mac OS 8.5, code point 0xDB was CURRENCY SIGN, and was
# mapped to U+00A4. In Mac OS 8.5 and later versions, code point
# 0xDB is changed to EURO SIGN and maps to U+20AC; the standard
# Apple fonts are updated for Mac OS 8.5 to reflect this. There is
# a "currency sign" variant of the Mac OS Croatian encoding that
# still maps 0xDB to U+00A4; this can be used for older fonts.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# The following corporate zone Unicode character is used in this
# mapping:
#
# 0xF8FF Apple logo
#
# NOTE: The graphic image associated with the Apple logo character
# is not authorized for use without permission of Apple, and
# unauthorized use might constitute trademark infringement.
#
# Details of mapping changes in each version:
# -------------------------------------------
#
# Changes from version n07 to version b02:
#
# - Encoding changed for Mac OS 8.5; change mapping of 0xDB from
# CURRENCY SIGN (U+00A4) to EURO SIGN (U+20AC).
#
# Changes from version n03 to version n05:
#
# - Change mapping of 0xBD from U+2126 to its canonical
# decomposition, U+03A9.
#
##################
0x0000 - 0x007E = 0x00 -
0x00A0 = 0xCA
0x00A1 = 0xC1
0x00A2 = 0xA2
0x00A3 = 0xA3
0x00A7 = 0xA4
0x00A8 = 0xAC
0x00A9 = 0xD9
0x00AA = 0xBB
0x00AB = 0xC7
0x00AC = 0xC2
0x00AE = 0xA8
0x00AF = 0xF8
0x00B0 = 0xA1
0x00B1 = 0xB1
0x00B4 = 0xAB
0x00B5 = 0xB5
0x00B6 = 0xA6
0x00B7 = 0xE1
0x00B8 = 0xFC
0x00BA = 0xBC
0x00BB = 0xDF
0x00BF = 0xC0
0x00C0 = 0xCB
0x00C1 = 0xE7
0x00C2 = 0xE5
0x00C3 = 0xCC
0x00C4 = 0x80
0x00C5 = 0x81
0x00C6 = 0xDE
0x00C7 = 0x82
0x00C8 = 0xE9
0x00C9 = 0x83
0x00CA = 0xFD
0x00CB = 0xFA
0x00CC = 0xED
0x00CD = 0xEA
0x00CE = 0xEB
0x00CF = 0xEC
0x00D1 = 0x84
0x00D2 = 0xF1
0x00D3 = 0xEE
0x00D4 = 0xEF
0x00D5 = 0xCD
0x00D6 = 0x85
0x00D8 = 0xAF
0x00D9 = 0xF4
0x00DA = 0xF2
0x00DB = 0xF3
0x00DC = 0x86
0x00DF = 0xA7
0x00E0 = 0x88
0x00E1 = 0x87
0x00E2 = 0x89
0x00E3 = 0x8B
0x00E4 = 0x8A
0x00E5 = 0x8C
0x00E6 = 0xFE
0x00E7 = 0x8D
0x00E8 = 0x8F
0x00E9 = 0x8E
0x00EA = 0x90
0x00EB = 0x91
0x00EC = 0x93
0x00ED = 0x92
0x00EE = 0x94
0x00EF = 0x95
0x00F1 = 0x96
0x00F2 = 0x98
0x00F3 = 0x97
0x00F4 = 0x99
0x00F5 = 0x9B
0x00F6 = 0x9A
0x00F7 = 0xD6
0x00F8 = 0xBF
0x00F9 = 0x9D
0x00FA = 0x9C
0x00FB = 0x9E
0x00FC = 0x9F
0x0106 = 0xC6
0x0107 = 0xE6
0x010C = 0xC8
0x010D = 0xE8
0x0110 = 0xD0
0x0111 = 0xF0
0x0131 = 0xF5
0x0152 = 0xCE
0x0153 = 0xCF
0x0160 = 0xA9
0x0161 = 0xB9
0x017D = 0xAE
0x017E = 0xBE
0x0192 = 0xC4
0x02C6 = 0xF6
0x02C7 = 0xFF
0x02DA = 0xFB
0x02DC = 0xF7
0x03A9 = 0xBD
0x03C0 = 0xF9
0x2013 = 0xE0
0x2014 = 0xD1
0x2018 = 0xD4
0x2019 = 0xD5
0x201A = 0xE2
0x201C = 0xD2
0x201D = 0xD3
0x201E = 0xE3
0x2020 = 0xA0
0x2022 = 0xA5
0x2026 = 0xC9
0x2030 = 0xE4
0x2039 = 0xDC
0x203A = 0xDD
0x2044 = 0xDA
0x20AC = 0xDB
0x2122 = 0xAA
0x2202 = 0xB6
0x2206 = 0xB4
0x220F = 0xB8
0x2211 = 0xB7
0x221A = 0xC3
0x221E = 0xB0
0x222B = 0xBA
0x2248 = 0xC5
0x2260 = 0xAD
0x2264 = 0xB2
0x2265 = 0xB3
0x25CA = 0xD7
0xF8FF = 0xD8
END_MAP

View File

@ -0,0 +1,271 @@
# $NetBSD: UCS%CYRILLIC.src,v 1.2 2006/04/08 15:47:39 tnozaki Exp $
TYPE ROWCOL
NAME UCS/CYRILLIC
SRC_ZONE 0x0000-0x2265
OOB_MODE INVALID
DST_INVALID 0x100
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: CYRILLIC.TXT
#
# Contents: Map (external version) from Mac OS Cyrillic
# character set to Unicode 2.1 and later.
#
# Copyright: (c) 1995-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c03 2005-Apr-05 Update header comments. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
# b3,c1 2002-Dec-19 Update URLs, notes. Matches internal
# utom<b2>.
# b02 1999-Sep-22 Encoding changed for Mac OS 9.0 to merge
# with Mac OS Ukrainian and support EURO SIGN;
# Change mappings for 0xA2, 0xB6, and 0xFF.
# Update contact e-mail address. Matches
# internal utom<b2>, ufrm<b2>, and Text
# Encoding Converter version 1.5.
# n05 1998-Feb-05 Update header comments to new format; no
# mapping changes. Matches internal utom<n3>,
# ufrm<n13>, and Text Encoding Converter
# version 1.3.
# n03 1995-Apr-15 First version (after fixing some typos).
# Matches internal ufrm<n5>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Cyrillic code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Cyrillic code order.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Cyrillic character set uses the standard control characters
# at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Cyrillic:
# -------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported directly in programming
# interfaces for QuickDraw Text, the Script Manager, and related
# Text Utilities. For other purposes it is supported via transcoding
# to and from Unicode.
#
# This is the "Euro sign" version of Mac Cyrillic for Mac OS 9.0 and
# later. Before Mac OS 9.0, there were two separate Slavic Cyrillic
# encodings:
#
# 1. The Cyrillic currency sign variant (used for localized Russian
# and Bulgarian systems), which had the following:
# 0xA2 U+00A2 CENT SIGN
# 0xB6 U+2202 PARTIAL DIFFERENTIAL
# 0xFF U+00A4 CURRENCY SIGN
#
# 2. The Ukrainian currency sign variant (used for localized Ukrainian
# systems and the pre-9.0 Cyrillic Language Kit), which had the
# following:
# 0xA2 U+0490 CYRILLIC CAPITAL LETTER GHE WITH UPTURN
# 0xB6 U+0491 CYRILLIC SMALL LETTER GHE WITH UPTURN
# 0xFF U+00A4 CURRENCY SIGN
#
# This new Cyrillic Euro sign version is based on the old Ukrainian
# currency sign variant, with 0xFF changed to be EURO SIGN.
#
# The Mac OS Cyrillic encoding includes the Cyrillic letter repertoire
# of ISO 8859-5 (although not at the same code points). This covers
# most of the Slavic languages written in Cyrillic script.
#
# The Mac OS Cyrillic encoding also includes a number of characters
# needed for the Mac OS user interface and localization (e.g.
# ellipsis, bullet, copyright sign). All of the characters in Mac OS
# Cyrillic that are also in the Mac OS Roman encoding are at the
# same code point in both; this improves application compatibility.
#
# Note: There is a common Ukrainian glyph variation in which the glyph
# for CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I may or may not
# have a dot above.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# Details of mapping changes in each version:
# -------------------------------------------
#
# Changes from version n05 to version b02:
#
# - Encoding changed for Mac OS 9.0 to merge with Mac OS Ukrainian and
# support EURO SIGN. 0xA2 changed from U+00A2 to U+0490; 0xB6 changed
# from U+2202 to U+0491; 0xFF changed from U+00A4 to U+20AC.
#
##################
0x0000 - 0x007E = 0x0000 -
0x00A0 = 0xCA
0x00A3 = 0xA3
0x00A7 = 0xA4
0x00A9 = 0xA9
0x00AB = 0xC7
0x00AC = 0xC2
0x00AE = 0xA8
0x00B0 = 0xA1
0x00B1 = 0xB1
0x00B5 = 0xB5
0x00B6 = 0xA6
0x00BB = 0xC8
0x00F7 = 0xD6
0x0192 = 0xC4
0x0401 = 0xDD
0x0402 = 0xAB
0x0403 = 0xAE
0x0404 = 0xB8
0x0405 = 0xC1
0x0406 = 0xA7
0x0407 = 0xBA
0x0408 = 0xB7
0x0409 = 0xBC
0x040A = 0xBE
0x040B = 0xCB
0x040C = 0xCD
0x040E = 0xD8
0x040F = 0xDA
0x0410 = 0x80
0x0411 = 0x81
0x0412 = 0x82
0x0413 = 0x83
0x0414 = 0x84
0x0415 = 0x85
0x0416 = 0x86
0x0417 = 0x87
0x0418 = 0x88
0x0419 = 0x89
0x041A = 0x8A
0x041B = 0x8B
0x041C = 0x8C
0x041D = 0x8D
0x041E = 0x8E
0x041F = 0x8F
0x0420 = 0x90
0x0421 = 0x91
0x0422 = 0x92
0x0423 = 0x93
0x0424 = 0x94
0x0425 = 0x95
0x0426 = 0x96
0x0427 = 0x97
0x0428 = 0x98
0x0429 = 0x99
0x042A = 0x9A
0x042B = 0x9B
0x042C = 0x9C
0x042D = 0x9D
0x042E = 0x9E
0x042F = 0x9F
0x0430 = 0xE0
0x0431 = 0xE1
0x0432 = 0xE2
0x0433 = 0xE3
0x0434 = 0xE4
0x0435 = 0xE5
0x0436 = 0xE6
0x0437 = 0xE7
0x0438 = 0xE8
0x0439 = 0xE9
0x043A = 0xEA
0x043B = 0xEB
0x043C = 0xEC
0x043D = 0xED
0x043E = 0xEE
0x043F = 0xEF
0x0440 = 0xF0
0x0441 = 0xF1
0x0442 = 0xF2
0x0443 = 0xF3
0x0444 = 0xF4
0x0445 = 0xF5
0x0446 = 0xF6
0x0447 = 0xF7
0x0448 = 0xF8
0x0449 = 0xF9
0x044A = 0xFA
0x044B = 0xFB
0x044C = 0xFC
0x044D = 0xFD
0x044E = 0xFE
0x044F = 0xDF
0x0451 = 0xDE
0x0452 = 0xAC
0x0453 = 0xAF
0x0454 = 0xB9
0x0455 = 0xCF
0x0456 = 0xB4
0x0457 = 0xBB
0x0458 = 0xC0
0x0459 = 0xBD
0x045A = 0xBF
0x045B = 0xCC
0x045C = 0xCE
0x045E = 0xD9
0x045F = 0xDB
0x0490 = 0xA2
0x0491 = 0xB6
0x2013 = 0xD0
0x2014 = 0xD1
0x2018 = 0xD4
0x2019 = 0xD5
0x201C = 0xD2
0x201D = 0xD3
0x201E = 0xD7
0x2020 = 0xA0
0x2022 = 0xA5
0x2026 = 0xC9
0x20AC = 0xFF
0x2116 = 0xDC
0x2122 = 0xAA
0x2206 = 0xC6
0x221A = 0xC3
0x221E = 0xB0
0x2248 = 0xC5
0x2260 = 0xAD
0x2264 = 0xB2
0x2265 = 0xB3
END_MAP

View File

@ -0,0 +1,340 @@
# $NetBSD: UCS%DINGBATS.src,v 1.2 2006/04/08 15:47:39 tnozaki Exp $
TYPE ROWCOL
NAME UCS/DINGBATS
SRC_ZONE 0x0000-0x27BE
OOB_MODE INVALID
DST_INVALID 0x100
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: DINGBATS.TXT
#
# Contents: Map (external version) from Mac OS Dingbats
# character set to Unicode 3.2 and later.
#
# Copyright: (c) 1994-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c02 2005-Apr-05 Update header comments. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
# b3,c1 2002-Dec-19 Update mappings for 0x80-0x8D to use new
# Unicode 3.2 characters. Update URLs, notes.
# Matches internal utom<b2>.
# b02 1999-Sep-22 Update contact e-mail address. Matches
# internal utom<b1>, ufrm<b1>, and Text
# Encoding Converter version 1.5.
# n05 1998-Feb-05 Update to match internal utom<n4>, ufrm<n14>,
# and Text Encoding Converter version 1.3:
# Change all mappings to single corporate-zone
# Unicodes to either use standard Unicodes
# or standard Unicodes plus transcoding hints;
# see details below. Also update header
# comments to new format.
# n03 1995-Apr-15 First version (after fixing some typos).
# Matches internal ufrm<n4>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Dingbats code (in hex as 0xNN)
# Column #2 is the corresponding Unicode or Unicode sequence
# (in hex as 0xNNNN).
# Column #3 is a comment containing the Unicode name.
# In some cases an additional comment follows the Unicode name.
#
# The entries are in Mac OS Dingbats code order.
#
# Some of these mappings require the use of corporate characters.
# See the file "CORPCHAR.TXT" and notes below.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Dingbats character set uses the standard control characters
# at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Dingbats:
# -------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported directly in programming
# interfaces for QuickDraw Text, the Script Manager, and related
# Text Utilities. For other purposes it is supported via transcoding
# to and from Unicode.
#
# The Mac OS Dingbats encoding shares the script code smRoman
# (0) with the standard Mac OS Roman encoding. To determine if
# the Dingbats encoding is being used, you must check if the
# font name is "Zapf Dingbats".
#
# The layout of the Dingbats character set is identical to or
# a superset of the layout of the Adobe Zapf Dingbats encoding
# vector.
#
# The following code points are unused, and are not shown here:
# 0x8E-0xA0, 0xF0, 0xFF.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# Details of mapping changes in each version:
# -------------------------------------------
#
# Changes from version b02 to version b03/c01:
#
# - The mappings for the following Mac OS Dingbats characters
# were changed to use standard Unicode characters added for
# Unicode 3.2: 0x80-0x8D.
#
# Changes from version n03 to version n05:
#
# - The mappings for the following Mac OS Dingbats characters
# were changed from single corporate-zone Unicode characters
# to standard Unicode characters:
# 0x80-0x81, 0x84-0x87, 0x8A-0x8D.
#
# - The mappings for the following Mac OS Dingbats characters
# were changed from single corporate-zone Unicode characters
# to combinations of a standard Unicode and a transcoding hint:
# 0x82-0x83, 0x88-0x89.
#
##################
0x0000 - 0x0020 = 0x00 -
0x2192 = 0xD5
0x2194 = 0xD6
0x2195 = 0xD7
0x2460 = 0xAC
0x2461 = 0xAD
0x2462 = 0xAE
0x2463 = 0xAF
0x2464 = 0xB0
0x2465 = 0xB1
0x2466 = 0xB2
0x2467 = 0xB3
0x2468 = 0xB4
0x2469 = 0xB5
0x25A0 = 0x6E
0x25B2 = 0x73
0x25BC = 0x74
0x25C6 = 0x75
0x25CF = 0x6C
0x25D7 = 0x77
0x2605 = 0x48
0x260E = 0x25
0x261B = 0x2A
0x261E = 0x2B
0x2660 = 0xAB
0x2663 = 0xA8
0x2665 = 0xAA
0x2666 = 0xA9
0x2701 = 0x21
0x2702 = 0x22
0x2703 = 0x23
0x2704 = 0x24
0x2706 = 0x26
0x2707 = 0x27
0x2708 = 0x28
0x2709 = 0x29
0x270C = 0x2C
0x270D = 0x2D
0x270E = 0x2E
0x270F = 0x2F
0x2710 = 0x30
0x2711 = 0x31
0x2712 = 0x32
0x2713 = 0x33
0x2714 = 0x34
0x2715 = 0x35
0x2716 = 0x36
0x2717 = 0x37
0x2718 = 0x38
0x2719 = 0x39
0x271A = 0x3A
0x271B = 0x3B
0x271C = 0x3C
0x271D = 0x3D
0x271E = 0x3E
0x271F = 0x3F
0x2720 = 0x40
0x2721 = 0x41
0x2722 = 0x42
0x2723 = 0x43
0x2724 = 0x44
0x2725 = 0x45
0x2726 = 0x46
0x2727 = 0x47
0x2729 = 0x49
0x272A = 0x4A
0x272B = 0x4B
0x272C = 0x4C
0x272D = 0x4D
0x272E = 0x4E
0x272F = 0x4F
0x2730 = 0x50
0x2731 = 0x51
0x2732 = 0x52
0x2733 = 0x53
0x2734 = 0x54
0x2735 = 0x55
0x2736 = 0x56
0x2737 = 0x57
0x2738 = 0x58
0x2739 = 0x59
0x273A = 0x5A
0x273B = 0x5B
0x273C = 0x5C
0x273D = 0x5D
0x273E = 0x5E
0x273F = 0x5F
0x2740 = 0x60
0x2741 = 0x61
0x2742 = 0x62
0x2743 = 0x63
0x2744 = 0x64
0x2745 = 0x65
0x2746 = 0x66
0x2747 = 0x67
0x2748 = 0x68
0x2749 = 0x69
0x274A = 0x6A
0x274B = 0x6B
0x274D = 0x6D
0x274F = 0x6F
0x2750 = 0x70
0x2751 = 0x71
0x2752 = 0x72
0x2756 = 0x76
0x2758 = 0x78
0x2759 = 0x79
0x275A = 0x7A
0x275B = 0x7B
0x275C = 0x7C
0x275D = 0x7D
0x275E = 0x7E
0x2761 = 0xA1
0x2762 = 0xA2
0x2763 = 0xA3
0x2764 = 0xA4
0x2765 = 0xA5
0x2766 = 0xA6
0x2767 = 0xA7
0x2768 = 0x80
0x2769 = 0x81
0x276A = 0x82
0x276B = 0x83
0x276C = 0x84
0x276D = 0x85
0x276E = 0x86
0x276F = 0x87
0x2770 = 0x88
0x2771 = 0x89
0x2772 = 0x8A
0x2773 = 0x8B
0x2774 = 0x8C
0x2775 = 0x8D
0x2776 = 0xB6
0x2777 = 0xB7
0x2778 = 0xB8
0x2779 = 0xB9
0x277A = 0xBA
0x277B = 0xBB
0x277C = 0xBC
0x277D = 0xBD
0x277E = 0xBE
0x277F = 0xBF
0x2780 = 0xC0
0x2781 = 0xC1
0x2782 = 0xC2
0x2783 = 0xC3
0x2784 = 0xC4
0x2785 = 0xC5
0x2786 = 0xC6
0x2787 = 0xC7
0x2788 = 0xC8
0x2789 = 0xC9
0x278A = 0xCA
0x278B = 0xCB
0x278C = 0xCC
0x278D = 0xCD
0x278E = 0xCE
0x278F = 0xCF
0x2790 = 0xD0
0x2791 = 0xD1
0x2792 = 0xD2
0x2793 = 0xD3
0x2794 = 0xD4
0x2798 = 0xD8
0x2799 = 0xD9
0x279A = 0xDA
0x279B = 0xDB
0x279C = 0xDC
0x279D = 0xDD
0x279E = 0xDE
0x279F = 0xDF
0x27A0 = 0xE0
0x27A1 = 0xE1
0x27A2 = 0xE2
0x27A3 = 0xE3
0x27A4 = 0xE4
0x27A5 = 0xE5
0x27A6 = 0xE6
0x27A7 = 0xE7
0x27A8 = 0xE8
0x27A9 = 0xE9
0x27AA = 0xEA
0x27AB = 0xEB
0x27AC = 0xEC
0x27AD = 0xED
0x27AE = 0xEE
0x27AF = 0xEF
0x27B1 = 0xF1
0x27B2 = 0xF2
0x27B3 = 0xF3
0x27B4 = 0xF4
0x27B5 = 0xF5
0x27B6 = 0xF6
0x27B7 = 0xF7
0x27B8 = 0xF8
0x27B9 = 0xF9
0x27BA = 0xFA
0x27BB = 0xFB
0x27BC = 0xFC
0x27BD = 0xFD
0x27BE = 0xFE
END_MAP

View File

@ -0,0 +1,256 @@
# $NetBSD: UCS%GAELIC.src,v 1.2 2006/04/08 15:47:39 tnozaki Exp $
TYPE ROWCOL
NAME UCS/GAELIC
SRC_ZONE 0x0000-0x2663
OOB_MODE INVALID
DST_INVALID 0x100
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: GAELIC.TXT
#
# Contents: Map (external version) from Mac OS Celtic
# character set to Unicode 3.0 and later
#
# Contacts: charsets@apple.com, everson@evertype.com
#
# Changes:
#
# c01 2005-Apr-01 First posted version. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Gaelic code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Gaelic code order.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Gaelic character set uses the standard control characters
# at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Gaelic (partly from Michael Everson):
# -----------------------------------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported via transcoding to and from
# Unicode.
#
# This character set was developed by Michael Everson of Everson
# Typography (everson@evertype.com) and was used for fonts in his
# Celtic Utilities and CeltScript font packages for the Mac, as well
# as some fonts included with the Irish localizations of Mac OS 6.0.8
# and 7.1. Note that while Apple authorized this Irish localization,
# it was not a system which shipped with Apple hardware, and was not
# otherwise supported by Apple. Fonts conforming to the Mac OS Gaelic
# character set are available from Everson Typography
# (http://www.evertype.com/celtscript/). Information about the use of
# this character set is available at
# http://www.evertype.com/celtscript/celtcode.html.
#
# The Mac OS Gaelic encoding shares the script code smRoman (0) with
# the standard Mac OS Roman encoding. To determine if the Gaelic
# encoding is being used in Mac OS 7-9, you should also check if the
# system region code is 81. Otherwise, you can check for particular
# fonts that conform to this encoding (since in practice Gaelic fonts
# are used with the ordinary US or UK system versions).
#
# This character set is a variant of standard Mac OS Roman, adding
# capital and small y with acute, grave, and circumflex; capital and
# small w with acute, grave, circumflex and diaeresis; capital and
# small b, c, d, f, g, m, p, s, t with dot above; tironian et; small
# long r, small long s, and small long s with dot above. It has 36
# code point differences from standard Mac OS Roman.
#
# Before Mac OS 8.5, code point 0xDB was CURRENCY SIGN, and was
# mapped to U+00A4. In Mac OS 8.5 and later versions, code point
# 0xDB is changed to EURO SIGN and maps to U+20AC; the standard
# Apple fonts are updated for Mac OS 8.5 to reflect this. There is
# a "currency sign" variant of the Latin 8 Extended encoding that still
# maps 0xDB to U+00A4; this can be used for older fonts.
# Note: U+20AC is new with Unicode 2.1; for earlier Unicode
# versions, Latin 8 Extended 0xDB may be mapped to private-use
# character U+F8A0.
#
# Before Unicode 3.0, code point 0xE4 was PER MILLE SIGN, and was
# mapped to U+2030. Since August 1998, code point 0xE4 is changed
# to TIRONIAN SIGN ET and maps to U+204A. There is a "per mille
# sign" variant of the Mac OS Gaelic encoding that still
# maps 0xE4 to U+2030; this can be used for older fonts.
# Note: U+204A is new with Unicode 3.0; for earlier Unicode
# versions, Mac OS Gaelic was unified with AMPERSAND.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# Details of mapping changes in each version:
# -------------------------------------------
#
##################
0x0000 - 0x007E = 0x00 -
0x00A0 = 0xCA
0x00A2 = 0xA2
0x00A3 = 0xA3
0x00A7 = 0xA4
0x00A8 = 0xAC
0x00A9 = 0xA9
0x00AB = 0xC7
0x00AE = 0xA8
0x00B0 = 0xA1
0x00B1 = 0xB1
0x00B4 = 0xAB
0x00B6 = 0xA6
0x00B7 = 0xE1
0x00BB = 0xC8
0x00C0 = 0xCB
0x00C1 = 0xE7
0x00C2 = 0xE5
0x00C3 = 0xCC
0x00C4 = 0x80
0x00C5 = 0x81
0x00C6 = 0xAE
0x00C7 = 0x82
0x00C8 = 0xE9
0x00C9 = 0x83
0x00CA = 0xE6
0x00CB = 0xE8
0x00CC = 0xED
0x00CD = 0xEA
0x00CE = 0xEB
0x00CF = 0xEC
0x00D1 = 0x84
0x00D2 = 0xF1
0x00D3 = 0xEE
0x00D4 = 0xEF
0x00D5 = 0xCD
0x00D6 = 0x85
0x00D8 = 0xAF
0x00D9 = 0xF4
0x00DA = 0xF2
0x00DB = 0xF3
0x00DC = 0x86
0x00DD = 0xF6
0x00DF = 0xA7
0x00E0 = 0x88
0x00E1 = 0x87
0x00E2 = 0x89
0x00E3 = 0x8B
0x00E4 = 0x8A
0x00E5 = 0x8C
0x00E6 = 0xBE
0x00E7 = 0x8D
0x00E8 = 0x8F
0x00E9 = 0x8E
0x00EA = 0x90
0x00EB = 0x91
0x00EC = 0x93
0x00ED = 0x92
0x00EE = 0x94
0x00EF = 0x95
0x00F1 = 0x96
0x00F2 = 0x98
0x00F3 = 0x97
0x00F4 = 0x99
0x00F5 = 0x9B
0x00F6 = 0x9A
0x00F8 = 0xBF
0x00F9 = 0x9D
0x00FA = 0x9C
0x00FB = 0x9E
0x00FC = 0x9F
0x00FD = 0xF7
0x00FF = 0xD8
0x010A = 0xB5
0x010B = 0xB6
0x0120 = 0xBB
0x0121 = 0xBC
0x0131 = 0xF5
0x0152 = 0xCE
0x0153 = 0xCF
0x0174 = 0xF8
0x0175 = 0xF9
0x0176 = 0xDE
0x0177 = 0xDF
0x0178 = 0xD9
0x017F = 0xC5
0x0192 = 0xC4
0x027C = 0xC3
0x1E02 = 0xB0
0x1E03 = 0xB4
0x1E0A = 0xB7
0x1E0B = 0xB8
0x1E1E = 0xB9
0x1E1F = 0xBA
0x1E40 = 0xBD
0x1E41 = 0xC0
0x1E56 = 0xC1
0x1E57 = 0xC2
0x1E60 = 0xC6
0x1E61 = 0xD6
0x1E6A = 0xDA
0x1E6B = 0xE0
0x1E80 = 0xFC
0x1E81 = 0xFD
0x1E82 = 0xFE
0x1E83 = 0xFF
0x1E84 = 0xFA
0x1E85 = 0xFB
0x1E9B = 0xD7
0x1EF2 = 0xE2
0x1EF3 = 0xE3
0x2013 = 0xD0
0x2014 = 0xD1
0x2018 = 0xD4
0x2019 = 0xD5
0x201C = 0xD2
0x201D = 0xD3
0x2020 = 0xA0
0x2022 = 0xA5
0x2026 = 0xC9
0x2039 = 0xDC
0x203A = 0xDD
0x204A = 0xE4
0x20AC = 0xDB
0x2122 = 0xAA
0x2260 = 0xAD
0x2264 = 0xB2
0x2265 = 0xB3
0x2663 = 0xF0
END_MAP

View File

@ -0,0 +1,274 @@
# $NetBSD: UCS%GREEK.src,v 1.2 2006/04/08 15:47:40 tnozaki Exp $
TYPE ROWCOL
NAME UCS/GREEK
SRC_ZONE 0x0000-0x2265
OOB_MODE INVALID
DST_INVALID 0x100
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: GREEK.TXT
#
# Contents: Map (external version) from Mac OS Greek
# character set to Unicode 2.1 and later.
#
# Copyright: (c) 1995-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c02 2005-Apr-05 Update header comments. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
# b3,c1 2002-Dec-19 Update to match changes in Mac OS Greek
# encoding for Mac OS 9.2.2 and later.
# Update URLs, notes. Matches internal
# utom<b3>.
# b02 1999-Sep-22 Update contact e-mail address. Matches
# internal utom<b1>, ufrm<b1>, and Text
# Encoding Converter version 1.5.
# n06 1998-Feb-05 Update to match internal utom<n4>, ufrm<n17>,
# and Text Encoding Converter versions 1.3:
# Change mapping for 0xAF from U+0387 to its
# canonical decomposition, U+00B7. Also
# update header comments to new format.
# n04 1995-Apr-15 First version (after fixing some typos).
# Matches internal ufrm<n7>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Greek code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Greek code order.
#
# One of these mappings requires the use of a corporate character.
# See the file "CORPCHAR.TXT" and notes below.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Greek character set uses the standard control characters at
# 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Greek:
# ----------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported via transcoding to and from
# Unicode.
#
# Although a Mac OS script code is defined for Greek (smGreek = 6),
# the Greek localized system does not currently use it (the font
# family IDs are in the Mac OS Roman range). To determine if the
# Greek encoding is being used when the script code is smRoman (0),
# you must check if the system region code is 20, verGreece.
#
# The Mac OS Greek encoding is a superset of the repertoire of
# ISO 8859-7 (although characters are not at the same code points),
# except that LEFT & RIGHT SINGLE QUOTATION MARK replace the
# MODIFIER LETTER REVERSED COMMA & APOSTROPHE (spacing versions of
# Greek rough & smooth breathing marks) that are in ISO 8859-7.
# The added characters in Mac OS Greek include more punctuation and
# symbols and several accented Latin letters.
#
# Before Mac OS 9.2.2, code point 0x9C was SOFT HYPHEN (U+00AD), and
# code point 0xFF was undefined. In Mac OS 9.2.2 and later versions,
# SOFT HYPHEN was moved to 0xFF, and code point 0x9C was changed to be
# EURO SIGN (U+20AC); the standard Apple fonts are updated for Mac OS
# 9.2.2 to reflect this. There is a "no Euro sign" variant of the Mac
# OS Greek encoding that uses the older mapping; this can be used for
# older fonts.
#
# This "no Euro sign" variant of Mac OS Greek was the character set
# used by Mac OS Greek systems before 9.2.2 except for system 6.0.7,
# which used a variant character set but was quickly replaced with
# Greek system 6.0.7.1 using the no Euro sign" character set
# documented here. Greek system 4.1 used a variant Greek set that had
# ISO 8859-7 in 0xA0-0xFF (with some holes filled in with DTP
# characters), and Mac OS Roman accented Roman letters in 0x80-0x9F.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# Details of mapping changes in each version:
# -------------------------------------------
#
# Changes from version b02 to version b03/c01:
#
# - The Mac OS Greek encoding changed for Mac OS 9.2.2 and later
# as follows:
# 0x9C, changed from 0x00AD SOFT HYPHEN to 0x20AC EURO SIGN
# 0xFF, changed from undefined to 0x00AD SOFT HYPHEN
#
# Changes from version n04 to version n06:
#
# - Change mapping of 0xAF from U+0387 to its canonical
# decomposition, U+00B7.
#
##################
0x0000 - 0x007E = 0x00 -
0x00A0 = 0xCA
0x00A3 = 0x92
0x00A5 = 0xB4
0x00A6 = 0x9B
0x00A7 = 0xAC
0x00A8 = 0x8C
0x00A9 = 0xA9
0x00AB = 0xC7
0x00AC = 0xC2
0x00AD = 0xFF
0x00AE = 0xA8
0x00B0 = 0xAE
0x00B1 = 0xB1
0x00B2 = 0x82
0x00B3 = 0x84
0x00B7 = 0xAF
0x00B9 = 0x81
0x00BB = 0xC8
0x00BD = 0x97
0x00C4 = 0x80
0x00C9 = 0x83
0x00D6 = 0x85
0x00DC = 0x86
0x00DF = 0xA7
0x00E0 = 0x88
0x00E2 = 0x89
0x00E4 = 0x8A
0x00E7 = 0x8D
0x00E8 = 0x8F
0x00E9 = 0x8E
0x00EA = 0x90
0x00EB = 0x91
0x00EE = 0x94
0x00EF = 0x95
0x00F4 = 0x99
0x00F6 = 0x9A
0x00F7 = 0xD6
0x00F9 = 0x9D
0x00FB = 0x9E
0x00FC = 0x9F
0x0153 = 0xCF
0x0384 = 0x8B
0x0385 = 0x87
0x0386 = 0xCD
0x0388 = 0xCE
0x0389 = 0xD7
0x038A = 0xD8
0x038C = 0xD9
0x038E = 0xDA
0x038F = 0xDF
0x0390 = 0xFD
0x0391 = 0xB0
0x0392 = 0xB5
0x0393 = 0xA1
0x0394 = 0xA2
0x0395 = 0xB6
0x0396 = 0xB7
0x0397 = 0xB8
0x0398 = 0xA3
0x0399 = 0xB9
0x039A = 0xBA
0x039B = 0xA4
0x039C = 0xBB
0x039D = 0xC1
0x039E = 0xA5
0x039F = 0xC3
0x03A0 = 0xA6
0x03A1 = 0xC4
0x03A3 = 0xAA
0x03A4 = 0xC6
0x03A5 = 0xCB
0x03A6 = 0xBC
0x03A7 = 0xCC
0x03A8 = 0xBE
0x03A9 = 0xBF
0x03AA = 0xAB
0x03AB = 0xBD
0x03AC = 0xC0
0x03AD = 0xDB
0x03AE = 0xDC
0x03AF = 0xDD
0x03B0 = 0xFE
0x03B1 = 0xE1
0x03B2 = 0xE2
0x03B3 = 0xE7
0x03B4 = 0xE4
0x03B5 = 0xE5
0x03B6 = 0xFA
0x03B7 = 0xE8
0x03B8 = 0xF5
0x03B9 = 0xE9
0x03BA = 0xEB
0x03BB = 0xEC
0x03BC = 0xED
0x03BD = 0xEE
0x03BE = 0xEA
0x03BF = 0xEF
0x03C0 = 0xF0
0x03C1 = 0xF2
0x03C2 = 0xF7
0x03C3 = 0xF3
0x03C4 = 0xF4
0x03C5 = 0xF9
0x03C6 = 0xE6
0x03C7 = 0xF8
0x03C8 = 0xE3
0x03C9 = 0xF6
0x03CA = 0xFB
0x03CB = 0xFC
0x03CC = 0xDE
0x03CD = 0xE0
0x03CE = 0xF1
0x2013 = 0xD0
0x2015 = 0xD1
0x2018 = 0xD4
0x2019 = 0xD5
0x201C = 0xD2
0x201D = 0xD3
0x2020 = 0xA0
0x2022 = 0x96
0x2026 = 0xC9
0x2030 = 0x98
0x20AC = 0x9C
0x2122 = 0x93
0x2248 = 0xC5
0x2260 = 0xAD
0x2264 = 0xB2
0x2265 = 0xB3
END_MAP

View File

@ -0,0 +1,288 @@
# $NetBSD: UCS%ICELAND.src,v 1.2 2006/04/08 15:47:40 tnozaki Exp $
TYPE ROWCOL
NAME UCS/ICELAND
SRC_ZONE 0x0000-0xF8FF
OOB_MODE INVALID
DST_INVALID 0x100
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: ICELAND.TXT
#
# Contents: Map (external version) from Mac OS Icelandic
# character set to Unicode 2.1 and later.
#
# Copyright: (c) 1995-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c02 2005-Apr-05 Update header comments. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
# b3,c1 2002-Dec-19 Update URLs, notes. Matches internal
# utom<b3>.
# b02 1999-Sep-22 Encoding changed for Mac OS 8.5; change
# mapping of 0xDB from CURRENCY SIGN to EURO
# SIGN. Update contact e-mail address. Matches
# internal utom<b2>, ufrm<b2>, and Text
# Encoding Converter version 1.5.
# n06 1998-Feb-05 Minor update to header comments, add
# information on font variants
# n03 1997-Dec-14 Update to match internal utom<n4>, ufrm<n16>:
# Change standard mapping for 0xBD from U+2126
# to its canonical decomposition, U+03A9.
# n02 1995-Apr-15 First version (after fixing some typos).
# Matches internal ufrm<n5>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Icelandic code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Icelandic code order.
#
# One of these mappings requires the use of a corporate character.
# See the file "CORPCHAR.TXT" and notes below.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Icelandic character set uses the standard control characters
# at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Icelandic:
# --------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported via transcoding to and from
# Unicode.
#
# 1. General
#
# Mac OS Icelandic is used for Icelandic and Faroese.
#
# The Mac OS Icelandic encoding shares the script code smRoman
# (0) with the standard Mac OS Roman encoding. To determine if
# the Icelandic encoding is being used, you must also check if
# the system region code is 21, verIceland.
#
# This character set is a variant of standard Mac OS Roman,
# adding upper and lower eth, thorn, and Y acute. It has 6 code
# point differences from standard Mac OS Roman.
#
# Before Mac OS 8.5, code point 0xDB was CURRENCY SIGN, and was
# mapped to U+00A4. In Mac OS 8.5 and later versions, code point
# 0xDB is changed to EURO SIGN and maps to U+20AC; the standard
# Apple fonts are updated for Mac OS 8.5 to reflect this. There are
# "currency sign" variants of the Mac OS Icelandic encoding that
# still map 0xDB to U+00A4; these can be used for older fonts.
#
# 2. Font variants
#
# The table in this file gives the Unicode mappings for the standard
# Mac OS Icelandic encoding. This encoding is supported by the
# Icelandic versions of the fonts Chicago, Geneva, Monaco, and New
# York, and is the encoding supported by the text processing
# utilities. However, other TrueType fonts implement a slightly
# different encoding; the difference is only in two code points.
# For the standard variant, these are:
# 0xBB -> 0x00AA FEMININE ORDINAL INDICATOR
# 0xBC -> 0x00BA MASCULINE ORDINAL INDICATOR
#
# For the TrueType variant (used by the Icelandic versions of the
# fonts Courier, Helvetica, Palatino, and Times), these are:
# 0xBB -> 0xFB01 LATIN SMALL LIGATURE FI
# 0xBC -> 0xFB02 LATIN SMALL LIGATURE FL
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# The following corporate zone Unicode character is used in this
# mapping:
#
# 0xF8FF Apple logo
#
# NOTE: The graphic image associated with the Apple logo character
# is not authorized for use without permission of Apple, and
# unauthorized use might constitute trademark infringement.
#
# Details of mapping changes in each version:
# -------------------------------------------
#
# Changes from version n06 to version b02:
#
# - Encoding changed for Mac OS 8.5; change mapping of 0xDB from
# CURRENCY SIGN (U+00A4) to EURO SIGN (U+20AC).
#
# Changes from version n02 to version n03:
#
# - Change mapping of 0xBD from U+2126 to its canonical
# decomposition, U+03A9.
#
##################
0x0000 - 0x007E = 0x00 -
0x00A0 = 0xCA
0x00A1 = 0xC1
0x00A2 = 0xA2
0x00A3 = 0xA3
0x00A5 = 0xB4
0x00A7 = 0xA4
0x00A8 = 0xAC
0x00A9 = 0xA9
0x00AA = 0xBB
0x00AB = 0xC7
0x00AC = 0xC2
0x00AE = 0xA8
0x00AF = 0xF8
0x00B0 = 0xA1
0x00B1 = 0xB1
0x00B4 = 0xAB
0x00B5 = 0xB5
0x00B6 = 0xA6
0x00B7 = 0xE1
0x00B8 = 0xFC
0x00BA = 0xBC
0x00BB = 0xC8
0x00BF = 0xC0
0x00C0 = 0xCB
0x00C1 = 0xE7
0x00C2 = 0xE5
0x00C3 = 0xCC
0x00C4 = 0x80
0x00C5 = 0x81
0x00C6 = 0xAE
0x00C7 = 0x82
0x00C8 = 0xE9
0x00C9 = 0x83
0x00CA = 0xE6
0x00CB = 0xE8
0x00CC = 0xED
0x00CD = 0xEA
0x00CE = 0xEB
0x00CF = 0xEC
0x00D0 = 0xDC
0x00D1 = 0x84
0x00D2 = 0xF1
0x00D3 = 0xEE
0x00D4 = 0xEF
0x00D5 = 0xCD
0x00D6 = 0x85
0x00D8 = 0xAF
0x00D9 = 0xF4
0x00DA = 0xF2
0x00DB = 0xF3
0x00DC = 0x86
0x00DD = 0xA0
0x00DE = 0xDE
0x00DF = 0xA7
0x00E0 = 0x88
0x00E1 = 0x87
0x00E2 = 0x89
0x00E3 = 0x8B
0x00E4 = 0x8A
0x00E5 = 0x8C
0x00E6 = 0xBE
0x00E7 = 0x8D
0x00E8 = 0x8F
0x00E9 = 0x8E
0x00EA = 0x90
0x00EB = 0x91
0x00EC = 0x93
0x00ED = 0x92
0x00EE = 0x94
0x00EF = 0x95
0x00F0 = 0xDD
0x00F1 = 0x96
0x00F2 = 0x98
0x00F3 = 0x97
0x00F4 = 0x99
0x00F5 = 0x9B
0x00F6 = 0x9A
0x00F7 = 0xD6
0x00F8 = 0xBF
0x00F9 = 0x9D
0x00FA = 0x9C
0x00FB = 0x9E
0x00FC = 0x9F
0x00FD = 0xE0
0x00FE = 0xDF
0x00FF = 0xD8
0x0131 = 0xF5
0x0152 = 0xCE
0x0153 = 0xCF
0x0178 = 0xD9
0x0192 = 0xC4
0x02C6 = 0xF6
0x02C7 = 0xFF
0x02D8 = 0xF9
0x02D9 = 0xFA
0x02DA = 0xFB
0x02DB = 0xFE
0x02DC = 0xF7
0x02DD = 0xFD
0x03A9 = 0xBD
0x03C0 = 0xB9
0x2013 = 0xD0
0x2014 = 0xD1
0x2018 = 0xD4
0x2019 = 0xD5
0x201A = 0xE2
0x201C = 0xD2
0x201D = 0xD3
0x201E = 0xE3
0x2022 = 0xA5
0x2026 = 0xC9
0x2030 = 0xE4
0x2044 = 0xDA
0x20AC = 0xDB
0x2122 = 0xAA
0x2202 = 0xB6
0x2206 = 0xC6
0x220F = 0xB8
0x2211 = 0xB7
0x221A = 0xC3
0x221E = 0xB0
0x222B = 0xBA
0x2248 = 0xC5
0x2260 = 0xAD
0x2264 = 0xB2
0x2265 = 0xB3
0x25CA = 0xD7
0xF8FF = 0xF0
END_MAP

View File

@ -0,0 +1,241 @@
# $NetBSD: UCS%INUIT.src,v 1.2 2006/04/08 15:47:40 tnozaki Exp $
TYPE ROWCOL
NAME UCS/INUIT
SRC_ZONE 0x0000-0x2122
OOB_MODE INVALID
DST_INVALID 0x100
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: INUIT.TXT
#
# Contents: Map (external version) from Mac OS Inuit
# character set to Unicode 3.0 and later
#
# Contacts: charsets@apple.com, everson@evertype.com
#
# Changes:
#
# c01 2005-Apr-01 First posted version. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Inuit code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Inuit code order.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Inuit character set uses the standard control characters
# at 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Inuit (partly from Michael Everson):
# ----------------------------------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported via transcoding to and from
# Unicode.
#
# This character set was developed by Michael Everson of Everson
# Typography (everson@evertype.com) and was used for the Inuktitut
# localizations of Mac OS, as well as for the Inuktitut utilities
# package from Everson Typography. Note that while Apple authorized
# the Inuktitut localization mentioned above, it was not shipped with
# Apple hardware, and was not otherwise supported by Apple. Fonts
# conforming to the Mac OS Inuit character set are available from
# Everson Typography (http://www.evertype.com/software/apple/).
# Information about the use of this character set is available at
# http://www.evertype.com/standards/iu/.
#
# The Mac OS Inuit character set shares the script code smEthiopic
# (28) with the Ethiopic encoding. To determine if the Inuktitut
# encoding is being used, you must also check if the system region
# code is 78, verNunavut.
#
# The Mac OS Inuit character set includes the full syllabic letter
# repertoire required for Inuktitut; it is a subset of the Unified
# Canadian Aboriginal Syllabics set encoded in Unicode. The encoding
# is InuitSCII, designed by Doug Hitch for the Government of the
# Northwest Territories.
#
# The Mac OS Inuit character set also includes a number of characters
# that were needed for the classic Mac OS user interface and
# localization (e.g. ellipsis, bullet, copyright sign). All of the
# characters in Mac OS Inuit that are also in the Mac OS Roman
# encoding are at the same code point in both; this improves
# application compatibility.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# Details of mapping changes in each version:
# -------------------------------------------
#
##################
0x0000 - 0x007E = 0x00 -
0x00A0 = 0xCA
0x00A9 = 0xA9
0x00AE = 0xA8
0x00B0 = 0xA1
0x00B6 = 0xA6
0x0141 = 0xFE
0x0142 = 0xFF
0x1403 = 0x80
0x1404 = 0x81
0x1405 = 0x82
0x1406 = 0x83
0x140A = 0x84
0x140B = 0x85
0x1431 = 0x86
0x1432 = 0x87
0x1433 = 0x88
0x1434 = 0x89
0x1438 = 0x8A
0x1439 = 0x8B
0x1449 = 0x8C
0x144E = 0x8D
0x144F = 0x8E
0x1450 = 0x8F
0x1451 = 0x90
0x1455 = 0x91
0x1456 = 0x92
0x1466 = 0x93
0x146D = 0x94
0x146E = 0x95
0x146F = 0x96
0x1470 = 0x97
0x1472 = 0x98
0x1473 = 0x99
0x1483 = 0x9A
0x148B = 0x9B
0x148C = 0x9C
0x148D = 0x9D
0x148E = 0x9E
0x1490 = 0x9F
0x1491 = 0xA0
0x14A1 = 0xA2
0x14A5 = 0xA3
0x14A6 = 0xA4
0x14A7 = 0xA7
0x14A8 = 0xAB
0x14AA = 0xAC
0x14AB = 0xAD
0x14BB = 0xAE
0x14C2 = 0xAF
0x14C3 = 0xB0
0x14C4 = 0xB1
0x14C5 = 0xB2
0x14C7 = 0xB3
0x14C8 = 0xB4
0x14D0 = 0xB5
0x14D5 = 0xBD
0x14D6 = 0xBE
0x14D7 = 0xBF
0x14D8 = 0xC0
0x14DA = 0xC1
0x14DB = 0xC2
0x14EA = 0xC3
0x14EF = 0xB6
0x14F0 = 0xB7
0x14F1 = 0xB8
0x14F2 = 0xB9
0x14F4 = 0xBA
0x14F5 = 0xBB
0x1505 = 0xBC
0x1528 = 0xC4
0x1529 = 0xC5
0x152A = 0xC6
0x152B = 0xC7
0x152D = 0xC8
0x152E = 0xCB
0x153E = 0xCC
0x1546 = 0xDA
0x1547 = 0xDB
0x1548 = 0xDC
0x1549 = 0xDD
0x154B = 0xDE
0x154C = 0xDF
0x1550 = 0xE0
0x1555 = 0xCD
0x1556 = 0xCE
0x1557 = 0xCF
0x1558 = 0xD6
0x1559 = 0xD7
0x155A = 0xD8
0x155D = 0xD9
0x157C = 0xFD
0x157F = 0xE1
0x1580 = 0xE2
0x1581 = 0xE3
0x1582 = 0xE4
0x1583 = 0xE5
0x1584 = 0xE6
0x1585 = 0xE7
0x158F = 0xE8
0x1590 = 0xE9
0x1591 = 0xEA
0x1592 = 0xEB
0x1593 = 0xEC
0x1594 = 0xED
0x1595 = 0xEE
0x1596 = 0xF5
0x15A0 = 0xF6
0x15A1 = 0xF7
0x15A2 = 0xF8
0x15A3 = 0xF9
0x15A4 = 0xFA
0x15A5 = 0xFB
0x15A6 = 0xFC
0x1671 = 0xEF
0x1672 = 0xF0
0x1673 = 0xF1
0x1674 = 0xF2
0x1675 = 0xF3
0x1676 = 0xF4
0x2013 = 0xD0
0x2014 = 0xD1
0x2018 = 0xD4
0x2019 = 0xD5
0x201C = 0xD2
0x201D = 0xD3
0x2022 = 0xA5
0x2026 = 0xC9
0x2122 = 0xAA
END_MAP

View File

@ -0,0 +1,289 @@
# $NetBSD: UCS%ROMAN.src,v 1.2 2006/04/08 15:47:40 tnozaki Exp $
TYPE ROWCOL
NAME UCS/ROMAN
SRC_ZONE 0x0000-0xFB02
OOB_MODE INVALID
DST_INVALID 0x100
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: ROMAN.TXT
#
# Contents: Map (external version) from Mac OS Roman
# character set to Unicode 2.1 and later.
#
# Copyright: (c) 1994-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c02 2005-Apr-05 Update header comments. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
# b4,c1 2002-Dec-19 Update URLs, notes. Matches internal
# utom<b5>.
# b03 1999-Sep-22 Update contact e-mail address. Matches
# internal utom<b4>, ufrm<b3>, and Text
# Encoding Converter version 1.5.
# b02 1998-Aug-18 Encoding changed for Mac OS 8.5; change
# mapping of 0xDB from CURRENCY SIGN to
# EURO SIGN. Matches internal utom<b3>,
# ufrm<b3>.
# n08 1998-Feb-05 Minor update to header comments
# n06 1997-Dec-14 Add warning about future changes to 0xDB
# from CURRENCY SIGN to EURO SIGN. Clarify
# some header information
# n04 1997-Dec-01 Update to match internal utom<n3>, ufrm<n22>:
# Change standard mapping for 0xBD from U+2126
# to its canonical decomposition, U+03A9.
# n03 1995-Apr-15 First version (after fixing some typos).
# Matches internal ufrm<n9>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Roman code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Roman code order.
#
# One of these mappings requires the use of a corporate character.
# See the file "CORPCHAR.TXT" and notes below.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Roman character set uses the standard control characters at
# 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Roman:
# ----------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported directly in programming
# interfaces for QuickDraw Text, the Script Manager, and related
# Text Utilities. For other purposes it is supported via transcoding
# to and from Unicode.
#
# This character set is used for at least the following Mac OS
# localizations: U.S., British, Canadian French, French, Swiss
# French, German, Swiss German, Italian, Swiss Italian, Dutch,
# Swedish, Norwegian, Danish, Finnish, Spanish, Catalan,
# Portuguese, Brazilian, and the default International system.
#
# Variants of Mac OS Roman are used for Croatian, Icelandic,
# Turkish, Romanian, and other encodings. Separate mapping tables
# are available for these encodings.
#
# Before Mac OS 8.5, code point 0xDB was CURRENCY SIGN, and was
# mapped to U+00A4. In Mac OS 8.5 and later versions, code point
# 0xDB is changed to EURO SIGN and maps to U+20AC; the standard
# Apple fonts are updated for Mac OS 8.5 to reflect this. There is
# a "currency sign" variant of the Mac OS Roman encoding that still
# maps 0xDB to U+00A4; this can be used for older fonts.
#
# Before Mac OS 8.5, the ROM bitmap versions of the fonts Chicago,
# New York, Geneva, and Monaco did not implement the full Mac OS
# Roman character set; they only supported character codes up to
# 0xD8. The TrueType versions of these fonts have always implemented
# the full character set, as with the bitmap and TrueType versions
# of the other standard Roman fonts.
#
# In all Mac OS encodings, fonts such as Chicago which are used
# as "system" fonts (for menus, dialogs, etc.) have four glyphs
# at code points 0x11-0x14 for transient use by the Menu Manager.
# These glyphs are not intended as characters for use in normal
# text, and the associated code points are not generally
# interpreted as associated with these glyphs; they are usually
# interpreted (if at all) as the control codes DC1-DC4.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# The following corporate zone Unicode character is used in this
# mapping:
#
# 0xF8FF Apple logo
#
# NOTE: The graphic image associated with the Apple logo character
# is not authorized for use without permission of Apple, and
# unauthorized use might constitute trademark infringement.
#
# Details of mapping changes in each version:
# -------------------------------------------
#
# Changes from version n08 to version b02:
#
# - Encoding changed for Mac OS 8.5; change mapping of 0xDB from
# CURRENCY SIGN (U+00A4) to EURO SIGN (U+20AC).
#
# Changes from version n03 to version n04:
#
# - Change mapping of 0xBD from U+2126 to its canonical
# decomposition, U+03A9.
#
##################
0x0000 - 0x007E = 0x00 -
0x00A0 = 0xCA
0x00A1 = 0xC1
0x00A2 = 0xA2
0x00A3 = 0xA3
0x00A5 = 0xB4
0x00A7 = 0xA4
0x00A8 = 0xAC
0x00A9 = 0xA9
0x00AA = 0xBB
0x00AB = 0xC7
0x00AC = 0xC2
0x00AE = 0xA8
0x00AF = 0xF8
0x00B0 = 0xA1
0x00B1 = 0xB1
0x00B4 = 0xAB
0x00B5 = 0xB5
0x00B6 = 0xA6
0x00B7 = 0xE1
0x00B8 = 0xFC
0x00BA = 0xBC
0x00BB = 0xC8
0x00BF = 0xC0
0x00C0 = 0xCB
0x00C1 = 0xE7
0x00C2 = 0xE5
0x00C3 = 0xCC
0x00C4 = 0x80
0x00C5 = 0x81
0x00C6 = 0xAE
0x00C7 = 0x82
0x00C8 = 0xE9
0x00C9 = 0x83
0x00CA = 0xE6
0x00CB = 0xE8
0x00CC = 0xED
0x00CD = 0xEA
0x00CE = 0xEB
0x00CF = 0xEC
0x00D1 = 0x84
0x00D2 = 0xF1
0x00D3 = 0xEE
0x00D4 = 0xEF
0x00D5 = 0xCD
0x00D6 = 0x85
0x00D8 = 0xAF
0x00D9 = 0xF4
0x00DA = 0xF2
0x00DB = 0xF3
0x00DC = 0x86
0x00DF = 0xA7
0x00E0 = 0x88
0x00E1 = 0x87
0x00E2 = 0x89
0x00E3 = 0x8B
0x00E4 = 0x8A
0x00E5 = 0x8C
0x00E6 = 0xBE
0x00E7 = 0x8D
0x00E8 = 0x8F
0x00E9 = 0x8E
0x00EA = 0x90
0x00EB = 0x91
0x00EC = 0x93
0x00ED = 0x92
0x00EE = 0x94
0x00EF = 0x95
0x00F1 = 0x96
0x00F2 = 0x98
0x00F3 = 0x97
0x00F4 = 0x99
0x00F5 = 0x9B
0x00F6 = 0x9A
0x00F7 = 0xD6
0x00F8 = 0xBF
0x00F9 = 0x9D
0x00FA = 0x9C
0x00FB = 0x9E
0x00FC = 0x9F
0x00FF = 0xD8
0x0131 = 0xF5
0x0152 = 0xCE
0x0153 = 0xCF
0x0178 = 0xD9
0x0192 = 0xC4
0x02C6 = 0xF6
0x02C7 = 0xFF
0x02D8 = 0xF9
0x02D9 = 0xFA
0x02DA = 0xFB
0x02DB = 0xFE
0x02DC = 0xF7
0x02DD = 0xFD
0x03A9 = 0xBD
0x03C0 = 0xB9
0x2013 = 0xD0
0x2014 = 0xD1
0x2018 = 0xD4
0x2019 = 0xD5
0x201A = 0xE2
0x201C = 0xD2
0x201D = 0xD3
0x201E = 0xE3
0x2020 = 0xA0
0x2021 = 0xE0
0x2022 = 0xA5
0x2026 = 0xC9
0x2030 = 0xE4
0x2039 = 0xDC
0x203A = 0xDD
0x2044 = 0xDA
0x20AC = 0xDB
0x2122 = 0xAA
0x2202 = 0xB6
0x2206 = 0xC6
0x220F = 0xB8
0x2211 = 0xB7
0x221A = 0xC3
0x221E = 0xB0
0x222B = 0xBA
0x2248 = 0xC5
0x2260 = 0xAD
0x2264 = 0xB2
0x2265 = 0xB3
0x25CA = 0xD7
0xF8FF = 0xF0
0xFB01 = 0xDE
0xFB02 = 0xDF
END_MAP

View File

@ -0,0 +1,284 @@
# $NetBSD: UCS%ROMANIAN.src,v 1.2 2006/04/08 15:47:40 tnozaki Exp $
TYPE ROWCOL
NAME UCS/ROMANIAN
SRC_ZONE 0x0000-0xF8FF
OOB_MODE INVALID
DST_INVALID 0x100
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: ROMANIAN.TXT
#
# Contents: Map (external version) from Mac OS Romanian
# character set to Unicode 3.0 and later.
#
# Copyright: (c) 1995-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c02 2005-Apr-05 Update header comments. Matches internal xml
# <c1.2> and Text Encoding Converter 2.0.
# b3,c1 2002-Dec-19 Update mappings for 0xAF, 0xBF, 0xDE, 0xDF
# to use new composed characters added in
# Unicode 3.0. Update URLs, notes. Matches
# internal utom<b3>.
# b02 1999-Sep-22 Encoding changed for Mac OS 8.5; change
# mapping of 0xDB from CURRENCY SIGN to EURO
# SIGN. Update contact e-mail address. Matches
# internal utom<b2>, ufrm<b2>, and Text
# Encoding Converter version 1.5.
# n05 1998-Feb-05 Minor update to header comments
# n03 1997-Dec-14 Update to match internal utom<n5>, ufrm<n16>:
# Change standard mapping for 0xBD from U+2126
# to its canonical decomposition, U+03A9.
# Change mapping of 0xAF,0xBF,0xDE,0xDF from
# composed S/T WITH CEDILLA to S/T with
# COMBINING COMMA BELOW (to match our
# decomposition mappings).
# n02 1995-Apr-15 First version (after fixing some typos).
# Matches internal ufrm<n4>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Romanian code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Romanian code order.
#
# One of these mappings requires the use of a corporate character.
# See the file "CORPCHAR.TXT" and notes below.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Romanian character set uses the standard control characters at
# 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Romanian:
# -------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported via transcoding to and from
# Unicode.
#
# Mac OS Romanian is used only for Romanian.
#
# The Mac OS Romanian encoding shares the script code smRoman
# (0) with the standard Mac OS Roman encoding. To determine if
# the Romanian encoding is being used, you must also check if the
# system region code is 39, verRomania.
#
# This character set is a variant of standard Mac OS Roman, adding
# upper and lower A breve, S comma below, and T comma below. It
# has 6 code point differences from standard Mac OS Roman.
#
# Before Mac OS 8.5, code point 0xDB was CURRENCY SIGN, and was
# mapped to U+00A4. In Mac OS 8.5 and later versions, code point
# 0xDB is changed to EURO SIGN and maps to U+20AC; the standard
# Apple fonts are updated for Mac OS 8.5 to reflect this. There is
# a "currency sign" variant of the Mac OS Romanian encoding that
# still maps 0xDB to U+00A4; this can be used for older fonts.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# The following corporate zone Unicode character is used in this
# mapping:
#
# 0xF8FF Apple logo
#
# NOTE: The graphic image associated with the Apple logo character
# is not authorized for use without permission of Apple, and
# unauthorized use might constitute trademark infringement.
#
# Details of mapping changes in each version:
# -------------------------------------------
#
# Changes from version b02 to version b03/c01:
#
# - Update the mappings for 0xAF, 0xBF, 0xDE, 0xDF to use new
# composed Unicode characters 0x0218-0x021B added in Unicode 3.0;
# the previous mappings were to the equivalent decomposition
# sequences.
#
# Changes from version n05 to version b02:
#
# - Encoding changed for Mac OS 8.5; change mapping of 0xDB from
# CURRENCY SIGN (U+00A4) to EURO SIGN (U+20AC).
#
# Changes from version n02 to version n03:
#
# - Change mapping of 0xBD from U+2126 to its canonical
# decomposition, U+03A9.
# - Change mapping of 0xAF,0xBF,0xDE,0xDF from composed S or T
# WITH CEDILLA to S or T with COMBINING COMMA BELOW (to match
# our decomposition mappings).
#
##################
0x0000 - 0x007E = 0x00 -
0x00A0 = 0xCA
0x00A1 = 0xC1
0x00A2 = 0xA2
0x00A3 = 0xA3
0x00A5 = 0xB4
0x00A7 = 0xA4
0x00A8 = 0xAC
0x00A9 = 0xA9
0x00AA = 0xBB
0x00AB = 0xC7
0x00AC = 0xC2
0x00AE = 0xA8
0x00AF = 0xF8
0x00B0 = 0xA1
0x00B1 = 0xB1
0x00B4 = 0xAB
0x00B5 = 0xB5
0x00B6 = 0xA6
0x00B7 = 0xE1
0x00B8 = 0xFC
0x00BA = 0xBC
0x00BB = 0xC8
0x00BF = 0xC0
0x00C0 = 0xCB
0x00C1 = 0xE7
0x00C2 = 0xE5
0x00C3 = 0xCC
0x00C4 = 0x80
0x00C5 = 0x81
0x00C7 = 0x82
0x00C8 = 0xE9
0x00C9 = 0x83
0x00CA = 0xE6
0x00CB = 0xE8
0x00CC = 0xED
0x00CD = 0xEA
0x00CE = 0xEB
0x00CF = 0xEC
0x00D1 = 0x84
0x00D2 = 0xF1
0x00D3 = 0xEE
0x00D4 = 0xEF
0x00D5 = 0xCD
0x00D6 = 0x85
0x00D9 = 0xF4
0x00DA = 0xF2
0x00DB = 0xF3
0x00DC = 0x86
0x00DF = 0xA7
0x00E0 = 0x88
0x00E1 = 0x87
0x00E2 = 0x89
0x00E3 = 0x8B
0x00E4 = 0x8A
0x00E5 = 0x8C
0x00E7 = 0x8D
0x00E8 = 0x8F
0x00E9 = 0x8E
0x00EA = 0x90
0x00EB = 0x91
0x00EC = 0x93
0x00ED = 0x92
0x00EE = 0x94
0x00EF = 0x95
0x00F1 = 0x96
0x00F2 = 0x98
0x00F3 = 0x97
0x00F4 = 0x99
0x00F5 = 0x9B
0x00F6 = 0x9A
0x00F7 = 0xD6
0x00F9 = 0x9D
0x00FA = 0x9C
0x00FB = 0x9E
0x00FC = 0x9F
0x00FF = 0xD8
0x0102 = 0xAE
0x0103 = 0xBE
0x0131 = 0xF5
0x0152 = 0xCE
0x0153 = 0xCF
0x0178 = 0xD9
0x0192 = 0xC4
0x0218 = 0xAF
0x0219 = 0xBF
0x021A = 0xDE
0x021B = 0xDF
0x02C6 = 0xF6
0x02C7 = 0xFF
0x02D8 = 0xF9
0x02D9 = 0xFA
0x02DA = 0xFB
0x02DB = 0xFE
0x02DC = 0xF7
0x02DD = 0xFD
0x03A9 = 0xBD
0x03C0 = 0xB9
0x2013 = 0xD0
0x2014 = 0xD1
0x2018 = 0xD4
0x2019 = 0xD5
0x201A = 0xE2
0x201C = 0xD2
0x201D = 0xD3
0x201E = 0xE3
0x2020 = 0xA0
0x2021 = 0xE0
0x2022 = 0xA5
0x2026 = 0xC9
0x2030 = 0xE4
0x2039 = 0xDC
0x203A = 0xDD
0x2044 = 0xDA
0x20AC = 0xDB
0x2122 = 0xAA
0x2202 = 0xB6
0x2206 = 0xC6
0x220F = 0xB8
0x2211 = 0xB7
0x221A = 0xC3
0x221E = 0xB0
0x222B = 0xBA
0x2248 = 0xC5
0x2260 = 0xAD
0x2264 = 0xB2
0x2265 = 0xB3
0x25CA = 0xD7
0xF8FF = 0xF0
END_MAP

View File

@ -0,0 +1,301 @@
# $NetBSD: UCS%THAI.src,v 1.2 2006/04/08 15:47:40 tnozaki Exp $
TYPE ROWCOL
NAME UCS/THAI
SRC_ZONE 0x0000-0x2122
OOB_MODE INVALID
DST_INVALID 0x100
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: THAI.TXT
#
# Contents: Map (external version) from Mac OS Thai
# character set to Unicode 3.2 and later.
#
# Copyright: (c) 1995-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c02 2005-Apr-05 Update header comments. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
# b3,c1 2002-Dec-19 Update mapping for 0xDB to use new Unicode
# 3.2 WORD JOINER instead of ZWNBSP (BOM).
# Update URLs. Matches internal utom<b3>.
# b02 1999-Sep-22 Update contact e-mail address. Matches
# internal utom<b1>, ufrm<b2>, and Text
# Encoding Converter version 1.5.
# n07 1998-Feb-05 Update to match internal utom<n5>, ufrm<n13>
# and Text Encoding Converter version 1.3:
# Use standard Unicodes plus transcoding hints
# instead of single corporate characters; see
# details below. Also update header comments
# to new format.
# n04 1995-Nov-17 First version (after fixing some typos).
# Matches internal ufrm<n6>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Thai code (in hex as 0xNN)
# Column #2 is the corresponding Unicode or Unicode sequence
# (in hex as 0xNNNN or 0xNNNN+0xNNNN).
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Thai code order.
#
# Some of these mappings require the use of corporate characters.
# See the file "CORPCHAR.TXT" and notes below.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Thai character set uses the standard control characters at
# 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Thai:
# ---------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported via transcoding to and from
# Unicode.
#
# Codes 0xA1-0xDA and 0xDF-0xFB are the character set from Thai
# standard TIS 620-2533, except that the following changes are
# made:
# 0xEE is TRADE MARK SIGN (instead of THAI CHARACTER YAMAKKAN)
# 0xFA is REGISTERED SIGN (instead of THAI CHARACTER ANGKHANKHU)
# 0xFB is COPYRIGHT SIGN (instead of THAI CHARACTER KHOMUT)
#
# Codes 0x80-0x82, 0x8D-0x8E, 0x91, 0x9D-0x9E, and 0xDB-0xDE are
# various additional punctuation marks (e.g. curly quotes,
# ellipsis), no-break space, and two special characters "word join"
# and "word break".
#
# Codes 0x83-0x8C, 0x8F, and 0x92-0x9C are for positional variants
# of the upper vowels, tone marks, and other signs at 0xD1,
# 0xD4-0xD7, and 0xE7-0xED. The positional variants would normally
# be considered presentation forms only and not characters. In most
# cases they are not typed directly; they are selected automatically
# at display time by the WorldScript software. However, using the
# Thai-DTP keyboard, the presentation forms can in fact be typed
# directly using dead keys. Thus they must be treated as real
# characters in the Mac OS Thai encoding. They are mapped using
# variant tags; see below.
#
# Several code points are undefined and unused (they cannot be
# typed using any of the Mac OS Thai keyboard layouts): 0x90, 0x9F,
# 0xFC-0xFE. These are not shown in the table below.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# The goals in the Apple mappings provided here are:
# - Ensure roundtrip mapping from every character in the Mac OS Thai
# character set to Unicode and back
# - Use standard Unicode characters as much as possible, to maximize
# interchangeability of the resulting Unicode text. Whenever possible,
# avoid having content carried by private-use characters.
#
# To satisfy both goals, we use private use characters to mark variants
# that are similar to a sequence of one or more standard Unicode
# characters.
#
# Apple has defined a block of 32 corporate characters as "transcoding
# hints." These are used in combination with standard Unicode characters
# to force them to be treated in a special way for mapping to other
# encodings; they have no other effect. Sixteen of these transcoding
# hints are "grouping hints" - they indicate that the next 2-4 Unicode
# characters should be treated as a single entity for transcoding. The
# other sixteen transcoding hints are "variant tags" - they are like
# combining characters, and can follow a standard Unicode (or a sequence
# consisting of a base character and other combining characters) to
# cause it to be treated in a special way for transcoding. These always
# terminate a combining-character sequence.
#
# The transcoding coding hints used in this mapping table are four
# variant tags in the range 0xF873-75. Since these are combined with
# standard Unicode characters, some characters in the Mac OS Thai
# character set map to a sequence of two Unicodes instead of a single
# Unicode character. For example, the Mac OS Thai character at 0x83 is a
# low-left positional variant of THAI CHARACTER MAI EK (the standard
# mapping is for the abstract character at 0xE8). So 0x83 is mapped to
# 0x0E48 (THAI CHARACTER MAI EK) + 0xF875 (a variant tag).
#
# Details of mapping changes in each version:
# -------------------------------------------
#
# Changes from version b02 to version b03/c01:
#
# - Update mapping for 0xDB to use new Unicode 3.2 character U+2060
# WORD JOINER instead of U+FEFF ZERO WIDTH NO-BREAK SPACE (BOM)
#
# Changes from version n04 to version n07:
#
# - Changed mappings of the positional variants to use standard
# Unicodes + transcoding hint, instead of using single corporate
# zone characters. This affected the mappings for the following:
# 0x83-08C, 0x8F, 0x92-0x9C
#
# - Just comment out unused code points in the table, instead
# of mapping them to U+FFFD.
#
##################
0x0000 - 0x007E = 0x00 -
0x00A0 = 0xA0
0x00A9 = 0xFB
0x00AB = 0x80
0x00AE = 0xFA
0x00BB = 0x81
0x0E01 = 0xA1
0x0E02 = 0xA2
0x0E03 = 0xA3
0x0E04 = 0xA4
0x0E05 = 0xA5
0x0E06 = 0xA6
0x0E07 = 0xA7
0x0E08 = 0xA8
0x0E09 = 0xA9
0x0E0A = 0xAA
0x0E0B = 0xAB
0x0E0C = 0xAC
0x0E0D = 0xAD
0x0E0E = 0xAE
0x0E0F = 0xAF
0x0E10 = 0xB0
0x0E11 = 0xB1
0x0E12 = 0xB2
0x0E13 = 0xB3
0x0E14 = 0xB4
0x0E15 = 0xB5
0x0E16 = 0xB6
0x0E17 = 0xB7
0x0E18 = 0xB8
0x0E19 = 0xB9
0x0E1A = 0xBA
0x0E1B = 0xBB
0x0E1C = 0xBC
0x0E1D = 0xBD
0x0E1E = 0xBE
0x0E1F = 0xBF
0x0E20 = 0xC0
0x0E21 = 0xC1
0x0E22 = 0xC2
0x0E23 = 0xC3
0x0E24 = 0xC4
0x0E25 = 0xC5
0x0E26 = 0xC6
0x0E27 = 0xC7
0x0E28 = 0xC8
0x0E29 = 0xC9
0x0E2A = 0xCA
0x0E2B = 0xCB
0x0E2C = 0xCC
0x0E2D = 0xCD
0x0E2E = 0xCE
0x0E2F = 0xCF
0x0E30 = 0xD0
0x0E31 = 0x92
0x0E31 = 0xD1
0x0E32 = 0xD2
0x0E33 = 0xD3
0x0E34 = 0x94
0x0E34 = 0xD4
0x0E35 = 0x95
0x0E35 = 0xD5
0x0E36 = 0x96
0x0E36 = 0xD6
0x0E37 = 0x97
0x0E37 = 0xD7
0x0E38 = 0xD8
0x0E39 = 0xD9
0x0E3A = 0xDA
0x0E3F = 0xDF
0x0E40 = 0xE0
0x0E41 = 0xE1
0x0E42 = 0xE2
0x0E43 = 0xE3
0x0E44 = 0xE4
0x0E45 = 0xE5
0x0E46 = 0xE6
0x0E47 = 0x93
0x0E47 = 0xE7
0x0E48 = 0x83
0x0E48 = 0x88
0x0E48 = 0x98
0x0E48 = 0xE8
0x0E49 = 0x84
0x0E49 = 0x89
0x0E49 = 0x99
0x0E49 = 0xE9
0x0E4A = 0x85
0x0E4A = 0x8A
0x0E4A = 0x9A
0x0E4A = 0xEA
0x0E4B = 0x86
0x0E4B = 0x8B
0x0E4B = 0x9B
0x0E4B = 0xEB
0x0E4C = 0x87
0x0E4C = 0x8C
0x0E4C = 0x9C
0x0E4C = 0xEC
0x0E4D = 0x8F
0x0E4D = 0xED
0x0E4F = 0xEF
0x0E50 = 0xF0
0x0E51 = 0xF1
0x0E52 = 0xF2
0x0E53 = 0xF3
0x0E54 = 0xF4
0x0E55 = 0xF5
0x0E56 = 0xF6
0x0E57 = 0xF7
0x0E58 = 0xF8
0x0E59 = 0xF9
0x200B = 0xDC
0x2013 = 0xDD
0x2014 = 0xDE
0x2018 = 0x9D
0x2019 = 0x9E
0x201C = 0x8D
0x201D = 0x8E
0x2022 = 0x91
0x2026 = 0x82
0x2060 = 0xDB
0x2122 = 0xEE
END_MAP

View File

@ -0,0 +1,260 @@
# $NetBSD: UCS%TURKISH.src,v 1.2 2006/04/08 15:47:40 tnozaki Exp $
TYPE ROWCOL
NAME UCS/TURKISH
SRC_ZONE 0x0000-0xF8FF
OOB_MODE INVALID
DST_INVALID 0x100
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
#=======================================================================
# File name: TURKISH.TXT
#
# Contents: Map (external version) from Mac OS Turkish
# character set to Unicode 2.1 and later.
#
# Copyright: (c) 1995-2002, 2005 by Apple Computer, Inc., all rights
# reserved.
#
# Contact: charsets@apple.com
#
# Changes:
#
# c02 2005-Apr-05 Update header comments. Matches internal xml
# <c1.1> and Text Encoding Converter 2.0.
# b3,c1 2002-Dec-19 Update URLs, notes. Matches internal
# utom<b1>.
# b02 1999-Sep-22 Update contact e-mail address. Matches
# internal utom<b1>, ufrm<b1>, and Text
# Encoding Converter version 1.5.
# n05 1998-Feb-05 Minor update to header comments
# n03 1997-Dec-14 Update to match internal utom<n5>, ufrm<n15>:
# Change standard mapping for 0xBD from U+2126
# to its canonical decomposition, U+03A9.
# n02 1995-Apr-15 First version (after fixing some typos).
# Matches internal ufrm<n4>.
#
# Standard header:
# ----------------
#
# Apple, the Apple logo, and Macintosh are trademarks of Apple
# Computer, Inc., registered in the United States and other countries.
# Unicode is a trademark of Unicode Inc. For the sake of brevity,
# throughout this document, "Macintosh" can be used to refer to
# Macintosh computers and "Unicode" can be used to refer to the
# Unicode standard.
#
# Apple Computer, Inc. ("Apple") makes no warranty or representation,
# either express or implied, with respect to this document and the
# included data, its quality, accuracy, or fitness for a particular
# purpose. In no event will Apple be liable for direct, indirect,
# special, incidental, or consequential damages resulting from any
# defect or inaccuracy in this document or the included data.
#
# These mapping tables and character lists are subject to change.
# The latest tables should be available from the following:
#
# <http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/>
#
# For general information about Mac OS encodings and these mapping
# tables, see the file "README.TXT".
#
# Format:
# -------
#
# Three tab-separated columns;
# '#' begins a comment which continues to the end of the line.
# Column #1 is the Mac OS Turkish code (in hex as 0xNN)
# Column #2 is the corresponding Unicode (in hex as 0xNNNN)
# Column #3 is a comment containing the Unicode name
#
# The entries are in Mac OS Turkish code order.
#
# Two of these mappings requires the use of a corporate character.
# See the file "CORPCHAR.TXT" and notes below.
#
# Control character mappings are not shown in this table, following
# the conventions of the standard UTC mapping tables. However, the
# Mac OS Turkish character set uses the standard control characters at
# 0x00-0x1F and 0x7F.
#
# Notes on Mac OS Turkish:
# ------------------------
#
# This is a legacy Mac OS encoding; in the Mac OS X Carbon and Cocoa
# environments, it is only supported via transcoding to and from
# Unicode.
#
# Mac OS Turkish is used for Turkish.
#
# The Mac OS Turkish encoding shares the script code smRoman
# (0) with the Mac OS Roman encoding. To determine if the Turkish
# encoding is being used, you must also check if the system region
# code is 24, verTurkey.
#
# This character set is a variant of standard Mac OS Roman. It adds
# upper & lower G with breve, upper & lower S with cedilla, upper I
# with dot, and moves the dotless lower i from its position at 0xF5
# in standard Mac OS Roman to a position at 0xDD here (leaving the
# 0xF5 code point undefined in Mac OS Turkish). This gives a total
# of 7 code point differences from standard Mac OS Roman.
#
# Unicode mapping issues and notes:
# ---------------------------------
#
# The following corporate zone Unicode characters are used in this
# mapping:
#
# 0xF8A0 undefined1, used to map the single undefined code point
# in Mac OS Turkish (to obtain roundtrip fidelity for all
# code points).
# 0xF8FF Apple logo
#
# NOTE: The graphic image associated with the Apple logo character
# is not authorized for use without permission of Apple, and
# unauthorized use might constitute trademark infringement.
#
# Details of mapping changes in each version:
# -------------------------------------------
#
# Changes from version n02 to version n03:
#
# - Change mapping of 0xBD from U+2126 to its canonical
# decomposition, U+03A9.
#
##################
0x0000 - 0x007E = 0x00 -
0x00A0 = 0xCA
0x00A1 = 0xC1
0x00A2 = 0xA2
0x00A3 = 0xA3
0x00A5 = 0xB4
0x00A7 = 0xA4
0x00A8 = 0xAC
0x00A9 = 0xA9
0x00AA = 0xBB
0x00AB = 0xC7
0x00AC = 0xC2
0x00AE = 0xA8
0x00AF = 0xF8
0x00B0 = 0xA1
0x00B1 = 0xB1
0x00B4 = 0xAB
0x00B5 = 0xB5
0x00B6 = 0xA6
0x00B7 = 0xE1
0x00B8 = 0xFC
0x00BA = 0xBC
0x00BB = 0xC8
0x00BF = 0xC0
0x00C0 = 0xCB
0x00C1 = 0xE7
0x00C2 = 0xE5
0x00C3 = 0xCC
0x00C4 = 0x80
0x00C5 = 0x81
0x00C6 = 0xAE
0x00C7 = 0x82
0x00C8 = 0xE9
0x00C9 = 0x83
0x00CA = 0xE6
0x00CB = 0xE8
0x00CC = 0xED
0x00CD = 0xEA
0x00CE = 0xEB
0x00CF = 0xEC
0x00D1 = 0x84
0x00D2 = 0xF1
0x00D3 = 0xEE
0x00D4 = 0xEF
0x00D5 = 0xCD
0x00D6 = 0x85
0x00D8 = 0xAF
0x00D9 = 0xF4
0x00DA = 0xF2
0x00DB = 0xF3
0x00DC = 0x86
0x00DF = 0xA7
0x00E0 = 0x88
0x00E1 = 0x87
0x00E2 = 0x89
0x00E3 = 0x8B
0x00E4 = 0x8A
0x00E5 = 0x8C
0x00E6 = 0xBE
0x00E7 = 0x8D
0x00E8 = 0x8F
0x00E9 = 0x8E
0x00EA = 0x90
0x00EB = 0x91
0x00EC = 0x93
0x00ED = 0x92
0x00EE = 0x94
0x00EF = 0x95
0x00F1 = 0x96
0x00F2 = 0x98
0x00F3 = 0x97
0x00F4 = 0x99
0x00F5 = 0x9B
0x00F6 = 0x9A
0x00F7 = 0xD6
0x00F8 = 0xBF
0x00F9 = 0x9D
0x00FA = 0x9C
0x00FB = 0x9E
0x00FC = 0x9F
0x00FF = 0xD8
0x011E = 0xDA
0x011F = 0xDB
0x0130 = 0xDC
0x0131 = 0xDD
0x0152 = 0xCE
0x0153 = 0xCF
0x015E = 0xDE
0x015F = 0xDF
0x0178 = 0xD9
0x0192 = 0xC4
0x02C6 = 0xF6
0x02C7 = 0xFF
0x02D8 = 0xF9
0x02D9 = 0xFA
0x02DA = 0xFB
0x02DB = 0xFE
0x02DC = 0xF7
0x02DD = 0xFD
0x03A9 = 0xBD
0x03C0 = 0xB9
0x2013 = 0xD0
0x2014 = 0xD1
0x2018 = 0xD4
0x2019 = 0xD5
0x201A = 0xE2
0x201C = 0xD2
0x201D = 0xD3
0x201E = 0xE3
0x2020 = 0xA0
0x2021 = 0xE0
0x2022 = 0xA5
0x2026 = 0xC9
0x2030 = 0xE4
0x2122 = 0xAA
0x2202 = 0xB6
0x2206 = 0xC6
0x220F = 0xB8
0x2211 = 0xB7
0x221A = 0xC3
0x221E = 0xB0
0x222B = 0xBA
0x2248 = 0xC5
0x2260 = 0xAD
0x2264 = 0xB2
0x2265 = 0xB3
0x25CA = 0xD7
0xF8A0 = 0xF5
0xF8FF = 0xF0
END_MAP

View File

@ -0,0 +1,119 @@
# $NetBSD: ARMSCII-7%UCS.src,v 1.1 2006/04/01 04:13:21 tnozaki Exp $
TYPE ROWCOL
NAME ARMSCII-7/UCS
SRC_ZONE 0x00-0x7F
OOB_MODE ILSEQ
DST_ILSEQ 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# this data delived from:
#
# ARMENIAN CHARACTER SETS IMPLEMENTATION GUIDE
# Document version 006.en.html
# http://www.freenet.am/armscii/armcs-006.html
#
# Name: armscii-7
# Source: Armenian State Standard AST 34.005
# Basic 7-bit coded character set
# Alias: AST_34.005
#
0x00 - 0x20 = 0x0000 -
0x21 = 0xE000 # ARMENIAN ETERNITY SIGN, 0x0530? 0x2741?
0x22 = 0x0587 # 0x00A7?
0x23 = 0x0589
0x24 = 0x0029
0x25 = 0x0028
0x26 = 0x00BB
0x27 = 0x00AB
0x28 = 0x2014
0x29 = 0x002E
0x2A = 0x055D
0x2B = 0x002C
0x2C = 0x002D
0x2D = 0x058A # 0x055F?
0x2E = 0x2026
0x2F = 0x055C
0x30 = 0x055B
0x31 = 0x055E
0x32 = 0x0531
0x33 = 0x0561
0x34 = 0x0532
0x35 = 0x0562
0x36 = 0x0533
0x37 = 0x0563
0x38 = 0x0534
0x39 = 0x0564
0x3A = 0x0535
0x3B = 0x0565
0x3C = 0x0536
0x3D = 0x0566
0x3E = 0x0537
0x3F = 0x0567
0x40 = 0x0538
0x41 = 0x0568
0x42 = 0x0539
0x43 = 0x0569
0x44 = 0x053A
0x45 = 0x056A
0x46 = 0x053B
0x47 = 0x056B
0x48 = 0x053C
0x49 = 0x056C
0x4A = 0x053D
0x4B = 0x056D
0x4C = 0x053E
0x4D = 0x056E
0x4E = 0x053F
0x4F = 0x056F
0x50 = 0x0540
0x51 = 0x0570
0x52 = 0x0541
0x53 = 0x0571
0x54 = 0x0542
0x55 = 0x0572
0x56 = 0x0543
0x57 = 0x0573
0x58 = 0x0544
0x59 = 0x0574
0x5A = 0x0545
0x5B = 0x0575
0x5C = 0x0546
0x5D = 0x0576
0x5E = 0x0547
0x5F = 0x0577
0x60 = 0x0548
0x61 = 0x0578
0x62 = 0x0549
0x63 = 0x0579
0x64 = 0x054A
0x65 = 0x057A
0x66 = 0x054B
0x67 = 0x057B
0x68 = 0x054C
0x69 = 0x057C
0x6A = 0x054D
0x6B = 0x057D
0x6C = 0x054E
0x6D = 0x057E
0x6E = 0x054F
0x6F = 0x057F
0x70 = 0x0550
0x71 = 0x0580
0x72 = 0x0551
0x73 = 0x0581
0x74 = 0x0552
0x75 = 0x0582
0x76 = 0x0553
0x77 = 0x0583
0x78 = 0x0554
0x79 = 0x0584
0x7A = 0x0555
0x7B = 0x0585
0x7C = 0x0556
0x7D = 0x0586
0x7E = 0x055A # 0x2019?
0x7F = 0x0027
END_MAP

View File

@ -0,0 +1,119 @@
# $NetBSD: ARMSCII-8%UCS.src,v 1.1 2006/04/01 04:13:21 tnozaki Exp $
TYPE ROWCOL
NAME ARMSCII-8/UCS
SRC_ZONE 0x00-0xFF
OOB_MODE ILSEQ
DST_ILSEQ 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# this data delived from:
#
# ARMENIAN CHARACTER SETS IMPLEMENTATION GUIDE
# Document version 006.en.html
# http://www.freenet.am/armscii/armcs-006.html
#
# Name: armscii-8
# Source: Armenian State Standard AST 34.002
# Basic 8-bit coded character set
# Alias: AST_34.002
#
0x00 - 0xA0 = 0x0000 -
0xA1 = 0xE000 # ARMENIAN ETERNITY SIGN, 0x0530? 0x2741?
0xA2 = 0x0587 # 0x00A7?
0xA3 = 0x0589
0xA4 = 0x0029
0xA5 = 0x0028
0xA6 = 0x00BB
0xA7 = 0x00AB
0xA8 = 0x2014
0xA9 = 0x002E
0xAA = 0x055D
0xAB = 0x002C
0xAC = 0x002D
0xAD = 0x058A # 0x055F
0xAE = 0x2026
0xAF = 0x055C
0xB0 = 0x055B
0xB1 = 0x055E
0xB2 = 0x0531
0xB3 = 0x0561
0xB4 = 0x0532
0xB5 = 0x0562
0xB6 = 0x0533
0xB7 = 0x0563
0xB8 = 0x0534
0xB9 = 0x0564
0xBA = 0x0535
0xBB = 0x0565
0xBC = 0x0536
0xBD = 0x0566
0xBE = 0x0537
0xBF = 0x0567
0xC0 = 0x0538
0xC1 = 0x0568
0xC2 = 0x0539
0xC3 = 0x0569
0xC4 = 0x053A
0xC5 = 0x056A
0xC6 = 0x053B
0xC7 = 0x056B
0xC8 = 0x053C
0xC9 = 0x056C
0xCA = 0x053D
0xCB = 0x056D
0xCC = 0x053E
0xCD = 0x056E
0xCE = 0x053F
0xCF = 0x056F
0xD0 = 0x0540
0xD1 = 0x0570
0xD2 = 0x0541
0xD3 = 0x0571
0xD4 = 0x0542
0xD5 = 0x0572
0xD6 = 0x0543
0xD7 = 0x0573
0xD8 = 0x0544
0xD9 = 0x0574
0xDA = 0x0545
0xDB = 0x0575
0xDC = 0x0546
0xDD = 0x0576
0xDE = 0x0547
0xDF = 0x0577
0xE0 = 0x0548
0xE1 = 0x0578
0xE2 = 0x0549
0xE3 = 0x0579
0xE4 = 0x054A
0xE5 = 0x057A
0xE6 = 0x054B
0xE7 = 0x057B
0xE8 = 0x054C
0xE9 = 0x057C
0xEA = 0x054D
0xEB = 0x057D
0xEC = 0x054E
0xED = 0x057E
0xEE = 0x054F
0xEF = 0x057F
0xF0 = 0x0550
0xF1 = 0x0580
0xF2 = 0x0551
0xF3 = 0x0581
0xF4 = 0x0552
0xF5 = 0x0582
0xF6 = 0x0553
0xF7 = 0x0583
0xF8 = 0x0554
0xF9 = 0x0584
0xFA = 0x0555
0xFB = 0x0585
0xFC = 0x0556
0xFD = 0x0586
0xFE = 0x055A # 0x2019?
0xFF = 0x0027
END_MAP

View File

@ -0,0 +1,121 @@
# $NetBSD: ARMSCII-8A%UCS.src,v 1.1 2006/04/01 04:13:21 tnozaki Exp $
TYPE ROWCOL
NAME ARMSCII-8A/UCS
SRC_ZONE 0x00-0xFF
OOB_MODE ILSEQ
DST_ILSEQ 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# this data delived from:
#
# ARMENIAN CHARACTER SETS IMPLEMENTATION GUIDE
# Document version 006.en.html
# http://www.freenet.am/armscii/armcs-006.html
#
# Name: armscii-8a
# Source: Armenian State Standard AST 34.002 Alternative
# Alternative 8-bit coded character set
# Alias: AST_34.002_A
#
0x00 - 0x14 = 0x0000 -
0x15 = 0x0587 # 0x00A7?
0x16 - 0x26 = 0x0016 -
0x27 = 0x055B
0x28 - 0x2C = 0x0028 -
0x2D = 0x2014
0x2E - 0x39 = 0x002E -
0x3A = 0x0589
0x3B - 0x5E = 0x003B -
0x5F = 0x002D
0x60 = 0x055D
0x61 - 0x7D = 0x0061 -
0x7E = 0x055C
0x7F = 0x7F
0x80 = 0x0531
0x81 = 0x0561
0x82 = 0x0532
0x83 = 0x0562
0x84 = 0x0533
0x85 = 0x0563
0x86 = 0x0534
0x87 = 0x0564
0x88 = 0x0535
0x89 = 0x0565
0x8A = 0x0536
0x8B = 0x0566
0x8C = 0x0537
0x8D = 0x0567
0x8E = 0x0538
0x8F = 0x0568
0x90 = 0x0539
0x91 = 0x0569
0x92 = 0x053A
0x93 = 0x056A
0x94 = 0x053B
0x95 = 0x056B
0x96 = 0x053C
0x97 = 0x056C
0x98 = 0x053D
0x99 = 0x056D
0x9A = 0x053E
0x9B = 0x056E
0x9C = 0x053F
0x9D = 0x056F
0x9E = 0x0540
0x9F = 0x0570
0xA0 = 0x0541
0xA1 = 0x0571
0xA2 = 0x0542
0xA3 = 0x0572
0xA4 = 0x0543
0xA5 = 0x0573
0xA6 = 0x0544
0xA7 = 0x0574
0xA8 = 0x0545
0xA9 = 0x0575
0xAA = 0x0546
0xAB = 0x0576
0xAC = 0x0547
0xAD = 0x0577
0xAE = 0x00AB
0xAF = 0x00BB
0xDC = 0xE000 # ARMENIAN ETERNITY SIGN, 0x0530?, 0x2741?
0xDD = 0x058A # 0x055F?
0xDE = 0x2026
0xDF = 0x055E
0xE0 = 0x0548
0xE1 = 0x0578
0xE2 = 0x0549
0xE3 = 0x0579
0xE4 = 0x054A
0xE5 = 0x057A
0xE6 = 0x054B
0xE7 = 0x057B
0xE8 = 0x054C
0xE9 = 0x057C
0xEA = 0x054D
0xEB = 0x057D
0xEC = 0x054E
0xED = 0x057E
0xEE = 0x054F
0xEF = 0x057F
0xF0 = 0x0550
0xF1 = 0x0580
0xF2 = 0x0551
0xF3 = 0x0581
0xF4 = 0x0552
0xF5 = 0x0582
0xF6 = 0x0553
0xF7 = 0x0583
0xF8 = 0x0554
0xF9 = 0x0584
0xFA = 0x0555
0xFB = 0x0585
0xFC = 0x0556
0xFD = 0x0586
0xFE = 0x055A # 0x2019?
0xFF = 0x0027
END_MAP

View File

@ -0,0 +1,5 @@
# $NetBSD: ARMSCII.part,v 1.1 2006/04/01 04:13:21 tnozaki Exp $
7
8
8A

View File

@ -0,0 +1,45 @@
# $NetBSD: Makefile.inc,v 1.2 2008/10/25 22:35:36 apb Exp $
.PATH: ${.CURDIR}/AST
SRCS_mapper.dir+= mapper.dir.AST
SRCS_charset.pivot+= charset.pivot.AST
CLEANFILES+= mapper.dir.AST charset.pivot.AST
PART_ARMSCII!= ${TOOL_SED} '/^\#/d;/^$$/d;' ${.CURDIR}/AST/ARMSCII.part
.for i in ${PART_ARMSCII}
.if exists(${.CURDIR}/AST/ARMSCII-$i%UCS.src)
FILES+= ARMSCII-$i%UCS.mps
CLEANFILES+= ARMSCII-$i%UCS.mps
FILESDIR_ARMSCII-$i%UCS.mps= ${BINDIR}/AST
.endif
.if exists(${.CURDIR}/AST/UCS%ARMSCII-$i.src)
FILES+= UCS%ARMSCII-$i.mps
CLEANFILES+= UCS%ARMSCII-$i.mps
FILESDIR_UCS%ARMSCII-$i.mps= ${BINDIR}/AST
.endif
.endfor
mapper.dir.AST: ${.CURDIR}/AST/ARMSCII.part
${_MKTARGET_CREATE}
( \
echo "# AST"; \
for i in ${PART_ARMSCII}; do \
printf "%-32s%-32s%s\n" ARMSCII-$$i/UCS mapper_std \
AST/ARMSCII-$$i%UCS.mps; \
printf "%-32s%-32s%s\n" UCS/ARMSCII-$$i mapper_std \
AST/UCS%ARMSCII-$$i.mps; \
done; \
echo; \
) > ${.TARGET}
charset.pivot.AST: ${.CURDIR}/AST/ARMSCII.part
${_MKTARGET_CREATE}
( \
echo "# AST"; \
for i in ${PART_ARMSCII}; do \
printf "%-32s%-32s%d\n" ARMSCII-$$i UCS 1; \
printf "%-32s%-32s%d\n" UCS ARMSCII-$$i 1; \
done; \
echo; \
) > ${.TARGET}

View File

@ -0,0 +1,119 @@
# $NetBSD: UCS%ARMSCII-7.src,v 1.2 2006/04/08 15:47:40 tnozaki Exp $
TYPE ROWCOL
NAME UCS/ARMSCII-7
SRC_ZONE 0x0000-0xE000
OOB_MODE INVALID
DST_INVALID 0xFE
DST_UNIT_BITS 8
BEGIN_MAP
#
# this data delived from:
#
# ARMENIAN CHARACTER SETS IMPLEMENTATION GUIDE
# Document version 006.en.html
# http://www.freenet.am/armscii/armcs-006.html
#
# Name: armscii-7
# Source: Armenian State Standard AST 34.005
# Basic 7-bit coded character set
# Alias: AST_34.005
#
0x0000 - 0x0020 = 0x00 -
0x0027 = 0x7F
0x0028 = 0x25
0x0029 = 0x24
0x002C = 0x2B
0x002D = 0x2C
0x002E = 0x29
0x00AB = 0x27
0x00BB = 0x26
0x0531 = 0x32
0x0532 = 0x34
0x0533 = 0x36
0x0534 = 0x38
0x0535 = 0x3A
0x0536 = 0x3C
0x0537 = 0x3E
0x0538 = 0x40
0x0539 = 0x42
0x053A = 0x44
0x053B = 0x46
0x053C = 0x48
0x053D = 0x4A
0x053E = 0x4C
0x053F = 0x4E
0x0540 = 0x50
0x0541 = 0x52
0x0542 = 0x54
0x0543 = 0x56
0x0544 = 0x58
0x0545 = 0x5A
0x0546 = 0x5C
0x0547 = 0x5E
0x0548 = 0x60
0x0549 = 0x62
0x054A = 0x64
0x054B = 0x66
0x054C = 0x68
0x054D = 0x6A
0x054E = 0x6C
0x054F = 0x6E
0x0550 = 0x70
0x0551 = 0x72
0x0552 = 0x74
0x0553 = 0x76
0x0554 = 0x78
0x0555 = 0x7A
0x0556 = 0x7C
0x055A = 0x7E # 0x2019?
0x055B = 0x30
0x055C = 0x2F
0x055D = 0x2A
0x055E = 0x31
0x0561 = 0x33
0x0562 = 0x35
0x0563 = 0x37
0x0564 = 0x39
0x0565 = 0x3B
0x0566 = 0x3D
0x0567 = 0x3F
0x0568 = 0x41
0x0569 = 0x43
0x056A = 0x45
0x056B = 0x47
0x056C = 0x49
0x056D = 0x4B
0x056E = 0x4D
0x056F = 0x4F
0x0570 = 0x51
0x0571 = 0x53
0x0572 = 0x55
0x0573 = 0x57
0x0574 = 0x59
0x0575 = 0x5B
0x0576 = 0x5D
0x0577 = 0x5F
0x0578 = 0x61
0x0579 = 0x63
0x057A = 0x65
0x057B = 0x67
0x057C = 0x69
0x057D = 0x6B
0x057E = 0x6D
0x057F = 0x6F
0x0580 = 0x71
0x0581 = 0x73
0x0582 = 0x75
0x0583 = 0x77
0x0584 = 0x79
0x0585 = 0x7B
0x0586 = 0x7D
0x0587 = 0x22 # 0x00A7?
0x0589 = 0x23
0x058A = 0x2D # 0x055F?
0x2014 = 0x28
0x2026 = 0x2E
0xE000 = 0x21 # ARMENIAN ETERNITY SIGN, 0x530? 0x2741?
END_MAP

View File

@ -0,0 +1,119 @@
# $NetBSD: UCS%ARMSCII-8.src,v 1.2 2006/04/08 15:47:40 tnozaki Exp $
TYPE ROWCOL
NAME UCS/ARMSCII-8
SRC_ZONE 0x0000-0xE000
OOB_MODE INVALID
DST_INVALID 0x100
DST_UNIT_BITS 16
BEGIN_MAP
#
# this data delived from:
#
# ARMENIAN CHARACTER SETS IMPLEMENTATION GUIDE
# Document version 006.en.html
# http://www.freenet.am/armscii/armcs-006.html
#
# Name: armscii-8
# Source: Armenian State Standard AST 34.002
# Basic 8-bit coded character set
# Alias: AST_34.002
#
0x0000 - 0x00A0 = 0x00 -
#0x0027 = 0xFF
#0x0028 = 0xA5
#0x0029 = 0xA4
#0x002C = 0xAB
#0x002D = 0xAC
#0x002E = 0xA9
0x00AB = 0xA7
0x00BB = 0xA6
0x0531 = 0xB2
0x0532 = 0xB4
0x0533 = 0xB6
0x0534 = 0xB8
0x0535 = 0xBA
0x0536 = 0xBC
0x0537 = 0xBE
0x0538 = 0xC0
0x0539 = 0xC2
0x053A = 0xC4
0x053B = 0xC6
0x053C = 0xC8
0x053D = 0xCA
0x053E = 0xCC
0x053F = 0xCE
0x0540 = 0xD0
0x0541 = 0xD2
0x0542 = 0xD4
0x0543 = 0xD6
0x0544 = 0xD8
0x0545 = 0xDA
0x0546 = 0xDC
0x0547 = 0xDE
0x0548 = 0xE0
0x0549 = 0xE2
0x054A = 0xE4
0x054B = 0xE6
0x054C = 0xE8
0x054D = 0xEA
0x054E = 0xEC
0x054F = 0xEE
0x0550 = 0xF0
0x0551 = 0xF2
0x0552 = 0xF4
0x0553 = 0xF6
0x0554 = 0xF8
0x0555 = 0xFA
0x0556 = 0xFC
0x055A = 0xFE # 0x2019?
0x055B = 0xB0
0x055C = 0xAF
0x055D = 0xAA
0x055E = 0xB1
0x0561 = 0xB3
0x0562 = 0xB5
0x0563 = 0xB7
0x0564 = 0xB9
0x0565 = 0xBB
0x0566 = 0xBD
0x0567 = 0xBF
0x0568 = 0xC1
0x0569 = 0xC3
0x056A = 0xC5
0x056B = 0xC7
0x056C = 0xC9
0x056D = 0xCB
0x056E = 0xCD
0x056F = 0xCF
0x0570 = 0xD1
0x0571 = 0xD3
0x0572 = 0xD5
0x0573 = 0xD7
0x0574 = 0xD9
0x0575 = 0xDB
0x0576 = 0xDD
0x0577 = 0xDF
0x0578 = 0xE1
0x0579 = 0xE3
0x057A = 0xE5
0x057B = 0xE7
0x057C = 0xE9
0x057D = 0xEB
0x057E = 0xED
0x057F = 0xEF
0x0580 = 0xF1
0x0581 = 0xF3
0x0582 = 0xF5
0x0583 = 0xF7
0x0584 = 0xF9
0x0585 = 0xFB
0x0586 = 0xFD
0x0587 = 0xA2 # 0x00A7?
0x0589 = 0xA3
0x058A = 0xAD # 0x055F?
0x2014 = 0xA8
0x2026 = 0xAE
0xE000 = 0xA1 # ARMENIAN ETERNITY SIGN, 0x0530? 0x2741?
END_MAP

View File

@ -0,0 +1,121 @@
# $NetBSD: UCS%ARMSCII-8A.src,v 1.2 2006/04/08 15:47:40 tnozaki Exp $
TYPE ROWCOL
NAME UCS/ARMSCII-8A
SRC_ZONE 0x0000-0xE000
OOB_MODE INVALID
DST_INVALID 0x100
DST_UNIT_BITS 16
BEGIN_MAP
#
# this data delived from:
#
# ARMENIAN CHARACTER SETS IMPLEMENTATION GUIDE
# Document version 006.en.html
# http://www.freenet.am/armscii/armcs-006.html
#
# Name: armscii-8a
# Source: Armenian State Standard AST 34.002 Alternative
# Alternative 8-bit coded character set
# Alias: AST_34.002_A
#
0x0000 - 0x0014 = 0x00 -
0x0016 - 0x0026 = 0x16 -
0x0027 = 0xFF
0x0028 - 0x002C = 0x28 -
0x002D = 0x5F
0x002E - 0x0039 = 0x2E -
0x003B - 0x005E = 0x3B -
0x0061 - 0x007D = 0x61 -
0x007F = 0x7F
0x00AB = 0xAE
0x00BB = 0xAF
0x0531 = 0x80
0x0532 = 0x82
0x0533 = 0x84
0x0534 = 0x86
0x0535 = 0x88
0x0536 = 0x8A
0x0537 = 0x8C
0x0538 = 0x8E
0x0539 = 0x90
0x053A = 0x92
0x053B = 0x94
0x053C = 0x96
0x053D = 0x98
0x053E = 0x9A
0x053F = 0x9C
0x0540 = 0x9E
0x0541 = 0xA0
0x0542 = 0xA2
0x0543 = 0xA4
0x0544 = 0xA6
0x0545 = 0xA8
0x0546 = 0xAA
0x0547 = 0xAC
0x0548 = 0xE0
0x0549 = 0xE2
0x054A = 0xE4
0x054B = 0xE6
0x054C = 0xE8
0x054D = 0xEA
0x054E = 0xEC
0x054F = 0xEE
0x0550 = 0xF0
0x0551 = 0xF2
0x0552 = 0xF4
0x0553 = 0xF6
0x0554 = 0xF8
0x0555 = 0xFA
0x0556 = 0xFC
0x055A = 0xFE # 0x2019
0x055B = 0x27
0x055C = 0x7E
0x055D = 0x60
0x055E = 0xDF
0x0561 = 0x81
0x0562 = 0x83
0x0563 = 0x85
0x0564 = 0x87
0x0565 = 0x89
0x0566 = 0x8B
0x0567 = 0x8D
0x0568 = 0x8F
0x0569 = 0x91
0x056A = 0x93
0x056B = 0x95
0x056C = 0x97
0x056D = 0x99
0x056E = 0x9B
0x056F = 0x9D
0x0570 = 0x9F
0x0571 = 0xA1
0x0572 = 0xA3
0x0573 = 0xA5
0x0574 = 0xA7
0x0575 = 0xA9
0x0576 = 0xAB
0x0577 = 0xAD
0x0578 = 0xE1
0x0579 = 0xE3
0x057A = 0xE5
0x057B = 0xE7
0x057C = 0xE9
0x057D = 0xEB
0x057E = 0xED
0x057F = 0xEF
0x0580 = 0xF1
0x0581 = 0xF3
0x0582 = 0xF5
0x0583 = 0xF7
0x0584 = 0xF9
0x0585 = 0xFB
0x0586 = 0xFD
0x0587 = 0x15 # 0x00A7?
0x0589 = 0x3A
0x058A = 0xDD # 0x055F?
0x2014 = 0x2D
0x2026 = 0xDE
0xE000 = 0xDC # ARMENIAN ETERNITY SIGN, 0x0530? 0x2741?
END_MAP

File diff suppressed because it is too large Load Diff

View File

@ -0,0 +1,65 @@
# $NetBSD: Big5EXT@2003%UCS.src,v 1.1 2006/06/19 17:28:25 tnozaki Exp $
TYPE ROWCOL
NAME "Big5EXT:2003/UCS"
SRC_ZONE 0xA3-0xC8 / 0x40-0xFE / 8
OOB_MODE INVALID
DST_INVALID 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by
# http://wakaba-web.hp.infoseek.co.jp/table/big5-eten.txt
# Original notice:
#
## Big5-ETen vs Unicode mapping table
##
## Date: 24 Feb 2002 19:01:00 +0900
## License: Public Domain.
##
## Big5 Unicode UnicodeAlternate UnicodeName
0xA3C0 - 0xA3E0 = 0x2400 -
0xA3E1 = 0x20AC
0xC8D4 = 0x309B
0xC8D5 = 0x309C
0xC8D6 = 0x2E80
0xC8D7 = 0x2E84
0xC8D8 = 0x2E86
0xC8D9 = 0x2E87
0xC8DA = 0x2E88
0xC8DB = 0x2E8A
0xC8DC = 0x2E8C
0xC8DD = 0x2E8D
0xC8DE = 0x2E95
0xC8DF = 0x2E9C
0xC8E0 = 0x2E9D
0xC8E1 = 0x2EA5
0xC8E2 = 0x2EA7
0xC8E3 = 0x2EAA
0xC8E4 = 0x2EAC
0xC8E5 = 0x2EAE
0xC8E6 = 0x2EB6
0xC8E7 = 0x2EBC
0xC8E8 = 0x2EBE
0xC8E9 = 0x2EC6
0xC8EA = 0x2ECA
0xC8EB = 0x2ECC
0xC8EC = 0x2ECD
0xC8ED = 0x2ECF
0xC8EE = 0x2ED6
0xC8EF = 0x2ED7
0xC8F0 = 0x2EDE
0xC8F1 = 0x2EE3
0xC8F5 = 0x0283
0xC8F6 = 0x0250
0xC8F7 = 0x025B
0xC8F8 = 0x0254
0xC8F9 = 0x0275
0xC8FA = 0x0153
0xC8FB = 0x00F8
0xC8FC = 0x014B
0xC8FD = 0x028A
0xC8FE = 0x026A
END_MAP

File diff suppressed because it is too large Load Diff

View File

@ -0,0 +1,466 @@
# $NetBSD: Big5EXT@IBM%UCS.src,v 1.1 2006/06/19 17:28:25 tnozaki Exp $
TYPE ROWCOL
NAME "Big5EXT:IBM/UCS"
SRC_ZONE 0xA3-0xF9 / 0x40-0xFE / 8
OOB_MODE INVALID
DST_INVALID 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
# Name: BIG5 to Unicode table (complete)
# Unicode version: 1.1
# Table version: 0.0d3
# Table format: Format A
# Date: 11 February 1994
#
# Copyright (c) 1991-1994 Unicode, Inc. All Rights reserved.
#
# This file is provided as-is by Unicode, Inc. (The Unicode Consortium).
# No claims are made as to fitness for any particular purpose. No
# warranties of any kind are expressed or implied. The recipient
# agrees to determine applicability of information provided. If this
# file has been provided on magnetic media by Unicode, Inc., the sole
# remedy for any claim will be exchange of defective media within 90
# days of receipt.
#
# Recipient is granted the right to make copies in any form for
# internal distribution and to freely use the information supplied
# in the creation of products supporting Unicode. Unicode, Inc.
# specifically excludes the right to re-distribute this file directly
# to third parties or other organizations whether for profit or not.
#
# General notes:
#
#
# This table contains one set of mappings from BIG5 into Unicode.
# Note that these data are *possible* mappings only and may not be the
# same as those used by actual products, nor may they be the best suited
# for all uses. For more information on the mappings between various code
# pages incorporating the repertoire of BIG5 and Unicode, consult the
# VENDORS mapping data. Normative information on the mapping between
# BIG5 and Unicode may be found in the Unihan.txt file in the
# latest Unicode Character Database.
#
# If you have carefully considered the fact that the mappings in
# this table are only one possible set of mappings between BIG5 and
# Unicode and have no normative status, but still feel that you
# have located an error in the table that requires fixing, you may
# report any such error to errata@unicode.org.
#
# WARNING! It is currently impossible to provide round-trip compatibility
# between BIG5 and Unicode.
#
# A number of characters are not currently mapped because
# of conflicts with other mappings. They are as follows:
#
# BIG5 Description Comments
#
# 0xA15A SPACING UNDERSCORE duplicates A1C4
# 0xA1C3 SPACING HEAVY OVERSCORE not in Unicode
# 0xA1C5 SPACING HEAVY UNDERSCORE not in Unicode
# 0xA1FE LT DIAG UP RIGHT TO LOW LEFT duplicates A2AC
# 0xA240 LT DIAG UP LEFT TO LOW RIGHT duplicates A2AD
# 0xA2CC HANGZHOU NUMERAL TEN conflicts with A451 mapping
# 0xA2CE HANGZHOU NUMERAL THIRTY conflicts with A4CA mapping
#
# We currently map all of these characters to U+FFFD REPLACEMENT CHARACTER.
# It is also possible to map these characters to their duplicates, or to
# the user zone.
#
# Notes:
#
# 1. In addition to the above, there is some uncertainty about the
# mappings in the range C6A1 - C8FE, and F9DD - F9FE. The ETEN
# version of BIG5 organizes the former range differently, and adds
# additional characters in the latter range. The correct mappings
# these ranges need to be determined.
#
# 2. There is an uncertainty in the mapping of the Big Five character
# 0xA3BC. This character occurs within the Big Five block of tone marks
# for bopomofo and is intended to be the tone mark for the first tone in
# Mandarin Chinese. We have selected the mapping U+02C9 MODIFIER LETTER
# MACRON (Mandarin Chinese first tone) to reflect this semantic.
# However, because bopomofo uses the absense of a tone mark to indicate
# the first Mandarin tone, most implementations of Big Five represent
# this character with a blank space, and so a mapping such as U+2003 EM
# SPACE might be preferred.
#
# Format: Three tab-separated columns
# Column #1 is the BIG5 code (in hex as 0xXXXX)
# Column #2 is the Unicode (in hex as 0xXXXX)
# Column #3 is the Unicode name (follows a comment sign, '#')
# The official names for Unicode characters U+4E00
# to U+9FA5, inclusive, is "CJK UNIFIED IDEOGRAPH-XXXX",
# where XXXX is the code point. Including all these
# names in this file increases its size substantially
# and needlessly. The token "<CJK>" is used for the
# name of these characters. If necessary, it can be
# expanded algorithmically by a parser or editor.
#
# The entries are in BIG5 order
#
#
0xA3C0 - 0xA3E0 = 0x2400 -
0xC6A1 = 0x2460
0xC6A2 = 0x2461
0xC6A3 = 0x2462
0xC6A4 = 0x2463
0xC6A5 = 0x2464
0xC6A6 = 0x2465
0xC6A7 = 0x2466
0xC6A8 = 0x2467
0xC6A9 = 0x2468
0xC6AA = 0x2469
0xC6AB = 0x2474
0xC6AC = 0x2475
0xC6AD = 0x2476
0xC6AE = 0x2477
0xC6AF = 0x2478
0xC6B0 = 0x2479
0xC6B1 = 0x247A
0xC6B2 = 0x247B
0xC6B3 = 0x247C
0xC6B4 = 0x247D
0xC6B5 = 0x2170
0xC6B6 = 0x2171
0xC6B7 = 0x2172
0xC6B8 = 0x2173
0xC6B9 = 0x2174
0xC6BA = 0x2175
0xC6BB = 0x2176
0xC6BC = 0x2177
0xC6BD = 0x2178
0xC6BE = 0x2179
0xC6BF = 0x4E36
0xC6C0 = 0x4E3F
0xC6C1 = 0x4E85
0xC6C2 = 0x4EA0
0xC6C3 = 0x5182
0xC6C4 = 0x5196
0xC6C5 = 0x51AB
0xC6C6 = 0x52F9
0xC6C7 = 0x5338
0xC6C8 = 0x5369
0xC6C9 = 0x53B6
0xC6CA = 0x590A
0xC6CB = 0x5B80
0xC6CC = 0x5DDB
0xC6CD = 0x5E7A
0xC6CE = 0x5E7F
0xC6CF = 0x5EF4
0xC6D0 = 0x5F50
0xC6D1 = 0x5F61
0xC6D2 = 0x6534
0xC6D3 = 0x65E0
0xC6D4 = 0x7592
0xC6D5 = 0x7676
0xC6D6 = 0x8FB5
0xC6D7 = 0x96B6
0xC6D8 = 0x00A8
0xC6D9 = 0xFF3E
0xC6DA = 0x30FD
0xC6DB = 0x30FE
0xC6DC = 0x309D
0xC6DD = 0x309E
0xC6DE = 0x02BA
0xC6DF = 0xF83E
0xC6E0 = 0x3005
0xC6E1 = 0x3006
0xC6E2 = 0x3007
0xC6E3 = 0x30FC
0xC6E4 = 0xFF3B
0xC6E5 = 0xFF3D
0xC6E6 = 0x273D
0xC6E7 = 0x3041
0xC6E8 = 0x3042
0xC6E9 = 0x3043
0xC6EA = 0x3044
0xC6EB = 0x3045
0xC6EC = 0x3046
0xC6ED = 0x3047
0xC6EE = 0x3048
0xC6EF = 0x3049
0xC6F0 = 0x304A
0xC6F1 = 0x304B
0xC6F2 = 0x304C
0xC6F3 = 0x304D
0xC6F4 = 0x304E
0xC6F5 = 0x304F
0xC6F6 = 0x3050
0xC6F7 = 0x3051
0xC6F8 = 0x3052
0xC6F9 = 0x3053
0xC6FA = 0x3054
0xC6FB = 0x3055
0xC6FC = 0x3056
0xC6FD = 0x3057
0xC6FE = 0x3058
0xC740 = 0x3059
0xC741 = 0x305A
0xC742 = 0x305B
0xC743 = 0x305C
0xC744 = 0x305D
0xC745 = 0x305E
0xC746 = 0x305F
0xC747 = 0x3060
0xC748 = 0x3061
0xC749 = 0x3062
0xC74A = 0x3063
0xC74B = 0x3064
0xC74C = 0x3065
0xC74D = 0x3066
0xC74E = 0x3067
0xC74F = 0x3068
0xC750 = 0x3069
0xC751 = 0x306A
0xC752 = 0x306B
0xC753 = 0x306C
0xC754 = 0x306D
0xC755 = 0x306E
0xC756 = 0x306F
0xC757 = 0x3070
0xC758 = 0x3071
0xC759 = 0x3072
0xC75A = 0x3073
0xC75B = 0x3074
0xC75C = 0x3075
0xC75D = 0x3076
0xC75E = 0x3077
0xC75F = 0x3078
0xC760 = 0x3079
0xC761 = 0x307A
0xC762 = 0x307B
0xC763 = 0x307C
0xC764 = 0x307D
0xC765 = 0x307E
0xC766 = 0x307F
0xC767 = 0x3080
0xC768 = 0x3081
0xC769 = 0x3082
0xC76A = 0x3083
0xC76B = 0x3084
0xC76C = 0x3085
0xC76D = 0x3086
0xC76E = 0x3087
0xC76F = 0x3088
0xC770 = 0x3089
0xC771 = 0x308A
0xC772 = 0x308B
0xC773 = 0x308C
0xC774 = 0x308D
0xC775 = 0x308E
0xC776 = 0x308F
0xC777 = 0x3090
0xC778 = 0x3091
0xC779 = 0x3092
0xC77A = 0x3093
0xC77B = 0x30A1
0xC77C = 0x30A2
0xC77D = 0x30A3
0xC77E = 0x30A4
0xC7A1 = 0x30A5
0xC7A2 = 0x30A6
0xC7A3 = 0x30A7
0xC7A4 = 0x30A8
0xC7A5 = 0x30A9
0xC7A6 = 0x30AA
0xC7A7 = 0x30AB
0xC7A8 = 0x30AC
0xC7A9 = 0x30AD
0xC7AA = 0x30AE
0xC7AB = 0x30AF
0xC7AC = 0x30B0
0xC7AD = 0x30B1
0xC7AE = 0x30B2
0xC7AF = 0x30B3
0xC7B0 = 0x30B4
0xC7B1 = 0x30B5
0xC7B2 = 0x30B6
0xC7B3 = 0x30B7
0xC7B4 = 0x30B8
0xC7B5 = 0x30B9
0xC7B6 = 0x30BA
0xC7B7 = 0x30BB
0xC7B8 = 0x30BC
0xC7B9 = 0x30BD
0xC7BA = 0x30BE
0xC7BB = 0x30BF
0xC7BC = 0x30C0
0xC7BD = 0x30C1
0xC7BE = 0x30C2
0xC7BF = 0x30C3
0xC7C0 = 0x30C4
0xC7C1 = 0x30C5
0xC7C2 = 0x30C6
0xC7C3 = 0x30C7
0xC7C4 = 0x30C8
0xC7C5 = 0x30C9
0xC7C6 = 0x30CA
0xC7C7 = 0x30CB
0xC7C8 = 0x30CC
0xC7C9 = 0x30CD
0xC7CA = 0x30CE
0xC7CB = 0x30CF
0xC7CC = 0x30D0
0xC7CD = 0x30D1
0xC7CE = 0x30D2
0xC7CF = 0x30D3
0xC7D0 = 0x30D4
0xC7D1 = 0x30D5
0xC7D2 = 0x30D6
0xC7D3 = 0x30D7
0xC7D4 = 0x30D8
0xC7D5 = 0x30D9
0xC7D6 = 0x30DA
0xC7D7 = 0x30DB
0xC7D8 = 0x30DC
0xC7D9 = 0x30DD
0xC7DA = 0x30DE
0xC7DB = 0x30DF
0xC7DC = 0x30E0
0xC7DD = 0x30E1
0xC7DE = 0x30E2
0xC7DF = 0x30E3
0xC7E0 = 0x30E4
0xC7E1 = 0x30E5
0xC7E2 = 0x30E6
0xC7E3 = 0x30E7
0xC7E4 = 0x30E8
0xC7E5 = 0x30E9
0xC7E6 = 0x30EA
0xC7E7 = 0x30EB
0xC7E8 = 0x30EC
0xC7E9 = 0x30ED
0xC7EA = 0x30EE
0xC7EB = 0x30EF
0xC7EC = 0x30F0
0xC7ED = 0x30F1
0xC7EE = 0x30F2
0xC7EF = 0x30F3
0xC7F0 = 0x30F4
0xC7F1 = 0x30F5
0xC7F2 = 0x30F6
0xC7F3 = 0x0410
0xC7F4 = 0x0411
0xC7F5 = 0x0412
0xC7F6 = 0x0413
0xC7F7 = 0x0414
0xC7F8 = 0x0415
0xC7F9 = 0x0401
0xC7FA = 0x0416
0xC7FB = 0x0417
0xC7FC = 0x0418
0xC7FD = 0x0419
0xC7FE = 0x041A
0xC840 = 0x041B
0xC841 = 0x041C
0xC842 = 0x041D
0xC843 = 0x041E
0xC844 = 0x041F
0xC845 = 0x0420
0xC846 = 0x0421
0xC847 = 0x0422
0xC848 = 0x0423
0xC849 = 0x0424
0xC84A = 0x0425
0xC84B = 0x0426
0xC84C = 0x0427
0xC84D = 0x0428
0xC84E = 0x0429
0xC84F = 0x042A
0xC850 = 0x042B
0xC851 = 0x042C
0xC852 = 0x042D
0xC853 = 0x042E
0xC854 = 0x042F
0xC855 = 0x0430
0xC856 = 0x0431
0xC857 = 0x0432
0xC858 = 0x0433
0xC859 = 0x0434
0xC85A = 0x0435
0xC85B = 0x0451
0xC85C = 0x0436
0xC85D = 0x0437
0xC85E = 0x0438
0xC85F = 0x0439
0xC860 = 0x043A
0xC861 = 0x043B
0xC862 = 0x043C
0xC863 = 0x043D
0xC864 = 0x043E
0xC865 = 0x043F
0xC866 = 0x0440
0xC867 = 0x0441
0xC868 = 0x0442
0xC869 = 0x0443
0xC86A = 0x0444
0xC86B = 0x0445
0xC86C = 0x0446
0xC86D = 0x0447
0xC86E = 0x0448
0xC86F = 0x0449
0xC870 = 0x044A
0xC871 = 0x044B
0xC872 = 0x044C
0xC873 = 0x044D
0xC874 = 0x044E
0xC875 = 0x044F
0xC876 = 0x21E7
0xC877 = 0x21B8
0xC878 = 0x21B9
0xC8CD = 0xFFE2
0xC8CE = 0xFFE4
0xC8CF = 0xFF07
0xC8D0 = 0xFF02
0xC8D1 = 0x3231
0xC8D2 = 0x2116
0xC8D3 = 0x2121
0xF9D6 = 0xF813
0xF9D7 = 0xF814
0xF9D8 = 0xF815
0xF9D9 = 0xF816
0xF9DA = 0xF817
0xF9DB = 0xF818
0xF9DC = 0xF819
0xF9DD = 0xF81A
0xF9DE = 0xF81B
0xF9DF = 0xF81C
0xF9E0 = 0xF81D
0xF9E1 = 0xF81E
0xF9E2 = 0xF81F
0xF9E3 = 0xF820
0xF9E4 = 0xF821
0xF9E5 = 0xF822
0xF9E6 = 0xF823
0xF9E7 = 0xF824
0xF9E8 = 0xF825
0xF9E9 = 0xF826
0xF9EA = 0xF827
0xF9EB = 0xF828
0xF9EC = 0xF829
0xF9ED = 0xF82A
0xF9EE = 0xF82B
0xF9EF = 0xF82C
0xF9F0 = 0xF82D
0xF9F1 = 0xF82E
0xF9F2 = 0xF82F
0xF9F3 = 0xF830
0xF9F4 = 0xF831
0xF9F5 = 0xF832
0xF9F6 = 0xF833
0xF9F7 = 0xF834
0xF9F8 = 0xF835
0xF9F9 = 0xF836
0xF9FA = 0xF837
0xF9FB = 0xF838
0xF9FC = 0xF839
0xF9FD = 0xF83A
0xF9FE = 0xF83B
END_MAP

File diff suppressed because it is too large Load Diff

View File

@ -0,0 +1,115 @@
# $NetBSD: Big5UDA%UCS.src,v 1.2 2007/03/05 16:57:08 tnozaki Exp $
# Copyright (c)2006 Citrus Project,
# All rights reserved.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions
# are met:
# 1. Redistributions of source code must retain the above copyright
# notice, this list of conditions and the following disclaimer.
# 2. Redistributions in binary form must reproduce the above copyright
# notice, this list of conditions and the following disclaimer in the
# documentation and/or other materials provided with the distribution.
#
# THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
# ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
# ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
# FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
# DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
# OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
# HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
# LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
# OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
# SUCH DAMAGE.
#
TYPE ROWCOL
NAME "Big5UDA/UCS"
SRC_ZONE 0x81-0xFE / 0x40-0xFE / 8
OOB_MODE INVALID
DST_INVALID 0xFFFE
DST_UNIT_BITS 32
BEGIN_MAP
0x8140 - 0x817E = 0xEEB8 -
0x81A1 - 0x81FE = 0xEEF7 -
0x8240 - 0x827E = 0xEF55 -
0x82A1 - 0x82FE = 0xEF94 -
0x8340 - 0x837E = 0xEFF2 -
0x83A1 - 0x83FE = 0xF031 -
0x8440 - 0x847E = 0xF08F -
0x84A1 - 0x84FE = 0xF0CE -
0x8540 - 0x857E = 0xF12C -
0x85A1 - 0x85FE = 0xF16B -
0x8640 - 0x867E = 0xF1C9 -
0x86A1 - 0x86FE = 0xF208 -
0x8740 - 0x877E = 0xF266 -
0x87A1 - 0x87FE = 0xF2A5 -
0x8840 - 0x887E = 0xF303 -
0x88A1 - 0x88FE = 0xF342 -
0x8940 - 0x897E = 0xF3A0 -
0x89A1 - 0x89FE = 0xF3DF -
0x8A40 - 0x8A7E = 0xF43D -
0x8AA1 - 0x8AFE = 0xF47C -
0x8B40 - 0x8B7E = 0xF4DA -
0x8BA1 - 0x8BFE = 0xF519 -
0x8C40 - 0x8C7E = 0xF577 -
0x8CA1 - 0x8CFE = 0xF5B6 -
0x8D40 - 0x8D7E = 0xF614 -
0x8DA1 - 0x8DFE = 0xF653 -
0x8E40 - 0x8E7E = 0xE311 -
0x8EA1 - 0x8EFE = 0xE350 -
0x8F40 - 0x8F7E = 0xE3AE -
0x8FA1 - 0x8FFE = 0xE3ED -
0x9040 - 0x907E = 0xE44B -
0x90A1 - 0x90FE = 0xE48A -
0x9140 - 0x917E = 0xE4E8 -
0x91A1 - 0x91FE = 0xE527 -
0x9240 - 0x927E = 0xE585 -
0x92A1 - 0x92FE = 0xE5C4 -
0x9340 - 0x937E = 0xE622 -
0x93A1 - 0x93FE = 0xE661 -
0x9440 - 0x947E = 0xE6BF -
0x94A1 - 0x94FE = 0xE6FE -
0x9540 - 0x957E = 0xE75C -
0x95A1 - 0x95FE = 0xE79B -
0x9640 - 0x967E = 0xE7F9 -
0x96A1 - 0x96FE = 0xE838 -
0x9740 - 0x977E = 0xE896 -
0x97A1 - 0x97FE = 0xE8D5 -
0x9840 - 0x987E = 0xE933 -
0x98A1 - 0x98FE = 0xE972 -
0x9940 - 0x997E = 0xE9D0 -
0x99A1 - 0x99FE = 0xEA0F -
0x9A40 - 0x9A7E = 0xEA6D -
0x9AA1 - 0x9AFE = 0xEAAC -
0x9B40 - 0x9B7E = 0xEB0A -
0x9BA1 - 0x9BFE = 0xEB49 -
0x9C40 - 0x9C7E = 0xEBA7 -
0x9CA1 - 0x9CFE = 0xEBE6 -
0x9D40 - 0x9D7E = 0xEC44 -
0x9DA1 - 0x9DFE = 0xEC83 -
0x9E40 - 0x9E7E = 0xECE1 -
0x9EA1 - 0x9EFE = 0xED20 -
0x9F40 - 0x9F7E = 0xED7E -
0x9FA1 - 0x9FFE = 0xEDBD -
0xA040 - 0xA07E = 0xEE1B -
0xA0A1 - 0xA0FE = 0xEE5A -
0xC6A1 - 0xC6FE = 0xF6B1 -
0xC740 - 0xC77E = 0xF70F -
0xC7A1 - 0xC7FE = 0xF74E -
0xC840 - 0xC87E = 0xF7AC -
0xC8A1 - 0xC8FE = 0xF7EB -
0xFA40 - 0xFA7E = 0xE000 -
0xFAA1 - 0xFAFE = 0xE03F -
0xFB40 - 0xFB7E = 0xE09D -
0xFBA1 - 0xFBFE = 0xE0DC -
0xFC40 - 0xFC7E = 0xE13A -
0xFCA1 - 0xFCFE = 0xE179 -
0xFD40 - 0xFD7E = 0xE1D7 -
0xFDA1 - 0xFDFE = 0xE216 -
0xFE40 - 0xFE7E = 0xE274 -
0xFEA1 - 0xFEFE = 0xE2B3 -
END_MAP

View File

@ -0,0 +1,134 @@
# $NetBSD: ETen%UCS@BMP.src,v 1.1 2007/03/05 16:57:09 tnozaki Exp $
TYPE ROWCOL
NAME "ETen/UCS:BMP"
SRC_ZONE 0xC6-0xF9 / 0x40-0xFE / 8
OOB_MODE INVALID
DST_INVALID 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by
# http://wakaba-web.hp.infoseek.co.jp/table/big5-eten.txt
# Original notice:
#
## Big5-ETen vs Unicode mapping table
##
## Date: 24 Feb 2002 19:01:00 +0900
## License: Public Domain.
##
## Big5 Unicode UnicodeAlternate UnicodeName
0xC6A1 - 0xC6AA = 0x2460 -
0xC6AB - 0xC6B4 = 0x2474 -
0xC6B5 - 0xC6BE = 0x2170 -
0xC6BF = 0x2F02
0xC6C0 = 0x2F03
0xC6C1 = 0x2F05
0xC6C2 = 0x2F07
0xC6C3 = 0x2F0C
0xC6C4 = 0x2F0D
0xC6C5 = 0x2F0E
0xC6C6 = 0x2F13
0xC6C7 = 0x2F16
0xC6C8 = 0x2F19
0xC6C9 = 0x2F1B
0xC6CA = 0x2F22
0xC6CB = 0x2F27
0xC6CC = 0x2F2E
0xC6CD = 0x2F33
0xC6CE = 0x2F34
0xC6CF = 0x2F35
0xC6D0 = 0x2F39
0xC6D1 = 0x2F3A
0xC6D2 = 0x2F41
0xC6D3 = 0x2F46
0xC6D4 = 0x2F67
0xC6D5 = 0x2F68
0xC6D6 = 0x2FA1
0xC6D7 = 0x2FAA
0xC6D8 = 0x00A8
0xC6D9 = 0xFF3E # FULLWIDTH CIRCUMFLEX ACCENT
#0xC6D9 = 0x02C6 # MODIFIER LETTER CIRCUMFLEX ACCENT
0xC6DA = 0x30FD
0xC6DB = 0x30FE
0xC6DC = 0x309D
0xC6DD = 0x309E
#0xC6DE =
#0xC6DF =
0xC6E0 - 0xC6E2 = 0x3005 -
0xC6E3 = 0x30FC
0xC6E4 = 0xFF3B
0xC6E5 = 0xFF3D
0xC6E6 = 0x273D
0xC6E7 - 0xC6FE = 0x3041 -
0xC740 - 0xC77A = 0x3059 -
0xC77B - 0xC77E = 0x30A1 -
0xC7A1 - 0xC7F2 = 0x30A5 -
0xC7F3 - 0xC7F8 = 0x0410 -
0xC7F9 = 0x0401
0xC7FA - 0xC7FE = 0x0416 -
0xC840 - 0xC85A = 0x041B -
0xC85B = 0x0451
0xC85C - 0xC875 = 0x0436 -
0xC876 = 0x21E7
0xC877 = 0x21B8
0xC878 = 0x21B9
0xC879 = 0x31CF
0xC87B = 0x4E5A
0xC87D = 0x5202
0xC87E = 0x4491
0xC8A1 = 0x9FB0
0xC8A2 = 0x5188
0xC8A3 = 0x9FB1
#0xC8A5 - 0xC8CC =
0xC8CD = 0xFFE2
0xC8CE = 0xFFE4
0xC8CF = 0xFF07
0xC8D0 = 0xFF02
0xC8D1 = 0x3231
0xC8D2 = 0x2116
0xC8D3 = 0x2121
0xF9D6 = 0x7881
0xF9D7 = 0x92B9
0xF9D8 = 0x88CF
0xF9D9 = 0x58BB
0xF9DA = 0x6052
0xF9DB = 0x7CA7
0xF9DC = 0x5AFA
0xF9DD = 0x2554
0xF9DE = 0x2566
0xF9DF = 0x2557
0xF9E0 = 0x2560
0xF9E1 = 0x256C
0xF9E2 = 0x2563
0xF9E3 = 0x255A
0xF9E4 = 0x2569
0xF9E5 = 0x255D
0xF9E6 = 0x2552
0xF9E7 = 0x2564
0xF9E8 = 0x2555
0xF9E9 = 0x255E
0xF9EA = 0x256A
0xF9EB = 0x2561
0xF9EC = 0x2558
0xF9ED = 0x2567
0xF9EE = 0x255B
0xF9EF = 0x2553
0xF9F0 = 0x2565
0xF9F1 = 0x2556
0xF9F2 = 0x255F
0xF9F3 = 0x256B
0xF9F4 = 0x2562
0xF9F5 = 0x2559
0xF9F6 = 0x2568
0xF9F7 = 0x255C
0xF9F8 = 0x2551
0xF9F9 = 0x2550
0xF9FA = 0x256D
0xF9FB = 0x256E
0xF9FC = 0x2570
0xF9FD = 0x256F
0xF9FE = 0x2593
END_MAP

View File

@ -0,0 +1,26 @@
# $NetBSD: ETen%UCS@SIP.src,v 1.1 2007/03/05 16:57:09 tnozaki Exp $
TYPE ROWCOL
NAME "ETen/UCS:SIP"
SRC_ZONE 0xC6-0xF9 / 0x40-0xFE / 8
OOB_MODE INVALID
DST_INVALID 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by
# http://wakaba-web.hp.infoseek.co.jp/table/big5-eten.txt
# Original notice:
#
## Big5-ETen vs Unicode mapping table
##
## Date: 24 Feb 2002 19:01:00 +0900
## License: Public Domain.
##
## Big5 Unicode UnicodeAlternate UnicodeName
0xC87A = 0x00CC
0xC87C = 0x008A
0xC8A4 = 0x7607
END_MAP

File diff suppressed because it is too large Load Diff

File diff suppressed because it is too large Load Diff

View File

@ -0,0 +1,37 @@
# $NetBSD: Makefile.inc,v 1.2 2007/03/05 16:57:10 tnozaki Exp $
.PATH: ${.CURDIR}/BIG5
SRCS_mapper.dir+= mapper.dir.BIG5
SRCS_charset.pivot+= charset.pivot.BIG5
CLEANFILES+= mapper.dir.BIG5 charset.pivot.BIG5
MAPS_BIG5= Big5@1984%UCS.mps \
Big5EXT@2003%UCS.mps \
Big5EXT@E%UCS.mps \
Big5EXT@IBM%UCS.mps \
Big5EXT@Plus%UCS.mps \
Big5UDA%UCS.mps \
ETen%UCS@BMP.mps ETen%UCS@SIP.mps \
HKSCS%UCS@BMP.mps HKSCS%UCS@SIP.mps \
UCS%Big5@1984.mps \
UCS%Big5EXT@2003.mps \
UCS%Big5EXT@E.mps \
UCS%Big5EXT@IBM.mps \
UCS%Big5EXT@Plus.mps \
UCS%Big5UDA.mps \
UCS@BMP%ETen.mps UCS@SIP%ETen.mps \
UCS@BMP%HKSCS.mps UCS@SIP%HKSCS.mps
mapper.dir.BIG5: ${.CURDIR}/BIG5/mapper.dir.BIG5.src
${_MKTARGET_CREATE}
(echo "# BIG5" ; cat ${.ALLSRC} ; echo ) > ${.TARGET}
charset.pivot.BIG5: ${.CURDIR}/BIG5/charset.pivot.BIG5.src
${_MKTARGET_CREATE}
(echo "# BIG5" ; cat ${.ALLSRC} ; echo ) > ${.TARGET}
FILES+= ${MAPS_BIG5}
CLEANFILES+= ${MAPS_BIG5}
.for i in ${MAPS_BIG5}
FILESDIR_$i= ${BINDIR}/BIG5
.endfor

File diff suppressed because it is too large Load Diff

View File

@ -0,0 +1,65 @@
# $NetBSD: UCS%Big5EXT@2003.src,v 1.1 2006/06/19 17:28:25 tnozaki Exp $
TYPE ROWCOL
NAME "UCS/Big5EXT:2003"
SRC_ZONE 0x00F8 - 0x309C
OOB_MODE INVALID
DST_INVALID 0xFFFF
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by
# http://wakaba-web.hp.infoseek.co.jp/table/big5-eten.txt
# Original notice:
#
## Big5-ETen vs Unicode mapping table
##
## Date: 24 Feb 2002 19:01:00 +0900
## License: Public Domain.
##
## Big5 Unicode UnicodeAlternate UnicodeName
0x00F8 = 0xC8FB
0x014B = 0xC8FC
0x0153 = 0xC8FA
0x0250 = 0xC8F6
0x0254 = 0xC8F8
0x025B = 0xC8F7
0x026A = 0xC8FE
0x0275 = 0xC8F9
0x0283 = 0xC8F5
0x028A = 0xC8FD
0x20AC = 0xA3E1
0x2400 - 0x2420 = 0xA3C0 -
0x2E80 = 0xC8D6
0x2E84 = 0xC8D7
0x2E86 = 0xC8D8
0x2E87 = 0xC8D9
0x2E88 = 0xC8DA
0x2E8A = 0xC8DB
0x2E8C = 0xC8DC
0x2E8D = 0xC8DD
0x2E95 = 0xC8DE
0x2E9C = 0xC8DF
0x2E9D = 0xC8E0
0x2EA5 = 0xC8E1
0x2EA7 = 0xC8E2
0x2EAA = 0xC8E3
0x2EAC = 0xC8E4
0x2EAE = 0xC8E5
0x2EB6 = 0xC8E6
0x2EBC = 0xC8E7
0x2EBE = 0xC8E8
0x2EC6 = 0xC8E9
0x2ECA = 0xC8EA
0x2ECC = 0xC8EB
0x2ECD = 0xC8EC
0x2ECF = 0xC8ED
0x2ED6 = 0xC8EE
0x2ED7 = 0xC8EF
0x2EDE = 0xC8F0
0x2EE3 = 0xC8F1
0x309B = 0xC8D4
0x309C = 0xC8D5
END_MAP

File diff suppressed because it is too large Load Diff

View File

@ -0,0 +1,466 @@
# $NetBSD: UCS%Big5EXT@IBM.src,v 1.1 2006/06/19 17:28:25 tnozaki Exp $
TYPE ROWCOL
NAME "UCS/Big5EXT:IBM"
SRC_ZONE 0x00A8 - 0xFFE4
OOB_MODE INVALID
DST_INVALID 0xFFFE
DST_UNIT_BITS 16
BEGIN_MAP
#
# This mapping data is made from the mapping data provided by Unicode, Inc.
# Original notice:
#
# Name: BIG5 to Unicode table (complete)
# Unicode version: 1.1
# Table version: 0.0d3
# Table format: Format A
# Date: 11 February 1994
#
# Copyright (c) 1991-1994 Unicode, Inc. All Rights reserved.
#
# This file is provided as-is by Unicode, Inc. (The Unicode Consortium).
# No claims are made as to fitness for any particular purpose. No
# warranties of any kind are expressed or implied. The recipient
# agrees to determine applicability of information provided. If this
# file has been provided on magnetic media by Unicode, Inc., the sole
# remedy for any claim will be exchange of defective media within 90
# days of receipt.
#
# Recipient is granted the right to make copies in any form for
# internal distribution and to freely use the information supplied
# in the creation of products supporting Unicode. Unicode, Inc.
# specifically excludes the right to re-distribute this file directly
# to third parties or other organizations whether for profit or not.
#
# General notes:
#
#
# This table contains one set of mappings from BIG5 into Unicode.
# Note that these data are *possible* mappings only and may not be the
# same as those used by actual products, nor may they be the best suited
# for all uses. For more information on the mappings between various code
# pages incorporating the repertoire of BIG5 and Unicode, consult the
# VENDORS mapping data. Normative information on the mapping between
# BIG5 and Unicode may be found in the Unihan.txt file in the
# latest Unicode Character Database.
#
# If you have carefully considered the fact that the mappings in
# this table are only one possible set of mappings between BIG5 and
# Unicode and have no normative status, but still feel that you
# have located an error in the table that requires fixing, you may
# report any such error to errata@unicode.org.
#
# WARNING! It is currently impossible to provide round-trip compatibility
# between BIG5 and Unicode.
#
# A number of characters are not currently mapped because
# of conflicts with other mappings. They are as follows:
#
# BIG5 Description Comments
#
# 0xA15A SPACING UNDERSCORE duplicates A1C4
# 0xA1C3 SPACING HEAVY OVERSCORE not in Unicode
# 0xA1C5 SPACING HEAVY UNDERSCORE not in Unicode
# 0xA1FE LT DIAG UP RIGHT TO LOW LEFT duplicates A2AC
# 0xA240 LT DIAG UP LEFT TO LOW RIGHT duplicates A2AD
# 0xA2CC HANGZHOU NUMERAL TEN conflicts with A451 mapping
# 0xA2CE HANGZHOU NUMERAL THIRTY conflicts with A4CA mapping
#
# We currently map all of these characters to U+FFFD REPLACEMENT CHARACTER.
# It is also possible to map these characters to their duplicates, or to
# the user zone.
#
# Notes:
#
# 1. In addition to the above, there is some uncertainty about the
# mappings in the range C6A1 - C8FE, and F9DD - F9FE. The ETEN
# version of BIG5 organizes the former range differently, and adds
# additional characters in the latter range. The correct mappings
# these ranges need to be determined.
#
# 2. There is an uncertainty in the mapping of the Big Five character
# 0xA3BC. This character occurs within the Big Five block of tone marks
# for bopomofo and is intended to be the tone mark for the first tone in
# Mandarin Chinese. We have selected the mapping U+02C9 MODIFIER LETTER
# MACRON (Mandarin Chinese first tone) to reflect this semantic.
# However, because bopomofo uses the absense of a tone mark to indicate
# the first Mandarin tone, most implementations of Big Five represent
# this character with a blank space, and so a mapping such as U+2003 EM
# SPACE might be preferred.
#
# Format: Three tab-separated columns
# Column #1 is the BIG5 code (in hex as 0xXXXX)
# Column #2 is the Unicode (in hex as 0xXXXX)
# Column #3 is the Unicode name (follows a comment sign, '#')
# The official names for Unicode characters U+4E00
# to U+9FA5, inclusive, is "CJK UNIFIED IDEOGRAPH-XXXX",
# where XXXX is the code point. Including all these
# names in this file increases its size substantially
# and needlessly. The token "<CJK>" is used for the
# name of these characters. If necessary, it can be
# expanded algorithmically by a parser or editor.
#
# The entries are in BIG5 order
#
#
0x00A8 = 0xC6D8
0x02BA = 0xC6DE
0x0401 = 0xC7F9
0x0410 = 0xC7F3
0x0411 = 0xC7F4
0x0412 = 0xC7F5
0x0413 = 0xC7F6
0x0414 = 0xC7F7
0x0415 = 0xC7F8
0x0416 = 0xC7FA
0x0417 = 0xC7FB
0x0418 = 0xC7FC
0x0419 = 0xC7FD
0x041A = 0xC7FE
0x041B = 0xC840
0x041C = 0xC841
0x041D = 0xC842
0x041E = 0xC843
0x041F = 0xC844
0x0420 = 0xC845
0x0421 = 0xC846
0x0422 = 0xC847
0x0423 = 0xC848
0x0424 = 0xC849
0x0425 = 0xC84A
0x0426 = 0xC84B
0x0427 = 0xC84C
0x0428 = 0xC84D
0x0429 = 0xC84E
0x042A = 0xC84F
0x042B = 0xC850
0x042C = 0xC851
0x042D = 0xC852
0x042E = 0xC853
0x042F = 0xC854
0x0430 = 0xC855
0x0431 = 0xC856
0x0432 = 0xC857
0x0433 = 0xC858
0x0434 = 0xC859
0x0435 = 0xC85A
0x0436 = 0xC85C
0x0437 = 0xC85D
0x0438 = 0xC85E
0x0439 = 0xC85F
0x043A = 0xC860
0x043B = 0xC861
0x043C = 0xC862
0x043D = 0xC863
0x043E = 0xC864
0x043F = 0xC865
0x0440 = 0xC866
0x0441 = 0xC867
0x0442 = 0xC868
0x0443 = 0xC869
0x0444 = 0xC86A
0x0445 = 0xC86B
0x0446 = 0xC86C
0x0447 = 0xC86D
0x0448 = 0xC86E
0x0449 = 0xC86F
0x044A = 0xC870
0x044B = 0xC871
0x044C = 0xC872
0x044D = 0xC873
0x044E = 0xC874
0x044F = 0xC875
0x0451 = 0xC85B
0x2116 = 0xC8D2
0x2121 = 0xC8D3
0x2170 = 0xC6B5
0x2171 = 0xC6B6
0x2172 = 0xC6B7
0x2173 = 0xC6B8
0x2174 = 0xC6B9
0x2175 = 0xC6BA
0x2176 = 0xC6BB
0x2177 = 0xC6BC
0x2178 = 0xC6BD
0x2179 = 0xC6BE
0x21B8 = 0xC877
0x21B9 = 0xC878
0x21E7 = 0xC876
0x2400 - 0x2420 = 0xA3C0 -
0x2460 = 0xC6A1
0x2461 = 0xC6A2
0x2462 = 0xC6A3
0x2463 = 0xC6A4
0x2464 = 0xC6A5
0x2465 = 0xC6A6
0x2466 = 0xC6A7
0x2467 = 0xC6A8
0x2468 = 0xC6A9
0x2469 = 0xC6AA
0x2474 = 0xC6AB
0x2475 = 0xC6AC
0x2476 = 0xC6AD
0x2477 = 0xC6AE
0x2478 = 0xC6AF
0x2479 = 0xC6B0
0x247A = 0xC6B1
0x247B = 0xC6B2
0x247C = 0xC6B3
0x247D = 0xC6B4
0x273D = 0xC6E6
0x3005 = 0xC6E0
0x3006 = 0xC6E1
0x3007 = 0xC6E2
0x3041 = 0xC6E7
0x3042 = 0xC6E8
0x3043 = 0xC6E9
0x3044 = 0xC6EA
0x3045 = 0xC6EB
0x3046 = 0xC6EC
0x3047 = 0xC6ED
0x3048 = 0xC6EE
0x3049 = 0xC6EF
0x304A = 0xC6F0
0x304B = 0xC6F1
0x304C = 0xC6F2
0x304D = 0xC6F3
0x304E = 0xC6F4
0x304F = 0xC6F5
0x3050 = 0xC6F6
0x3051 = 0xC6F7
0x3052 = 0xC6F8
0x3053 = 0xC6F9
0x3054 = 0xC6FA
0x3055 = 0xC6FB
0x3056 = 0xC6FC
0x3057 = 0xC6FD
0x3058 = 0xC6FE
0x3059 = 0xC740
0x305A = 0xC741
0x305B = 0xC742
0x305C = 0xC743
0x305D = 0xC744
0x305E = 0xC745
0x305F = 0xC746
0x3060 = 0xC747
0x3061 = 0xC748
0x3062 = 0xC749
0x3063 = 0xC74A
0x3064 = 0xC74B
0x3065 = 0xC74C
0x3066 = 0xC74D
0x3067 = 0xC74E
0x3068 = 0xC74F
0x3069 = 0xC750
0x306A = 0xC751
0x306B = 0xC752
0x306C = 0xC753
0x306D = 0xC754
0x306E = 0xC755
0x306F = 0xC756
0x3070 = 0xC757
0x3071 = 0xC758
0x3072 = 0xC759
0x3073 = 0xC75A
0x3074 = 0xC75B
0x3075 = 0xC75C
0x3076 = 0xC75D
0x3077 = 0xC75E
0x3078 = 0xC75F
0x3079 = 0xC760
0x307A = 0xC761
0x307B = 0xC762
0x307C = 0xC763
0x307D = 0xC764
0x307E = 0xC765
0x307F = 0xC766
0x3080 = 0xC767
0x3081 = 0xC768
0x3082 = 0xC769
0x3083 = 0xC76A
0x3084 = 0xC76B
0x3085 = 0xC76C
0x3086 = 0xC76D
0x3087 = 0xC76E
0x3088 = 0xC76F
0x3089 = 0xC770
0x308A = 0xC771
0x308B = 0xC772
0x308C = 0xC773
0x308D = 0xC774
0x308E = 0xC775
0x308F = 0xC776
0x3090 = 0xC777
0x3091 = 0xC778
0x3092 = 0xC779
0x3093 = 0xC77A
0x309D = 0xC6DC
0x309E = 0xC6DD
0x30A1 = 0xC77B
0x30A2 = 0xC77C
0x30A3 = 0xC77D
0x30A4 = 0xC77E
0x30A5 = 0xC7A1
0x30A6 = 0xC7A2
0x30A7 = 0xC7A3
0x30A8 = 0xC7A4
0x30A9 = 0xC7A5
0x30AA = 0xC7A6
0x30AB = 0xC7A7
0x30AC = 0xC7A8
0x30AD = 0xC7A9
0x30AE = 0xC7AA
0x30AF = 0xC7AB
0x30B0 = 0xC7AC
0x30B1 = 0xC7AD
0x30B2 = 0xC7AE
0x30B3 = 0xC7AF
0x30B4 = 0xC7B0
0x30B5 = 0xC7B1
0x30B6 = 0xC7B2
0x30B7 = 0xC7B3
0x30B8 = 0xC7B4
0x30B9 = 0xC7B5
0x30BA = 0xC7B6
0x30BB = 0xC7B7
0x30BC = 0xC7B8
0x30BD = 0xC7B9
0x30BE = 0xC7BA
0x30BF = 0xC7BB
0x30C0 = 0xC7BC
0x30C1 = 0xC7BD
0x30C2 = 0xC7BE
0x30C3 = 0xC7BF
0x30C4 = 0xC7C0
0x30C5 = 0xC7C1
0x30C6 = 0xC7C2
0x30C7 = 0xC7C3
0x30C8 = 0xC7C4
0x30C9 = 0xC7C5
0x30CA = 0xC7C6
0x30CB = 0xC7C7
0x30CC = 0xC7C8
0x30CD = 0xC7C9
0x30CE = 0xC7CA
0x30CF = 0xC7CB
0x30D0 = 0xC7CC
0x30D1 = 0xC7CD
0x30D2 = 0xC7CE
0x30D3 = 0xC7CF
0x30D4 = 0xC7D0
0x30D5 = 0xC7D1
0x30D6 = 0xC7D2
0x30D7 = 0xC7D3
0x30D8 = 0xC7D4
0x30D9 = 0xC7D5
0x30DA = 0xC7D6
0x30DB = 0xC7D7
0x30DC = 0xC7D8
0x30DD = 0xC7D9
0x30DE = 0xC7DA
0x30DF = 0xC7DB
0x30E0 = 0xC7DC
0x30E1 = 0xC7DD
0x30E2 = 0xC7DE
0x30E3 = 0xC7DF
0x30E4 = 0xC7E0
0x30E5 = 0xC7E1
0x30E6 = 0xC7E2
0x30E7 = 0xC7E3
0x30E8 = 0xC7E4
0x30E9 = 0xC7E5
0x30EA = 0xC7E6
0x30EB = 0xC7E7
0x30EC = 0xC7E8
0x30ED = 0xC7E9
0x30EE = 0xC7EA
0x30EF = 0xC7EB
0x30F0 = 0xC7EC
0x30F1 = 0xC7ED
0x30F2 = 0xC7EE
0x30F3 = 0xC7EF
0x30F4 = 0xC7F0
0x30F5 = 0xC7F1
0x30F6 = 0xC7F2
0x30FC = 0xC6E3
0x30FD = 0xC6DA
0x30FE = 0xC6DB
0x3231 = 0xC8D1
0x4E36 = 0xC6BF
0x4E3F = 0xC6C0
0x4E85 = 0xC6C1
0x4EA0 = 0xC6C2
0x5182 = 0xC6C3
0x5196 = 0xC6C4
0x51AB = 0xC6C5
0x52F9 = 0xC6C6
0x5338 = 0xC6C7
0x5369 = 0xC6C8
0x53B6 = 0xC6C9
0x590A = 0xC6CA
0x5B80 = 0xC6CB
0x5DDB = 0xC6CC
0x5E7A = 0xC6CD
0x5E7F = 0xC6CE
0x5EF4 = 0xC6CF
0x5F50 = 0xC6D0
0x5F61 = 0xC6D1
0x6534 = 0xC6D2
0x65E0 = 0xC6D3
0x7592 = 0xC6D4
0x7676 = 0xC6D5
0x8FB5 = 0xC6D6
0x96B6 = 0xC6D7
0xF813 = 0xF9D6
0xF814 = 0xF9D7
0xF815 = 0xF9D8
0xF816 = 0xF9D9
0xF817 = 0xF9DA
0xF818 = 0xF9DB
0xF819 = 0xF9DC
0xF81A = 0xF9DD
0xF81B = 0xF9DE
0xF81C = 0xF9DF
0xF81D = 0xF9E0
0xF81E = 0xF9E1
0xF81F = 0xF9E2
0xF820 = 0xF9E3
0xF821 = 0xF9E4
0xF822 = 0xF9E5
0xF823 = 0xF9E6
0xF824 = 0xF9E7
0xF825 = 0xF9E8
0xF826 = 0xF9E9
0xF827 = 0xF9EA
0xF828 = 0xF9EB
0xF829 = 0xF9EC
0xF82A = 0xF9ED
0xF82B = 0xF9EE
0xF82C = 0xF9EF
0xF82D = 0xF9F0
0xF82E = 0xF9F1
0xF82F = 0xF9F2
0xF830 = 0xF9F3
0xF831 = 0xF9F4
0xF832 = 0xF9F5
0xF833 = 0xF9F6
0xF834 = 0xF9F7
0xF835 = 0xF9F8
0xF836 = 0xF9F9
0xF837 = 0xF9FA
0xF838 = 0xF9FB
0xF839 = 0xF9FC
0xF83A = 0xF9FD
0xF83B = 0xF9FE
0xF83E = 0xC6DF
0xFF02 = 0xC8D0
0xFF07 = 0xC8CF
0xFF3B = 0xC6E4
0xFF3D = 0xC6E5
0xFF3E = 0xC6D9
0xFFE2 = 0xC8CD
0xFFE4 = 0xC8CE
END_MAP

File diff suppressed because it is too large Load Diff

Some files were not shown because too many files have changed in this diff Show More