New file.

This commit is contained in:
Kenichi Handa 2004-01-27 01:59:12 +00:00
parent 740ddd2766
commit 5d1bff2082
2 changed files with 140 additions and 0 deletions

View file

@ -0,0 +1,57 @@
# cp51932.awk -- Generate a translation table for CP51932.
# Copyright (C) 2004
# National Institute of Advanced Industrial Science and Technology (AIST)
# Registration Number H13PRO009
#
# This file is part of GNU Emacs.
#
# GNU Emacs is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2, or (at your option)
# any later version.
#
# GNU Emacs is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with GNU Emacs; see the file COPYING. If not, write to the
# Free Software Foundation, Inc., 59 Temple Place - Suite 330,
# Boston, MA 02111-1307, USA.
# Comment:
# Genereate a translation table for CP51932 (EUC-JP of MicroSoft Version).
# It maps invalid JISX0208 code points used by CP51932 to Unicode.
# 4th field of the input has these meanings:
# 0: JISX0208 characters.
# 1: NEC special characters.
# 2: IBM extension characters.
# 3: NEC selection of IBM extension characters.
# Among them, 1 and 3 are the target characters. 2 should have
# already been mapped to 1 or 3.
BEGIN {
print ";;; cp51932.el -- translation table for CP51932. -*- no-byte-compile: t -*-";
print ";;; Automatically genrated from CP932-2BYTE.map";
print "(let ((map";
printf " '(;JISEXT<->UNICODE";
}
/# [13]/ {
printf "\n (#x%s . #x%s)", $5 ,substr($2, 3, 4);
}
END {
print ")))";
print " (mapc #'(lambda (x)";
print " (setcar x (decode-char 'japanese-jisx0208 (car x))))";
print " map)";
print " (define-translation-table 'cp51932-decode map)";
print " (mapc #'(lambda (x)";
print " (let ((tmp (car x)))";
print " (setcar x (cdr x)) (setcdr x tmp)))";
print " map)";
print " (define-translation-table 'cp51932-encode map))";
}

View file

@ -0,0 +1,83 @@
# eucjp-ms.awk -- Generate a translation table for eucJP-ms.
# Copyright (C) 2004
# National Institute of Advanced Industrial Science and Technology (AIST)
# Registration Number H13PRO009
#
# This file is part of GNU Emacs.
#
# GNU Emacs is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2, or (at your option)
# any later version.
#
# GNU Emacs is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with GNU Emacs; see the file COPYING. If not, write to the
# Free Software Foundation, Inc., 59 Temple Place - Suite 330,
# Boston, MA 02111-1307, USA.
# Comment:
# eucJP-ms is one of eucJP-open encoding defined at this page:
# http://www.opengroup.or.jp/jvc/cde/appendix.html
BEGIN {
print ";;; eucjp-ms.el -- translation table for eucJP-ms. -*- no-byte-compile: t -*-";
print ";;; Automatically genrated from eucJP-13th.txt, eucJP-udc.txt, eucJP-ibmext.txt";
print "(let ((map";
printf " '(;JISEXT<->UNICODE";
tohex["A"] = 10;
tohex["B"] = 11;
tohex["C"] = 12;
tohex["D"] = 13;
tohex["E"] = 14;
tohex["F"] = 15;
}
function decode_hex(str) {
n = 0;
len = length(str);
for (i = 1; i <= len; i++)
{
c = substr(str, i, 1);
if (c >= "0" && c <= "9")
n = n * 16 + (c - "0");
else
n = n * 16 + tohex[c];
}
return n;
}
/0x8F/ {
code = decode_hex(substr($1, 5, 4));
code -= 32896; # code -= 0x8080
printf "\n (#x%04x #x%s)", code, substr($2, 3, 4);
next;
}
/0x[A-F]/ {
code = decode_hex(substr($1, 3, 4));
code -= 32896; # code -= 0x8080
printf "\n (#x%04x . #x%s)", code, substr($2, 3, 4);
}
END {
print ")))";
print " (mapc #'(lambda (x)";
print " (if (integerp (cdr x))";
print " (setcar x (decode-char 'japanese-jisx0208 (car x)))";
print " (setcar x (decode-char 'japanese-jisx0212 (car x)))";
print " (setcdr x (cadr x))))";
print " map)";
print " (define-translation-table 'eucjp-ms-decode map)";
print " (mapc #'(lambda (x)";
print " (let ((tmp (car x)))";
print " (setcar x (cdr x)) (setcdr x tmp)))";
print " map)";
print " (define-translation-table 'eucjp-ms-encode map))";
}