2004-01-27 01:59:12 +00:00
|
|
|
# eucjp-ms.awk -- Generate a translation table for eucJP-ms.
|
2011-01-02 23:50:46 +00:00
|
|
|
# Copyright (C) 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011
|
2004-01-27 01:59:12 +00:00
|
|
|
# National Institute of Advanced Industrial Science and Technology (AIST)
|
|
|
|
# Registration Number H13PRO009
|
2008-05-09 23:48:10 +00:00
|
|
|
|
2004-01-27 01:59:12 +00:00
|
|
|
# This file is part of GNU Emacs.
|
2008-05-09 23:48:10 +00:00
|
|
|
|
|
|
|
# GNU Emacs is free software: you can redistribute it and/or modify
|
2004-01-27 01:59:12 +00:00
|
|
|
# it under the terms of the GNU General Public License as published by
|
2008-05-09 23:48:10 +00:00
|
|
|
# the Free Software Foundation, either version 3 of the License, or
|
|
|
|
# (at your option) any later version.
|
|
|
|
|
2004-01-27 01:59:12 +00:00
|
|
|
# GNU Emacs is distributed in the hope that it will be useful,
|
|
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
# GNU General Public License for more details.
|
2008-05-09 23:48:10 +00:00
|
|
|
|
2004-01-27 01:59:12 +00:00
|
|
|
# You should have received a copy of the GNU General Public License
|
2017-09-13 22:52:52 +00:00
|
|
|
# along with GNU Emacs. If not, see <https://www.gnu.org/licenses/>.
|
2004-01-27 01:59:12 +00:00
|
|
|
|
2008-05-09 23:48:10 +00:00
|
|
|
# Commentary:
|
2004-01-27 01:59:12 +00:00
|
|
|
|
|
|
|
# eucJP-ms is one of the eucJP-open encodings defined at this page:
|
2019-09-23 06:53:39 +00:00
|
|
|
# https://web.archive.org/web/20120207064433/http://home.m05.itscom.net/numa/cde/ucs-conv/appendix.html
|
2009-06-12 07:22:13 +00:00
|
|
|
# This program reads the mapping file EUC-JP-MS (of glibc) and
|
|
|
|
# generates the Elisp file eucjp-ms.el that defines two translation
|
2015-09-16 23:06:29 +00:00
|
|
|
# tables 'eucjp-ms-decode' and 'eucjp-ms-encode'.
|
2004-01-27 01:59:12 +00:00
|
|
|
|
|
|
|
BEGIN {
  # EUC byte sequences (as spelled in field 2 of the charmap) that
  # delimit the ranges whose entries are written to the output.
  JISX0208_FROM1 = "/xad/xa1"
  JISX0208_TO1 = "/xad/xfc"
  JISX0208_FROM2 = "/xf5/xa1"
  JISX0212_FROM = "/x8f/xf3/xf3"

  # Scanner state:
  #   0  ignore
  #   1  JISX0208          2  JISX0208 target range
  #   3  JISX0212          4  JISX0212 target range
  state = 0

  # Fields are separated by runs of spaces and/or tabs.
  FS = "[ \t][ \t]*"

  # Prologue of the generated Elisp file: header comments and the
  # opening of the quoted mapping list.
  print ";;; eucjp-ms.el --- translation table for eucJP-ms -*- lexical-binding:t -*-"
  print ";;; Automatically generated from /usr/share/i18n/charmaps/EUC-JP-MS.gz"
  print "(let ((map"
  print " '(;JISEXT<->UNICODE"
}
|
|
|
|
|
2009-06-12 07:22:13 +00:00
|
|
|
# write_entry(unicode) -- emit one mapping entry for the current record.
#
# UNICODE is the code point text extracted by the calling rule.  The
# EUC byte sequence is read from field 2 ($2) of the current record.
#
# The global `state' is advanced here:
#   1 -> 2 when $2 is JISX0208_FROM1 or JISX0208_FROM2,
#   3 -> 4 when $2 is JISX0212_FROM,
#   2 -> 1 after the entry whose $2 is JISX0208_TO1 has been printed.
# Output is produced only in states 2 and 4.
#
# `jis' is declared as an extra parameter so that it is local to this
# function (awk has no other way to declare locals); callers pass only
# UNICODE.
function write_entry (unicode,    jis) {
  # Entering a target range?
  if (state == 1) {
    if ($2 == JISX0208_FROM1 || $2 == JISX0208_FROM2)
      state = 2;
  } else if (state == 3) {
    if ($2 == JISX0212_FROM)
      state = 4;
  }

  if (state == 2) {
    # Strip every "/x" so only the hex digits remain.
    jis = $2;
    gsub("/x", "", jis);
    # Dotted pair form.
    printf "\n (#x%s . #x%s)", jis, unicode;
    # Last entry of the first JISX0208 range: leave the target range.
    if ($2 == JISX0208_TO1)
      state = 1;
  } else if (state == 4) {
    # Skip the first four characters of $2 (the leading "/xNN" byte)
    # and keep the following eight before stripping "/x".
    jis = substr($2, 5, 8);
    gsub("/x", "", jis);
    # Two-element list form (no dot).
    printf "\n (#x%s #x%s)", jis, unicode;
  }
}
|
|
|
|
|
|
|
|
|
|
|
|
# A "% JIS X 0208" comment line switches to state 1 (JISX0208);
# nothing else is done with the line.
/^% JIS X 0208/ { state = 1; next }
|
|
|
|
|
|
|
|
# A "% JIS X 0212" comment line switches to state 3 (JISX0212);
# nothing else is done with the line.
/^% JIS X 0212/ { state = 3; next }
|
|
|
|
|
|
|
|
# "END CHARMAP" returns to state 0 (ignore) and skips the line.
/^END CHARMAP/ { state = 0; next }
|
|
|
|
|
2009-06-12 07:22:13 +00:00
|
|
|
# Record starting with "<UXXXX>": unless we are in the ignore state,
# pass the four characters following "<U" in field 1 to write_entry.
/^<U[0-9A-Z][0-9A-Z][0-9A-Z][0-9A-Z]>/ {
  if (state > 0) {
    write_entry(substr($1, 3, 4))
  }
}
|
|
|
|
|
2009-06-12 07:22:13 +00:00
|
|
|
# Record starting with "%IRREVERSIBLE%<UXXXX>": same handling as a
# plain "<UXXXX>" record, but the four characters to pass on start at
# position 17 of field 1, after the 16-character "%IRREVERSIBLE%<U".
/^%IRREVERSIBLE%<U[0-9A-Z][0-9A-Z][0-9A-Z][0-9A-Z]>/ {
  if (state > 0) {
    write_entry(substr($1, 17, 4))
  }
}
|
|
|
|
|
|
|
|
END {
  # Close the quoted mapping list and the `let' binding form.
  print ")))"

  # Rewrite each entry of `map' into a cons of decoded character and
  # Unicode value; the printed Elisp picks the charset by entry shape.
  print " (setq map"
  print " (mapcar"
  print " (lambda (x)"
  print " (let ((code (logand (car x) #x7F7F)))"
  print " (if (integerp (cdr x))"
  print " (cons (decode-char 'japanese-jisx0208 code) (cdr x))"
  print " (cons (decode-char 'japanese-jisx0212 code)"
  print " (cadr x)))))"
  print " map))"
  print " (define-translation-table 'eucjp-ms-decode map)"

  # Swap car and cdr of every entry in place, then define the
  # encoding table from the swapped list.
  print " (mapc (lambda (x)"
  print " (let ((tmp (car x)))"
  print " (setcar x (cdr x)) (setcdr x tmp)))"
  print " map)"
  print " (define-translation-table 'eucjp-ms-encode map))"

  # Blank line followed by the feature declaration.
  print ""
  print "(provide 'eucjp-ms)"
}
|