1
Fork 0
mirror of git://git.sv.gnu.org/emacs.git synced 2025-12-28 08:11:05 -08:00
emacs/admin/charsets/eucjp-ms.awk
Paul Eggert c7bc28bf03 Don’t attempt to modify constant conses
From a patch privately suggested by Mattias Engdegård on 2020-05-11
in a followup to Bug#40671.
* admin/charsets/cp51932.awk:
* admin/charsets/eucjp-ms.awk:
Generate code that does not modify constant conses.
* doc/misc/emacs-mime.texi (Encoding Customization):
* lisp/emacs-lisp/byte-opt.el (byte-compile-side-effect-free-ops):
* lisp/frameset.el (frameset-persistent-filter-alist):
* lisp/gnus/gnus-sum.el (gnus-article-mode-line-format-alist):
Use append instead of nconc.
* lisp/language/japanese.el (japanese-ucs-cp932-to-jis-map)
(jisx0213-to-unicode):
Use mapcar instead of mapc.
* lisp/language/lao-util.el (lao-transcription-consonant-alist)
(lao-transcription-vowel-alist):
* lisp/language/tibetan.el (tibetan-subjoined-transcription-alist):
Use copy-sequence.
* test/src/fns-tests.el (fns-tests-nreverse):
(fns-tests-sort, fns-tests-collate-sort)
(fns-tests-string-version-lessp, fns-tests-mapcan):
Use copy-sequence, vector, and list.
2020-05-16 17:05:37 -07:00

113 lines
3.1 KiB
Awk

# eucjp-ms.awk -- Generate a translation table for eucJP-ms.
# Copyright (C) 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011
# National Institute of Advanced Industrial Science and Technology (AIST)
# Registration Number H13PRO009
# This file is part of GNU Emacs.
# GNU Emacs is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
# GNU Emacs is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
# You should have received a copy of the GNU General Public License
# along with GNU Emacs. If not, see <https://www.gnu.org/licenses/>.
# Commentary:
# eucJP-ms is one of the eucJP-open encodings defined at this page:
# https://web.archive.org/web/20120207064433/http://home.m05.itscom.net/numa/cde/ucs-conv/appendix.html
# This program reads the mapping file EUC-JP-MS (of glibc) and
# generates the Elisp file eucjp-ms.el that defines two translation
# tables 'eucjp-ms-decode' and 'eucjp-ms-encode'.
BEGIN {
    # Fields are separated by any run of spaces and/or tabs.
    FS = "[ \t][ \t]*"

    # Byte sequences (as spelled in the charmap's second field) that
    # delimit the ranges to be emitted:
    #   JIS X 0208: FROM1..TO1, and everything from FROM2 onward;
    #   JIS X 0212: everything from FROM onward.
    JISX0208_FROM1 = "/xad/xa1"
    JISX0208_TO1   = "/xad/xfc"
    JISX0208_FROM2 = "/xf5/xa1"
    JISX0212_FROM  = "/x8f/xf3/xf3"

    # Parser state:
    #   0  ignore input
    #   1  inside the JIS X 0208 section, outside the target range
    #   2  inside the JIS X 0208 section, inside the target range
    #   3  inside the JIS X 0212 section, outside the target range
    #   4  inside the JIS X 0212 section, inside the target range
    state = 0

    # Header of the generated Elisp file, followed by the opening of the
    # quoted list that write_entry fills in.
    print ";;; eucjp-ms.el -- translation table for eucJP-ms"
    print ";;; Automatically generated from /usr/share/i18n/charmaps/EUC-JP-MS.gz"
    print "(let ((map"
    print " '(;JISEXT<->UNICODE"
}
# Emit one map entry for the current input line, if that line falls in a
# target range.  UNICODE is the four-character hexadecimal code point
# text; the encoded byte sequence is taken from field 2 of the line.
# Reads and updates the global `state'; uses the global scratch
# variable `jis'.
function write_entry (unicode) {
    # Step into a target range when its first byte sequence is seen.
    if (state == 1 && ($2 == JISX0208_FROM1 || $2 == JISX0208_FROM2))
        state = 2
    else if (state == 3 && $2 == JISX0212_FROM)
        state = 4

    if (state == 2) {
        # JIS X 0208 entry: drop every "/x" so only hex digits remain,
        # and emit a dotted pair.
        jis = $2
        gsub("/x", "", jis)
        printf "\n (#x%s . #x%s)", jis, unicode
        # The first range is closed; leave it after its last entry.
        if ($2 == JISX0208_TO1)
            state = 1
    } else if (state == 4) {
        # JIS X 0212 entry: take the 8 characters starting at position 5
        # of field 2 (skipping the leading 4-character "/x.." byte) and
        # emit a two-element list, which the generated Lisp tells apart
        # from the dotted pairs above.
        jis = substr($2, 5, 8)
        gsub("/x", "", jis)
        printf "\n (#x%s #x%s)", jis, unicode
    }
}
# Section markers in the charmap select the parser state; the marker
# lines themselves carry no mapping, so skip straight to the next line.

# Start of the JIS X 0208 section.
/^% JIS X 0208/ { state = 1; next }

# Start of the JIS X 0212 section.
/^% JIS X 0212/ { state = 3; next }

# End of the character map: ignore everything that follows.
/^END CHARMAP/  { state = 0; next }
# Ordinary mapping line "<Uxxxx> ...": the four code point characters
# start at position 3 of the first field.  Only handled inside a section.
state > 0 && /^<U[0-9A-Z][0-9A-Z][0-9A-Z][0-9A-Z]>/ {
    write_entry(substr($1, 3, 4))
}

# Mapping line prefixed with "%IRREVERSIBLE%": the same data, with the
# four code point characters starting at position 17 of the first field.
state > 0 && /^%IRREVERSIBLE%<U[0-9A-Z][0-9A-Z][0-9A-Z][0-9A-Z]>/ {
    write_entry(substr($1, 17, 4))
}
END {
    # Close the quoted entry list and the binding list of the `let'.
    print ")))"

    # Rebuild the map with fresh conses.  Each code is masked with
    # #x7F7F; dotted-pair entries (integer cdr) are decoded as
    # japanese-jisx0208, list entries as japanese-jisx0212.
    print " (setq map"
    print " (mapcar"
    print " (lambda (x)"
    print " (let ((code (logand (car x) #x7F7F)))"
    print " (if (integerp (cdr x))"
    print " (cons (decode-char 'japanese-jisx0208 code) (cdr x))"
    print " (cons (decode-char 'japanese-jisx0212 code)"
    print " (cadr x)))))"
    print " map))"

    # Define the decoding table from the rebuilt map.
    print " (define-translation-table 'eucjp-ms-decode map)"

    # Swap car and cdr of every entry in place, then define the
    # encoding table from the swapped map.
    print " (mapc (lambda (x)"
    print " (let ((tmp (car x)))"
    print " (setcar x (cdr x)) (setcdr x tmp)))"
    print " map)"
    print " (define-translation-table 'eucjp-ms-encode map))"

    # Blank line, then the feature declaration.
    print ""
    print "(provide 'eucjp-ms)"
}