mirror of
git://git.sv.gnu.org/emacs.git
synced 2025-12-15 10:30:25 -08:00
dc4e6b1329; Update copyright years in more files64b3777631; Run set-copyright from admin.el8e1c56ae46; Add 2024 to copyright years # Conflicts: # doc/misc/modus-themes.org # doc/misc/texinfo.tex # etc/NEWS # etc/refcards/ru-refcard.tex # etc/themes/modus-operandi-theme.el # etc/themes/modus-themes.el # etc/themes/modus-vivendi-theme.el # lib/alloca.in.h # lib/binary-io.h # lib/c-ctype.h # lib/c-strcasecmp.c # lib/c-strncasecmp.c # lib/careadlinkat.c # lib/cloexec.c # lib/close-stream.c # lib/diffseq.h # lib/dup2.c # lib/filemode.h # lib/fpending.c # lib/fpending.h # lib/fsusage.c # lib/getgroups.c # lib/getloadavg.c # lib/gettext.h # lib/gettime.c # lib/gettimeofday.c # lib/group-member.c # lib/malloc.c # lib/md5-stream.c # lib/md5.c # lib/md5.h # lib/memmem.c # lib/memrchr.c # lib/nanosleep.c # lib/save-cwd.h # lib/sha1.c # lib/sig2str.c # lib/stdlib.in.h # lib/strtoimax.c # lib/strtol.c # lib/strtoll.c # lib/time_r.c # lib/xalloc-oversized.h # lisp/auth-source-pass.el # lisp/emacs-lisp/lisp-mnt.el # lisp/emacs-lisp/timer.el # lisp/info-look.el # lisp/jit-lock.el # lisp/loadhist.el # lisp/mail/rmail.el # lisp/net/ntlm.el # lisp/net/webjump.el # lisp/progmodes/asm-mode.el # lisp/progmodes/project.el # lisp/progmodes/sh-script.el # lisp/textmodes/flyspell.el # lisp/textmodes/reftex-toc.el # lisp/textmodes/reftex.el # lisp/textmodes/tex-mode.el # lisp/url/url-gw.el # m4/alloca.m4 # m4/clock_time.m4 # m4/d-type.m4 # m4/dirent_h.m4 # m4/dup2.m4 # m4/euidaccess.m4 # m4/fchmodat.m4 # m4/filemode.m4 # m4/fsusage.m4 # m4/getgroups.m4 # m4/getloadavg.m4 # m4/getrandom.m4 # m4/gettime.m4 # m4/gettimeofday.m4 # m4/gnulib-common.m4 # m4/group-member.m4 # m4/inttypes.m4 # m4/malloc.m4 # m4/manywarnings.m4 # m4/mempcpy.m4 # m4/memrchr.m4 # m4/mkostemp.m4 # m4/mktime.m4 # m4/nproc.m4 # m4/nstrftime.m4 # m4/pathmax.m4 # m4/pipe2.m4 # m4/pselect.m4 # m4/pthread_sigmask.m4 # m4/readlink.m4 # m4/realloc.m4 # m4/sig2str.m4 # m4/ssize_t.m4 # m4/stat-time.m4 # m4/stddef_h.m4 # m4/stdint.m4 # m4/stdio_h.m4 # m4/stdlib_h.m4 # m4/stpcpy.m4 # m4/strnlen.m4 # m4/strtoimax.m4 # m4/strtoll.m4 # m4/time_h.m4 # m4/timegm.m4 # m4/timer_time.m4 # m4/timespec.m4 # m4/unistd_h.m4 # m4/warnings.m4 # nt/configure.bat # nt/preprep.c # test/lisp/register-tests.el
272 lines
9.3 KiB
EmacsLisp
272 lines
9.3 KiB
EmacsLisp
;;; cyrillic.el --- support for Cyrillic -*- coding: utf-8; lexical-binding: t; -*-
|
||
|
||
;; Copyright (C) 1997-1998, 2001-2024 Free Software Foundation, Inc.
|
||
;; Copyright (C) 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004,
|
||
;; 2005, 2006, 2007, 2008, 2009, 2010, 2011
|
||
;; National Institute of Advanced Industrial Science and Technology (AIST)
|
||
;; Registration Number H14PRO021
|
||
;; Copyright (C) 2003
|
||
;; National Institute of Advanced Industrial Science and Technology (AIST)
|
||
;; Registration Number H13PRO009
|
||
|
||
;; Author: Kenichi Handa <handa@gnu.org>
|
||
;; Keywords: multilingual, Cyrillic, i18n
|
||
|
||
;; This file is part of GNU Emacs.
|
||
|
||
;; GNU Emacs is free software: you can redistribute it and/or modify
|
||
;; it under the terms of the GNU General Public License as published by
|
||
;; the Free Software Foundation, either version 3 of the License, or
|
||
;; (at your option) any later version.
|
||
|
||
;; GNU Emacs is distributed in the hope that it will be useful,
|
||
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
;; GNU General Public License for more details.
|
||
|
||
;; You should have received a copy of the GNU General Public License
|
||
;; along with GNU Emacs. If not, see <https://www.gnu.org/licenses/>.
|
||
|
||
;;; Commentary:
|
||
|
||
;; The character set ISO8859-5 is supported. KOI-8 and ALTERNATIVNYJ
|
||
;; are converted to Unicode internally. See
|
||
;; <URL:http://www.ecma.ch/ecma1/STAND/ECMA-113.HTM>. For more info
|
||
;; on Cyrillic charsets, see
|
||
;; <URL:https://czyborra.com/charsets/cyrillic.html>. The KOI and
|
||
;; Alternativnyj coding systems should live in code-pages.el, but
|
||
;; they've always been preloaded and the coding system autoload
|
||
;; mechanism didn't get accepted, so they have to stay here and
|
||
;; duplicate code-pages stuff.
|
||
|
||
;; Note that 8859-5 maps directly onto the Unicode Cyrillic block,
|
||
;; apart from codepoints 160 (NBSP, c.f. U+0400), 173 (soft hyphen,
|
||
;; c.f. U+04OD) and 253 (section sign, c.f U+045D). The KOI-8 and
|
||
;; Alternativnyj coding systems encode both 8859-5 and Unicode.
|
||
;; ucs-tables.el provides unification for cyrillic-iso-8bit.
|
||
|
||
;; Customizing `utf-fragment-on-decoding' allows decoding characters
|
||
;; from KOI and Alternativnyj into 8859-5 where that's possible.
|
||
;; cyrillic-iso8859-5 characters take half as much space in the buffer
|
||
;; as the mule-unicode-0100-24ff equivalents, though that's probably
|
||
;; not normally a big deal.
|
||
|
||
;;; Code:
|
||
|
||
;; Cyrillic (general)
|
||
|
||
;; ISO-8859-5 stuff
|
||
|
||
(define-coding-system 'cyrillic-iso-8bit
|
||
"ISO 2022 based 8-bit encoding for Cyrillic script (MIME:ISO-8859-5)."
|
||
:coding-type 'charset
|
||
:mnemonic ?5
|
||
:charset-list '(iso-8859-5)
|
||
:mime-charset 'iso-8859-5)
|
||
|
||
(define-coding-system-alias 'iso-8859-5 'cyrillic-iso-8bit)
|
||
|
||
(set-language-info-alist
|
||
"Cyrillic-ISO" '((charset iso-8859-5)
|
||
(coding-system cyrillic-iso-8bit)
|
||
(coding-priority cyrillic-iso-8bit)
|
||
(input-method . "cyrillic-yawerty") ; fixme
|
||
(nonascii-translation . iso-8859-5)
|
||
(unibyte-display . cyrillic-iso-8bit)
|
||
(features cyril-util)
|
||
(sample-text . "Russian (Русский) Здравствуйте!")
|
||
(documentation . "Support for Cyrillic ISO-8859-5."))
|
||
'("Cyrillic"))
|
||
|
||
;; KOI-8R stuff
|
||
|
||
(define-coding-system 'cyrillic-koi8
|
||
"KOI8 8-bit encoding for Cyrillic (MIME: KOI8-R)."
|
||
:coding-type 'charset
|
||
;; We used to use ?K. It is true that ?K is more strictly correct,
|
||
;; but it is also used for Korean. So people who use koi8 for
|
||
;; languages other than Russian will have to forgive us.
|
||
:mnemonic ?R
|
||
:charset-list '(koi8)
|
||
:mime-charset 'koi8-r)
|
||
|
||
(define-coding-system-alias 'koi8-r 'cyrillic-koi8)
|
||
(define-coding-system-alias 'koi8 'cyrillic-koi8)
|
||
(define-coding-system-alias 'cp878 'cyrillic-koi8)
|
||
|
||
(set-language-info-alist
|
||
"Cyrillic-KOI8" '((charset koi8)
|
||
(coding-system cyrillic-koi8)
|
||
(coding-priority cyrillic-koi8 cyrillic-iso-8bit)
|
||
(ctext-non-standard-encodings "koi8-r")
|
||
(nonascii-translation . koi8)
|
||
(input-method . "russian-typewriter")
|
||
(features cyril-util)
|
||
(unibyte-display . cyrillic-koi8)
|
||
(sample-text . "Russian (Русский) Здравствуйте!")
|
||
(documentation . "Support for Cyrillic KOI8-R."))
|
||
'("Cyrillic"))
|
||
|
||
(set-language-info-alist
|
||
"Russian" `((charset cyrillic-iso8859-5)
|
||
(nonascii-translation
|
||
. ,(get 'cyrillic-koi8-r-nonascii-translation-table
|
||
'translation-table))
|
||
(coding-system cyrillic-koi8)
|
||
(coding-priority cyrillic-koi8 cyrillic-iso-8bit)
|
||
(input-method . "russian-computer")
|
||
(features cyril-util)
|
||
(unibyte-display . cyrillic-koi8)
|
||
(sample-text . "Russian (Русский) Здравствуйте!")
|
||
(documentation . "\
|
||
Support for Russian using koi8-r and the russian-computer input method.")
|
||
(tutorial . "TUTORIAL.ru"))
|
||
'("Cyrillic"))
|
||
|
||
(define-coding-system 'koi8-u
|
||
"KOI8-U 8-bit encoding for Cyrillic (MIME: KOI8-U)"
|
||
:coding-type 'charset
|
||
;; This used to be ?U which collided with UTF-8.
|
||
:mnemonic ?У ; CYRILLIC CAPITAL LETTER U
|
||
:charset-list '(koi8-u)
|
||
:mime-charset 'koi8-u)
|
||
|
||
(set-language-info-alist
|
||
"Ukrainian" '((tutorial . "TUTORIAL.uk")
|
||
(charset koi8-u)
|
||
(coding-system koi8-u)
|
||
(coding-priority koi8-u)
|
||
(nonascii-translation . koi8-u)
|
||
(input-method . "ukrainian-computer")
|
||
(sample-text . "Ukrainian (Українська) Вітаю / Добрий день! / Привіт")
|
||
(documentation
|
||
. "Support for Ukrainian with koi8-u character set."))
|
||
'("Cyrillic"))
|
||
|
||
;;; ALTERNATIVNYJ stuff
|
||
|
||
(define-coding-system 'cyrillic-alternativnyj
|
||
"ALTERNATIVNYJ 8-bit encoding for Cyrillic."
|
||
:coding-type 'charset
|
||
:mnemonic ?A
|
||
:charset-list '(alternativnyj))
|
||
|
||
(define-coding-system-alias 'alternativnyj 'cyrillic-alternativnyj)
|
||
|
||
(set-language-info-alist
|
||
"Cyrillic-ALT" '((charset alternativnyj)
|
||
(coding-system cyrillic-alternativnyj)
|
||
(coding-priority cyrillic-alternativnyj)
|
||
(nonascii-translation . alternativnyj)
|
||
(input-method . "russian-typewriter")
|
||
(features cyril-util)
|
||
(unibyte-display . cyrillic-alternativnyj)
|
||
(sample-text . "Russian (Русский) Здравствуйте!")
|
||
(documentation . "Support for Cyrillic ALTERNATIVNYJ."))
|
||
'("Cyrillic"))
|
||
|
||
(define-coding-system 'cp866
|
||
"CP866 encoding for Cyrillic."
|
||
:coding-type 'charset
|
||
:mnemonic ?*
|
||
:charset-list '(ibm866)
|
||
:mime-charset 'cp866)
|
||
|
||
(define-coding-system 'koi8-t
|
||
"KOI8-T 8-bit encoding for Cyrillic"
|
||
:coding-type 'charset
|
||
:mnemonic ?*
|
||
:charset-list '(koi8-t)
|
||
:mime-charset 'koi8-t)
|
||
|
||
(define-coding-system 'windows-1251
|
||
"windows-1251 8-bit encoding for Cyrillic (MIME: WINDOWS-1251)"
|
||
:coding-type 'charset
|
||
:mnemonic ?b
|
||
:charset-list '(windows-1251)
|
||
:mime-charset 'windows-1251)
|
||
(define-coding-system-alias 'cp1251 'windows-1251)
|
||
|
||
(define-coding-system 'cp1125
|
||
"cp1125 8-bit encoding for Cyrillic"
|
||
:coding-type 'charset
|
||
:mnemonic ?*
|
||
:charset-list '(cp1125))
|
||
(define-coding-system-alias 'ruscii 'cp1125)
|
||
;; Original name for cp1125, says Serhii Hlodin <hlodin@lutsk.bank.gov.ua>
|
||
(define-coding-system-alias 'cp866u 'cp1125)
|
||
|
||
(define-coding-system 'cp855
|
||
"DOS codepage 855 (Russian)"
|
||
:coding-type 'charset
|
||
:mnemonic ?D
|
||
:charset-list '(cp855)
|
||
:mime-charset 'cp855)
|
||
(define-coding-system-alias 'ibm855 'cp855)
|
||
|
||
(define-coding-system 'mik
|
||
"Bulgarian DOS codepage"
|
||
:coding-type 'charset
|
||
:mnemonic ?D
|
||
:charset-list '(mik))
|
||
|
||
(define-coding-system 'pt154
|
||
"ParaType Asian Cyrillic codepage"
|
||
:coding-type 'charset
|
||
:mnemonic ?D
|
||
:charset-list '(pt154))
|
||
|
||
;; (set-language-info-alist
|
||
;; "Windows-1251" `((coding-system windows-1251)
|
||
;; (coding-priority windows-1251)
|
||
;; (input-method . "russian-typewriter") ; fixme?
|
||
;; (features code-pages)
|
||
;; (documentation . "Support for windows-1251 character set."))
|
||
;; '("Cyrillic"))
|
||
|
||
(set-language-info-alist
|
||
"Tajik" '((coding-system koi8-t)
|
||
(coding-priority koi8-t)
|
||
(nonascii-translation . cyrillic-koi8-t)
|
||
(charset koi8-t)
|
||
(input-method . "russian-typewriter") ; fixme?
|
||
(features code-pages)
|
||
(documentation . "Support for Tajik using KOI8-T."))
|
||
'("Cyrillic"))
|
||
|
||
(set-language-info-alist
|
||
"Bulgarian" '((coding-system windows-1251)
|
||
(coding-priority windows-1251)
|
||
(nonascii-translation . windows-1251)
|
||
(charset windows-1251)
|
||
(ctext-non-standard-encodings "microsoft-cp1251")
|
||
(input-method . "bulgarian-bds")
|
||
(documentation
|
||
. "Support for Bulgarian with windows-1251 character set."))
|
||
'("Cyrillic"))
|
||
|
||
(set-language-info-alist
|
||
"Belarusian" '((coding-system windows-1251)
|
||
(coding-priority windows-1251)
|
||
(nonascii-translation . windows-1251)
|
||
(charset windows-1251)
|
||
(ctext-non-standard-encodings "microsoft-cp1251")
|
||
(input-method . "belarusian")
|
||
(documentation
|
||
. "Support for Belarusian with windows-1251 character set.
|
||
\(The name Belarusian replaced Byelorussian in the early 1990s.)"))
|
||
'("Cyrillic"))
|
||
|
||
;; The Mongolian-traditional language environment is in misc-lang.el.
|
||
(set-language-info-alist
|
||
"Mongolian-cyrillic" '((coding-system utf-8)
|
||
(coding-priority utf-8)
|
||
(input-method . "cyrillic-mongolian")
|
||
(sample-text . "Mongolian (монгол хэл) Сайн байна уу?")
|
||
(documentation
|
||
. "Support for Mongolian language with Cyrillic alphabet."))
|
||
'("Cyrillic"))
|
||
|
||
(provide 'cyrillic)
|
||
|
||
;;; cyrillic.el ends here
|