1998-08-31 19:59:02 +00:00
|
|
|
|
;;; cyrillic.el --- Support for Cyrillic -*- coding: iso-2022-7bit; -*-
|
1997-02-20 07:02:49 +00:00
|
|
|
|
|
|
|
|
|
;; Copyright (C) 1995 Electrotechnical Laboratory, JAPAN.
|
1997-06-26 21:08:49 +00:00
|
|
|
|
;; Licensed to the Free Software Foundation.
|
1997-02-20 07:02:49 +00:00
|
|
|
|
|
|
|
|
|
;; Keywords: multilingual, Cyrillic
|
|
|
|
|
|
|
|
|
|
;; This file is part of GNU Emacs.
|
|
|
|
|
|
|
|
|
|
;; GNU Emacs is free software; you can redistribute it and/or modify
|
|
|
|
|
;; it under the terms of the GNU General Public License as published by
|
|
|
|
|
;; the Free Software Foundation; either version 2, or (at your option)
|
|
|
|
|
;; any later version.
|
|
|
|
|
|
|
|
|
|
;; GNU Emacs is distributed in the hope that it will be useful,
|
|
|
|
|
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
|
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
|
;; GNU General Public License for more details.
|
|
|
|
|
|
|
|
|
|
;; You should have received a copy of the GNU General Public License
|
1997-02-23 09:20:52 +00:00
|
|
|
|
;; along with GNU Emacs; see the file COPYING. If not, write to the
|
|
|
|
|
;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
|
|
|
|
|
;; Boston, MA 02111-1307, USA.
|
1997-02-20 07:02:49 +00:00
|
|
|
|
|
|
|
|
|
;;; Commentary:
|
|
|
|
|
|
1997-02-26 12:27:06 +00:00
|
|
|
|
;; The character set ISO8859-5 is supported. KOI-8 and ALTERNATIVNYJ
|
|
|
|
|
;; are converted to ISO8859-5 internally.
|
1997-02-20 07:02:49 +00:00
|
|
|
|
|
|
|
|
|
;;; Code:
|
|
|
|
|
|
1997-08-22 01:22:17 +00:00
|
|
|
|
;; Cyrillic (general)
|
|
|
|
|
|
1997-02-26 12:27:06 +00:00
|
|
|
|
;; ISO-8859-5 stuff
|
|
|
|
|
|
1997-02-20 07:02:49 +00:00
|
|
|
|
;; Define the coding system `cyrillic-iso-8bit'.  Its type argument is 2
;; and its mnemonic character is ?5; the description string below calls
;; it an ISO 2022 based 8-bit encoding.  The flags list starts with
;; `ascii' and `cyrillic-iso8859-5' and leaves every later slot nil.
(make-coding-system
 'cyrillic-iso-8bit
 2
 ?5
 "ISO 2022 based 8-bit encoding for Cyrillic script (MIME:ISO-8859-5)"
 '(ascii cyrillic-iso8859-5 nil nil nil nil nil nil nil nil nil)
 ;; Property alist: the charsets listed as safe, and the MIME charset name.
 '((safe-charsets ascii cyrillic-iso8859-5)
   (mime-charset . iso-8859-5)))
|
1997-02-20 07:02:49 +00:00
|
|
|
|
|
1997-07-02 00:06:30 +00:00
|
|
|
|
;; Make `iso-8859-5' an alias of the `cyrillic-iso-8bit' coding system.
(define-coding-system-alias 'iso-8859-5 'cyrillic-iso-8bit)
|
1997-06-18 13:03:19 +00:00
|
|
|
|
|
1997-08-22 01:22:17 +00:00
|
|
|
|
;; Language-info entry "Cyrillic-ISO": charset `cyrillic-iso8859-5',
;; coding system `cyrillic-iso-8bit' (also used for coding-priority and
;; unibyte-display), input method "cyrillic-yawerty", and the feature
;; `cyril-util'.  The trailing '("Cyrillic") argument presumably files
;; the entry under a "Cyrillic" parent group -- confirm against the
;; documentation of `set-language-info-alist'.
(set-language-info-alist
|
1998-08-10 06:29:02 +00:00
|
|
|
|
"Cyrillic-ISO" '((charset cyrillic-iso8859-5)
|
1998-01-22 01:48:25 +00:00
|
|
|
|
(coding-system cyrillic-iso-8bit)
|
|
|
|
|
(coding-priority cyrillic-iso-8bit)
|
1998-08-10 06:29:02 +00:00
|
|
|
|
(input-method . "cyrillic-yawerty")
|
|
|
|
|
(nonascii-translation . cyrillic-iso8859-5)
|
|
|
|
|
(unibyte-display . cyrillic-iso-8bit)
|
|
|
|
|
(features cyril-util)
|
1997-08-22 01:22:17 +00:00
|
|
|
|
(sample-text . "Russian (,L@caaZXY(B) ,L7T`PRabRcYbU(B!")
|
1998-01-22 01:48:25 +00:00
|
|
|
|
(documentation . "Support for Cyrillic ISO-8859-5."))
|
|
|
|
|
'("Cyrillic"))
|
1997-08-22 01:22:17 +00:00
|
|
|
|
|
1997-02-26 12:27:06 +00:00
|
|
|
|
;; KOI-8 stuff
|
|
|
|
|
|
1998-08-02 01:06:57 +00:00
|
|
|
|
(eval-and-compile
|
|
|
|
|
|
|
|
|
|
;; A 256-element vector indexed by KOI8-R byte value.  The entries for
;; bytes 163, 179 and 192..255 are Cyrillic character literals; every
;; other entry is simply the byte's own value.
(defvar cyrillic-koi8-r-decode-table
|
|
|
|
|
[
|
|
|
|
|
0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
|
|
|
|
|
16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31
|
|
|
|
|
32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47
|
|
|
|
|
48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63
|
|
|
|
|
64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79
|
|
|
|
|
80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95
|
|
|
|
|
96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111
|
|
|
|
|
112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127
|
|
|
|
|
128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143
|
|
|
|
|
144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159
|
1999-09-29 11:44:57 +00:00
|
|
|
|
160 161 162 ?,Lq(B 164 165 166 167 168 169 170 171 172 173 174 175
|
|
|
|
|
176 177 178 ?,L!(B 180 181 182 183 184 185 186 187 188 189 190 191
|
1998-08-02 01:06:57 +00:00
|
|
|
|
?,Ln(B ?,LP(B ?,LQ(B ?,Lf(B ?,LT(B ?,LU(B ?,Ld(B ?,LS(B ?,Le(B ?,LX(B ?,LY(B ?,LZ(B ?,L[(B ?,L\(B ?,L](B ?,L^(B
|
|
|
|
|
?,L_(B ?,Lo(B ?,L`(B ?,La(B ?,Lb(B ?,Lc(B ?,LV(B ?,LR(B ?,Ll(B ?,Lk(B ?,LW(B ?,Lh(B ?,Lm(B ?,Li(B ?,Lg(B ?,Lj(B
|
|
|
|
|
?,LN(B ?,L0(B ?,L1(B ?,LF(B ?,L4(B ?,L5(B ?,LD(B ?,L3(B ?,LE(B ?,L8(B ?,L9(B ?,L:(B ?,L;(B ?,L<(B ?,L=(B ?,L>(B
|
|
|
|
|
?,L?(B ?,LO(B ?,L@(B ?,LA(B ?,LB(B ?,LC(B ?,L6(B ?,L2(B ?,LL(B ?,LK(B ?,L7(B ?,LH(B ?,LM(B ?,LI(B ?,LG(B ?,LJ(B ]
|
|
|
|
|
"Cyrillic KOI8-R decoding table.")
|
|
|
|
|
|
|
|
|
|
(defvar cyrillic-koi8-r-encode-table
  ;; Build the inverse of `cyrillic-koi8-r-decode-table'.  Slots that
  ;; are never assigned keep the initial value 32.
  (let ((encoding (make-vector 256 32))
        (code 0)
        decoded fields)
    (while (< code 256)
      (setq decoded (aref cyrillic-koi8-r-decode-table code)
            fields (split-char decoded))
      (cond ((eq (car fields) 'cyrillic-iso8859-5)
             ;; A Cyrillic character: index the slot by its position
             ;; code with bit 7 set.
             (aset encoding (logior (nth 1 fields) 128) code))
            ((/= decoded 32)
             ;; Anything else except 32 is stored at its own value.
             (aset encoding decoded code)))
      (setq code (1+ code)))
    encoding)
  "Cyrillic KOI8-R encoding table.")
|
|
|
|
|
|
|
|
|
|
)
|
|
|
|
|
|
1997-02-26 12:27:06 +00:00
|
|
|
|
;; The program's leading element is 3.  The body reads one code into r0
;; and then loops on `write-read-repeat', passing r0 together with
;; `cyrillic-koi8-r-decode-table' (spliced in by the backquote).
(define-ccl-program ccl-decode-koi8
  `(3
    ((read r0)
     (loop
      (write-read-repeat r0 ,cyrillic-koi8-r-decode-table))))
  "CCL program to decode KOI8.")
|
|
|
|
|
|
|
|
|
|
(define-ccl-program ccl-encode-koi8
  `(1
    ((read r0)
     (loop
      ;; Compare r0 with the charset id of `cyrillic-iso8859-5'.
      (if (r0 != ,(charset-id 'cyrillic-iso8859-5))
          ;; Different: hand r0 to `write-read-repeat' without a table.
          (write-read-repeat r0)
        ;; Same: read the following code into r0 and hand it to
        ;; `write-read-repeat' together with the KOI8-R encode table.
        ((read r0)
         (write-read-repeat r0 ,cyrillic-koi8-r-encode-table))))))
  "CCL program to encode KOI8.")
|
|
|
|
|
|
|
|
|
|
;; Define the coding system `cyrillic-koi8'.  Its type argument is 4 and
;; its flags argument is a (DECODER . ENCODER) pair naming the CCL
;; programs `ccl-decode-koi8' and `ccl-encode-koi8'.
(make-coding-system
 'cyrillic-koi8
 4
 ;; We used to use ?K.  It is true that ?K is more strictly correct,
 ;; but it is also used for Korean.
 ;; So people who use koi8 for languages other than Russian
 ;; will have to forgive us.
 ?R
 "KOI8 8-bit encoding for Cyrillic (MIME: KOI8-R)"
 '(ccl-decode-koi8 . ccl-encode-koi8)
 '((safe-charsets ascii cyrillic-iso8859-5)
   (mime-charset . koi8-r)
   ;; These byte values match the entries of
   ;; `cyrillic-koi8-r-decode-table' that are either ASCII or a
   ;; Cyrillic character literal.
   (valid-codes (0 . 127) 163 179 (192 . 255))
   (charset-origin-alist
    (cyrillic-iso8859-5 "KOI8-R" cyrillic-encode-koi8-r-char))))
|
1997-02-26 12:27:06 +00:00
|
|
|
|
|
1997-07-02 00:06:30 +00:00
|
|
|
|
;; Make `koi8-r' an alias of the `cyrillic-koi8' coding system.
(define-coding-system-alias 'koi8-r 'cyrillic-koi8)
|
|
|
|
|
;; Make `koi8' an alias of the `cyrillic-koi8' coding system.
(define-coding-system-alias 'koi8 'cyrillic-koi8)
|
1997-02-26 12:27:06 +00:00
|
|
|
|
|
|
|
|
|
(define-ccl-program ccl-encode-koi8-font
  `(0
    (;; Set bit 7 of r1, then replace r1 with the element of
     ;; `cyrillic-koi8-r-encode-table' that it indexes.
     (r1 |= 128)
     (r1 = r1 ,cyrillic-koi8-r-encode-table)))
  "CCL program to encode Cyrillic chars to KOI font.")
|
|
|
|
|
|
|
|
|
|
;; Put a ("koi8" . VALUE) pair at the front of `font-ccl-encoder-alist',
;; where VALUE is the value of the variable `ccl-encode-koi8-font'.
(let ((koi8-font-entry (cons "koi8" ccl-encode-koi8-font)))
  (setq font-ccl-encoder-alist
        (cons koi8-font-entry font-ccl-encoder-alist)))
|
|
|
|
|
|
1998-08-02 01:06:57 +00:00
|
|
|
|
;; Translation table built from `cyrillic-koi8-r-decode-table'; the
;; "Cyrillic-KOI8" language-info entry uses it as its
;; `nonascii-translation' value.
(defvar cyrillic-koi8-r-nonascii-translation-table
  (make-translation-table-from-vector cyrillic-koi8-r-decode-table)
  "Value of `nonascii-translation-table' in Cyrillic-KOI8 language environment.")
|
|
|
|
|
|
1997-08-22 01:22:17 +00:00
|
|
|
|
;; Language-info entry "Cyrillic-KOI8": charset `cyrillic-iso8859-5',
;; coding system `cyrillic-koi8' (also used for coding-priority and
;; unibyte-display), input method "cyrillic-jcuken", and the feature
;; `cyril-util'.  The alist is backquoted so that the value of
;; `cyrillic-koi8-r-nonascii-translation-table' is spliced in as the
;; `nonascii-translation' entry.
(set-language-info-alist
|
1998-08-10 06:29:02 +00:00
|
|
|
|
"Cyrillic-KOI8" `((charset cyrillic-iso8859-5)
|
|
|
|
|
(nonascii-translation
|
1998-08-02 01:06:57 +00:00
|
|
|
|
. ,cyrillic-koi8-r-nonascii-translation-table)
|
1998-01-22 01:48:25 +00:00
|
|
|
|
(coding-system cyrillic-koi8)
|
|
|
|
|
(coding-priority cyrillic-koi8)
|
1999-07-13 19:03:04 +00:00
|
|
|
|
(input-method . "cyrillic-jcuken")
|
1998-08-10 06:29:02 +00:00
|
|
|
|
(features cyril-util)
|
|
|
|
|
(unibyte-display . cyrillic-koi8)
|
1997-08-22 01:22:17 +00:00
|
|
|
|
(sample-text . "Russian (,L@caaZXY(B) ,L7T`PRabRcYbU(B!")
|
1998-08-02 01:06:57 +00:00
|
|
|
|
(documentation . "Support for Cyrillic KOI8-R."))
|
1998-01-22 01:48:25 +00:00
|
|
|
|
'("Cyrillic"))
|
1997-08-22 01:22:17 +00:00
|
|
|
|
|
1997-02-26 12:27:06 +00:00
|
|
|
|
;;; ALTERNATIVNYJ stuff
|
|
|
|
|
|
1998-08-02 01:06:57 +00:00
|
|
|
|
(eval-and-compile
|
|
|
|
|
|
|
|
|
|
;; A 256-element vector indexed by ALTERNATIVNYJ byte value.  The
;; entries for bytes 128..175, 224..241 and 255 are Cyrillic character
;; literals; every other entry is simply the byte's own value.
(defvar cyrillic-alternativnyj-decode-table
|
|
|
|
|
[
|
|
|
|
|
0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
|
|
|
|
|
16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31
|
|
|
|
|
32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47
|
|
|
|
|
48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63
|
|
|
|
|
64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79
|
|
|
|
|
80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95
|
|
|
|
|
96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111
|
|
|
|
|
112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127
|
|
|
|
|
?,L0(B ?,L1(B ?,L2(B ?,L3(B ?,L4(B ?,L5(B ?,L6(B ?,L7(B ?,L8(B ?,L9(B ?,L:(B ?,L;(B ?,L<(B ?,L=(B ?,L>(B ?,L?(B
|
|
|
|
|
?,L@(B ?,LA(B ?,LB(B ?,LC(B ?,LD(B ?,LE(B ?,LF(B ?,LG(B ?,LH(B ?,LI(B ?,LJ(B ?,LK(B ?,LL(B ?,LM(B ?,LN(B ?,LO(B
|
|
|
|
|
?,LP(B ?,LQ(B ?,LR(B ?,LS(B ?,LT(B ?,LU(B ?,LV(B ?,LW(B ?,LX(B ?,LY(B ?,LZ(B ?,L[(B ?,L\(B ?,L](B ?,L^(B ?,L_(B
|
1999-09-29 11:44:57 +00:00
|
|
|
|
176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191
|
|
|
|
|
192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207
|
|
|
|
|
208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223
|
1998-08-02 01:06:57 +00:00
|
|
|
|
?,L`(B ?,La(B ?,Lb(B ?,Lc(B ?,Ld(B ?,Le(B ?,Lf(B ?,Lg(B ?,Lh(B ?,Li(B ?,Lj(B ?,Lk(B ?,Ll(B ?,Lm(B ?,Ln(B ?,Lo(B
|
1999-09-29 11:44:57 +00:00
|
|
|
|
?,L!(B ?,Lq(B 242 243 244 245 246 247 248 249 250 251 252 253 254 ?,Lp(B]
|
1998-08-02 01:06:57 +00:00
|
|
|
|
"Cyrillic ALTERNATIVNYJ decoding table.")
|
|
|
|
|
|
|
|
|
|
(defvar cyrillic-alternativnyj-encode-table
  ;; Build the inverse of `cyrillic-alternativnyj-decode-table'.  Slots
  ;; that are never assigned keep the initial value 32.
  (let ((encoding (make-vector 256 32))
        (code 0)
        decoded fields)
    (while (< code 256)
      (setq decoded (aref cyrillic-alternativnyj-decode-table code)
            fields (split-char decoded))
      (cond ((eq (car fields) 'cyrillic-iso8859-5)
             ;; A Cyrillic character: index the slot by its position
             ;; code with bit 7 set.
             (aset encoding (logior (nth 1 fields) 128) code))
            ((/= decoded 32)
             ;; Anything else except 32 is stored at its own value.
             (aset encoding decoded code)))
      (setq code (1+ code)))
    encoding)
  "Cyrillic ALTERNATIVNYJ encoding table.")
|
|
|
|
|
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
1997-02-26 12:27:06 +00:00
|
|
|
|
;; The program's leading element is 3.  The body reads one code into r0
;; and then loops on `write-read-repeat', passing r0 together with
;; `cyrillic-alternativnyj-decode-table' (spliced in by the backquote).
(define-ccl-program ccl-decode-alternativnyj
  `(3
    ((read r0)
     (loop
      (write-read-repeat r0 ,cyrillic-alternativnyj-decode-table))))
  "CCL program to decode Alternativnyj.")
|
|
|
|
|
|
|
|
|
|
(define-ccl-program ccl-encode-alternativnyj
  `(1
    ((read r0)
     (loop
      ;; Compare r0 with the charset id of `cyrillic-iso8859-5'.
      (if (r0 != ,(charset-id 'cyrillic-iso8859-5))
          ;; Different: hand r0 to `write-read-repeat' without a table.
          (write-read-repeat r0)
        ;; Same: read the following code into r0 and hand it to
        ;; `write-read-repeat' together with the ALTERNATIVNYJ encode
        ;; table.
        ((read r0)
         (write-read-repeat r0 ,cyrillic-alternativnyj-encode-table))))))
  "CCL program to encode Alternativnyj.")
|
|
|
|
|
|
|
|
|
|
;; Define the coding system `cyrillic-alternativnyj'.  Its type argument
;; is 4, its mnemonic character is ?A, and its flags argument is a
;; (DECODER . ENCODER) pair naming the CCL programs
;; `ccl-decode-alternativnyj' and `ccl-encode-alternativnyj'.
(make-coding-system
 'cyrillic-alternativnyj 4 ?A
 "ALTERNATIVNYJ 8-bit encoding for Cyrillic"
 '(ccl-decode-alternativnyj . ccl-encode-alternativnyj)
 '((safe-charsets ascii cyrillic-iso8859-5)
   ;; These byte values match the entries of
   ;; `cyrillic-alternativnyj-decode-table' that are either below 128
   ;; or a Cyrillic character literal.
   (valid-codes (0 . 175) (224 . 241) 255)
   ;; The origin entry must name the ALTERNATIVNYJ encoder function.
   ;; This previously named `cyrillic-encode-koi8-r-char', copied from
   ;; the KOI8 definition, which would yield KOI8-R codes under the
   ;; "ALTERNATIVNYJ" label.
   ;; NOTE(review): `cyrillic-encode-alternativnyj-char' is expected to
   ;; be provided by cyril-util.el next to the KOI8-R variant -- confirm.
   (charset-origin-alist (cyrillic-iso8859-5 "ALTERNATIVNYJ"
                                             cyrillic-encode-alternativnyj-char))))
|
|
|
|
|
|
1997-02-26 12:27:06 +00:00
|
|
|
|
|
1997-07-02 00:06:30 +00:00
|
|
|
|
;; Make `alternativnyj' an alias of the `cyrillic-alternativnyj' coding system.
(define-coding-system-alias 'alternativnyj 'cyrillic-alternativnyj)
|
1997-06-18 13:03:19 +00:00
|
|
|
|
|
1997-02-26 12:27:06 +00:00
|
|
|
|
;; The program must be backquoted, not quoted: it contains
;; `,cyrillic-alternativnyj-encode-table', and under a plain quote the
;; comma form is left unevaluated, so the program would hold the list
;; (\, cyrillic-alternativnyj-encode-table) instead of the table vector.
;; `ccl-encode-koi8-font' is written the same way.
(define-ccl-program ccl-encode-alternativnyj-font
  `(0
    (;; Set bit 7 of r1, then replace r1 with the element of
     ;; `cyrillic-alternativnyj-encode-table' that it indexes.
     (r1 |= 128)
     (r1 = r1 ,cyrillic-alternativnyj-encode-table)))
  "CCL program to encode Cyrillic chars to Alternativnyj font.")
|
|
|
|
|
|
|
|
|
|
;; Put an ("alternativnyj" . VALUE) pair at the front of
;; `font-ccl-encoder-alist', where VALUE is the value of the variable
;; `ccl-encode-alternativnyj-font'.
(let ((alternativnyj-font-entry
       (cons "alternativnyj" ccl-encode-alternativnyj-font)))
  (setq font-ccl-encoder-alist
        (cons alternativnyj-font-entry font-ccl-encoder-alist)))
|
|
|
|
|
|
1998-08-02 01:06:57 +00:00
|
|
|
|
;; Translation table built from `cyrillic-alternativnyj-decode-table';
;; the "Cyrillic-ALT" language-info entry uses it as its
;; `nonascii-translation' value.
(defvar cyrillic-alternativnyj-nonascii-translation-table
  (make-translation-table-from-vector
   cyrillic-alternativnyj-decode-table)
  "Value of `nonascii-translation-table' in Cyrillic-ALT language environment.")
|
|
|
|
|
|
1997-02-20 07:02:49 +00:00
|
|
|
|
;; Language-info entry "Cyrillic-ALT": charset `cyrillic-iso8859-5',
;; coding system `cyrillic-alternativnyj' (also used for coding-priority
;; and unibyte-display), input method "cyrillic-jcuken", and the feature
;; `cyril-util'.  The alist is backquoted so that the value of
;; `cyrillic-alternativnyj-nonascii-translation-table' is spliced in as
;; the `nonascii-translation' entry.
(set-language-info-alist
|
1998-08-10 06:29:02 +00:00
|
|
|
|
"Cyrillic-ALT" `((charset cyrillic-iso8859-5)
|
|
|
|
|
(nonascii-translation
|
|
|
|
|
. ,cyrillic-alternativnyj-nonascii-translation-table)
|
1998-01-22 01:48:25 +00:00
|
|
|
|
(coding-system cyrillic-alternativnyj)
|
|
|
|
|
(coding-priority cyrillic-alternativnyj)
|
1999-07-13 19:03:04 +00:00
|
|
|
|
(input-method . "cyrillic-jcuken")
|
1998-08-10 06:29:02 +00:00
|
|
|
|
(features cyril-util)
|
|
|
|
|
(unibyte-display . cyrillic-alternativnyj)
|
1997-08-22 01:22:17 +00:00
|
|
|
|
(sample-text . "Russian (,L@caaZXY(B) ,L7T`PRabRcYbU(B!")
|
1998-01-22 01:48:25 +00:00
|
|
|
|
(documentation . "Support for Cyrillic ALTERNATIVNYJ."))
|
|
|
|
|
'("Cyrillic"))
|
1997-02-20 07:02:49 +00:00
|
|
|
|
|
|
|
|
|
;;; cyrillic.el ends here
|