1
0
mirror of https://git.savannah.gnu.org/git/emacs.git synced 2025-01-13 16:38:14 +00:00
emacs/lisp/language/thai.el
Eli Zaretskii eb0680bd57 Add support for Tai Tham script
* lisp/international/fontset.el (setup-default-fontset)
(script-representative-chars): Add tai-tham.
* lisp/language/thai.el ("Northern Thai"): New language
environment.  Patch by Richard Wordingham
<richard.wordingham@ntlworld.com>.  Set
'composition-function-table' for the Tai Tham block.  Original
code by Richard Wordingham <richard.wordingham@ntlworld.com>.

* etc/HELLO: Add Northern Thai greeting.
* etc/NEWS: Announce addition of Northern Thai language environment.
2022-02-16 17:07:58 +02:00

125 lines
4.7 KiB
EmacsLisp

;;; thai.el --- support for Thai -*- coding: utf-8; lexical-binding: t; -*-
;; Copyright (C) 1997-1998, 2000-2022 Free Software Foundation, Inc.
;; Copyright (C) 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004,
;; 2005, 2006, 2007, 2008, 2009, 2010, 2011
;; National Institute of Advanced Industrial Science and Technology (AIST)
;; Registration Number H13PRO009
;; Copyright (C) 2005
;; National Institute of Advanced Industrial Science and Technology (AIST)
;; Registration Number H14PRO021
;; Keywords: multilingual, Thai, i18n
;; This file is part of GNU Emacs.
;; GNU Emacs is free software: you can redistribute it and/or modify
;; it under the terms of the GNU General Public License as published by
;; the Free Software Foundation, either version 3 of the License, or
;; (at your option) any later version.
;; GNU Emacs is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
;; GNU General Public License for more details.
;; You should have received a copy of the GNU General Public License
;; along with GNU Emacs. If not, see <https://www.gnu.org/licenses/>.
;;; Commentary:
;; For Thai, the character set TIS620 is supported.
;;; Code:
(define-coding-system 'thai-tis620
"8-bit encoding for ASCII (MSB=0) and Thai TIS620 (MSB=1)."
:coding-type 'charset
:mnemonic ?T
:charset-list '(tis620-2533))
(define-coding-system-alias 'th-tis620 'thai-tis620)
(define-coding-system-alias 'tis620 'thai-tis620)
(define-coding-system-alias 'tis-620 'thai-tis620)
(set-language-info-alist
"Thai" '((tutorial . "TUTORIAL.th")
(charset thai-tis620)
(coding-system thai-tis620 iso-8859-11 cp874)
(coding-priority thai-tis620)
(nonascii-translation . tis620-2533)
(input-method . "thai-kesmanee")
(unibyte-display . thai-tis620)
(features thai-util)
(setup-function . setup-thai-language-environment-internal)
(exit-function . exit-thai-language-environment-internal)
(sample-text
. (thai-compose-string
(copy-sequence "Thai (ภาษาไทย) สวัสดีครับ, สวัสดีค่ะ")))
(documentation . t)))
(define-coding-system 'cp874
"DOS codepage 874 (Thai)"
:coding-type 'charset
:mnemonic ?D
:charset-list '(cp874)
:mime-charset 'cp874)
(define-coding-system-alias 'ibm874 'cp874)
(define-coding-system 'iso-8859-11
"ISO/IEC 8859/11 (Latin/Thai)
This is the same as `thai-tis620' with the addition of no-break-space."
:coding-type 'charset
:mnemonic ?*
:mime-charset 'iso-8859-11 ; not actually registered as of 2002-05-24
:charset-list '(iso-8859-11))
;; For automatic composition.
(let ((chars "ัิีึืฺุู็่้๊๋์ํ๎")
(elt '(["[ก-ฯ].[่้๊๋์]?ำ?" 1 thai-composition-function]
[nil 0 thai-composition-function])))
(dotimes (i (length chars))
(aset composition-function-table (aref chars i) elt)))
(aset composition-function-table ?ำ '(["[ก-ฯ]." 1 thai-composition-function]))
;; Tai-Tham
(set-language-info-alist
"Northern Thai" '((charset unicode)
(coding-system utf-8)
(coding-priority utf-8)
(sample-text .
"Northern Thai (ᨣᩣᩴᨾᩮᩬᩥᨦ / ᨽᩣᩈᩣᩃ᩶ᩣ᩠ᨶᨶᩣ) ᩈ᩠ᩅᩢᩔ᩠ᨯᩦᨣᩕᩢ᩠ᨸ")
(documentation . t)))
;; From Richard Wordingham <richard.wordingham@ntlworld.com>:
(defvar tai-tham-composable-pattern
(let ((table
;; C is letters, independent vowels, digits, punctuation and symbols.
'(("C" . "[\u1A20-\u1A54\u1A80-\u1A89\u1A90-\u1A99\u1AA0-\u1AAD]")
("M" . ; Marks, CGJ, ZWNJ, ZWJ
"[\u0324\u034F\u0E49\u0E4A\u0E4B\u1A55-\u1A57\u1A59-\u1A5E\u1A61-\u1A7C\u1A7F\u200C\200D]")
("H" . "\u1A60") ; Sakot
("S" . ; Marks commuting with sakot
"[\u0E49-\u0E4B\u0EC9\u0ECB\u1A75-\u1A7C]")
("N" . "\u1A58"))) ; mai kang lai
(basic-syllable "C\\(N*\\(M\\|HS*C\\)\\)*")
(regexp "X\\(N\\(X\\)?\\)*H?")) ; where X is basic syllable
(let ((case-fold-search nil))
(setq regexp (replace-regexp-in-string "X" basic-syllable regexp t t))
(dolist (elt table)
(setq regexp (replace-regexp-in-string (car elt) (cdr elt)
regexp t t))))
regexp))
(let ((elt (list (vector tai-tham-composable-pattern 0 'font-shape-gstring)
)))
(set-char-table-range composition-function-table '(#x1A20 . #x1A54) elt)
(set-char-table-range composition-function-table '(#x1A80 . #x1A89) elt)
(set-char-table-range composition-function-table '(#x1A90 . #x1A99) elt)
(set-char-table-range composition-function-table '(#x1AA0 . #x1AAD) elt))
(provide 'thai)
;;; thai.el ends here