mirror of
https://git.savannah.gnu.org/git/emacs.git
synced 2024-12-19 10:22:27 +00:00
190 lines
6.2 KiB
EmacsLisp
190 lines
6.2 KiB
EmacsLisp
;;; indian.el --- Indian languages support -*- coding: utf-8; -*-
|
||
|
||
;; Copyright (C) 1997, 1999, 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009
|
||
;; Free Software Foundation, Inc.
|
||
;; Copyright (C) 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009
|
||
;; National Institute of Advanced Industrial Science and Technology (AIST)
|
||
;; Registration Number H14PRO021
|
||
|
||
;; Maintainer: Kenichi Handa <handa@m17n.org>
|
||
;; KAWABATA, Taichi <kawabata@m17n.org>
|
||
;; Keywords: multilingual, i18n, Indian
|
||
|
||
;; This file is part of GNU Emacs.
|
||
|
||
;; GNU Emacs is free software: you can redistribute it and/or modify
|
||
;; it under the terms of the GNU General Public License as published by
|
||
;; the Free Software Foundation, either version 3 of the License, or
|
||
;; (at your option) any later version.
|
||
|
||
;; GNU Emacs is distributed in the hope that it will be useful,
|
||
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
;; GNU General Public License for more details.
|
||
|
||
;; You should have received a copy of the GNU General Public License
|
||
;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>.
|
||
|
||
;;; Commentary:
|
||
|
||
;; This file contains definitions of Indian language environments, and
|
||
;; setups for displaying the scrtipts used there.
|
||
|
||
;;; Code:
|
||
|
||
(define-coding-system 'in-is13194-devanagari
|
||
"8-bit encoding for ASCII (MSB=0) and IS13194-Devanagari (MSB=1)."
|
||
:coding-type 'iso-2022
|
||
:mnemonic ?D
|
||
:designation [ascii indian-is13194 nil nil]
|
||
:charset-list '(ascii indian-is13194)
|
||
:post-read-conversion 'in-is13194-post-read-conversion
|
||
:pre-write-conversion 'in-is13194-pre-write-conversion)
|
||
|
||
(define-coding-system-alias 'devanagari 'in-is13194-devanagari)
|
||
|
||
(set-language-info-alist
|
||
"Devanagari" '((charset unicode)
|
||
(coding-system utf-8)
|
||
(coding-priority utf-8)
|
||
(input-method . "dev-aiba")
|
||
(documentation . "\
|
||
Such languages using Devanagari script as Hindi and Marathi
|
||
are supported in this language environment."))
|
||
'("Indian"))
|
||
|
||
(set-language-info-alist
|
||
"Bengali" '((charset unicode)
|
||
(coding-system utf-8)
|
||
(coding-priority utf-8)
|
||
(input-method . "bengali-itrans")
|
||
(documentation . "\
|
||
Such languages using Bengali script as Bengali and Assamese
|
||
are supported in this language environment."))
|
||
'("Indian"))
|
||
|
||
(set-language-info-alist
|
||
"Punjabi" '((charset unicode)
|
||
(coding-system utf-8)
|
||
(coding-priority utf-8)
|
||
(input-method . "punjabi-itrans")
|
||
(documentation . "\
|
||
North Indian language Punjabi is supported in this language environment."))
|
||
'("Indian"))
|
||
|
||
(set-language-info-alist
|
||
"Gujarati" '((charset unicode)
|
||
(coding-system utf-8)
|
||
(coding-priority utf-8)
|
||
(input-method . "gujarati-itrans")
|
||
(documentation . "\
|
||
North Indian language Gujarati is supported in this language environment."))
|
||
'("Indian"))
|
||
|
||
(set-language-info-alist
|
||
"Oriya" '((charset unicode)
|
||
(coding-system utf-8)
|
||
(coding-priority utf-8)
|
||
(input-method . "oriya-itrans")
|
||
(documentation . "\
|
||
Such languages using Oriya script as Oriya, Khonti, and Santali
|
||
are supported in this language environment."))
|
||
'("Indian"))
|
||
|
||
(set-language-info-alist
|
||
"Tamil" '((charset unicode)
|
||
(coding-system utf-8)
|
||
(coding-priority utf-8)
|
||
(input-method . "tamil-itrans")
|
||
(documentation . "\
|
||
South Indian Language Tamil is supported in this language environment."))
|
||
'("Indian"))
|
||
|
||
(set-language-info-alist
|
||
"Telugu" '((charset unicode)
|
||
(coding-system utf-8)
|
||
(coding-priority utf-8)
|
||
(input-method . "telugu-itrans")
|
||
(documentation . "\
|
||
South Indian Language Telugu is supported in this language environment."))
|
||
'("Indian"))
|
||
|
||
(set-language-info-alist
|
||
"Kannada" '((charset unicode)
|
||
(coding-system mule-utf-8)
|
||
(coding-priority mule-utf-8)
|
||
(input-method . "kannada-itrans")
|
||
(sample-text . "Kannada (ಕನ್ನಡ) ನಮಸ್ಕಾರ")
|
||
(documentation . "\
|
||
Kannada language and script is supported in this language
|
||
environment."))
|
||
'("Indian"))
|
||
|
||
(set-language-info-alist
|
||
"Malayalam" '((charset unicode)
|
||
(coding-system utf-8)
|
||
(coding-priority utf-8)
|
||
(input-method . "malayalam-itrans")
|
||
(documentation . "\
|
||
South Indian language Malayalam is supported in this language environment."))
|
||
'("Indian"))
|
||
|
||
(defconst devanagari-composable-pattern
|
||
(concat
|
||
"\\([अ-औॠॡ][ँं]?\\)\\|[ः।]"
|
||
"\\|\\("
|
||
"\\(?:\\(?:[क-हक़-य़]्\\)?\\(?:[क-हक़-य़]्\\)?\\(?:[क-हक़-य़]्\\)?[क-हक़-य़]्\\)?"
|
||
"[क-हक़-य़]\\(?:्\\|[ा-्ॢॣ]?[ंँ]?\\)?"
|
||
"\\)")
|
||
"Regexp matching a composable sequence of Devanagari characters.")
|
||
|
||
(defconst tamil-composable-pattern
|
||
(concat
|
||
"\\([அ-ஔ]\\)\\|"
|
||
"[ஂஃ]\\|" ;; vowel modifier considered independent
|
||
"\\(\\(?:\\(?:க்ஷ\\)\\|[க-ஹ]\\)[்ா-ௌ]?\\)\\|"
|
||
"\\(ஷ்ரீ\\)")
|
||
"Regexp matching a composable sequence of Tamil characters.")
|
||
|
||
(defconst kannada-composable-pattern
|
||
(concat
|
||
"\\([ಂ-ಔೠಌ]\\)\\|[ಃ]"
|
||
"\\|\\("
|
||
"\\(?:\\(?:[ಕ-ಹ]್\\)?\\(?:[ಕ-ಹ]್\\)?\\(?:[ಕ-ಹ]್\\)?[ಕ-ಹ]್\\)?"
|
||
"[ಕ-ಹ]\\(?:್\\|[ಾ-್ೕೃ]?\\)?"
|
||
"\\)")
|
||
"Regexp matching a composable sequence of Kannada characters.")
|
||
|
||
(defconst malayalam-composable-pattern
|
||
(concat
|
||
"\\([അ-ഔ][ം]?\\)\\|ഃ"
|
||
"\\|\\("
|
||
"\\(?:\\(?:[ക-ഹ]്\\)?\\(?:[ക-ഹ]്\\)?\\(?:[ക-ഹ]്\\)?[ക-ഹ]്\\)?"
|
||
"[ക-ഹ]\\(?:്\\|[ാ-ൃെേൈൊൊോൌ]?[ം്]?\\)?"
|
||
"\\)")
|
||
"Regexp matching a composable sequence of Malayalam characters.")
|
||
|
||
(let ((script-regexp-alist
|
||
`((devanagari . ,devanagari-composable-pattern)
|
||
(bengali . "[\x980-\x9FF\x200C\x200D]+")
|
||
(gurmukhi . "[\xA00-\xA7F\x200C\x200D]+")
|
||
(gujarati . "[\xA80-\xAFF\x200C\x200D]+")
|
||
(oriya . "[\xB00-\xB7F\x200C\x200D]+")
|
||
(tamil . ,tamil-composable-pattern)
|
||
(telugu . "[\xC00-\xC7F\x200C\x200D]+")
|
||
(kannada . ,kannada-composable-pattern)
|
||
(malayalam . ,malayalam-composable-pattern))))
|
||
(map-char-table
|
||
#'(lambda (key val)
|
||
(let ((slot (assq val script-regexp-alist)))
|
||
(if slot
|
||
(set-char-table-range
|
||
composition-function-table key
|
||
(list (vector (cdr slot) 0 'font-shape-gstring))))))
|
||
char-script-table))
|
||
|
||
(provide 'indian)
|
||
|
||
;; arch-tag: 83aa8fc7-7ee2-4364-a6e5-498f5e3b8c2f
|
||
;;; indian.el ends here
|