mirror of
https://git.savannah.gnu.org/git/emacs.git
synced 2024-12-15 09:47:20 +00:00
5beb269505
* admin/unidata/BidiBrackets.txt: * admin/unidata/BidiMirroring.txt: * admin/unidata/Blocks.txt: * admin/unidata/NormalizationTest.txt: * admin/unidata/SpecialCasing.txt: * admin/unidata/UnicodeData.txt: * admin/unidata/copyright.html: * test/manual/BidiCharacterTest.txt: Updated files imported from Unicode v13.0. * admin/unidata/blocks.awk: Add "Symbols for Legacy Computing" to known aliases. * lisp/international/fontset.el (script-representative-chars) (setup-default-fontset): Add new scripts. * lisp/international/characters.el: Set syntax for Symbols for Legacy Computing characters. Update setting of char-width-table. * lisp/international/mule-cmds.el (ucs-names): Update ranges of characters for which we want names in 'ucs-names'. * test/lisp/international/ucs-normalize-tests.el (ucs-normalize-tests--failing-lines-part1) (ucs-normalize-tests--failing-lines-part2): Update according to 'ucs-normalize-check-failing-lines'.
1442 lines
50 KiB
EmacsLisp
1442 lines
50 KiB
EmacsLisp
;;; fontset.el --- commands for handling fontset

;; Copyright (C) 1997-2020 Free Software Foundation, Inc.
;; Copyright (C) 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004,
;;   2005, 2006, 2007, 2008, 2009, 2010, 2011
;;   National Institute of Advanced Industrial Science and Technology (AIST)
;;   Registration Number H14PRO021
;; Copyright (C) 2003, 2006
;;   National Institute of Advanced Industrial Science and Technology (AIST)
;;   Registration Number H13PRO009

;; Keywords: mule, i18n, fontset

;; This file is part of GNU Emacs.

;; GNU Emacs is free software: you can redistribute it and/or modify
;; it under the terms of the GNU General Public License as published by
;; the Free Software Foundation, either version 3 of the License, or
;; (at your option) any later version.

;; GNU Emacs is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
;; GNU General Public License for more details.

;; You should have received a copy of the GNU General Public License
;; along with GNU Emacs.  If not, see <https://www.gnu.org/licenses/>.

;;; Commentary:

;;; Code:

;; Setup font-encoding-alist for all known encodings.
;;
;; Each element is (REGEXP . ENCODING): REGEXP is matched against a
;; font name, and ENCODING is either a charset symbol or a cons of
;; two charset symbols (either of which may be nil).  The regexp
;; strings are passed through `purecopy' before being stored.

(setq font-encoding-alist
      (mapcar (lambda (arg)
		(cons (purecopy (car arg)) (cdr arg)))
	      '(("iso8859-1$" . iso-8859-1)
		("iso8859-2$" . iso-8859-2)
		("iso8859-3$" . iso-8859-3)
		("iso8859-4$" . iso-8859-4)
		("iso8859-5$" . iso-8859-5)
		("iso8859-6$" . iso-8859-6)
		("iso8859-7$" . iso-8859-7)
		("iso8859-8$" . iso-8859-8)
		("iso8859-9$" . iso-8859-9)
		("iso8859-10$" . iso-8859-10)
		("iso8859-11$" . iso-8859-11)
		("iso8859-13$" . iso-8859-13)
		("iso8859-14$" . iso-8859-14)
		("iso8859-15$" . iso-8859-15)
		("iso8859-16$" . iso-8859-16)
		("ascii-0$" . ascii)
		("gb2312.1980" . chinese-gb2312)
		("gbk" . chinese-gbk)
		;; GB18030 needs the characters encoded by gb18030, but a
		;; gb18030 font doesn't necessarily support all of the GB18030
		;; characters.
		("gb18030" . (gb18030 . unicode))
		("jisx0208.1978" . japanese-jisx0208-1978)
		("jisx0208" . japanese-jisx0208)
		("jisx0201" . jisx0201)
		("jisx0212" . japanese-jisx0212)
		("ksx1001" . korean-ksc5601)
		("ksc5601.1987" . korean-ksc5601)
		("cns11643.1992.*1" . chinese-cns11643-1)
		("cns11643.1992.*2" . chinese-cns11643-2)
		("cns11643.1992.*3" . chinese-cns11643-3)
		("cns11643.1992.*4" . chinese-cns11643-4)
		("cns11643.1992.*5" . chinese-cns11643-5)
		("cns11643.1992.*6" . chinese-cns11643-6)
		("cns11643.1992.*7" . chinese-cns11643-7)
		("cns11643.92p1-0" . chinese-cns11643-1)
		("cns11643.92p2-0" . chinese-cns11643-2)
		("cns11643.92p3-0" . chinese-cns11643-3)
		("cns11643.92p4-0" . chinese-cns11643-4)
		("cns11643.92p5-0" . chinese-cns11643-5)
		("cns11643.92p6-0" . chinese-cns11643-6)
		("cns11643.92p7-0" . chinese-cns11643-7)
		("big5" . big5)
		("viscii" . viscii)
		("tis620" . tis620-2533)
		("microsoft-cp1251" . windows-1251)
		("koi8-r" . koi8-r)
		("jisx0213.2000-1" . japanese-jisx0213-1)
		("jisx0213.2000-2" . japanese-jisx0213-2)
		("jisx0213.2004-1" . japanese-jisx0213.2004-1)
		("iso10646-1$" . (unicode-bmp . nil))
		("iso10646.indian-1" . (unicode-bmp . nil))
		("unicode-bmp" . (unicode-bmp . nil))
		;; This regexp used to be spelled "abobe-symbol", which can
		;; never match the name of an Adobe Symbol font.
		("adobe-symbol" . symbol)
		("sisheng_cwnn" . chinese-sisheng)
		("mulearabic-0" . arabic-digit)
		("mulearabic-1" . arabic-1-column)
		("mulearabic-2" . arabic-2-column)
		("muleipa" . ipa)
		("ethiopic-unicode" . (unicode-bmp . ethiopic))
		("is13194-devanagari" . indian-is13194)
		("Devanagari-CDAC" . devanagari-cdac)
		("Sanskrit-CDAC" . sanskrit-cdac)
		("Bengali-CDAC" . bengali-cdac)
		("Assamese-CDAC" . assamese-cdac)
		("Punjabi-CDAC" . punjabi-cdac)
		("Gujarati-CDAC" . gujarati-cdac)
		("Oriya-CDAC" . oriya-cdac)
		("Tamil-CDAC" . tamil-cdac)
		("Telugu-CDAC" . telugu-cdac)
		("Kannada-CDAC" . kannada-cdac)
		("Malayalam-CDAC" . malayalam-cdac)
		("Devanagari-Akruti" . devanagari-akruti)
		("Bengali-Akruti" . bengali-akruti)
		("Punjabi-Akruti" . punjabi-akruti)
		("Gujarati-Akruti" . gujarati-akruti)
		("Oriya-Akruti" . oriya-akruti)
		("Tamil-Akruti" . tamil-akruti)
		("Telugu-Akruti" . telugu-akruti)
		("Kannada-Akruti" . kannada-akruti)
		("Malayalam-Akruti" . malayalam-akruti)
		("muleindian-2" . indian-2-column)
		("muleindian-1" . indian-1-column)
		("mulelao-1" . mule-lao)
		("muletibetan-2" . tibetan)
		("muletibetan-0" . tibetan)
		("muletibetan-1" . tibetan-1-column))))

(defvar font-encoding-charset-alist)

;; Alist of (CHARSET . ENCODING-CHARSET) pairs.  Several of the
;; ENCODING-CHARSET symbols here (e.g. `jisx0201', `big5', `viscii')
;; are shared by more than one CHARSET.
(setq font-encoding-charset-alist
      '((latin-iso8859-1 . iso-8859-1)
	(latin-iso8859-2 . iso-8859-2)
	(latin-iso8859-3 . iso-8859-3)
	(latin-iso8859-4 . iso-8859-4)
	(latin-iso8859-9 . iso-8859-9)
	(latin-iso8859-10 . iso-8859-10)
	(latin-iso8859-13 . iso-8859-13)
	(latin-iso8859-14 . iso-8859-14)
	(latin-iso8859-15 . iso-8859-15)
	(latin-iso8859-16 . iso-8859-16)
	(cyrillic-iso8859-5 . iso-8859-5)
	(greek-iso8859-7 . iso-8859-7)
	(arabic-iso8859-6 . iso-8859-6)
	(thai-tis620 . tis620-2533)
	(latin-jisx0201 . jisx0201)
	(katakana-jisx0201 . jisx0201)
	(chinese-big5-1 . big5)
	(chinese-big5-2 . big5)
	(vietnamese-viscii-lower . viscii)
	(vietnamese-viscii-upper . viscii)
	(tibetan . unicode-bmp)))

;; Alist keyed by script symbol.  The cdr of each element is either a
;; list of character codes or (as for `symbol') a vector of them.
(setq script-representative-chars
      '((latin ?A ?Z ?a ?z #x00C0 #x0100 #x0180 #x1e00)
	(phonetic #x250 #x283)
	(greek #x3A9)
	(coptic #x3E2)
	(cyrillic #x42F)
	(armenian #x531)
	(hebrew #x5D0)
	(vai #xA500)
	(arabic #x628)
	(syriac #x710)
	(thaana #x78C)
	(devanagari #x915)
	(bengali #x995)
	(gurmukhi #xA15)
	(gujarati #xA95)
	(oriya #xB15)
	(tamil #xB95)
	(telugu #xC15)
	(kannada #xC95)
	(malayalam #xD15)
	(sinhala #xD95)
	(thai #xE17)
	(lao #xEA5)
	(tibetan #xF40)
	(burmese #x1000)
	(georgian #x10D3)
	(ethiopic #x1208)
	(cherokee #x13B6)
	(canadian-aboriginal #x14C0)
	(ogham #x168F)
	(runic #x16A0)
	(khmer #x1780)
	(mongolian #x1826)
	(symbol . [#x201C #x2200 #x2500])
	(braille #x2800)
	(ideographic-description #x2FF0)
	(cjk-misc #x300E)
	(kana #x304B)
	(bopomofo #x3105)
	(kanbun #x319D)
	(han #x5B57)
	(yi #xA288)
	(cham #xAA00)
	(tai-viet #xAA80)
	(hangul #xAC00)
	(linear-b #x10000)
	(aegean-number #x10100)
	(ancient-greek-number #x10140)
	(ancient-symbol #x10190)
	(phaistos-disc #x101D0)
	(lycian #x10280)
	(carian #x102A0)
	(old-italic #x10300)
	(ugaritic #x10380)
	(old-permic #x10350)
	(old-persian #x103A0)
	(deseret #x10400)
	(shavian #x10450)
	(osmanya #x10480)
	(osage #x104B0)
	(elbasan #x10500)
	(caucasian-albanian #x10530)
	(linear-a #x10600)
	(cypriot-syllabary #x10800)
	(palmyrene #x10860)
	(nabataean #x10880)
	(phoenician #x10900)
	(lydian #x10920)
	(kharoshthi #x10A00)
	(manichaean #x10AC0)
	(hanifi-rohingya #x10D00)
	(yezidi #x10E80)
	(old-sogdian #x10F00)
	(sogdian #x10F30)
	(chorasmian #x10FB0)
	(elymaic #x10FE0)
	(mahajani #x11150)
	(sinhala-archaic-number #x111E1)
	(khojki #x11200)
	(khudawadi #x112B0)
	(grantha #x11305)
	(newa #x11400)
	(tirhuta #x11481)
	(siddham #x11580)
	(modi #x11600)
	(takri #x11680)
	(dogra #x11800)
	(warang-citi #x118A1)
	(dives-akuru #x11900)
	(nandinagari #x119a0)
	(zanabazar-square #x11A00)
	(soyombo #x11A50)
	(pau-cin-hau #x11AC0)
	(bhaiksuki #x11C00)
	(marchen #x11C72)
	(masaram-gondi #x11D00)
	(gunjala-gondi #x11D60)
	(makasar #x11EE0)
	(cuneiform #x12000)
	(cuneiform-numbers-and-punctuation #x12400)
	(egyptian #x13000)
	(mro #x16A40)
	(bassa-vah #x16AD0)
	(pahawh-hmong #x16B11)
	(medefaidrin #x16E40)
	(tangut #x17000)
	(tangut-components #x18800)
	(khitan-small-script #x18B00)
	(nushu #x1B170)
	(duployan-shorthand #x1BC20)
	(byzantine-musical-symbol #x1D000)
	(musical-symbol #x1D100)
	(ancient-greek-musical-notation #x1D200)
	(tai-xuan-jing-symbol #x1D300)
	(counting-rod-numeral #x1D360)
	(nyiakeng-puachue-hmong #x1e100)
	(wancho #x1e2c0)
	(mende-kikakui #x1E810)
	(adlam #x1E900)
	(indic-siyaq-number #x1ec71)
	(ottoman-siyaq-number #x1ed01)
	(mahjong-tile #x1F000)
	(domino-tile #x1F030)))

(defvar otf-script-alist)

;; The below was synchronized with the latest Aug 16, 2018 version of
;; https://docs.microsoft.com/en-us/typography/opentype/spec/scripttags
;;
;; Each element is (OTF-TAG . SCRIPT).  OTF-TAG is a four-character
;; tag; tags shorter than four letters are padded with escaped
;; spaces (e.g. `lao\ ', `yi\ \ '), so the unescaped space that
;; follows them is significant: it is what ends the symbol name.
;; SCRIPT names are spelled with hyphens, matching the spelling used
;; in `script-representative-chars'.
(setq otf-script-alist
      '((adlm . adlam)
	(ahom . ahom)
	(hluw . anatolian)
	(arab . arabic)
	(armi . aramaic)
	(armn . armenian)
	(avst . avestan)
	(bali . balinese)
	(bamu . bamum)
	(bass . bassa-vah)
	(batk . batak)
	(bng2 . bengali)
	(beng . bengali)
	(bhks . bhaiksuki)
	(bopo . bopomofo)
	(brah . brahmi)
	(brai . braille)
	(bugi . buginese)
	(buhd . buhid)
	(byzm . byzantine-musical-symbol)
	(cans . canadian-aboriginal)
	(cari . carian)
	(aghb . caucasian-albanian)
	(cakm . chakma)
	(cham . cham)
	(cher . cherokee)
	(copt . coptic)
	(xsux . cuneiform)
	(cprt . cypriot-syllabary)
	(cyrl . cyrillic)
	(dsrt . deseret)
	(deva . devanagari)
	(dev2 . devanagari)
	(dogr . dogra)
	(dupl . duployan-shorthand)
	(egyp . egyptian)
	(elba . elbasan)
	(ethi . ethiopic)
	(geor . georgian)
	(glag . glagolitic)
	(goth . gothic)
	(gran . grantha)
	(grek . greek)
	(gujr . gujarati)
	(gjr2 . gujarati)
	(gong . gunjala-gondi)
	(guru . gurmukhi)
	(gur2 . gurmukhi)
	(hani . han)
	(hang . hangul)
	(jamo . hangul)
	(rohg . hanifi-rohingya)
	(hano . hanunoo)
	(hatr . hatran)
	(hebr . hebrew)
	(hung . old-hungarian)
	(phli . inscriptional-pahlavi)
	(prti . inscriptional-parthian)
	(java . javanese)
	(kthi . kaithi)
	(knda . kannada)
	(knd2 . kannada)
	(kana . kana)	; Hiragana
	(kali . kayah-li)
	(khar . kharoshthi)
	(khmr . khmer)
	(khoj . khojki)
	(sind . khudawadi)
	(lao\  . lao)
	(latn . latin)
	(lepc . lepcha)
	(limb . limbu)
	(lina . linear-a)
	(linb . linear-b)
	(lisu . lisu)
	(lyci . lycian)
	(lydi . lydian)
	(mahj . mahajani)
	(maka . makasar)
	(marc . marchen)
	(mlym . malayalam)
	(mlm2 . malayalam)
	(mand . mandaic)
	(mani . manichaean)
	(gonm . masaram-gondi)
	(math . mathematical)
	(medf . medefaidrin)
	(mtei . meetei-mayek)
	(mend . mende-kikakui)
	(merc . meroitic)
	(mero . meroitic)
	(plrd . miao)
	(modi . modi)
	(mong . mongolian)
	(mroo . mro)
	(mult . multani)
	(musc . musical-symbol)
	(mym2 . burmese)
	(mymr . burmese)
	(nbat . nabataean)
	(newa . newa)
	(nko\  . nko)
	(nshu . nushu)
	(ogam . ogham)
	(olck . ol-chiki)
	(ital . old-italic)
	(xpeo . old-persian)
	(narb . old-north-arabian)
	(perm . old-permic)
	(sogo . old-sogdian)
	(sarb . old-south-arabian)
	(orkh . old-turkic)
	(orya . oriya)
	(ory2 . oriya)
	(osge . osage)
	(osma . osmanya)
	(hmng . pahawh-hmong)
	(palm . palmyrene)
	(pauc . pau-cin-hau)
	(phag . phags-pa)
	;; `phli' and `prti' are already listed above under
	;; inscriptional-pahlavi / inscriptional-parthian.
	(phnx . phoenician)
	(phlp . psalter-pahlavi)
	(rjng . rejang)
	(runr . runic)
	(samr . samaritan)
	(saur . saurashtra)
	(shrd . sharada)
	(shaw . shavian)
	(sidd . siddham)
	(sgnw . sutton-sign-writing)
	(sinh . sinhala)
	(sogd . sogdian)
	(sora . sora-sompeng)
	(soyo . soyombo)
	(sund . sundanese)
	(sylo . syloti-nagri)
	(syrc . syriac)
	(tglg . tagalog)
	(tagb . tagbanwa)
	(tale . tai-le)
	(talu . tai-lue)
	(lana . tai-tham)
	(tavt . tai-viet)
	(takr . takri)
	(taml . tamil)
	(tml2 . tamil)
	(tang . tangut)
	(telu . telugu)
	(tel2 . telugu)
	(thaa . thaana)
	(thai . thai)
	(tibt . tibetan)
	(tfng . tifinagh)
	(tirh . tirhuta)
	(ugar . ugaritic)
	(vai\  . vai)
	(wara . warang-citi)
	(yi\ \  . yi)
	(zanb . zanabazar-square)))

;; Set standard fontname specification of characters in the default
;; fontset to find an appropriate font for each script/charset.  The
;; specification has the form ((SCRIPT FONT-SPEC ...) ...), where
;; FONT-SPEC is:
;;	a cons (FAMILY . REGISTRY),
;;	or a string FONT-NAME,
;;	or an object created by `font-spec'.
;;
;; FAMILY may be nil, in which case, the corresponding name of
;; default face is used.  If REGISTRY contains a character `-', the
;; string before that is embedded in `CHARSET_REGISTRY' field, and the
;; string after that is embedded in `CHARSET_ENCODING' field.  If it
;; does not contain `-', the whole string is embedded in
;; `CHARSET_REGISTRY' field, and a wild card character `*' is embedded
;; in `CHARSET_ENCODING' field.
;;
;; SCRIPT is a symbol that appears as an element of the char table
;; `char-script-table'.  SCRIPT may be a charset specifying the range
;; of characters.

(declare-function new-fontset "fontset.c" (name fontlist))
(declare-function set-fontset-font "fontset.c"
		  (name target font-spec &optional frame add))

(eval-when-compile

;; Build data to initialize the default fontset at compile time to
;; avoid loading charsets that won't be necessary at runtime.

;; The value is (CJK-REGISTRY-VECTOR TARGET-SPEC ...), where
;; CJK-REGISTRY-VECTOR is ["JISX0208.1983-0" "GB2312.1980-0" ...],
;; TARGET-SPEC is (TARGET . BITMASK) or (TARGET SPEC ...),
;; TARGET is CHAR or (FROM-CHAR . TO-CHAR),
;; BITMASK is a bitmask of indices to CJK-REGISTRY-VECTOR,
;; SPEC is a list of arguments to font-spec.

(defmacro build-default-fontset-data ()
  "Expand to a quoted list (CJK-REGISTRY-VECTOR TARGET-SPEC ...).
The list is computed while the macro is expanded.  Its first
element is a vector of the CJK registry names; it is followed by
one (TARGET . BITMASK) entry per range recorded in a scratch
char-table for the CJK charsets, and then by one (TARGET SPEC ...)
entry per `char-script-table' range belonging to the scripts
`tibetan', `ethiopic' and `phonetic'."
  (let* (;; CHARSET-REGISTRY CHARSET FROM-CODE TO-CODE
	 (cjk '(("JISX0208.1983-0" japanese-jisx0208 #x2121 #x287E)
		("GB2312.1980-0" chinese-gb2312 #x2121 #x297E)
		("BIG5-0" big5 #xA140 #xA3FE)
		("CNS11643.1992-1" chinese-cns11643-1 #x2121 #x427E)
		("KSC5601.1987-0" korean-ksc5601 #x2121 #x2C7E)))
	 (scripts '((tibetan
		     (:registry "iso10646-1" :otf (tibt nil (ccmp blws abvs)))
		     (:family "mtib" :registry "iso10646-1")
		     (:registry "muletibetan-2"))
		    (ethiopic
		     (:registry "iso10646-1" :script ethiopic)
		     (:registry "ethiopic-unicode"))
		    (phonetic
		     (:registry "iso10646-1" :script phonetic)
		     (:registry "MuleIPA-1")
		     (:registry "iso10646-1"))))
	 ;; Maps a character to the OR of the bits of every CJK charset
	 ;; (by index into `cjk') whose scanned code range contains it.
	 (cjk-table (make-char-table nil))
	 ;; Return the ranges of `char-script-table' whose value is
	 ;; SCRIPT, in reverse order of traversal.
	 (script-coverage
	  #'(lambda (script)
	      (let ((coverage))
		(map-char-table
		 #'(lambda (range val)
		     (when (eq val script)
		       ;; Store a fresh cons rather than the RANGE
		       ;; object handed to the callback.
		       (if (consp range)
			   (setq range (cons (car range) (cdr range))))
		       (push range coverage)))
		 char-script-table)
		coverage)))
	 (data (list (vconcat (mapcar #'car cjk))))
	 (i 0))
    ;; Pass 1: for every CJK charset, set its bit on each character in
    ;; the given code range, except characters whose script is
    ;; kana, hangul, han or cjk-misc.
    (dolist (elt cjk)
      (let ((mask (ash 1 i)))
	(map-charset-chars
	 #'(lambda (range _arg)
	     (let ((from (car range)) (to (cdr range)))
	       ;; Ranges whose end is #x110000 or above are skipped.
	       (if (< to #x110000)
		   (while (<= from to)
		     (or (memq (aref char-script-table from)
			       '(kana hangul han cjk-misc))
			 (aset cjk-table from
			       (logior (or (aref cjk-table from) 0) mask)))
		     (setq from (1+ from))))))
	 (nth 1 elt) nil (nth 2 elt) (nth 3 elt)))
      (setq i (1+ i)))
    ;; Pass 2: flatten the char-table into (TARGET . BITMASK) entries.
    (map-char-table
     #'(lambda (range val)
	 (if (consp range)
	     (setq range (cons (car range) (cdr range))))
	 (push (cons range val) data))
     cjk-table)
    ;; Pass 3: append (TARGET SPEC ...) entries for the listed scripts.
    (dolist (script scripts)
      (dolist (range (funcall script-coverage (car script)))
	(push (cons range (cdr script)) data)))
    ;; DATA was built by pushing, so reverse it to put the registry
    ;; vector first.
    `(quote ,(nreverse data))))
)

(defun setup-default-fontset ()
|
||
"Setup the default fontset."
|
||
(new-fontset
|
||
"fontset-default"
|
||
`(;; for each script
|
||
(latin (nil . "ISO8859-1")
|
||
(nil . "ISO8859-2")
|
||
(nil . "ISO8859-3")
|
||
(nil . "ISO8859-4")
|
||
(nil . "ISO8859-9")
|
||
(nil . "ISO8859-10")
|
||
(nil . "ISO8859-13")
|
||
(nil . "ISO8859-14")
|
||
(nil . "ISO8859-15")
|
||
(nil . "ISO8859-16")
|
||
(nil . "VISCII1.1-1")
|
||
,(font-spec :registry "iso10646-1" :script 'latin))
|
||
|
||
(thai ,(font-spec :registry "iso10646-1" :otf '(thai nil nil (mark)))
|
||
,(font-spec :registry "iso10646-1" :script 'thai)
|
||
(nil . "TIS620*")
|
||
(nil . "ISO8859-11"))
|
||
|
||
(devanagari ,(font-spec :registry "iso10646-1" :otf '(dev2 nil (rphf)))
|
||
,(font-spec :registry "iso10646-1" :otf '(deva nil (rphf)))
|
||
(nil . "iso10646.indian-1"))
|
||
(bengali ,(font-spec :registry "iso10646-1" :otf '(bng2 nil (rphf)))
|
||
,(font-spec :registry "iso10646-1" :otf '(beng nil (rphf))))
|
||
(gurmukhi ,(font-spec :registry "iso10646-1" :otf '(gur2 nil (blwf)))
|
||
,(font-spec :registry "iso10646-1" :otf '(guru nil (blwf))))
|
||
(gujarati ,(font-spec :registry "iso10646-1" :otf '(gjr2 nil (rphf)))
|
||
,(font-spec :registry "iso10646-1" :otf '(gujr nil (rphf))))
|
||
(oriya ,(font-spec :registry "iso10646-1" :otf '(ory2 nil (rphf)))
|
||
,(font-spec :registry "iso10646-1" :otf '(orya nil (rphf))))
|
||
(tamil ,(font-spec :registry "iso10646-1" :otf '(tml2 nil (akhn)))
|
||
,(font-spec :registry "iso10646-1" :otf '(taml nil (akhn))))
|
||
(telugu ,(font-spec :registry "iso10646-1" :otf '(tel2 nil (blwf)))
|
||
,(font-spec :registry "iso10646-1" :otf '(telu nil (blwf))))
|
||
(kannada ,(font-spec :registry "iso10646-1" :otf '(knd2 nil (rphf)))
|
||
,(font-spec :registry "iso10646-1" :otf '(knda nil (rphf))))
|
||
(sinhala ,(font-spec :registry "iso10646-1" :otf '(sinh nil (akhn))))
|
||
(malayalam ,(font-spec :registry "iso10646-1" :otf '(mlm2 nil (akhn)))
|
||
,(font-spec :registry "iso10646-1" :otf '(mlym nil (akhn))))
|
||
|
||
(burmese ,(font-spec :registry "iso10646-1" :otf '(mym2 nil nil))
|
||
,(font-spec :registry "iso10646-1" :otf '(mymr nil nil))
|
||
,(font-spec :registry "iso10646-1" :script 'burmese))
|
||
|
||
(lao ,(font-spec :registry "iso10646-1" :otf '(lao\ nil nil (mark)))
|
||
,(font-spec :registry "iso10646-1" :script 'lao)
|
||
(nil . "MuleLao-1"))
|
||
|
||
(tai-viet ("TaiViet" . "iso10646-1"))
|
||
|
||
(greek ,(font-spec :registry "iso10646-1" :script 'greek)
|
||
(nil . "ISO8859-7"))
|
||
|
||
(cyrillic ,(font-spec :registry "iso10646-1" :script 'cyrillic)
|
||
(nil . "ISO8859-5")
|
||
(nil . "microsoft-cp1251")
|
||
(nil . "koi8-r"))
|
||
|
||
(arabic ,(font-spec :registry "iso10646-1"
|
||
:otf '(arab nil (init medi fina liga)))
|
||
(nil . "MuleArabic-0")
|
||
(nil . "MuleArabic-1")
|
||
(nil . "MuleArabic-2")
|
||
(nil . "ISO8859-6"))
|
||
|
||
(hebrew ,(font-spec :registry "iso10646-1" :script 'hebrew)
|
||
(nil . "ISO8859-8"))
|
||
|
||
(khmer ,(font-spec :registry "iso10646-1" :otf '(khmr nil (pres))))
|
||
|
||
(kana (nil . "JISX0208*")
|
||
(nil . "GB2312.1980-0")
|
||
(nil . "KSC5601.1987*")
|
||
(nil . "JISX0201*")
|
||
(nil . "JISX0213.2000-1")
|
||
(nil . "JISX0213.2004-1")
|
||
,(font-spec :registry "iso10646-1" :script 'kana))
|
||
|
||
(bopomofo ,(font-spec :registry "iso10646-1" :script 'bopomofo)
|
||
(nil . "sisheng_cwnn-0"))
|
||
|
||
(han (nil . "GB2312.1980-0")
|
||
(nil . "JISX0208*")
|
||
(nil . "JISX0212*")
|
||
(nil . "big5*")
|
||
(nil . "KSC5601.1987*")
|
||
(nil . "CNS11643.1992-1")
|
||
(nil . "CNS11643.1992-2")
|
||
(nil . "CNS11643.1992-3")
|
||
(nil . "CNS11643.1992-4")
|
||
(nil . "CNS11643.1992-5")
|
||
(nil . "CNS11643.1992-6")
|
||
(nil . "CNS11643.1992-7")
|
||
(nil . "gbk-0")
|
||
(nil . "gb18030")
|
||
(nil . "JISX0213.2000-1")
|
||
(nil . "JISX0213.2000-2")
|
||
(nil . "JISX0213.2004-1")
|
||
,(font-spec :registry "iso10646-1" :lang 'ja)
|
||
,(font-spec :registry "iso10646-1" :lang 'zh))
|
||
|
||
(cjk-misc (nil . "GB2312.1980-0")
|
||
(nil . "JISX0208*")
|
||
(nil . "JISX0212*")
|
||
(nil . "big5*")
|
||
(nil . "KSC5601.1987*")
|
||
(nil . "CNS11643.1992-1")
|
||
(nil . "CNS11643.1992-2")
|
||
(nil . "CNS11643.1992-3")
|
||
(nil . "CNS11643.1992-4")
|
||
(nil . "CNS11643.1992-5")
|
||
(nil . "CNS11643.1992-6")
|
||
(nil . "CNS11643.1992-7")
|
||
(nil . "gbk-0")
|
||
(nil . "gb18030")
|
||
(nil . "JISX0213.2000-1")
|
||
(nil . "JISX0213.2000-2")
|
||
,(font-spec :registry "iso10646-1" :lang 'ja)
|
||
,(font-spec :registry "iso10646-1" :lang 'zh))
|
||
|
||
(hangul (nil . "KSC5601.1987-0")
|
||
,(font-spec :registry "iso10646-1" :lang 'ko))
|
||
|
||
;; for each charset
|
||
(ascii (nil . "ISO8859-1"))
|
||
(arabic-digit ("*" . "MuleArabic-0"))
|
||
(arabic-1-column ("*" . "MuleArabic-1"))
|
||
(arabic-2-column ("*" . "MuleArabic-2"))
|
||
(indian-is13194 (nil . "is13194-devanagari"))
|
||
(indian-1-column ("*" . "muleindian-2"))
|
||
;; Indian CDAC
|
||
(devanagari-cdac (nil . "Devanagari-CDAC"))
|
||
(sanskrit-cdac (nil . "Sanskrit-CDAC"))
|
||
(bengali-cdac (nil . "Bengali-CDAC"))
|
||
(assamese-cdac (nil . "Assamese-CDAC"))
|
||
(punjabi-cdac (nil . "Punjabi-CDAC"))
|
||
(gujarati-cdac (nil . "Gujarati-CDAC"))
|
||
(oriya-cdac (nil . "Oriya-CDAC"))
|
||
(tamil-cdac (nil . "Tamil-CDAC"))
|
||
(telugu-cdac (nil . "Telugu-CDAC"))
|
||
(kannada-cdac (nil . "Kannada-CDAC"))
|
||
(malayalam-cdac (nil . "Malayalam-CDAC"))
|
||
;; Indian AKRUTI
|
||
(devanagari-akruti (nil . "Devanagari-Akruti"))
|
||
(bengali-akruti (nil . "Bengali-Akruti"))
|
||
(punjabi-akruti (nil . "Punjabi-Akruti"))
|
||
(gujarati-akruti (nil . "Gujarati-Akruti"))
|
||
(oriya-akruti (nil . "Oriya-Akruti"))
|
||
(tamil-akruti (nil . "Tamil-Akruti"))
|
||
(telugu-akruti (nil . "Telugu-Akruti"))
|
||
(kannada-akruti (nil . "Kannada-Akruti"))
|
||
(malayalam-akruti (nil . "Malayalam-Akruti"))
|
||
|
||
;; Fallback fonts
|
||
(nil (nil . "gb2312.1980")
|
||
(nil . "gbk-0")
|
||
(nil . "gb18030")
|
||
(nil . "jisx0208")
|
||
(nil . "ksc5601.1987")
|
||
(nil . "CNS11643.1992-1")
|
||
(nil . "CNS11643.1992-2")
|
||
(nil . "CNS11643.1992-3")
|
||
(nil . "CNS11643.1992-4")
|
||
(nil . "CNS11643.1992-5")
|
||
(nil . "CNS11643.1992-6")
|
||
(nil . "CNS11643.1992-7")
|
||
(nil . "big5")
|
||
(nil . "jisx0213.2000-1")
|
||
(nil . "jisx0213.2004-1")
|
||
(nil . "jisx0212"))
|
||
))
|
||
|
||
;; For simple scripts
|
||
(dolist (script '(phonetic
|
||
armenian
|
||
thaana
|
||
syriac
|
||
georgian
|
||
cherokee
|
||
canadian-aboriginal
|
||
ogham
|
||
runic
|
||
symbol
|
||
braille
|
||
yi
|
||
tai-viet
|
||
aegean-number
|
||
ancient-greek-number
|
||
ancient-symbol
|
||
phaistos-disc
|
||
lycian
|
||
carian
|
||
old-italic
|
||
ugaritic
|
||
old-persian
|
||
deseret
|
||
shavian
|
||
osmanya
|
||
osage
|
||
cypriot-syllabary
|
||
phoenician
|
||
lydian
|
||
yezidi
|
||
kharoshthi
|
||
manichaean
|
||
chorasmian
|
||
elymaic
|
||
makasar
|
||
dives-akuru
|
||
cuneiform-numbers-and-punctuation
|
||
cuneiform
|
||
egyptian
|
||
bassa-vah
|
||
pahawh-hmong
|
||
medefaidrin
|
||
byzantine-musical-symbol
|
||
musical-symbol
|
||
ancient-greek-musical-notation
|
||
tai-xuan-jing-symbol
|
||
counting-rod-numeral
|
||
adlam
|
||
mahjong-tile
|
||
domino-tile))
|
||
(set-fontset-font "fontset-default"
|
||
script (font-spec :registry "iso10646-1" :script script)
|
||
nil 'append))
|
||
|
||
;; Special settings for `MATHEMATICAL (U+1D400..U+1D7FF)'.
|
||
(dolist (math-subgroup '((#x1D400 #x1D433 mathematical-bold)
|
||
(#x1D434 #x1D467 mathematical-italic)
|
||
(#x1D468 #x1D49B mathematical-bold-italic)
|
||
(#x1D49C #x1D4CF mathematical-script)
|
||
(#x1D4D0 #x1D503 mathematical-bold-script)
|
||
(#x1D504 #x1D537 mathematical-fraktur)
|
||
(#x1D538 #x1D56B mathematical-double-struck)
|
||
(#x1D56C #x1D59F mathematical-bold-fraktur)
|
||
(#x1D5A0 #x1D5D3 mathematical-sans-serif)
|
||
(#x1D5D4 #x1D607 mathematical-sans-serif-bold)
|
||
(#x1D608 #x1D63B mathematical-sans-serif-italic)
|
||
(#x1D63C #x1D66F mathematical-sans-serif-bold-italic)
|
||
(#x1D670 #x1D6A3 mathematical-monospace)
|
||
(#x1D6A4 #x1D6A5 mathematical-italic)
|
||
(#x1D6A8 #x1D6E1 mathematical-bold)
|
||
(#x1D6E2 #x1D71B mathematical-italic)
|
||
(#x1D71C #x1D755 mathematical-bold-italic)
|
||
(#x1D756 #x1D78F mathematical-sans-serif-bold)
|
||
(#x1D790 #x1D7C9 mathematical-sans-serif-bold-italic)
|
||
(#x1D7CA #x1D7D7 mathematical-bold)
|
||
(#x1D7D8 #x1D7E1 mathematical-double-struck)
|
||
(#x1D7E2 #x1D7EB mathematical-sans-serif)
|
||
(#x1D7EC #x1D7F5 mathematical-sans-serif-bold)
|
||
(#x1D7F6 #x1D7FF mathematical-monospace)))
|
||
(let ((slot (assq (nth 2 math-subgroup) script-representative-chars)))
|
||
(if slot
|
||
(if (vectorp (cdr slot))
|
||
(setcdr slot (vconcat (cdr slot) (vector (car math-subgroup))))
|
||
(setcdr slot (vector (cadr slot) (car math-subgroup))))
|
||
(setq slot (list (nth 2 math-subgroup) (car math-subgroup)))
|
||
(nconc script-representative-chars (list slot))))
|
||
(set-fontset-font
|
||
"fontset-default"
|
||
(cons (car math-subgroup) (nth 1 math-subgroup))
|
||
(font-spec :registry "iso10646-1" :script (nth 2 math-subgroup))))
|
||
|
||
;; Special setup for various symbols and punctuation characters
|
||
;; covered well by Symbola, excluding those covered well by popular
|
||
;; Unicode fonts. We exclude the latter because users don't like us
|
||
;; invading on their font setups where they have good support from
|
||
;; other fonts.
|
||
(dolist (symbol-subgroup
|
||
'((#x2000 . #x2012) ;; General Punctuation
|
||
(#x2015 . #x2017)
|
||
#x201F
|
||
(#x2023 . #x202F)
|
||
(#x2031 . #x2038)
|
||
(#x203B . #x206F)
|
||
(#x2070 . #x209F) ;; Superscripts and Subscripts
|
||
(#x20B6 . #x20CF) ;; Currency Symbols
|
||
(#x2100 . #x2121) ;; Letterlike Symbols
|
||
(#x2123 . #x214F)
|
||
(#x2150 . #x215A) ;; Number Forms
|
||
(#x215F . #x218F)
|
||
(#x2194 . #x21FF) ;; Arrows
|
||
(#x2200 . #x2211) ;; Mathematical Operators
|
||
(#x2213 . #x2247)
|
||
(#x2249 . #x225F)
|
||
(#x2261 . #x2263)
|
||
(#x2266 . #x22FF)
|
||
(#x2300 . #x2301) ;; Miscellaneous Technical
|
||
(#x2303 . #x230F)
|
||
(#x2311 . #x231F)
|
||
(#x2322 . #x23FF)
|
||
(#x2400 . #x243F) ;; Control Pictures
|
||
(#x2440 . #x245F) ;; Optical Char Recognition
|
||
(#x2460 . #x24FF) ;; Enclosed Alphanumerics
|
||
(#x25A0 . #x25FF) ;; Geometric Shapes
|
||
(#x2600 . #x265F) ;; Miscellaneous Symbols
|
||
(#x2661 . #x2662)
|
||
#x2664
|
||
(#x2667 . #x2669)
|
||
(#x266C . #x26FF)
|
||
(#x2700 . #x27bF) ;; Dingbats
|
||
(#x27C0 . #x27EF) ;; Misc Mathematical Symbols-A
|
||
(#x27F0 . #x27FF) ;; Supplemental Arrows-A
|
||
(#x2900 . #x297F) ;; Supplemental Arrows-B
|
||
(#x2980 . #x29FF) ;; Misc Mathematical Symbols-B
|
||
(#x2A00 . #x2AFF) ;; Suppl. Math Operators
|
||
(#x2B00 . #x2BFF) ;; Misc Symbols and Arrows
|
||
(#x2E00 . #x2E7F) ;; Supplemental Punctuation
|
||
(#x4DC0 . #x4DFF) ;; Yijing Hexagram Symbols
|
||
(#xFE10 . #xFE1F) ;; Vertical Forms
|
||
(#x10100 . #x1013F) ;; Aegean Numbers
|
||
(#x10190 . #x101CF) ;; Ancient Symbols
|
||
(#x101D0 . #x101FF) ;; Phaistos Disc
|
||
(#x102E0 . #x102FF) ;; Coptic Epact Numbers
|
||
(#x1D000 . #x1D0FF) ;; Byzantine Musical Symbols
|
||
(#x1D200 . #x1D24F) ;; Ancient Greek Musical Notation
|
||
(#x1D2E0 . #x1D2FF) ;; Mayan Numerals
|
||
(#x1D300 . #x1D35F) ;; Tai Xuan Jing Symbols
|
||
(#x1D360 . #x1D37F) ;; Counting Rod Numerals
|
||
(#x1F000 . #x1F02F) ;; Mahjong Tiles
|
||
(#x1F030 . #x1F09F) ;; Domino Tiles
|
||
(#x1F0A0 . #x1F0FF) ;; Playing Cards
|
||
(#x1F100 . #x1F1FF) ;; Enclosed Alphanumeric Suppl
|
||
(#x1F300 . #x1F5FF) ;; Misc Symbols and Pictographs
|
||
(#x1F600 . #x1F64F) ;; Emoticons
|
||
(#x1F650 . #x1F67F) ;; Ornamental Dingbats
|
||
(#x1F680 . #x1F6FF) ;; Transport and Map Symbols
|
||
(#x1F700 . #x1F77F) ;; Alchemical Symbols
|
||
(#x1F780 . #x1F7FF) ;; Geometric Shapes Extended
|
||
(#x1F800 . #x1F8FF) ;; Supplemental Arrows-C
|
||
(#x1F900 . #x1F9FF) ;; Supplemental Symbols and Pictographs
|
||
(#x1FA00 . #x1FA6F))) ;; Chess Symbols
|
||
(set-fontset-font "fontset-default" symbol-subgroup
|
||
'("Symbola" . "iso10646-1") nil 'prepend))
|
||
;; Box Drawing and Block Elements
|
||
(set-fontset-font "fontset-default" '(#x2500 . #x259F)
|
||
'("FreeMono" . "iso10646-1") nil 'prepend)
|
||
|
||
;; Since standard-fontset-spec on X uses fixed-medium font, which
|
||
;; gets mapped to an iso8859-1 variant, we would like to prefer its
|
||
;; iso10646-1 variant for symbols, where the coverage is known to be
|
||
;; good.
|
||
(dolist (symbol-subgroup
|
||
'((#x2000 . #x206F) ;; General Punctuation
|
||
(#x2070 . #x209F) ;; Superscripts and Subscripts
|
||
(#x20A0 . #x20CF) ;; Currency Symbols
|
||
(#x2150 . #x218F) ;; Number Forms
|
||
(#x2190 . #x21FF) ;; Arrows
|
||
(#x2200 . #x22FF) ;; Mathematical Operators
|
||
(#x2300 . #x23FF) ;; Miscellaneous Technical
|
||
(#x2400 . #x243F) ;; Control Pictures
|
||
(#x2440 . #x245F) ;; Optical Char Recognition
|
||
(#x2460 . #x24FF) ;; Enclosed Alphanumerics
|
||
(#x2500 . #x257F) ;; Box Drawing
|
||
(#x2580 . #x259F) ;; Block Elements
|
||
(#x25A0 . #x25FF) ;; Geometric Shapes
|
||
(#x2600 . #x2689) ;; Miscellaneous Symbols
|
||
(#x2700 . #x27bF) ;; Dingbats
|
||
(#x27F5 . #x27FF))) ;; Supplemental Arrows-A
|
||
(set-fontset-font "fontset-default" symbol-subgroup
|
||
"-*-fixed-medium-*-*-*-*-*-*-*-*-*-iso10646-1"
|
||
nil 'prepend))
|
||
|
||
;; Append CJK fonts for characters other than han, kana, cjk-misc.
|
||
;; Append fonts for scripts whose name is also a charset name.
|
||
(let* ((data (build-default-fontset-data))
|
||
(registries (car data)))
|
||
(dolist (target-spec (cdr data))
|
||
(let ((target (car target-spec))
|
||
(spec (cdr target-spec)))
|
||
(if (integerp spec)
|
||
(dotimes (i (length registries))
|
||
(if (> (logand spec (ash 1 i)) 0)
|
||
(set-fontset-font "fontset-default" target
|
||
(cons nil (aref registries i))
|
||
nil 'append)))
|
||
(dolist (args spec)
|
||
(set-fontset-font "fontset-default" target
|
||
(apply 'font-spec args) nil 'append))))))
|
||
|
||
;; Append Unicode fonts.
|
||
;; This may find fonts with more variants (bold, italic) but which
|
||
;; don't cover many characters.
|
||
(set-fontset-font "fontset-default" nil
|
||
'(nil . "iso10646-1") nil 'prepend)
|
||
;; These may find fonts that cover many characters but with fewer
|
||
;; variants.
|
||
(set-fontset-font "fontset-default" nil
|
||
'("gnu-unifont" . "iso10646-1") nil 'prepend)
|
||
(set-fontset-font "fontset-default" nil
|
||
'("mutt-clearlyu" . "iso10646-1") nil 'prepend)
|
||
(set-fontset-font "fontset-default" '(#x20000 . #x2FFFF)
|
||
'(nil . "unicode-sip"))
|
||
|
||
(set-fontset-font "fontset-default" '(#xE000 . #xF8FF)
|
||
'(nil . "iso10646-1"))
|
||
;; Don't try the fallback fonts even if no suitable font was found
|
||
;; by the above font-spec.
|
||
(set-fontset-font "fontset-default" '(#xE000 . #xF8FF) nil nil 'append))
|
||
|
||
(defun create-default-fontset ()
  "Build the default fontset by calling `setup-default-fontset'.
An error signaled while doing so is not propagated; it is reported
with `display-warning' at the `:error' level instead.
Internal use only.  Should be called at startup time."
  (condition-case failure
      (setup-default-fontset)
    (error
     (let ((text (format "Creation of the default fontsets failed: %s"
                         failure)))
       (display-warning 'initialization text :error)))))
|
||
|
||
;; These are the registered registries/encodings from
|
||
;; ftp://ftp.x.org/pub/DOCS/registry 2001/06/01
|
||
|
||
;; Name Reference
|
||
;; ---- ---------
|
||
;; "DEC" [27]
|
||
;; registry prefix
|
||
;; "DEC.CNS11643.1986-2" [53]
|
||
;; CNS11643 2-plane using the encoding
|
||
;; suggested in that standard
|
||
;; "DEC.DTSCS.1990-2" [54]
|
||
;; DEC Taiwan Supplemental Character Set
|
||
;; "fujitsu.u90x01.1991-0" [87]
|
||
;; "fujitsu.u90x03.1991-0" [87]
|
||
;; "GB2312.1980-0" [39],[12]
|
||
;; China (PRC) Hanzi, GL encoding
|
||
;; "GB2312.1980-1" [39]
|
||
;; (deprecated)
|
||
;; China (PRC) Hanzi, GR encoding
|
||
;; "HP-Arabic8" [36]
|
||
;; HPARABIC8 8-bit character set
|
||
;; "HP-East8" [36]
|
||
;; HPEAST8 8-bit character set
|
||
;; "HP-Greek8" [36]
|
||
;; HPGREEK8 8-bit character set
|
||
;; "HP-Hebrew8" [36]
|
||
;; HPHEBREW8 8-bit character set
|
||
;; "HP-Japanese15" [36]
|
||
;; HPJAPAN15 15-bit character set,
|
||
;; modified from industry de facto
|
||
;; standard Shift-JIS
|
||
;; "HP-Kana8" [36]
|
||
;; HPKANA8 8-bit character set
|
||
;; "HP-Korean15" [36]
|
||
;; HPKOREAN15 15-bit character set
|
||
;; "HP-Roman8" [36]
|
||
;; HPROMAN8 8-bit character set
|
||
;; "HP-SChinese15" [36]
|
||
;; HPSCHINA15 15-bit character set for
|
||
;; support of Simplified Chinese
|
||
;; "HP-TChinese15" [36]
|
||
;; HPTCHINA15 15-bit character set for
|
||
;; support of Traditional Chinese
|
||
;; "HP-Turkish8" [36]
|
||
;; HPTURKISH8 8-bit character set
|
||
;; "IPSYS" [59]
|
||
;; registry prefix
|
||
;; "IPSYS.IE-1" [59]
|
||
;; "ISO2022"<REG>"-"<ENC> [44]
|
||
;; "ISO646.1991-IRV" [107]
|
||
;; ISO 646 International Reference Version
|
||
;; "ISO8859-1" [15],[12]
|
||
;; ISO Latin alphabet No. 1
|
||
;; "ISO8859-2" [15],[12]
|
||
;; ISO Latin alphabet No. 2
|
||
;; "ISO8859-3" [15],[12]
|
||
;; ISO Latin alphabet No. 3
|
||
;; "ISO8859-4" [15],[12]
|
||
;; ISO Latin alphabet No. 4
|
||
;; "ISO8859-5" [15],[12]
|
||
;; ISO Latin/Cyrillic alphabet
|
||
;; "ISO8859-6" [15],[12]
|
||
;; ISO Latin/Arabic alphabet
|
||
;; "ISO8859-7" [15],[12]
|
||
;; ISO Latin/Greek alphabet
|
||
;; "ISO8859-8" [15],[12]
|
||
;; ISO Latin/Hebrew alphabet
|
||
;; "ISO8859-9" [15],[12]
|
||
;; ISO Latin alphabet No. 5
|
||
;; "ISO8859-10" [15],[12]
|
||
;; ISO Latin alphabet No. 6
|
||
;; "ISO8859-13" [15],[12]
|
||
;; ISO Latin alphabet No. 7
|
||
;; "ISO8859-14" [15],[12]
|
||
;; ISO Latin alphabet No. 8
|
||
;; "ISO8859-15" [15],[12]
|
||
;; ISO Latin alphabet No. 9
|
||
;; "FCD8859-15" [7]
|
||
;; (deprecated)
|
||
;; ISO Latin alphabet No. 9, Final Committee Draft
|
||
;; "ISO10646-1" [133]
|
||
;; Unicode Universal Multiple-Octet Coded Character Set
|
||
;; "ISO10646-MES" [133]
|
||
;; (deprecated)
|
||
;; Unicode Minimum European Subset
|
||
;; "JISX0201.1976-0" [38],[12]
|
||
;; 8-Bit Alphanumeric-Katakana Code
|
||
;; "JISX0208.1983-0" [40],[12]
|
||
;; Japanese Graphic Character Set,
|
||
;; GL encoding
|
||
;; "JISX0208.1990-0" [71]
|
||
;; Japanese Graphic Character Set,
|
||
;; GL encoding
|
||
;; "JISX0208.1983-1" [40]
|
||
;; (deprecated)
|
||
;; Japanese Graphic Character Set,
|
||
;; GR encoding
|
||
;; "JISX0212.1990-0" [72]
|
||
;; Supplementary Japanese Graphic Character Set,
|
||
;; GL encoding
|
||
;; "KOI8-R" [119]
|
||
;; Cyrillic alphabet
|
||
;; "KSC5601.1987-0" [41],[12]
|
||
;; Korean Graphic Character Set,
|
||
;; GL encoding
|
||
;; "KSC5601.1987-1" [41]
|
||
;; (deprecated)
|
||
;; Korean Graphic Character Set,
|
||
;; GR encoding
|
||
;; "omron_CNS11643-0" [45]
|
||
;; "omron_CNS11643-1" [45]
|
||
;; "omron_BIG5-0" [45]
|
||
;; "omron_BIG5-1" [45]
|
||
;; "wn.tamil.1993" [103]
|
||
|
||
(defun set-font-encoding (pattern charset)
  "Record CHARSET for PATTERN in `font-encoding-alist' (which see).
If the alist already has an entry whose key is `equal' to PATTERN,
that entry's value is replaced by CHARSET.  Otherwise a new
\(PATTERN . CHARSET) entry is added at the front of the alist."
  (let ((entry (assoc pattern font-encoding-alist)))
    (cond (entry
           (setcdr entry charset))
          (t
           (push (cons pattern charset) font-encoding-alist)))))
|
||
|
||
;; Forward declarations only; these forms assign no value.
(defvar x-pixel-size-width-font-regexp)
(defvar vertical-centering-font-regexp)

(setq
 ;; Setting for suppressing XLoadQueryFont on big fonts.
 x-pixel-size-width-font-regexp
 (purecopy "gb2312\\|gbk\\|gb18030\\|jisx0208\\|ksc5601\\|cns11643\\|big5")
 ;; These fonts require vertical centering.
 vertical-centering-font-regexp
 (purecopy "gb2312\\|gbk\\|gb18030\\|jisx0208\\|jisx0212\\|ksc5601\\|cns11643\\|big5"))

;; Record the value just assigned as the variable's `standard-value'.
(put 'vertical-centering-font-regexp
     'standard-value
     (list vertical-centering-font-regexp))
|
||
|
||
;; CDAC fonts are actually smaller than their design sizes, so fonts
;; whose name ends in "-cdac" get a rescale factor of 1.3.
(setq face-font-rescale-alist
      `((,(purecopy "-cdac$") . 1.3)))
|
||
|
||
(defvar x-font-name-charset-alist nil
  "Variable that no longer has any meaning.
It is kept only for backward compatibility.")
|
||
|
||
;;; XLFD (X Logical Font Description) format handler.
|
||
|
||
;; Define XLFD's field index numbers.  Each value is the 0-based
;; position of the field in the 12-element vector returned by
;; `x-decompose-font-name'; adding 1 gives the number of the matching
;; subexpression of `xlfd-tight-regexp'.  Every index must be distinct.
                                        ; field name
(defconst xlfd-regexp-family-subnum 0)  ; FOUNDRY and FAMILY
(defconst xlfd-regexp-weight-subnum 1)  ; WEIGHT_NAME
(defconst xlfd-regexp-slant-subnum 2)   ; SLANT
(defconst xlfd-regexp-swidth-subnum 3)  ; SETWIDTH_NAME
(defconst xlfd-regexp-adstyle-subnum 4) ; ADD_STYLE_NAME
(defconst xlfd-regexp-pixelsize-subnum 5) ; PIXEL_SIZE
(defconst xlfd-regexp-pointsize-subnum 6) ; POINT_SIZE
(defconst xlfd-regexp-resx-subnum 7)    ; RESOLUTION_X
(defconst xlfd-regexp-resy-subnum 8)    ; RESOLUTION_Y
;; SPACING follows RESOLUTION_Y, so it is field 9 (not 8, which would
;; alias RESOLUTION_Y).
(defconst xlfd-regexp-spacing-subnum 9) ; SPACING
(defconst xlfd-regexp-avgwidth-subnum 10) ; AVERAGE_WIDTH
(defconst xlfd-regexp-registry-subnum 11) ; REGISTRY and ENCODING
|
||
|
||
;; Regular expression matching a font name that conforms to XLFD
;; (X Logical Font Description).  No XLFD field may be omitted (though
;; any field may be a wild card) for the name to match.  The regexp has
;; 12 groups: FOUNDRY-FAMILY, ten single fields, REGISTRY-ENCODING.
(defconst xlfd-tight-regexp
  "^\
-\\([^-]*-[^-]*\\)\
-\\([^-]*\\)-\\([^-]*\\)-\\([^-]*\\)-\\([^-]*\\)\
-\\([^-]*\\)-\\([^-]*\\)-\\([^-]*\\)-\\([^-]*\\)\
-\\([^-]*\\)-\\([^-]*\\)\
-\\([^-]*-[^-]*\\)$")
|
||
|
||
;; Regular expression matching a font name that conforms to XLFD
;; (X Logical Font Description).  The fields from FOUNDRY to ADSTYLE,
;; as well as REGISTRY and ENCODING, must not be omitted (though each
;; may be a wild card) for the name to match; whatever lies between
;; ADSTYLE and REGISTRY is matched loosely.
(defconst xlfd-style-regexp
  "^\
-\\([^-]*-[^-]*\\)\
-\\([^-]*\\)-\\([^-]*\\)-\\([^-]*\\)-\\([^-]*\\)\
-.*\
-\\([^-]*-[^-]*\\)$")
|
||
|
||
;; Field numbers of the XLFD fields whose values are numeric:
;; PIXEL_SIZE, POINT_SIZE, RESOLUTION_X, RESOLUTION_Y and AVERAGE_WIDTH.
(defconst xlfd-regexp-numeric-subnums
  `(,xlfd-regexp-pixelsize-subnum
    ,xlfd-regexp-pointsize-subnum
    ,xlfd-regexp-resx-subnum
    ,xlfd-regexp-resy-subnum
    ,xlfd-regexp-avgwidth-subnum))
|
||
|
||
(defun x-decompose-font-name (pattern)
  "Split the font name PATTERN into its XLFD fields.
The value is a vector of 12 elements.  FOUNDRY and FAMILY are kept
together in the first element, and REGISTRY and ENCODING are kept
together in the last one.  A field made up only of `*' and `-'
characters is represented by nil.

Return nil if PATTERN doesn't conform to XLFD."
  (when (string-match xlfd-tight-regexp pattern)
    (let ((fields (make-vector 12 nil))
          (n 0))
      ;; First pass: copy out every group while the match data of the
      ;; XLFD match is still intact.
      (while (< n 12)
        (aset fields n (match-string (1+ n) pattern))
        (setq n (1+ n)))
      ;; Second pass: the `string-match' below overwrites the match
      ;; data, which is why it cannot be merged into the first pass.
      (dotimes (k 12)
        (when (string-match "^[*-]+$" (aref fields k))
          (aset fields k nil)))
      fields)))
|
||
|
||
(defun x-compose-font-name (fields &optional _reduce)
  "Build an X font name out of FIELDS.
FIELDS is a vector of XLFD fields, of length 12.
Each nil field is written as the wild-card `*'; the fields are joined
with `-' and the result is prefixed with `-'.
Optional argument REDUCE exists just for backward compatibility,
and is always ignored."
  (let ((parts (mapcar (lambda (field) (if field field "*"))
                       fields)))
    (concat "-" (mapconcat #'identity parts "-"))))
|
||
|
||
|
||
(defun x-must-resolve-font-name (xlfd-fields)
  "Like `x-resolve-font-name', but keep relaxing the pattern until it matches.
XLFD-FIELDS is a vector of XLFD (X Logical Font Description) fields.
The font name composed from XLFD-FIELDS is tried first.  Each time
`x-resolve-font-name' signals an error, a warning is shown with
`message' and the next field of XLFD-FIELDS, starting from the first
one, is replaced with \"*\" before trying again.  XLFD-FIELDS is
modified in place.
Value is the name of the font that was found; if none is found, an
error is signaled."
  (let ((slot 0)
        found)
    (while (not (or found (> slot xlfd-regexp-registry-subnum)))
      (let ((candidate (x-compose-font-name xlfd-fields)))
        (condition-case nil
            (setq found (x-resolve-font-name candidate))
          (error
           (message "Warning: no fonts matching `%s' available" candidate)
           ;; Widen the pattern by one more field for the next attempt.
           (aset xlfd-fields slot "*")
           (setq slot (1+ slot))))))
    (or found
        (error "No fonts found"))))
|
||
|
||
|
||
(defun x-complement-fontset-spec (default-spec fontlist)
  "Fill in the elements of FONTLIST from DEFAULT-SPEC.
DEFAULT-SPEC is a font-spec object providing default font properties.
FONTLIST is an alist of script names vs the corresponding font names.

Each font name is parsed into a font-spec; every one of the
properties :foundry, :family, :weight, :slant, :width, :adstyle and
:size that the parsed spec leaves unset is copied from DEFAULT-SPEC.
The font name in each element is replaced, in place, by the resulting
font-spec, and FONTLIST itself is returned."
  (dolist (entry fontlist fontlist)
    (let ((parsed (font-spec :name (cadr entry))))
      (dolist (key '(:foundry :family :weight :slant :width :adstyle :size))
        (unless (font-get parsed key)
          (font-put parsed key (font-get default-spec key))))
      (setcar (cdr entry) parsed))))
|
||
|
||
(defvar fontset-alias-alist)

(defun fontset-name-p (fontset)
  "Return non-nil if FONTSET is valid as fontset name.
A valid fontset name should conform to XLFD (X Logical Font Description)
with \"fontset-SOMETHING\" in `<CHARSET_REGISTRY>' field.
A fontset alias name recorded in `fontset-alias-alist' is also a valid
fontset name.

Return nil, without signaling an error, for an XLFD name whose
registry field does not start with \"fontset-\" and which is not a
recorded alias."
  (or (and (string-match xlfd-tight-regexp fontset)
           (let ((registry
                  (match-string (1+ xlfd-regexp-registry-subnum) fontset)))
             ;; `string-match-p' yields nil when the prefix is absent.
             ;; Comparing that nil with `=' would signal
             ;; `wrong-type-argument' instead of letting the alias
             ;; check below run.
             (and (string-match-p "\\`fontset-" registry) t)))
      (consp (rassoc fontset fontset-alias-alist))))
|
||
|
||
(declare-function fontset-list "fontset.c" ())

(defun generate-fontset-menu ()
  "Return list to be appended to `x-fixed-font-alist'.
The value is a list whose first element is the string \"Fontset\" and
whose remaining elements have the form (PLAIN-NAME FONTSET), sorted
by PLAIN-NAME.  Fontsets whose names end in \"fontset-default\" or
\"fontset-autoN\" are left out.
Done when `mouse-set-font' is called."
  (let ((entries nil))
    (dolist (name (fontset-list))
      (unless (or (string-match "fontset-default$" name)
                  (string-match "fontset-auto[0-9]+$" name))
        (push (list (fontset-plain-name name) name) entries)))
    (cons "Fontset"
          (sort entries
                (lambda (a b) (string< (car a) (car b)))))))
|
||
|
||
(declare-function query-fontset "fontset.c" (pattern &optional regexpp))

(defun fontset-plain-name (fontset)
  "Return a plain and descriptive name of FONTSET.
FONTSET is first resolved with `query-fontset'; if that returns nil,
an error naming FONTSET is signaled.
If the resolved name conforms to XLFD, the value is built from the
nickname (the part after \"fontset-\" in the registry field, or the
foundry-family field when the registry lacks that prefix), followed
by \": SIZE-dot\" for a positive pixel size, by the weight when it is
medium, bold or demibold, and by a word describing the slant when it
is one of i, o, ri or ro.
Otherwise the value is the resolved fontset name itself."
  (let ((resolved (query-fontset fontset)))
    ;; Check before overwriting FONTSET, so that the error message shows
    ;; the name the caller passed rather than nil.
    (unless resolved
      (error "Invalid fontset: %s" fontset))
    (setq fontset resolved))
  (let ((xlfd-fields (x-decompose-font-name fontset)))
    (if xlfd-fields
        (let ((family (aref xlfd-fields xlfd-regexp-family-subnum))
              (weight (aref xlfd-fields xlfd-regexp-weight-subnum))
              (slant  (aref xlfd-fields xlfd-regexp-slant-subnum))
              ;(swidth (aref xlfd-fields xlfd-regexp-swidth-subnum))
              (size   (aref xlfd-fields xlfd-regexp-pixelsize-subnum))
              (nickname (aref xlfd-fields xlfd-regexp-registry-subnum))
              name)
          ;; Prefer the SOMETHING of "fontset-SOMETHING" as the nickname.
          (if (not (string-match "^fontset-\\(.*\\)$" nickname))
              (setq nickname family)
            (setq nickname (match-string 1 nickname)))
          (if (and size (> (string-to-number size) 0))
              (setq name (format "%s: %s-dot" nickname size))
            (setq name nickname))
          (and weight
               (cond ((string-match "^medium$" weight)
                      (setq name (concat name " " "medium")))
                     ((string-match "^bold$\\|^demibold$" weight)
                      (setq name (concat name " " weight)))))
          (and slant
               (cond ((string-match "^i$" slant)
                      (setq name (concat name " " "italic")))
                     ((string-match "^o$" slant)
                      (setq name (concat name " " "slant")))
                     ((string-match "^ri$" slant)
                      (setq name (concat name " " "reverse italic")))
                     ((string-match "^ro$" slant)
                      (setq name (concat name " " "reverse slant")))))
          name)
      fontset)))
|
||
|
||
(defvar charset-script-alist
  '(;; Latin
    (ascii . latin)
    (latin-iso8859-1 . latin)
    (latin-iso8859-2 . latin)
    (latin-iso8859-3 . latin)
    (latin-iso8859-4 . latin)
    (latin-iso8859-9 . latin)
    (latin-iso8859-10 . latin)
    (latin-iso8859-13 . latin)
    (latin-iso8859-14 . latin)
    (latin-iso8859-15 . latin)
    (latin-iso8859-16 . latin)
    (latin-jisx0201 . latin)
    ;; Thai, Cyrillic, Arabic, Greek, Hebrew
    (thai-iso8859-11 . thai)
    (thai-tis620 . thai)
    (cyrillic-iso8859-5 . cyrillic)
    (arabic-iso8859-6 . arabic)
    (greek-iso8859-7 . greek)
    (hebrew-iso8859-8 . hebrew)
    ;; Kana
    (katakana-jisx0201 . kana)
    ;; Han: Chinese charsets
    (chinese-gb2312 . han)
    (chinese-gbk . han)
    (gb18030-2-byte . han)
    (gb18030-4-byte-bmp . han)
    (gb18030-4-byte-ext-1 . han)
    (gb18030-4-byte-ext-2 . han)
    (gb18030-4-byte-smp . han)
    (chinese-big5-1 . han)
    (chinese-big5-2 . han)
    (chinese-cns11643-1 . han)
    (chinese-cns11643-2 . han)
    (chinese-cns11643-3 . han)
    (chinese-cns11643-4 . han)
    (chinese-cns11643-5 . han)
    (chinese-cns11643-6 . han)
    (chinese-cns11643-7 . han)
    ;; Han: Japanese charsets
    (japanese-jisx0208 . han)
    (japanese-jisx0208-1978 . han)
    (japanese-jisx0212 . han)
    (japanese-jisx0213-1 . han)
    (japanese-jisx0213-2 . han)
    ;; Hangul and Bopomofo
    (korean-ksc5601 . hangul)
    (chinese-sisheng . bopomofo)
    ;; Vietnamese (Latin)
    (vietnamese-viscii-lower . latin)
    (vietnamese-viscii-upper . latin)
    ;; Arabic, Devanagari and Tibetan display charsets
    (arabic-digit . arabic)
    (arabic-1-column . arabic)
    (arabic-2-column . arabic)
    (indian-is13194 . devanagari)
    (indian-glyph . devanagari)
    (indian-1-column . devanagari)
    (indian-2-column . devanagari)
    (tibetan-1-column . tibetan))
  "Alist mapping each charset to its most appropriate script.
Each element has the form (CHARSET . SCRIPT).

The function `create-fontset-from-fontset-spec' consults this alist
to map charsets to scripts.")
|
||
|
||
(defun create-fontset-from-fontset-spec (fontset-spec
                                         &optional _style-variant _noerror)
  "Create a fontset from fontset specification string FONTSET-SPEC.
FONTSET-SPEC is a string of the format:
	FONTSET-NAME[,SCRIPT-NAME0:FONT-NAME0,SCRIPT-NAME1:FONT-NAME1] ...
Any number of SPACE, TAB, and NEWLINE can be put before and after commas.

FONTSET-NAME must conform to XLFD; otherwise an error is signaled.

When a frame uses the fontset as the `font' parameter, the frame's
default font name is derived from FONTSET-NAME by substituting
\"iso8859-1\" for the tail part \"fontset-XXX\".  But, if SCRIPT-NAMEn
is \"ascii\", use the corresponding FONT-NAMEn as the default font
name.

Optional 2nd and 3rd arguments exist just for backward compatibility,
and are ignored.

It returns a name of the created fontset.

For backward compatibility, SCRIPT-NAME may be a charset name, in
which case, the corresponding script is decided by the variable
`charset-script-alist' (which see)."
  (unless (string-match "^[^,]+" fontset-spec)
    (error "Invalid fontset spec: %s" fontset-spec))
  (let ((pos (match-end 0))
        (name (match-string 0 fontset-spec))
        (pairs nil))
    (unless (string-match xlfd-tight-regexp name)
      (error "Fontset name \"%s\" not conforming to XLFD" name))
    (let ((default-spec (font-spec :name name)))
      ;; Collect (TARGET FONT-NAME) pairs from the rest of FONTSET-SPEC.
      (while (string-match "[, \t\n]*\\([^:]+\\):[ \t]*\\([^,]+\\)"
                           fontset-spec pos)
        (setq pos (match-end 0))
        (let* ((target (intern (match-string 1 fontset-spec)))
               (font-name (match-string 2 fontset-spec))
               (key
                (cond
                 ;; `ascii' or a known script name: use it as is.
                 ((or (eq target 'ascii)
                      (memq target
                            (char-table-extra-slot char-script-table 0)))
                  target)
                 ;; A charset listed in `charset-script-alist': use the
                 ;; script it maps to.
                 ((cdr (assq target charset-script-alist)))
                 ;; Any other charset: use it as is.
                 ((charsetp target)
                  target))))
          ;; Anything else is silently dropped.
          (when key
            (push (list key font-name) pairs))))
      ;; Complement the pairs from DEFAULT-SPEC, restore the order in
      ;; which they were written, and create the fontset.
      (new-fontset name
                   (nreverse
                    (x-complement-fontset-spec default-spec pairs))))))
|
||
|
||
(defun create-fontset-from-ascii-font (font &optional resolved-font
                                            fontset-name)
  "Create a fontset from an ASCII font FONT.

Optional 2nd arg RESOLVED-FONT is a resolved name of FONT.
If omitted, `x-resolve-font-name' is called to get the resolved name.
At this time, if FONT is not available, an error is signaled.

Optional 3rd arg FONTSET-NAME is a string to be used in
`<CHARSET_ENCODING>' fields of a new fontset name.  If it is omitted,
the name is \"startup\" when no fontset matches \"fontset-startup\"
yet; otherwise it is the registry field of the resolved font with
each `-' replaced by `_'.

If a fontset with the resulting name already exists it is reused;
otherwise a new one is created.

It returns a name of the created fontset."
  (setq font (downcase font)
        resolved-font (downcase (or resolved-font
                                    (x-resolve-font-name font))))
  (let* ((xlfd (x-decompose-font-name resolved-font))
         (suffix
          (cond (fontset-name
                 (downcase fontset-name))
                ((query-fontset "fontset-startup")
                 (subst-char-in-string
                  ?- ?_ (aref xlfd xlfd-regexp-registry-subnum) t))
                (t
                 "startup"))))
    ;; Turn the decomposed font name into a fontset name by replacing
    ;; its registry field.
    (aset xlfd xlfd-regexp-registry-subnum (format "fontset-%s" suffix))
    (let ((fontset (x-compose-font-name xlfd)))
      (or (query-fontset fontset)
          (create-fontset-from-fontset-spec
           (concat fontset ", ascii:" font))))))
|
||
|
||
|
||
;; The standard fontset is built from 16-dot fonts, which are the most
;; widely installed ones.  Fonts for Chinese-GB, Korean, and Chinese-CNS
;; are specified here because the FAMILY of those fonts is not "fixed"
;; in many cases.
(defvar standard-fontset-spec
  (purecopy "-*-fixed-medium-r-normal-*-16-*-*-*-*-*-fontset-standard")
  "Fontset specification string of the standard fontset.
Using the standard fontset gives you the best chance of displaying
international characters with correct glyphs.
See the documentation of `create-fontset-from-fontset-spec' for the format.")
|
||
|
||
|
||
;; Create fontsets from X resources of the name `fontset-N (class
|
||
;; Fontset-N)' where N is integer 0, 1, ...
|
||
;; The values of the resources are strings of the same format as
;; `standard-fontset-spec'.
|
||
|
||
(declare-function x-get-resource "frame.c"
                  (attribute class &optional component subclass))

(defun create-fontset-from-x-resource ()
  "Create fontsets from the X resources `fontset-N' (class `Fontset-N').
N counts up from 0, and processing stops at the first N for which
`x-get-resource' returns nil.  Each resource value is passed to
`create-fontset-from-fontset-spec'; if that signals an error, a
warning is shown with `display-warning' and processing continues
with the next N."
  (let ((n 0))
    (while (let ((spec (x-get-resource (format "fontset-%d" n)
                                       (format "Fontset-%d" n))))
             (when spec
               (condition-case nil
                   (create-fontset-from-fontset-spec spec t)
                 (error
                  (display-warning
                   'initialization
                   (format "Fontset-%d: invalid specification in X resource"
                           n)
                   :warning)))
               ;; Keep going whatever the body above returned.
               t))
      (setq n (1+ n)))))
|
||
|
||
;;
|
||
;; Announce the `fontset' feature to `require' and `featurep'.
(provide 'fontset)
|
||
|
||
;;; fontset.el ends here
|