123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614 |
- ;;; tibetan.el --- support for Tibetan language -*- coding: iso-2022-7bit; -*-
- ;; Copyright (C) 1997, 2001-2012 Free Software Foundation, Inc.
- ;; Copyright (C) 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005,
- ;; 2006, 2007, 2008, 2009, 2010, 2011
- ;; National Institute of Advanced Industrial Science and Technology (AIST)
- ;; Registration Number H14PRO021
- ;; Copyright (C) 2003
- ;; National Institute of Advanced Industrial Science and Technology (AIST)
- ;; Registration Number H13PRO009
- ;; Author: Toru TOMABECHI <Toru.Tomabechi@orient.unil.ch>
- ;; Created: Feb. 17. 1997
- ;; Keywords: multilingual, Tibetan, i18n
- ;; This file is part of GNU Emacs.
- ;; GNU Emacs is free software: you can redistribute it and/or modify
- ;; it under the terms of the GNU General Public License as published by
- ;; the Free Software Foundation, either version 3 of the License, or
- ;; (at your option) any later version.
- ;; GNU Emacs is distributed in the hope that it will be useful,
- ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
- ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- ;; GNU General Public License for more details.
- ;; You should have received a copy of the GNU General Public License
- ;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>.
- ;;; History:
- ;; 1997.03.13 Modification for special signs and punctuation.
- ;;; Commentary:
- ;;; Code:
- ;;; Tibetan Character set.
- ;;; \x2130 -- \x234a is a subset of Unicode v.2 \x0f00 - \x0fb9
- ;;; with a slight modification. And there are some subjoined
- ;;; consonants which are not specified in Unicode.
- ;;; I hope I can add missing characters later.
- ;;;
- ;;; 00 01 02 03 04 05 06 07 08 09 0A 0B 0C 0D 0E 0F
- ;;;2120 // $(7!!(B $(7!"(B $(7!#(B $(7!$(B $(7!%(B $(7!&(B $(7!'(B $(7!((B $(7!)(B $(7!*(B $(7!+(B $(7!,(B $(7!-(B $(7!.(B $(7!/(B ; obsolete glyphs (2123-5)
- ;;;2130 $(7!0(B $(7!1(B $(7!2(B $(7!3(B $(7!4(B $(7!5(B $(7!6(B $(7!7(B $(7!8(B $(7!9(B $(7!:(B $(7!;(B $(7!<(B $(7!=(B $(7!>(B $(7!?(B ; Punctuation,
- ;;;2140 $(7!@(B $(7!A(B $(7!B(B $(7!C(B $(7!D(B $(7!E(B $(7!F(B $(7!G(B $(7!H(B $(7!I(B $(7!J(B $(7!K(B $(7!L(B $(7!M(B $(7!N(B $(7!O(B ; Digits and
- ;;;2150 $(7!P(B $(7!Q(B $(7!R(B $(7!S(B $(7!T(B $(7!U(B $(7!V(B $(7!W(B $(7!X(B $(7!Y(B $(7!Z(B $(7![(B $(7!\(B $(7!](B $(7!^(B $(7!_(B ; Special signs.
- ;;;2160 $(7!`(B $(7!a(B $(7!b(B $(7!c(B $(7!d(B $(7!e(B $(7!f(B $(7!g(B $(7!h(B $(7!i(B $(7!j(B $(7!k(B $(7!l(B $(7!m(B $(7!n(B $(7!o(B ;
- ;;;2170 $(7!p(B $(7!q(B $(7!r(B $(7!s(B $(7!t(B $(7!u(B $(7!v(B $(7!w(B $(7!x(B $(7!y(B $(7!z(B $(7!{(B $(7!|(B $(7!}(B $(7!~(B // ;
- ;;;
- ;;; 00 01 02 03 04 05 06 07 08 09 0A 0B 0C 0D 0E 0F
- ;;;2220 // $(7"!(B $(7""(B $(7"#(B $(7"$(B $(7"%(B $(7"&(B $(7"'(B $(7"((B $(7")(B $(7"*(B $(7"+(B $(7",(B $(7"-(B $(7".(B $(7"/(B ; Base consonants
- ;;;2230 $(7"0(B $(7"1(B $(7"2(B $(7"3(B $(7"4(B $(7"5(B $(7"6(B $(7"7(B $(7"8(B $(7"9(B $(7":(B $(7";(B $(7"<(B $(7"=(B $(7">(B $(7"?(B ; and
- ;;;2240 $(7"@(B $(7"A(B $(7"B(B $(7"C(B $(7"D(B $(7"E(B $(7"F(B $(7"G(B $(7"H(B $(7"I(B $(7"J(B $(7"K(B $(7"L(B $(7"M(B $(7"N(B $(7"O(B ; Vowel signs.
- ;;;2250 $(7"P(B $(7"Q(B $(7"R(B $(7"S(B $(7"T(B $(7"U(B $(7"V(B $(7"W(B $(7"X(B $(7"Y(B $(7"Z(B $(7"[(B $(7"\(B $(7"](B $(7"^(B $(7"_(B ; (\x2251 = vowel a)
- ;;;2260 $(7"`(B $(7"a(B $(7"b(B $(7"c(B $(7"d(B $(7"e(B $(7"f(B $(7"g(B $(7"h(B $(7"i(B $(7"j(B $(7"k(B $(7"l(B $(7"m(B $(7"n(B $(7"o(B ; Long vowels and
- ;;;2270 $(7"p(B $(7"q(B $(7"r(B $(7"s(B $(7"t(B $(7"u(B $(7"v(B $(7"w(B $(7"x(B $(7"y(B $(7"z(B $(7"{(B $(7"|(B $(7"}(B $(7"~(B // ; vocalic r, l ARE
- ;;; ; atomically
- ;;; ; encoded.
- ;;; 00 01 02 03 04 05 06 07 08 09 0A 0B 0C 0D 0E 0F
- ;;;2320 // $(7#!(B $(7#"(B $(7##(B $(7#$(B $(7#%(B $(7#&(B $(7#'(B $(7#((B $(7#)(B $(7#*(B $(7#+(B $(7#,(B $(7#-(B $(7#.(B $(7#/(B ; Subjoined consonants
- ;;;2330 $(7#0(B $(7#1(B $(7#2(B $(7#3(B $(7#4(B $(7#5(B $(7#6(B $(7#7(B $(7#8(B $(7#9(B $(7#:(B $(7#;(B $(7#<(B $(7#=(B $(7#>(B $(7#?(B ;
- ;;;2340 $(7#@(B $(7#A(B $(7#B(B $(7#C(B $(7#D(B $(7#E(B $(7#F(B $(7#G(B $(7#H(B $(7#I(B $(7#J(B $(7#K(B $(7#L(B $(7#M(B $(7#N(B $(7#O(B ;
- ;;;2350 $(7#P(B $(7#Q(B $(7#R(B $(7#S(B $(7#T(B $(7#U(B $(7#V(B $(7#W(B $(7#X(B $(7#Y(B $(7#Z(B $(7#[(B $(7#\(B $(7#](B $(7#^(B $(7#_(B ; Hereafter, the chars
- ;;;2360 $(7#`(B $(7#a(B $(7#b(B $(7#c(B $(7#d(B $(7#e(B $(7#f(B $(7#g(B $(7#h(B $(7#i(B $(7#j(B $(7#k(B $(7#l(B $(7#m(B $(7#n(B $(7#o(B ; are not specified
- ;;;2370 $(7#p(B $(7#q(B $(7#r(B $(7#s(B $(7#t(B $(7#u(B $(7#v(B $(7#w(B $(7#x(B $(7#y(B $(7#z(B $(7#{(B $(7#|(B $(7#}(B $(7#~(B // ; in Unicode.
- ;;;
- ;;; 00 01 02 03 04 05 06 07 08 09 0A 0B 0C 0D 0E 0F
- ;;;2420 // $(7$!(B $(7$"(B $(7$#(B $(7$$(B $(7$%(B $(7$&(B $(7$'(B $(7$((B $(7$)(B $(7$*(B $(7$+(B $(7$,(B $(7$-(B $(7$.(B $(7$/(B ; Precomposed
- ;;;2430 $(7$0(B $(7$1(B $(7$2(B $(7$3(B $(7$4(B $(7$5(B $(7$6(B $(7$7(B $(7$8(B $(7$9(B $(7$:(B $(7$;(B $(7$<(B $(7$=(B $(7$>(B $(7$?(B ; consonants for
- ;;;2440 $(7$@(B $(7$A(B $(7$B(B $(7$C(B $(7$D(B $(7$E(B $(7$F(B $(7$G(B $(7$H(B $(7$I(B $(7$J(B $(7$K(B $(7$L(B $(7$M(B $(7$N(B $(7$O(B ; ordinary Tibetan.
- ;;;2450 $(7$P(B $(7$Q(B $(7$R(B $(7$S(B $(7$T(B $(7$U(B $(7$V(B $(7$W(B $(7$X(B $(7$Y(B $(7$Z(B $(7$[(B $(7$\(B $(7$](B $(7$^(B $(7$_(B ; They are decomposed
- ;;;2460 $(7$`(B $(7$a(B $(7$b(B $(7$c(B $(7$d(B $(7$e(B $(7$f(B $(7$g(B $(7$h(B $(7$i(B $(7$j(B $(7$k(B $(7$l(B $(7$m(B $(7$n(B $(7$o(B ; into base and
- ;;;2470 $(7$p(B $(7$q(B $(7$r(B $(7$s(B $(7$t(B $(7$u(B $(7$v(B $(7$w(B $(7$x(B $(7$y(B $(7$z(B $(7${(B $(7$|(B $(7$}(B $(7$~(B // ; subjoined consonants
- ;;; ; when written on a
- ;;; 00 01 02 03 04 05 06 07 08 09 0A 0B 0C 0D 0E 0F ; file in Tibetan
- ;;;2520 // $(7%!(B $(7%"(B $(7%#(B $(7%$(B $(7%%(B $(7%&(B $(7%'(B $(7%((B $(7%)(B $(7%*(B $(7%+(B $(7%,(B $(7%-(B $(7%.(B $(7%/(B ; coding system.
- ;;;2530 $(7%0(B $(7%1(B $(7%2(B $(7%3(B $(7%4(B $(7%5(B $(7%6(B $(7%7(B $(7%8(B $(7%9(B $(7%:(B $(7%;(B $(7%<(B $(7%=(B $(7%>(B $(7%?(B ;
- ;;;2540 $(7%@(B $(7%A(B $(7%B(B $(7%C(B $(7%D(B $(7%E(B $(7%F(B $(7%G(B $(7%H(B $(7%I(B $(7%J(B $(7%K(B $(7%L(B $(7%M(B $(7%N(B $(7%O(B ;
- ;;;2550 $(7%P(B $(7%Q(B $(7%R(B $(7%S(B $(7%T(B $(7%U(B $(7%V(B $(7%W(B $(7%X(B $(7%Y(B $(7%Z(B $(7%[(B $(7%\(B $(7%](B $(7%^(B $(7%_(B ;
- ;;;2560 $(7%`(B $(7%a(B $(7%b(B $(7%c(B $(7%d(B $(7%e(B $(7%f(B $(7%g(B $(7%h(B $(7%i(B $(7%j(B $(7%k(B $(7%l(B $(7%m(B $(7%n(B $(7%o(B ;
- ;;;2570 $(7%p(B $(7%q(B $(7%r(B $(7%s(B $(7%t(B $(7%u(B $(7%v(B $(7%w(B $(7%x(B $(7%y(B $(7%z(B $(7%{(B $(7%|(B $(7%}(B $(7%~(B // ;
- ;;;
- (define-coding-system 'tibetan-iso-8bit
- "8-bit encoding for ASCII (MSB=0) and TIBETAN (MSB=1)."
- :coding-type 'iso-2022
- :mnemonic ?Q
- :designation [ascii tibetan nil nil]
- :charset-list '(ascii tibetan))
- (define-coding-system-alias 'tibetan 'tibetan-iso-8bit)
- (set-language-info-alist
- "Tibetan" '((charset tibetan tibetan-1-column)
- (coding-system tibetan-iso-8bit)
- (coding-priority iso-2022-7bit tibetan-iso-8bit)
- (input-method . "tibetan-wylie")
- (features tibet-util)
- (documentation . t)
- (sample-text . "Tibetan ($(7"7"]"2!;"G#!"Q"2!;(B) $(7!4!5!5!>"7"!#C"Q!;"E"S"G!;"7"2"[!;"D"["#"G!>"I"]"_!;"9"Q!;"/"S!;"5"Q"2#9"[!;"H"A"U"c!>(B")))
- ;; `$(7"A(B' is included in the pattern for subjoined consonants because we
- ;; treat it specially in tibetan-add-components.
- ;; modified by Tomabechi 1999/12/10
- ;; modified by Tomabechi 2000/06/08
- ;; To allow infinite addition of vowels/modifiers
- ;; as specified in Unicode v.3
- ;; $(7"A(B is removed from the class of subjoined. Tomabechi 2000/06/08
- ;; (for Unicode support)
- (defconst tibetan-composable-pattern
- "[$(7"!(B-$(7"J"K(B][$(7#!(B-$(7#J#K#L#M(B]*[$,1FP$(7"Q"R"S(B-$(7"^"a"b"e(B]*[$(7"_"c"d"g(B-$(7"l!I!e!g(B]*"
- "Regexp matching a composable sequence of Tibetan characters.")
- ;;;
- ;;; Definitions of conversion data.
- ;;;
- ;;; alists for tibetan char <-> transcription conversion
- ;;; longer transcription should come first
- (defconst tibetan-consonant-transcription-alist
- '(("tsh" . "$(7";(B")
- ("dzh" . "$(7"=(B")
- ("kSH" . "$(7"J(B")
- ("kh" . "$(7""(B")
- ("gh" . "$(7"$(B")
- ("ng" . "$(7"%(B")
- ("ch" . "$(7"'(B")
- ("ny" . "$(7"*(B")
- ("TH" . "$(7",(B")
- ("DH" . "$(7".(B")
- ("th" . "$(7"1(B")
- ("dh" . "$(7"3(B")
- ("ph" . "$(7"6(B")
- ("bh" . "$(7"8(B")
- ("ts" . "$(7":(B")
- ("dz" . "$(7"<(B")
- ("zh" . "$(7"?(B")
- ("sh" . "$(7"E(B")
- ("SH" . "$(7"F(B")
- ("k" . "$(7"!(B")
- ("g" . "$(7"#(B")
- ("c" . "$(7"&(B")
- ("j" . "$(7"((B")
- ("T" . "$(7"+(B")
- ("D" . "$(7"-(B")
- ("N" . "$(7"/(B")
- ("t" . "$(7"0(B")
- ("d" . "$(7"2(B")
- ("n" . "$(7"4(B")
- ("p" . "$(7"5(B")
- ("b" . "$(7"7(B")
- ("m" . "$(7"9(B")
- ("w" . "$(7">(B")
- ("z" . "$(7"@(B")
- ("'" . "$(7"A(B")
- ("y" . "$(7"B(B")
- ("r" . "$(7"C(B")
- ("l" . "$(7"D(B")
- ("s" . "$(7"G(B")
- ("h" . "$(7"H(B")
- ("H" . "$(7"H(B")
- ("A" . "$(7"I(B")
- ;; Added by Tomabechi 1999/12/10
- ("R" . "$(7"K(B") ;; fixed form RA
- ))
- (defconst tibetan-vowel-transcription-alist
- '(
- ;; Composite Vowels
- ;; Added by Tomabechi 2000/06/08
- ("frr" . "$(7"X(B")
- ("fll" . "$(7"Z(B")
- ("fa" . "$(7"R(B")
- ("fi" . "$(7"T(B")
- ("fu" . "$(7"V(B")
- ("fr" . "$(7"W(B")
- ("fl" . "$(7"Y(B")
- ("fI" . "$(7"b(B")
- ;; Normal Vowels
- ("ai" . "$(7"\(B")
- ("au" . "$(7"^(B")
- ("ee" . "$(7"\(B")
- ("oo" . "$(7"^(B")
- ("a" . "$(7"Q(B") ; invisible vowel sign (\x2251)
- ("i" . "$(7"S(B")
- ("u" . "$(7"U(B")
- ("e" . "$(7"[(B")
- ("o" . "$(7"](B")
- ("E" . "$(7"\(B")
- ("O" . "$(7"^(B")
- ("I" . "$(7"a(B")
- ("," . "$(7"e(B") ; idem.
- ))
- (defconst tibetan-modifier-transcription-alist
- '(("M" . "$(7"_(B")
- ("~" . "$(7"c(B")
- ("`" . "$(7"d(B")
- ("x" . "$(7"i(B")
- ("X" . "$(7"j(B")
- ("v" . "$(7"g(B")
- ("V" . "$(7"h(B")
- ("q" . "$(7"k(B")
- ("Q" . "$(7"l(B")
- ("_/" . "$(7!I(B")
- ("_o" . "$(7!g(B")
- ("_O" . "$(7!e(B")))
- (defconst tibetan-precomposed-transcription-alist
- '(("phyw" . "$(7$G(B")
- ("tshw" . "$(7$)(B")
- ("rtsw" . "$(7%.(B")
- ("khw" . "$(7$"(B")
- ("nyw" . "$(7$%(B")
- ("tsw" . "$(7$((B")
- ("zhw" . "$(7$*(B")
- ("shw" . "$(7$.(B")
- ("khy" . "$(7$A(B")
- ("phy" . "$(7$D(B")
- ("khr" . "$(7$Q(B")
- ("thr" . "$(7$T(B")
- ("phr" . "$(7$W(B")
- ("shr" . "$(7$Z(B")
- ("dzr" . "$(7$^(B")
- ("grw" . "$(7$_(B")
- ("rng" . "$(7%#(B")
- ("rny" . "$(7%%(B")
- ("rts" . "$(7%+(B")
- ("rdz" . "$(7%,(B")
- ("rgw" . "$(7%-(B")
- ("rky" . "$(7%0(B")
- ("rgy" . "$(7%1(B")
- ("rmy" . "$(7%2(B")
- ("lng" . "$(7%B(B")
- ("sng" . "$(7%R(B")
- ("sny" . "$(7%S(B")
- ("sts" . "$(7%Z(B")
- ("sky" . "$(7%`(B")
- ("sgy" . "$(7%a(B")
- ("spy" . "$(7%b(B")
- ("sby" . "$(7%c(B")
- ("smy" . "$(7%d(B")
- ("skr" . "$(7%p(B")
- ("sgr" . "$(7%q(B")
- ("snr" . "$(7%r(B")
- ("spr" . "$(7%s(B")
- ("sbr" . "$(7%t(B")
- ("smr" . "$(7%u(B")
- ("kw" . "$(7$!(B")
- ("gw" . "$(7$#(B")
- ("cw" . "$(7$$(B")
- ("tw" . "$(7$&(B")
- ("dw" . "$(7$'(B")
- ("zw" . "$(7$+(B")
- ("rw" . "$(7$,(B")
- ("lw" . "$(7$-(B")
- ("sw" . "$(7$/(B")
- ("hw" . "$(7$0(B")
- ("ky" . "$(7$@(B")
- ("gy" . "$(7$B(B")
- ("py" . "$(7$C(B")
- ("by" . "$(7$E(B")
- ("my" . "$(7$F(B")
- ("kr" . "$(7$P(B")
- ("gr" . "$(7$R(B")
- ("tr" . "$(7$S(B")
- ("dr" . "$(7$U(B")
- ("pr" . "$(7$V(B")
- ("brk" . "$(7"7%!(B")
- ("brg" . "$(7"7%"(B")
- ("brng" . "$(7"7%#(B")
- ("brj" . "$(7"7%$(B")
- ("brny" . "$(7"7%%(B")
- ("brt" . "$(7"7%&(B")
- ("brd" . "$(7"7%'(B")
- ("brn" . "$(7"7%((B")
- ("brts" . "$(7"7%+(B")
- ("brdz" . "$(7"7%,(B")
- ("brl" . "$(7"7$d(B")
- ("br" . "$(7$X(B")
- ("mr" . "$(7$Y(B")
- ("sr" . "$(7$[(B")
- ("hr" . "$(7$\(B")
- ("jr" . "$(7$](B")
- ("kl" . "$(7$`(B")
- ("gl" . "$(7$a(B")
- ("blt" . "$(7"7%E(B")
- ("bld" . "$(7"7%F(B")
- ("bl" . "$(7$b(B")
- ("zl" . "$(7$c(B")
- ("rl" . "$(7$d(B")
- ("sl" . "$(7$e(B")
- ("rk" . "$(7%!(B")
- ("rg" . "$(7%"(B")
- ("rj" . "$(7%$(B")
- ("rt" . "$(7%&(B")
- ("rd" . "$(7%'(B")
- ("rn" . "$(7%((B")
- ("rb" . "$(7%)(B")
- ("rm" . "$(7%*(B")
- ("lk" . "$(7%@(B")
- ("lg" . "$(7%A(B")
- ("lc" . "$(7%C(B")
- ("lj" . "$(7%D(B")
- ("lt" . "$(7%E(B")
- ("ld" . "$(7%F(B")
- ("ln" . "$(7!!(B") ; dummy \x2121
- ("lp" . "$(7%G(B")
- ("lb" . "$(7%H(B")
- ("lh" . "$(7%I(B")
- ("sk" . "$(7%P(B")
- ("sg" . "$(7%Q(B")
- ("st" . "$(7%T(B")
- ("sd" . "$(7%U(B")
- ("sn" . "$(7%V(B")
- ("sp" . "$(7%W(B")
- ("sb" . "$(7%X(B")
- ("sm" . "$(7%Y(B"))
- )
- (defconst tibetan-subjoined-transcription-alist
- (sort '(("+k" . "$(7#!(B")
- ("+kh" . "$(7#"(B")
- ("+g" . "$(7##(B")
- ("+gh" . "$(7#$(B")
- ("+ng" . "$(7#%(B")
- ("+c" . "$(7#&(B")
- ("+ch" . "$(7#'(B")
- ("+j" . "$(7#((B")
- ("+ny" . "$(7#*(B")
- ("+T" . "$(7#+(B")
- ("+TH" . "$(7#,(B")
- ("+D" . "$(7#-(B")
- ("+DH" . "$(7#.(B")
- ("+N" . "$(7#/(B")
- ("+t" . "$(7#0(B")
- ("+th" . "$(7#1(B")
- ("+d" . "$(7#2(B")
- ("+dh" . "$(7#3(B")
- ("+n" . "$(7#4(B")
- ("+p" . "$(7#5(B")
- ("+ph" . "$(7#6(B")
- ("+b" . "$(7#7(B")
- ("+bh" . "$(7#8(B")
- ("+m" . "$(7#9(B")
- ("+ts" . "$(7#:(B")
- ("+tsh" . "$(7#;(B")
- ("+dz" . "$(7#<(B")
- ("+dzh" . "$(7#=(B")
- ("+w" . "$(7#>(B")
- ("+zh" . "$(7#?(B")
- ("+z" . "$(7#@(B")
- ("+'" . "$(7#A(B")
- ("+y" . "$(7#B(B")
- ("+r" . "$(7#C(B")
- ("+l" . "$(7#D(B")
- ("+sh" . "$(7#E(B")
- ("+SH" . "$(7#F(B")
- ("+s" . "$(7#G(B")
- ("+h" . "$(7#H(B")
- ("+A" . "$(7#I(B")
- ("+kSH" . "$(7#J(B")
- ;; Added by Tomabechi 1999/12/10
- ("+W" . "$(7#K(B") ;; fixed form subscribed WA
- ("+Y" . "$(7#L(B") ;; fixed form subscribed YA
- ("+R" . "$(7#M(B") ;; fixed form subscribed RA
- )
- (lambda (x y) (> (length (car x)) (length (car y))))))
- ;;;
- ;;; alist for Tibetan base consonant <-> subjoined consonant conversion.
- ;;;
- (defconst tibetan-base-to-subjoined-alist
- '(("$(7"!(B" . "$(7#!(B")
- ("$(7""(B" . "$(7#"(B")
- ("$(7"#(B" . "$(7##(B")
- ("$(7"$(B" . "$(7#$(B")
- ("$(7"%(B" . "$(7#%(B")
- ("$(7"&(B" . "$(7#&(B")
- ("$(7"'(B" . "$(7#'(B")
- ("$(7"((B" . "$(7#((B")
- ("$(7"*(B" . "$(7#*(B")
- ("$(7"+(B" . "$(7#+(B")
- ("$(7",(B" . "$(7#,(B")
- ("$(7"-(B" . "$(7#-(B")
- ("$(7".(B" . "$(7#.(B")
- ("$(7"/(B" . "$(7#/(B")
- ("$(7"0(B" . "$(7#0(B")
- ("$(7"1(B" . "$(7#1(B")
- ("$(7"2(B" . "$(7#2(B")
- ("$(7"3(B" . "$(7#3(B")
- ("$(7"4(B" . "$(7#4(B")
- ("$(7"5(B" . "$(7#5(B")
- ("$(7"6(B" . "$(7#6(B")
- ("$(7"7(B" . "$(7#7(B")
- ("$(7"8(B" . "$(7#8(B")
- ("$(7"9(B" . "$(7#9(B")
- ("$(7":(B" . "$(7#:(B")
- ("$(7";(B" . "$(7#;(B")
- ("$(7"<(B" . "$(7#<(B")
- ("$(7"=(B" . "$(7#=(B")
- ("$(7">(B" . "$(7#>(B")
- ("$(7"?(B" . "$(7#?(B")
- ("$(7"@(B" . "$(7#@(B")
- ("$(7"A(B" . "$(7#A(B")
- ("$(7"B(B" . "$(7#B(B")
- ("$(7"C(B" . "$(7#C(B")
- ("$(7"D(B" . "$(7#D(B")
- ("$(7"E(B" . "$(7#E(B")
- ("$(7"F(B" . "$(7#F(B")
- ("$(7"G(B" . "$(7#G(B")
- ("$(7"H(B" . "$(7#H(B")
- ("$(7"I(B" . "$(7#I(B")
- ("$(7"J(B" . "$(7#J(B")
- ;; Added by Tomabechi 1999/12/10
- ("$(7"K(B" . "$(7#M(B") ;; Fixed form RA (224B->234D)
- ))
- ;;; alist for Tibetan composite vowels (long i, vocalic r, etc.)
- ;;; New variable. created by Tomabechi 2000/06/08
- (defconst tibetan-composite-vowel-alist
- '(;; LONG A
- ;; ("$(7"R(B" . ((bc . tc) ?$(7"R(B))
- ;; LONG I
- ("$(7"T(B" . (?$(7"R(B (tc . bc) ?$(7"S(B))
- ;; LONG U
- ("$(7"V(B" . (?$(7"R(B (bc . tc) ?$(7"U(B))
- ;; VOCALIC R
- ("$(7"W(B" . (?$(7#C(B (tc . bc) ?$(7"a(B))
- ;; LONG VOCALIC R
- ("$(7"X(B" . (?$(7#C(B (bc . tc) ?$(7"R(B (tc . bc) ?$(7"a(B))
- ;; VOCALIC L
- ("$(7"Y(B" . (?$(7#D(B (tc . bc) ?$(7"a(B))
- ;;$(7!;(BLONG VOCALIC L
- ("$(7"Z(B" . (?$(7#D(B (bc . tc) ?$(7"R(B (tc . bc) ?$(7"a(B))
- ;; LONG REVERSE I
- ("$(7"b(B" . (?$(7"R(B (tc . bc) ?$(7"a(B))
- ))
- ;;;
- ;;; alist for Tibetan consonantic components <-> precomposed glyph conversion.
- ;;; (includes some punctuation conversion rules)
- ;;;
- (defconst tibetan-precomposition-rule-alist
- `(("$(7"6#B#>(B" . "$(7$G(B")
- ("$(7"##C#>(B" . "$(7$_(B")
- ("$(7";#>(B" . "$(7$)(B")
- ("$(7"C#:#>(B" . "$(7%.(B")
- ("$(7"C###>(B" . "$(7%-(B")
- ("$(7"C#!#B(B" . "$(7%0(B")
- ("$(7"C###B(B" . "$(7%1(B")
- ("$(7"C#9#B(B" . "$(7%2(B")
- ("$(7"G#!#B(B" . "$(7%`(B")
- ("$(7"G###B(B" . "$(7%a(B")
- ("$(7"G#5#B(B" . "$(7%b(B")
- ("$(7"G#7#B(B" . "$(7%c(B")
- ("$(7"G#9#B(B" . "$(7%d(B")
- ("$(7"G#!#C(B" . "$(7%p(B")
- ("$(7"G###C(B" . "$(7%q(B")
- ("$(7"G#4#C(B" . "$(7%r(B")
- ("$(7"G#5#C(B" . "$(7%s(B")
- ("$(7"G#7#C(B" . "$(7%t(B")
- ("$(7"G#9#C(B" . "$(7%u(B")
- ("$(7""#>(B" . "$(7$"(B")
- ("$(7"*#>(B" . "$(7$%(B")
- ("$(7":#>(B" . "$(7$((B")
- ("$(7"?#>(B" . "$(7$*(B")
- ("$(7"E#>(B" . "$(7$.(B")
- ("$(7""#B(B" . "$(7$A(B")
- ("$(7"6#B(B" . "$(7$D(B")
- ("$(7""#C(B" . "$(7$Q(B")
- ("$(7"1#C(B" . "$(7$T(B")
- ("$(7"6#C(B" . "$(7$W(B")
- ("$(7"E#C(B" . "$(7$Z(B")
- ("$(7"<#C(B" . "$(7$^(B")
- ("$(7"C#%(B" . "$(7%#(B")
- ("$(7"C#*(B" . "$(7%%(B")
- ("$(7"C#:(B" . "$(7%+(B")
- ("$(7"C#<(B" . "$(7%,(B")
- ("$(7"D#%(B" . "$(7%B(B")
- ("$(7"G#%(B" . "$(7%R(B")
- ("$(7"G#*(B" . "$(7%S(B")
- ("$(7"G#:(B" . "$(7%Z(B")
- ("$(7"!#>(B" . "$(7$!(B")
- ("$(7"##>(B" . "$(7$#(B")
- ("$(7"&#>(B" . "$(7$$(B")
- ("$(7"0#>(B" . "$(7$&(B")
- ("$(7"2#>(B" . "$(7$'(B")
- ("$(7"@#>(B" . "$(7$+(B")
- ("$(7"C#>(B" . "$(7$,(B")
- ("$(7"D#>(B" . "$(7$-(B")
- ("$(7"G#>(B" . "$(7$/(B")
- ("$(7"H#>(B" . "$(7$0(B")
- ("$(7"!#B(B" . "$(7$@(B")
- ("$(7"##B(B" . "$(7$B(B")
- ("$(7"5#B(B" . "$(7$C(B")
- ("$(7"7#B(B" . "$(7$E(B")
- ("$(7"9#B(B" . "$(7$F(B")
- ("$(7"!#C(B" . "$(7$P(B")
- ("$(7"##C(B" . "$(7$R(B")
- ("$(7"0#C(B" . "$(7$S(B")
- ("$(7"2#C(B" . "$(7$U(B")
- ("$(7"5#C(B" . "$(7$V(B")
- ("$(7"7#C(B" . "$(7$X(B")
- ("$(7"9#C(B" . "$(7$Y(B")
- ("$(7"G#C(B" . "$(7$[(B")
- ("$(7"H#C(B" . "$(7$\(B")
- ("$(7"(#C(B" . "$(7$](B")
- ("$(7"!#D(B" . "$(7$`(B")
- ("$(7"##D(B" . "$(7$a(B")
- ("$(7"7#D(B" . "$(7$b(B")
- ("$(7"@#D(B" . "$(7$c(B")
- ("$(7"C#D(B" . "$(7$d(B")
- ("$(7"G#D(B" . "$(7$e(B")
- ("$(7"C#!(B" . "$(7%!(B")
- ("$(7"C##(B" . "$(7%"(B")
- ("$(7"C#((B" . "$(7%$(B")
- ("$(7"C#0(B" . "$(7%&(B")
- ("$(7"C#2(B" . "$(7%'(B")
- ("$(7"C#4(B" . "$(7%((B")
- ("$(7"C#7(B" . "$(7%)(B")
- ("$(7"C#9(B" . "$(7%*(B")
- ("$(7"D#!(B" . "$(7%@(B")
- ("$(7"D##(B" . "$(7%A(B")
- ("$(7"D#4(B" . "$(7!!(B") ; dummy 0x2121 added 2000/06/08 for transition l -> lng
- ("$(7"D#&(B" . "$(7%C(B")
- ("$(7"D#((B" . "$(7%D(B")
- ("$(7"D#0(B" . "$(7%E(B")
- ("$(7"D#2(B" . "$(7%F(B")
- ("$(7"D#5(B" . "$(7%G(B")
- ("$(7"D#7(B" . "$(7%H(B")
- ("$(7"D#H(B" . "$(7%I(B")
- ("$(7"G#!(B" . "$(7%P(B")
- ("$(7"G##(B" . "$(7%Q(B")
- ("$(7"G#0(B" . "$(7%T(B")
- ("$(7"G#2(B" . "$(7%U(B")
- ("$(7"G#4(B" . "$(7%V(B")
- ("$(7"G#5(B" . "$(7%W(B")
- ("$(7"G#7(B" . "$(7%X(B")
- ("$(7"G#9(B" . "$(7%Y(B")))
- (defconst tibetan-regexp
- (let ((l (list tibetan-precomposed-transcription-alist
- tibetan-consonant-transcription-alist
- tibetan-vowel-transcription-alist
- tibetan-modifier-transcription-alist
- tibetan-subjoined-transcription-alist))
- (separator "\\|")
- tail pattern)
- (while l
- (setq tail (car l) l (cdr l))
- (while tail
- (setq pattern (cons separator (cons (car (car tail)) pattern))
- tail (cdr tail))))
- (apply 'concat (nreverse (cdr pattern))))
- "Regexp matching a Tibetan transcription of a composable Tibetan sequence.
- The result of matching is to be used for indexing alists at conversion
- from a roman transcription to the corresponding Tibetan character.")
- (defvar tibetan-precomposed-regexp
- (purecopy
- (let ((l tibetan-precomposed-transcription-alist)
- temp)
- (setq temp "^\\(")
- (setq temp
- (concat temp (car (car l))))
- (setq l (cdr l))
- (while l
- (setq temp
- (concat temp "\\|" (car (car l))))
- (setq l (cdr l)))
- (concat temp "\\)")))
- "Regexp string to match a romanized Tibetan complex consonant.
- The result of matching is to be used for indexing alists when the input key
- from an input method is converted to the corresponding precomposed glyph.")
- (defvar tibetan-precomposition-rule-regexp
- (purecopy
- (let ((l tibetan-precomposition-rule-alist)
- temp)
- (setq temp "\\(")
- (setq temp (concat temp (car (car l))))
- (setq l (cdr l))
- (while l
- (setq temp (concat temp "\\|" (car (car l))))
- (setq l (cdr l)))
- (concat temp "\\)")))
- "Regexp string to match a sequence of Tibetan consonantic components, i.e.,
- one base consonant and one or more subjoined consonants.
- The result of matching is to be used for indexing alist when the component
- sequence is converted to the corresponding precomposed glyph.
- This also matches some punctuation characters which need conversion.")
- (defvar tibetan-decomposed nil)
- (defvar tibetan-decomposed-temp nil)
- ;; For automatic composition.
- (set-char-table-range
- composition-function-table '(#xF00 . #xFD1)
- (list (vector tibetan-composable-pattern 0 'font-shape-gstring)))
- (provide 'tibetan)
- ;;; tibetan.el ends here
|