[Top][All Lists]
[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]
[Emacs-diffs] Changes to emacs/lisp/language/tibetan.el [emacs-unicode-2
From: |
Kenichi Handa |
Subject: |
[Emacs-diffs] Changes to emacs/lisp/language/tibetan.el [emacs-unicode-2] |
Date: |
Mon, 08 Sep 2003 08:55:55 -0400 |
Index: emacs/lisp/language/tibetan.el
diff -c /dev/null emacs/lisp/language/tibetan.el:1.20.6.1
*** /dev/null Mon Sep 8 08:55:55 2003
--- emacs/lisp/language/tibetan.el Mon Sep 8 08:53:41 2003
***************
*** 0 ****
--- 1,616 ----
+ ;;; tibetan.el --- support for Tibetan language -*- coding: iso-2022-7bit; -*-
+
+ ;; Copyright (C) 1997 Electrotechnical Laboratory, JAPAN.
+ ;; Licensed to the Free Software Foundation.
+ ;; Copyright (C) 2003
+ ;; National Institute of Advanced Industrial Science and Technology (AIST)
+ ;; Registration Number H13PRO009
+
+ ;; Keywords: multilingual, Tibetan, i18n
+
+ ;; This file is part of GNU Emacs.
+
+ ;; GNU Emacs is free software; you can redistribute it and/or modify
+ ;; it under the terms of the GNU General Public License as published by
+ ;; the Free Software Foundation; either version 2, or (at your option)
+ ;; any later version.
+
+ ;; GNU Emacs is distributed in the hope that it will be useful,
+ ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
+ ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ ;; GNU General Public License for more details.
+
+ ;; You should have received a copy of the GNU General Public License
+ ;; along with GNU Emacs; see the file COPYING. If not, write to the
+ ;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+ ;; Boston, MA 02111-1307, USA.
+
+ ;; Author: Toru TOMABECHI, <address@hidden>
+
+ ;; Created: Feb. 17. 1997
+
+ ;; History:
+ ;; 1997.03.13 Modification for special signs and punctuations.
+
+ ;;; Commentary:
+
+ ;;; Code:
+
+ ;;; Tibetan Character set.
+ ;;; \x2130 -- \x234a is a subset of Unicode v.2 \x0f00 - \x0fb9
+ ;;; with a slight modification. And there are some subjoined
+ ;;; consonants which are not specified in Unicode.
+ ;;; I hope I can add missing characters later.
+ ;;;
+ ;;; 00 01 02 03 04 05 06 07 08 09 0A 0B 0C 0D 0E 0F
+ ;;;2120 // $(7!!(B $(7!"(B $(7!#(B $(7!$(B $(7!%(B $(7!&(B
$(7!'(B $(7!((B $(7!)(B $(7!*(B $(7!+(B $(7!,(B $(7!-(B $(7!.(B
$(7!/(B ; obsolete glyphs (2123-5)
+ ;;;2130 $(7!0(B $(7!1(B $(7!2(B $(7!3(B $(7!4(B $(7!5(B $(7!6(B
$(7!7(B $(7!8(B $(7!9(B $(7!:(B $(7!;(B $(7!<(B $(7!=(B $(7!>(B
$(7!?(B ; Punctuations,
+ ;;;2140 $(address@hidden(B $(7!A(B $(7!B(B $(7!C(B $(7!D(B $(7!E(B
$(7!F(B $(7!G(B $(7!H(B $(7!I(B $(7!J(B $(7!K(B $(7!L(B $(7!M(B
$(7!N(B $(7!O(B ; Digits and
+ ;;;2150 $(7!P(B $(7!Q(B $(7!R(B $(7!S(B $(7!T(B $(7!U(B $(7!V(B
$(7!W(B $(7!X(B $(7!Y(B $(7!Z(B $(7![(B $(7!\(B $(7!](B $(7!^(B
$(7!_(B ; Special signs.
+ ;;;2160 $(7!`(B $(7!a(B $(7!b(B $(7!c(B $(7!d(B $(7!e(B $(7!f(B
$(7!g(B $(7!h(B $(7!i(B $(7!j(B $(7!k(B $(7!l(B $(7!m(B $(7!n(B
$(7!o(B ;
+ ;;;2170 $(7!p(B $(7!q(B $(7!r(B $(7!s(B $(7!t(B $(7!u(B $(7!v(B
$(7!w(B $(7!x(B $(7!y(B $(7!z(B $(7!{(B $(7!|(B $(7!}(B $(7!~(B
// ;
+ ;;;
+ ;;; 00 01 02 03 04 05 06 07 08 09 0A 0B 0C 0D 0E 0F
+ ;;;2220 // $(7"!(B $(7""(B $(7"#(B $(7"$(B $(7"%(B $(7"&(B
$(7"'(B $(7"((B $(7")(B $(7"*(B $(7"+(B $(7",(B $(7"-(B $(7".(B
$(7"/(B ; Base consonants
+ ;;;2230 $(7"0(B $(7"1(B $(7"2(B $(7"3(B $(7"4(B $(7"5(B $(7"6(B
$(7"7(B $(7"8(B $(7"9(B $(7":(B $(7";(B $(7"<(B $(7"=(B $(7">(B
$(7"?(B ; and
+ ;;;2240 $(7"@(B $(7"A(B $(7"B(B $(7"C(B $(7"D(B $(7"E(B $(7"F(B
$(7"G(B $(7"H(B $(7"I(B $(7"J(B $(7"K(B $(7"L(B $(7"M(B $(7"N(B
$(7"O(B ; Vowel signs.
+ ;;;2250 $(7"P(B $(7"Q(B $(7"R(B $(7"S(B $(7"T(B $(7"U(B $(7"V(B
$(7"W(B $(7"X(B $(7"Y(B $(7"Z(B $(7"[(B $(7"\(B $(7"](B $(7"^(B
$(7"_(B ; (\x2251 = vowel a)
+ ;;;2260 $(7"`(B $(7"a(B $(7"b(B $(7"c(B $(7"d(B $(7"e(B $(7"f(B
$(7"g(B $(7"h(B $(7"i(B $(7"j(B $(7"k(B $(7"l(B $(7"m(B $(7"n(B
$(7"o(B ; Long vowels and
+ ;;;2270 $(7"p(B $(7"q(B $(7"r(B $(7"s(B $(7"t(B $(7"u(B $(7"v(B
$(7"w(B $(7"x(B $(7"y(B $(7"z(B $(7"{(B $(7"|(B $(7"}(B $(7"~(B
// ; vocalic r, l ARE
+ ;;; ; atomically
+ ;;; ; encoded.
+ ;;; 00 01 02 03 04 05 06 07 08 09 0A 0B 0C 0D 0E 0F
+ ;;;2320 // $(7#!(B $(7#"(B $(7##(B $(7#$(B $(7#%(B $(7#&(B
$(7#'(B $(7#((B $(7#)(B $(7#*(B $(7#+(B $(7#,(B $(7#-(B $(7#.(B
$(7#/(B ; Subjoined consonants
+ ;;;2330 $(7#0(B $(7#1(B $(7#2(B $(7#3(B $(7#4(B $(7#5(B $(7#6(B
$(7#7(B $(7#8(B $(7#9(B $(7#:(B $(7#;(B $(7#<(B $(7#=(B $(7#>(B
$(7#?(B ;
+ ;;;2340 $(address@hidden(B $(7#A(B $(7#B(B $(7#C(B $(7#D(B $(7#E(B
$(7#F(B $(7#G(B $(7#H(B $(7#I(B $(7#J(B $(7#K(B $(7#L(B $(7#M(B
$(7#N(B $(7#O(B ;
+ ;;;2350 $(7#P(B $(7#Q(B $(7#R(B $(7#S(B $(7#T(B $(7#U(B $(7#V(B
$(7#W(B $(7#X(B $(7#Y(B $(7#Z(B $(7#[(B $(7#\(B $(7#](B $(7#^(B
$(7#_(B ; Hereafter, the chars
+ ;;;2360 $(7#`(B $(7#a(B $(7#b(B $(7#c(B $(7#d(B $(7#e(B $(7#f(B
$(7#g(B $(7#h(B $(7#i(B $(7#j(B $(7#k(B $(7#l(B $(7#m(B $(7#n(B
$(7#o(B ; are not specified
+ ;;;2370 $(7#p(B $(7#q(B $(7#r(B $(7#s(B $(7#t(B $(7#u(B $(7#v(B
$(7#w(B $(7#x(B $(7#y(B $(7#z(B $(7#{(B $(7#|(B $(7#}(B $(7#~(B
// ; in Unicode.
+ ;;;
+ ;;; 00 01 02 03 04 05 06 07 08 09 0A 0B 0C 0D 0E 0F
+ ;;;2420 // $(7$!(B $(7$"(B $(7$#(B $(7$$(B $(7$%(B $(7$&(B
$(7$'(B $(7$((B $(7$)(B $(7$*(B $(7$+(B $(7$,(B $(7$-(B $(7$.(B
$(7$/(B ; Precomposed
+ ;;;2430 $(7$0(B $(7$1(B $(7$2(B $(7$3(B $(7$4(B $(7$5(B $(7$6(B
$(7$7(B $(7$8(B $(7$9(B $(7$:(B $(7$;(B $(7$<(B $(7$=(B $(7$>(B
$(7$?(B ; consonants for
+ ;;;2440 $(address@hidden(B $(7$A(B $(7$B(B $(7$C(B $(7$D(B $(7$E(B
$(7$F(B $(7$G(B $(7$H(B $(7$I(B $(7$J(B $(7$K(B $(7$L(B $(7$M(B
$(7$N(B $(7$O(B ; ordinary Tibetan.
+ ;;;2450 $(7$P(B $(7$Q(B $(7$R(B $(7$S(B $(7$T(B $(7$U(B $(7$V(B
$(7$W(B $(7$X(B $(7$Y(B $(7$Z(B $(7$[(B $(7$\(B $(7$](B $(7$^(B
$(7$_(B ; They are decomposed
+ ;;;2460 $(7$`(B $(7$a(B $(7$b(B $(7$c(B $(7$d(B $(7$e(B $(7$f(B
$(7$g(B $(7$h(B $(7$i(B $(7$j(B $(7$k(B $(7$l(B $(7$m(B $(7$n(B
$(7$o(B ; into base and
+ ;;;2470 $(7$p(B $(7$q(B $(7$r(B $(7$s(B $(7$t(B $(7$u(B $(7$v(B
$(7$w(B $(7$x(B $(7$y(B $(7$z(B $(7${(B $(7$|(B $(7$}(B $(7$~(B
// ; subjoined consonants
+ ;;; ; when written on a
+ ;;; 00 01 02 03 04 05 06 07 08 09 0A 0B 0C 0D 0E 0F ; file in Tibetan
+ ;;;2520 // $(7%!(B $(7%"(B $(7%#(B $(7%$(B $(7%%(B $(7%&(B
$(7%'(B $(7%((B $(7%)(B $(7%*(B $(7%+(B $(7%,(B $(7%-(B $(7%.(B
$(7%/(B ; coding system.
+ ;;;2530 $(7%0(B $(7%1(B $(7%2(B $(7%3(B $(7%4(B $(7%5(B $(7%6(B
$(7%7(B $(7%8(B $(7%9(B $(7%:(B $(7%;(B $(7%<(B $(7%=(B $(7%>(B
$(7%?(B ;
+ ;;;2540 $(address@hidden(B $(7%A(B $(7%B(B $(7%C(B $(7%D(B $(7%E(B
$(7%F(B $(7%G(B $(7%H(B $(7%I(B $(7%J(B $(7%K(B $(7%L(B $(7%M(B
$(7%N(B $(7%O(B ;
+ ;;;2550 $(7%P(B $(7%Q(B $(7%R(B $(7%S(B $(7%T(B $(7%U(B $(7%V(B
$(7%W(B $(7%X(B $(7%Y(B $(7%Z(B $(7%[(B $(7%\(B $(7%](B $(7%^(B
$(7%_(B ;
+ ;;;2560 $(7%`(B $(7%a(B $(7%b(B $(7%c(B $(7%d(B $(7%e(B $(7%f(B
$(7%g(B $(7%h(B $(7%i(B $(7%j(B $(7%k(B $(7%l(B $(7%m(B $(7%n(B
$(7%o(B ;
+ ;;;2570 $(7%p(B $(7%q(B $(7%r(B $(7%s(B $(7%t(B $(7%u(B $(7%v(B
$(7%w(B $(7%x(B $(7%y(B $(7%z(B $(7%{(B $(7%|(B $(7%}(B $(7%~(B
// ;
+ ;;;
+
+
+ (define-coding-system 'tibetan-iso-8bit
+ "8-bit encoding for ASCII (MSB=0) and TIBETAN (MSB=1)."
+ :coding-type 'iso-2022
+ :mnemonic ?Q
+ :designation [ascii tibetan nil nil]
+ :charset-list '(ascii tibetan))
+
+ (define-coding-system-alias 'tibetan 'tibetan-iso-8bit)
+
+ (set-language-info-alist
+ "Tibetan" '((charset tibetan tibetan-1-column)
+ (coding-system tibetan-iso-8bit)
+ (coding-priority iso-2022-7bit tibetan-iso-8bit)
+ (input-method . "tibetan-wylie")
+ (features tibet-util)
+ (documentation . t)
+ (sample-text "Tibetan ($(7"7"]"2!;"G#!"Q"2!;(B)
$(7!4!5!5!>"7"!#C"Q!;"E"S"G!;"7"2"[!;"D"["#"G!>"I"]"_!;"9"Q!;"/"S!;"5"Q"2#9"[!;"H"A"U"c!>(B")))
+
+ ;; `$(7"A(B' is included in the pattern for subjoined consonants because we
+ ;; treat it specially in tibetan-add-components.
+ ;; modified by Tomabechi 1999/12/10
+ ;; modified by Tomabechi 2000/06/08
+ ;; To allow infinite addition of vowels/modifiers
+ ;; as specified in Unicode v.3
+ ;; $(7"A(B is removed from the class of subjoined. Tomabechi 2000/06/08
+ ;; (for Unicode support)
+ (defconst tibetan-composable-pattern
+
"[$(7"!(B-$(7"J"K(B][$(7#!(B-$(7#J#K#L#M(B]*[$,1FP$(7"Q"R"S(B-$(7"^"a"b"e(B]*[$(7"_"c"d"g(B-$(7"l!I!e!g(B]*"
+ "Regexp matching a composable sequence of Tibetan characters.")
+
+ ;;;
+ ;;; Definitions of conversion data.
+ ;;;
+
+
+ ;;; alists for tibetan char <-> transcription conversion
+ ;;; longer transcription should come first
+ (defconst tibetan-consonant-transcription-alist
+ '(("tsh" . "$(7";(B")
+ ("dzh" . "$(7"=(B")
+ ("kSH" . "$(7"J(B")
+ ("kh" . "$(7""(B")
+ ("gh" . "$(7"$(B")
+ ("ng" . "$(7"%(B")
+ ("ch" . "$(7"'(B")
+ ("ny" . "$(7"*(B")
+ ("TH" . "$(7",(B")
+ ("DH" . "$(7".(B")
+ ("th" . "$(7"1(B")
+ ("dh" . "$(7"3(B")
+ ("ph" . "$(7"6(B")
+ ("bh" . "$(7"8(B")
+ ("ts" . "$(7":(B")
+ ("dz" . "$(7"<(B")
+ ("zh" . "$(7"?(B")
+ ("sh" . "$(7"E(B")
+ ("SH" . "$(7"F(B")
+ ("k" . "$(7"!(B")
+ ("g" . "$(7"#(B")
+ ("c" . "$(7"&(B")
+ ("j" . "$(7"((B")
+ ("T" . "$(7"+(B")
+ ("D" . "$(7"-(B")
+ ("N" . "$(7"/(B")
+ ("t" . "$(7"0(B")
+ ("d" . "$(7"2(B")
+ ("n" . "$(7"4(B")
+ ("p" . "$(7"5(B")
+ ("b" . "$(7"7(B")
+ ("m" . "$(7"9(B")
+ ("w" . "$(7">(B")
+ ("z" . "$(7"@(B")
+ ("'" . "$(7"A(B")
+ ("y" . "$(7"B(B")
+ ("r" . "$(7"C(B")
+ ("l" . "$(7"D(B")
+ ("s" . "$(7"G(B")
+ ("h" . "$(7"H(B")
+ ("H" . "$(7"H(B")
+ ("A" . "$(7"I(B")
+ ;; Added by Tomabechi 1999/12/10
+ ("R" . "$(7"K(B") ;; fixed form RA
+ ))
+
+
+ (defconst tibetan-vowel-transcription-alist
+ '(
+ ;; Composite Vowels
+ ;; Added by Tomabechi 2000/06/08
+ ("frr" . "$(7"X(B")
+ ("fll" . "$(7"Z(B")
+ ("fa" . "$(7"R(B")
+ ("fi" . "$(7"T(B")
+ ("fu" . "$(7"V(B")
+ ("fr" . "$(7"W(B")
+ ("fl" . "$(7"Y(B")
+ ("fI" . "$(7"b(B")
+ ;; Normal Vowels
+ ("ai" . "$(7"\(B")
+ ("au" . "$(7"^(B")
+ ("ee" . "$(7"\(B")
+ ("oo" . "$(7"^(B")
+ ("a" . "$(7"Q(B") ; invisible vowel sign (\x2251)
+ ("i" . "$(7"S(B")
+ ("u" . "$(7"U(B")
+ ("e" . "$(7"[(B")
+ ("o" . "$(7"](B")
+ ("E" . "$(7"\(B")
+ ("O" . "$(7"^(B")
+ ("I" . "$(7"a(B")
+ ("," . "$(7"e(B") ; idem.
+ ))
+
+ (defconst tibetan-modifier-transcription-alist
+ '(("M" . "$(7"_(B")
+ ("~" . "$(7"c(B")
+ ("`" . "$(7"d(B")
+ ("x" . "$(7"i(B")
+ ("X" . "$(7"j(B")
+ ("v" . "$(7"g(B")
+ ("V" . "$(7"h(B")
+ ("q" . "$(7"k(B")
+ ("Q" . "$(7"l(B")
+ ("_/" . "$(7!I(B")
+ ("_o" . "$(7!g(B")
+ ("_O" . "$(7!e(B")))
+
+ (defconst tibetan-precomposed-transcription-alist
+ '(("phyw" . "$(7$G(B")
+ ("tshw" . "$(7$)(B")
+ ("rtsw" . "$(7%.(B")
+ ("khw" . "$(7$"(B")
+ ("nyw" . "$(7$%(B")
+ ("tsw" . "$(7$((B")
+ ("zhw" . "$(7$*(B")
+ ("shw" . "$(7$.(B")
+ ("khy" . "$(7$A(B")
+ ("phy" . "$(7$D(B")
+ ("khr" . "$(7$Q(B")
+ ("thr" . "$(7$T(B")
+ ("phr" . "$(7$W(B")
+ ("shr" . "$(7$Z(B")
+ ("dzr" . "$(7$^(B")
+ ("grw" . "$(7$_(B")
+ ("rng" . "$(7%#(B")
+ ("rny" . "$(7%%(B")
+ ("rts" . "$(7%+(B")
+ ("rdz" . "$(7%,(B")
+ ("rgw" . "$(7%-(B")
+ ("rky" . "$(7%0(B")
+ ("rgy" . "$(7%1(B")
+ ("rmy" . "$(7%2(B")
+ ("lng" . "$(7%B(B")
+ ("sng" . "$(7%R(B")
+ ("sny" . "$(7%S(B")
+ ("sts" . "$(7%Z(B")
+ ("sky" . "$(7%`(B")
+ ("sgy" . "$(7%a(B")
+ ("spy" . "$(7%b(B")
+ ("sby" . "$(7%c(B")
+ ("smy" . "$(7%d(B")
+ ("skr" . "$(7%p(B")
+ ("sgr" . "$(7%q(B")
+ ("snr" . "$(7%r(B")
+ ("spr" . "$(7%s(B")
+ ("sbr" . "$(7%t(B")
+ ("smr" . "$(7%u(B")
+ ("kw" . "$(7$!(B")
+ ("gw" . "$(7$#(B")
+ ("cw" . "$(7$$(B")
+ ("tw" . "$(7$&(B")
+ ("dw" . "$(7$'(B")
+ ("zw" . "$(7$+(B")
+ ("rw" . "$(7$,(B")
+ ("lw" . "$(7$-(B")
+ ("sw" . "$(7$/(B")
+ ("hw" . "$(7$0(B")
+ ("ky" . "$(address@hidden(B")
+ ("gy" . "$(7$B(B")
+ ("py" . "$(7$C(B")
+ ("by" . "$(7$E(B")
+ ("my" . "$(7$F(B")
+ ("kr" . "$(7$P(B")
+ ("gr" . "$(7$R(B")
+ ("tr" . "$(7$S(B")
+ ("dr" . "$(7$U(B")
+ ("pr" . "$(7$V(B")
+ ("brk" . "$(7"7%!(B")
+ ("brg" . "$(7"7%"(B")
+ ("brng" . "$(7"7%#(B")
+ ("brj" . "$(7"7%$(B")
+ ("brny" . "$(7"7%%(B")
+ ("brt" . "$(7"7%&(B")
+ ("brd" . "$(7"7%'(B")
+ ("brn" . "$(7"7%((B")
+ ("brts" . "$(7"7%+(B")
+ ("brdz" . "$(7"7%,(B")
+ ("brl" . "$(7"7$d(B")
+ ("br" . "$(7$X(B")
+ ("mr" . "$(7$Y(B")
+ ("sr" . "$(7$[(B")
+ ("hr" . "$(7$\(B")
+ ("jr" . "$(7$](B")
+ ("kl" . "$(7$`(B")
+ ("gl" . "$(7$a(B")
+ ("blt" . "$(7"7%E(B")
+ ("bld" . "$(7"7%F(B")
+ ("bl" . "$(7$b(B")
+ ("zl" . "$(7$c(B")
+ ("rl" . "$(7$d(B")
+ ("sl" . "$(7$e(B")
+ ("rk" . "$(7%!(B")
+ ("rg" . "$(7%"(B")
+ ("rj" . "$(7%$(B")
+ ("rt" . "$(7%&(B")
+ ("rd" . "$(7%'(B")
+ ("rn" . "$(7%((B")
+ ("rb" . "$(7%)(B")
+ ("rm" . "$(7%*(B")
+ ("lk" . "$(address@hidden(B")
+ ("lg" . "$(7%A(B")
+ ("lc" . "$(7%C(B")
+ ("lj" . "$(7%D(B")
+ ("lt" . "$(7%E(B")
+ ("ld" . "$(7%F(B")
+ ("ln" . "$(7!!(B") ; dummy \x2121
+ ("lp" . "$(7%G(B")
+ ("lb" . "$(7%H(B")
+ ("lh" . "$(7%I(B")
+ ("sk" . "$(7%P(B")
+ ("sg" . "$(7%Q(B")
+ ("st" . "$(7%T(B")
+ ("sd" . "$(7%U(B")
+ ("sn" . "$(7%V(B")
+ ("sp" . "$(7%W(B")
+ ("sb" . "$(7%X(B")
+ ("sm" . "$(7%Y(B"))
+ )
+
+
+ (defconst tibetan-subjoined-transcription-alist
+ (sort '(("+k" . "$(7#!(B")
+ ("+kh" . "$(7#"(B")
+ ("+g" . "$(7##(B")
+ ("+gh" . "$(7#$(B")
+ ("+ng" . "$(7#%(B")
+ ("+c" . "$(7#&(B")
+ ("+ch" . "$(7#'(B")
+ ("+j" . "$(7#((B")
+ ("+ny" . "$(7#*(B")
+ ("+T" . "$(7#+(B")
+ ("+TH" . "$(7#,(B")
+ ("+D" . "$(7#-(B")
+ ("+DH" . "$(7#.(B")
+ ("+N" . "$(7#/(B")
+ ("+t" . "$(7#0(B")
+ ("+th" . "$(7#1(B")
+ ("+d" . "$(7#2(B")
+ ("+dh" . "$(7#3(B")
+ ("+n" . "$(7#4(B")
+ ("+p" . "$(7#5(B")
+ ("+ph" . "$(7#6(B")
+ ("+b" . "$(7#7(B")
+ ("+bh" . "$(7#8(B")
+ ("+m" . "$(7#9(B")
+ ("+ts" . "$(7#:(B")
+ ("+tsh" . "$(7#;(B")
+ ("+dz" . "$(7#<(B")
+ ("+dzh" . "$(7#=(B")
+ ("+w" . "$(7#>(B")
+ ("+zh" . "$(7#?(B")
+ ("+z" . "$(address@hidden(B")
+ ("+'" . "$(7#A(B")
+ ("+y" . "$(7#B(B")
+ ("+r" . "$(7#C(B")
+ ("+l" . "$(7#D(B")
+ ("+sh" . "$(7#E(B")
+ ("+SH" . "$(7#F(B")
+ ("+s" . "$(7#G(B")
+ ("+h" . "$(7#H(B")
+ ("+A" . "$(7#I(B")
+ ("+kSH" . "$(7#J(B")
+ ;; Added by Tomabechi 1999/12/10
+ ("+W" . "$(7#K(B") ;; fixed form subscribed WA
+ ("+Y" . "$(7#L(B") ;; fixed form subscribed YA
+ ("+R" . "$(7#M(B") ;; fixed form subscribed RA
+ )
+ (lambda (x y) (> (length (car x)) (length (car y))))))
+
+ ;;;
+ ;;; alist for Tibetan base consonant <-> subjoined consonant conversion.
+ ;;;
+ (defconst tibetan-base-to-subjoined-alist
+ '(("$(7"!(B" . "$(7#!(B")
+ ("$(7""(B" . "$(7#"(B")
+ ("$(7"#(B" . "$(7##(B")
+ ("$(7"$(B" . "$(7#$(B")
+ ("$(7"%(B" . "$(7#%(B")
+ ("$(7"&(B" . "$(7#&(B")
+ ("$(7"'(B" . "$(7#'(B")
+ ("$(7"((B" . "$(7#((B")
+ ("$(7"*(B" . "$(7#*(B")
+ ("$(7"+(B" . "$(7#+(B")
+ ("$(7",(B" . "$(7#,(B")
+ ("$(7"-(B" . "$(7#-(B")
+ ("$(7".(B" . "$(7#.(B")
+ ("$(7"/(B" . "$(7#/(B")
+ ("$(7"0(B" . "$(7#0(B")
+ ("$(7"1(B" . "$(7#1(B")
+ ("$(7"2(B" . "$(7#2(B")
+ ("$(7"3(B" . "$(7#3(B")
+ ("$(7"4(B" . "$(7#4(B")
+ ("$(7"5(B" . "$(7#5(B")
+ ("$(7"6(B" . "$(7#6(B")
+ ("$(7"7(B" . "$(7#7(B")
+ ("$(7"8(B" . "$(7#8(B")
+ ("$(7"9(B" . "$(7#9(B")
+ ("$(7":(B" . "$(7#:(B")
+ ("$(7";(B" . "$(7#;(B")
+ ("$(7"<(B" . "$(7#<(B")
+ ("$(7"=(B" . "$(7#=(B")
+ ("$(7">(B" . "$(7#>(B")
+ ("$(7"?(B" . "$(7#?(B")
+ ("$(7"@(B" . "$(address@hidden(B")
+ ("$(7"A(B" . "$(7#A(B")
+ ("$(7"B(B" . "$(7#B(B")
+ ("$(7"C(B" . "$(7#C(B")
+ ("$(7"D(B" . "$(7#D(B")
+ ("$(7"E(B" . "$(7#E(B")
+ ("$(7"F(B" . "$(7#F(B")
+ ("$(7"G(B" . "$(7#G(B")
+ ("$(7"H(B" . "$(7#H(B")
+ ("$(7"I(B" . "$(7#I(B")
+ ("$(7"J(B" . "$(7#J(B")
+ ;; Added by Tomabechi 1999/12/10
+ ("$(7"K(B" . "$(7#M(B") ;; Fixed form RA (224B->234D)
+ ))
+
+ ;;; alist for Tibetan composite vowels (long i, vocalic r, etc.)
+ ;;; New varialble. created by Tomabechi 2000/06/08
+ (defconst tibetan-composite-vowel-alist
+ '(;; LONG A
+ ;; ("$(7"R(B" . ((bc . tc) ?$(7"R(B))
+ ;; LONG I
+ ("$(7"T(B" . (?$(7"R(B (tc . bc) ?$(7"S(B))
+ ;; LONG U
+ ("$(7"V(B" . (?$(7"R(B (bc . tc) ?$(7"U(B))
+ ;; VOCALIC R
+ ("$(7"W(B" . (?$(7#C(B (tc . bc) ?$(7"a(B))
+ ;; LONG VOCALIC R
+ ("$(7"X(B" . (?$(7#C(B (bc . tc) ?$(7"R(B (tc . bc) ?$(7"a(B))
+ ;; VOCALIC L
+ ("$(7"Y(B" . (?$(7#D(B (tc . bc) ?$(7"a(B))
+ ;;$(7!;(BLONG VOCALIC L
+ ("$(7"Z(B" . (?$(7#D(B (bc . tc) ?$(7"R(B (tc . bc) ?$(7"a(B))
+ ;; LONG REVERSE I
+ ("$(7"b(B" . (?$(7"R(B (tc . bc) ?$(7"a(B))
+ ))
+
+
+
+ ;;;
+ ;;; alist for Tibetan consonantic components <-> precomposed glyph conversion.
+ ;;; (includes some punctuation conversion rules)
+ ;;;
+ (defconst tibetan-precomposition-rule-alist
+ `(("$(7"6#B#>(B" . "$(7$G(B")
+ ("$(7"##C#>(B" . "$(7$_(B")
+ ("$(7";#>(B" . "$(7$)(B")
+ ("$(7"C#:#>(B" . "$(7%.(B")
+ ("$(7"C###>(B" . "$(7%-(B")
+ ("$(7"C#!#B(B" . "$(7%0(B")
+ ("$(7"C###B(B" . "$(7%1(B")
+ ("$(7"C#9#B(B" . "$(7%2(B")
+ ("$(7"G#!#B(B" . "$(7%`(B")
+ ("$(7"G###B(B" . "$(7%a(B")
+ ("$(7"G#5#B(B" . "$(7%b(B")
+ ("$(7"G#7#B(B" . "$(7%c(B")
+ ("$(7"G#9#B(B" . "$(7%d(B")
+ ("$(7"G#!#C(B" . "$(7%p(B")
+ ("$(7"G###C(B" . "$(7%q(B")
+ ("$(7"G#4#C(B" . "$(7%r(B")
+ ("$(7"G#5#C(B" . "$(7%s(B")
+ ("$(7"G#7#C(B" . "$(7%t(B")
+ ("$(7"G#9#C(B" . "$(7%u(B")
+ ("$(7""#>(B" . "$(7$"(B")
+ ("$(7"*#>(B" . "$(7$%(B")
+ ("$(7":#>(B" . "$(7$((B")
+ ("$(7"?#>(B" . "$(7$*(B")
+ ("$(7"E#>(B" . "$(7$.(B")
+ ("$(7""#B(B" . "$(7$A(B")
+ ("$(7"6#B(B" . "$(7$D(B")
+ ("$(7""#C(B" . "$(7$Q(B")
+ ("$(7"1#C(B" . "$(7$T(B")
+ ("$(7"6#C(B" . "$(7$W(B")
+ ("$(7"E#C(B" . "$(7$Z(B")
+ ("$(7"<#C(B" . "$(7$^(B")
+ ("$(7"C#%(B" . "$(7%#(B")
+ ("$(7"C#*(B" . "$(7%%(B")
+ ("$(7"C#:(B" . "$(7%+(B")
+ ("$(7"C#<(B" . "$(7%,(B")
+ ("$(7"D#%(B" . "$(7%B(B")
+ ("$(7"G#%(B" . "$(7%R(B")
+ ("$(7"G#*(B" . "$(7%S(B")
+ ("$(7"G#:(B" . "$(7%Z(B")
+ ("$(7"!#>(B" . "$(7$!(B")
+ ("$(7"##>(B" . "$(7$#(B")
+ ("$(7"&#>(B" . "$(7$$(B")
+ ("$(7"0#>(B" . "$(7$&(B")
+ ("$(7"2#>(B" . "$(7$'(B")
+ ("$(7"@#>(B" . "$(7$+(B")
+ ("$(7"C#>(B" . "$(7$,(B")
+ ("$(7"D#>(B" . "$(7$-(B")
+ ("$(7"G#>(B" . "$(7$/(B")
+ ("$(7"H#>(B" . "$(7$0(B")
+ ("$(7"!#B(B" . "$(address@hidden(B")
+ ("$(7"##B(B" . "$(7$B(B")
+ ("$(7"5#B(B" . "$(7$C(B")
+ ("$(7"7#B(B" . "$(7$E(B")
+ ("$(7"9#B(B" . "$(7$F(B")
+ ("$(7"!#C(B" . "$(7$P(B")
+ ("$(7"##C(B" . "$(7$R(B")
+ ("$(7"0#C(B" . "$(7$S(B")
+ ("$(7"2#C(B" . "$(7$U(B")
+ ("$(7"5#C(B" . "$(7$V(B")
+ ("$(7"7#C(B" . "$(7$X(B")
+ ("$(7"9#C(B" . "$(7$Y(B")
+ ("$(7"G#C(B" . "$(7$[(B")
+ ("$(7"H#C(B" . "$(7$\(B")
+ ("$(7"(#C(B" . "$(7$](B")
+ ("$(7"!#D(B" . "$(7$`(B")
+ ("$(7"##D(B" . "$(7$a(B")
+ ("$(7"7#D(B" . "$(7$b(B")
+ ("$(7"@#D(B" . "$(7$c(B")
+ ("$(7"C#D(B" . "$(7$d(B")
+ ("$(7"G#D(B" . "$(7$e(B")
+ ("$(7"C#!(B" . "$(7%!(B")
+ ("$(7"C##(B" . "$(7%"(B")
+ ("$(7"C#((B" . "$(7%$(B")
+ ("$(7"C#0(B" . "$(7%&(B")
+ ("$(7"C#2(B" . "$(7%'(B")
+ ("$(7"C#4(B" . "$(7%((B")
+ ("$(7"C#7(B" . "$(7%)(B")
+ ("$(7"C#9(B" . "$(7%*(B")
+ ("$(7"D#!(B" . "$(address@hidden(B")
+ ("$(7"D##(B" . "$(7%A(B")
+ ("$(7"D#4(B" . "$(7!!(B") ; dummy 0x2121 added 2000/06/08 for
transition l -> lng
+ ("$(7"D#&(B" . "$(7%C(B")
+ ("$(7"D#((B" . "$(7%D(B")
+ ("$(7"D#0(B" . "$(7%E(B")
+ ("$(7"D#2(B" . "$(7%F(B")
+ ("$(7"D#5(B" . "$(7%G(B")
+ ("$(7"D#7(B" . "$(7%H(B")
+ ("$(7"D#H(B" . "$(7%I(B")
+ ("$(7"G#!(B" . "$(7%P(B")
+ ("$(7"G##(B" . "$(7%Q(B")
+ ("$(7"G#0(B" . "$(7%T(B")
+ ("$(7"G#2(B" . "$(7%U(B")
+ ("$(7"G#4(B" . "$(7%V(B")
+ ("$(7"G#5(B" . "$(7%W(B")
+ ("$(7"G#7(B" . "$(7%X(B")
+ ("$(7"G#9(B" . "$(7%Y(B")))
+
+ (defconst tibetan-regexp
+ (let ((l (list tibetan-precomposed-transcription-alist
+ tibetan-consonant-transcription-alist
+ tibetan-vowel-transcription-alist
+ tibetan-modifier-transcription-alist
+ tibetan-subjoined-transcription-alist))
+ (separator "\\|")
+ tail pattern)
+ (while l
+ (setq tail (car l) l (cdr l))
+ (while tail
+ (setq pattern (cons separator (cons (car (car tail)) pattern))
+ tail (cdr tail))))
+ (apply 'concat (nreverse (cdr pattern))))
+ "Regexp matching a Tibetan transcription of a composable Tibetan sequence.
+ The result of matching is to be used for indexing alists at conversion
+ from a roman transcription to the corresponding Tibetan character.")
+
+ (defvar tibetan-precomposed-regexp
+ (let ((l tibetan-precomposed-transcription-alist)
+ temp)
+ (setq temp "^\\(")
+ (setq temp
+ (concat temp (car (car l))))
+ (setq l (cdr l))
+ (while l
+ (setq temp
+ (concat temp "\\|" (car (car l))))
+ (setq l (cdr l)))
+ (concat temp "\\)"))
+ "Regexp string to match a romanized Tibetan complex consonant.
+ The result of matching is to be used for indexing alists when the input key
+ from an input method is converted to the corresponding precomposed glyph.")
+
+ (defvar tibetan-precomposition-rule-regexp
+ (let ((l tibetan-precomposition-rule-alist)
+ temp)
+ (setq temp "\\(")
+ (setq temp (concat temp (car (car l))))
+ (setq l (cdr l))
+ (while l
+ (setq temp (concat temp "\\|" (car (car l))))
+ (setq l (cdr l)))
+ (concat temp "\\)"))
+ "Regexp string to match a sequence of Tibetan consonantic components, i.e.,
+ one base consonant and one or more subjoined consonants.
+ The result of matching is to be used for indexing alist when the component
+ sequence is converted to the corresponding precomposed glyph.
+ This also matches some punctuation characters which need conversion.")
+
+ (defvar tibetan-decomposed nil)
+ (defvar tibetan-decomposed-temp nil)
+
+
+ ;; For automatic composition.
+ (dolist (range '((?$(7#!(B . ?$(7#J(B) "$(7#K#L#M"Q"R(B" (?$(7"S(B .
?$(7"^(B) "$(7"a"b"e"_"c"d(B" (?$(7"g(B . ?$(7"l(B) "$(7!I!e!g(B"))
+ (if (stringp range)
+ (dotimes (i (length range))
+ (aset composition-function-table (aref range i)
+ 'tibetan-composition-function))
+ (set-char-table-range composition-function-table range
+ 'tibetan-composition-function)))
+
+ (provide 'tibetan)
+
+ ;;; tibetan.el ends here
[Prev in Thread] |
Current Thread |
[Next in Thread] |
- [Emacs-diffs] Changes to emacs/lisp/language/tibetan.el [emacs-unicode-2],
Kenichi Handa <=