summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorKenichi Handa <handa@m17n.org>1997-04-05 02:44:02 +0000
committerKenichi Handa <handa@m17n.org>1997-04-05 02:44:02 +0000
commit8d941f84d701cea344bf9321150bcf5fb35c2b3e (patch)
treed7c034dd6835850e5d26a346837d34a29e3ce974
parentfa9241652a4b410ab528a460e11b358283180f57 (diff)
downloademacs-8d941f84d701cea344bf9321150bcf5fb35c2b3e.tar.gz
Initial revision
-rw-r--r--lisp/language/english.el74
-rw-r--r--lisp/language/tibet-util.el453
-rw-r--r--lisp/language/tibetan.el620
3 files changed, 1147 insertions, 0 deletions
diff --git a/lisp/language/english.el b/lisp/language/english.el
new file mode 100644
index 00000000000..e4ff06861ad
--- /dev/null
+++ b/lisp/language/english.el
@@ -0,0 +1,74 @@
+;;; english.el --- English support
+
+;; Copyright (C) 1997 Free Software Foundation, Inc.
+;; Copyright (C) 1997 Electrotechnical Laboratory, JAPAN.
+
+;; Keywords: multibyte character, character set, syntax, category
+
+;; This file is part of GNU Emacs.
+
+;; GNU Emacs is free software; you can redistribute it and/or modify
+;; it under the terms of the GNU General Public License as published by
+;; the Free Software Foundation; either version 2, or (at your option)
+;; any later version.
+
+;; GNU Emacs is distributed in the hope that it will be useful,
+;; but WITHOUT ANY WARRANTY; without even the implied warranty of
+;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+;; GNU General Public License for more details.
+
+;; You should have received a copy of the GNU General Public License
+;; along with GNU Emacs; see the file COPYING. If not, write to the
+;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+;; Boston, MA 02111-1307, USA.
+
+;;; Commentary:
+
+;; We need nothing special to support English on Emacs. Selecting
+;; English as a language environment is one of the ways to reset
+;; various multilingual environment to the original settting.
+
+;;; Code
+
+(defun setup-english-environment ()
+ "Reset MULE (multilingual environment) to the default status."
+ (interactive)
+ (setq-default enable-multibyte-characters t)
+ (if (local-variable-p 'enable-multibyte-characters)
+ (setq enable-multibyte-characters t))
+
+ (setq coding-category-internal 'internal
+ coding-category-iso-7 'iso-2022-7
+ coding-category-iso-8-1 'iso-8859-1
+ coding-category-iso-8-2 'iso-8859-1
+ coding-category-iso-else 'iso-8859-1
+ coding-category-sjis 'sjis
+ coding-category-big5 'big5
+ coding-category-binary 'no-conversion)
+
+ (set-coding-priority
+ '(coding-category-iso-7
+ coding-category-iso-8-2
+ coding-category-iso-8-1
+ coding-category-iso-else
+ coding-category-internal
+ coding-category-binary
+ coding-category-sjis
+ coding-category-big5))
+
+ (setq-default buffer-file-coding-system 'iso-8859-1)
+ (set-terminal-coding-system 'iso-8859-1)
+ (set-keyboard-coding-system 'iso-8859-1)
+ )
+
+(set-language-info-alist
+ "English" '((setup-function . setup-english-environment)
+ (tutorial . "TUTORIAL")
+ (charset . (ascii))
+ (documentation . t)
+ (sample-text . "Hello!, Hi!, How are you?")))
+
+(register-input-method "English"
+ '("quail-dvorak" quail-use-package "quail/latin"))
+
+;;; english.el ends here
diff --git a/lisp/language/tibet-util.el b/lisp/language/tibet-util.el
new file mode 100644
index 00000000000..cc4624e4014
--- /dev/null
+++ b/lisp/language/tibet-util.el
@@ -0,0 +1,453 @@
+;;; language/tibet-util.el -- Support for inputting Tibetan characters
+
+;; Copyright (C) 1995 Free Software Foundation, Inc.
+;; Copyright (C) 1995 Electrotechnical Laboratory, JAPAN.
+
+;; Keywords: multilingual, Tibetan
+
+;; This file is part of GNU Emacs.
+
+;; GNU Emacs is free software; you can redistribute it and/or modify
+;; it under the terms of the GNU General Public License as published by
+;; the Free Software Foundation; either version 2, or (at your option)
+;; any later version.
+
+;; GNU Emacs is distributed in the hope that it will be useful,
+;; but WITHOUT ANY WARRANTY; without even the implied warranty of
+;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+;; GNU General Public License for more details.
+
+;; You should have received a copy of the GNU General Public License
+;; along with GNU Emacs; see the file COPYING. If not, write to the
+;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+;; Boston, MA 02111-1307, USA.
+
+;; Author: Toru TOMABECHI, <Toru.Tomabechi@orient.unil.ch>
+
+;; Created: Feb. 17. 1997
+
+;; History:
+;; 1997.03.13 Modification in treatment of text properties;
+;; Support for some special signs and punctuations.
+
+;;; Code:
+
+;;; This function makes a transcription string for
+;;; re-composing a character.
+
+;;;###autoload
+(defun tibetan-tibetan-to-transcription (ch)
+ "Return a transcription string of Tibetan character CH"
+ (let ((char ch)
+ (l (append tibetan-consonant-transcription-alist
+ tibetan-vowel-transcription-alist
+ tibetan-precomposed-transcription-alist
+ tibetan-subjoined-transcription-alist))
+ decomp-l t-char trans str result)
+ (if (eq (char-charset char) 'composition)
+ (setq decomp-l (decompose-composite-char char 'list nil))
+ (setq decomp-l (cons char nil)))
+ (setq str "")
+ (while decomp-l
+ (setq t-char (char-to-string (car decomp-l)))
+ (setq trans (car (rassoc t-char l)))
+ (setq str (concat str trans))
+ (setq decomp-l (cdr decomp-l)))
+ (setq result str)))
+
+;;; This function translates transcription string into a string of
+;;; Tibetan characters.
+
+;;;###autoload
+(defun tibetan-transcription-to-tibetan (transcription)
+ "Translate Roman transcription into a sequence of Tibetan components."
+ (let ((trans transcription)
+ (lp tibetan-precomposed-transcription-alist)
+ (l (append tibetan-consonant-transcription-alist
+ tibetan-vowel-transcription-alist
+ tibetan-subjoined-transcription-alist))
+ (case-fold-search nil)
+ substr t-char p-str t-str result)
+ (setq substr "")
+ (setq p-str "")
+ (setq t-str "")
+ (cond ((string-match tibetan-precomposed-regexp trans)
+ (setq substr (substring trans (match-beginning 0) (match-end 0)))
+ (setq trans (substring trans (match-end 0)))
+ (setq t-char (cdr (assoc substr lp)))
+ (setq p-str t-char)))
+ (while (string-match tibetan-regexp trans)
+ (setq substr (substring trans (match-beginning 0) (match-end 0)))
+ (setq trans (substring trans 0 (match-beginning 0)))
+ (setq t-char
+ (cdr (assoc substr l)))
+ (setq t-str (concat t-char t-str)))
+ (setq result (concat p-str t-str))))
+
+
+;;;
+;;; Functions for composing Tibetan character.
+;;;
+;;; A Tibetan syllable is typically structured as follows:
+;;;
+;;; [Prefix] C [C+] V [M] [Suffix [Post suffix]]
+;;;
+;;; where C's are all vertically stacked, V appears below or above
+;;; consonant cluster and M is always put above the C[C+]V combination.
+;;; (Sanskrit visarga, though it is a vowel modifier, is considered
+;;; to be a punctuation.)
+;;;
+;;; Here are examples of the words "bsgrubs" and "h'uM"
+;;;
+;;; $(7"72%q`"U1"7"G(B 2$(7"H`#A`"U0"_1(B
+;;;
+;;; M
+;;; b s b s h
+;;; g '
+;;; r u
+;;; u
+;;;
+;;; Consonants ''', 'w', 'y', 'r' take special forms when they are used
+;;; as subjoined consonant. Consonant 'r' takes another special form
+;;; when used as superjoined as in "rka", and so on, while it does not
+;;; change its form when conjoined with subjoined ''', 'w' or 'y'
+;;; as in "rwa", "rya".
+;;;
+;;;
+;;; As a Tibetan input method should avoid using conversion key,
+;;; we use a "Tibetan glyph -> transcription -> Tibetan glyph"
+;;; translation at each key input.
+;;;
+;;; 1st stage - Check the preceding char.
+;;; If the preceding char is Tibetan and composable, then
+;;;
+;;; 2nd stage - Translate the preceding char into transcription
+;;;
+;;; 3rd stage - Concatenate the transcription of preceding char
+;;; and the current input key.
+;;;
+;;; 4th stage - Re-translate the concatenated transcription into
+;;; a sequence of Tibetan letters.
+;;;
+;;; 5th stage - Convert leading consonants into one single precomposed char
+;;; if possible.
+;;;
+;;; 6th stage - Compose the consonants into one composite glyph.
+;;;
+;;; (If the current input is a vowel sign or a vowel modifier,
+;;; then it is composed with preceding char without checking
+;;; except when the preceding char is a punctuation or a digit.)
+;;;
+;;;
+
+;;; This function is used to avoid composition
+;;; between Tibetan and non-Tibetan chars.
+
+;;;###autoload
+(defun tibetan-char-examin (ch)
+ "Check if char CH is Tibetan character.
+Returns non-nil if CH is Tibetan. Otherwise, returns nil."
+ (let ((chr ch))
+ (if (eq (char-charset chr) 'composition)
+ (string-match "\\cq+" (decompose-composite-char chr))
+ (string-match "\\cq" (char-to-string chr)))))
+
+;;; This is used to avoid composition between digits, signs, punctuations
+;;; and word constituents.
+
+;;;###autoload
+(defun tibetan-composable-examin (ch)
+ "Check if Tibetan char CH is composable.
+Returns t if CH is a composable char \(i.e. neither punctuation nor digit)."
+ (let ((chr ch)
+ chstr)
+ (if (eq (char-charset chr) 'composition)
+ (setq chstr (decompose-composite-char chr))
+ (setq chstr (char-to-string chr)))
+ (not (string-match "[$(7!1(B-$(7!o"f$(8!;!=!?!@!A!D"`(B]" chstr))))
+
+
+;;; This checks if a character to be composed contains already
+;;; one or more vowels / vowel modifiers. If the character contains
+;;; them, then no more consonant should be added.
+
+;;;###autoload
+(defun tibetan-complete-char-examin (ch)
+ "Check if composite char CH contains one or more vowel/vowel modifiers.
+Returns non-nil, if CH contains vowel/vowel modifiers."
+ (let ((chr ch)
+ chstr)
+ (if (eq (char-charset chr) 'composition)
+ (setq chstr (decompose-composite-char chr))
+ (setq chstr (char-to-string chr)))
+ (string-match "[$(7!g!e"Q(B-$(7"^"_(B-$(7"l(B]" chstr)))
+
+;;; This function makes a composite character consisting of two characters
+;;; vertically stacked.
+
+;;;###autoload
+(defun tibetan-vertical-stacking (first second upward)
+ "Return a vertically stacked composite char consisting of FIRST and SECOND.
+If UPWARD is non-nil, then SECOND is put above FIRST."
+ (if upward
+ (compose-chars first '(tc . bc) second)
+ (compose-chars first '(bc . tc) second)))
+
+;;; This function makes a composite char from a string.
+;;; Note that this function returns a string, not a char.
+
+;;;###autoload
+(defun tibetan-compose-string (str)
+ "Compose a sequence of Tibetan character components into a composite character.
+Returns a string containing a composite character."
+ (let ((t-str str)
+ f-str s-str f-ch s-ch rest composed result)
+ ;;Make sure no redundant vowel sign is present.
+ (if (string-match
+ "^\\(.+\\)\\($(7"Q(B\\)\\([$(7!I!g!e"Q(B-$(7"^"_(B-$(7"l(B]\\)" t-str)
+ (setq t-str (concat
+ (match-string 1 t-str)
+ (match-string 3 t-str))))
+ (if (string-match
+ "^\\(.+\\)\\([$(7!I!g!e"Q(B-$(7"^"_(B-$(7"l(B]\\)\\($(7"Q(B\\)" t-str)
+ (setq t-str (concat
+ (match-string 1 t-str)
+ (match-string 2 t-str))))
+ ;;Start conversion.
+ (setq result "")
+ ;; Consecutive base/precomposed consonants are reduced to the last one.
+ (while (string-match "^\\([$(7"!(B-$(7"J$!(B-$(7%u(B]\\)\\([$(7"!(B-$(7"@"B(B-$(7"J$!(B-$(7%u(B].*\\)" t-str)
+ (setq result (concat result (match-string 1 t-str)))
+ (setq t-str (match-string 2 t-str)))
+ ;; Vowel/vowel modifier, subjoined consonants are added one by one
+ ;; to the preceding element.
+ (while
+ (string-match "^\\(.\\)\\([$(7"A#!(B-$(7#J!I!g!e"Q(B-$(7"^"_(B-$(7"l(B]\\)\\(.*\\)" t-str)
+ (setq f-str (match-string 1 t-str))
+ (setq f-ch (string-to-char f-str))
+ (setq s-str (match-string 2 t-str))
+ ;;Special treatment for 'a chung.
+ ;;If 'a follows a consonant, then turned into its subjoined form.
+ (if (and (string-match "$(7"A(B" s-str)
+ (not (tibetan-complete-char-examin f-ch)))
+ (setq s-str "$(7#A(B"))
+ (setq s-ch (string-to-char s-str))
+ (setq rest (match-string 3 t-str))
+ (cond ((string-match "\\c2" s-str);; upper vowel sign
+ (setq composed
+ (tibetan-vertical-stacking f-ch s-ch t)))
+ ((string-match "\\c3" s-str);; lower vowel sign
+ (setq composed
+ (tibetan-vertical-stacking f-ch s-ch nil)))
+ ;;Automatic conversion of ra-mgo (superscribed r).
+ ;;'r' is converted if followed by a subjoined consonant
+ ;;other than w, ', y, r.
+ ((and (string-match "$(7"C(B" f-str)
+ (not (string-match "[$(7#>#A#B#C(B]" s-str)))
+ (setq f-ch ?$(7#P(B)
+ (setq composed
+ (tibetan-vertical-stacking f-ch s-ch nil)))
+ ((not (tibetan-complete-char-examin f-ch))
+ ;;Initial base consonant is tranformed, if followed by
+ ;;a subjoined consonant, except when it is followed
+ ;;by a subscribed 'a.
+ (if (and (string-match "[$(7"!(B-$(7"="?"@"D(B-$(7"J(B]" f-str)
+ (not (string-match "$(7#A(B" s-str)))
+ (setq f-ch
+ (string-to-char
+ (cdr (assoc f-str tibetan-base-to-subjoined-alist)))))
+ (setq composed
+ (tibetan-vertical-stacking f-ch s-ch nil)))
+ (t
+ (setq composed s-str)
+ (setq result (concat result f-str))))
+ (setq t-str (concat composed rest)))
+ (setq result (concat result t-str))))
+
+;;; quail <-> conversion interface.
+
+(defun tibetan-composition (pc key)
+ "Interface to quail input method.
+Takes two arguments: char PC and string KEY, where PC is the preceding
+character to be composed with current input KEY.
+Returns a string which is the result of composition."
+ (let (trans cur-ch t-str result)
+ ;; Make a tibetan character corresponding to current input key.
+ (setq cur-ch (tibetan-transcription-to-tibetan key))
+ ;; Check if the preceding character is Tibetan and composable.
+ (cond ((and (tibetan-char-examin pc)
+ (tibetan-composable-examin pc))
+ ;;If Tibetan char corresponding to the current input key exists,
+ (cond (cur-ch
+ ;; Then,
+ ;; Convert the preceding character into transcription,
+ ;; and concatenate it with the current input key,
+ (setq trans (tibetan-tibetan-to-transcription pc))
+ (setq trans (concat trans key))
+ ;; Concatenated transcription is converted to
+ ;; a sequence of Tibetan characters,
+ (setq t-str (tibetan-transcription-to-tibetan trans))
+ ;; And it is composed into a composite character.
+ (setq result (tibetan-compose-string t-str)))
+ ;; Else,
+ (t
+ ;; Simply concatenate the preceding character and
+ ;; the current input key.
+ (setq result (char-to-string pc))
+ (setq result (concat result key)))))
+ ;; If the preceding char is not Tibetan or not composable,
+ (t
+ ;; pc = 0 means the point is at the beginning of buffer.
+ (if (not (eq pc 0))
+ (setq result (char-to-string pc)))
+ (if cur-ch
+ (setq result (concat result cur-ch))
+ (setq result (concat result key))))
+ )))
+
+
+;;;###autoload
+(defun tibetan-decompose-region (beg end)
+ "Decompose Tibetan characters in the region BEG END into their components.
+Components are: base and subjoined consonants, vowel signs, vowel modifiers.
+One column punctuations are converted to their 2 column equivalents."
+ (interactive "r")
+ (let (ch-str ch-beg ch-end)
+ (save-excursion
+ (save-restriction
+ (narrow-to-region beg end)
+ (goto-char (point-min))
+ ;; \\cq = Tibetan character
+ (while (re-search-forward "\\cq" nil t)
+ (setq ch-str (buffer-substring-no-properties
+ (match-beginning 0) (match-end 0)))
+ ;; Save the points. Maybe, using save-match-data is preferable.
+ ;; But in order not to lose the trace(because the body is too long),
+ ;; we save the points in variables.
+ (setq ch-beg (match-beginning 0))
+ (setq ch-end (match-end 0))
+ ;; Here starts the decomposition.
+ (cond
+ ;; 1 column punctuations -> 2 column equivalent
+ ((string-match "[$(8!D!;!=!?!@!A"`(B]" ch-str)
+ (setq ch-str
+ (car (rassoc ch-str tibetan-precomposition-rule-alist))))
+ ;; Decomposition of composite character.
+ ((eq (char-charset (string-to-char ch-str)) 'composition)
+ ;; Make a string which consists of a sequence of
+ ;; components.
+ (setq ch-str (decompose-composite-char (string-to-char ch-str)))
+ ;; Converts nyi zla into base elements.
+ (cond ((string= ch-str "$(7#R#S#S#S(B")
+ (setq ch-str "$(7!4!5!5(B"))
+ ((string= ch-str "$(7#R#S#S(B")
+ (setq ch-str "$(7!4!5(B"))
+ ((string= ch-str "$(7#R#S!I(B")
+ (setq ch-str "$(7!6(B"))
+ ((string= ch-str "$(7#R#S(B")
+ (setq ch-str "$(7!4(B")))))
+ ;; If the sequence of components starts with a subjoined consonants,
+ (if (string-match "^\\([$(7#!(B-$(7#J(B]\\)\\(.*\\)$" ch-str)
+ ;; then the first components is converted to its base form.
+ (setq ch-str
+ (concat (car (rassoc (match-string 1 ch-str)
+ tibetan-base-to-subjoined-alist))
+ (match-string 2 ch-str))))
+ ;; If the sequence of components starts with a precomposed character,
+ (if (string-match "^\\([$(7$!(B-$(7%u(B]\\)\\(.*\\)$" ch-str)
+ ;; then it is converted into a sequence of components.
+ (setq ch-str
+ (concat (car (rassoc (match-string 1 ch-str)
+ tibetan-precomposition-rule-alist))
+ (match-string 2 ch-str))))
+ ;; Special treatment for superscribed r.
+ (if (string-match "^$(7#P(B\\(.*\\)$" ch-str)
+ (setq ch-str (concat "$(7"C(B" (match-string 1 ch-str))))
+ ;; Finally, the result of decomposition is inserted, and
+ ;; the composite character is deleted.
+ (insert-and-inherit ch-str)
+ (delete-region ch-beg ch-end))))))
+
+;;;###autoload
+(defun tibetan-compose-region (beg end)
+ "Make composite chars from Tibetan character components in the region BEG END.
+Two column punctuations are converted to their 1 column equivalents."
+ (interactive "r")
+ (let (str result)
+ (save-excursion
+ (save-restriction
+ (narrow-to-region beg end)
+ (goto-char (point-min))
+ ;; First, sequence of components which has a precomposed equivalent
+ ;; is converted.
+ (while (re-search-forward
+ tibetan-precomposition-rule-regexp nil t)
+ (setq str (buffer-substring-no-properties
+ (match-beginning 0) (match-end 0)))
+ (save-match-data
+ (insert-and-inherit
+ (cdr (assoc str tibetan-precomposition-rule-alist))))
+ (delete-region (match-beginning 0) (match-end 0)))
+ (goto-char (point-min))
+ ;; Then, composable elements are put into a composite character.
+ (while (re-search-forward
+ "[$(7"!(B-$(7"J$!(B-$(7%u(B]+[$(7#!(B-$(7#J!I!g!e"Q(B-$(7"^"_(B-$(7"l(B]+"
+ nil t)
+ (setq str (buffer-substring-no-properties
+ (match-beginning 0) (match-end 0)))
+ (save-match-data
+ (setq result (tibetan-compose-string str))
+ (insert-and-inherit result))
+ (delete-region (match-beginning 0) (match-end 0)))))))
+
+;;;
+;;; This variable is used to avoid repeated decomposition.
+;;;
+(setq-default tibetan-decomposed nil)
+
+;;;###autoload
+(defun tibetan-decompose-buffer ()
+ "Decomposes Tibetan characters in the buffer into their components.
+See also docstring of the function tibetan-decompose-region."
+ (interactive)
+ (make-local-variable 'tibetan-decomposed)
+ (cond ((not tibetan-decomposed)
+ (tibetan-decompose-region (point-min) (point-max))
+ (setq tibetan-decomposed t))))
+
+;;;###autoload
+(defun tibetan-compose-buffer ()
+ "Composes Tibetan character components in the buffer.
+See also docstring of the function tibetan-compose-region."
+ (interactive)
+ (make-local-variable 'tibetan-decomposed)
+ (tibetan-compose-region (point-min) (point-max))
+ (setq tibetan-decomposed nil))
+
+;;;###autoload
+(defun tibetan-post-read-conversion (len)
+ (save-excursion
+ (save-restriction
+ (let ((buffer-modified-p (buffer-modified-p)))
+ (narrow-to-region (point) (+ (point) len))
+ (tibetan-compose-region (point-min) (point-max))
+ (set-buffer-modified-p buffer-modified-p)
+ (point-max))))
+ (make-local-variable 'tibetan-decomposed)
+ (setq tibetan-decomposed nil))
+
+
+;;;###autoload
+(defun tibetan-pre-write-conversion (from to)
+ (setq tibetan-decomposed-temp tibetan-decomposed)
+ (let ((old-buf (current-buffer))
+ (work-buf (get-buffer-create " *tibetan-work*")))
+ (set-buffer work-buf)
+ (erase-buffer)
+ (insert-buffer-substring old-buf from to)
+ (if (not tibetan-decomposed-temp)
+ (tibetan-decompose-region (point-min) (point-max)))))
+
+(provide 'language/tibet-util)
+
+;;; language/tibet-util.el ends here.
diff --git a/lisp/language/tibetan.el b/lisp/language/tibetan.el
new file mode 100644
index 00000000000..d54689119c6
--- /dev/null
+++ b/lisp/language/tibetan.el
@@ -0,0 +1,620 @@
+;;; tibetan.el --- Support for Tibetan language
+
+;; Copyright (C) 1997 Free Software Foundation, Inc.
+;; Copyright (C) 1997 Electrotechnical Laboratory, JAPAN.
+
+;; Keywords: multilingual, Tibetan
+
+;; This file is part of GNU Emacs.
+
+;; GNU Emacs is free software; you can redistribute it and/or modify
+;; it under the terms of the GNU General Public License as published by
+;; the Free Software Foundation; either version 2, or (at your option)
+;; any later version.
+
+;; GNU Emacs is distributed in the hope that it will be useful,
+;; but WITHOUT ANY WARRANTY; without even the implied warranty of
+;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+;; GNU General Public License for more details.
+
+;; You should have received a copy of the GNU General Public License
+;; along with GNU Emacs; see the file COPYING. If not, write to the
+;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+;; Boston, MA 02111-1307, USA.
+
+;; Author: Toru TOMABECHI, <Toru.Tomabechi@orient.unil.ch>
+
+;; Created: Feb. 17. 1997
+
+;; History:
+;; 1997.03.13 Modification for special signs and punctuations.
+
+;;; Code:
+
+(define-category ?q "Tibetan")
+(modify-category-entry (make-char 'tibetan) ?q)
+(modify-category-entry (make-char 'tibetan-1-column) ?q)
+
+(let ((row 33))
+ (while (< row 38)
+ (modify-category-entry (make-char 'tibetan row) ?q)
+ (setq row (1+ row))))
+
+(modify-category-entry (make-char 'tibetan-1-column 33) ?q)
+
+(let ((deflist '(;; chars syntax category
+ ("$(7"!(B-$(7"J(B" "w" ?0) ; consonant
+ ("$(7#!(B-$(7#J#P#Q(B" "w" ?0) ;
+ ("$(7$!(B-$(7$e(B" "w" ?0) ;
+ ("$(7%!(B-$(7%u(B" "w" ?0) ;
+ ("$(7"S"["\"]"^"a(B" "w" ?2) ; upper vowel
+ ("$(7"_"c"d"g"h"i"j"k"l(B" "w" ?2) ; upper modifier
+ ("$(7!I"Q"U"e!e!g(B" "w" ?3) ; lowel vowel/modifier
+ ("$(7!P(B-$(7!Y!Z(B-$(7!c(B" "w" ?6) ; digit
+ ("$(7!;!=(B-$(7!B!D"`(B" "." ?|) ; line-break char
+ ("$(8!;!=!?!@!A!D"`(B" "." ?|) ;
+ ("$(7!8!;!=(B-$(7!B!D"`!m!d(B" "." ?>) ; prohibition
+ ("$(8!;!=!?!@!A!D"`(B" "." ?>) ;
+ ("$(7!0(B-$(7!:!l#R#S"f(B" "." ?<) ; prohibition
+ ("$(7!C!E(B-$(7!H!J(B-$(7!O!f!h(B-$(7!k!n!o(B" "." ?q) ; others
+ ))
+ elm chars len syntax category to ch i)
+ (while deflist
+ (setq elm (car deflist))
+ (setq chars (car elm)
+ len (length chars)
+ syntax (nth 1 elm)
+ category (nth 2 elm)
+ i 0)
+ (while (< i len)
+ (if (= (aref chars i) ?-)
+ (setq i (1+ i)
+ to (sref chars i))
+ (setq ch (sref chars i)
+ to ch))
+ (while (<= ch to)
+ (modify-syntax-entry ch syntax)
+ (modify-category-entry ch category)
+ (setq ch (1+ ch)))
+ (setq i (+ i (char-bytes to))))
+ (setq deflist (cdr deflist))))
+
+
+;;; Tibetan Character set.
+;;; \x2130 -- \x234a is a subset of Unicode v.2 \x0f00 - \x0fb9
+;;; with a slight modification. And there are some subjoined
+;;; consonants which are not specified in Unicode.
+;;; I hope I can add missing characters later.
+;;;
+;;; 00 01 02 03 04 05 06 07 08 09 0A 0B 0C 0D 0E 0F
+;;;2120 // $(7!!(B $(7!"(B $(7!#(B $(7!$(B $(7!%(B $(7!&(B $(7!'(B $(7!((B $(7!)(B $(7!*(B $(7!+(B $(7!,(B $(7!-(B $(7!.(B $(7!/(B ;
+;;;2130 $(7!0(B $(7!1(B $(7!2(B $(7!3(B $(7!4(B $(7!5(B $(7!6(B $(7!7(B $(7!8(B $(7!9(B $(7!:(B $(7!;(B $(7!<(B $(7!=(B $(7!>(B $(7!?(B ; Punctuations,
+;;;2140 $(7!@(B $(7!A(B $(7!B(B $(7!C(B $(7!D(B $(7!E(B $(7!F(B $(7!G(B $(7!H(B $(7!I(B $(7!J(B $(7!K(B $(7!L(B $(7!M(B $(7!N(B $(7!O(B ; Digits and
+;;;2150 $(7!P(B $(7!Q(B $(7!R(B $(7!S(B $(7!T(B $(7!U(B $(7!V(B $(7!W(B $(7!X(B $(7!Y(B $(7!Z(B $(7![(B $(7!\(B $(7!](B $(7!^(B $(7!_(B ; Special signs.
+;;;2160 $(7!`(B $(7!a(B $(7!b(B $(7!c(B $(7!d(B $(7!e(B $(7!f(B $(7!g(B $(7!h(B $(7!i(B $(7!j(B $(7!k(B $(7!l(B $(7!m(B $(7!n(B $(7!o(B ;
+;;;2170 $(7!p(B $(7!q(B $(7!r(B $(7!s(B $(7!t(B $(7!u(B $(7!v(B $(7!w(B $(7!x(B $(7!y(B $(7!z(B $(7!{(B $(7!|(B $(7!}(B $(7!~(B // ;
+;;;
+;;; 00 01 02 03 04 05 06 07 08 09 0A 0B 0C 0D 0E 0F
+;;;2220 // $(7"!(B $(7""(B $(7"#(B $(7"$(B $(7"%(B $(7"&(B $(7"'(B $(7"((B $(7")(B $(7"*(B $(7"+(B $(7",(B $(7"-(B $(7".(B $(7"/(B ; Base consonants
+;;;2230 $(7"0(B $(7"1(B $(7"2(B $(7"3(B $(7"4(B $(7"5(B $(7"6(B $(7"7(B $(7"8(B $(7"9(B $(7":(B $(7";(B $(7"<(B $(7"=(B $(7">(B $(7"?(B ; and
+;;;2240 $(7"@(B $(7"A(B $(7"B(B $(7"C(B $(7"D(B $(7"E(B $(7"F(B $(7"G(B $(7"H(B $(7"I(B $(7"J(B $(7"K(B $(7"L(B $(7"M(B $(7"N(B $(7"O(B ; Vowel signs.
+;;;2250 $(7"P(B $(7"Q(B $(7"R(B $(7"S(B $(7"T(B $(7"U(B $(7"V(B $(7"W(B $(7"X(B $(7"Y(B $(7"Z(B $(7"[(B $(7"\(B $(7"](B $(7"^(B $(7"_(B ; (\x2251 = vowel a)
+;;;2260 $(7"`(B $(7"a(B $(7"b(B $(7"c(B $(7"d(B $(7"e(B $(7"f(B $(7"g(B $(7"h(B $(7"i(B $(7"j(B $(7"k(B $(7"l(B $(7"m(B $(7"n(B $(7"o(B ; Long vowels and
+;;;2270 $(7"p(B $(7"q(B $(7"r(B $(7"s(B $(7"t(B $(7"u(B $(7"v(B $(7"w(B $(7"x(B $(7"y(B $(7"z(B $(7"{(B $(7"|(B $(7"}(B $(7"~(B // ; vocalic r, l are
+;;; ; not atomically
+;;; ; encoded.
+;;; 00 01 02 03 04 05 06 07 08 09 0A 0B 0C 0D 0E 0F
+;;;2320 // $(7#!(B $(7#"(B $(7##(B $(7#$(B $(7#%(B $(7#&(B $(7#'(B $(7#((B $(7#)(B $(7#*(B $(7#+(B $(7#,(B $(7#-(B $(7#.(B $(7#/(B ; Subjoined consonants
+;;;2330 $(7#0(B $(7#1(B $(7#2(B $(7#3(B $(7#4(B $(7#5(B $(7#6(B $(7#7(B $(7#8(B $(7#9(B $(7#:(B $(7#;(B $(7#<(B $(7#=(B $(7#>(B $(7#?(B ;
+;;;2340 $(7#@(B $(7#A(B $(7#B(B $(7#C(B $(7#D(B $(7#E(B $(7#F(B $(7#G(B $(7#H(B $(7#I(B $(7#J(B $(7#K(B $(7#L(B $(7#M(B $(7#N(B $(7#O(B ; 'a chung (\x2341)is
+;;; ; here,
+;;; ; while in Unicode
+;;; ; it is classified
+;;; ; as a vowel sign
+;;; ; (\x0f71).
+;;;
+;;;2350 $(7#P(B $(7#Q(B $(7#R(B $(7#S(B $(7#T(B $(7#U(B $(7#V(B $(7#W(B $(7#X(B $(7#Y(B $(7#Z(B $(7#[(B $(7#\(B $(7#](B $(7#^(B $(7#_(B ; Hereafter, the chars
+;;;2360 $(7#`(B $(7#a(B $(7#b(B $(7#c(B $(7#d(B $(7#e(B $(7#f(B $(7#g(B $(7#h(B $(7#i(B $(7#j(B $(7#k(B $(7#l(B $(7#m(B $(7#n(B $(7#o(B ; are not specified
+;;;2370 $(7#p(B $(7#q(B $(7#r(B $(7#s(B $(7#t(B $(7#u(B $(7#v(B $(7#w(B $(7#x(B $(7#y(B $(7#z(B $(7#{(B $(7#|(B $(7#}(B $(7#~(B // ; in Unicode.
+;;; ; The character \x2351
+;;; ; is not used in our
+;;; ; implementation.
+;;; 00 01 02 03 04 05 06 07 08 09 0A 0B 0C 0D 0E 0F
+;;;2420 // $(7$!(B $(7$"(B $(7$#(B $(7$$(B $(7$%(B $(7$&(B $(7$'(B $(7$((B $(7$)(B $(7$*(B $(7$+(B $(7$,(B $(7$-(B $(7$.(B $(7$/(B ; Precomposed
+;;;2430 $(7$0(B $(7$1(B $(7$2(B $(7$3(B $(7$4(B $(7$5(B $(7$6(B $(7$7(B $(7$8(B $(7$9(B $(7$:(B $(7$;(B $(7$<(B $(7$=(B $(7$>(B $(7$?(B ; consonants for
+;;;2440 $(7$@(B $(7$A(B $(7$B(B $(7$C(B $(7$D(B $(7$E(B $(7$F(B $(7$G(B $(7$H(B $(7$I(B $(7$J(B $(7$K(B $(7$L(B $(7$M(B $(7$N(B $(7$O(B ; ordinary Tibetan.
+;;;2450 $(7$P(B $(7$Q(B $(7$R(B $(7$S(B $(7$T(B $(7$U(B $(7$V(B $(7$W(B $(7$X(B $(7$Y(B $(7$Z(B $(7$[(B $(7$\(B $(7$](B $(7$^(B $(7$_(B ; They are decomposed
+;;;2460 $(7$`(B $(7$a(B $(7$b(B $(7$c(B $(7$d(B $(7$e(B $(7$f(B $(7$g(B $(7$h(B $(7$i(B $(7$j(B $(7$k(B $(7$l(B $(7$m(B $(7$n(B $(7$o(B ; into base and
+;;;2470 $(7$p(B $(7$q(B $(7$r(B $(7$s(B $(7$t(B $(7$u(B $(7$v(B $(7$w(B $(7$x(B $(7$y(B $(7$z(B $(7${(B $(7$|(B $(7$}(B $(7$~(B // ; subjoined consonants
+;;; ; when written on a
+;;; 00 01 02 03 04 05 06 07 08 09 0A 0B 0C 0D 0E 0F ; file in Tibetan
+;;;2520 // $(7%!(B $(7%"(B $(7%#(B $(7%$(B $(7%%(B $(7%&(B $(7%'(B $(7%((B $(7%)(B $(7%*(B $(7%+(B $(7%,(B $(7%-(B $(7%.(B $(7%/(B ; coding system.
+;;;2530 $(7%0(B $(7%1(B $(7%2(B $(7%3(B $(7%4(B $(7%5(B $(7%6(B $(7%7(B $(7%8(B $(7%9(B $(7%:(B $(7%;(B $(7%<(B $(7%=(B $(7%>(B $(7%?(B ;
+;;;2540 $(7%@(B $(7%A(B $(7%B(B $(7%C(B $(7%D(B $(7%E(B $(7%F(B $(7%G(B $(7%H(B $(7%I(B $(7%J(B $(7%K(B $(7%L(B $(7%M(B $(7%N(B $(7%O(B ;
+;;;2550 $(7%P(B $(7%Q(B $(7%R(B $(7%S(B $(7%T(B $(7%U(B $(7%V(B $(7%W(B $(7%X(B $(7%Y(B $(7%Z(B $(7%[(B $(7%\(B $(7%](B $(7%^(B $(7%_(B ;
+;;;2560 $(7%`(B $(7%a(B $(7%b(B $(7%c(B $(7%d(B $(7%e(B $(7%f(B $(7%g(B $(7%h(B $(7%i(B $(7%j(B $(7%k(B $(7%l(B $(7%m(B $(7%n(B $(7%o(B ;
+;;;2570 $(7%p(B $(7%q(B $(7%r(B $(7%s(B $(7%t(B $(7%u(B $(7%v(B $(7%w(B $(7%x(B $(7%y(B $(7%z(B $(7%{(B $(7%|(B $(7%}(B $(7%~(B // ;
+;;;
+
+
+(make-coding-system
+ 'tibetan 2 ?Q
+ "Coding-system used for ASCII(MSB=0) & TIBETAN(MSB=1)."
+ '((ascii t) (tibetan t) nil nil
+ nil ascii-eol))
+
+(put 'tibetan 'post-read-conversion 'tibetan-post-read-conversion)
+(put 'tibetan 'pre-write-conversion 'tibetan-pre-write-conversion)
+
+(register-input-method
+ "Tibetan" '("quail-tibetan-wylie" quail-use-package "quail/tibetan"))
+(register-input-method
+ "Tibetan" '("quail-tibetan-tibkey" quail-use-package "quail/tibetan"))
+
+(defun setup-tibetan-environment ()
+ (setq coding-category-iso-7 'tibetan)
+
+ (set-coding-priority
+ '(coding-category-iso-7
+ coding-category-iso-8-1))
+
+ (setq-default buffer-file-coding-system 'iso-2022-7)
+
+ (setq default-input-method '("Tibetan" . "quail-tibetan-wylie")))
+
+(set-language-info-alist
+ "Tibetan" '((setup-function . setup-tibetan-environment)
+ (charset . (tibetan tibetan-1-column))
+ (coding-system . (tibetan))
+ (documentation . t)
+ (sample-text .
+"Tibetan (2$(7"70"]1"2$(8!;2$(7%P`"Q1"2$(8!;(B) 2$(7#RP#SP#S1!>"72$P`"Q1$(8!;2$(7"E0"S1"G$(8!;$(7"72"20"[1$(8!;2$(7"D0"[1"#"G!>2"I0"]0"_1$(8!;2$(7"9`"Q1$(8!;2$(7"/0"S1$(8!;2$(7"5`"Q12#2`#90"[1$(8!;2$(7"H`#A`"U0"c1!>(B")))
+
+
+;;;
+;;; Definitions of conversion data.
+;;;
+
+
+;;; alists for tibetan char <-> transcription conversion
+;;; longer transcription should come first
+(defconst tibetan-consonant-transcription-alist
+ '(("tsh" . "$(7";(B")
+ ("dzh" . "$(7"=(B")
+ ("kSH" . "$(7"J(B")
+ ("kh" . "$(7""(B")
+ ("gh" . "$(7"$(B")
+ ("ng" . "$(7"%(B")
+ ("ch" . "$(7"'(B")
+ ("ny" . "$(7"*(B")
+ ("TH" . "$(7",(B")
+ ("DH" . "$(7".(B")
+ ("th" . "$(7"1(B")
+ ("dh" . "$(7"3(B")
+ ("ph" . "$(7"6(B")
+ ("bh" . "$(7"8(B")
+ ("ts" . "$(7":(B")
+ ("dz" . "$(7"<(B")
+ ("zh" . "$(7"?(B")
+ ("sh" . "$(7"E(B")
+ ("SH" . "$(7"F(B")
+ ("k" . "$(7"!(B")
+ ("g" . "$(7"#(B")
+ ("c" . "$(7"&(B")
+ ("j" . "$(7"((B")
+ ("T" . "$(7"+(B")
+ ("D" . "$(7"-(B")
+ ("N" . "$(7"/(B")
+ ("t" . "$(7"0(B")
+ ("d" . "$(7"2(B")
+ ("n" . "$(7"4(B")
+ ("p" . "$(7"5(B")
+ ("b" . "$(7"7(B")
+ ("m" . "$(7"9(B")
+ ("w" . "$(7">(B")
+ ("z" . "$(7"@(B")
+ ("'" . "$(7"A(B")
+ ("y" . "$(7"B(B")
+ ("r" . "$(7"C(B")
+ ("l" . "$(7"D(B")
+ ("s" . "$(7"G(B")
+ ("h" . "$(7"H(B")
+ ("H" . "$(7"H(B")
+ ("A" . "$(7"I(B")))
+
+
+(defconst tibetan-vowel-transcription-alist
+ '(("ai" . "$(7"\(B")
+ ("au" . "$(7"^(B")
+ ("ee" . "$(7"\(B")
+ ("oo" . "$(7"^(B")
+ ("a" . "$(7"Q(B") ; invisible vowel sign (\x2251)
+ ("i" . "$(7"S(B")
+ ("u" . "$(7"U(B")
+ ("e" . "$(7"[(B")
+ ("o" . "$(7"](B")
+ ("E" . "$(7"\(B")
+ ("O" . "$(7"^(B")
+ ("I" . "$(7"a(B")
+ ("M" . "$(7"_(B")
+ ("~" . "$(7"c(B") ; not specified in Ext.wylie
+ ("`" . "$(7"d(B") ; idem.
+ ("," . "$(7"e(B") ; idem.
+ ("v" . "$(7"g(B") ; idem.
+ ("V" . "$(7"h(B") ; idem.
+ ("x" . "$(7"i(B") ; idem.
+ ("X" . "$(7"j(B") ; idem.
+ ("q" . "$(7"k(B") ; idem.
+ ("Q" . "$(7"l(B") ; idem.
+ ("_o" . "$(7!g(B") ; idem.
+ ("_O" . "$(7!e(B") ; idem.
+ ("_/" . "$(7!I(B") ; idem.
+ ))
+
+(defconst tibetan-precomposed-transcription-alist
+ '(("phyw" . "$(7$G(B")
+ ("tshw" . "$(7$)(B")
+ ("rtsw" . "$(7%.(B")
+ ("khw" . "$(7$"(B")
+ ("nyw" . "$(7$%(B")
+ ("tsw" . "$(7$((B")
+ ("zhw" . "$(7$*(B")
+ ("shw" . "$(7$.(B")
+ ("khy" . "$(7$A(B")
+ ("phy" . "$(7$D(B")
+ ("khr" . "$(7$Q(B")
+ ("thr" . "$(7$T(B")
+ ("phr" . "$(7$W(B")
+ ("shr" . "$(7$Z(B")
+ ("dzr" . "$(7$^(B")
+ ("grw" . "$(7$_(B")
+ ("rng" . "$(7%#(B")
+ ("rny" . "$(7%%(B")
+ ("rts" . "$(7%+(B")
+ ("rdz" . "$(7%,(B")
+ ("rgw" . "$(7%-(B")
+ ("rky" . "$(7%0(B")
+ ("rgy" . "$(7%1(B")
+ ("rmy" . "$(7%2(B")
+ ("lng" . "$(7%B(B")
+ ("sng" . "$(7%R(B")
+ ("sny" . "$(7%S(B")
+ ("sts" . "$(7%Z(B")
+ ("sky" . "$(7%`(B")
+ ("sgy" . "$(7%a(B")
+ ("spy" . "$(7%b(B")
+ ("sby" . "$(7%c(B")
+ ("smy" . "$(7%d(B")
+ ("skr" . "$(7%p(B")
+ ("sgr" . "$(7%q(B")
+ ("snr" . "$(7%r(B")
+ ("spr" . "$(7%s(B")
+ ("sbr" . "$(7%t(B")
+ ("smr" . "$(7%u(B")
+ ("kw" . "$(7$!(B")
+ ("gw" . "$(7$#(B")
+ ("cw" . "$(7$$(B")
+ ("tw" . "$(7$&(B")
+ ("dw" . "$(7$'(B")
+ ("zw" . "$(7$+(B")
+ ("rw" . "$(7$,(B")
+ ("lw" . "$(7$-(B")
+ ("sw" . "$(7$/(B")
+ ("hw" . "$(7$0(B")
+ ("ky" . "$(7$@(B")
+ ("gy" . "$(7$B(B")
+ ("py" . "$(7$C(B")
+ ("by" . "$(7$E(B")
+ ("my" . "$(7$F(B")
+ ("kr" . "$(7$P(B")
+ ("gr" . "$(7$R(B")
+ ("tr" . "$(7$S(B")
+ ("dr" . "$(7$U(B")
+ ("pr" . "$(7$V(B")
+ ("brk" . "$(7"7%!(B")
+ ("brg" . "$(7"7%"(B")
+ ("brng" . "$(7"7%#(B")
+ ("brj" . "$(7"7%$(B")
+ ("brny" . "$(7"7%%(B")
+ ("brt" . "$(7"7%&(B")
+ ("brd" . "$(7"7%'(B")
+ ("brn" . "$(7"7%((B")
+ ("brts" . "$(7"7%+(B")
+ ("brdz" . "$(7"7%,(B")
+ ("brl" . "$(7"7$d(B")
+ ("br" . "$(7$X(B")
+ ("mr" . "$(7$Y(B")
+ ("sr" . "$(7$[(B")
+ ("hr" . "$(7$\(B")
+ ("jr" . "$(7$](B")
+ ("kl" . "$(7$`(B")
+ ("gl" . "$(7$a(B")
+ ("blt" . "$(7"7%E(B")
+ ("bld" . "$(7"7%F(B")
+ ("bl" . "$(7$b(B")
+ ("zl" . "$(7$c(B")
+ ("rl" . "$(7$d(B")
+ ("sl" . "$(7$e(B")
+ ("rk" . "$(7%!(B")
+ ("rg" . "$(7%"(B")
+ ("rj" . "$(7%$(B")
+ ("rt" . "$(7%&(B")
+ ("rd" . "$(7%'(B")
+ ("rn" . "$(7%((B")
+ ("rb" . "$(7%)(B")
+ ("rm" . "$(7%*(B")
+ ("lk" . "$(7%@(B")
+ ("lg" . "$(7%A(B")
+ ("lc" . "$(7%C(B")
+ ("lj" . "$(7%D(B")
+ ("lt" . "$(7%E(B")
+ ("ld" . "$(7%F(B")
+ ("ln" . "$(7!!(B") ; dummy \x2121
+ ("lp" . "$(7%G(B")
+ ("lb" . "$(7%H(B")
+ ("lh" . "$(7%I(B")
+ ("sk" . "$(7%P(B")
+ ("sg" . "$(7%Q(B")
+ ("st" . "$(7%T(B")
+ ("sd" . "$(7%U(B")
+ ("sn" . "$(7%V(B")
+ ("sp" . "$(7%W(B")
+ ("sb" . "$(7%X(B")
+ ("sm" . "$(7%Y(B")))
+
+(defconst tibetan-subjoined-transcription-alist
+ '(("+k" . "$(7#!(B")
+ ("+kh" . "$(7#"(B")
+ ("+g" . "$(7##(B")
+ ("+gh" . "$(7#$(B")
+ ("+ng" . "$(7#%(B")
+ ("+c" . "$(7#&(B")
+ ("+ch" . "$(7#'(B")
+ ("+j" . "$(7#((B")
+ ("+ny" . "$(7#*(B")
+ ("+T" . "$(7#+(B")
+ ("+TH" . "$(7#,(B")
+ ("+D" . "$(7#-(B")
+ ("+DH" . "$(7#.(B")
+ ("+N" . "$(7#/(B")
+ ("+t" . "$(7#0(B")
+ ("+th" . "$(7#1(B")
+ ("+d" . "$(7#2(B")
+ ("+dh" . "$(7#3(B")
+ ("+n" . "$(7#4(B")
+ ("+p" . "$(7#5(B")
+ ("+ph" . "$(7#6(B")
+ ("+b" . "$(7#7(B")
+ ("+bh" . "$(7#8(B")
+ ("+m" . "$(7#9(B")
+ ("+ts" . "$(7#:(B")
+ ("+tsh" . "$(7#;(B")
+ ("+dz" . "$(7#<(B")
+ ("+dzh" . "$(7#=(B")
+ ("+w" . "$(7#>(B")
+ ("+zh" . "$(7#?(B")
+ ("+z" . "$(7#@(B")
+ ("+'" . "$(7#A(B")
+ ("+y" . "$(7#B(B")
+ ("+r" . "$(7#C(B")
+ ("+l" . "$(7#D(B")
+ ("+sh" . "$(7#E(B")
+ ("+SH" . "$(7#F(B")
+ ("+s" . "$(7#G(B")
+ ("+h" . "$(7#H(B")
+ ("+A" . "$(7#I(B")
+ ("+kSH" . "$(7#J(B")
+ ("R" . "$(7#P(B")))
+
+;;;
+;;; alist for Tibetan base consonant <-> subjoined consonant conversion.
+;;;
+(defconst tibetan-base-to-subjoined-alist
+ '(("$(7"!(B" . "$(7#!(B")
+ ("$(7""(B" . "$(7#"(B")
+ ("$(7"#(B" . "$(7##(B")
+ ("$(7"$(B" . "$(7#$(B")
+ ("$(7"%(B" . "$(7#%(B")
+ ("$(7"&(B" . "$(7#&(B")
+ ("$(7"'(B" . "$(7#'(B")
+ ("$(7"((B" . "$(7#((B")
+ ("$(7"*(B" . "$(7#*(B")
+ ("$(7"+(B" . "$(7#+(B")
+ ("$(7",(B" . "$(7#,(B")
+ ("$(7"-(B" . "$(7#-(B")
+ ("$(7".(B" . "$(7#.(B")
+ ("$(7"/(B" . "$(7#/(B")
+ ("$(7"0(B" . "$(7#0(B")
+ ("$(7"1(B" . "$(7#1(B")
+ ("$(7"2(B" . "$(7#2(B")
+ ("$(7"3(B" . "$(7#3(B")
+ ("$(7"4(B" . "$(7#4(B")
+ ("$(7"5(B" . "$(7#5(B")
+ ("$(7"6(B" . "$(7#6(B")
+ ("$(7"7(B" . "$(7#7(B")
+ ("$(7"8(B" . "$(7#8(B")
+ ("$(7"9(B" . "$(7#9(B")
+ ("$(7":(B" . "$(7#:(B")
+ ("$(7";(B" . "$(7#;(B")
+ ("$(7"<(B" . "$(7#<(B")
+ ("$(7"=(B" . "$(7#=(B")
+ ("$(7">(B" . "$(7#>(B")
+ ("$(7"?(B" . "$(7#?(B")
+ ("$(7"@(B" . "$(7#@(B")
+ ("$(7"A(B" . "$(7#A(B")
+ ("$(7"B(B" . "$(7#B(B")
+ ("$(7"C(B" . "$(7#C(B")
+ ("$(7"D(B" . "$(7#D(B")
+ ("$(7"E(B" . "$(7#E(B")
+ ("$(7"F(B" . "$(7#F(B")
+ ("$(7"G(B" . "$(7#G(B")
+ ("$(7"H(B" . "$(7#H(B")
+ ("$(7"I(B" . "$(7#I(B")
+ ("$(7"J(B" . "$(7#J(B")))
+
+;;;
+;;; alist for Tibetan consonantic components <-> precomposed glyph conversion.
+;;; (includes some punctuation conversion rules)
+;;;
+(defconst tibetan-precomposition-rule-alist
+ '(("$(7"6#B#>(B" . "$(7$G(B")
+ ("$(7"##C#>(B" . "$(7$_(B")
+ ("$(7";#>(B" . "$(7$)(B")
+ ("$(7"C#:#>(B" . "$(7%.(B")
+ ("$(7"C###>(B" . "$(7%-(B")
+ ("$(7"C#!#B(B" . "$(7%0(B")
+ ("$(7"C###B(B" . "$(7%1(B")
+ ("$(7"C#9#B(B" . "$(7%2(B")
+ ("$(7"G#!#B(B" . "$(7%`(B")
+ ("$(7"G###B(B" . "$(7%a(B")
+ ("$(7"G#5#B(B" . "$(7%b(B")
+ ("$(7"G#7#B(B" . "$(7%c(B")
+ ("$(7"G#9#B(B" . "$(7%d(B")
+ ("$(7"G#!#C(B" . "$(7%p(B")
+ ("$(7"G###C(B" . "$(7%q(B")
+ ("$(7"G#4#C(B" . "$(7%r(B")
+ ("$(7"G#5#C(B" . "$(7%s(B")
+ ("$(7"G#7#C(B" . "$(7%t(B")
+ ("$(7"G#9#C(B" . "$(7%u(B")
+ ("$(7""#>(B" . "$(7$"(B")
+ ("$(7"*#>(B" . "$(7$%(B")
+ ("$(7":#>(B" . "$(7$((B")
+ ("$(7"?#>(B" . "$(7$*(B")
+ ("$(7"E#>(B" . "$(7$.(B")
+ ("$(7""#B(B" . "$(7$A(B")
+ ("$(7"6#B(B" . "$(7$D(B")
+ ("$(7""#C(B" . "$(7$Q(B")
+ ("$(7"1#C(B" . "$(7$T(B")
+ ("$(7"6#C(B" . "$(7$W(B")
+ ("$(7"E#C(B" . "$(7$Z(B")
+ ("$(7"<#C(B" . "$(7$^(B")
+ ("$(7"C#%(B" . "$(7%#(B")
+ ("$(7"C#*(B" . "$(7%%(B")
+ ("$(7"C#:(B" . "$(7%+(B")
+ ("$(7"C#<(B" . "$(7%,(B")
+ ("$(7"D#%(B" . "$(7%B(B")
+ ("$(7"G#%(B" . "$(7%R(B")
+ ("$(7"G#*(B" . "$(7%S(B")
+ ("$(7"G#:(B" . "$(7%Z(B")
+ ("$(7"!#>(B" . "$(7$!(B")
+ ("$(7"##>(B" . "$(7$#(B")
+ ("$(7"&#>(B" . "$(7$$(B")
+ ("$(7"0#>(B" . "$(7$&(B")
+ ("$(7"2#>(B" . "$(7$'(B")
+ ("$(7"@#>(B" . "$(7$+(B")
+ ("$(7"C#>(B" . "$(7$,(B")
+ ("$(7"D#>(B" . "$(7$-(B")
+ ("$(7"G#>(B" . "$(7$/(B")
+ ("$(7"H#>(B" . "$(7$0(B")
+ ("$(7"!#B(B" . "$(7$@(B")
+ ("$(7"##B(B" . "$(7$B(B")
+ ("$(7"5#B(B" . "$(7$C(B")
+ ("$(7"7#B(B" . "$(7$E(B")
+ ("$(7"9#B(B" . "$(7$F(B")
+ ("$(7"!#C(B" . "$(7$P(B")
+ ("$(7"##C(B" . "$(7$R(B")
+ ("$(7"0#C(B" . "$(7$S(B")
+ ("$(7"2#C(B" . "$(7$U(B")
+ ("$(7"5#C(B" . "$(7$V(B")
+ ("$(7"7#C(B" . "$(7$X(B")
+ ("$(7"9#C(B" . "$(7$Y(B")
+ ("$(7"G#C(B" . "$(7$[(B")
+ ("$(7"H#C(B" . "$(7$\(B")
+ ("$(7"(#C(B" . "$(7$](B")
+ ("$(7"!#D(B" . "$(7$`(B")
+ ("$(7"##D(B" . "$(7$a(B")
+ ("$(7"7#D(B" . "$(7$b(B")
+ ("$(7"@#D(B" . "$(7$c(B")
+ ("$(7"C#D(B" . "$(7$d(B")
+ ("$(7"G#D(B" . "$(7$e(B")
+ ("$(7"C#!(B" . "$(7%!(B")
+ ("$(7"C##(B" . "$(7%"(B")
+ ("$(7"C#((B" . "$(7%$(B")
+ ("$(7"C#0(B" . "$(7%&(B")
+ ("$(7"C#2(B" . "$(7%'(B")
+ ("$(7"C#4(B" . "$(7%((B")
+ ("$(7"C#7(B" . "$(7%)(B")
+ ("$(7"C#9(B" . "$(7%*(B")
+ ("$(7"D#!(B" . "$(7%@(B")
+ ("$(7"D##(B" . "$(7%A(B")
+ ("$(7"D#&(B" . "$(7%C(B")
+ ("$(7"D#((B" . "$(7%D(B")
+ ("$(7"D#0(B" . "$(7%E(B")
+ ("$(7"D#2(B" . "$(7%F(B")
+ ("$(7"D#5(B" . "$(7%G(B")
+ ("$(7"D#7(B" . "$(7%H(B")
+ ("$(7"D#H(B" . "$(7%I(B")
+ ("$(7"G#!(B" . "$(7%P(B")
+ ("$(7"G##(B" . "$(7%Q(B")
+ ("$(7"G#0(B" . "$(7%T(B")
+ ("$(7"G#2(B" . "$(7%U(B")
+ ("$(7"G#4(B" . "$(7%V(B")
+ ("$(7"G#5(B" . "$(7%W(B")
+ ("$(7"G#7(B" . "$(7%X(B")
+ ("$(7"G#9(B" . "$(7%Y(B")
+ ("$(7!=(B" . "$(8!=(B") ; 2 col <-> 1 col
+ ("$(7!?(B" . "$(8!?(B")
+ ("$(7!@(B" . "$(8!@(B")
+ ("$(7!A(B" . "$(8!A(B")
+ ("$(7"`(B" . "$(8"`(B")
+ ("$(7!;(B" . "$(8!;(B")
+ ("$(7!D(B" . "$(8!D(B")
+ ("$(7!>(B $(7!>(B" . "2$(7!>P(B P$(7!>1(B") ; Yes this is dirty. But ...
+ ("$(7!4!5!5(B" . "2$(7#RP#SP#SP#S1(B")
+ ("$(7!4!5(B" . "2$(7#RP#SP#S1(B")
+ ("$(7!6(B" . "2$(7#RP#S_!I1(B")
+ ("$(7!4(B" . "2$(7#RP#S1(B")))
+
+(defvar tibetan-regexp
+ (let ((l (append tibetan-consonant-transcription-alist
+ tibetan-vowel-transcription-alist
+ tibetan-subjoined-transcription-alist))
+ temp)
+ (setq temp "\\(")
+ (setq temp (concat temp (car (car l))))
+ (setq l (cdr l))
+ (while l
+ (setq temp (concat temp "\\|" (car (car l))))
+ (setq l (cdr l)))
+ (concat temp "\\)$"))
+ "Regexp string to match a romanized Tibetan character component, i.e.,
+base and subjoined consonant, vowel and vowel modifier. The result of matching
+is to be used for indexing alists at conversion from a roman transcription to
+the corresponding Tibetan character.")
+
+(defvar tibetan-precomposed-regexp
+ (let ((l tibetan-precomposed-transcription-alist)
+ temp)
+ (setq temp "^\\(")
+ (setq temp
+ (concat temp (car (car l))))
+ (setq l (cdr l))
+ (while l
+ (setq temp
+ (concat temp "\\|" (car (car l))))
+ (setq l (cdr l)))
+ (concat temp "\\)"))
+ "Regexp string to match a romanized Tibetan complex consonant.
+The result of matching is to be used for indexing alists when the input key
+from an input method is converted to the corresponding precomposed glyph.")
+
+(defvar tibetan-precomposition-rule-regexp
+ (let ((l tibetan-precomposition-rule-alist)
+ temp)
+ (setq temp "\\(")
+ (setq temp (concat temp (car (car l))))
+ (setq l (cdr l))
+ (while l
+ (setq temp (concat temp "\\|" (car (car l))))
+ (setq l (cdr l)))
+ (concat temp "\\)"))
+ "Regexp string to match a sequence of Tibetan consonantic components, i.e.,
+one base consonant and one or more subjoined consonants.
+The result of matching is to be used for indexing alist when the component
+sequence is converted to the corresponding precomposed glyph.
+This also matches some punctuation characters which need conversion.")
+
+(defvar tibetan-decomposed nil)
+(defvar tibetan-decomposed-temp nil)
+
+;;; language/tibetan.el ends here