-;;; devan-util.el --- Support for Devanagari Script Composition
-
-;; Copyright (C) 1996 Free Software Foundation, Inc.
-
-;; Author: KAWABATA, Taichi <kawabata@is.s.u-tokyo.ac.jp>
-
-;; Keywords: multilingual, Indian, Devanagari
-
-;; This file is part of GNU Emacs.
-
-;; GNU Emacs is free software; you can redistribute it and/or modify
-;; it under the terms of the GNU General Public License as published by
-;; the Free Software Foundation; either version 2, or (at your option)
-;; any later version.
-
-;; GNU Emacs is distributed in the hope that it will be useful,
-;; but WITHOUT ANY WARRANTY; without even the implied warranty of
-;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
-;; GNU General Public License for more details.
-
-;; You should have received a copy of the GNU General Public License
-;; along with GNU Emacs; see the file COPYING. If not, write to the
-;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
-;; Boston, MA 02111-1307, USA.
-
-;;; Commentary:
-
-;; History:
-;; 1996.10.18 written by KAWABATA, Taichi <kawabata@is.s.u-tokyo.ac.jp>
-;; 1997.1.20 fixed some bugs.
-;; 1997.3.24 fixed some bugs.
-
-;; Future work ::
-;; Decompose the input characters and process them on the character basis.
-
-;; Devanagari script composition rules and related programs.
-
-;;; Code:
-
-;;;
-;;; Steps toward composition of Devanagari Characters.
-;;;
-
-;;; Intersection Function will be used.
-(require 'cl)
-
-;;;###autoload
-(defun setup-devanagari-environment ()
-  "Set up the multilingual environment (MULE) for Devanagari-script languages."
-  (interactive)
-  ;; The pair names the language and the Quail input method handed to
-  ;; `setup-8-bit-environment' together with the coding system symbol.
-  (let ((devanagari-input-spec '("Devanagari" . "quail-devanagari-itrans")))
-    (setup-8-bit-environment nil 'in-is13194-devanagari
-                             devanagari-input-spec)))
-
-;;; Basic functions.
-
-;;;###autoload
-(defun indian-to-devanagari (ch)
-  "Return the Devanagari basic character corresponding to CH.
-CH is converted only when it belongs to the `indian-is13194' charset;
-any other character is returned unchanged."
-  (let* ((split (split-char ch))
-         (cs (car split))
-         (code (car (cdr split))))
-    (if (not (eq cs 'indian-is13194))
-        ch
-      ;; The IS 13194 code becomes the second position code of an
-      ;; `indian-2-column' character whose first position code is ?\x21.
-      (make-char 'indian-2-column ?\x21 code))))
-
-;;;###autoload
-(defun devanagari-to-indian (ch)
-  "Convert Devanagari basic characters to IS 13194 characters.
-CH is converted only when it is an `indian-2-column' character whose
-first position code is ?\\x21; any other character is returned unchanged."
-  ;; Mirrors `indian-to-devanagari'.  The former `charset' and `code-h'
-  ;; bindings were never read and have been dropped.
-  (let ((charcodes (split-char ch)))
-    (if (and (eq (car charcodes) 'indian-2-column)
-             (= (nth 1 charcodes) ?\x21))
-        (make-char 'indian-is13194 (nth 2 charcodes))
-      ch)))
-
-;;;###autoload
-(defun indian-to-devanagari-region (from to)
-  "Replace IS 13194 characters between FROM and TO with Devanagari basic
-characters.  Characters that `indian-to-devanagari' leaves alone are
-re-inserted unchanged."
-  (interactive "r")
-  (save-restriction
-    (narrow-to-region from to)
-    (goto-char (point-min))
-    ;; Step over every character "." matches (rather than only "\\cd")
-    ;; and let `indian-to-devanagari' decide whether it is converted.
-    (while (re-search-forward "." nil t)
-      (let ((converted (indian-to-devanagari (preceding-char))))
-        (delete-char -1)
-        (insert converted)))))
-
-;;;###autoload
-(defun devanagari-to-indian-region (from to)
-  "Replace Devanagari basic characters between FROM and TO with Indian
-\(IS 13194) characters.  Characters that `devanagari-to-indian' leaves
-alone are re-inserted unchanged."
-  (interactive "r")
-  (save-restriction
-    (narrow-to-region from to)
-    (goto-char (point-min))
-    ;; Step over every character "." matches (rather than only "\\cD",
-    ;; the Devanagari character category) and let `devanagari-to-indian'
-    ;; decide whether it is converted.
-    (while (re-search-forward "." nil t)
-      (let ((converted (devanagari-to-indian (preceding-char))))
-        (delete-char -1)
-        (insert converted)))))
-
-;;;###autoload
-(defun indian-to-devanagari-string (str)
-  "Convert Indian String to Devanagari Basic Character String.
-Each character of STR is passed through `indian-to-devanagari' and the
-results are concatenated into a new string, which is returned."
-  ;; The former `pos' binding was never read and has been dropped.
-  (let ((dst "") (src str) char)
-    (while (not (equal src ""))
-      ;; Take the first character of what is left, then drop it from SRC
-      ;; using the width `char-bytes' reports for it.
-      (setq char (string-to-char src))
-      (setq src (substring src (char-bytes char)))
-      (setq dst (concat dst (char-to-string (indian-to-devanagari char)))))
-    dst))
-
-;; Phase 0 - Determine whether the characters can be composed.
-;;
-;;;
-;;; Regular expressions to split characters for composition.
-;;;
-;;
-;; Indian script word contains one or more syllables.
-;; In BNF, it can be expressed as follows:
-;;
-;; Word ::= {Syllable} [Cons-Syllable]
-;; Syllable ::= Cons-Vowel-Syllable | Vowel-Syllable
-;; Vowel-Syllable ::= V[D]
-;; Cons-Vowel-Syllable ::= [Cons-Syllable] Full-Cons [M] [D]
-;; Cons-Syllable ::= [Pure-Cons] [Pure-Cons] [Pure-Cons] Pure-Cons
-;; Pure-Cons ::= Full-Cons H
-;; Full-Cons ::= C [N]
-;;
-;; {} repeat, [] optional
-;;
-;; C - Consonant (\e$(5!3!4!5!6!7!8!9!:!;!<!=!>!?!@!A!B!C!D!E\e(B
-;; \e$(5!F!G!H!I!J!K!L!M!N!O!P!Q!R!S!T!U!V!W!X\e(B)
-;; N - Nukta (\e$(5!i\e(B)
-;; H - Halant(\e$(5!h\e(B) or Virama
-;; V - Vowel (\e$(5!$!%!&!'!(!)!*!+!,!-!.!/!0!1!2#&#'#*\e(B)
-;; ("\e$(5#&#'#*\e(B" can be obtained by IS13194 vowels with nukta.)
-;; D - Vowel Modifiers, i.e. Anuswar, Chandrabindu (\e$(5!!!"\e(B)
-;; (Visarga (\e$(5!#\e(B) is excluded.)
-;; M - Matra (\e$(5!Z![!\!]!^!_!`!a!b!c!d!e!f!g#K#L#M\e(B)
-;; ("\e$(5#K#L#M\e(B" can be obtained by IS13194 matras with nukta.)
-;;
-;; In Emacs, one syllable of Indian language is considered to be one
-;; composite glyph. If we expand the above expression for
-;; cons-vowel-syllable, it would be:
-;;
-;; [[C [N] H] [C [N] H] [C [N] H] C [N] H] C [N] [M] [D]
-;;
-;; Therefore, in worst case, the one syllable may contain
-;; following characters.
-;;
-;; C N H C N H C N H C N H C N M D
-;;
-;; The example is a sanskrit word "kArtsnya", where five consecutive
-;; consonants appear.
-;;
-;; On the other hand, consonant-syllable, which appears at the end of
-;; the word, would have the following expression:
-;;
-;; [C [N] H] [C [N] H] [C [N] H] C [N] H
-;;
-;; This is acceptable BEFORE proper consonant-syllable is input. The
-;; string which doesn't match with the above expression is invalid and
-;; thus must be fixed.
-;;
-;; Note:
-;; A third case can be considered: a syllable that is acceptable and
-;; to which no further code can be added.
-;;
-;; [[C [N] H] [C [N] H] [C [N] H] C [N] H] C [N] [M] D
-;;
-;; However, to make editing possible even in this condition, we will
-;; not consider about this case.
-;;
-;; Note:
-;; Currently, it seems that the only following consonants would have
-;; Nukta sign attached.
-;; (\e$(5!3!4!5!:!?!@!I\e(B)
-;; Therefore, [\e$(5!3\e(B-\e$(5!X\e(B]\e$(5!i\e(B? can be re-written as
-;; \\([\e$(5!3!4!5!:!?!@!I\e(B]\e$(5!i\e(B\\)\\|[\e$(5!3\e(B-\e$(5!X\e(B]
-
-;; Regexp form of "Full-Cons ::= C [N]": either one of the listed
-;; nukta-taking consonants followed by the nukta sign, or one single
-;; character from the bracketed set.
-(defconst devanagari-full-cons
- "\\(\\([\e$(5!3!4!5!:!?!@!I\e(B]\e$(5!i\e(B\\)\\|[\e$(5!3\e(B-\e$(5!X$.$E"%\e(B]\\)"
- "Devanagari full consonant")
-
-;; Regexp form of "Pure-Cons ::= Full-Cons H": a full consonant
-;; followed by the halant sign, wrapped in one group so that callers
-;; can append a "?" to make the whole unit optional.
-(defconst devanagari-pure-cons
- (concat "\\(" devanagari-full-cons "\e$(5!h\e(B\\)")
- "Devanagari pure consonant")
-
-;; Two alternatives: one of three matras followed by the nukta sign, or
-;; a single character from the bracketed set (the matra range plus the
-;; three codes the nukta combinations stand for).
-(defconst devanagari-matra
- "\\(\\([\e$(5!_![!\\e(B]\e$(5!i\e(B\\)\\|[\e$(5!Z\e(B-\e$(5!g#K#L#M\e(B]\\)"
- "Devanagari Matra Signs. '\e$(5#K#L#M\e(B' can also be created from the combination
-of '\e$(5!_![!\\e(B' and nukta sign.")
-
-;; Two alternatives: one of three vowels followed by the nukta sign, or
-;; a single character from the bracketed set (the vowel range plus the
-;; three codes the nukta combinations stand for).
-(defconst devanagari-vowel
- "\\(\\([\e$(5!*!&!'\e(B]\e$(5!i\e(B\\)\\|[\e$(5!$\e(B-\e$(5!2#&#'#*\e(B]\\)"
- "Devanagari Vowels. '\e$(5#&#'#*\e(B' can also be created from the combination
-of '\e$(5!*!&!'\e(B' and nukta sign.")
-
-;; Regexp form of "Vowel-Syllable ::= V[D]": a vowel optionally
-;; followed by one vowel modifier.
-(defconst devanagari-vowel-syllable
- (concat devanagari-vowel "[\e$(5!!!"\e(B]?")
- "Devanagari vowel syllable.")
-
-(defconst devanagari-cons-syllable
-  ;; Up to three optional pure consonants, then one mandatory pure
-  ;; consonant, anchored with "$".
-  (let ((optional-pure-cons (concat devanagari-pure-cons "?")))
-    (concat optional-pure-cons
-            optional-pure-cons
-            optional-pure-cons
-            devanagari-pure-cons "$"))
-  "Regexp matching a Devanagari consonant syllable (one to four pure consonants).")
-
-;; Regexp form of
-;;   Cons-Vowel-Syllable ::= [Cons-Syllable] Full-Cons [M] [D]
-;; i.e. an optional group of one to four pure consonants, then a full
-;; consonant, an optional matra and an optional vowel modifier.
-(defconst devanagari-cons-vowel-syllable
- (concat "\\("
- devanagari-pure-cons "?" devanagari-pure-cons "?"
- devanagari-pure-cons "?" devanagari-pure-cons "\\)?"
- devanagari-full-cons devanagari-matra "?[\e$(5!!!"\e(B]?")
- "Devanagari consonant vowel syllable.")
-
-;;
-;; Also, digits and virams should be processed separately from syllables.
-;;
-;; In IS 13194, Avagrah is obtained by Nukta after Viram, and
-;; OM is obtained by Nukta after Chandrabindu
-;;
-
-;; Character class for signs that are handled outside syllables: one
-;; character range plus two single characters (going by the name, the
-;; digits, the viram and the visarga).
-(defconst devanagari-digit-viram-visarga
- "[\e$(5!q\e(B-\e$(5!z!j!#\e(B]")
-;; Two alternatives: one of two signs followed by the nukta sign, or
-;; one of two single codes.  The single codes are the same ones the
-;; "Nukta with Non-Consonants" rules in
-;; `devanagari-char-to-glyph-rules' produce for those two combinations.
-(defconst devanagari-other-sign
- "\\([\e$(5!!!j\e(B]\e$(5!i\e(B\\)\\|\\([\e$(5#!#J\e(B]\\)")
-
-(defconst devanagari-composite-glyph-unit
-  ;; Each alternative gets its own \\(...\\) group and the groups are
-  ;; joined with \\|, in this fixed order.
-  (mapconcat (function (lambda (unit-regexp)
-                         (concat "\\(" unit-regexp "\\)")))
-             (list devanagari-cons-syllable
-                   devanagari-vowel-syllable
-                   devanagari-digit-viram-visarga
-                   devanagari-cons-vowel-syllable
-                   devanagari-other-sign)
-             "\\|")
-  "Regexp matching a Devanagari string that is composed to form one glyph.")
-
-;;(put-charset-property charset-devanagari-1-column
-;; 'char-to-glyph 'devanagari-compose-string)
-;;(put-charset-property charset-devanagari-2-column
-;; 'char-to-glyph 'devanagari-compose-string)
-
-;; Sample
-;;
-;;(string-match devanagari-cons-vowel-syllable-examine "\e$(5!X![\e(B") => 0
-;;(string-match devanagari-cons-vowel-syllable-examine "\e$(5!F!h!D!\\e(B") => 0
-;;(string-match devanagari-cons-vowel-syllable-examine "\e$(5!X![!F!h!D!\\e(B") => 0
-
-;;
-;; Steps toward the composition
-;; Converting Character Codes to Composite Glyph.
-;;
-;; Example : \e$(5!X![\e(B/\e$(5!F!h!D!\\e(B
-;;
-;; First, convert Characters to appropriate glyphs.
-;;
-;; => \e$(5!X![\e(B/\e$(5"F!D!\\e(B
-;;
-;; Then, determine the base glyph, apply-orders and apply-rules.
-;;
-;; => \e$(5!X\e(B (ml.mr) \e$(5![\e(B / \e$(5!D\e(B (ml.mr) \e$(5"F\e(B (mr ml) \e$(5!\\e(B
-;;
-;; Finally, convert 2-column glyphs to 1-column glyph
-;; if such a glyph exist.
-;;
-;; => \e$(6![\e(B (ml.mr) \e$(6!X\e(B / \e$(6!D\e(B (ml.mr) \e$(6"F\e(B (mr ml) \e$(6!\\e(B
-;;
-;; Compose the glyph.
-;;
-;; => \e2\e$(6!X@![\e1\e(B/\e2\e$(6!D@"FP!\\e1\e(B
-;; => \e2\e$(6!X@![\e1\e2!D@"FP!\\e1\e(B
-;;
-
-;;
-;; Phase 1: Converting Character Code to Glyph Code.
-;;
-;;
-;; IMPORTANT:
-;; There may be many rules which you may want to suppress.
-;; In that case, please comment out that rule.
-;;
-;; RULES WILL BE EVALUATED FROM FIRST TO LAST.
-;; PUT MORE SPECIFIC RULES FIRST.
-;;
-;; TO DO:
-;; Prepare multiple specific list of rules for each languages
-;; which adopts Devanagari script.
-;;
-
-
-(defconst devanagari-char-to-glyph-rules
- '(
-
- ;; `r' at the top of syllable and followed by other consonants.
- ;; ("[^\e$(5!h\e(B]\\(\e$(5!O!h\e(B\\)[\e$(5!3\e(B-\e$(5!X\e(B]" "\e$(5"p\e(B")
- ("^\\(\e$(5!O!h\e(B\\)[\e$(5!3\e(B-\e$(5!X\e(B]" "\e$(5"p\e(B")
-
- ;; Ligature Rules
- ("\\(\e$(5!3!h!B!h!O!h!M\e(B\\)" "\e$(5$!\e(B" sanskrit)
- ("\\(\e$(5!3!h!B!h!T\e(B\\)" "\e$(5$"\e(B" sanskrit)
- ("\\(\e$(5!3!h!B!h!M\e(B\\)" "\e$(5$#\e(B" sanskrit)
- ("\\(\e$(5!3!h!F!h!M\e(B\\)" "\e$(5$$\e(B")
- ("\\(\e$(5!3!h!O!h!M\e(B\\)" "\e$(5$%\e(B")
- ("\\(\e$(5!3!h!O\e(B\\)" "\e$(5"#\e(B") ; Post "r"
- ("\\(\e$(5!3!h!T!h!M\e(B\\)" "\e$(5$&\e(B" sanskrit)
- ("\\(\e$(5!3!h\e(B\\)\e$(5!3!h\e(B[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"3\e(B") ; Special Half Form
- ("\\(\e$(5!3!h!3\e(B\\)" "\e$(5$'\e(B")
- ("\\(\e$(5!3!h\e(B\\)\e$(5!B!h!O\e(B" "\e$(5"3\e(B") ; Special Rules for "k-tr"
- ("\\(\e$(5!3!h!B\e(B\\)" "\e$(5$(\e(B")
- ("\\(\e$(5!3!h!F\e(B\\)" "\e$(5$)\e(B")
- ("\\(\e$(5!3!h!L\e(B\\)" "\e$(5$*\e(B")
- ("\\(\e$(5!3!h!M\e(B\\)" "\e$(5$+\e(B")
- ("\\(\e$(5!3!h!Q\e(B\\)" "\e$(5$,\e(B")
- ("\\(\e$(5!3!h!T\e(B\\)" "\e$(5$-\e(B")
- ("\\(\e$(5!3!h!V!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"l\e(B") ; Half Form
- ("\\(\e$(5$.!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"l\e(B") ; Half Form
- ("\\(\e$(5!3!h!V\e(B\\)" "\e$(5$.\e(B")
- ("\\(\e$(5!3!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"3\e(B") ; Half Form
- ("\\(\e$(5!3!i!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"s\e(B") ; Nukta Half Form
- ("\\(\e$(5!3!i\e(B\\)" "\e$(5#3\e(B") ; Nukta
- ("\\(\e$(5!4!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"4\e(B") ; Half Form
- ("\\(\e$(5!4!i!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"t\e(B") ; Nukta Half Form
- ("\\(\e$(5!4!i\e(B\\)" "\e$(5#4\e(B") ; Nukta
- ("\\(\e$(5!5!h!O!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"`\e(B") ; Half Form
- ("\\(\e$(5!5!h!O\e(B\\)" "\e$(5"$\e(B") ; Post "r"
- ("\\(\e$(5!5!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"5\e(B") ; Half Form
- ("\\(\e$(5!5!i!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"u\e(B") ; Nukta Half Form
- ("\\(\e$(5!5!i\e(B\\)" "\e$(5#5\e(B") ; Nukta
- ("\\(\e$(5!6!h!F!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"a\e(B") ; Half Form
- ("\\(\e$(5!6!h!F\e(B\\)" "\e$(5$/\e(B")
- ; Slot
- ("\\(\e$(5!6!h!O\e(B\\)" "\e$(5!6"q\e(B") ; Post "r"
- ("\\(\e$(5!6!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"6\e(B") ; Half Form
- ("\\(\e$(5!7!h!3!h!B!h!M\e(B\\)" "\e$(5$0\e(B" sanskrit)
- ("\\(\e$(5!7!h!3!h!V!h!T\e(B\\)" "\e$(5$1\e(B" sanskrit)
- ("\\(\e$(5!7!h!3!h!B\e(B\\)" "\e$(5$2\e(B" sanskrit)
- ("\\(\e$(5!7!h!3!h!V\e(B\\)" "\e$(5$3\e(B" sanskrit)
- ("\\(\e$(5!7!h!3!h!O\e(B\\)" "\e$(5$9"q\e(B") ; Special Rule. May be precomposed font needed.
- ("\\(\e$(5!7!h!6!h!O\e(B\\)" "\e$(5$4\e(B" sanskrit)
- ("\\(\e$(5!7!h!3!h!M\e(B\\)" "\e$(5$5\e(B" sanskrit)
- ("\\(\e$(5!7!h!4!h!M\e(B\\)" "\e$(5$6\e(B" sanskrit)
- ("\\(\e$(5!7!h!5!h!M\e(B\\)" "\e$(5$7\e(B" sanskrit)
- ("\\(\e$(5!7!h!6!h!M\e(B\\)" "\e$(5$8\e(B" sanskrit)
- ("\\(\e$(5!7!h!3\e(B\\)" "\e$(5$9\e(B")
- ("\\(\e$(5!7!h!4\e(B\\)" "\e$(5$:\e(B")
- ("\\(\e$(5!7!h!5!h!O\e(B\\)" "\e$(5$;"q\e(B") ; Special Rule. May be precomposed font needed.
- ("\\(\e$(5!7!h!5\e(B\\)" "\e$(5$;\e(B")
- ("\\(\e$(5!7!h!6\e(B\\)" "\e$(5$<\e(B")
- ("\\(\e$(5!7!h!7\e(B\\)" "\e$(5$=\e(B")
- ("\\(\e$(5!7!h!F\e(B\\)" "\e$(5$>\e(B")
- ("\\(\e$(5!7!h!L\e(B\\)" "\e$(5$?\e(B")
- ("\\(\e$(5!7!h!M\e(B\\)" "\e$(5$@\e(B")
- ("\\(\e$(5!8!h\e(B\\)[\e$(5!8!<\e(B]\e$(5!h\e(B" "\e$(5"8\e(B") ; Half Form
- ("\\(\e$(5!8!h!8\e(B\\)" "\e$(5$A\e(B")
- ("\\(\e$(5!8!h!<\e(B\\)" "\e$(5$B\e(B")
- ("\\(\e$(5!8!h!O!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"8"q\e(B") ; Half Form Post "r"
- ("\\(\e$(5!8!h!O\e(B\\)" "\e$(5!8"q\e(B") ; Post "r"
- ("\\(\e$(5!8!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"8\e(B") ; Half Form
- ("\\(\e$(5!9!h!M\e(B\\)" "\e$(5$C\e(B")
- ("\\(\e$(5!:!h!O\e(B\\)" "\e$(5$D\e(B")
- ("\\(\e$(5!:!h!<!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"m\e(B") ; Half Form
- ("\\(\e$(5!:!h!<\e(B\\)" "\e$(5$E\e(B")
- ("\\(\e$(5!:!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5":\e(B") ; Half Form
- ("\\(\e$(5!:!i!h!O\e(B\\)" "\e$(5"!\e(B") ; Nukta Post "r"
- ("\\(\e$(5!:!i!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"z\e(B") ; Nukta Half Form
- ("\\(\e$(5!:!i\e(B\\)" "\e$(5#:\e(B") ; Nukta
- ("\\(\e$(5!;!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5";\e(B") ; Half Form
- ("\\(\e$(5!<!h\e(B\\)\e$(5!8!h\e(B[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"<\e(B") ; Special Half Form
- ("\\(\e$(5!<!h!8\e(B\\)" "\e$(5$F\e(B")
- ("\\(\e$(5!<!h\e(B\\)\e$(5!:!h\e(B[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"<\e(B") ; Special Half Form
- ("\\(\e$(5!<!h!:\e(B\\)" "\e$(5$G\e(B")
- ("\\(\e$(5!<!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"<\e(B") ; Half Form
- ("\\(\e$(5!=!h!3\e(B\\)" "\e$(5$H\e(B")
- ("\\(\e$(5!=!h!=\e(B\\)" "\e$(5$I\e(B")
- ("\\(\e$(5!=!h!>\e(B\\)" "\e$(5$J\e(B")
- ("\\(\e$(5!=!h!M\e(B\\)" "\e$(5$K\e(B")
- ("\\(\e$(5!>!h!M\e(B\\)" "\e$(5$L\e(B")
- ("\\(\e$(5!?!h!5!h!M\e(B\\)" "\e$(5$M\e(B" sanskrit)
- ("\\(\e$(5!?!h!6!h!O\e(B\\)" "\e$(5$N\e(B" sanskrit)
- ("\\(\e$(5!?!h!O!h!M\e(B\\)" "\e$(5$O\e(B")
- ("\\(\e$(5!?!h!5\e(B\\)" "\e$(5$P\e(B")
- ("\\(\e$(5!?!h!6\e(B\\)" "\e$(5$Q\e(B")
- ("\\(\e$(5!?!h!?\e(B\\)" "\e$(5$R\e(B")
- ("\\(\e$(5!?!h!L\e(B\\)" "\e$(5$S\e(B")
- ("\\(\e$(5!?!h!M\e(B\\)" "\e$(5$T\e(B")
- ("\\(\e$(5!?!i\e(B\\)" "\e$(5#?\e(B") ; Nukta
- ("\\(\e$(5!@!h!M\e(B\\)" "\e$(5$`\e(B")
- ("\\(\e$(5!@!i\e(B\\)" "\e$(5#@\e(B") ; Nukta
- ("\\(\e$(5!A!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"A\e(B") ; Half Form
- ("\\(\e$(5!B!h\e(B\\)\e$(5!B!h!O\e(B" "\e$(5"B\e(B") ; Special Rule for "t-tr"
- ("\\(\e$(5!B!h!B!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"c\e(B") ; Half Form
- ("\\(\e$(5!B!h!B\e(B\\)" "\e$(5$a\e(B")
- ("\\(\e$(5!B!h!F\e(B\\)" "\e$(5$b\e(B")
- ("\\(\e$(5!B!h!O!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"d\e(B") ; Half Form Post "r"
- ("\\(\e$(5!B!h!O\e(B\\)" "\e$(5"%\e(B") ; Post "r"
- ("\\(\e$(5!B!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"B\e(B") ; Half Form
- ("\\(\e$(5!C!h!O\e(B\\)" "\e$(5!C"q\e(B") ; Post "r"
- ("\\(\e$(5!C!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"C\e(B") ; Half Form
- ("\\(\e$(5!D!h!D!h!M\e(B\\)" "\e$(5$c\e(B")
- ("\\(\e$(5!D!h!E!h!M\e(B\\)" "\e$(5$d\e(B")
- ("\\(\e$(5!D!h!K!h!M\e(B\\)" "\e$(5$e\e(B")
- ("\\(\e$(5!D!h!K!h!O\e(B\\)" "\e$(5$r"r\e(B") ; Special Case for "dbhr" ; ***
- ("\\(\e$(5!D!h!O!h!M\e(B\\)" "\e$(5$f\e(B")
- ("\\(\e$(5!D!h!T!h!M\e(B\\)" "\e$(5$g\e(B")
- ("\\(\e$(5!D!h!5!h!O\e(B\\)" "\e$(5$h\e(B")
- ("\\(\e$(5!D!h!6!h!O\e(B\\)" "\e$(5$i\e(B")
- ("\\(\e$(5!D!h!D!h!T\e(B\\)" "\e$(5$j\e(B")
- ("\\(\e$(5!D!h!E!h!T\e(B\\)" "\e$(5$k\e(B")
- ("\\(\e$(5!D!h\e(B\\)\e$(5!E!h\e(B[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5!D!h\e(B") ; Special Half Form (for ddhra)
- ("\\(\e$(5!D!h!5\e(B\\)" "\e$(5$l\e(B")
- ("\\(\e$(5!D!h!6\e(B\\)" "\e$(5$m\e(B")
- ("\\(\e$(5!D!h!D\e(B\\)" "\e$(5$n\e(B")
- ("\\(\e$(5!D!h!E\e(B\\)" "\e$(5$o\e(B")
- ("\\(\e$(5!D!h!F\e(B\\)" "\e$(5$p\e(B")
- ("\\(\e$(5!D!h\e(B\\)\e$(5!J!h\e(B" "\e$(5!D!h\e(B") ; Suppressing "db-"
- ("\\(\e$(5!D!h!J\e(B\\)" "\e$(5$q\e(B")
- ("\\(\e$(5!D!h!K\e(B\\)" "\e$(5$r\e(B")
- ("\\(\e$(5!D!h!L\e(B\\)" "\e$(5$s\e(B")
- ("\\(\e$(5!D!h!M\e(B\\)" "\e$(5$t\e(B")
- ("\\(\e$(5!D!h!T\e(B\\)" "\e$(5$u\e(B")
- ("\\(\e$(5!E!h!F!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"e\e(B") ; Half Form
- ("\\(\e$(5!E!h!F\e(B\\)" "\e$(5$v\e(B")
- ("\\(\e$(5!E!h!O!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"f\e(B") ; Half Form Post "r"
- ("\\(\e$(5!E!h!O\e(B\\)" "\e$(5!E"q\e(B") ; Post "r"
- ("\\(\e$(5!E!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"E\e(B") ; Half Form
- ("\\(\e$(5!F!h!F!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"k\e(B") ; Half Form
- ("\\(\e$(5!F!h!F\e(B\\)" "\e$(5$w\e(B")
- ("\\(\e$(5!F!h!O\e(B\\)" "\e$(5!F"q\e(B")
- ("\\(\e$(5!F!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"F\e(B") ; Half Form
- ("\\(\e$(5!G!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"G\e(B") ; Nukta Half Form
- ("\\(\e$(5!H!h\e(B\\)\e$(5!B!h!O\e(B" "\e$(5"H\e(B") ; Special Rule for "p-tr"
- ("\\(\e$(5!H!h!B!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"g\e(B") ; Half Form
- ("\\(\e$(5!H!h!B\e(B\\)" "\e$(5$x\e(B")
- ("\\(\e$(5!H!h!F\e(B\\)" "\e$(5$y\e(B")
- ("\\(\e$(5!H!h!Q\e(B\\)" "\e$(5$z\e(B")
- ("\\(\e$(5!H!h!O\e(B\\)" "\e$(5"&\e(B") ; Post "r"
- ("\\(\e$(5!H!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"H\e(B") ; Half Form
- ("\\(\e$(5!I!h!O\e(B\\)" "\e$(5"'\e(B") ; Post "r"
- ("\\(\e$(5!I!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"I\e(B") ; Half Form
- ("\\(\e$(5!I!i!h!O\e(B\\)" "\e$(5""\e(B") ; Nukta Post "r"
- ("\\(\e$(5!I!i!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"y\e(B") ; Nukta Half Form
- ("\\(\e$(5!I!i\e(B\\)" "\e$(5#I\e(B") ; Nukta
- ("\\(\e$(5!J!h\e(B\\)\e$(5!F!h\e(B[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"J\e(B") ; Special Half Form
- ("\\(\e$(5!J!h!F\e(B\\)" "\e$(5${\e(B")
- ("\\(\e$(5!J!h\e(B\\)\e$(5!J!h\e(B[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"J\e(B") ; Special Half Form
- ("\\(\e$(5!J!h!J\e(B\\)" "\e$(5$|\e(B")
- ("\\(\e$(5!J!h\e(B\\)\e$(5!T!h\e(B[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"J\e(B") ; Special Half Form
- ("\\(\e$(5!J!h!T\e(B\\)" "\e$(5$}\e(B")
- ("\\(\e$(5!J!h!O\e(B\\)" "\e$(5!J"q\e(B") ; Post "r"
- ("\\(\e$(5!J!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"J\e(B") ; Half Form
- ("\\(\e$(5!K!h!F\e(B\\)" "\e$(5$~\e(B")
- ("\\(\e$(5!K!h!O\e(B\\)" "\e$(5!K"q\e(B") ; Post "r"
- ("\\(\e$(5!K!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"K\e(B") ; Half Form
- ("\\(\e$(5!L!h!F\e(B\\)" "\e$(5#P\e(B")
- ("\\(\e$(5!L!h!Q\e(B\\)" "\e$(5#Q\e(B")
- ("\\(\e$(5!L!h!O\e(B\\)" "\e$(5!L"q\e(B") ; Post "r"
- ("\\(\e$(5!L!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"L\e(B") ; Half Form
- ("\\(\e$(5!M!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"M\e(B") ; Half Form
- ("\\(\e$(5!N!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"N\e(B") ; Half Form
- ;; special form for "ru".
- ("\\(\e$(5!O!]\e(B\\)" "\e$(5",\e(B")
- ("\\(\e$(5!O!^\e(B\\)" "\e$(5"-\e(B")
- ("\\(\e$(5!P!]\e(B\\)" "\e$(5".\e(B")
- ("\\(\e$(5!P!^\e(B\\)" "\e$(5"/\e(B")
- ;;
- ("\\(\e$(5!Q!h!Q\e(B\\)" "\e$(5#`\e(B" sanskrit)
- ("\\(\e$(5!Q!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"Q\e(B") ; Half Form
- ("\\(\e$(5!R!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"R\e(B") ; Half Form
- ("\\(\e$(5!S!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"S\e(B") ; Half Form
- ("\\(\e$(5!T!h!F\e(B\\)" "\e$(5#a\e(B")
- ("\\(\e$(5!T!h!T\e(B\\)" "\e$(5#b\e(B")
- ("\\(\e$(5!T!h!O\e(B\\)" "\e$(5!T"q\e(B") ; Post "r"
- ("\\(\e$(5!T!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"T\e(B") ; Half Form
- ("\\(\e$(5!U!h!8!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"h\e(B") ; Half Form
- ("\\(\e$(5!U!h!8\e(B\\)" "\e$(5#c\e(B")
- ("\\(\e$(5!U!h!F\e(B\\)" "\e$(5#d\e(B")
- ("\\(\e$(5!U!h!J\e(B\\)" "\e$(5#e\e(B")
- ("\\(\e$(5!U!h!Q\e(B\\)" "\e$(5#f\e(B")
- ("\\(\e$(5!U!h\e(B\\)\e$(5!T!h!O\e(B" "\e$(5"U\e(B") ; Special Half Form
- ("\\(\e$(5!U!h!T!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"j\e(B") ; Half Form
-; ("\\(\e$(5!U!h!T\e(B\\)" "\e$(5#g\e(B")
- ("\\(\e$(5!U!h!O!h!T\e(B\\)" "\e$(5#g\e(B")
- ("\\(\e$(5!U!h!O!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"i\e(B") ; Half Form
- ("\\(\e$(5!U!h!O\e(B\\)" "\e$(5")\e(B") ; Post "r"
- ("\\(\e$(5!U!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"U\e(B") ; Half Form
- ("\\(\e$(5!V!h!=!h!O!h!M\e(B\\)" "\e$(5#h\e(B")
- ("\\(\e$(5!V!h!=!h!M\e(B\\)" "\e$(5#i\e(B")
- ("\\(\e$(5!V!h!=!h!T\e(B\\)" "\e$(5#j\e(B")
- ("\\(\e$(5!V!h!=\e(B\\)" "\e$(5#k\e(B")
- ("\\(\e$(5!V!h!>\e(B\\)" "\e$(5#l\e(B")
- ("\\(\e$(5!V!h!O\e(B\\)" "\e$(5!V"q\e(B") ; Post "r"
- ("\\(\e$(5!V!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"V\e(B") ; Half Form
- ("\\(\e$(5!W!h!F!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"W"F\e(B") ; Special Half Form
- ("\\(\e$(5!W!h!F\e(B\\)" "\e$(5#m\e(B")
- ("\\(\e$(5!W!h!O\e(B\\)" "\e$(5#n\e(B")
- ("\\(\e$(5!W!h\e(B\\)[\e$(5!3\e(B-\e$(5!N!P\e(B-\e$(5!X\e(B]" "\e$(5"W\e(B") ; Half Form
- ("\\(\e$(5!X!h!A\e(B\\)" "\e$(5#p\e(B")
- ("\\(\e$(5!X!h!F\e(B\\)" "\e$(5#q\e(B")
- ("\\(\e$(5!X!h!L\e(B\\)" "\e$(5#r\e(B")
- ("\\(\e$(5!X!h!M\e(B\\)" "\e$(5#s\e(B")
- ("\\(\e$(5!X!h!O\e(B\\)" "\e$(5#t\e(B")
- ("\\(\e$(5!X!h!Q\e(B\\)" "\e$(5#u\e(B")
- ("\\(\e$(5!X!h!T\e(B\\)" "\e$(5#v\e(B")
- ;; Special Ligature Rules
- ("\\(\e$(5!X!_\e(B\\)" "\e$(5#R\e(B")
-
- ;; For consonants other than listed above, glyph-composition will
- ;; be applied. If the consonant which is preceding "\e$(5!O\e(B" does not
- ;; have the vertical line (such as "\e$(5!?\e(B"), "\e$(5"r\e(B" is put beneath the
- ;; consonant.
- ;;
- ("[\e$(5!7!9!=!>!?!@!D!O!P!R!S!X\e(B]\\(\e$(5!h!O\e(B\\)" "\e$(5"r\e(B")
- ("[\e$(5!6!8!C!E!F!H!J!K!L!M!T!V\e(B]\\(\e$(5!h!O\e(B\\)" "\e$(5"q\e(B")
- ("\e$(5!?!i\e(B\\(\e$(5!h!O\e(B\\)" "\e$(5"r\e(B")
- ("\e$(5!@!i\e(B\\(\e$(5!h!O\e(B\\)" "\e$(5"r\e(B")
-
- ;; Nukta with Non-Consonants
- ("\\(\e$(5!!!i\e(B\\)" "\e$(5#!\e(B")
- ("\\(\e$(5!&!i\e(B\\)" "\e$(5#&\e(B")
- ("\\(\e$(5!'!i\e(B\\)" "\e$(5#'\e(B")
- ("\\(\e$(5!*!i\e(B\\)" "\e$(5#*\e(B")
- ("\\(\e$(5![!i\e(B\\)" "\e$(5#L\e(B")
- ("\\(\e$(5!\!i\e(B\\)" "\e$(5#M\e(B")
- ("\\(\e$(5!_!i\e(B\\)" "\e$(5#K\e(B")
- ("\\(\e$(5!j!i\e(B\\)" "\e$(5#J\e(B")
-
- ;; Special rule for "r + some vowels"
- ("\\(\e$(5!O!_\e(B\\)" "\e$(5!*"p\e(B")
- ("\\(\e$(5!O#L\e(B\\)" "\e$(5#&"p\e(B")
- ("\\(\e$(5!O#K\e(B\\)" "\e$(5#*"p\e(B")
- ("\\(\e$(5!O#M\e(B\\)" "\e$(5#'"p\e(B")
- ;; If everything fails, "y" will connect to the front consonant.
- ("\\(\e$(5!h!M\e(B\\)" "\e$(5"]\e(B")
- )
- "Alist of regexps of Devanagari character sequences vs composed characters.")
-
-(dolist (rule devanagari-char-to-glyph-rules)
-  ;; Register RULE on the first character of its \\(...\\) group, and
-  ;; record the reverse glyph-to-character mapping where applicable.
-  (let* ((regexp (car rule))
-         (glyph-str (car (cdr rule)))
-         ;; CHARS is the text inside the rule's \\(...\\) group.
-         (chars (progn
-                  (string-match "\\\\(\\(.+\\)\\\\)" regexp)
-                  (substring regexp (match-beginning 1) (match-end 1))))
-         (char (string-to-char chars))
-         (glyph (string-to-char glyph-str)))
-    ;; Append rather than push: rules are tried top to bottom, so the
-    ;; per-character list has to keep the order of the table.
-    (put-char-code-property
-     char 'char-to-glyph
-     (append (get-char-code-property char 'char-to-glyph) (list rule)))
-    ;; One glyph may correspond to multiple characters in other scripts
-    ;; (e.g. surrounding vowels in Tamil), but for Devanagari only the
-    ;; first rule seen for a glyph is recorded, so that one glyph maps
-    ;; back to one character sequence.
-    (if (and (< ?\e(5z\e(B glyph)        ; Glyphs only.
-             (null (get-char-code-property glyph 'glyph-to-char)))
-        (put-char-code-property
-         glyph 'glyph-to-char
-         (list (list glyph-str chars))))))
-
-;;
-;; Function used in both characters-to-glyphs conversion and
-;; glyphs-to-characters conversion.
-;;
-
-(defun max-match-len (regexp-str)
-  "Return the possible length of a string matched by REGEXP-STR.
-Only the [...] construct is recognized: every bracket expression is
-reduced to the last character inside it, and the length of what
-remains is returned."
-  (let ((reduced regexp-str)
-        (bracket-re "\\[\\([^\]]\\)+\\]"))
-    (while (string-match bracket-re reduced)
-      ;; Group 1 is repeated, so after the match it holds the last
-      ;; character inside the brackets.
-      (let ((head (substring reduced 0 (match-beginning 0)))
-            (last-char (substring reduced (match-beginning 1) (match-end 1)))
-            (tail (substring reduced (match-end 0))))
-        (setq reduced (concat head last-char tail))))
-    (length reduced)))
-
-(defun string-conversion-by-rule (src-str symbol &rest specs)
- " This function converts the SRC-STR to the new string according to
-the rules described in the each character's SYMBOL property. The
-rules are described in the forms of '((regexp str <specs>) ...), and
-the character sequence in the string which matches to 'regexp' are
-replaced with str. If SPECS are not specified, only rules with no
-<specs> would be applied. If SPECS are specified, then rules with no
-<specs> specified and rules with <spec> matches with SPECS would be
-applied. Rules are tested in the order of the list, thus more
-specific rules should be placed in front of less important rules. No
-composite character is supported, thus such must be converted by
-decompose-char before applying to this function. If rule is given in
-the forms of regexp '...\\(...\\)...', then inside the parenthesis is
-the subject of the match. Otherwise, the entire expression is the
-subject of the match."
- ;; POS is the current index into SRC-STR; DST-STR accumulates the
- ;; converted output and is the return value.
- (let ((pos 0)
- (dst-str ""))
- (while (< pos (length src-str))
- ;; RULES is the rule list stored under SYMBOL on the character at POS.
- ;; FOUND records whether one of them was applied at this position.
- (let ((found nil)
- (rules (get-char-code-property
- (string-to-char
- (substring src-str pos)) symbol)))
- (while rules
- (let* ((rule (car rules))
- (regexp (car rule))
- (replace-str (car (cdr rule)))
- (rule-specs (cdr (cdr rule)))
- search-pos)
- ;; Skip a rule that carries specs none of which appear in SPECS
- ;; (`intersection' comes from the cl library).
- (if (not (or (null rule-specs)
- (intersection specs rule-specs)))
- (setq rules (cdr rules))
- ;; A rule without a \\(...\\) group is wrapped in one, so that
- ;; group 1 always denotes the subject of the match, and the
- ;; search starts at POS itself.
- (if (null (string-match "\\\\(.+\\\\)" regexp))
- (progn
- (setq regexp (concat "\\(" regexp "\\)"))
- (setq search-pos pos))
- ;; Otherwise the search starts before POS, backed up by the
- ;; length `max-match-len' reports for the part of the regexp
- ;; that precedes its first backslash.  The `string-match' call
- ;; sets the match data that the following `match-end' reads.
- (setq search-pos (- pos (max-match-len
- (substring regexp
- (string-match "^[^\\\\]*" regexp)
- (match-end 0))))))
- (if (< search-pos 0) (setq search-pos 0))
- ;; The rule applies only when its group 1 begins exactly at POS;
- ;; any other outcome moves on to the next rule.
- (if (string-match regexp src-str search-pos)
- (if (= (match-beginning 1) pos)
- (progn
- (setq dst-str (concat dst-str replace-str))
- (setq rules nil) ; Get out of the loop.
- (setq found t)
- ;; proceed `pos' for replaced characters.
- (setq pos (match-end 1)))
- (setq rules (cdr rules)))
- (setq rules (cdr rules))))))
- ;; proceed to next position
- ;; No rule applied: copy the character at POS unchanged and advance
- ;; POS by the width `char-bytes' reports for it.
- (if (not found)
- (let ((nextchar (string-to-char (substring src-str pos))))
- (setq pos (+ pos
- (char-bytes (string-to-char (substring src-str pos)))))
- (setq dst-str (concat dst-str (char-to-string nextchar)))))))
- dst-str))
-
-
-;;
-;; Convert Character Code to Glyph Code
-;;
-
-;;;###autoload
-(defun char-to-glyph-devanagari (src-str &rest langs)
-  "Return SRC-STR with its Devanagari characters converted to glyphs.
-Ligatures and special rules are processed.  LANGS is passed on as the
-rule specs of `string-conversion-by-rule'."
-  ;; The last argument of `apply' is spread, so this is the same call as
-  ;; building the full argument list by hand.
-  (apply 'string-conversion-by-rule src-str 'char-to-glyph langs))
-
-;; Example:
-;;(char-to-glyph-devanagari "\e$(5!X![!F!h!D!\\e(B") => "\e$(5!X!["F!D!\\e(B"
-;;(char-to-glyph-devanagari "\e$(5!O!Z!V!h!=!h!O![!M\e(B") => ???
-
-;;
-;; Phase 2: Compose Glyphs to form One Glyph.
-;;
-
-;; Each list consist of glyph, application-priority and application-direction.
-;;
-;; Glyphs will be ordered from low priority number to high priority number.
-;; If application-priority is omitted, it is assumed to be 0.
-;; If application-direction is omitted, it is assumed to be '(mr . ml).
-
-(defconst devanagari-composition-rules
- '((?\e$(5!!\e(B 0 (tr . br))
- (?\e$(5!"\e(B 0 (mr . mr))
- (?\e$(5!#\e(B 0)
- (?\e$(5!$\e(B 0)
- (?\e$(5!%\e(B 0)
- (?\e$(5!&\e(B 0)
- (?\e$(5!'\e(B 0)
- (?\e$(5!(\e(B 0)
- (?\e$(5!)\e(B 0)
- (?\e$(5!*\e(B 0)
- (?\e$(5!+\e(B 0)
- (?\e$(5!,\e(B 0)
- (?\e$(5!-\e(B 0)
- (?\e$(5!.\e(B 0)
- (?\e$(5!/\e(B 0)
- (?\e$(5!0\e(B 0)
- (?\e$(5!1\e(B 0)
- (?\e$(5!2\e(B 0)
- (?\e$(5!3\e(B 0)
- (?\e$(5!4\e(B 0)
- (?\e$(5!5\e(B 0)
- (?\e$(5!6\e(B 0)
- (?\e$(5!7\e(B 0)
- (?\e$(5!8\e(B 0)
- (?\e$(5!9\e(B 0)
- (?\e$(5!:\e(B 0)
- (?\e$(5!;\e(B 0)
- (?\e$(5!<\e(B 0)
- (?\e$(5!=\e(B 0)
- (?\e$(5!>\e(B 0)
- (?\e$(5!?\e(B 0)
- (?\e$(5!@\e(B 0)
- (?\e$(5!A\e(B 0)
- (?\e$(5!B\e(B 0)
- (?\e$(5!C\e(B 0)
- (?\e$(5!D\e(B 0)
- (?\e$(5!E\e(B 0)
- (?\e$(5!F\e(B 0)
- (?\e$(5!G\e(B 0)
- (?\e$(5!H\e(B 0)
- (?\e$(5!I\e(B 0)
- (?\e$(5!J\e(B 0)
- (?\e$(5!K\e(B 0)
- (?\e$(5!L\e(B 0)
- (?\e$(5!M\e(B 0)
- (?\e$(5!N\e(B 0)
- (?\e$(5!O\e(B 0)
- (?\e$(5!P\e(B 0)
- (?\e$(5!Q\e(B 0)
- (?\e$(5!R\e(B 0)
- (?\e$(5!S\e(B 0)
- (?\e$(5!T\e(B 0)
- (?\e$(5!U\e(B 0)
- (?\e$(5!V\e(B 0)
- (?\e$(5!W\e(B 0)
- (?\e$(5!X\e(B 0)
- (?\e$(5!Y\e(B 0)
- (?\e$(5!Z\e(B 0)
- (?\e$(5![\e(B 0 (ml . mr))
- (?\e$(5!\\e(B 0)
- (?\e$(5!]\e(B 0 (br . tr))
- (?\e$(5!^\e(B 0 (br . tr))
- (?\e$(5!_\e(B 0 (br . tr))
- (?\e$(5!`\e(B 0 (mr . mr)) ; (tc . bc)
- (?\e$(5!a\e(B 0 (mr . mr))
- (?\e$(5!b\e(B 0 (mr . mr))
- (?\e$(5!c\e(B 0 (mr . mr))
- (?\e$(5!d\e(B 0)
- (?\e$(5!e\e(B 0)
- (?\e$(5!f\e(B 0)
- (?\e$(5!g\e(B 0)
- (?\e$(5!h\e(B 0 (br . tr))
- (?\e$(5!i\e(B 0 (br . tr))
- (?\e$(5!j\e(B 0)
- (nil 0)
- (nil 0)
- (nil 0)
- (nil 0)
- (nil 0)
- (nil 0)
- (?\e$(5!q\e(B 0)
- (?\e$(5!r\e(B 0)
- (?\e$(5!s\e(B 0)
- (?\e$(5!t\e(B 0)
- (?\e$(5!u\e(B 0)
- (?\e$(5!v\e(B 0)
- (?\e$(5!w\e(B 0)
- (?\e$(5!x\e(B 0)
- (?\e$(5!y\e(B 0)
- (?\e$(5!z\e(B 0)
- (nil 0)
- (nil 0)
- (nil 0)
- (nil 0)
- (?\e$(5"!\e(B 0)
- (?\e$(5""\e(B 0)
- (?\e$(5"#\e(B 0)
- (?\e$(5"$\e(B 0)
- (?\e$(5"%\e(B 0)
- (?\e$(5"&\e(B 0)
- (?\e$(5"'\e(B 0)
- (?\e$(5"(\e(B 0)
- (?\e$(5")\e(B 0)
- (?\e$(5"*\e(B 0)
- (?\e$(5"+\e(B 0)
- (?\e$(5",\e(B 0)
- (?\e$(5"-\e(B 0)
- (?\e$(5".\e(B 0)
- (?\e$(5"/\e(B 0)
- (?\e$(5"0\e(B 0)
- (?\e$(5"1\e(B 0)
- (?\e$(5"2\e(B 0)
- (?\e$(5"3\e(B 0)
- (?\e$(5"4\e(B 0)
- (?\e$(5"5\e(B 0)
- (?\e$(5"6\e(B 0)
- (?\e$(5"7\e(B 0)
- (?\e$(5"8\e(B 0)
- (?\e$(5"9\e(B 0)
- (?\e$(5":\e(B 0)
- (?\e$(5";\e(B 0)
- (?\e$(5"<\e(B 0)
- (?\e$(5"=\e(B 0)
- (?\e$(5">\e(B 0)
- (?\e$(5"?\e(B 0)
- (?\e$(5"@\e(B 0)
- (?\e$(5"A\e(B 0)
- (?\e$(5"B\e(B 0)
- (?\e$(5"C\e(B 0)
- (?\e$(5"D\e(B 0)
- (?\e$(5"E\e(B 0)
- (?\e$(5"F\e(B 0)
- (?\e$(5"G\e(B 0)
- (?\e$(5"H\e(B 0)
- (?\e$(5"I\e(B 0)
- (?\e$(5"J\e(B 0)
- (?\e$(5"K\e(B 0)
- (?\e$(5"L\e(B 0)
- (?\e$(5"M\e(B 0)
- (?\e$(5"N\e(B 0)
- (?\e$(5"O\e(B 0)
- (?\e$(5"P\e(B 0)
- (?\e$(5"Q\e(B 0)
- (?\e$(5"R\e(B 0)
- (?\e$(5"S\e(B 0)
- (?\e$(5"T\e(B 0)
- (?\e$(5"U\e(B 0)
- (?\e$(5"V\e(B 0)
- (?\e$(5"W\e(B 0)
- (?\e$(5"X\e(B 0)
- (?\e$(5"Y\e(B 0)
- (?\e$(5"Z\e(B 0)
- (?\e$(5"[\e(B 0)
- (?\e$(5"\\e(B 0)
- (?\e$(5"]\e(B 0)
- (?\e$(5"^\e(B 0)
- (?\e$(5"_\e(B 0)
- (?\e$(5"`\e(B 0)
- (?\e$(5"a\e(B 0)
- (?\e$(5"b\e(B 0)
- (?\e$(5"c\e(B 0)
- (?\e$(5"d\e(B 0)
- (?\e$(5"e\e(B 0)
- (?\e$(5"f\e(B 0)
- (?\e$(5"g\e(B 0)
- (?\e$(5"h\e(B 0)
- (?\e$(5"i\e(B 0)
- (?\e$(5"j\e(B 0)
- (?\e$(5"k\e(B 0)
- (?\e$(5"l\e(B 0)
- (?\e$(5"m\e(B 0)
- (?\e$(5"n\e(B 0)
- (?\e$(5"o\e(B 0)
- (?\e$(5"p\e(B 10 (mr . mr))
- (?\e$(5"q\e(B 0 (br . br))
- (?\e$(5"r\e(B 0 (br . tr))
- (?\e$(5"s\e(B 0)
- (?\e$(5"t\e(B 0)
- (?\e$(5"u\e(B 0)
- (?\e$(5"v\e(B 0)
- (?\e$(5"w\e(B 0)
- (?\e$(5"x\e(B 0)
- (?\e$(5"y\e(B 0)
- (?\e$(5"z\e(B 0)
- (?\e$(5"{\e(B 0)
- (?\e$(5"|\e(B 0)
- (?\e$(5"}\e(B 0)
- (?\e$(5"~\e(B 0)
- (?\e$(5#!\e(B 0)
- (?\e$(5#"\e(B 0)
- (?\e$(5##\e(B 0)
- (?\e$(5#$\e(B 0)
- (?\e$(5#%\e(B 0)
- (?\e$(5#&\e(B 0)
- (?\e$(5#'\e(B 0)
- (?\e$(5#(\e(B 0)
- (?\e$(5#)\e(B 0)
- (?\e$(5#*\e(B 0)
- (?\e$(5#+\e(B 0)
- (?\e$(5#,\e(B 0)
- (?\e$(5#-\e(B 0)
- (?\e$(5#.\e(B 0)
- (?\e$(5#/\e(B 0)
- (?\e$(5#0\e(B 0)
- (?\e$(5#1\e(B 0)
- (?\e$(5#2\e(B 0)
- (?\e$(5#3\e(B 0)
- (?\e$(5#4\e(B 0)
- (?\e$(5#5\e(B 0)
- (?\e$(5#6\e(B 0)
- (?\e$(5#7\e(B 0)
- (?\e$(5#8\e(B 0)
- (?\e$(5#9\e(B 0)
- (?\e$(5#:\e(B 0)
- (?\e$(5#;\e(B 0)
- (?\e$(5#<\e(B 0)
- (?\e$(5#=\e(B 0)
- (?\e$(5#>\e(B 0)
- (?\e$(5#?\e(B 0)
- (?\e$(5#@\e(B 0)
- (?\e$(5#A\e(B 0)
- (?\e$(5#B\e(B 0)
- (?\e$(5#C\e(B 0)
- (?\e$(5#D\e(B 0)
- (?\e$(5#E\e(B 0)
- (?\e$(5#F\e(B 0)
- (?\e$(5#G\e(B 0)
- (?\e$(5#H\e(B 0)
- (?\e$(5#I\e(B 0)
- (?\e$(5#J\e(B 0)
- (?\e$(5#K\e(B 0 (br . tr))
- (?\e$(5#L\e(B 0 (br . tr))
- (?\e$(5#M\e(B 0 (br . tr))
- (?\e$(5#N\e(B 0)
- (?\e$(5#O\e(B 0)
- (?\e$(5#P\e(B 0)
- (?\e$(5#Q\e(B 0)
- (?\e$(5#R\e(B 0)
- (?\e$(5#S\e(B 0)
- (?\e$(5#T\e(B 0)
- (?\e$(5#U\e(B 0)
- (?\e$(5#V\e(B 0)
- (?\e$(5#W\e(B 0)
- (?\e$(5#X\e(B 0)
- (?\e$(5#Y\e(B 0)
- (?\e$(5#Z\e(B 0)
- (?\e$(5#[\e(B 0)
- (?\e$(5#\\e(B 0)
- (?\e$(5#]\e(B 0)
- (?\e$(5#^\e(B 0)
- (?\e$(5#_\e(B 0)
- (?\e$(5#`\e(B 0)
- (?\e$(5#a\e(B 0)
- (?\e$(5#b\e(B 0)
- (?\e$(5#c\e(B 0)
- (?\e$(5#d\e(B 0)
- (?\e$(5#e\e(B 0)
- (?\e$(5#f\e(B 0)
- (?\e$(5#g\e(B 0)
- (?\e$(5#h\e(B 0)
- (?\e$(5#i\e(B 0)
- (?\e$(5#j\e(B 0)
- (?\e$(5#k\e(B 0)
- (?\e$(5#l\e(B 0)
- (?\e$(5#m\e(B 0)
- (?\e$(5#n\e(B 0)
- (?\e$(5#o\e(B 0)
- (?\e$(5#p\e(B 0)
- (?\e$(5#q\e(B 0)
- (?\e$(5#r\e(B 0)
- (?\e$(5#s\e(B 0)
- (?\e$(5#t\e(B 0)
- (?\e$(5#u\e(B 0)
- (?\e$(5#v\e(B 0)
- (?\e$(5#w\e(B 0)
- (?\e$(5#x\e(B 0)
- (?\e$(5#y\e(B 0)
- (?\e$(5#z\e(B 0)
- (?\e$(5#{\e(B 0)
- (?\e$(5#|\e(B 0)
- (?\e$(5#}\e(B 0)
- (?\e$(5#~\e(B 0)
- (?\e$(5$!\e(B 0)
- (?\e$(5$"\e(B 0)
- (?\e$(5$#\e(B 0)
- (?\e$(5$$\e(B 0)
- (?\e$(5$%\e(B 0)
- (?\e$(5$&\e(B 0)
- (?\e$(5$'\e(B 0)
- (?\e$(5$(\e(B 0)
- (?\e$(5$)\e(B 0)
- (?\e$(5$*\e(B 0)
- (?\e$(5$+\e(B 0)
- (?\e$(5$,\e(B 0)
- (?\e$(5$-\e(B 0)
- (?\e$(5$.\e(B 0)
- (?\e$(5$/\e(B 0)
- (?\e$(5$0\e(B 0)
- (?\e$(5$1\e(B 0)
- (?\e$(5$2\e(B 0)
- (?\e$(5$3\e(B 0)
- (?\e$(5$4\e(B 0)
- (?\e$(5$5\e(B 0)
- (?\e$(5$6\e(B 0)
- (?\e$(5$7\e(B 0)
- (?\e$(5$8\e(B 0)
- (?\e$(5$9\e(B 0)
- (?\e$(5$:\e(B 0)
- (?\e$(5$;\e(B 0)
- (?\e$(5$<\e(B 0)
- (?\e$(5$=\e(B 0)
- (?\e$(5$>\e(B 0)
- (?\e$(5$?\e(B 0)
- (?\e$(5$@\e(B 0)
- (?\e$(5$A\e(B 0)
- (?\e$(5$B\e(B 0)
- (?\e$(5$C\e(B 0)
- (?\e$(5$D\e(B 0)
- (?\e$(5$E\e(B 0)
- (?\e$(5$F\e(B 0)
- (?\e$(5$G\e(B 0)
- (?\e$(5$H\e(B 0)
- (?\e$(5$I\e(B 0)
- (?\e$(5$J\e(B 0)
- (?\e$(5$K\e(B 0)
- (?\e$(5$L\e(B 0)
- (?\e$(5$M\e(B 0)
- (?\e$(5$N\e(B 0)
- (?\e$(5$O\e(B 0)
- (?\e$(5$P\e(B 0)
- (?\e$(5$Q\e(B 0)
- (?\e$(5$R\e(B 0)
- (?\e$(5$S\e(B 0)
- (?\e$(5$T\e(B 0)
- (?\e$(5$U\e(B 0)
- (?\e$(5$V\e(B 0)
- (?\e$(5$W\e(B 0)
- (?\e$(5$X\e(B 0)
- (?\e$(5$Y\e(B 0)
- (?\e$(5$Z\e(B 0)
- (?\e$(5$[\e(B 0)
- (?\e$(5$\\e(B 0)
- (?\e$(5$]\e(B 0)
- (?\e$(5$^\e(B 0)
- (?\e$(5$_\e(B 0)
- (?\e$(5$`\e(B 0)
- (?\e$(5$a\e(B 0)
- (?\e$(5$b\e(B 0)
- (?\e$(5$c\e(B 0)
- (?\e$(5$d\e(B 0)
- (?\e$(5$e\e(B 0)
- (?\e$(5$f\e(B 0)
- (?\e$(5$g\e(B 0)
- (?\e$(5$h\e(B 0)
- (?\e$(5$i\e(B 0)
- (?\e$(5$j\e(B 0)
- (?\e$(5$k\e(B 0)
- (?\e$(5$l\e(B 0)
- (?\e$(5$m\e(B 0)
- (?\e$(5$n\e(B 0)
- (?\e$(5$o\e(B 0)
- (?\e$(5$p\e(B 0)
- (?\e$(5$q\e(B 0)
- (?\e$(5$r\e(B 0)
- (?\e$(5$s\e(B 0)
- (?\e$(5$t\e(B 0)
- (?\e$(5$u\e(B 0)
- (?\e$(5$v\e(B 0)
- (?\e$(5$w\e(B 0)
- (?\e$(5$x\e(B 0)
- (?\e$(5$y\e(B 0)
- (?\e$(5$z\e(B 0)
- (?\e$(5${\e(B 0)
- (?\e$(5$|\e(B 0)
- (?\e$(5$}\e(B 0)
- (?\e$(5$~\e(B 0)
- ))
-
-;; Determine composition priority and rule of the array of Glyphs.
-;; Sort the glyphs with their priority.
-
-(defun devanagari-reorder-glyphs-for-composition (glyph-alist)
-  "Return the composition rules for the glyphs of GLYPH-ALIST, sorted.
-GLYPH-ALIST is indexed with `aref'.  Each glyph is looked up in
-`devanagari-composition-rules' with `assq', and the resulting entries
-are sorted by ascending second element (the priority)."
-  (let ((count (length glyph-alist))
-        (index 0)
-        (entries nil))
-    ;; Collect the entries in reverse, then restore the input order
-    ;; before sorting.
-    (while (< index count)
-      (setq entries (cons (assq (aref glyph-alist index)
-                                devanagari-composition-rules)
-                          entries)
-            index (1+ index)))
-    (sort (nreverse entries)
-          (function (lambda (a b) (< (nth 1 a) (nth 1 b)))))))
-
-;;(devanagari-compose-to-one-glyph "\e$(5"5!X![\e(B") => "\e2\e$(6!XP"5@![\e1\e(B"
-
-(defun devanagari-compose-to-one-glyph (devanagari-string)
-  "Compose the glyphs of DEVANAGARI-STRING into a single glyph string.
-The glyphs are ordered by `devanagari-reorder-glyphs-for-composition',
-turned into an argument list of the form (GLYPH RULE GLYPH ...),
-narrowed with `devanagari-wide-to-narrow' and handed to
-`compose-chars'.  When only one glyph remains it is returned as a
-one-character string."
-  (let* ((sorted (devanagari-reorder-glyphs-for-composition
-                  (string-to-vector devanagari-string)))
-         ;; Argument list being built: the first glyph, then RULE GLYPH
-         ;; pairs for every following entry.
-         (args (list (car (car sorted))))
-         (pending (cdr sorted))
-         entry)
-    (while pending
-      (setq entry (car pending)
-            pending (cdr pending))
-      (setq args
-            (append args
-                    (list (if (> (length entry) 2)
-                              ;; the entry carries its own composition rule
-                              (nth 2 entry)
-                            ;; no rule in the entry: default composition
-                            '(mr . ml))
-                          (car entry)))))
-    ;; Before applying compose-chars, convert glyphs to
-    ;; 1-column width if possible.
-    (setq args (devanagari-wide-to-narrow args))
-    (if (= (length args) 1)
-        (char-to-string (car args))
-      (apply 'compose-chars args))))
-
-;; Utility function for Phase 2.5
-;; Check whether given glyph is a Devanagari vertical modifier or not.
-;; If it is a vertical modifier, whether it should be 1-column shape or not
-;; depends on previous non-vertical modifier.
- ; return nil if it is not vertical modifier.
-(defun devanagari-vertical-modifier-p (glyph)
-  "Return non-nil if the character GLYPH is a Devanagari vertical modifier.
-The value is the position of GLYPH in the literal glyph set string, or
-nil when GLYPH does not occur in it."
-  ;; GLYPH is the pattern and the glyph set is the searched text, so
-  ;; the pattern must be quoted: unquoted, a character such as `.'
-  ;; would match any member of the set and `\\' would be an invalid
-  ;; regexp.
-  (string-match (regexp-quote (char-to-string glyph))
-                "[\e$(5!]!^!_!`!a!b!c!h!i"p"q"r#K#L#M\e(B]"))
-
-(defun devanagari-non-vertical-modifier-p (glyph)
-  "Return non-nil if the character GLYPH is a non-vertical modifier.
-The value is the position of GLYPH in the literal glyph set string, or
-nil when GLYPH does not occur in it."
-  ;; Quote GLYPH so that regexp special characters are matched
-  ;; literally instead of being interpreted as regexp syntax.
-  (string-match (regexp-quote (char-to-string glyph))
-                "[\e$(5!Z![!\!d!e!f!g\e(B]"))
-
-
-;;
-;; Phase 2.5 Convert Appropriate Character to 1-column shape.
-;;
-;; This is a temporary measure and should be removed once Emacs supports
-;; variable width characters.
-;;
-;; This will convert the composing glyphs (2 column glyphs)
-;; to narrow (1 column) glyphs if they exist.
-;;
-;; devanagari-wide-to-narrow-old converts glyphs simply.
-;; devanagari-wide-to-narrow takes care of upper/lower apply-glyphs
-;; with 2 column base-glyph.
-;;
-;; Execution Examples
-;;(devanagari-wide-to-narrow '(?\e$(5!3\e(B (ml . ml) ?\e$(5!a\e(B))
-;;(devanagari-wide-to-narrow '(?\e$(5!F\e(B (ml . ml) ?\e$(5!a\e(B))
-
-;(defun devanagari-wide-to-narrow (src-list)
-; (if (null src-list) '()
-; (cons
-; (if (and (numberp (car src-list))
-; (cdr (assq (car src-list) devanagari-1-column-char)))
-; (cdr (assq (car src-list) devanagari-1-column-char))
-; (car src-list))
-; (devanagari-wide-to-narrow (cdr src-list)))))
-
-(defun devanagari-wide-to-narrow (src-list)
-  "Return SRC-LIST with glyphs replaced by 1-column glyphs where possible.
-This calls `devanagari-wide-to-narrow-iter' with the wide flag set."
-  (let ((initially-wide t))
-    (devanagari-wide-to-narrow-iter src-list initially-wide)))
-
-(defun devanagari-wide-to-narrow-iter (src-list wide-p)
-  "Return a copy of SRC-LIST with glyphs narrowed where possible.
-Non-numeric elements (composition rules) are copied unchanged.
-WIDE-P is the running flag for the preceding glyph: a vertical modifier
-is narrowed only while WIDE-P is nil.  Narrow forms are looked up in
-`devanagari-1-column-char'."
-  (let ((result nil)
-        glyph narrow)
-    (while src-list
-      (setq glyph (car src-list)
-            src-list (cdr src-list)
-            narrow (and (numberp glyph)
-                        (cdr (assq glyph devanagari-1-column-char))))
-      (cond
-       ;; not glyph code
-       ((not (numberp glyph))
-        (setq result (cons glyph result)))
-       ;; vertical modifier glyph: follows the width of what precedes it
-       ((devanagari-vertical-modifier-p glyph)
-        (if (and (null wide-p) narrow)
-            (setq result (cons narrow result)
-                  wide-p nil)
-          (setq result (cons glyph result)
-                wide-p t)))
-       ;; nonvertical modifier glyph: narrowed, flag left untouched
-       ((devanagari-non-vertical-modifier-p glyph)
-        (setq result (cons (or narrow glyph) result)))
-       ;; normal glyph: narrowed when possible, and sets the flag
-       (t
-        (setq result (cons (or narrow glyph) result)
-              wide-p (null narrow)))))
-    (nreverse result)))
-
-
-;;
-;; Summary
-;;
-
-;;
-;; Decomposition of composite font.
-;;
-
-(defun devanagari-normalize-narrow-glyph (charlist)
-  "Return a copy of CHARLIST with narrow glyphs mapped back to wide ones.
-An element that appears as the cdr of an entry in
-`devanagari-1-column-char' is replaced by the car of that entry;
-every other element is kept as it is."
-  (mapcar (function
-           (lambda (ch)
-             (or (car (rassoc ch devanagari-1-column-char)) ch)))
-          charlist))
-
-(defvar devanagari-decomposition-rules
-  '((?\e$(5"p\e(B -10))
-  "List of (GLYPH PRIORITY) entries used to order glyphs for decomposition.")
-
-(defun devanagari-reorder-glyphs-for-decomposition (glyphlist)
-  "Sort GLYPHLIST for decomposition and return the sorted list.
-Glyphs are ordered by ascending priority as given in
-`devanagari-decomposition-rules'; a glyph without an entry has
-priority 0.  GLYPHLIST is modified destructively by `sort'."
-  (sort glyphlist
-        (function
-         (lambda (x y)
-           ;; `assoc' returns the whole (GLYPH PRIORITY) entry, so take
-           ;; the priority out of it before comparing numbers.
-           (let ((xx (nth 1 (assoc x devanagari-decomposition-rules)))
-                 (yy (nth 1 (assoc y devanagari-decomposition-rules))))
-             (< (or xx 0) (or yy 0)))))))
-
-(defun devanagari-decompose-char (glyph)
-  "Decompose the Devanagari glyph GLYPH and return the result as a string.
-A glyph whose charset is `composition' is first split with
-`decompose-composite-char'.  The parts are normalized to wide glyphs,
-reordered for decomposition, and converted with the `glyph-to-char'
-rule of `string-conversion-by-rule'."
-  (let* ((parts (if (eq 'composition (car (split-char glyph)))
-                    (string-to-list (decompose-composite-char glyph))
-                  (list glyph)))
-         (ordered (devanagari-reorder-glyphs-for-decomposition
-                   (devanagari-normalize-narrow-glyph parts))))
-    (string-conversion-by-rule
-     (mapconcat 'char-to-string ordered "")
-     'glyph-to-char)))
-
-;;;###autoload
-(defun devanagari-decompose-string (str)
-  "Decompose the Devanagari glyph string STR.
-Return the concatenation of `devanagari-decompose-char' applied to
-each character of STR in turn."
-  (let ((remaining str)
-        (pieces nil)
-        ch)
-    (while (not (equal remaining ""))
-      (setq ch (string-to-char remaining)
-            ;; Step over the first character using the length that
-            ;; `char-bytes' reports for it.
-            remaining (substring remaining (char-bytes ch))
-            pieces (cons (devanagari-decompose-char ch) pieces)))
-    (apply 'concat (nreverse pieces))))
-
-;;;###autoload
-(defun devanagari-decompose-region (from to)
-  "Decompose each character between FROM and TO in place.
-Every character matched by the regexp \".\" is replaced by the result
-of `devanagari-decompose-string' on it."
-  (interactive "r")
-  (save-restriction
-    (narrow-to-region from to)
-    (goto-char (point-min))
-    (while (re-search-forward "." nil t)
-      (let ((replacement (devanagari-decompose-string
-                          (buffer-substring (match-beginning 0)
-                                            (match-end 0)))))
-        ;; Point is just after the matched character.
-        (delete-char -1)
-        (insert replacement)))))
-
-;;;
-;;; Composition
-;;;
-
-;;;###autoload
-(defun devanagari-compose-string (str &rest langs)
-  "Compose the Devanagari characters of STR and return the new string.
-STR is first decomposed with `devanagari-decompose-string'.  Each match
-of `devanagari-composite-glyph-unit' is converted by
-`char-to-glyph-devanagari' (called with the matched text followed by
-LANGS) and composed with `devanagari-compose-to-one-glyph'.  Text
-between matches is copied unchanged."
-  (let ((src (devanagari-decompose-string str))
-        (dst "")
-        match-b match-e)
-    (while (string-match devanagari-composite-glyph-unit src)
-      ;; Save the match bounds before calling anything else.
-      (setq match-b (match-beginning 0)
-            match-e (match-end 0))
-      (setq dst (concat dst
-                        (substring src 0 match-b)
-                        (devanagari-compose-to-one-glyph
-                         (apply 'char-to-glyph-devanagari
-                                (substring src match-b match-e)
-                                langs))))
-      (setq src (substring src match-e)))
-    ;; Whatever is left contains no further composable unit.
-    (concat dst src)))
-
-;;;###autoload
-(defun devanagari-compose-region (from to &rest langs)
-  "Compose the Devanagari characters between FROM and TO in place.
-Each match of `devanagari-composite-glyph-unit' is converted by
-`char-to-glyph-devanagari' (called with the matched text followed by
-LANGS), composed with `devanagari-compose-to-one-glyph', and replaced
-in the buffer by the result."
-  (interactive "r")
-  (save-restriction
-    (narrow-to-region from to)
-    (goto-char (point-min))
-    (while (re-search-forward devanagari-composite-glyph-unit nil t)
-      (let* ((unit-start (match-beginning 0))
-             (unit-end (match-end 0))
-             (composed (devanagari-compose-to-one-glyph
-                        (apply 'char-to-glyph-devanagari
-                               (buffer-substring unit-start unit-end)
-                               langs))))
-        (delete-region unit-start unit-end)
-        (insert composed)))))
-
-;; For pre-write and post-read conversion
-
-;;;###autoload
-(defun devanagari-compose-from-is13194-region (from to)
-  "Convert IS 13194 text between FROM and TO to composed Devanagari.
-The region is processed by `indian-to-devanagari-region' and then by
-`devanagari-compose-region'."
-  (interactive "r")
-  (save-restriction
-    (narrow-to-region from to)
-    ;; The bounds are read again for each step, after the previous
-    ;; step has edited the narrowed text.
-    (indian-to-devanagari-region (point-min) (point-max))
-    (devanagari-compose-region (point-min) (point-max))))
-
-;;;###autoload
-(defun in-is13194-devanagari-post-read-conversion (len)
-  "Compose the IS 13194 text from point to point plus LEN.
-This calls `devanagari-compose-from-is13194-region' on that range."
-  (devanagari-compose-from-is13194-region (point) (+ (point) len)))
-
-;;;###autoload
-(defun devanagari-decompose-to-is13194-region (from to)
-  "Convert composed Devanagari between FROM and TO to IS 13194 text.
-The region is processed by `devanagari-decompose-region' and then by
-`devanagari-to-indian-region'."
-  (interactive "r")
-  (save-restriction
-    (narrow-to-region from to)
-    ;; The bounds are read again for each step, after the previous
-    ;; step has edited the narrowed text.
-    (devanagari-decompose-region (point-min) (point-max))
-    (devanagari-to-indian-region (point-min) (point-max))))
-
-;;;###autoload
-(defun in-is13194-devanagari-pre-write-conversion (from to)
-  "Prepare IS 13194 text for writing in the buffer \" *devanagari-work*\".
-If FROM is a string, that string is converted; otherwise the text
-between FROM and TO of the current buffer is copied and converted.
-The work buffer is left current and nil is returned."
-  (let ((source-buffer (current-buffer)))
-    (set-buffer (get-buffer-create " *devanagari-work*"))
-    (erase-buffer)
-    (if (stringp from)
-        (insert from)
-      (insert-buffer-substring source-buffer from to))
-    (devanagari-decompose-to-is13194-region (point-min) (point-max))
-    ;; Should return nil as annotations.
-    nil))
-
-;; For input/output of ITRANS
-
-;;;###autoload
-(defun devanagari-encode-itrans-region (from to)
-  "Encode the Devanagari text between FROM and TO as ITRANS.
-The region is processed by `devanagari-decompose-to-is13194-region'
-and then by `indian-encode-itrans-region'."
-  (interactive "r")
-  (save-restriction
-    (narrow-to-region from to)
-    ;; The bounds are read again for each step, after the previous
-    ;; step has edited the narrowed text.
-    (devanagari-decompose-to-is13194-region (point-min) (point-max))
-    (indian-encode-itrans-region (point-min) (point-max))))
-
-;;;###autoload
-(defun devanagari-decode-itrans-region (from to)
-  "Decode the ITRANS text between FROM and TO into composed Devanagari.
-The region is processed by `indian-decode-itrans-region' and then by
-`devanagari-compose-from-is13194-region'."
-  (interactive "r")
-  (save-restriction
-    (narrow-to-region from to)
-    ;; The bounds are read again for each step, after the previous
-    ;; step has edited the narrowed text.
-    (indian-decode-itrans-region (point-min) (point-max))
-    (devanagari-compose-from-is13194-region (point-min) (point-max))))
-
-;; Test comment.
-
-;;
-(provide 'language/devan-util)
-
-;;; Local Variables:
-;;; generated-autoload-file: "../loaddefs.el"
-;;; End:
-;;; devan-util.el end here
+;;; devan-util.el --- Support for composing Devanagari characters
+
+;; Copyright (C) 2001 Free Software Foundation, Inc.
+
+;; Maintainer: KAWABATA, Taichi <batta@beige.ocn.ne.jp>
+;; Keywords: multilingual, Devanagari
+
+;; This file is part of GNU Emacs.
+
+;; GNU Emacs is free software; you can redistribute it and/or modify
+;; it under the terms of the GNU General Public License as published by
+;; the Free Software Foundation; either version 2, or (at your option)
+;; any later version.
+
+;; GNU Emacs is distributed in the hope that it will be useful,
+;; but WITHOUT ANY WARRANTY; without even the implied warranty of
+;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+;; GNU General Public License for more details.
+
+;; You should have received a copy of the GNU General Public License
+;; along with GNU Emacs; see the file COPYING. If not, write to the
+;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+;; Boston, MA 02111-1307, USA.
+
+;; Created: Feb. 17. 2001
+
+;;; Commentary:
+
+;; This file provides character(Unicode) to glyph(CDAC) conversion and
+;; composition of Devanagari script characters.
+
+;;; Code:
+
+;;;###autoload
+
+;; Devanagari Composable Pattern
+;; C .. Consonants
+;; V .. Vowel
+;; H .. Halant
+;; M .. Matra
+;; A .. Anuswar
+;; D .. Chandrabindu
+;; (N .. Zerowidth Non Joiner)
+;; (J .. Zerowidth Joiner. )
+;; 1. vowel
+;; V(A/D)?
+;; 2. syllable : maximum of 5 consecutive consonants. (e.g. kartsnya)
+;; ((CH)?(CH)?(CH)?CH)?C(MA?|D|H)?
+
+(defconst devanagari-consonant
+  "[\e$,15U\e(B-\e$,15y68\e(B-\e$,16?\e(B]"
+  "Regexp matching a single Devanagari consonant.")
+
+(defconst devanagari-composable-pattern
+ (concat
+ "\\([\e$,15E\e(B-\e$,15T6@6A\e(B][\e$,15A5B\e(B]?\\)\\|\e$,15C\e(B" ; group 1: a vowel with an optional following sign; or one standalone character
+ "\\|\\(" ; group 2 opens: a consonant syllable
+ "\\(?:\\(?:[\e$,15U\e(B-\e$,15y68\e(B-\e$,16?\e(B]\e$,16-\e(B\\)?\\(?:[\e$,15U\e(B-\e$,15y68\e(B-\e$,16?\e(B]\e$,16-\e(B\\)?\\(?:[\e$,15U\e(B-\e$,15y68\e(B-\e$,16?\e(B]\e$,16-\e(B\\)?[\e$,15U\e(B-\e$,15y68\e(B-\e$,16?\e(B]\e$,16-\e(B\\)?" ; optional prefix: up to three optional consonant+halant pairs followed by one required pair
+ "[\e$,15U\e(B-\e$,15y68\e(B-\e$,16?\e(B]\\(?:\e$,16-\e(B\\|[\e$,15~\e(B-\e$,16-6B6C\e(B]?[\e$,15B5A\e(B]?\\)?" ; final consonant, then either a halant or optional trailing signs
+ "\\)") ; group 2 closes
+ "Regexp matching a composable sequence of Devanagari characters.")
+
+(defun devanagari-compose-region (from to)
+  "Compose the Devanagari text between FROM and TO.
+Every match of `devanagari-composable-pattern' in the region is passed
+to `devanagari-compose-syllable-region'.  Point and the buffer
+restriction are restored afterwards."
+  (interactive "r")
+  (save-excursion
+    (save-restriction
+      (narrow-to-region from to)
+      (goto-char (point-min))
+      (while (re-search-forward devanagari-composable-pattern nil t)
+        (let ((syllable-start (match-beginning 0))
+              (syllable-end (match-end 0)))
+          (devanagari-compose-syllable-region syllable-start
+                                              syllable-end))))))
+(defun devanagari-compose-string (string)
+  "Return a copy of STRING with its Devanagari sequences composed.
+STRING is passed through `decompose-string', inserted into a temporary
+buffer, and composed there with `devanagari-compose-region'."
+  (let ((plain (decompose-string string)))
+    (with-temp-buffer
+      (insert plain)
+      (devanagari-compose-region (point-min) (point-max))
+      (buffer-string))))
+
+(defun range (from to)
+  "Return the list of integers from FROM to TO, both inclusive.
+Return nil when FROM is greater than TO."
+  (let ((n to)
+        (acc nil))
+    ;; Walk down from TO so that consing yields ascending order.
+    (while (>= n from)
+      (setq acc (cons n acc)
+            n (1- n)))
+    acc))
+
+(defun regexp-of-hashtbl-keys (hashtbl)
+  "Return a regexp that matches any key of the hash table HASHTBL.
+The keys are collected with `maphash', sorted longest first, and
+passed to `regexp-opt'.  `max-specpdl-size' is bound to 1000 while
+this runs."
+  (let ((max-specpdl-size 1000)
+        (keys nil))
+    (maphash (function (lambda (key value) (setq keys (cons key keys))))
+             hashtbl)
+    (regexp-opt
+     (sort keys
+           (function (lambda (a b) (> (length a) (length b))))))))
+
+(defun devanagari-composition-function (from to pattern &optional string)
+  "Compose Devanagari characters in REGION, or STRING if specified.
+REGION is the buffer text between FROM and TO.  The REGION or STRING
+is assumed to match the composable PATTERN regexp in full; PATTERN
+itself is not used here.  Return the difference TO minus FROM."
+  (cond (string (devanagari-compose-syllable-string string))
+        (t (devanagari-compose-syllable-region from to)))
+  (- to from))
+
+;; Register a function to compose Devanagari characters.
+;; For each listed code point, store the pair
+;; (devanagari-composable-pattern . devanagari-composition-function)
+;; in the corresponding slot of `composition-function-table'.
+(mapc
+ (function (lambda (ucs)
+             (aset composition-function-table (decode-char 'ucs ucs)
+                   (list (cons devanagari-composable-pattern
+                               'devanagari-composition-function)))))
+ ;; Build the list with `append': `nconc' would splice the following
+ ;; lists into the quoted constant (#x0903) itself.
+ (append '(#x0903) (range #x0905 #x0939) (range #x0958 #x0961)))
+
+;; Notes on conversion steps.
+
+;; 1. chars to glyphs
+;;
+;; Rules are not applied to a halant that appears at the end of the
+;; text. Also, the preceding/following "r" is treated as a special case.
+
+;; 2. glyphs reordering.
+;;
+;; The glyphs are split at each halant, and each glyph group is
+;; re-ordered in the following order.
+;;
+;; Note that `consonant-glyph' mentioned here does not contain the
+;; vertical bar (right modifier) attached at the right of the
+;; consonant.
+;;
+;; If the glyph-group contains right modifier,
+;; (1) consonant-glyphs/vowels, with nukta sign
+;; (2) spacing
+;; (3) right modifier (may be matra)
+;; (4) top matra
+;; (5) preceding "r"
+;; (6) anuswar
+;; (7) following "r"
+;; (8) bottom matra or halant.
+;;
+;; Otherwise,
+;; (1) consonant-glyph/vowels, with nukta sign
+;; (3) left matra
+;; (4) top matra
+;; (5) preceding "r"
+;; (6) anuswar
+;; (7) following "r"
+;; (8) bottom matra or halant.
+;; (2) spacing
+
+;; 3. glyph to glyph
+;;
+;; For better display, some glyph display would be tuned.
+
+;; 4. Composition.
+;;
+;; left modifiers will be attached at the left.
+;; others will be attached right.
+
+;; Problem::
+;; Can we generalize this method to other Indian scripts?
+
+(defvar dev-char-glyph
+  '(("\e$,15E\e(B" . "\e$,4 K\e(B")
+    ("\e$,15F\e(B" . "\e$,4 K\")\e(B")
+    ("\e$,15~\e(B" . "\e$,4\")\e(B")
+    ("\e$,15G\e(B" . "\e$,4 \\e(B")
+    ("\e$,15\7f\e(B" . "\e$,4\"*\e(B")
+    ("\e$,15\7f5A\e(B" . "\e$,4\"*\e(B\\e$,4\"&\e(B")
+    ("\e$,15H\e(B" . "\e$,4 \"'\e(B")
+    ("\e$,15H5A\e(B" . "\e$,4 \"'\"&\e(B")
+    ("\e$,16 \e(B" . "\e$,4\"2\e(B")
+    ("\e$,16 5A\e(B" . "\e$,4\"2\"&\e(B")
+    ("\e$,15I\e(B" . "\e$,4 ]\e(B")
+    ("\e$,16!\e(B" . "\e$,4\"6\e(B")
+    ("\e$,15J\e(B" . "\e$,4 ^\"P\e(B")
+    ("\e$,16"\e(B" . "\e$,4\":\e(B")
+    ("\e$,15K\e(B" . "\e$,4 `\"Q\e(B")
+    ("\e$,16#\e(B" . "\e$,4\">\e(B")
+    ;;("\e$,15L\e(B" . nil) ; not implemented.
+    ("\e$,16$\e(B" . "\e$,4\"?\e(B")
+    ("\e$,15M\e(B" . "\e$,4 b\"L\e(B")
+    ("\e$,15M5A\e(B" . "\e$,4 b\"$\e(B")
+    ("\e$,15M5B\e(B" . "\e$,4 b\"$\e(B")
+    ("\e$,16%\e(B" . "\\e$,4\"L\e(B")
+    ("\e$,15N\e(B" . "\e$,4 b\"@\e(B")
+    ("\e$,15N5A\e(B" . "\e$,4 b\"@\"&\e(B")
+    ("\e$,16&\e(B" . "\\e$,4\"@\e(B")
+    ("\e$,16&5A\e(B" . "\\e$,4\"@\e(B\\e$,4\"&\e(B")
+    ("\e$,15O\e(B" . "\e$,4 b\e(B")
+    ("\e$,16'\e(B" . "\\e$,4\"D\e(B")
+    ("\e$,16'5A\e(B" . "\\e$,4\"D\e(B\\e$,4\"&\e(B")
+    ("\e$,15P\e(B" . "\e$,4 b\"D\e(B")
+    ("\e$,15P5A\e(B" . "\e$,4 b\"D\"&\e(B")
+    ("\e$,16(\e(B" . "\\e$,4\"H\e(B")
+    ("\e$,16(5A\e(B" . "\\e$,4\"H\e(B\\e$,4\"&\e(B")
+    ("\e$,15Q\e(B" . "\e$,4 K\")\"L\e(B") ;; special rule for reordering.
+    ("\e$,15Q5A\e(B" . "\e$,4 K\")\"$\e(B")
+    ("\e$,15Q5B\e(B" . "\e$,4 K\")\"$\e(B")
+    ("\e$,16)\e(B" . "\\e$,4\")\"L\e(B")
+    ("\e$,16)5A\e(B" . "\\e$,4\")\"$\e(B")
+    ("\e$,16)5B\e(B" . "\\e$,4\")\"$\e(B")
+    ("\e$,15R\e(B" . "\e$,4 K\")\"@\e(B")
+    ("\e$,15R5A\e(B" . "\e$,4 K\")\"@\"&\e(B")
+    ("\e$,16*\e(B" . "\\e$,4\")\"@\e(B")
+    ("\e$,16*5A\e(B" . "\\e$,4\")\"@\"&\e(B")
+    ("\e$,15S\e(B" . "\e$,4 K\")\"D\e(B")
+    ("\e$,15S5A\e(B" . "\e$,4 K\")\"D\"&\e(B")
+    ("\e$,16+\e(B" . "\\e$,4\")\"D\e(B")
+    ("\e$,16+5A\e(B" . "\\e$,4\")\"D\"&\e(B")
+    ("\e$,15T\e(B" . "\e$,4 K\")\"H\e(B")
+    ("\e$,15T5A\e(B" . "\e$,4 K\")\"H\"&\e(B")
+    ("\e$,16,\e(B" . "\\e$,4\")\"H\e(B")
+    ("\e$,16,5A\e(B" . "\\e$,4\")\"H\"&\e(B")
+    ("\e$,16@\e(B" . "\e$,4 a\"Q\e(B")
+    ;;("\e$,16B\e(B" . nil)
+    ;;("\e$,16A\e(B" . nil)
+    ;;("\e$,16C\e(B" . nil)
+
+    ;; GUTTURALS
+    ("\e$,15U\e(B" . "\e$,4 e\"R\e(B")
+    ("\e$,15U6-\e(B" . "\e$,4 c\e(B")
+    ("\e$,15U6-5p\e(B" . "\e$,4 g\"R\e(B")
+    ("\e$,15U6-5d\e(B" . "\e$,4 h\"R\e(B")
+    ("\e$,15U6-5w\e(B" . "\e$,4 i\")\e(B")
+    ("\e$,15U6-5w6-\e(B" . "\e$,4 i\e(B")
+
+    ("\e$,15V\e(B" . "\e$,4 j\")\e(B")
+    ("\e$,15V6-\e(B" . "\e$,4 j\e(B")
+    ("\e$,15V6-5p\e(B" . "\e$,4 l\")\e(B")
+    ("\e$,15V6-5p6-\e(B" . "\e$,4 l\e(B")
+
+    ("\e$,15W\e(B" . "\e$,4 m\")\e(B")
+    ("\e$,15W6-\e(B" . "\e$,4 m\e(B")
+    ("\e$,15W6-5p\e(B" . "\e$,4 o\")\e(B")
+    ("\e$,15W6-5p6-\e(B" . "\e$,4 o\e(B")
+
+    ("\e$,15X\e(B" . "\e$,4 p\")\e(B")
+    ("\e$,15X6-\e(B" . "\e$,4 p\e(B")
+    ("\e$,15X6-5p\e(B" . "\e$,4 q\")\e(B")
+    ("\e$,15X6-5p6-\e(B" . "\e$,4 q\e(B")
+
+    ("\e$,15Y\e(B" . "\e$,4 r\"S\e(B")
+    ;; PALATALS
+    ("\e$,15Z\e(B" . "\e$,4 s\")\e(B")
+    ("\e$,15Z6-\e(B" . "\e$,4 s\e(B")
+    ("\e$,15Z6-5p\e(B" . "\e$,4 t\")\e(B")
+    ("\e$,15Z6-5p6-\e(B" . "\e$,4 t\e(B")
+
+    ("\e$,15[\e(B" . "\e$,4 u\"T\e(B")
+
+    ("\e$,15\\e(B" . "\e$,4 v\")\e(B")
+    ("\e$,15\6-\e(B" . "\e$,4 v\e(B")
+    ("\e$,15\6-5p\e(B" . "\e$,4 x\")\e(B")
+    ("\e$,15\6-5p6-\e(B" . "\e$,4 x\e(B")
+    ("\e$,15\6-5^\e(B" . "\e$,4 y\")\e(B")
+    ("\e$,15\6-5^6-\e(B" . "\e$,4 y\e(B")
+
+    ("\e$,15]\e(B" . "\e$,4 z\")\e(B")
+    ("\e$,15]6-\e(B" . "\e$,4 z\e(B")
+    ("\e$,15]6-5p\e(B" . "\e$,4 {\")\e(B")
+    ("\e$,15]6-5p6-\e(B" . "\e$,4 {\e(B")
+
+    ("\e$,15^\e(B" . "\e$,4 |\")\e(B")
+    ("\e$,15^6-\e(B" . "\e$,4 |\e(B")
+    ;; CEREBRALS
+    ("\e$,15_\e(B" . "\e$,4 }\"U\e(B")
+    ("\e$,15_6-5_\e(B" . "\e$,4 ~\"U\e(B")
+    ("\e$,15_6-5`\e(B" . "\e$,4 \7f\"U\e(B")
+
+    ("\e$,15`\e(B" . "\e$,4! \"V\e(B")
+    ("\e$,15`6-5`\e(B" . "\e$,4!!\"V\e(B")
+
+    ("\e$,15a\e(B" . "\e$,4!\"\"W\e(B")
+    ("\e$,15a6-5a\e(B" . "\e$,4!$\"W\e(B")
+    ("\e$,15a6-5b\e(B" . "\e$,4!%\"W\e(B")
+
+    ("\e$,15b\e(B" . "\e$,4!&\"X\e(B")
+
+    ("\e$,15c\e(B" . "\e$,4!(\")\e(B")
+    ("\e$,15c6-\e(B" . "\e$,4!(\e(B")
+    ;; DENTALS
+    ("\e$,15d\e(B" . "\e$,4!)\")\e(B")
+    ("\e$,15d6-\e(B" . "\e$,4!)\e(B")
+    ("\e$,15d6-5p\e(B" . "\e$,4!*\")\e(B")
+    ("\e$,15d6-5p6-\e(B" . "\e$,4!*\e(B")
+    ("\e$,15d6-5d\e(B" . "\e$,4!+\")\e(B")
+    ("\e$,15d6-5d6-\e(B" . "\e$,4!+\e(B")
+
+    ("\e$,15e\e(B" . "\e$,4!,\")\e(B")
+    ("\e$,15e6-\e(B" . "\e$,4!,\e(B")
+    ("\e$,15e6-5p\e(B" . "\e$,4!-\")\e(B")
+    ("\e$,15e6-5p6-\e(B" . "\e$,4!-\e(B")
+
+    ("\e$,15f\e(B" . "\e$,4!.\"Y\e(B")
+    ("\e$,15f6#\e(B" . "\e$,4!/\"Y\e(B")
+    ("\e$,15f6-5p\e(B" . "\e$,4!0\"Y\e(B")
+    ("\e$,15f6-5f\e(B" . "\e$,4!1\"Y\e(B")
+    ("\e$,15f6-5g\e(B" . "\e$,4!2\"Y\e(B")
+    ("\e$,15f6-5n\e(B" . "\e$,4!3\e(B")
+    ("\e$,15f6-5o\e(B" . "\e$,4!4\e(B")
+    ("\e$,15f6-5u\e(B" . "\e$,4!5\"Y\e(B")
+
+    ("\e$,15g\e(B" . "\e$,4!6\")\e(B")
+    ("\e$,15g6-\e(B" . "\e$,4!6\e(B")
+    ("\e$,15g6-5p\e(B" . "\e$,4!7\")\e(B")
+    ("\e$,15g6-5p6-\e(B" . "\e$,4!7\e(B")
+
+    ("\e$,15h\e(B" . "\e$,4!8\")\e(B")
+    ("\e$,15h6-\e(B" . "\e$,4!8\e(B")
+    ("\e$,15h6-5p\e(B" . "\e$,4!9\")\e(B")
+    ;; Half form: like every other key ending in halant, it maps to
+    ;; the glyph without the right-modifier glyph.
+    ("\e$,15h6-5p6-\e(B" . "\e$,4!9\e(B")
+    ("\e$,15h6-5h\e(B" . "\e$,4!:\")\e(B")
+    ("\e$,15h6-5h6-\e(B" . "\e$,4!:\e(B")
+
+    ("\e$,15i\e(B" . "\e$,4!8"#")\e(B")
+    ;; LABIALS
+    ("\e$,15j\e(B" . "\e$,4!;\")\e(B")
+    ("\e$,15j6-\e(B" . "\e$,4!;\e(B")
+    ("\e$,15j6-5p\e(B" . "\e$,4!<\")\e(B")
+    ("\e$,15j6-5p6-\e(B" . "\e$,4!<\e(B")
+
+    ("\e$,15k\e(B" . "\e$,4!a\"[\e(B")
+    ("\e$,15k6-\e(B" . "\e$,4!=\e(B")
+    ("\e$,15k6-5p\e(B" . "\e$,4!c\"[\e(B")
+
+    ("\e$,15l\e(B" . "\e$,4!d\")\e(B")
+    ("\e$,15l6-\e(B" . "\e$,4!d\e(B")
+    ("\e$,15l6-5p\e(B" . "\e$,4!e\")\e(B")
+    ("\e$,15l6-5p6-\e(B" . "\e$,4!e\e(B")
+
+    ("\e$,15m\e(B" . "\e$,4!f\")\e(B")
+    ("\e$,15m6-\e(B" . "\e$,4!f\e(B")
+    ("\e$,15m6-5p\e(B" . "\e$,4!g\")\e(B")
+    ("\e$,15m6-5p6-\e(B" . "\e$,4!g\e(B")
+
+    ("\e$,15n\e(B" . "\e$,4!h\")\e(B")
+    ("\e$,15n6-\e(B" . "\e$,4!h\e(B")
+    ("\e$,15n6-5p\e(B" . "\e$,4!i\")\e(B")
+    ("\e$,15n6-5p6-\e(B" . "\e$,4!i\e(B")
+    ;; SEMIVOWELS
+    ("\e$,15o\e(B" . "\e$,4!j\")\e(B")
+    ("\e$,15o6-\e(B" . "\e$,4!j\e(B")
+    ("\e$,15o6-5p\e(B" . "\e$,4!k\")\e(B")
+    ("\e$,15o6-5p6-\e(B" . "\e$,4!k\e(B")
+    ("\e$,16-5o\e(B" . "\e$,4!l\e(B") ;; when every other lig. fails.
+
+    ("\e$,15p\e(B" . "\e$,4!n\"W\e(B")
+    ;; ("\e$,15p6-\e(B" . "\\e$,4"'\e(B") ;; special case. only the topmost pos.
+    ("\e$,15q\e(B" . "\e$,4!n"#"W\e(B")
+    ("\e$,15q6-\e(B" . "\e$,4!m\e(B") ;; IS 13194 special rule.
+    ("\e$,15p6!\e(B" . "\e$,4!o\"[\e(B")
+    ("\e$,15p6"\e(B" . "\e$,4!p\"\\e(B")
+
+    ("\e$,15r\e(B" . "\e$,4!q\")\e(B")
+    ("\e$,15r6-\e(B" . "\e$,4!q\e(B")
+    ("\e$,15s\e(B" . "\e$,4!s\e(B")
+    ("\e$,15s6-\e(B" . "\e$,4!r\e(B")
+    ("\e$,15t\e(B" . "\e$,4!s\"#\e(B")
+    ("\e$,15t6-\e(B" . "\e$,4!r\"#\e(B")
+
+    ("\e$,15u\e(B" . "\e$,4!t\")\e(B")
+    ("\e$,15u6-\e(B" . "\e$,4!t\e(B")
+    ("\e$,15u6-5p\e(B" . "\e$,4!u\")\e(B")
+    ("\e$,15u6-5p6-\e(B" . "\e$,4!u\e(B")
+    ;; SIBILANTS
+    ("\e$,15v\e(B" . "\e$,4!v\")\e(B")
+    ("\e$,15v6-\e(B" . "\e$,4!v\e(B")
+    ("\e$,15v6-5u\e(B" . "\e$,4!w\")\e(B")
+    ("\e$,15v6-5u6-\e(B" . "\e$,4!w\e(B")
+    ("\e$,15v6-5p\e(B" . "\e$,4!x\")\e(B")
+    ("\e$,15v6-5p6-\e(B" . "\e$,4!x\e(B")
+
+    ("\e$,15w\e(B" . "\e$,4!y\")\e(B")
+    ("\e$,15w6-\e(B" . "\e$,4!y\e(B")
+    ("\e$,15x\e(B" . "\e$,4!z\")\e(B")
+    ("\e$,15x6-\e(B" . "\e$,4!z\e(B")
+    ("\e$,15x6-5p\e(B" . "\e$,4!{\")\e(B")
+    ("\e$,15x6-5p6-\e(B" . "\e$,4!{\e(B")
+
+    ("\e$,15y\e(B" . "\e$,4!}\e(B")
+    ("\e$,15y6-\e(B" . "\e$,4!|\e(B")
+    ("\e$,15y6#\e(B" . "\e$,4!~\e(B")
+    ("\e$,15y6-5p\e(B" . "\e$,4!\7f\e(B")
+    ("\e$,15y6-5n\e(B" . "\e$,4\" \e(B")
+    ("\e$,15y6-5o\e(B" . "\e$,4\"!\e(B")
+    ;; NUKTAS
+    ("\e$,168\e(B" . "\e$,4 f"R"S\e(B")
+    ("\e$,1686-\e(B" . "\e$,4 d\e(B")
+    ("\e$,169\e(B" . "\e$,4 k\")\e(B")
+    ("\e$,1696-\e(B" . "\e$,4 k\e(B")
+    ("\e$,16:\e(B" . "\e$,4 n\")\e(B")
+    ("\e$,16:6-\e(B" . "\e$,4 n\e(B")
+    ("\e$,16;\e(B" . "\e$,4 w\")\e(B")
+    ("\e$,16;6-\e(B" . "\e$,4 w\e(B")
+    ("\e$,16<\e(B" . "\e$,4!#\"W\e(B")
+    ("\e$,16=\e(B" . "\e$,4!'\"X\e(B")
+    ("\e$,16>\e(B" . "\e$,4!b\"[\e(B")
+    ("\e$,16>6-\e(B" . "\e$,4!>\e(B")
+    ("\e$,16?\e(B" . "\e$,4!j"#")\e(B")
+    ;; misc modifiers.
+    ("\e$,15A\e(B" . "\\e$,4\"$\e(B")
+    ("\e$,15B\e(B" . "\\e$,4\"&\e(B")
+    ("\e$,15C\e(B" . "\e$,4 F\e(B")
+    ("\e$,15|\e(B" . "\e$,4\"#\e(B")
+    ("\e$,15}\e(B" . "\e$,4 E\e(B")
+    ("\e$,16-\e(B" . "\e$,4\"\"\e(B")
+    ("\e$,16-5p\e(B" . "\e$,4\"%\e(B") ;; following "r"
+    ;; ("\e$,160\e(B" . "\e$,4 D\e(B")
+    ;; ("\e$,16D\e(B" . "\e$,4 J\e(B")
+    ;; ("\e$,16F\e(B" . "")
+    ;; ("\e$,16G\e(B" . "")
+    ;; ("\e$,16H\e(B" . "")
+    ;; ("\e$,16I\e(B" . "")
+    ;; ("\e$,16J\e(B" . "")
+    ;; ("\e$,16K\e(B" . "")
+    ;; ("\e$,16L\e(B" . "")
+    ;; ("\e$,16M\e(B" . "")
+    ;; ("\e$,16N\e(B" . "")
+    ;; ("\e$,16O\e(B" . "")
+    )
+  "Devanagari characters to glyphs conversion table.
+Default value contains only the basic rules. You may add your own
+preferred rule from the sanskrit fonts." )
+
+(defvar dev-char-glyph-hash
+  ;; `makehash' is an obsolete alias; `make-hash-table' is the
+  ;; supported constructor.  Keys are strings, hence the `equal' test.
+  (let ((hash (make-hash-table :test 'equal)))
+    (mapc (function (lambda (x) (puthash (car x) (cdr x) hash)))
+          dev-char-glyph)
+    hash)
+  "Hash table built from `dev-char-glyph': character string to glyph string.")
+
+(defvar dev-char-glyph-regexp
+  (regexp-of-hashtbl-keys dev-char-glyph-hash)
+  "Regexp matching any key of `dev-char-glyph-hash'.")
+
+;; glyph-to-glyph conversion table.
+;; it is supposed that glyphs are ordered in
+;; [consonant/nukta] - [matra/halant] - [preceding-r] - [anuswar].
+
+(defvar dev-glyph-glyph ; alist of (GLYPH-SEQUENCE . REPLACEMENT) strings, loaded into dev-glyph-glyph-hash
+ '(("\\e$,4"'\e(B\\e$,4"&\e(B" . "\\e$,4"(\e(B")
+ ("\\e$,4"'\e(B\\e$,4"$\e(B" . "\\e$,4"(\e(B")
+ ("\e$,4"*\e(B\\e$,4"&\e(B" . "\e$,4"+\e(B")
+ ("\e$,4"*\e(B\\e$,4"'\e(B" . "\e$,4",\e(B")
+ ("\e$,4"*\e(B\\e$,4"'\e(B\\e$,4"&\e(B" . "\e$,4"-\e(B")
+ ("\e$,4"2\e(B\\e$,4"&\e(B" . "\e$,4"3\e(B")
+ ("\e$,4"2\e(B\\e$,4"'\e(B" . "\e$,4"4\e(B")
+ ("\e$,4"2\e(B\\e$,4"'\e(B\\e$,4"&\e(B" . "\e$,4"5\e(B")
+ ("\e$,4"#\e(B\\e$,4"6\e(B" . "\e$,4"7\e(B")
+ ("\e$,4"%\e(B\\e$,4"6\e(B" . "\e$,4"8\e(B")
+ ;;("\e$,4"6\e(B" . "\e$,4"9\e(B")
+ ("\e$,4"#\e(B\\e$,4":\e(B" . "\e$,4";\e(B")
+ ("\e$,4"%\e(B\\e$,4":\e(B" . "\e$,4"<\e(B")
+ ;;("\e$,4":\e(B" . "\e$,4"=\e(B")
+ ("\\e$,4"@\e(B\\e$,4"&\e(B" . "\\e$,4"A\e(B")
+ ("\\e$,4"@\e(B\\e$,4"'\e(B" . "\\e$,4"B\e(B")
+ ("\\e$,4"@\e(B\\e$,4"'\e(B\\e$,4"&\e(B" . "\\e$,4"C\e(B")
+ ("\\e$,4"D\e(B\\e$,4"&\e(B" . "\\e$,4"E\e(B")
+ ("\\e$,4"D\e(B\\e$,4"'\e(B" . "\\e$,4"F\e(B")
+ ("\\e$,4"D\e(B\\e$,4"'\e(B\\e$,4"&\e(B" . "\\e$,4"G\e(B")
+ ("\\e$,4"H\e(B\\e$,4"&\e(B" . "\\e$,4"I\e(B")
+ ("\\e$,4"H\e(B\\e$,4"'\e(B" . "\\e$,4"J\e(B")
+ ("\\e$,4"H\e(B\\e$,4"'\e(B\\e$,4"&\e(B" . "\\e$,4"K\e(B")
+ ("\\e$,4"L\e(B\\e$,4"&\e(B" . "\\e$,4"M\e(B")
+ ("\\e$,4"L\e(B\\e$,4"'\e(B" . "\\e$,4"N\e(B")
+ ("\\e$,4"L\e(B\\e$,4"'\e(B\\e$,4"&\e(B" . "\\e$,4"O\e(B")
+ ))
+(defvar dev-glyph-glyph-hash
+  ;; `makehash' is an obsolete alias; `make-hash-table' is the
+  ;; supported constructor.  Keys are strings, hence the `equal' test.
+  (let ((hash (make-hash-table :test 'equal)))
+    (mapc (function (lambda (x) (puthash (car x) (cdr x) hash)))
+          dev-glyph-glyph)
+    hash)
+  "Hash table built from `dev-glyph-glyph': glyph sequence to replacement.")
+(defvar dev-glyph-glyph-regexp
+  (regexp-of-hashtbl-keys dev-glyph-glyph-hash)
+  "Regexp matching any key of `dev-glyph-glyph-hash'.")
+
+
+;; yet another glyph-to-glyph conversions.
+(defvar dev-glyph-glyph-2 ; alist of (GLYPH . REPLACEMENT) strings, loaded into dev-glyph-glyph-2-hash
+ '(("\e$,4"*\e(B" . "\e$,4".\e(B")
+ ("\e$,4"+\e(B" . "\e$,4"/\e(B")
+ ("\e$,4",\e(B" . "\e$,4"0\e(B")
+ ("\e$,4"-\e(B" . "\e$,4"1\e(B")))
+(defvar dev-glyph-glyph-2-hash
+  ;; `makehash' is an obsolete alias; `make-hash-table' is the
+  ;; supported constructor.  Keys are strings, hence the `equal' test.
+  (let ((hash (make-hash-table :test 'equal)))
+    (mapc (function (lambda (x) (puthash (car x) (cdr x) hash)))
+          dev-glyph-glyph-2)
+    hash)
+  "Hash table built from `dev-glyph-glyph-2': glyph to replacement glyph.")
+(defvar dev-glyph-glyph-2-regexp
+  (regexp-of-hashtbl-keys dev-glyph-glyph-2-hash)
+  "Regexp matching any key of `dev-glyph-glyph-2-hash'.")
+
+
+(defun dev-charseq (from &optional to)
+  "Return the list of Devanagari glyph characters for codes FROM to TO.
+Each integer in the range is converted with `indian-glyph-char' for
+the `devanagari' script.  When TO is nil, only FROM is converted."
+  (let ((last (or to from)))
+    (mapcar (function (lambda (code) (indian-glyph-char code 'devanagari)))
+            (range from last))))
+
+(defvar dev-glyph-cvn
+  (append (dev-charseq #x2b)
+          (dev-charseq #x3c #xc1)
+          (dev-charseq #xc3))
+  "List of Devanagari consonant, vowel and nukta glyphs.")
+
+(defvar dev-glyph-space
+  (dev-charseq #xf0 #xfe)
+  "List of Devanagari spacing glyphs.")
+
+(defvar dev-glyph-right-modifier
+  (append (dev-charseq #xc9)
+          (dev-charseq #xd2 #xd5))
+  "List of Devanagari modifier glyphs attached at the right side.")
+
+(defvar dev-glyph-right-modifier-regexp
+  (concat "[" dev-glyph-right-modifier "]")
+  "Regexp matching any one glyph of `dev-glyph-right-modifier'.")
+
+(defvar dev-glyph-left-matra
+  (dev-charseq #xca #xd1)
+  "List of Devanagari matra glyphs attached at the left side.")
+
+(defvar dev-glyph-top-matra
+  (dev-charseq #xe0 #xef)
+  "List of Devanagari matra glyphs attached at the top side.")
+
+(defvar dev-glyph-bottom-modifier
+  (append (dev-charseq #xd6 #xdf)
+          (dev-charseq #xc2))
+  "List of Devanagari modifier glyphs attached at the bottom.")
+
+(defvar dev-glyph-order
+  (list (cons dev-glyph-cvn 1)
+        (cons dev-glyph-space 2)
+        (cons dev-glyph-right-modifier 3)
+        (cons dev-glyph-left-matra 3) ;; processed by reference point.
+        (cons dev-glyph-top-matra 4)
+        (cons (dev-charseq #xc7 #xc8) 5)
+        (cons (dev-charseq #xc6) 6)
+        (cons (dev-charseq #xc5) 7)
+        (cons dev-glyph-bottom-modifier 8))
+  "Alist of (GLYPH-LIST . ORDER) giving each glyph its composition order.")
+
+;; Store each glyph's order from `dev-glyph-order' as its
+;; `composition-order' char-code property.
+(dolist (class dev-glyph-order)
+  (let ((order (cdr class)))
+    (dolist (glyph (car class))
+      (put-char-code-property glyph 'composition-order order))))
+
+;; Give every left matra glyph the `reference-point' property (3 . 5).
+(dolist (glyph dev-glyph-left-matra)
+  (put-char-code-property glyph 'reference-point '(3 . 5)))
+
+(defun devanagari-compose-syllable-string (string)
+  "Return STRING composed as one Devanagari syllable.
+STRING is passed through `decompose-string', inserted into a temporary
+buffer, and composed there with `devanagari-compose-syllable-region'."
+  (let ((plain (decompose-string string)))
+    (with-temp-buffer
+      (insert plain)
+      (devanagari-compose-syllable-region (point-min) (point-max))
+      (buffer-string))))
+
+(defun devanagari-compose-syllable-region (from to)
+ "Compose devanagari syllable in region FROM to TO.
+The text between FROM and TO is processed in four steps:
+ 1. Each match of `dev-char-glyph-regexp' is translated into glyphs
+    through `dev-char-glyph-hash'.
+ 2. The first match of `dev-glyph-glyph-regexp' in the glyph string
+    is replaced through `dev-glyph-glyph-hash'; if that happened and
+    more than one consonant was counted, the first match of
+    `dev-glyph-glyph-2-regexp' is replaced through
+    `dev-glyph-glyph-2-hash' as well.
+ 3. The glyph string is cut into blocks and the glyphs of each block
+    are sorted by their `composition-order' char-code property.
+ 4. Every glyph is paired with its `reference-point' property, or
+    with (5 . 3) when it has none, and the result is handed to
+    `compose-region' as the components for FROM..TO."
+ ;; glyph-str      -- glyph string under construction (nil until the
+ ;;                   first glyph is appended); reused at the end for
+ ;;                   the component list passed to `compose-region'.
+ ;; cons-num       -- number of matches that contained a consonant.
+ ;; glyph-str-list -- reordered glyphs, as a list of characters.
+ ;; last-halant, preceding-r, last-modifier -- flags for the special
+ ;;                   rules below.
+ (let ((glyph-str nil) (cons-num 0) glyph-str-list
+ (last-halant nil) (preceding-r nil) (last-modifier nil)
+ (last-char (char-before to)) match-str
+ glyph-block split-pos)
+ (save-excursion
+ (save-restriction
+ ;;; *** char-to-glyph conversion ***
+ ;; Special rule 1. -- Last halant must be preserved.
+ ;; The final halant is excluded from the narrowed region so that it
+ ;; is not translated with the rest; its glyph is appended again
+ ;; once the translation is finished.
+ (if (eq last-char ?\e$,16-\e(B)
+ (progn
+ (setq last-halant t)
+ (narrow-to-region from (1- to)))
+ (narrow-to-region from to)
+ ;; note if the last char is modifier.
+ (if (or (eq last-char ?\e$,15A\e(B) (eq last-char ?\e$,15B\e(B))
+ (setq last-modifier t)))
+ (goto-char (point-min))
+ ;; Special rule 2. -- preceding "r halant" must be modifier.
+ ;; When the text starts with "r halant" followed by at least one
+ ;; more character, skip those two characters; the glyph standing
+ ;; for them is added after the translation loop.
+ (when (looking-at "\e$,15p6-\e(B.")
+ (setq preceding-r t)
+ (goto-char (+ 2 (point))))
+ ;; translate the remaining characters into glyphs
+ (while (re-search-forward dev-char-glyph-regexp nil t)
+ (setq match-str (match-string 0))
+ (setq glyph-str
+ (concat glyph-str
+ (gethash match-str dev-char-glyph-hash)))
+ ;; count the number of consonant glyphs.
+ (if (string-match devanagari-consonant match-str)
+ (setq cons-num (1+ cons-num))))
+ ;; preceding-r must be attached before the anuswar, if one exists.
+ ;; With a trailing modifier the glyph is inserted just before the
+ ;; last glyph; otherwise it is appended at the end.
+ (if preceding-r
+ (if last-modifier
+ (setq glyph-str (concat (substring glyph-str 0 -1)
+ "\e$,4"'\e(B" (substring glyph-str -1)))
+ (setq glyph-str (concat glyph-str "\e$,4"'\e(B"))))
+ ;; Re-attach the halant that special rule 1 set aside.
+ (if last-halant (setq glyph-str (concat glyph-str "\e$,4""\e(B")))
+ ;;; *** glyph-to-glyph conversion ***
+ ;; NOTE(review): glyph-str is still nil here when nothing matched
+ ;; `dev-char-glyph-regexp' and neither special rule added a glyph;
+ ;; `string-match' is then handed nil.  Confirm that callers never
+ ;; pass such a region.
+ ;; Only the first match is replaced, and the second table is
+ ;; consulted only when the first replacement took place.
+ (when (string-match dev-glyph-glyph-regexp glyph-str)
+ (setq glyph-str
+ (replace-match (gethash (match-string 0 glyph-str)
+ dev-glyph-glyph-hash)
+ nil t glyph-str))
+ (if (and (> cons-num 1)
+ (string-match dev-glyph-glyph-2-regexp glyph-str))
+ (setq glyph-str
+ (replace-match (gethash (match-string 0 glyph-str)
+ dev-glyph-glyph-2-hash)
+ nil t glyph-str))))
+ ;;; *** glyph reordering ***
+ ;; Cut glyph-str into blocks.  A block ends at the first occurrence
+ ;; of the glyph that is also appended for a preserved final halant,
+ ;; or, when there is none, at the last glyph of the string.  The
+ ;; loop stops once glyph-str is empty.
+ (while (setq split-pos (string-match "\e$,4""\e(B\\|.$" glyph-str))
+ (setq glyph-block (substring glyph-str 0 (1+ split-pos)))
+ (setq glyph-str (substring glyph-str (1+ split-pos)))
+ ;; Sort the glyphs of the block by `composition-order'.  A block
+ ;; matching `dev-glyph-right-modifier-regexp' is sorted in plain
+ ;; ascending order; in any other block the glyphs of order 2 are
+ ;; moved behind all the others.
+ (setq
+ glyph-block
+ (if (string-match dev-glyph-right-modifier-regexp glyph-block)
+ (sort (string-to-list glyph-block)
+ (function (lambda (x y)
+ (< (get-char-code-property x 'composition-order)
+ (get-char-code-property y 'composition-order)))))
+ (sort (string-to-list glyph-block)
+ (function (lambda (x y)
+ (let ((xo (get-char-code-property x 'composition-order))
+ (yo (get-char-code-property y 'composition-order)))
+ (if (= xo 2) nil (if (= yo 2) t (< xo yo)))))))))
+ (setq glyph-str-list (nconc glyph-str-list glyph-block)))
+ ;; concatenate and attach reference-points.
+ ;; Each glyph is preceded by its reference point; `cdr' then drops
+ ;; the reference point of the first glyph, so that the list reads
+ ;; GLYPH REF GLYPH REF ... GLYPH.
+ (setq glyph-str
+ (cdr
+ (apply
+ 'nconc
+ (mapcar
+ (function (lambda (x)
+ (list
+ (or (get-char-code-property x 'reference-point)
+ '(5 . 3) ;; default reference point.
+ )
+ x)))
+ glyph-str-list))))))
+ ;; Compose the original, un-narrowed region with the glyph list.
+ (compose-region from to glyph-str)))
+
+;; Announce the feature so that (require 'devan-util) succeeds.
+(provide 'devan-util)