Commit | Line | Data |
---|---|---|
c7211fed | 1 | ;;; titdic-cnv.el --- convert cxterm dictionary (TIT format) to Quail package -*- coding:iso-2022-7bit; -*- |
4ed46869 | 2 | |
73b0cd50 | 3 | ;; Copyright (C) 1997-1998, 2000-2011 Free Software Foundation, Inc. |
7976eda0 | 4 | ;; Copyright (C) 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004, |
5df4f04c | 5 | ;; 2005, 2006, 2007, 2008, 2009, 2010, 2011 |
2fd125a3 KH |
6 | ;; National Institute of Advanced Industrial Science and Technology (AIST) |
7 | ;; Registration Number H14PRO021 | |
8f924df7 KH |
8 | ;; Copyright (C) 2003 |
9 | ;; National Institute of Advanced Industrial Science and Technology (AIST) | |
10 | ;; Registration Number H13PRO009 | |
4ed46869 KH |
11 | |
12 | ;; Keywords: Quail, TIT, cxterm | |
13 | ||
14 | ;; This file is part of GNU Emacs. | |
15 | ||
4936186e | 16 | ;; GNU Emacs is free software: you can redistribute it and/or modify |
4ed46869 | 17 | ;; it under the terms of the GNU General Public License as published by |
4936186e GM |
18 | ;; the Free Software Foundation, either version 3 of the License, or |
19 | ;; (at your option) any later version. | |
4ed46869 KH |
20 | |
21 | ;; GNU Emacs is distributed in the hope that it will be useful, | |
22 | ;; but WITHOUT ANY WARRANTY; without even the implied warranty of | |
23 | ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
24 | ;; GNU General Public License for more details. | |
25 | ||
26 | ;; You should have received a copy of the GNU General Public License | |
4936186e | 27 | ;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>. |
4ed46869 | 28 | |
60370d40 | 29 | ;;; Commentary: |
4ed46869 | 30 | |
49ed466f | 31 | ;; Convert cxterm dictionary (of TIT format) to quail-package. |
4ed46869 KH |
32 | ;; |
33 | ;; Usage (within Emacs): | |
49ed466f | 34 | ;; M-x titdic-convert<CR>CXTERM-DICTIONARY-NAME<CR> |
4ed46869 | 35 | ;; Usage (from shell): |
49ed466f | 36 | ;; % emacs -batch -l titdic-cnv -f batch-titdic-convert\ |
4ed46869 KH |
37 | ;; [-dir DIR] [DIR | FILE] ... |
38 | ;; | |
39 | ;; When you run titdic-convert within Emacs, you have a chance to | |
40 | ;; modify arguments of `quail-define-package' before saving the | |
41 | ;; converted file. For instance, you are likely to modify TITLE, | |
42 | ;; DOCSTRING, and KEY-BINDINGS. | |
43 | ||
49ed466f | 44 | ;; A cxterm dictionary file (*.tit) is a line-oriented text (English, |
4ed46869 KH |
45 | ;; Chinese, Japanese, and Korean) file. The whole file consists of |
46 | ;; two parts, the definition part (`header' hereafter) followed by | |
47 | ;; the dictionary part (`body' hereafter). All lines beginning with | |
48 | ;; a leading '#' are ignored. | |
49 | ;; | |
50 | ;; Each line in the header part has two fields, KEY and VALUE. These | |
51 | ;; fields are separated by one or more whitespace characters. | |
52 | ;; | |
53 | ;; Each line in the body part has two fields, KEYSEQ and TRANSLATIONS. | |
54 | ;; These fields are separated by one or more whitespace characters. | |
55 | ;; | |
56 | ;; See the manual page of `tit2cit' in the cxterm distribution for more | |
57 | ;; details. | |
c063e381 | 58 | ;; |
b138056a | 59 | ;; Near the end of this file, we also have a few other tools to convert |
c063e381 | 60 | ;; miscellaneous dictionaries. |
4ed46869 KH |
61 | |
62 | ;;; Code: | |
63 | ||
64 | (require 'quail) | |
65 | ||
49ed466f | 66 | ;; Alist mapping each value of the TIT header key "ENCODE:" to the Emacs |
4ed46869 KH |
67 | ;; coding system and language environment name, as (ENCODE CODING-SYSTEM LANGUAGE-ENVIRONMENT). |
68 | (defvar tit-encode-list | |
a7f2c216 KH |
69 | '(("GB" euc-china "Chinese-GB") |
70 | ("BIG5" cn-big5 "Chinese-BIG5") | |
71 | ("JIS" euc-japan "Japanese") | |
49ed466f KH |
72 | ("KS" euc-kr "Korean"))) |
73 | ||
4558e816 KH |
74 | ;; Alist of input method names and the corresponding title and extra |
75 | ;; docstring. For each input method generated from a TIT dictionary, | |
76 | ;; a docstring is automatically generated from the comments in the | |
77 | ;; dictionary. The extra docstring in this alist adds more | |
78 | ;; information. | |
79 | ;; The command describe-input-method shows the automatically generated | |
c7211fed | 80 | ;; docstring, then an extra docstring while replacing the form \<VAR> |
4558e816 KH |
81 | ;; by the value of variable VAR. For instance, the form |
82 | ;; \<quail-translation-docstring> is replaced by a description about | |
83 | ;; how to select a translation from a list of candidates. | |
84 | ||
6b1e079c KH |
85 | (defvar quail-cxterm-package-ext-info |
86 | '(("chinese-4corner" "\e$(0(?-F\e(B") | |
87 | ("chinese-array30" "\e$(0#R#O\e(B") | |
4558e816 KH |
88 | ("chinese-ccdospy" "\e$AKuF4\e(B" |
89 | "Pinyin base input method for Chinese charset GB2312 \(`chinese-gb2312'). | |
90 | ||
c7211fed | 91 | Pinyin is the standard Roman transliteration method for Chinese. |
4558e816 KH |
92 | For the detail of Pinyin system, see the documentation of the input |
93 | method `chinese-py'. | |
94 | ||
95 | This input method works almost the same way as `chinese-py'. The | |
96 | difference is that you type a single key for these Pinyin spelling. | |
97 | Pinyin: zh en eng ang ch an ao ai ong sh ing yu(\e$A(9\e(B) | |
98 | keyseq: a f g h i j k l s u y v | |
c7211fed | 99 | For example: |
4558e816 KH |
100 | Chinese: \e$A0!\e(B \e$A9{\e(B \e$AVP\e(B \e$AND\e(B \e$A9b\e(B \e$ASq\e(B \e$AH+\e(B |
101 | Pinyin: a guo zhong wen guang yu quan | |
102 | Keyseq: a1 guo4 as1 wf4 guh1 yu..6 qvj6 | |
103 | ||
104 | \\<quail-translation-docstring> | |
105 | ||
106 | For double-width GB2312 characters correponding to ASCII, use the | |
107 | input method `chinese-qj'.") | |
108 | ||
4558e816 | 109 | ("chinese-ecdict" "\e$(05CKH\e(B" |
c0943d3d | 110 | "In this input method, you enter a Chinese (Big5) character or word |
4558e816 KH |
111 | by typing the corresponding English word. For example, if you type |
112 | \"computer\", \"\e$(0IZH+\e(B\" is input. | |
113 | ||
114 | \\<quail-translation-docstring>") | |
115 | ||
116 | ("chinese-etzy" "\e$(06/0D\e(B" | |
117 | "Zhuyin base input method for Chinese Big5 characters (`chinese-big5-1', | |
118 | `chinese-big5-2'). | |
119 | ||
120 | Zhuyin is a kind of phonetic symbol. One to three Zhuyin symbols | |
121 | compose one Chinese character. | |
122 | ||
123 | In this input method, you enter a Chinese character by first typing | |
124 | keys corresponding to Zhuyin symbols (see the above table) followed by | |
125 | SPC, 1, 2, 3, or 4 specifing a tone (SPC:\e$(0?v(N\e(B, 1:\e$(0M=Vy\e(B, 2:\e$(0Dm(N\e(B, 3: \e$(0&9Vy\e(B, | |
126 | 4:\e$(0(+Vy\e(B). | |
127 | ||
128 | \\<quail-translation-docstring>") | |
6b1e079c KH |
129 | |
130 | ("chinese-punct-b5" "\e$(0O:\e(BB" | |
131 | "Input method for Chinese punctuations and symbols of Big5 | |
132 | \(`chinese-big5-1' and `chinese-big5-2').") | |
133 | ||
134 | ("chinese-punct" "\e$A1j\e(BG" | |
135 | "Input method for Chinese punctuations and symbols of GB2312 | |
136 | \(`chinese-gb2312').") | |
137 | ||
138 | ("chinese-py-b5" "\e$(03<\e(BB" | |
139 | "Pinyin base input method for Chinese Big5 characters | |
140 | \(`chinese-big5-1', `chinese-big5-2'). | |
141 | ||
142 | This input method works almost the same way as `chinese-py' (which | |
143 | see). | |
144 | ||
145 | This input method supports only Han characters. The more convenient | |
43b11fee EZ |
146 | method is `chinese-py-punct-b5', which is the combination of this |
147 | method and `chinese-punct-b5' and which supports both Han characters | |
148 | and punctuation/symbols. | |
6b1e079c | 149 | |
43b11fee | 150 | For double-width Big5 characters corresponding to ASCII, use the input |
6b1e079c KH |
151 | method `chinese-qj-b5'. |
152 | ||
153 | The input method `chinese-py' and `chinese-tonepy' are also Pinyin | |
43b11fee | 154 | based, but for the character set GB2312 (`chinese-gb2312').") |
6b1e079c | 155 | |
4558e816 KH |
156 | ("chinese-qj-b5" "\e$(0)A\e(BB") |
157 | ||
158 | ("chinese-qj" "\e$AH+\e(BG") | |
159 | ||
6b1e079c | 160 | ("chinese-sw" "\e$AJWN2\e(B" |
4558e816 KH |
161 | "Radical base input method for Chinese charset GB2312 (`chinese-gb2312'). |
162 | ||
d20faceb EZ |
163 | In this input method, you enter a Chinese character by typing two |
164 | keys. The first key corresponds to the first (\e$AJW\e(B) radical, the second | |
165 | key corresponds to the last (\e$AN2\e(B) radical. The correspondence of keys | |
166 | and radicals is as below: | |
4558e816 KH |
167 | |
168 | first radical: | |
169 | a b c d e f g h i j k l m n o p q r s t u v w x y z | |
a1506d29 | 170 | \e$APD\e(B \e$AZ"\e(B \e$AJ,\e(B \e$AX<\e(B \e$A;p\e(B \e$A?Z\e(B \e$A^P\e(B \e$Ac_\e(B \e$AZ%\e(B \e$A\3\e(B \e$AXi\e(B \e$AD>\e(B \e$Alj\e(B \e$Ab;\e(B \e$ATB\e(B \e$Afy\e(B \e$AJ/\e(B \e$AMu\e(B \e$A0K\e(B \e$AX/\e(B \e$AHU\e(B \e$AeA\e(B \e$Aak\e(B \e$AVq\e(B \e$AR;\e(B \e$AHK\e(B |
4558e816 KH |
171 | last radical: |
172 | a b c d e f g h i j k l m n o p q r s t u v w x y z | |
a1506d29 | 173 | \e$ASV\e(B \e$AI=\e(B \e$AMA\e(B \e$A56\e(B \e$AZb\e(B \e$A?Z\e(B \e$ARB\e(B \e$Aqb\e(B \e$A4s\e(B \e$A6!\e(B \e$A[L\e(B \e$Ala\e(B \e$AJ.\e(B \e$A4u\e(B \e$AXg\e(B \e$ACE\e(B \e$A=q\e(B \e$AX-\e(B \e$AE.\e(B \e$ARR\e(B \e$A`m\e(B \e$AP!\e(B \e$A3'\e(B \e$A3f\e(B \e$A_.\e(B \e$A27\e(B |
4558e816 | 174 | |
43e5a7fe | 175 | \\<quail-translation-docstring>") |
4558e816 | 176 | |
6b1e079c KH |
177 | ("chinese-tonepy" "\e$A5wF4\e(B" |
178 | "Pinyin base input method for Chinese charset GB2312 (`chinese-gb2312'). | |
179 | ||
c3ff164a | 180 | Pinyin is the standard roman transliteration method for Chinese. |
d20faceb | 181 | For the details of Pinyin system, see the documentation of the input |
6b1e079c KH |
182 | method `chinese-py'. |
183 | ||
184 | This input method works almost the same way as `chinese-py'. The | |
4558e816 KH |
185 | difference is that you must type 1..5 after each Pinyin spelling to |
186 | specify a tone (1:\e$ARuF=\e(B, 2:\e$AQtF=\e(B, 3:\e$AIOIy\e(B, 4\e$AOBIy\e(B, 5:\e$AGaIy\e(B). | |
187 | ||
43e5a7fe | 188 | \\<quail-translation-docstring> |
4558e816 KH |
189 | |
190 | For instance, to input \e$ADc\e(B, you type \"n i 3 3\", the first \"n i\" is | |
191 | a Pinyin, the next \"3\" specifies tone, and the last \"3\" selects | |
192 | the third character from the candidate list. | |
6b1e079c KH |
193 | |
194 | For double-width GB2312 characters correponding to ASCII, use the | |
195 | input method `chinese-qj'.") | |
196 | ||
4558e816 KH |
197 | ("chinese-zozy" "\e$(0I\0D\e(B" |
198 | "Zhuyin base input method for Chinese Big5 characters (`chinese-big5-1', | |
199 | `chinese-big5-2'). | |
200 | ||
d20faceb | 201 | Zhuyin is a kind of a phonetic symbol. One to three Zhuyin symbols |
4558e816 KH |
202 | compose a Chinese character. |
203 | ||
204 | In this input method, you enter a Chinese character by first typing | |
205 | keys corresponding to Zhuyin symbols (see the above table) followed by | |
206 | SPC, 6, 3, 4, or 7 specifing a tone (SPC:\e$(0?v(N\e(B, 6:\e$(0Dm(N\e(B, 3:\e$(0&9Vy\e(B, 4:\e$(0(+Vy\e(B, | |
207 | 7:\e$(0M=Vy\e(B). | |
208 | ||
43e5a7fe | 209 | \\<quail-translation-docstring>"))) |
4ed46869 KH |
210 | |
211 | ;; Return the value found at point on the current line: the run of non-whitespace characters there is read as a Lisp string, so backslash escapes in it are interpreted. Return nil if no such run starts at point. | |
212 | (defsubst tit-read-key-value () | |
6b61353c | 213 | (if (looking-at "[^ \t\r\n]+") |
4ed46869 KH |
214 | (car (read-from-string (concat "\"" (match-string 0) "\""))))) |
215 | ||
216 | ;; Return the Quail package file name for FILENAME (a TIT dictionary file name), expanded relative to DIRNAME when it is given. | |
49ed466f KH |
217 | ;; The last four characters of FILENAME (expected to be the ".tit" extension) are dropped unconditionally. For instance, ".../ZOZY.tit" -> "ZOZY.el". |
218 | (defun tit-make-quail-package-file-name (filename &optional dirname) | |
4ed46869 | 219 | (expand-file-name |
49ed466f | 220 | (concat (file-name-nondirectory (substring filename 0 -4)) ".el") |
4ed46869 KH |
221 | dirname)) |
222 | ||
1375754c | 223 | ;; `tit-dictionary' is nil if we are processing a phrase dictionary (BEGINPHRASE) and non-nil for a character dictionary (BEGINDICTIONARY). `tit-encode' holds the ENCODE: value of the file being converted; `tit-default-encode' is used when the header has no ENCODE: line. |
8c1ccc6c | 224 | (defvar tit-dictionary t) |
4ed46869 KH |
225 | (defvar tit-encode nil) |
226 | (defvar tit-default-encode "GB") | |
227 | ||
228 | ;; Print elements of the KEY-BINDINGS arg for `quail-define-package' so | |
229 | ;; that each character in KEYS invokes FUNCTION-SYMBOL. A control character is emitted only when `quail-translation-keymap' binds it to `quail-execute-non-quail-command'; characters above 127 are skipped. | |
230 | (defun tit-generate-key-bindings (keys function-symbol) | |
231 | (let ((len (length keys)) | |
232 | (i 0) | |
1375754c | 233 | (first t) |
4ed46869 KH |
234 | key) |
235 | (while (< i len) | |
1375754c | 236 | (or first (princ "\n ")) |
4ed46869 | 237 | (setq key (aref keys i)) |
1375754c KH |
238 | (if (if (< key ?\ ) |
239 | (eq (lookup-key quail-translation-keymap | |
240 | (char-to-string key)) | |
4ed46869 | 241 | 'quail-execute-non-quail-command) |
1375754c KH |
242 | (<= key 127)) |
243 | (progn | |
244 | (princ (cons (cond ((< key ?\ ) (format "\"\\C-%c\"" (+ key ?@))) | |
245 | ((< key 127) (format "\"%c\"" key)) | |
246 | (t "\"\\C-?\"")) | |
247 | function-symbol)) | |
248 | (setq first nil))) | |
4ed46869 KH |
249 | (setq i (1+ i))))) |
250 | ||
251 | ;; Analyze the header part of the TIT dictionary in the accessible portion of the current buffer and print a file preamble followed by an appropriate | |
252 | ;; `quail-define-package' function call. FILENAME supplies the package name: "chinese-" plus its downcased base name minus the last four characters. | |
253 | (defun tit-process-header (filename) | |
254 | (message "Processing header part...") | |
255 | (goto-char (point-min)) | |
256 | ||
1375754c KH |
257 | ;; First, generate the header part of the Quail package while |
258 | ;; collecting information from the original header. | |
259 | (let ((package (concat | |
260 | "chinese-" | |
261 | (substring (downcase (file-name-nondirectory filename)) | |
262 | 0 -4))) | |
263 | ;; TIT keywords and the corresponding default values. | |
4ed46869 KH |
264 | (tit-multichoice t) |
265 | (tit-prompt "") | |
266 | (tit-comments nil) | |
267 | (tit-backspace "\010\177") | |
268 | (tit-deleteall "\015\025") | |
269 | (tit-moveright ".>") | |
270 | (tit-moveleft ",<") | |
271 | (tit-keyprompt nil)) | |
1375754c KH |
272 | |
273 | (princ ";; Quail package `") | |
98223b73 | 274 | (princ package) |
53cfe624 | 275 | (princ (format "' -*- coding:%s -*-\n" coding-system-for-write)) |
c7211fed | 276 | (princ ";; Generated by the command `titdic-convert'\n;;\tDate: ") |
1375754c KH |
277 | (princ (current-time-string)) |
278 | (princ "\n;;\tOriginal TIT dictionary file: ") | |
279 | (princ (file-name-nondirectory filename)) | |
280 | (princ "\n\n;;; Comment:\n\n") | |
86e4f7c0 | 281 | (princ ";; Byte-compile this file again after any modification.\n\n") |
1375754c KH |
282 | (princ ";;; Start of the header of original TIT dictionary.\n\n") |
283 | ||
4ed46869 | 284 | (while (not (eobp)) |
1375754c KH |
285 | (let ((ch (following-char)) |
286 | (pos (point))) | |
4ed46869 KH |
287 | (cond ((= ch ?C) ; COMMENT |
288 | (cond ((looking-at "COMMENT") | |
289 | (let ((pos (match-end 0))) | |
290 | (end-of-line) | |
8b735b2b KH |
291 | (setq tit-comments |
292 | (cons (buffer-substring-no-properties pos (point)) | |
293 | tit-comments)))))) | |
4ed46869 KH |
294 | ((= ch ?M) ; MULTICHOICE, MOVERIGHT, MOVELEFT |
295 | (cond ((looking-at "MULTICHOICE:[ \t]*") | |
296 | (goto-char (match-end 0)) | |
297 | (setq tit-multichoice (looking-at "YES"))) | |
298 | ((looking-at "MOVERIGHT:[ \t]*") | |
299 | (goto-char (match-end 0)) | |
300 | (setq tit-moveright (tit-read-key-value))) | |
301 | ((looking-at "MOVELEFT:[ \t]*") | |
302 | (goto-char (match-end 0)) | |
303 | (setq tit-moveleft (tit-read-key-value))))) | |
304 | ((= ch ?P) ; PROMPT | |
305 | (cond ((looking-at "PROMPT:[ \t]*") | |
306 | (goto-char (match-end 0)) | |
6b1e079c KH |
307 | (setq tit-prompt (tit-read-key-value)) |
308 | ;; Some TIT dictionaries that are encoded by | |
309 | ;; euc-china contain an invalid character at the tail. NOTE(review): this assumes PROMPT: has a non-empty value; `tit-read-key-value' returns nil otherwise and the `aref' below would then signal an error -- confirm. | |
310 | (let* ((last (aref tit-prompt (1- (length tit-prompt)))) | |
311 | (split (split-char last))) | |
312 | (if (or (eq (nth 1 split) 32) | |
313 | (eq (nth 2 split) 32)) | |
314 | (setq tit-prompt (substring tit-prompt 0 -1))))))) | |
4ed46869 KH |
315 | ((= ch ?B) ; BACKSPACE, BEGINDICTIONARY, |
316 | ; BEGINPHRASE | |
317 | (cond ((looking-at "BACKSPACE:[ \t]*") | |
318 | (goto-char (match-end 0)) | |
319 | (setq tit-backspace (tit-read-key-value))) | |
320 | ((looking-at "BEGINDICTIONARY") | |
1375754c | 321 | (setq tit-dictionary t)) |
4ed46869 | 322 | ((looking-at "BEGINPHRASE") |
1375754c | 323 | (setq tit-dictionary nil)))) |
4ed46869 KH |
324 | ((= ch ?K) ; KEYPROMPT |
325 | (cond ((looking-at "KEYPROMPT(\\(.*\\)):[ \t]*") | |
326 | (let ((key-char (match-string 1))) | |
327 | (goto-char (match-end 0)) | |
1fa1e1f5 RS |
328 | (if (string-match "\\\\[0-9]+" key-char) |
329 | (setq key-char | |
330 | (car (read-from-string (format "\"%s\"" | |
331 | key-char))))) | |
4ed46869 KH |
332 | (setq tit-keyprompt |
333 | (cons (cons key-char (tit-read-key-value)) | |
1375754c KH |
334 | tit-keyprompt))))))) |
335 | (end-of-line) | |
336 | (princ ";; ") | |
8b735b2b | 337 | (princ (buffer-substring-no-properties pos (point))) |
1375754c KH |
338 | (princ "\n") |
339 | (forward-line 1))) | |
a1506d29 | 340 | |
1375754c KH |
341 | (princ "\n;;; End of the header of original TIT dictionary.\n\n") |
342 | (princ ";;; Code:\n\n(require 'quail)\n\n") | |
343 | ||
344 | (princ "(quail-define-package ") | |
345 | ;; Args NAME, LANGUAGE, TITLE | |
6b1e079c | 346 | (let ((title (nth 1 (assoc package quail-cxterm-package-ext-info)))) |
1375754c KH |
347 | (princ "\"") |
348 | (princ package) | |
349 | (princ "\" \"") | |
350 | (princ (nth 2 (assoc tit-encode tit-encode-list))) | |
351 | (princ "\" \"") | |
352 | (princ (or title | |
353 | (if (string-match "[:\e$A!K\e$(0!(!J\e(B]+\\([^:\e$A!K\e$(0!(!K\e(B]+\\)" tit-prompt) | |
354 | (substring tit-prompt (match-beginning 1) (match-end 1)) | |
355 | tit-prompt))) | |
356 | (princ "\"\n")) | |
4ed46869 KH |
357 | |
358 | ;; Arg GUIDANCE | |
359 | (if tit-keyprompt | |
360 | (progn | |
1375754c | 361 | (princ " '(") |
4ed46869 | 362 | (while tit-keyprompt |
1375754c KH |
363 | (princ " ") |
364 | (princ (format "(%d . \"%s\")\n" | |
365 | (string-to-char (car (car tit-keyprompt))) | |
366 | (cdr (car tit-keyprompt)))) | |
4ed46869 | 367 | (setq tit-keyprompt (cdr tit-keyprompt))) |
1375754c KH |
368 | (princ ")")) |
369 | (princ " t\n")) | |
4ed46869 KH |
370 | |
371 | ;; Arg DOCSTRING | |
6b1e079c KH |
372 | (let ((doc (concat tit-prompt "\n")) |
373 | (comments (if tit-comments | |
374 | (mapconcat 'identity (nreverse tit-comments) "\n"))) | |
375 | (doc-ext (nth 2 (assoc package quail-cxterm-package-ext-info)))) | |
376 | (if comments | |
377 | (setq doc (concat doc "\n" comments "\n"))) | |
378 | (if doc-ext | |
379 | (setq doc (concat doc "\n" doc-ext "\n"))) | |
380 | (prin1 doc) | |
381 | (terpri)) | |
4ed46869 KH |
382 | |
383 | ;; Arg KEY-BINDINGS | |
1375754c | 384 | (princ " '(") |
4ed46869 | 385 | (tit-generate-key-bindings tit-backspace 'quail-delete-last-char) |
1375754c | 386 | (princ "\n ") |
4ed46869 | 387 | (tit-generate-key-bindings tit-deleteall 'quail-abort-translation) |
1375754c | 388 | (princ "\n ") |
4ed46869 | 389 | (tit-generate-key-bindings tit-moveright 'quail-next-translation) |
1375754c | 390 | (princ "\n ") |
4ed46869 | 391 | (tit-generate-key-bindings tit-moveleft 'quail-prev-translation) |
1375754c | 392 | (princ ")\n") |
4ed46869 KH |
393 | |
394 | ;; Args FORGET-TRANSLATION, DETERMINISTIC, KBD-TRANSLATE, SHOW-LAYOUT. | |
395 | ;; The remaining args are all nil. NOTE(review): the GUIDANCE loop above has already consumed `tit-keyprompt' down to nil, so the last `princ' below always takes the " nil nil" branch -- confirm whether " t t" was intended for dictionaries that define KEYPROMPT entries. | |
1375754c KH |
396 | (princ " nil") |
397 | (princ (if tit-multichoice " nil" " t")) | |
398 | (princ (if tit-keyprompt " t t)\n\n" " nil nil)\n\n")))) | |
399 | ||
400 | (defsubst tit-flush-translations (key translations) | |
401 | (if (string-match "\\\\[0-9][0-9][0-9]" key) | |
402 | (let ((newkey (concat (substring key 0 (match-beginning 0)) | |
403 | (car (read-from-string | |
404 | (concat "\"" (match-string 0 key) "\""))))) | |
405 | (idx (match-end 0))) | |
406 | (while (string-match "\\\\[0-9][0-9][0-9]" key idx) | |
407 | (setq newkey (concat | |
408 | newkey | |
409 | (substring key idx (match-beginning 0)) | |
410 | (car (read-from-string | |
411 | (concat "\"" (match-string 0 key) "\""))))) | |
412 | (setq idx (match-end 0))) | |
413 | (setq key (concat newkey (substring key idx))))) | |
414 | (prin1 (list key (if tit-dictionary translations | |
415 | (vconcat (nreverse translations))))) | |
416 | (princ "\n")) | |
4ed46869 KH |
417 | |
418 | ;; Convert the body part of the TIT dictionary (from point to the end of the buffer) into a `quail-define-rules' | |
419 | ;; function call. Lines starting with `#' and empty lines are skipped. Translations of consecutive lines sharing the same key are accumulated and then printed by `tit-flush-translations' (defined just above), which also replaces each backslash-plus-three-digits escape in the key by reading it as a Lisp string escape and, for phrase dictionaries, emits the translations as a vector. | |
420 | (defun tit-process-body () | |
421 | (message "Formatting translation rules...") | |
1375754c KH |
422 | (let* ((template (list nil nil)) |
423 | (second (cdr template)) | |
424 | (prev-key "") | |
425 | ch key translations pos) | |
426 | (princ "(quail-define-rules\n") | |
4ed46869 | 427 | (while (null (eobp)) |
1375754c KH |
428 | (setq ch (following-char)) |
429 | (if (or (= ch ?#) (= ch ?\n)) | |
430 | (forward-line 1) | |
4ed46869 | 431 | (setq pos (point)) |
1375754c | 432 | (skip-chars-forward "^ \t\n") |
8b735b2b | 433 | (setq key (buffer-substring-no-properties pos (point))) |
4ed46869 | 434 | (skip-chars-forward " \t") |
1375754c KH |
435 | (setq ch (following-char)) |
436 | (if (or (= ch ?#) (= ch ?\n)) | |
08a1bf22 | 437 | ;; This entry contains no translations, so ignore it. |
1375754c KH |
438 | (forward-line 1) |
439 | (or (string= key prev-key) | |
08a1bf22 | 440 | (progn |
1375754c KH |
441 | (if translations |
442 | (tit-flush-translations prev-key translations)) | |
443 | (setq translations nil | |
444 | prev-key key))) | |
445 | (if tit-dictionary | |
446 | (progn | |
447 | (setq pos (point)) | |
448 | (skip-chars-forward "^ \t#\n") | |
449 | (setq translations | |
450 | (if translations | |
451 | (concat translations | |
8b735b2b KH |
452 | (buffer-substring-no-properties pos (point))) |
453 | (buffer-substring-no-properties pos (point))))) | |
1375754c KH |
454 | (while (not (eolp)) |
455 | (setq pos (point)) | |
456 | (skip-chars-forward "^ \t\n") | |
8b735b2b KH |
457 | (setq translations (cons (buffer-substring-no-properties |
458 | pos (point)) | |
1375754c KH |
459 | translations)) |
460 | (skip-chars-forward " \t") | |
461 | (setq ch (following-char)) | |
462 | (if (= ch ?#) (end-of-line)))) | |
08a1bf22 | 463 | (forward-line 1)))) |
1375754c KH |
464 | |
465 | (if translations | |
466 | (tit-flush-translations prev-key translations)) | |
467 | (princ ")\n"))) | |
4ed46869 KH |
468 | |
469 | ;;;###autoload | |
470 | (defun titdic-convert (filename &optional dirname) | |
471 | "Convert a TIT dictionary of FILENAME into a Quail package. | |
472 | Optional argument DIRNAME if specified is the directory name under which | |
473 | the generated Quail package is saved." | |
474 | (interactive "FTIT dictionary file: ") | |
98223b73 | 475 | (let ((coding-system-for-write nil)) |
c7211fed | 476 | (with-temp-file (tit-make-quail-package-file-name filename dirname) |
c7211fed DL |
477 | (let ((standard-output (current-buffer))) |
478 | (with-temp-buffer | |
479 | (set-buffer-multibyte nil) | |
f9362982 KH |
480 | ;; Here we must use `raw-text' instead of `no-conversion' to |
481 | ;; enable auto-decoding of the eol format (CRLF->LF). | |
482 | (let ((coding-system-for-read 'raw-text)) | |
c7211fed | 483 | (insert-file-contents (expand-file-name filename))) |
a1506d29 | 484 | |
c7211fed DL |
485 | ;; Decode the buffer contents from the encoding specified by the |
486 | ;; value of the key "ENCODE:", or by `tit-default-encode' when the header has no such key. | |
487 | (if (not (search-forward "\nBEGIN" nil t)) | |
488 | (error "TIT dictionary doesn't have body part")) | |
489 | (let ((limit (point)) | |
490 | coding-system slot) | |
491 | (goto-char (point-min)) | |
492 | (if (re-search-forward "^ENCODE:[ \t]*" limit t) | |
493 | (progn | |
494 | (goto-char (match-end 0)) | |
495 | (setq tit-encode (tit-read-key-value))) | |
496 | (setq tit-encode tit-default-encode)) | |
497 | (setq slot (assoc tit-encode tit-encode-list)) | |
498 | (if (not slot) | |
499 | (error "Invalid ENCODE: value in TIT dictionary")) | |
500 | (setq coding-system (nth 1 slot)) | |
501 | (message "Decoding with coding system %s..." coding-system) | |
502 | (goto-char (point-min)) | |
98223b73 | 503 | (decode-coding-region (point-min) (point-max) coding-system) |
f9362982 KH |
504 | ;; Explicitly set the eol format of the output file to `unix'. |
505 | (setq coding-system-for-write | |
506 | (coding-system-change-eol-conversion coding-system 'unix)) | |
98223b73 | 507 | (remove-text-properties (point-min) (point-max) '(charset nil))) |
c7211fed | 508 | |
66b820ba | 509 | (set-buffer-multibyte t) |
c7211fed | 510 | ;; Set point to the starting position of the body part. |
1375754c | 511 | (goto-char (point-min)) |
c7211fed DL |
512 | (if (not (search-forward "\nBEGIN" nil t)) |
513 | (error "TIT dictionary can't be decoded correctly")) | |
514 | ||
2db18278 | 515 | ;; Process the header part; the buffer is narrowed to everything up to and including the BEGIN... line. |
c7211fed DL |
516 | (forward-line 1) |
517 | (narrow-to-region (point-min) (point)) | |
518 | (tit-process-header filename) | |
519 | (widen) | |
520 | ||
8f924df7 | 521 | ;; Process the body part, starting from where the header processing left point. |
c7211fed | 522 | (tit-process-body)))))) |
4ed46869 KH |
523 | |
524 | ;;;###autoload | |
44cbfae9 | 525 | (defun batch-titdic-convert (&optional force) |
4ed46869 KH |
526 | "Run `titdic-convert' on the files remaining on the command line. |
527 | Use this from the command line, with `-batch'; | |
528 | it won't work in an interactive Emacs. | |
529 | For example, invoke \"emacs -batch -f batch-titdic-convert XXX.tit\" to | |
530 | generate Quail package file \"xxx.el\" from TIT dictionary file \"XXX.tit\". | |
531 | To get complete usage, invoke \"emacs -batch -f batch-titdic-convert -h\"." | |
532 | (defvar command-line-args-left) ; Declared here only to avoid a byte-compiler warning. | |
533 | (if (not noninteractive) | |
534 | (error "`batch-titdic-convert' should be used only with -batch")) | |
535 | (if (string= (car command-line-args-left) "-h") | |
536 | (progn | |
537 | (message "To convert XXX.tit and YYY.tit into xxx.el and yyy.el:") | |
538 | (message " %% emacs -batch -l titdic-cnv -f batch-titdic-convert XXX.tit YYY.tit") | |
539 | (message "To convert XXX.tit into DIR/xxx.el:") | |
540 | (message " %% emacs -batch -l titdic-cnv -f batch-titdic-convert -dir DIR XXX.tit")) | |
541 | (let (targetdir filename files file) | |
542 | (if (string= (car command-line-args-left) "-dir") | |
543 | (progn | |
544 | (setq command-line-args-left (cdr command-line-args-left)) | |
545 | (setq targetdir (car command-line-args-left)) | |
546 | (setq command-line-args-left (cdr command-line-args-left)))) | |
547 | (while command-line-args-left | |
548 | (setq filename (expand-file-name (car command-line-args-left))) | |
549 | (if (file-directory-p filename) | |
550 | (progn | |
551 | (message "Converting all tit files in the directory %s" filename) | |
552 | (setq files (directory-files filename t "\\.tit$"))) | |
553 | (setq files (list filename))) | |
554 | (while files | |
555 | (setq file (expand-file-name (car files))) | |
44cbfae9 KH |
556 | (when (or force |
557 | (file-newer-than-file-p | |
558 | file (tit-make-quail-package-file-name file targetdir))) | |
559 | (message "Converting %s to quail-package..." file) | |
560 | (titdic-convert file targetdir)) | |
4ed46869 KH |
561 | (setq files (cdr files))) |
562 | (setq command-line-args-left (cdr command-line-args-left))) | |
86e4f7c0 | 563 | (message "Byte-compile the created files by:") |
4ed46869 KH |
564 | (message " %% emacs -batch -f batch-byte-compile XXX.el"))) |
565 | (kill-emacs 0)) | |
566 | ||
c063e381 KH |
567 | \f |
568 | ;;; Converter of miscellaneous dictionaries other than TIT format. | |
569 | ||
570 | ;; Alist of input method names and the corresponding information. | |
571 | ;; Each element has this form: | |
572 | ;; (INPUT-METHOD-NAME ;; Name of the input method. | |
a1506d29 | 573 | ;; INPUT-METHOD-TITLE ;; Title string of the input method |
c063e381 KH |
574 | ;; DICFILE ;; Name of the source dictionary file. |
575 | ;; CODING ;; Coding system of the dictionary file. | |
576 | ;; QUAILFILE ;; Name of the Quail package file. | |
577 | ;; CONVERTER ;; Function to generate the Quail package. | |
578 | ;; COPYRIGHT-NOTICE ;; Copyright notice of the source dictionary. | |
579 | ;; ) | |
580 | ||
581 | (defvar quail-misc-package-ext-info | |
582 | '(("chinese-b5-tsangchi" "\e$(06A\e(BB" | |
a1506d29 | 583 | "cangjie-table.b5" big5 "tsang-b5.el" |
c063e381 KH |
584 | tsang-b5-converter |
585 | "\ | |
586 | ;; # Copyright 2001 Christian Wittern <wittern@iis.sinica.edu.tw> | |
587 | ;; # | |
588 | ;; # Permission to copy and distribute both modified and | |
589 | ;; # unmodified versions is granted without royalty provided | |
590 | ;; # this notice is preserved.") | |
591 | ||
592 | ("chinese-b5-quick" "\e$(0X|\e(BB" | |
a1506d29 | 593 | "cangjie-table.b5" big5 "quick-b5.el" |
c063e381 KH |
594 | quick-b5-converter |
595 | "\ | |
596 | ;; # Copyright 2001 Christian Wittern <wittern@iis.sinica.edu.tw> | |
597 | ;; # | |
598 | ;; # Permission to copy and distribute both modified and | |
599 | ;; # unmodified versions is granted without royalty provided | |
600 | ;; # this notice is preserved.") | |
601 | ||
602 | ("chinese-cns-tsangchi" "\e$(GT?\e(BC" | |
603 | "cangjie-table.cns" iso-2022-cn-ext "tsang-cns.el" | |
604 | tsang-cns-converter | |
605 | "\ | |
606 | ;; # Copyright 2001 Christian Wittern <wittern@iis.sinica.edu.tw> | |
607 | ;; # | |
608 | ;; # Permission to copy and distribute both modified and | |
609 | ;; # unmodified versions is granted without royalty provided | |
610 | ;; # this notice is preserved.") | |
611 | ||
612 | ("chinese-cns-quick" "\e$(Gv|\e(BC" | |
613 | "cangjie-table.cns" iso-2022-cn-ext "quick-cns.el" | |
614 | quick-cns-converter | |
615 | "\ | |
616 | ;; # Copyright 2001 Christian Wittern <wittern@iis.sinica.edu.tw> | |
617 | ;; # | |
618 | ;; # Permission to copy and distribute both modified and | |
619 | ;; # unmodified versions is granted without royalty provided | |
620 | ;; # this notice is preserved.") | |
621 | ||
622 | ("chinese-py" "\e$AF4\e(BG" | |
623 | "pinyin.map" cn-gb-2312 "PY.el" | |
624 | py-converter | |
625 | "\ | |
626 | ;; \"pinyin.map\" is included in a free package called CCE. It is | |
627 | ;; available at: | |
628 | ;; http://ftp.debian.org/debian/dists/potato/main | |
629 | ;; /source/utils/cce_0.36.orig.tar.gz | |
630 | ;; This package contains the following copyright notice. | |
631 | ;; | |
632 | ;; | |
633 | ;; Copyright (C) 1999, Rui He, herui@cs.duke.edu | |
a1506d29 JB |
634 | ;; |
635 | ;; | |
c063e381 | 636 | ;; CCE(Console Chinese Environment) 0.32 |
a1506d29 JB |
637 | ;; |
638 | ;; CCE is free software; you can redistribute it and/or modify it under the | |
639 | ;; terms of the GNU General Public License as published by the Free Software | |
640 | ;; Foundation; either version 1, or (at your option) any later version. | |
641 | ;; | |
642 | ;; CCE is distributed in the hope that it will be useful, but WITHOUT ANY | |
643 | ;; WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS | |
644 | ;; FOR A PARTICULAR PURPOSE. See the GNU General Public License for more | |
645 | ;; details. | |
646 | ;; | |
c063e381 | 647 | ;; You should have received a copy of the GNU General Public License along with |
a1506d29 | 648 | ;; CCE; see the file COPYING. If not, write to the Free Software Foundation, |
3ef97fb6 | 649 | ;; 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.") |
c063e381 KH |
650 | |
651 | ("chinese-ziranma" "\e$AWTH;\e(B" | |
652 | "ziranma.cin" cn-gb-2312 "ZIRANMA.el" | |
653 | ziranma-converter | |
654 | "\ | |
655 | ;; \"ziranma.cin\" is included in a free package called CCE. It is | |
656 | ;; available at: | |
657 | ;; http://ftp.debian.org/debian/dists/potato/main | |
658 | ;; /source/utils/cce_0.36.orig.tar.gz | |
659 | ;; This package contains the following copyright notice. | |
660 | ;; | |
661 | ;; | |
662 | ;; Copyright (C) 1999, Rui He, herui@cs.duke.edu | |
a1506d29 JB |
663 | ;; |
664 | ;; | |
c063e381 | 665 | ;; CCE(Console Chinese Environment) 0.32 |
a1506d29 JB |
666 | ;; |
667 | ;; CCE is free software; you can redistribute it and/or modify it under the | |
668 | ;; terms of the GNU General Public License as published by the Free Software | |
669 | ;; Foundation; either version 1, or (at your option) any later version. | |
670 | ;; | |
671 | ;; CCE is distributed in the hope that it will be useful, but WITHOUT ANY | |
672 | ;; WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS | |
673 | ;; FOR A PARTICULAR PURPOSE. See the GNU General Public License for more | |
674 | ;; details. | |
675 | ;; | |
c063e381 | 676 | ;; You should have received a copy of the GNU General Public License along with |
a1506d29 | 677 | ;; CCE; see the file COPYING. If not, write to the Free Software Foundation, |
3ef97fb6 | 678 | ;; 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.") |
a4c4011b | 679 | |
a4c4011b AC |
680 | ("chinese-ctlau" "\e$AAuTA\e(B" |
681 | "CTLau.html" cn-gb-2312 "CTLau.el" | |
682 | ctlau-gb-converter | |
683 | "\ | |
684 | ;; \"CTLau.html\" is available at: | |
685 | ;; | |
686 | ;; http://umunhum.stanford.edu/~lee/chicomp/CTLau.html | |
687 | ;; | |
688 | ;; It contains the following copyright notice: | |
689 | ;; | |
690 | ;; # Copyright (C) 1988-2001 Fung Fung Lee (lee@umunhum.stanford.edu) | |
a1506d29 | 691 | ;; # |
a4c4011b AC |
692 | ;; # This program is free software; you can redistribute it and/or |
693 | ;; # modify it under the terms of the GNU General Public License | |
694 | ;; # as published by the Free Software Foundation; either version 2 | |
695 | ;; # of the License, or any later version. | |
a1506d29 | 696 | ;; # |
a4c4011b AC |
697 | ;; # This program is distributed in the hope that it will be useful, |
698 | ;; # but WITHOUT ANY WARRANTY; without even the implied warranty of | |
699 | ;; # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
700 | ;; # GNU General Public License for more details. | |
a1506d29 | 701 | ;; # |
a4c4011b AC |
702 | ;; # You should have received a copy of the GNU General Public License |
703 | ;; # along with this program; if not, write to the Free Software Foundation, | |
086add15 | 704 | ;; # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.") |
a4c4011b | 705 | |
e089be2d | 706 | ("chinese-ctlaub" "\e$(0N,Gn\e(B" |
2bef0948 | 707 | "CTLau-b5.html" big5 "CTLau-b5.el" |
a4c4011b AC |
708 | ctlau-b5-converter |
709 | "\ | |
710 | ;; \"CTLau-b5.html\" is available at: | |
711 | ;; | |
712 | ;; http://umunhum.stanford.edu/~lee/chicomp/CTLau-b5.html | |
713 | ;; | |
714 | ;; It contains the following copyright notice: | |
715 | ;; | |
716 | ;; # Copyright (C) 1988-2001 Fung Fung Lee (lee@umunhum.stanford.edu) | |
a1506d29 | 717 | ;; # |
a4c4011b AC |
718 | ;; # This program is free software; you can redistribute it and/or |
719 | ;; # modify it under the terms of the GNU General Public License | |
720 | ;; # as published by the Free Software Foundation; either version 2 | |
721 | ;; # of the License, or any later version. | |
a1506d29 | 722 | ;; # |
a4c4011b AC |
723 | ;; # This program is distributed in the hope that it will be useful, |
724 | ;; # but WITHOUT ANY WARRANTY; without even the implied warranty of | |
725 | ;; # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
726 | ;; # GNU General Public License for more details. | |
a1506d29 | 727 | ;; # |
a4c4011b AC |
728 | ;; # You should have received a copy of the GNU General Public License |
729 | ;; # along with this program; if not, write to the Free Software Foundation, | |
086add15 | 730 | ;; # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.") |
c063e381 KH |
731 | )) |
732 | ||
733 | ;; Generate a code of a Quail package in the current buffer from Tsang | |
734 | ;; dictionary in the buffer DICBUF. The input method name of the | |
735 | ;; Quail package is NAME, and the title string is TITLE. | |
736 | ||
0b381c7e | 737 | ;; If TSANG-P is non-nil, generate \e$(06AQo\e(B input method. Otherwise
c063e381 KH |
738 | ;; generate \e$(0X|/y\e(B (simple version of \e$(06AQo\e(B). If BIG5-P is non-nil, the |
739 | ;; input method is for inputting Big5 characters. Otherwise the input | |
740 | ;; method is for inputting CNS characters. | |
741 | ||
;; Append the remainder of a Quail package definition to the current
;; buffer, using the dictionary text held in buffer DICBUF.
;;
;; Steps, in order:
;;   1. Pick the title string from TSANG-P and BIG5-P and insert a doc
;;      string (Big5 or CNS wording, chosen by BIG5-P) with that title
;;      formatted into it twice.
;;   2. Insert the "." / "," translation-block key bindings and the
;;      opening of `quail-define-rules'.
;;   3. Scan DICBUF from the first occurrence of "A440", collecting
;;      translations per key in a hash table.
;;   4. Insert the collected rules sorted by key, then the punctuation
;;      rules (keys prefixed with "z"), then the closing paren.
;;
;; NAME and TITLE are accepted but not referenced in this body.
742 | (defun tsang-quick-converter (dicbuf name title tsang-p big5-p) | |
743 | (let ((fulltitle (if tsang-p (if big5-p "\e$(06AQo\e(B" "\e$(GT?on\e(B") | |
744 | (if big5-p "\e$(0X|/y\e(B" "\e$(Gv|Mx\e(B"))) | |
745 | dic) | |
746 | (goto-char (point-max)) | |
747 | (if big5-p | |
748 | (insert (format "\"\e$(0&d'GTT&,!J\e(B%s\e$(0!K\e(BBIG5 | |
749 | ||
750 | \e$(0KHM$\e(B%s\e$(0TT&,WoOu\e(B | |
751 | ||
752 | [Q \e$(0'D\e(B] [W \e$(0(q\e(B] [E \e$(0'V\e(B] [R \e$(0&H\e(B] [T \e$(0'>\e(B] [Y \e$(0&4\e(B] [U \e$(0&U\e(B] [I \e$(0'B\e(B] [O \e$(0&*\e(B] [P \e$(0'A\e(B] | |
753 | ||
754 | [A \e$(0'K\e(B] [S \e$(0&T\e(B] [D \e$(0'N\e(B] [F \e$(0'W\e(B] [G \e$(0&I\e(B] [H \e$(0*M\e(B] [J \e$(0&3\e(B] [L \e$(0&d\e(B] | |
a1506d29 | 755 |
c063e381 KH |
756 | [Z ] [X \e$(0[E\e(B] [C \e$(01[\e(B] [V \e$(0&M\e(B] [B \e$(0'M\e(B] [N \e$(0&_\e(B] [M \e$(0&"\e(B] |
757 | ||
758 | \\\\<quail-translation-docstring>\"\n" | |
759 | fulltitle fulltitle)) | |
760 | (insert (format "\"\e$(GDcEFrSD+!J\e(B%s\e$(G!K\e(BCNS | |
761 | ||
762 | \e$(GiGk#\e(B%s\e$(GrSD+uomu\e(B | |
763 | ||
764 | [Q \e$(GEC\e(B] [W \e$(GFp\e(B] [E \e$(GEU\e(B] [R \e$(GDG\e(B] [T \e$(GE=\e(B] [Y \e$(GD3\e(B] [U \e$(GDT\e(B] [I \e$(GEA\e(B] [O \e$(GD)\e(B] [P \e$(GE@\e(B] | |
765 | ||
766 | [A \e$(GEJ\e(B] [S \e$(GDS\e(B] [D \e$(GEM\e(B] [F \e$(GEV\e(B] [G \e$(GDH\e(B] [H \e$(GHL\e(B] [J \e$(GD2\e(B] [L \e$(GDc\e(B] | |
a1506d29 JB |
767 |
768 | [Z ] [X \e$(GyE\e(B] [C \e$(GOZ\e(B] [V \e$(GDL\e(B] [B \e$(GEL\e(B] [N \e$(GD^\e(B] [M \e$(GD!\e(B] | |
c063e381 KH |
769 |
770 | \\\\<quail-translation-docstring>\"\n" | |
771 | fulltitle fulltitle))) | |
772 | (insert " '((\".\" . quail-next-translation-block) | |
773 | (\",\" . quail-prev-translation-block)) | |
774 | nil nil)\n\n") | |
775 | (insert "(quail-define-rules\n") | |
;; Build the KEY -> TRANSLATIONS table from DICBUF.  Point in DICBUF
;; is moved and not restored.
9a529312 | 776 | (with-current-buffer dicbuf |
6b61353c KH |
777 | ;; Handle double CR line ends, which result when checking out of |
778 | ;; CVS on MS-Windows. | |
779 | (goto-char (point-min)) | |
c063e381 KH |
780 | (search-forward "A440") |
781 | (beginning-of-line) | |
782 | (let ((table (make-hash-table :test 'equal)) | |
783 | val) | |
784 | (while (not (eobp)) | |
785 | (forward-char 5) | |
786 | (let ((trans (char-to-string (following-char))) | |
787 | key slot) | |
;; The key is the run of capital letters ending the line; `\r*'
;; tolerates any carriage returns before the line end.
8b735b2b | 788 | (re-search-forward "\\([A-Z]+\\)\r*$" nil t) |
c063e381 KH |
789 | (setq key (downcase |
790 | (if (or tsang-p | |
8b735b2b KH |
791 | (<= (- (match-end 1) (match-beginning 1)) 1)) |
792 | (match-string 1) | |
793 | (string (char-after (match-beginning 1)) | |
794 | (char-after (1- (match-end 1))))))) | |
;; Characters sharing a key are concatenated, earlier ones first.
c063e381 KH |
795 | (setq val (gethash key table)) |
796 | (if val (setq trans (concat val trans))) | |
797 | (puthash key trans table) | |
798 | (forward-line 1))) | |
799 | (maphash #'(lambda (key val) (setq dic (cons (cons key val) dic))) | |
800 | table))) | |
;; Emit the rules in `string<' order of their keys.
801 | (setq dic (sort dic (function (lambda (x y) (string< (car x ) (car y)))))) | |
802 | (dolist (elt dic) | |
803 | (insert (format "(%S\t%S)\n" (car elt) (cdr elt)))) | |
;; Each entry is (CHAR BIG5-STRING CNS-STRING); the rule key is "z"
;; followed by CHAR, and BIG5-P selects which string is emitted.
804 | (let ((punctuations '((";" "\e$(0!'!2!"!#!.!/\e(B" "\e$(G!'!2!"!#!.!/\e(B") | |
805 | (":" "\e$(0!(!+!3!%!$!&!0!1\e(B" "\e$(G!(!+!3!%!$!&!0!1\e(B") | |
806 | ("'" "\e$(0!e!d\e(B" "\e$(G!e!d\e(B") | |
807 | ("\"" "\e$(0!g!f!h!i!q\e(B" "\e$(G!g!f!h!i!q\e(B") | |
808 | ("\\" "\e$(0"`"b#M\e(B" "\e$(G"`"b#M\e(B") | |
809 | ("|" "\e$(0!6!8!:"^\e(B" "\e$(G!6!8!:"^\e(B") | |
810 | ("/" "\e$(0"_"a#L\e(B" "\e$(G"_"a#L\e(B") | |
811 | ("?" "\e$(0!)!4\e(B" "\e$(G!)!4\e(B") | |
812 | ("<" "\e$(0!R"6"A!T"H\e(B" "\e$(G!R"6"A!T"H\e(B") | |
813 | (">" "\e$(0!S"7"B!U\e(B" "\e$(G!S"7"B!U\e(B") | |
814 | ("[" "\e$(0!F!J!b!H!L!V!Z!X!\\e(B" "\e$(G!F!J!b!H!L!V!Z!X!\\e(B") | |
815 | ("]" "\e$(0!G!K!c!I!M!W![!Y!]\e(B" "\e$(G!G!K!c!I!M!W![!Y!]\e(B") | |
816 | ("{" "\e$(0!B!`!D\e(B " "\e$(G!B!`!D\e(B ") | |
817 | ("}" "\e$(0!C!a!E\e(B" "\e$(G!C!a!E\e(B") | |
818 | ("`" "\e$(0!j!k\e(B" "\e$(G!j!k\e(B") | |
819 | ("~" "\e$(0"D"+",!<!=\e(B" "\e$(G"D"+",!<!=\e(B") | |
820 | ("!" "\e$(0!*!5\e(B" "\e$(G!*!5\e(B") | |
821 | ("@" "\e$(0"i"n\e(B" "\e$(G"i"n\e(B") | |
822 | ("#" "\e$(0!l"-\e(B" "\e$(G!l"-\e(B") | |
823 | ("$" "\e$(0"c"l\e(B" "\e$(G"c"l\e(B") | |
824 | ("%" "\e$(0"h"m\e(B" "\e$(G"h"m\e(B") | |
825 | ("&" "\e$(0!m".\e(B" "\e$(G!m".\e(B") | |
826 | ("*" "\e$(0!n"/!o!w!x\e(B" "\e$(G!n"/!o!w!x\e(B") | |
827 | ("(" "\e$(0!>!^!@\e(B" "\e$(G!>!^!@\e(B") | |
828 | (")" "\e$(0!?!_!A\e(B" "\e$(G!?!_!A\e(B") | |
829 | ("-" "\e$(0!7!9"#"$"1"@\e(B" "\e$(G!7!9"#"$"1"@\e(B") | |
830 | ("_" "\e$(0"%"&\e(B" "\e$(G"%"&\e(B") | |
831 | ("=" "\e$(0"8"C\e(B" "\e$(G"8"C\e(B") | |
832 | ("+" "\e$(0"0"?\e(B" "\e$(G"0"?\e(B")))) | |
833 | (dolist (elt punctuations) | |
834 | (insert (format "(%S %S)\n" (concat "z" (car elt)) | |
835 | (if big5-p (nth 1 elt) (nth 2 elt)))))) | |
836 | (insert ")\n"))) | |
837 | ||
;; Thin wrapper: call `tsang-quick-converter' with TSANG-P = t and
;; BIG5-P = t, i.e. the full (non-quick) method for Big5 characters.
838 | (defun tsang-b5-converter (dicbuf name title) | |
839 | (tsang-quick-converter dicbuf name title t t)) | |
840 | ||
;; Thin wrapper: call `tsang-quick-converter' with TSANG-P = nil and
;; BIG5-P = t, i.e. the simplified (quick) method for Big5 characters.
841 | (defun quick-b5-converter (dicbuf name title) | |
842 | (tsang-quick-converter dicbuf name title nil t)) | |
843 | ||
;; Thin wrapper: call `tsang-quick-converter' with TSANG-P = t and
;; BIG5-P = nil, i.e. the full (non-quick) method for CNS characters.
844 | (defun tsang-cns-converter (dicbuf name title) | |
845 | (tsang-quick-converter dicbuf name title t nil)) | |
846 | ||
;; Thin wrapper: call `tsang-quick-converter' with TSANG-P = nil and
;; BIG5-P = nil, i.e. the simplified (quick) method for CNS characters.
847 | (defun quick-cns-converter (dicbuf name title) | |
848 | (tsang-quick-converter dicbuf name title nil nil)) | |
849 | ||
850 | ;; Generate a code of a Quail package in the current buffer from | |
851 | ;; Pinyin dictionary in the buffer DICBUF. The input method name of | |
852 | ;; the Quail package is NAME, and the title string is TITLE. | |
853 | ||
;; Append the remainder of a Quail package definition to the current
;; buffer from the Pinyin dictionary text in buffer DICBUF.
;;
;; Inserts, at the end of the buffer: the doc string (printed with
;; %S), the key bindings, and then a `quail-define-rules' form whose
;; body is produced by editing a copy of DICBUF's text in place.
;;
;; NAME and TITLE are accepted but not referenced in this body.
854 | (defun py-converter (dicbuf name title) | |
855 | (goto-char (point-max)) | |
856 | (insert (format "%S\n" "\e$A::WVJdHk!KF4Rt!K\e(B | |
857 | ||
858 | \e$AF4Rt7=08\e(B | |
859 | ||
860 | \e$AP!P4S"NDWVD84z1m!8F4Rt!97{:E#,\e(B \"u(yu) \e$ATrSC\e(B u: \e$A1mJ>!C\e(B | |
861 | ||
862 | Pinyin base input method for Chinese charset GB2312 (`chinese-gb2312'). | |
863 | ||
c3ff164a | 864 | Pinyin is the standard roman transliteration method for Chinese. |
c063e381 KH |
865 | Pinyin uses a sequence of Latin alphabetic characters for each Chinese |
866 | character. The sequence is made by the combination of the initials | |
867 | \(the beginning sounds) and finals (the ending sounds). | |
868 | ||
869 | initials: b p m f d t n l z c s zh ch sh r j q x g k h | |
870 | finals: a o e i er ai ei oa ou an en ang eng ong i ia iao ie iu ian in | |
871 | iang ing iong u ua uo uai ui uan un uan ueng yu yue yuan yun | |
872 | ||
873 | (Note: In the correct Pinyin writing, the sequence \"yu\" in the last | |
874 | four finals should be written by the character u-umlaut `\e$A(9\e(B'.) | |
875 | ||
876 | With this input method, you enter a Chinese character by first | |
877 | entering its pinyin spelling. | |
878 | ||
879 | \\<quail-translation-docstring> | |
880 | ||
881 | For instance, to input \e$ADc\e(B, you type \"n i C-n 3\". The first \"n i\" | |
882 | is a Pinyin, \"C-n\" selects the next group of candidates (each group | |
883 | contains at most 10 characters), \"3\" select the third character in | |
884 | that group. | |
885 | ||
886 | This input method supports only Han characters. The related input | |
887 | method `chinese-py-punct' is the combination of this method and | |
888 | `chinese-punct'; it supports both Han characters and punctuation | |
889 | characters. | |
890 | ||
891 | For double-width GB2312 characters corresponding to ASCII, use the | |
892 | input method `chinese-qj'. | |
893 | ||
894 | The correct Pinyin system specifies tones by diacritical marks, but | |
895 | this input method doesn't use them, which results in easy (you don't | |
896 | have to know the exact tones), but verbose (many characters are assigned | |
897 | to the same key sequence) input. You may also want to try the input | |
898 | method `chinese-tonepy' with which you must specify tones by digits | |
899 | \(1..5).")) | |
900 | (insert " '((\"\C-?\" . quail-delete-last-char) | |
901 | (\".\" . quail-next-translation) | |
902 | (\">\" . quail-next-translation) | |
903 | (\",\" . quail-prev-translation) | |
904 | (\"<\" . quail-prev-translation)) | |
905 | nil nil nil nil)\n\n") | |
906 | (insert "(quail-define-rules\n") | |
;; Copy the whole dictionary after the rules header, then rewrite the
;; copy line by line.  POS marks where the copied text starts.
907 | (let ((pos (point))) | |
8b735b2b | 908 | (insert-buffer-substring-no-properties dicbuf) |
c063e381 | 909 | (goto-char pos) |
;; Drop everything before the first line that starts with a lowercase
;; letter.  The search signals an error if there is no such line.
8c8d1081 | 910 | (re-search-forward "^[a-z]") |
7d15a839 KH |
911 | (beginning-of-line) |
912 | (delete-region pos (point)) | |
;; Turn each remaining line into ("KEY" "REST"): the key is the
;; leading run of a-z, the single character after it is removed, and
;; trailing carriage returns are stripped.
c063e381 KH |
913 | (while (not (eobp)) |
914 | (insert "(\"") | |
915 | (skip-chars-forward "a-z") | |
916 | (insert "\" \"") | |
917 | (delete-char 1) | |
918 | (end-of-line) | |
8b735b2b KH |
919 | (while (= (preceding-char) ?\r) |
920 | (delete-char -1)) | |
c063e381 KH |
921 | (insert "\")") |
922 | (forward-line 1))) | |
923 | (insert ")\n")) | |
924 | ||
925 | ;; Generate a code of a Quail package in the current buffer from | |
926 | ;; Ziranma dictionary in the buffer DICBUF. The input method name of | |
927 | ;; the Quail package is NAME, and the title string is TITLE. | |
928 | ||
;; Append the remainder of a Quail package definition to the current
;; buffer from the Ziranma dictionary text in buffer DICBUF.
;;
;; The dictionary is parsed first (in DICBUF, whose point is moved
;; and not restored) into an alist DIC of (KEY . TRANSLATION) sorted
;; by key.  After that the doc string, the key bindings and the
;; `quail-define-rules' form are inserted at the end of the current
;; buffer.
;;
;; NAME and TITLE are accepted but not referenced in this body.
929 | (defun ziranma-converter (dicbuf name title) | |
930 | (let (dic) | |
9a529312 | 931 | (with-current-buffer dicbuf |
c063e381 | 932 | (goto-char (point-min)) |
;; Entries start on the line after the one beginning "%keyname end".
8b735b2b KH |
933 | (search-forward "\n%keyname end") |
934 | (forward-line 1) | |
c063e381 KH |
935 | (let ((table (make-hash-table :test 'equal)) |
936 | elt pos key trans val) | |
;; Each line is KEY, blanks/tabs, then the translation running up to
;; the CR or LF.  Translations for one key accumulate in a vector.
937 | (while (not (eobp)) | |
938 | (setq pos (point)) | |
939 | (skip-chars-forward "^ \t") | |
8b735b2b | 940 | (setq key (buffer-substring-no-properties pos (point))) |
c063e381 | 941 | (skip-chars-forward " \t") |
8b735b2b KH |
942 | (setq pos (point)) |
943 | (skip-chars-forward "^\r\n") | |
944 | (setq trans (vector (buffer-substring-no-properties pos (point)))) | |
c063e381 KH |
945 | (setq val (gethash key table)) |
946 | (if val (setq trans (vconcat val trans))) | |
947 | (puthash key trans table) | |
948 | (forward-line 1)) | |
;; Simplify each value: a lone one-character translation becomes that
;; string; a vector made only of one-character strings becomes their
;; concatenation; anything else stays a vector.
949 | (maphash #'(lambda (key trans) | |
950 | (let ((len (length trans)) | |
951 | i) | |
952 | (if (and (= len 1) (= (length (aref trans 0)) 1)) | |
953 | (setq trans (aref trans 0)) | |
954 | (setq i 0) | |
955 | (while (and (< i len) | |
956 | (= (length (aref trans i)) 1)) | |
957 | (setq i (1+ i))) | |
958 | (if (= i len) | |
959 | (setq trans (mapconcat 'identity trans ""))))) | |
960 | (setq dic (cons (cons key trans) dic))) | |
961 | table))) | |
;; Rules are emitted in `string<' order of their keys.
962 | (setq dic (sort dic (function (lambda (x y) (string< (car x) (car y)))))) | |
963 | (goto-char (point-max)) | |
964 | (insert (format "%S\n" "\e$A::WVJdHk!K!>WTH;!?!K\e(B | |
965 | ||
966 | \e$A<|EL6TUU1m\e(B: | |
967 | \e$A)3)%)%)W)%)%)W)%)%)W)%)%)W)%)%)W)%)%)W)%)%)W)%)%)W)%)%)W)%)%)7\e(B | |
968 | \e$A)'#Q\e(B \e$A)'#W\e(B \e$A)'#E\e(B \e$A)'#R\e(B \e$A)'#T\e(B \e$A)'#Y\e(B \e$A)'#U\e(Bsh\e$A)'#I\e(Bch\e$A)'#O\e(B \e$A)'#P\e(B \e$A)'\e(B | |
969 | \e$A)'\e(B iu\e$A)'\e(B ua\e$A)'\e(B e\e$A)'\e(B uan\e$A)'\e(B ue\e$A)'\e(B uai\e$A)'\e(B u\e$A)'\e(B i\e$A)'\e(B o\e$A)'\e(B un\e$A)'\e(B | |
970 | \e$A)'\e(B \e$A)'\e(B ia\e$A)'\e(B \e$A)'\e(B van\e$A)'\e(B ve\e$A)'\e(B ing\e$A)'\e(B \e$A)'\e(B \e$A)'\e(B uo\e$A)'\e(B vn\e$A)'\e(B | |
971 | \e$A);)W)%)_)W)%)_)W)%)_)W)%)_)W)%)_)W)%)_)W)%)_)W)%)_)W)%)_)W)%)?\e(B | |
972 | \e$A)'#A\e(B \e$A)'#S\e(B \e$A)'#D\e(B \e$A)'#F\e(B \e$A)'#G\e(B \e$A)'#H\e(B \e$A)'#J\e(B \e$A)'#K\e(B \e$A)'#L\e(B \e$A)'\e(B | |
973 | \e$A)'\e(B a\e$A)'\e(Biong\e$A)'\e(Buang\e$A)'\e(B en\e$A)'\e(B eng\e$A)'\e(B ang\e$A)'\e(B an\e$A)'\e(B ao\e$A)'\e(B ai\e$A)'\e(B | |
974 | \e$A)'\e(B \e$A)'\e(B ong\e$A)'\e(Biang\e$A)'\e(B \e$A)'\e(B ng\e$A)'\e(B \e$A)'\e(B \e$A)'\e(B \e$A)'\e(B \e$A)'\e(B | |
975 | \e$A);)W)%)_)W)%)_)W)%)_)W)%)_)W)%)_)W)%)_)W)%)_)W)%)_)W)%)_)W)%)%)7\e(B | |
976 | \e$A)'#Z\e(B \e$A)'#X\e(B \e$A)'#C\e(B \e$A)'#V\e(Bzh\e$A)'#B\e(B \e$A)'#N\e(B \e$A)'#M\e(B \e$A)'#,\e(B \e$A)'#.\e(B \e$A)'\e(B \e$A#/\e(B \e$A)'\e(B | |
977 | \e$A)'\e(B ei\e$A)'\e(B ie\e$A)'\e(B iao\e$A)'\e(B ui\e$A)'\e(B ou\e$A)'\e(B in\e$A)'\e(B ian\e$A)'G0R3)':sR3)'7{:E)'\e(B | |
978 | \e$A)'\e(B \e$A)'\e(B \e$A)'\e(B \e$A)'\e(B v\e$A)'\e(B \e$A)'\e(B \e$A)'\e(B \e$A)'\e(B \e$A)'\e(B \e$A)'\e(B \e$A)'\e(B | |
979 | \e$A);)%)%)_)%)%)_)%)%)_)%)%)_)%)%)_)%)%)_)%)%)_)%)%)_)%)%)_)%)%)?\e(B | |
980 | ||
981 | ||
982 | Pinyin base input method for Chinese GB2312 characters (`chinese-gb2312'). | |
983 | ||
984 | Pinyin is the standard roman transliteration method for Chinese. | |
985 | For the details of Pinyin system, see the documentation of the input | |
986 | method `chinese-py'. | |
987 | ||
988 | Unlike the standard spelling of Pinyin, in this input method all | |
989 | initials and finals are assigned to single keys (see the above table). | |
990 | For instance, the initial \"ch\" is assigned to the key `i', the final | |
991 | \"iu\" is assigned to the key `q', and tones 1, 2, 3, 4, and \e$AGaIy\e(B are | |
992 | assigned to the keys `q', `w', `e', `r', `t' respectively. | |
993 | ||
994 | \\<quail-translation-docstring> | |
995 | ||
996 | To input one-letter words, you type 4 keys, the first two for the | |
997 | Pinyin of the letter, next one for tone, and the last one is always a | |
998 | quote ('). For instance, \"vsq'\" input \e$AVP\e(B. Exceptions are these | |
999 | letters. You can input them just by typing a single key. | |
1000 | ||
1001 | Character: \e$A04\e(B \e$A2;\e(B \e$A4N\e(B \e$A5D\e(B \e$A6~\e(B \e$A7"\e(B \e$A8v\e(B \e$A:M\e(B \e$A3v\e(B \e$A<0\e(B \e$A?I\e(B \e$AAK\e(B \e$AC;\e(B | |
1002 | Key: a b c d e f g h i j k l m | |
1003 | Character: \e$ADc\e(B \e$AE7\e(B \e$AF,\e(B \e$AF_\e(B \e$AHK\e(B \e$AH}\e(B \e$AK{\e(B \e$AJG\e(B \e$AWE\e(B \e$ANR\e(B \e$AP!\e(B \e$AR;\e(B \e$ATZ\e(B | |
1004 | Key: n o p q r s t u v w x y z | |
1005 | ||
1006 | To input two-letter words, you have two ways. One way is to type 4 | |
1007 | keys, two for the first Pinyin, two for the second Pinyin. For | |
1008 | instance, \"vsgo\" inputs \e$AVP9z\e(B. Another way is to type 3 keys: 2 | |
1009 | initials of two letters, and quote ('). For instance, \"vg'\" also | |
1010 | inputs \e$AVP9z\e(B. | |
1011 | ||
1012 | To input three-letter words, you type 4 keys: initials of three | |
1013 | letters, and the last is quote ('). For instance, \"bjy'2\" inputs \e$A11\e(B | |
1014 | \e$A>)Q<\e(B (the last `2' is to select one of the candidates). | |
1015 | ||
1016 | To input words of more than three letters, you type 4 keys, initials | |
1017 | of the first three letters and the last letter. For instance, | |
1018 | \"bjdt\" inputs \e$A11>)5gJSL(\e(B. | |
1019 | ||
1020 | To input symbols and punctuations, type `/' followed by one of `a' to | |
1021 | `z', then select one of the candidates.")) | |
1022 | (insert " '((\"\C-?\" . quail-delete-last-char) | |
1023 | (\".\" . quail-next-translation) | |
1024 | (\"[\" . quail-next-translation) | |
1025 | (\",\" . quail-prev-translation) | |
1026 | (\"]\" . quail-prev-translation)) | |
1027 | nil nil nil nil)\n\n") | |
1028 | (insert "(quail-define-rules\n") | |
1029 | (dolist (elt dic) | |
1030 | (insert (format "(%S %S)\n" (car elt) (cdr elt)))) | |
1031 | (insert ")\n"))) | |
1032 | ||
a4c4011b AC |
1033 | ;; Generate the code for a Quail package in the current buffer from a |
1034 | ;; CTLau or CTLau-b5 dictionary in the buffer DICBUF. The input | |
1035 | ;; method name of the Quail package is NAME, and the title string is | |
1036 | ;; TITLE. DESCRIPTION is the string shown by describe-input-method. | |
1037 | ||
(defun ctlau-converter (dicbuf name title description)
  "Append Quail rules built from the CTLau dictionary in buffer DICBUF.
The text is added at the end of the current buffer: first DESCRIPTION
printed as a Lisp string, then the key bindings, then a
`quail-define-rules' form with one rule per dictionary line.
NAME and TITLE are accepted but not referenced here."
  (goto-char (point-max))
  (insert (format "%S\n" description))
  (insert " '((\"\C-?\" . quail-delete-last-char)
(\".\" . quail-next-translation)
(\">\" . quail-next-translation)
(\",\" . quail-prev-translation)
(\"<\" . quail-prev-translation))
nil nil nil nil)\n\n")
  (insert "(quail-define-rules\n")
  (let* ((rules-start (point))
         ;; The dictionary proper sits between the line after "#<hr>"
         ;; and the last line starting with "<hr>" in the HTML file.
         (bounds (with-current-buffer dicbuf
                   (goto-char (point-min))
                   (re-search-forward "^#<hr>")
                   (forward-line 1)
                   (let ((from (point)))
                     (goto-char (point-max))
                     (re-search-backward "^<hr>")
                     (cons from (point))))))
    (insert-buffer-substring-no-properties dicbuf (car bounds) (cdr bounds))
    ;; CTLau-b5.html contains characters (0xa1 0xbc) shown as hollow
    ;; boxes where the original CTLau.html character has no Big5
    ;; equivalent; remove them from the copied text.
    (goto-char rules-start)
    (while (search-forward "\e$(0!{\e(B" nil t)
      (delete-char -1))
    ;; Rewrite every copied line as ("key" "translations"): keys are
    ;; downcased and a leading backslash is doubled.
    (goto-char rules-start)
    (while (not (eobp))
      (insert "(\"")
      (when (char-equal (following-char) ?\\)
        (insert "\\"))
      (let ((key-begin (point)))
        (skip-chars-forward "\\\\A-Z")
        (downcase-region key-begin (point)))
      (insert "\" \"")
      (delete-char 1)
      ;; Strip any carriage returns sitting just before the line end.
      (end-of-line)
      (skip-chars-backward "\r")
      (delete-region (point) (line-end-position))
      (insert "\")")
      (forward-line 1)))
  (insert ")\n"))
1086 | ||
;; Thin wrapper around `ctlau-converter': passes DICBUF, NAME and
;; TITLE through and supplies the description string for the GB
;; variant (the converter listed for "CTLau.html" / cn-gb-2312).
1087 | (defun ctlau-gb-converter (dicbuf name title) | |
1088 | (ctlau-converter dicbuf name title | |
1089 | "\e$A::WVJdHk!KAuN}OiJ=TARt!K\e(B | |
1090 | ||
1091 | \e$AAuN}OiJ=TASoW"Rt7=08\e(B | |
1092 | Sidney Lau's Cantonese transcription scheme as described in his book | |
1093 | \"Elementary Cantonese\", The Government Printer, Hong Kong, 1972. | |
1094 | This file was prepared by Fung Fung Lee (\e$A@n7c7e\e(B). | |
1095 | Originally converted from CTCPS3.tit | |
1096 | Last modified: June 2, 1993. | |
1097 | ||
4e7e1f03 | 1098 | Some infrequent GB characters are accessed by typing \\, followed by |
a4c4011b AC |
1099 | the Cantonese romanization of the respective radical (\e$A2?JW\e(B).")) |
1100 | ||
;; Thin wrapper around `ctlau-converter': passes DICBUF, NAME and
;; TITLE through and supplies the description string for the Big5
;; variant (the converter listed for "CTLau-b5.html" / big5).
1101 | (defun ctlau-b5-converter (dicbuf name title) | |
1102 | (ctlau-converter dicbuf name title | |
1103 | "\e$(0KH)tTT&,!(N,Tg>A*#Gn5x!(\e(B | |
1104 | ||
1105 | \e$(0N,Tg>A*#GnM$0D5x'J7{\e(B | |
1106 | Sidney Lau's Cantonese transcription scheme as described in his book | |
1107 | \"Elementary Cantonese\", The Government Printer, Hong Kong, 1972. | |
1108 | This file was prepared by Fung Fung Lee (\e$(0,XFS76\e(B). | |
1109 | Originally converted from CTCPS3.tit | |
1110 | Last modified: June 2, 1993. | |
1111 | ||
4e7e1f03 | 1112 | Some infrequent characters are accessed by typing \\, followed by |
a4c4011b AC |
1113 | the Cantonese romanization of the respective radical (\e$(0?f5}\e(B).")) |
1114 | ||
(declare-function dos-8+3-filename "dos-fns.el" (filename))

(defun miscdic-convert (filename &optional dirname)
  "Convert a dictionary file FILENAME into a Quail package.
Optional argument DIRNAME if specified is the directory name under which
the generated Quail package is saved.

Every entry of `quail-misc-package-ext-info' whose dictionary file
name occurs literally in FILENAME is processed.  An entry is skipped,
with a message, when its Quail file is already newer than FILENAME.
Signal an error if FILENAME is not readable."
  (interactive "FInput method dictionary file: ")
  (or (file-readable-p filename)
      (error "%s does not exist" filename))
  (let ((tail quail-misc-package-ext-info)
        coding-system-for-write
        slot
        name title dicfile coding quailfile converter copyright)
    (while tail
      (setq slot (car tail)
            dicfile (nth 2 slot)
            quailfile (nth 4 slot))
      ;; DICFILE is a plain file name, not a regexp: quote it so that
      ;; characters such as `.' only match themselves.
      (when (and (or (string-match (regexp-quote dicfile) filename)
                     ;; MS-DOS filesystem truncates file names to 8+3
                     ;; limits, so "cangjie-table.cns" becomes
                     ;; "cangjie-.cns", and the above string-match
                     ;; fails.  Give DOS users a chance...
                     (and (fboundp 'msdos-long-file-names)
                          (not (msdos-long-file-names))
                          (string-match
                           (regexp-quote (dos-8+3-filename dicfile))
                           filename)))
                 (if (file-newer-than-file-p
                      filename (expand-file-name quailfile dirname))
                     t
                   (message "%s is up to date" quailfile)
                   nil))
        (setq name (car slot)
              title (nth 1 slot)
              coding (nth 3 slot)
              converter (nth 5 slot)
              copyright (nth 6 slot))
        (message "Converting %s to %s..." dicfile quailfile)
        ;; Explicitly set eol format to `unix'.
        (setq coding-system-for-write
              (coding-system-change-eol-conversion coding 'unix))
        (with-temp-file (expand-file-name quailfile dirname)
          (insert (format ";; Quail package `%s' -*- coding:%s -*-\n"
                          name coding))
          (insert ";; Generated by the command `miscdic-convert'\n")
          (insert ";; Date: " (current-time-string) "\n")
          (insert ";; Source dictionary file: " dicfile "\n")
          (insert ";; Copyright notice of the source file\n")
          (insert ";;------------------------------------------------------\n")
          (insert copyright "\n")
          (insert ";;------------------------------------------------------\n")
          (insert "\n")
          (insert ";;; Code:\n\n")
          (insert "(require 'quail)\n")
          (insert "(quail-define-package \"" name "\" \""
                  (if (eq coding 'big5) "Chinese-BIG5"
                    (if (eq coding 'iso-2022-cn-ext) "Chinese-CNS"
                      "Chinese-GB"))
                  "\" \"" title "\" t\n")
          (let* ((coding-system-for-read
                  (coding-system-change-eol-conversion coding 'unix))
                 (dicbuf (find-file-noselect filename)))
            ;; Release the dictionary buffer even when the converter
            ;; signals an error.
            (unwind-protect
                (funcall converter dicbuf name title)
              (kill-buffer dicbuf))))
        (message "Converting %s to %s...done" dicfile quailfile))
      (setq tail (cdr tail)))))
1180 | ||
(defun batch-miscdic-convert ()
  "Run `miscdic-convert' on the files remaining on the command line.
Use this from the command line, with `-batch';
it won't work in an interactive Emacs.
If there's an argument \"-dir\", the next argument specifies a directory
to store generated Quail packages.

A directory argument is expanded to the non-directory files it
contains.  Emacs is killed with exit status 0 once all arguments
have been processed."
  (defvar command-line-args-left)	; Avoid compiler warning.
  (if (not noninteractive)
      (error "`batch-miscdic-convert' should be used only with -batch"))
  (let ((dir default-directory)
        filename)
    (while command-line-args-left
      (when (string= (car command-line-args-left) "-dir")
        (setq command-line-args-left (cdr command-line-args-left))
        (setq dir (car command-line-args-left))
        (setq command-line-args-left (cdr command-line-args-left)))
      (setq filename (car command-line-args-left)
            command-line-args-left (cdr command-line-args-left))
      ;; FILENAME is nil when "-dir DIR" were the last arguments;
      ;; there is nothing to convert in that case.
      (when filename
        (if (file-directory-p filename)
            (dolist (file (directory-files filename t nil t))
              (or (file-directory-p file)
                  (miscdic-convert file dir)))
          (miscdic-convert filename dir)))))
  (kill-emacs 0))
1206 | ||
5cdaf2a5 KH |
1207 | ;; Local Variables: |
1208 | ;; coding: iso-2022-7bit | |
1209 | ;; End: | |
60370d40 PJ |
1210 | |
1211 | ;;; titdic-cnv.el ends here |