In setup-LANGUAGE-environment functions,
[bpt/emacs.git] / lisp / language / japan-util.el
CommitLineData
3fdc9c8f 1;;; japan-util.el --- utilities for Japanese
4ed46869 2
4ed46869 3;; Copyright (C) 1995 Electrotechnical Laboratory, JAPAN.
fa526c4a 4;; Licensed to the Free Software Foundation.
4ed46869
KH
5
6;; Keywords: mule, multilingual, Japanese
7
8;; This file is part of GNU Emacs.
9
10;; GNU Emacs is free software; you can redistribute it and/or modify
11;; it under the terms of the GNU General Public License as published by
12;; the Free Software Foundation; either version 2, or (at your option)
13;; any later version.
14
15;; GNU Emacs is distributed in the hope that it will be useful,
16;; but WITHOUT ANY WARRANTY; without even the implied warranty of
17;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18;; GNU General Public License for more details.
19
20;; You should have received a copy of the GNU General Public License
369314dc
KH
21;; along with GNU Emacs; see the file COPYING. If not, write to the
22;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
23;; Boston, MA 02111-1307, USA.
4ed46869
KH
24
25;;; Code:
26
335a7ad7
KH
27;;;###autoload
(defun setup-japanese-environment ()
  "Set up the multilingual environment (MULE) for Japanese.
This first runs `setup-english-environment', then calls
`set-language-environment-coding-systems' for \"Japanese\".  On MS-DOS
it additionally prefers the coding system `japanese-shift-jis'.
Finally `default-input-method' is set to \"japanese\"."
  (interactive)
  (setup-english-environment)
  (set-language-environment-coding-systems "Japanese")
  (when (eq system-type 'ms-dos)
    (prefer-coding-system 'japanese-shift-jis))
  (setq default-input-method "japanese"))
335a7ad7 36
4ed46869
KH
;; Rows of (HIRAGANA KATAKANA HANKAKU-KATAKANA).  HIRAGANA is nil in the
;; last three rows, which list katakana only.  HANKAKU-KATAKANA is nil
;; where the table gives no half-width form, a character where a single
;; one is given, and a string otherwise.  The loop that follows this
;; table turns the rows into char-code properties.
37(defconst japanese-kana-table
38 '((?\e$B$"\e(B ?\e$B%"\e(B ?\e(I1\e(B) (?\e$B$$\e(B ?\e$B%$\e(B ?\e(I2\e(B) (?\e$B$&\e(B ?\e$B%&\e(B ?\e(I3\e(B) (?\e$B$(\e(B ?\e$B%(\e(B ?\e(I4\e(B) (?\e$B$*\e(B ?\e$B%*\e(B ?\e(I5\e(B)
39 (?\e$B$+\e(B ?\e$B%+\e(B ?\e(I6\e(B) (?\e$B$-\e(B ?\e$B%-\e(B ?\e(I7\e(B) (?\e$B$/\e(B ?\e$B%/\e(B ?\e(I8\e(B) (?\e$B$1\e(B ?\e$B%1\e(B ?\e(I9\e(B) (?\e$B$3\e(B ?\e$B%3\e(B ?\e(I:\e(B)
40 (?\e$B$5\e(B ?\e$B%5\e(B ?\e(I;\e(B) (?\e$B$7\e(B ?\e$B%7\e(B ?\e(I<\e(B) (?\e$B$9\e(B ?\e$B%9\e(B ?\e(I=\e(B) (?\e$B$;\e(B ?\e$B%;\e(B ?\e(I>\e(B) (?\e$B$=\e(B ?\e$B%=\e(B ?\e(I?\e(B)
41 (?\e$B$?\e(B ?\e$B%?\e(B ?\e(I@\e(B) (?\e$B$A\e(B ?\e$B%A\e(B ?\e(IA\e(B) (?\e$B$D\e(B ?\e$B%D\e(B ?\e(IB\e(B) (?\e$B$F\e(B ?\e$B%F\e(B ?\e(IC\e(B) (?\e$B$H\e(B ?\e$B%H\e(B ?\e(ID\e(B)
42 (?\e$B$J\e(B ?\e$B%J\e(B ?\e(IE\e(B) (?\e$B$K\e(B ?\e$B%K\e(B ?\e(IF\e(B) (?\e$B$L\e(B ?\e$B%L\e(B ?\e(IG\e(B) (?\e$B$M\e(B ?\e$B%M\e(B ?\e(IH\e(B) (?\e$B$N\e(B ?\e$B%N\e(B ?\e(II\e(B)
43 (?\e$B$O\e(B ?\e$B%O\e(B ?\e(IJ\e(B) (?\e$B$R\e(B ?\e$B%R\e(B ?\e(IK\e(B) (?\e$B$U\e(B ?\e$B%U\e(B ?\e(IL\e(B) (?\e$B$X\e(B ?\e$B%X\e(B ?\e(IM\e(B) (?\e$B$[\e(B ?\e$B%[\e(B ?\e(IN\e(B)
44 (?\e$B$^\e(B ?\e$B%^\e(B ?\e(IO\e(B) (?\e$B$_\e(B ?\e$B%_\e(B ?\e(IP\e(B) (?\e$B$`\e(B ?\e$B%`\e(B ?\e(IQ\e(B) (?\e$B$a\e(B ?\e$B%a\e(B ?\e(IR\e(B) (?\e$B$b\e(B ?\e$B%b\e(B ?\e(IS\e(B)
45 (?\e$B$d\e(B ?\e$B%d\e(B ?\e(IT\e(B) (?\e$B$f\e(B ?\e$B%f\e(B ?\e(IU\e(B) (?\e$B$h\e(B ?\e$B%h\e(B ?\e(IV\e(B)
46 (?\e$B$i\e(B ?\e$B%i\e(B ?\e(IW\e(B) (?\e$B$j\e(B ?\e$B%j\e(B ?\e(IX\e(B) (?\e$B$k\e(B ?\e$B%k\e(B ?\e(IY\e(B) (?\e$B$l\e(B ?\e$B%l\e(B ?\e(IZ\e(B) (?\e$B$m\e(B ?\e$B%m\e(B ?\e(I[\e(B)
47 (?\e$B$o\e(B ?\e$B%o\e(B ?\e(I\\e(B) (?\e$B$p\e(B ?\e$B%p\e(B nil) (?\e$B$q\e(B ?\e$B%q\e(B nil) (?\e$B$r\e(B ?\e$B%r\e(B ?\e(I&\e(B)
48 (?\e$B$s\e(B ?\e$B%s\e(B ?\e(I]\e(B)
49 (?\e$B$,\e(B ?\e$B%,\e(B "\e(I6^\e(B") (?\e$B$.\e(B ?\e$B%.\e(B "\e(I7^\e(B") (?\e$B$0\e(B ?\e$B%0\e(B "\e(I8^\e(B") (?\e$B$2\e(B ?\e$B%2\e(B "\e(I9^\e(B") (?\e$B$4\e(B ?\e$B%4\e(B "\e(I:^\e(B")
50 (?\e$B$6\e(B ?\e$B%6\e(B "\e(I;^\e(B") (?\e$B$8\e(B ?\e$B%8\e(B "\e(I<^\e(B") (?\e$B$:\e(B ?\e$B%:\e(B "\e(I=^\e(B") (?\e$B$<\e(B ?\e$B%<\e(B "\e(I>^\e(B") (?\e$B$>\e(B ?\e$B%>\e(B "\e(I?^\e(B")
51 (?\e$B$@\e(B ?\e$B%@\e(B "\e(I@^\e(B") (?\e$B$B\e(B ?\e$B%B\e(B "\e(IA^\e(B") (?\e$B$E\e(B ?\e$B%E\e(B "\e(IB^\e(B") (?\e$B$G\e(B ?\e$B%G\e(B "\e(IC^\e(B") (?\e$B$I\e(B ?\e$B%I\e(B "\e(ID^\e(B")
52 (?\e$B$P\e(B ?\e$B%P\e(B "\e(IJ^\e(B") (?\e$B$S\e(B ?\e$B%S\e(B "\e(IK^\e(B") (?\e$B$V\e(B ?\e$B%V\e(B "\e(IL^\e(B") (?\e$B$Y\e(B ?\e$B%Y\e(B "\e(IM^\e(B") (?\e$B$\\e(B ?\e$B%\\e(B "\e(IN^\e(B")
53 (?\e$B$Q\e(B ?\e$B%Q\e(B "\e(IJ_\e(B") (?\e$B$T\e(B ?\e$B%T\e(B "\e(IK_\e(B") (?\e$B$W\e(B ?\e$B%W\e(B "\e(IL_\e(B") (?\e$B$Z\e(B ?\e$B%Z\e(B "\e(IM_\e(B") (?\e$B$]\e(B ?\e$B%]\e(B "\e(IN_\e(B")
54 (?\e$B$!\e(B ?\e$B%!\e(B ?\e(I'\e(B) (?\e$B$#\e(B ?\e$B%#\e(B ?\e(I(\e(B) (?\e$B$%\e(B ?\e$B%%\e(B ?\e(I)\e(B) (?\e$B$'\e(B ?\e$B%'\e(B ?\e(I*\e(B) (?\e$B$)\e(B ?\e$B%)\e(B ?\e(I+\e(B)
55 (?\e$B$C\e(B ?\e$B%C\e(B ?\e(I/\e(B)
56 (?\e$B$c\e(B ?\e$B%c\e(B ?\e(I,\e(B) (?\e$B$e\e(B ?\e$B%e\e(B ?\e(I-\e(B) (?\e$B$g\e(B ?\e$B%g\e(B ?\e(I.\e(B)
57 (?\e$B$n\e(B ?\e$B%n\e(B nil)
58 (nil ?\e$B%t\e(B "\e(I3^\e(B") (nil ?\e$B%u\e(B nil) (nil ?\e$B%v\e(B nil))
59 "Japanese JISX0208 Kana character table.
60Each element is of the form (HIRAGANA KATAKANA HANKAKU-KATAKANA), where
61HIRAGANA and KATAKANA belong to `japanese-jisx0208',
62HANKAKU-KATAKANA belongs to `japanese-jisx0201-kana'.")
63
;; Put properties 'katakana, 'hiragana, 'jisx0201 and 'jisx0208 on each
;; Japanese kana character for conversion among them.
;;
;; For every (HIRAGANA KATAKANA HANKAKU) row of `japanese-kana-table':
;;   - HIRAGANA and KATAKANA point at each other, when HIRAGANA is
;;     non-nil;
;;   - both point at HANKAKU through 'jisx0201, when HANKAKU is non-nil;
;;   - a HANKAKU that is a single character points back through
;;     'hiragana, 'katakana and 'jisx0208.  The 'jisx0208 link is what
;;     `japanese-zenkaku' looks up, so without it a hankaku kana could
;;     never be converted back to its zenkaku katakana.  A HANKAKU given
;;     as a string gets no back links.
(let ((rows japanese-kana-table))
  (while rows
    (let* ((row (car rows))
           (hiragana (car row))
           (katakana (nth 1 row))
           (hankaku (nth 2 row)))
      (when hiragana
        (put-char-code-property hiragana 'katakana katakana)
        (put-char-code-property katakana 'hiragana hiragana)
        (when hankaku
          (put-char-code-property hiragana 'jisx0201 hankaku)))
      (when hankaku
        (put-char-code-property katakana 'jisx0201 hankaku)
        (when (integerp hankaku)
          ;; Rows without a hiragana form must not record a nil
          ;; 'hiragana back link.
          (when hiragana
            (put-char-code-property hankaku 'hiragana hiragana))
          (put-char-code-property hankaku 'katakana katakana)
          (put-char-code-property hankaku 'jisx0208 katakana))))
    (setq rows (cdr rows))))
86
;; Rows of (SYMBOL ASCII HANKAKU).  ASCII is nil in rows that list no
;; ASCII counterpart, and HANKAKU is simply left out of rows that list
;; no half-width counterpart.  Several rows share the same ASCII
;; character (for instance `,' and `-').
87(defconst japanese-symbol-table
88 '((?\\e$B!!\e(B ?\ ) (?\e$B!"\e(B ?, ?\e(I$\e(B) (?\e$B!#\e(B ?. ?\e(I!\e(B) (?\e$B!$\e(B ?, ?\e(I$\e(B) (?\e$B!%\e(B ?. ?\e(I!\e(B) (?\e$B!&\e(B nil ?\e(I%\e(B)
89 (?\e$B!'\e(B ?:) (?\e$B!(\e(B ?\;) (?\e$B!)\e(B ??) (?\e$B!*\e(B ?!) (?\e$B!+\e(B nil ?\e(I^\e(B) (?\e$B!,\e(B nil ?\e(I_\e(B)
90 (?\e$B!-\e(B ?') (?\e$B!.\e(B ?`) (?\e$B!0\e(B ?^) (?\e$B!2\e(B ?_) (?\e$B!<\e(B ?-) (?\e$B!=\e(B ?-) (?\e$B!>\e(B ?-)
91 (?\e$B!?\e(B ?/) (?\e$B!@\e(B ?\\) (?\e$B!A\e(B ?~) (?\e$B!C\e(B ?|) (?\e$B!F\e(B ?`) (?\e$B!G\e(B ?') (?\e$B!H\e(B ?\") (?\e$B!I\e(B ?\")
92 (?\\e$B!J\e(B ?\() (?\\e$B!K\e(B ?\)) (?\\e$B!N\e(B ?[) (?\\e$B!O\e(B ?]) (?\\e$B!P\e(B ?{) (?\\e$B!Q\e(B ?})
93 (?\e$B!R\e(B ?<) (?\e$B!S\e(B ?>) (?\e$B!\\e(B ?+) (?\e$B!]\e(B ?-) (?\e$B!a\e(B ?=) (?\e$B!c\e(B ?<) (?\e$B!d\e(B ?>)
94 (?\e$B!l\e(B ?') (?\e$B!m\e(B ?\") (?\e$B!o\e(B ?\\) (?\e$B!p\e(B ?$) (?\e$B!s\e(B ?%) (?\e$B!t\e(B ?#) (?\e$B!u\e(B ?&) (?\e$B!v\e(B ?*)
95 (?\e$B!w\e(B ?@))
96 "Japanese JISX0208 symbol character table.
97 Each element is of the form (SYMBOL ASCII HANKAKU), where SYMBOL
98belongs to `japanese-jisx0208', ASCII belongs to `ascii', and HANKAKU
99belongs to `japanese-jisx0201-kana'.")
100
;; Put properties 'jisx0208, 'jisx0201, and 'ascii on each Japanese
;; symbol and on its ASCII and hankaku counterparts, for conversion
;; among them.  Each (SYMBOL ASCII HANKAKU) row of
;; `japanese-symbol-table' links SYMBOL with ASCII in both directions
;; when ASCII is non-nil, and SYMBOL with HANKAKU in both directions
;; when HANKAKU is non-nil.
(let ((rows japanese-symbol-table))
  (while rows
    (let* ((row (car rows))
           (zenkaku (car row))
           (ascii (nth 1 row))
           (hankaku (nth 2 row)))
      (when ascii
        (put-char-code-property zenkaku 'ascii ascii)
        (put-char-code-property ascii 'jisx0208 zenkaku))
      (when hankaku
        (put-char-code-property zenkaku 'jisx0201 hankaku)
        (put-char-code-property hankaku 'jisx0208 zenkaku)))
    (setq rows (cdr rows))))
117
;; Rows are dotted pairs (ALPHA-NUMERIC . ASCII) covering the digits and
;; the upper- and lower-case letters; the loop that follows this table
;; reads them with `car' and `cdr'.
118(defconst japanese-alpha-numeric-table
119 '((?\e$B#0\e(B . ?0) (?\e$B#1\e(B . ?1) (?\e$B#2\e(B . ?2) (?\e$B#3\e(B . ?3) (?\e$B#4\e(B . ?4)
120 (?\e$B#5\e(B . ?5) (?\e$B#6\e(B . ?6) (?\e$B#7\e(B . ?7) (?\e$B#8\e(B . ?8) (?\e$B#9\e(B . ?9)
121 (?\e$B#A\e(B . ?A) (?\e$B#B\e(B . ?B) (?\e$B#C\e(B . ?C) (?\e$B#D\e(B . ?D) (?\e$B#E\e(B . ?E)
122 (?\e$B#F\e(B . ?F) (?\e$B#G\e(B . ?G) (?\e$B#H\e(B . ?H) (?\e$B#I\e(B . ?I) (?\e$B#J\e(B . ?J)
123 (?\e$B#K\e(B . ?K) (?\e$B#L\e(B . ?L) (?\e$B#M\e(B . ?M) (?\e$B#N\e(B . ?N) (?\e$B#O\e(B . ?O)
124 (?\e$B#P\e(B . ?P) (?\e$B#Q\e(B . ?Q) (?\e$B#R\e(B . ?R) (?\e$B#S\e(B . ?S) (?\e$B#T\e(B . ?T)
125 (?\e$B#U\e(B . ?U) (?\e$B#V\e(B . ?V) (?\e$B#W\e(B . ?W) (?\e$B#X\e(B . ?X) (?\e$B#Y\e(B . ?Y) (?\e$B#Z\e(B . ?Z)
126 (?\e$B#a\e(B . ?a) (?\e$B#b\e(B . ?b) (?\e$B#c\e(B . ?c) (?\e$B#d\e(B . ?d) (?\e$B#e\e(B . ?e)
127 (?\e$B#f\e(B . ?f) (?\e$B#g\e(B . ?g) (?\e$B#h\e(B . ?h) (?\e$B#i\e(B . ?i) (?\e$B#j\e(B . ?j)
128 (?\e$B#k\e(B . ?k) (?\e$B#l\e(B . ?l) (?\e$B#m\e(B . ?m) (?\e$B#n\e(B . ?n) (?\e$B#o\e(B . ?o)
129 (?\e$B#p\e(B . ?p) (?\e$B#q\e(B . ?q) (?\e$B#r\e(B . ?r) (?\e$B#s\e(B . ?s) (?\e$B#t\e(B . ?t)
130 (?\e$B#u\e(B . ?u) (?\e$B#v\e(B . ?v) (?\e$B#w\e(B . ?w) (?\e$B#x\e(B . ?x) (?\e$B#y\e(B . ?y) (?\e$B#z\e(B . ?z))
131 "Japanese JISX0208 alpha numeric character table.
132Each element is of the form (ALPHA-NUMERIC . ASCII), where ALPHA-NUMERIC
133belongs to `japanese-jisx0208', ASCII belongs to `ascii'.")
134
;; Put properties 'jisx0208 and 'ascii on each Japanese alpha numeric
;; character and on its ASCII counterpart, for conversion between them.
;; Each element of `japanese-alpha-numeric-table' is a dotted pair
;; (ALPHA-NUMERIC . ASCII); the two characters are linked in both
;; directions.
(let ((pairs japanese-alpha-numeric-table))
  (while pairs
    (let ((zenkaku (car (car pairs)))
          (ascii (cdr (car pairs))))
      (put-char-code-property zenkaku 'ascii ascii)
      (put-char-code-property ascii 'jisx0208 zenkaku))
    (setq pairs (cdr pairs))))
145
(defun japanese-string-conversion (str func &rest args)
  "Convert string STR by FUNC and return the resulting string.
STR is inserted into the buffer \" *Japanese work*\", which is created
if necessary and erased on every call.  FUNC is then applied to the
start and end positions of the inserted text, followed by ARGS.  The
value is the content of that buffer after FUNC has returned."
  (save-excursion
    (set-buffer (get-buffer-create " *Japanese work*"))
    (erase-buffer)
    (insert str)
    ;; Point is now just after the inserted text, i.e. at its end.
    (let ((end (point)))
      (apply func (point-min) end args))
    (buffer-string)))
155
156;;;###autoload
(defun japanese-katakana (obj &optional hankaku)
  "Return OBJ converted to Katakana.
OBJ may be a character or a string, and is not altered.
A string is converted with `japanese-katakana-region' and the value is
a new string.  A character is looked up by its `katakana' char-code
property, or by its `jisx0201' property when HANKAKU is non-nil; OBJ
itself is returned when it has no such property.
Optional argument HANKAKU non-nil means to convert to `hankaku'
Katakana \(`japanese-jisx0201-kana'), in which case the value may be a
string even if OBJ is a character, if two Katakanas are necessary to
represent OBJ."
  (cond ((stringp obj)
         (japanese-string-conversion obj 'japanese-katakana-region hankaku))
        (hankaku
         (or (get-char-code-property obj 'jisx0201) obj))
        (t
         (or (get-char-code-property obj 'katakana) obj))))
169
170;;;###autoload
(defun japanese-hiragana (obj)
  "Return OBJ converted to Hiragana.
OBJ may be a character or a string, and is not altered.
A string is converted with `japanese-hiragana-region' and the value is
a new string.  A character is replaced by the value of its `hiragana'
char-code property; OBJ itself is returned when it has none."
  (if (not (stringp obj))
      (or (get-char-code-property obj 'hiragana) obj)
    (japanese-string-conversion obj 'japanese-hiragana-region)))
179
180;;;###autoload
(defun japanese-hankaku (obj &optional ascii-only)
  "Return OBJ converted to `hankaku'.
OBJ may be a character or a string, and is not altered.
A string is converted with `japanese-hankaku-region' and the value is
a new string.  For a character, the `ascii' char-code property is
tried first, then the `jisx0201' property; OBJ itself is returned when
neither applies.
Optional argument ASCII-ONLY non-nil means to consider only the
`ascii' property, so that only an ASCII character can replace OBJ."
  (cond ((stringp obj)
         (japanese-string-conversion obj 'japanese-hankaku-region ascii-only))
        ;; A clause made of a test alone yields the value of that test.
        ((get-char-code-property obj 'ascii))
        ((and (not ascii-only)
              (get-char-code-property obj 'jisx0201)))
        (t obj)))
192
193;;;###autoload
(defun japanese-zenkaku (obj)
  "Return OBJ converted to `zenkaku'.
OBJ may be a character or a string, and is not altered.
A string is converted with `japanese-zenkaku-region' and the value is
a new string.  A character is replaced by the value of its `jisx0208'
char-code property; OBJ itself is returned when it has none."
  (if (stringp obj)
      (japanese-string-conversion obj 'japanese-zenkaku-region)
    (let ((wide (get-char-code-property obj 'jisx0208)))
      (if wide wide obj))))
202
203;;;###autoload
(defun japanese-katakana-region (from to &optional hankaku)
  "Convert Japanese `hiragana' chars in the region to `katakana' chars.
The region is the text between FROM and TO.
Optional argument HANKAKU non-nil means to convert to `hankaku katakana'
characters, whose charset is `japanese-jisx0201-kana'.
When called interactively, the prefix argument is used as HANKAKU.
Each char is converted with `japanese-katakana'; a char for which that
function has no conversion is left untouched."
  (interactive "r\nP")
  (save-restriction
    (narrow-to-region from to)
    (goto-char (point-min))
    ;; Katakana (\cK) is searched for as well as hiragana (\cH) because
    ;; `japanese-katakana' may still have a conversion for it when
    ;; HANKAKU is non-nil.
    (while (re-search-forward "\\cH\\|\\cK" nil t)
      (let* ((kana (preceding-char))
             (kata (japanese-katakana kana hankaku)))
        ;; `japanese-katakana' hands back its argument when it has no
        ;; conversion, so testing the result for non-nil is always true.
        ;; Replace only on an actual change; deleting and re-inserting
        ;; the same char would modify the buffer for nothing.
        (unless (eq kata kana)
          (delete-region (match-beginning 0) (match-end 0))
          (insert kata))))))
219
220;;;###autoload
(defun japanese-hiragana-region (from to)
  "Convert Japanese `katakana' chars in the region to `hiragana' chars.
The region is the text between FROM and TO.
Each char is converted with `japanese-hiragana'; a char for which that
function has no conversion is left untouched."
  (interactive "r")
  (save-restriction
    (narrow-to-region from to)
    (goto-char (point-min))
    (while (re-search-forward "\\cK\\|\\ck" nil t)
      (let* ((kata (preceding-char))
             (hira (japanese-hiragana kata)))
        ;; `japanese-hiragana' hands back its argument when it has no
        ;; conversion, so testing the result for non-nil is always true.
        ;; Replace only on an actual change; deleting and re-inserting
        ;; the same char would modify the buffer for nothing.
        (unless (eq hira kata)
          (delete-region (match-beginning 0) (match-end 0))
          (insert hira))))))
234
235;;;###autoload
(defun japanese-hankaku-region (from to &optional ascii-only)
  "Convert Japanese `zenkaku' chars in the region to `hankaku' chars.
The region is the text between FROM and TO.
`Zenkaku' chars belong to `japanese-jisx0208'.
`Hankaku' chars belong to `ascii' or `japanese-jisx0201-kana'.
Optional argument ASCII-ONLY non-nil means to convert only to ASCII chars.
When called interactively, the prefix argument is used as ASCII-ONLY.
Each char is converted with `japanese-hankaku'; a char for which that
function has no conversion is left untouched."
  (interactive "r\nP")
  (save-restriction
    (narrow-to-region from to)
    (goto-char (point-min))
    (while (re-search-forward "\\cj" nil t)
      (let* ((zenkaku (preceding-char))
             (hankaku (japanese-hankaku zenkaku ascii-only)))
        ;; `japanese-hankaku' hands back its argument when it has no
        ;; conversion, so testing the result for non-nil is always true.
        ;; Replace only on an actual change; deleting and re-inserting
        ;; the same char would modify the buffer for nothing.
        (unless (eq hankaku zenkaku)
          (delete-region (match-beginning 0) (match-end 0))
          (insert hankaku))))))
252
253;;;###autoload
(defun japanese-zenkaku-region (from to)
  "Convert `hankaku' chars in the region to Japanese `zenkaku' chars.
The region is the text between FROM and TO.
`Zenkaku' chars belong to `japanese-jisx0208'.
`Hankaku' chars belong to `ascii' or `japanese-jisx0201-kana'.
Each char is converted with `japanese-zenkaku'; a char for which that
function has no conversion is left untouched."
  (interactive "r")
  (save-restriction
    (narrow-to-region from to)
    (goto-char (point-min))
    (while (re-search-forward "\\ca\\|\\ck" nil t)
      (let* ((hankaku (preceding-char))
             (zenkaku (japanese-zenkaku hankaku)))
        ;; `japanese-zenkaku' hands back its argument when it has no
        ;; conversion, so testing the result for non-nil is always true.
        ;; Replace only on an actual change; deleting and re-inserting
        ;; the same char would modify the buffer for nothing.
        (unless (eq zenkaku hankaku)
          (delete-region (match-beginning 0) (match-end 0))
          (insert zenkaku))))))
269
270;;;###autoload
(defun read-hiragana-string (prompt &optional initial-input)
  "Read a Hiragana string from the minibuffer, prompting with string PROMPT.
Optional second arg INITIAL-INPUT, if non-nil, is a string to insert
before reading.
The reading itself is delegated to `read-multilingual-string', which
is passed \"japanese-hiragana\" as its third argument."
  (let ((hiragana-method "japanese-hiragana"))
    (read-multilingual-string prompt initial-input hiragana-method)))
4ed46869
KH
275
276;;
;; Announce the `japan-util' feature.
650e8505 277(provide 'japan-util)
4ed46869 278
4ed46869 279;;; japan-util.el ends here