1 ;;; ccl.el --- CCL (Code Conversion Language) compiler
3 ;; Copyright (C) 1995 Electrotechnical Laboratory, JAPAN.
4 ;; Licensed to the Free Software Foundation.
6 ;; Keywords: CCL, mule, multilingual, character set, coding-system
8 ;; This file is part of GNU Emacs.
10 ;; GNU Emacs is free software; you can redistribute it and/or modify
11 ;; it under the terms of the GNU General Public License as published by
12 ;; the Free Software Foundation; either version 2, or (at your option)
15 ;; GNU Emacs is distributed in the hope that it will be useful,
16 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
17 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 ;; GNU General Public License for more details.
20 ;; You should have received a copy of the GNU General Public License
21 ;; along with GNU Emacs; see the file COPYING. If not, write to the
22 ;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
23 ;; Boston, MA 02111-1307, USA.
27 ;; CCL (Code Conversion Language) is a simple programming language to
28 ;; be used for various kind of code conversion. CCL program is
29 ;; compiled to CCL code (vector of integers) and executed by CCL
30 ;; interpreter of Emacs.
32 ;; CCL is used for code conversion at process I/O and file I/O for
33 ;; non-standard coding-system. In addition, it is used for
34 ;; calculating a code point of X's font from a character code.
35 ;; However, since CCL is designed as a powerful programming language,
36 ;; it can be used for more generic calculation. For instance,
37 ;; combination of three or more arithmetic operations can be
38 ;; calculated faster than Emacs Lisp.
40 ;; Here's the syntax of CCL program in BNF notation.
43 ;; (BUFFER_MAGNIFICATION
47 ;; BUFFER_MAGNIFICATION := integer
48 ;; CCL_MAIN_BLOCK := CCL_BLOCK
49 ;; CCL_EOF_BLOCK := CCL_BLOCK
52 ;; STATEMENT | (STATEMENT [STATEMENT ...])
54 ;; SET | IF | BRANCH | LOOP | REPEAT | BREAK | READ | WRITE | CALL
58 ;; | (REG ASSIGNMENT_OPERATOR EXPRESSION)
61 ;; EXPRESSION := ARG | (EXPRESSION OPERATOR ARG)
63 ;; IF := (if EXPRESSION CCL_BLOCK CCL_BLOCK)
64 ;; BRANCH := (branch EXPRESSION CCL_BLOCK [CCL_BLOCK ...])
65 ;; LOOP := (loop STATEMENT [STATEMENT ...])
69 ;; | (write-repeat [REG | integer | string])
70 ;; | (write-read-repeat REG [integer | ARRAY])
73 ;; | (read-if (REG OPERATOR ARG) CCL_BLOCK CCL_BLOCK)
74 ;; | (read-branch REG CCL_BLOCK [CCL_BLOCK ...])
75 ;; | (read-multibyte-character REG {charset} REG {code-point})
78 ;; | (write EXPRESSION)
79 ;; | (write integer) | (write string) | (write REG ARRAY)
81 ;; | (write-multibyte-character REG(charset) REG(codepoint))
83 ;; (translate-character REG(table) REG(charset) REG(codepoint))
84 ;; | (translate-character SYMBOL REG(charset) REG(codepoint))
86 ;; (iterate-multiple-map REG REG MAP-IDs)
87 ;; | (map-multiple REG REG (MAP-SET))
88 ;; | (map-single REG REG MAP-ID)
89 ;; MAP-IDs := MAP-ID ...
90 ;; MAP-SET := MAP-IDs | (MAP-IDs) MAP-SET
93 ;; CALL := (call ccl-program-name)
96 ;; REG := r0 | r1 | r2 | r3 | r4 | r5 | r6 | r7
97 ;; ARG := REG | integer
99 ;; + | - | * | / | % | & | '|' | ^ | << | >> | <8 | >8 | //
100 ;; | < | > | == | <= | >= | != | de-sjis | en-sjis
101 ;; ASSIGNMENT_OPERATOR :=
102 ;; += | -= | *= | /= | %= | &= | '|=' | ^= | <<= | >>=
103 ;; ARRAY := '[' integer ... ']'
108 "CCL (Code Conversion Language) compiler."
112 (defconst ccl-command-table
113 [if branch loop break repeat write-repeat write-read-repeat
114 read read-if read-branch write call end
115 read-multibyte-character write-multibyte-character
117 iterate-multiple-map map-multiple map-single
]
118 "Vector of CCL commands (symbols).")
120 ;; Put a property to each symbol of CCL commands for the compiler.
121 (let (op (i 0) (len (length ccl-command-table
)))
123 (setq op
(aref ccl-command-table i
))
124 (put op
'ccl-compile-function
(intern (format "ccl-compile-%s" op
)))
127 (defconst ccl-code-table
135 write-register-read-jump
137 write-const-read-jump
139 write-array-read-jump
151 set-assign-expr-const
152 set-assign-expr-register
156 jump-cond-expr-register
157 read-jump-cond-expr-const
158 read-jump-cond-expr-register
161 "Vector of CCL compiled codes (symbols).")
163 (defconst ccl-extended-code-table
164 [read-multibyte-character
165 write-multibyte-character
167 translate-character-const-tbl
168 nil nil nil nil nil nil nil nil nil nil nil nil
; 0x04-0x0f
173 "Vector of CCL extended compiled codes (symbols).")
175 ;; Put a property to each symbol of CCL codes for the disassembler.
176 (let (code (i 0) (len (length ccl-code-table
)))
178 (setq code
(aref ccl-code-table i
))
179 (put code
'ccl-code i
)
180 (put code
'ccl-dump-function
(intern (format "ccl-dump-%s" code
)))
183 (let (code (i 0) (len (length ccl-extended-code-table
)))
185 (setq code
(aref ccl-extended-code-table i
))
188 (put code
'ccl-ex-code i
)
189 (put code
'ccl-dump-function
(intern (format "ccl-dump-%s" code
)))))
192 (defconst ccl-jump-code-list
193 '(jump jump-cond write-register-jump write-register-read-jump
194 write-const-jump write-const-read-jump write-string-jump
195 write-array-read-jump read-jump
))
197 ;; Put a property `jump-flag' to each CCL code which execute jump in
199 (let ((l ccl-jump-code-list
))
201 (put (car l
) 'jump-flag t
)
204 (defconst ccl-register-table
205 [r0 r1 r2 r3 r4 r5 r6 r7
]
206 "Vector of CCL registers (symbols).")
208 ;; Put a property to indicate register number to each symbol of CCL.
210 (let (reg (i 0) (len (length ccl-register-table
)))
212 (setq reg
(aref ccl-register-table i
))
213 (put reg
'ccl-register-number i
)
216 (defconst ccl-arith-table
217 [+ -
* / %
& | ^
<< >> <8 >8 // nil nil nil
218 < > == <= >= != de-sjis en-sjis
]
219 "Vector of CCL arithmetic/logical operators (symbols).")
221 ;; Put a property to each symbol of CCL operators for the compiler.
222 (let (arith (i 0) (len (length ccl-arith-table
)))
224 (setq arith
(aref ccl-arith-table i
))
225 (if arith
(put arith
'ccl-arith-code i
))
228 (defconst ccl-assign-arith-table
229 [+= -
= *= /= %
= &= |
= ^
= <<= >>= <8= >8= //=]
230 "Vector of CCL assignment operators (symbols).")
232 ;; Put a property to each symbol of CCL assignment operators for the compiler.
233 (let (arith (i 0) (len (length ccl-assign-arith-table
)))
235 (setq arith
(aref ccl-assign-arith-table i
))
236 (put arith
'ccl-self-arith-code i
)
239 (defvar ccl-program-vector nil
240 "Working vector of CCL codes produced by CCL compiler.")
241 (defvar ccl-current-ic
0
242 "The current index for `ccl-program-vector'.")
244 ;; Embed integer DATA in `ccl-program-vector' at `ccl-current-ic' and
245 ;; increment it. If IC is specified, embed DATA at IC.
246 (defun ccl-embed-data (data &optional ic
)
248 (aset ccl-program-vector ic data
)
249 (let ((len (length ccl-program-vector
)))
250 (if (>= ccl-current-ic len
)
251 (let ((new (make-vector (* len
2) nil
)))
254 (aset new len
(aref ccl-program-vector len
)))
255 (setq ccl-program-vector new
))))
256 (aset ccl-program-vector ccl-current-ic data
)
257 (setq ccl-current-ic
(1+ ccl-current-ic
))))
259 ;; Embed pair of SYMBOL and PROP where (get SYMBOL PROP) should give
260 ;; proper index number for SYMBOL. PROP should be
261 ;; `translation-table-id', `code-conversion-map-id', or
262 ;; `ccl-program-idx'.
263 (defun ccl-embed-symbol (symbol prop
)
264 (ccl-embed-data (cons symbol prop
)))
266 ;; Embed string STR of length LEN in `ccl-program-vector' at
268 (defun ccl-embed-string (len str
)
271 (ccl-embed-data (logior (ash (aref str i
) 16)
273 (ash (aref str
(1+ i
)) 8)
280 ;; Embed a relative jump address to `ccl-current-ic' in
281 ;; `ccl-program-vector' at IC without altering the other bit field.
282 (defun ccl-embed-current-address (ic)
283 (let ((relative (- ccl-current-ic
(1+ ic
))))
284 (aset ccl-program-vector ic
285 (logior (aref ccl-program-vector ic
) (ash relative
8)))))
287 ;; Embed CCL code for the operation OP and arguments REG and DATA in
288 ;; `ccl-program-vector' at `ccl-current-ic' in the following format.
289 ;; |----------------- integer (28-bit) ------------------|
290 ;; |------------ 20-bit ------------|- 3-bit --|- 5-bit -|
291 ;; |------------- DATA -------------|-- REG ---|-- OP ---|
292 ;; If REG2 is specified, embed a code in the following format.
293 ;; |------- 17-bit ------|- 3-bit --|- 3-bit --|- 5-bit -|
294 ;; |-------- DATA -------|-- REG2 --|-- REG ---|-- OP ---|
296 ;; If REG is a CCL register symbol (e.g. r0, r1...), the register
297 ;; number is embedded. If OP is one of unconditional jumps, DATA is
298 ;; changed to an relative jump address.
300 (defun ccl-embed-code (op reg data
&optional reg2
)
301 (if (and (> data
0) (get op
'jump-flag
))
302 ;; DATA is an absolute jump address. Make it relative to the
303 ;; next of jump code.
304 (setq data
(- data
(1+ ccl-current-ic
))))
305 (let ((code (logior (get op
'ccl-code
)
307 (if (symbolp reg
) (get reg
'ccl-register-number
) reg
) 5)
309 (logior (ash (get reg2
'ccl-register-number
) 8)
312 (ccl-embed-data code
)))
314 ;; extended ccl command format
315 ;; |- 14-bit -|- 3-bit --|- 3-bit --|- 3-bit --|- 5-bit -|
316 ;; |- EX-OP --|-- REG3 --|-- REG2 --|-- REG ---|-- OP ---|
317 (defun ccl-embed-extended-command (ex-op reg reg2 reg3
)
318 (let ((data (logior (ash (get ex-op
'ccl-ex-code
) 3)
320 (get reg3
'ccl-register-number
)
322 (ccl-embed-code 'ex-cmd reg data reg2
)))
324 ;; Just advance `ccl-current-ic' by INC.
325 (defun ccl-increment-ic (inc)
326 (setq ccl-current-ic
(+ ccl-current-ic inc
)))
328 ;; If non-nil, index of the start of the current loop.
329 (defvar ccl-loop-head nil
)
330 ;; If non-nil, list of absolute addresses of the breaking points of
332 (defvar ccl-breaks nil
)
335 (defun ccl-compile (ccl-program)
336 "Return a compiled code of CCL-PROGRAM as a vector of integer."
337 (if (or (null (consp ccl-program
))
338 (null (integerp (car ccl-program
)))
339 (null (listp (car (cdr ccl-program
)))))
340 (error "CCL: Invalid CCL program: %s" ccl-program
))
341 (if (null (vectorp ccl-program-vector
))
342 (setq ccl-program-vector
(make-vector 8192 0)))
343 (setq ccl-loop-head nil ccl-breaks nil
)
344 (setq ccl-current-ic
0)
346 ;; The first element is the buffer magnification.
347 (ccl-embed-data (car ccl-program
))
349 ;; The second element is the address of the start CCL code for
350 ;; processing end of input buffer (we call it eof-processor). We
354 ;; Compile the main body of the CCL program.
355 (ccl-compile-1 (car (cdr ccl-program
)))
357 ;; Embed the address of eof-processor.
358 (ccl-embed-data ccl-current-ic
1)
360 ;; Then compile eof-processor.
361 (if (nth 2 ccl-program
)
362 (ccl-compile-1 (nth 2 ccl-program
)))
364 ;; At last, embed termination code.
365 (ccl-embed-code 'end
0 0)
367 (let ((vec (make-vector ccl-current-ic
0))
369 (while (< i ccl-current-ic
)
370 (aset vec i
(aref ccl-program-vector i
))
374 ;; Signal syntax error.
375 (defun ccl-syntax-error (cmd)
376 (error "CCL: Syntax error: %s" cmd
))
378 ;; Check if ARG is a valid CCL register.
379 (defun ccl-check-register (arg cmd
)
380 (if (get arg
'ccl-register-number
)
382 (error "CCL: Invalid register %s in %s." arg cmd
)))
384 ;; Check if ARG is a valid CCL command.
385 (defun ccl-check-compile-function (arg cmd
)
386 (or (get arg
'ccl-compile-function
)
387 (error "CCL: Invalid command: %s" cmd
)))
389 ;; In the following code, most ccl-compile-XXXX functions return t if
390 ;; they end with unconditional jump, else return nil.
392 ;; Compile CCL-BLOCK (see the syntax above).
393 (defun ccl-compile-1 (ccl-block)
394 (let (unconditional-jump
396 (if (or (integerp ccl-block
)
398 (and ccl-block
(symbolp (car ccl-block
))))
399 ;; This block consists of single statement.
400 (setq ccl-block
(list ccl-block
)))
402 ;; Now CCL-BLOCK is a list of statements. Compile them one by
405 (setq cmd
(car ccl-block
))
406 (setq unconditional-jump
407 (cond ((integerp cmd
)
408 ;; SET statement for the register 0.
409 (ccl-compile-set (list 'r0
'= cmd
)))
412 ;; WRITE statement of string argument.
413 (ccl-compile-write-string cmd
))
416 ;; The other statements.
417 (cond ((eq (nth 1 cmd
) '=)
418 ;; SET statement of the form `(REG = EXPRESSION)'.
419 (ccl-compile-set cmd
))
421 ((and (symbolp (nth 1 cmd
))
422 (get (nth 1 cmd
) 'ccl-self-arith-code
))
423 ;; SET statement with an assignment operation.
424 (ccl-compile-self-set cmd
))
427 (funcall (ccl-check-compile-function (car cmd
) cmd
)
431 (ccl-syntax-error cmd
))))
432 (setq ccl-block
(cdr ccl-block
)))
435 (defconst ccl-max-short-const
(ash 1 19))
436 (defconst ccl-min-short-const
(ash -
1 19))
438 ;; Compile SET statement.
439 (defun ccl-compile-set (cmd)
440 (let ((rrr (ccl-check-register (car cmd
) cmd
))
443 ;; CMD has the form `(RRR = (XXX OP YYY))'.
444 (ccl-compile-expression rrr right
))
447 ;; CMD has the form `(RRR = integer)'.
448 (if (and (<= right ccl-max-short-const
)
449 (>= right ccl-min-short-const
))
450 (ccl-embed-code 'set-short-const rrr right
)
451 (ccl-embed-code 'set-const rrr
0)
452 (ccl-embed-data right
)))
455 ;; CMD has the form `(RRR = rrr [ array ])'.
456 (ccl-check-register right cmd
)
457 (let ((ary (nth 3 cmd
)))
459 (let ((i 0) (len (length ary
)))
460 (ccl-embed-code 'set-array rrr len right
)
462 (ccl-embed-data (aref ary i
))
464 (ccl-embed-code 'set-register rrr
0 right
))))))
467 ;; Compile SET statement with ASSIGNMENT_OPERATOR.
468 (defun ccl-compile-self-set (cmd)
469 (let ((rrr (ccl-check-register (car cmd
) cmd
))
472 ;; CMD has the form `(RRR ASSIGN_OP (XXX OP YYY))', compile
473 ;; the right hand part as `(r7 = (XXX OP YYY))' (note: the
474 ;; register 7 can be used for storing temporary value).
476 (ccl-compile-expression 'r7 right
)
478 ;; Now CMD has the form `(RRR ASSIGN_OP ARG)'. Compile it as
479 ;; `(RRR = (RRR OP ARG))'.
480 (ccl-compile-expression
482 (list rrr
(intern (substring (symbol-name (nth 1 cmd
)) 0 -
1)) right
)))
485 ;; Compile SET statement of the form `(RRR = EXPR)'.
486 (defun ccl-compile-expression (rrr expr
)
487 (let ((left (car expr
))
488 (op (get (nth 1 expr
) 'ccl-arith-code
))
489 (right (nth 2 expr
)))
492 ;; EXPR has the form `((EXPR2 OP2 ARG) OP RIGHT)'. Compile
493 ;; the first term as `(r7 = (EXPR2 OP2 ARG)).'
494 (ccl-compile-expression 'r7 left
)
497 ;; Now EXPR has the form (LEFT OP RIGHT).
498 (if (and (eq rrr left
)
499 (< op
(length ccl-assign-arith-table
)))
500 ;; Compile this SET statement as `(RRR OP= RIGHT)'.
503 (ccl-embed-code 'set-assign-expr-const rrr
(ash op
3) 'r0
)
504 (ccl-embed-data right
))
505 (ccl-check-register right expr
)
506 (ccl-embed-code 'set-assign-expr-register rrr
(ash op
3) right
))
508 ;; Compile this SET statement as `(RRR = (LEFT OP RIGHT))'.
511 (ccl-embed-code 'set-expr-const rrr
(ash op
3) left
)
512 (ccl-embed-data right
))
513 (ccl-check-register right expr
)
514 (ccl-embed-code 'set-expr-register
516 (logior (ash op
3) (get right
'ccl-register-number
))
519 ;; Compile WRITE statement with string argument.
520 (defun ccl-compile-write-string (str)
521 (setq str
(string-as-unibyte str
))
522 (let ((len (length str
)))
523 (ccl-embed-code 'write-const-string
1 len
)
524 (ccl-embed-string len str
))
527 ;; Compile IF statement of the form `(if CONDITION TRUE-PART FALSE-PART)'.
528 ;; If READ-FLAG is non-nil, this statement has the form
529 ;; `(read-if (REG OPERATOR ARG) TRUE-PART FALSE-PART)'.
530 (defun ccl-compile-if (cmd &optional read-flag
)
531 (if (and (/= (length cmd
) 3) (/= (length cmd
) 4))
532 (error "CCL: Invalid number of arguments: %s" cmd
))
533 (let ((condition (nth 1 cmd
))
534 (true-cmds (nth 2 cmd
))
535 (false-cmds (nth 3 cmd
))
538 (if (and (listp condition
)
539 (listp (car condition
)))
540 ;; If CONDITION is a nested expression, the inner expression
541 ;; should be compiled at first as SET statement, i.e.:
542 ;; `(if ((X OP2 Y) OP Z) ...)' is compiled into two statements:
543 ;; `(r7 = (X OP2 Y)) (if (r7 OP Z) ...)'.
545 (ccl-compile-expression 'r7
(car condition
))
546 (setq condition
(cons 'r7
(cdr condition
)))
547 (setq cmd
(cons (car cmd
)
548 (cons condition
(cdr (cdr cmd
)))))))
550 (setq jump-cond-address ccl-current-ic
)
551 ;; Compile CONDITION.
552 (if (symbolp condition
)
553 ;; CONDITION is a register.
555 (ccl-check-register condition cmd
)
556 (ccl-embed-code 'jump-cond condition
0))
557 ;; CONDITION is a simple expression of the form (RRR OP ARG).
558 (let ((rrr (car condition
))
559 (op (get (nth 1 condition
) 'ccl-arith-code
))
560 (arg (nth 2 condition
)))
561 (ccl-check-register rrr cmd
)
564 (ccl-embed-code (if read-flag
'read-jump-cond-expr-const
565 'jump-cond-expr-const
)
568 (ccl-embed-data arg
))
569 (ccl-check-register arg cmd
)
570 (ccl-embed-code (if read-flag
'read-jump-cond-expr-register
571 'jump-cond-expr-register
)
574 (ccl-embed-data (get arg
'ccl-register-number
)))))
576 ;; Compile TRUE-PART.
577 (let ((unconditional-jump (ccl-compile-1 true-cmds
)))
578 (if (null false-cmds
)
579 ;; This is the place to jump to if condition is false.
581 (ccl-embed-current-address jump-cond-address
)
582 (setq unconditional-jump nil
))
583 (let (end-true-part-address)
584 (if (not unconditional-jump
)
586 ;; If TRUE-PART does not end with unconditional jump, we
587 ;; have to jump to the end of FALSE-PART from here.
588 (setq end-true-part-address ccl-current-ic
)
589 (ccl-embed-code 'jump
0 0)))
590 ;; This is the place to jump to if CONDITION is false.
591 (ccl-embed-current-address jump-cond-address
)
592 ;; Compile FALSE-PART.
593 (setq unconditional-jump
594 (and (ccl-compile-1 false-cmds
) unconditional-jump
))
595 (if end-true-part-address
596 ;; This is the place to jump to after the end of TRUE-PART.
597 (ccl-embed-current-address end-true-part-address
))))
598 unconditional-jump
)))
600 ;; Compile BRANCH statement.
601 (defun ccl-compile-branch (cmd)
602 (if (< (length cmd
) 3)
603 (error "CCL: Invalid number of arguments: %s" cmd
))
604 (ccl-compile-branch-blocks 'branch
605 (ccl-compile-branch-expression (nth 1 cmd
) cmd
)
608 ;; Compile READ statement of the form `(read-branch EXPR BLOCK0 BLOCK1 ...)'.
609 (defun ccl-compile-read-branch (cmd)
610 (if (< (length cmd
) 3)
611 (error "CCL: Invalid number of arguments: %s" cmd
))
612 (ccl-compile-branch-blocks 'read-branch
613 (ccl-compile-branch-expression (nth 1 cmd
) cmd
)
616 ;; Compile EXPRESSION part of BRANCH statement and return register
617 ;; which holds a value of the expression.
618 (defun ccl-compile-branch-expression (expr cmd
)
620 ;; EXPR has the form `(EXPR2 OP ARG)'. Compile it as SET
621 ;; statement of the form `(r7 = (EXPR2 OP ARG))'.
623 (ccl-compile-expression 'r7 expr
)
625 (ccl-check-register expr cmd
)))
627 ;; Compile BLOCKs of BRANCH statement. CODE is 'branch or 'read-branch.
628 ;; REG is a register which holds a value of EXPRESSION part. BLOCKs
629 ;; is a list of CCL-BLOCKs.
630 (defun ccl-compile-branch-blocks (code rrr blocks
)
631 (let ((branches (length blocks
))
633 jump-table-head-address
636 block-unconditional-jump
)
637 (ccl-embed-code code rrr branches
)
638 (setq jump-table-head-address ccl-current-ic
)
639 ;; The size of jump table is the number of blocks plus 1 (for the
640 ;; case RRR is out of range).
641 (ccl-increment-ic (1+ branches
))
642 (setq empty-block-indexes
(list branches
))
643 ;; Compile each block.
646 (if (null (car blocks
))
647 ;; This block is empty.
648 (setq empty-block-indexes
(cons branch-idx empty-block-indexes
)
649 block-unconditional-jump t
)
650 ;; This block is not empty.
651 (ccl-embed-data (- ccl-current-ic jump-table-head-address
)
652 (+ jump-table-head-address branch-idx
))
653 (setq block-unconditional-jump
(ccl-compile-1 (car blocks
)))
654 (if (not block-unconditional-jump
)
656 ;; Jump address of the end of branches are embedded later.
657 ;; For the moment, just remember where to embed them.
658 (setq block-tail-addresses
659 (cons ccl-current-ic block-tail-addresses
))
660 (ccl-embed-code 'jump
0 0))))
661 (setq branch-idx
(1+ branch-idx
))
662 (setq blocks
(cdr blocks
)))
663 (if (not block-unconditional-jump
)
664 ;; We don't need jump code at the end of the last block.
665 (setq block-tail-addresses
(cdr block-tail-addresses
)
666 ccl-current-ic
(1- ccl-current-ic
)))
667 ;; Embed jump address at the tailing jump commands of blocks.
668 (while block-tail-addresses
669 (ccl-embed-current-address (car block-tail-addresses
))
670 (setq block-tail-addresses
(cdr block-tail-addresses
)))
671 ;; For empty blocks, make entries in the jump table point directly here.
672 (while empty-block-indexes
673 (ccl-embed-data (- ccl-current-ic jump-table-head-address
)
674 (+ jump-table-head-address
(car empty-block-indexes
)))
675 (setq empty-block-indexes
(cdr empty-block-indexes
))))
676 ;; Branch command ends by unconditional jump if RRR is out of range.
679 ;; Compile LOOP statement.
680 (defun ccl-compile-loop (cmd)
681 (if (< (length cmd
) 2)
682 (error "CCL: Invalid number of arguments: %s" cmd
))
683 (let* ((ccl-loop-head ccl-current-ic
)
689 (setq unconditional-jump t
)
691 (setq unconditional-jump
692 (and (ccl-compile-1 (car cmd
)) unconditional-jump
))
693 (setq cmd
(cdr cmd
)))
696 ;; Embed jump address for break statements encountered in
699 (ccl-embed-current-address (car ccl-breaks
))
700 (setq ccl-breaks
(cdr ccl-breaks
))))
703 ;; Compile BREAK statement.
704 (defun ccl-compile-break (cmd)
705 (if (/= (length cmd
) 1)
706 (error "CCL: Invalid number of arguments: %s" cmd
))
707 (if (null ccl-loop-head
)
708 (error "CCL: No outer loop: %s" cmd
))
709 (setq ccl-breaks
(cons ccl-current-ic ccl-breaks
))
710 (ccl-embed-code 'jump
0 0)
713 ;; Compile REPEAT statement.
714 (defun ccl-compile-repeat (cmd)
715 (if (/= (length cmd
) 1)
716 (error "CCL: Invalid number of arguments: %s" cmd
))
717 (if (null ccl-loop-head
)
718 (error "CCL: No outer loop: %s" cmd
))
719 (ccl-embed-code 'jump
0 ccl-loop-head
)
722 ;; Compile WRITE-REPEAT statement.
723 (defun ccl-compile-write-repeat (cmd)
724 (if (/= (length cmd
) 2)
725 (error "CCL: Invalid number of arguments: %s" cmd
))
726 (if (null ccl-loop-head
)
727 (error "CCL: No outer loop: %s" cmd
))
728 (let ((arg (nth 1 cmd
)))
729 (cond ((integerp arg
)
730 (ccl-embed-code 'write-const-jump
0 ccl-loop-head
)
731 (ccl-embed-data arg
))
733 (setq arg
(string-as-unibyte arg
))
734 (let ((len (length arg
))
736 (ccl-embed-code 'write-string-jump
0 ccl-loop-head
)
738 (ccl-embed-string len arg
)))
740 (ccl-check-register arg cmd
)
741 (ccl-embed-code 'write-register-jump arg ccl-loop-head
))))
744 ;; Compile WRITE-READ-REPEAT statement.
745 (defun ccl-compile-write-read-repeat (cmd)
746 (if (or (< (length cmd
) 2) (> (length cmd
) 3))
747 (error "CCL: Invalid number of arguments: %s" cmd
))
748 (if (null ccl-loop-head
)
749 (error "CCL: No outer loop: %s" cmd
))
750 (let ((rrr (ccl-check-register (nth 1 cmd
) cmd
))
753 (ccl-embed-code 'write-register-read-jump rrr ccl-loop-head
))
755 (ccl-embed-code 'write-const-read-jump rrr arg ccl-loop-head
))
757 (let ((len (length arg
))
759 (ccl-embed-code 'write-array-read-jump rrr ccl-loop-head
)
762 (ccl-embed-data (aref arg i
))
765 (error "CCL: Invalid argument %s: %s" arg cmd
)))
766 (ccl-embed-code 'read-jump rrr ccl-loop-head
))
769 ;; Compile READ statement.
770 (defun ccl-compile-read (cmd)
771 (if (< (length cmd
) 2)
772 (error "CCL: Invalid number of arguments: %s" cmd
))
773 (let* ((args (cdr cmd
))
774 (i (1- (length args
))))
776 (let ((rrr (ccl-check-register (car args
) cmd
)))
777 (ccl-embed-code 'read-register rrr i
)
778 (setq args
(cdr args
) i
(1- i
)))))
781 ;; Compile READ-IF statement.
782 (defun ccl-compile-read-if (cmd)
783 (ccl-compile-if cmd
'read
))
785 ;; Compile WRITE statement.
786 (defun ccl-compile-write (cmd)
787 (if (< (length cmd
) 2)
788 (error "CCL: Invalid number of arguments: %s" cmd
))
789 (let ((rrr (nth 1 cmd
)))
790 (cond ((integerp rrr
)
791 (ccl-embed-code 'write-const-string
0 rrr
))
793 (ccl-compile-write-string rrr
))
794 ((and (symbolp rrr
) (vectorp (nth 2 cmd
)))
795 (ccl-check-register rrr cmd
)
796 ;; CMD has the form `(write REG ARRAY)'.
797 (let* ((arg (nth 2 cmd
))
800 (ccl-embed-code 'write-array rrr len
)
802 (if (not (integerp (aref arg i
)))
803 (error "CCL: Invalid argument %s: %s" arg cmd
))
804 (ccl-embed-data (aref arg i
))
808 ;; CMD has the form `(write REG ...)'.
809 (let* ((args (cdr cmd
))
810 (i (1- (length args
))))
812 (setq rrr
(ccl-check-register (car args
) cmd
))
813 (ccl-embed-code 'write-register rrr i
)
814 (setq args
(cdr args
) i
(1- i
)))))
817 ;; CMD has the form `(write (LEFT OP RIGHT))'.
818 (let ((left (car rrr
))
819 (op (get (nth 1 rrr
) 'ccl-arith-code
))
823 ;; RRR has the form `((EXPR OP2 ARG) OP RIGHT)'.
824 ;; Compile the first term as `(r7 = (EXPR OP2 ARG))'.
825 (ccl-compile-expression 'r7 left
)
827 ;; Now RRR has the form `(ARG OP RIGHT)'.
830 (ccl-embed-code 'write-expr-const
0 (ash op
3) left
)
831 (ccl-embed-data right
))
832 (ccl-check-register right rrr
)
833 (ccl-embed-code 'write-expr-register
0
835 (get right
'ccl-register-number
))))))
838 (error "CCL: Invalid argument: %s" cmd
))))
841 ;; Compile CALL statement.
842 (defun ccl-compile-call (cmd)
843 (if (/= (length cmd
) 2)
844 (error "CCL: Invalid number of arguments: %s" cmd
))
845 (if (not (symbolp (nth 1 cmd
)))
846 (error "CCL: Subroutine should be a symbol: %s" cmd
))
847 (ccl-embed-code 'call
1 0)
848 (ccl-embed-symbol (nth 1 cmd
) 'ccl-program-idx
)
851 ;; Compile END statement.
852 (defun ccl-compile-end (cmd)
853 (if (/= (length cmd
) 1)
854 (error "CCL: Invalid number of arguments: %s" cmd
))
855 (ccl-embed-code 'end
0 0)
858 ;; Compile read-multibyte-character
859 (defun ccl-compile-read-multibyte-character (cmd)
860 (if (/= (length cmd
) 3)
861 (error "CCL: Invalid number of arguments: %s" cmd
))
862 (let ((RRR (nth 1 cmd
))
864 (ccl-check-register rrr cmd
)
865 (ccl-check-register RRR cmd
)
866 (ccl-embed-extended-command 'read-multibyte-character rrr RRR
0))
869 ;; Compile write-multibyte-character
870 (defun ccl-compile-write-multibyte-character (cmd)
871 (if (/= (length cmd
) 3)
872 (error "CCL: Invalid number of arguments: %s" cmd
))
873 (let ((RRR (nth 1 cmd
))
875 (ccl-check-register rrr cmd
)
876 (ccl-check-register RRR cmd
)
877 (ccl-embed-extended-command 'write-multibyte-character rrr RRR
0))
880 ;; Compile translate-character
881 (defun ccl-compile-translate-character (cmd)
882 (if (/= (length cmd
) 4)
883 (error "CCL: Invalid number of arguments: %s" cmd
))
884 (let ((Rrr (nth 1 cmd
))
887 (ccl-check-register rrr cmd
)
888 (ccl-check-register RRR cmd
)
889 (cond ((and (symbolp Rrr
) (not (get Rrr
'ccl-register-number
)))
890 (ccl-embed-extended-command 'translate-character-const-tbl
892 (ccl-embed-symbol Rrr
'translation-table-id
))
894 (ccl-check-register Rrr cmd
)
895 (ccl-embed-extended-command 'translate-character rrr RRR Rrr
))))
898 (defun ccl-compile-iterate-multiple-map (cmd)
899 (ccl-compile-multiple-map-function 'iterate-multiple-map cmd
)
902 (defun ccl-compile-map-multiple (cmd)
903 (if (/= (length cmd
) 4)
904 (error "CCL: Invalid number of arguments: %s" cmd
))
908 (let ((len 0) result add
)
910 (if (consp (car arg
))
911 (setq add
(funcall func
(car arg
) t
)
912 result
(append result add
)
913 add
(+ (- (car add
)) 1))
921 (cons (- len
) result
)
923 (setq arg
(append (list (nth 0 cmd
) (nth 1 cmd
) (nth 2 cmd
))
924 (funcall func
(nth 3 cmd
) nil
)))
925 (ccl-compile-multiple-map-function 'map-multiple arg
))
928 (defun ccl-compile-map-single (cmd)
929 (if (/= (length cmd
) 4)
930 (error "CCL: Invalid number of arguments: %s" cmd
))
931 (let ((RRR (nth 1 cmd
))
935 (ccl-check-register rrr cmd
)
936 (ccl-check-register RRR cmd
)
937 (ccl-embed-extended-command 'map-single rrr RRR
0)
939 (if (get map
'code-conversion-map
)
940 (ccl-embed-symbol map
'code-conversion-map-id
)
941 (error "CCL: Invalid map: %s" map
)))
943 (error "CCL: Invalid type of arguments: %s" cmd
))))
946 (defun ccl-compile-multiple-map-function (command cmd
)
947 (if (< (length cmd
) 4)
948 (error "CCL: Invalid number of arguments: %s" cmd
))
949 (let ((RRR (nth 1 cmd
))
951 (args (nthcdr 3 cmd
))
953 (ccl-check-register rrr cmd
)
954 (ccl-check-register RRR cmd
)
955 (ccl-embed-extended-command command rrr RRR
0)
956 (ccl-embed-data (length args
))
958 (setq map
(car args
))
960 (if (get map
'code-conversion-map
)
961 (ccl-embed-symbol map
'code-conversion-map-id
)
962 (error "CCL: Invalid map: %s" map
)))
964 (ccl-embed-data map
))
966 (error "CCL: Invalid type of arguments: %s" cmd
)))
967 (setq args
(cdr args
)))))
972 ;; To avoid byte-compiler warning.
976 (defun ccl-dump (ccl-code)
977 "Disassemble compiled CCL-CODE."
978 (let ((len (length ccl-code
))
979 (buffer-mag (aref ccl-code
0)))
980 (cond ((= buffer-mag
0)
981 (insert "Don't output anything.\n"))
983 (insert "Out-buffer must be as large as in-buffer.\n"))
986 (format "Out-buffer must be %d times bigger than in-buffer.\n"
988 (insert "Main-body:\n")
989 (setq ccl-current-ic
2)
990 (if (> (aref ccl-code
1) 0)
992 (while (< ccl-current-ic
(aref ccl-code
1))
994 (insert "At EOF:\n")))
995 (while (< ccl-current-ic len
)
999 ;; Return a CCL code in `ccl-code' at `ccl-current-ic'.
1000 (defun ccl-get-next-code ()
1002 (aref ccl-code ccl-current-ic
)
1003 (setq ccl-current-ic
(1+ ccl-current-ic
))))
1005 (defun ccl-dump-1 ()
1006 (let* ((code (ccl-get-next-code))
1007 (cmd (aref ccl-code-table
(logand code
31)))
1008 (rrr (ash (logand code
255) -
5))
1010 (insert (format "%5d:[%s] " (1- ccl-current-ic
) cmd
))
1011 (funcall (get cmd
'ccl-dump-function
) rrr cc
)))
1013 (defun ccl-dump-set-register (rrr cc
)
1014 (insert (format "r%d = r%d\n" rrr cc
)))
1016 (defun ccl-dump-set-short-const (rrr cc
)
1017 (insert (format "r%d = %d\n" rrr cc
)))
1019 (defun ccl-dump-set-const (rrr ignore
)
1020 (insert (format "r%d = %d\n" rrr
(ccl-get-next-code))))
1022 (defun ccl-dump-set-array (rrr cc
)
1023 (let ((rrr2 (logand cc
7))
1026 (insert (format "r%d = array[r%d] of length %d\n\t"
1029 (insert (format "%d " (ccl-get-next-code)))
1033 (defun ccl-dump-jump (ignore cc
&optional address
)
1034 (insert (format "jump to %d(" (+ (or address ccl-current-ic
) cc
)))
1037 (insert (format "%d)\n" (1+ cc
))))
1039 (defun ccl-dump-jump-cond (rrr cc
)
1040 (insert (format "if (r%d == 0), " rrr
))
1041 (ccl-dump-jump nil cc
))
1043 (defun ccl-dump-write-register-jump (rrr cc
)
1044 (insert (format "write r%d, " rrr
))
1045 (ccl-dump-jump nil cc
))
1047 (defun ccl-dump-write-register-read-jump (rrr cc
)
1048 (insert (format "write r%d, read r%d, " rrr rrr
))
1049 (ccl-dump-jump nil cc
)
1050 (ccl-get-next-code) ; Skip dummy READ-JUMP
1053 (defun ccl-extract-arith-op (cc)
1054 (aref ccl-arith-table
(ash cc -
6)))
1056 (defun ccl-dump-write-expr-const (ignore cc
)
1057 (insert (format "write (r%d %s %d)\n"
1059 (ccl-extract-arith-op cc
)
1060 (ccl-get-next-code))))
1062 (defun ccl-dump-write-expr-register (ignore cc
)
1063 (insert (format "write (r%d %s r%d)\n"
1065 (ccl-extract-arith-op cc
)
1066 (logand (ash cc -
3) 7))))
1068 (defun ccl-dump-insert-char (cc)
1069 (cond ((= cc ?
\t) (insert " \"^I\""))
1070 ((= cc ?
\n) (insert " \"^J\""))
1071 (t (insert (format " \"%c\"" cc
)))))
1073 (defun ccl-dump-write-const-jump (ignore cc
)
1074 (let ((address ccl-current-ic
))
1075 (insert "write char")
1076 (ccl-dump-insert-char (ccl-get-next-code))
1078 (ccl-dump-jump nil cc address
)))
1080 (defun ccl-dump-write-const-read-jump (rrr cc
)
1081 (let ((address ccl-current-ic
))
1082 (insert "write char")
1083 (ccl-dump-insert-char (ccl-get-next-code))
1084 (insert (format ", read r%d, " rrr
))
1085 (ccl-dump-jump cc address
)
1086 (ccl-get-next-code) ; Skip dummy READ-JUMP
1089 (defun ccl-dump-write-string-jump (ignore cc
)
1090 (let ((address ccl-current-ic
)
1091 (len (ccl-get-next-code))
1095 (let ((code (ccl-get-next-code)))
1096 (insert (ash code -
16))
1097 (if (< (1+ i
) len
) (insert (logand (ash code -
8) 255)))
1098 (if (< (+ i
2) len
) (insert (logand code
255))))
1101 (ccl-dump-jump nil cc address
)))
1103 (defun ccl-dump-write-array-read-jump (rrr cc
)
1104 (let ((address ccl-current-ic
)
1105 (len (ccl-get-next-code))
1107 (insert (format "write array[r%d] of length %d,\n\t" rrr len
))
1109 (ccl-dump-insert-char (ccl-get-next-code))
1111 (insert (format "\n\tthen read r%d, " rrr
))
1112 (ccl-dump-jump nil cc address
)
1113 (ccl-get-next-code) ; Skip dummy READ-JUMP.
1116 (defun ccl-dump-read-jump (rrr cc
)
1117 (insert (format "read r%d, " rrr
))
1118 (ccl-dump-jump nil cc
))
1120 (defun ccl-dump-branch (rrr len
)
1121 (let ((jump-table-head ccl-current-ic
)
1123 (insert (format "jump to array[r%d] of length %d\n\t" rrr len
))
1125 (insert (format "%d " (+ jump-table-head
(ccl-get-next-code))))
1129 (defun ccl-dump-read-register (rrr cc
)
1130 (insert (format "read r%d (%d remaining)\n" rrr cc
)))
1132 (defun ccl-dump-read-branch (rrr len
)
1133 (insert (format "read r%d, " rrr
))
1134 (ccl-dump-branch rrr len
))
1136 (defun ccl-dump-write-register (rrr cc
)
1137 (insert (format "write r%d (%d remaining)\n" rrr cc
)))
1139 (defun ccl-dump-call (ignore cc
)
1140 (insert (format "call subroutine #%d\n" cc
)))
1142 (defun ccl-dump-write-const-string (rrr cc
)
1145 (insert "write char")
1146 (ccl-dump-insert-char cc
)
1152 (let ((code (ccl-get-next-code)))
1153 (insert (format "%c" (lsh code -
16)))
1155 (insert (format "%c" (logand (lsh code -
8) 255))))
1157 (insert (format "%c" (logand code
255))))
1161 (defun ccl-dump-write-array (rrr cc
)
1163 (insert (format "write array[r%d] of length %d\n\t" rrr cc
))
1165 (ccl-dump-insert-char (ccl-get-next-code))
1169 (defun ccl-dump-end (&rest ignore
)
1172 (defun ccl-dump-set-assign-expr-const (rrr cc
)
1173 (insert (format "r%d %s= %d\n"
1175 (ccl-extract-arith-op cc
)
1176 (ccl-get-next-code))))
1178 (defun ccl-dump-set-assign-expr-register (rrr cc
)
1179 (insert (format "r%d %s= r%d\n"
1181 (ccl-extract-arith-op cc
)
1184 (defun ccl-dump-set-expr-const (rrr cc
)
1185 (insert (format "r%d = r%d %s %d\n"
1188 (ccl-extract-arith-op cc
)
1189 (ccl-get-next-code))))
1191 (defun ccl-dump-set-expr-register (rrr cc
)
1192 (insert (format "r%d = r%d %s r%d\n"
1195 (ccl-extract-arith-op cc
)
1196 (logand (ash cc -
3) 7))))
1198 (defun ccl-dump-jump-cond-expr-const (rrr cc
)
1199 (let ((address ccl-current-ic
))
1200 (insert (format "if !(r%d %s %d), "
1202 (aref ccl-arith-table
(ccl-get-next-code))
1203 (ccl-get-next-code)))
1204 (ccl-dump-jump nil cc address
)))
1206 (defun ccl-dump-jump-cond-expr-register (rrr cc
)
1207 (let ((address ccl-current-ic
))
1208 (insert (format "if !(r%d %s r%d), "
1210 (aref ccl-arith-table
(ccl-get-next-code))
1211 (ccl-get-next-code)))
1212 (ccl-dump-jump nil cc address
)))
1214 (defun ccl-dump-read-jump-cond-expr-const (rrr cc
)
1215 (insert (format "read r%d, " rrr
))
1216 (ccl-dump-jump-cond-expr-const rrr cc
))
1218 (defun ccl-dump-read-jump-cond-expr-register (rrr cc
)
1219 (insert (format "read r%d, " rrr
))
1220 (ccl-dump-jump-cond-expr-register rrr cc
))
1222 (defun ccl-dump-binary (ccl-code)
1223 (let ((len (length ccl-code
))
1226 (let ((code (aref ccl-code i
))
1229 (insert (if (= (logand code
(ash 1 j
)) 0) ?
0 ?
1))
1231 (setq code
(logand code
31))
1232 (if (< code
(length ccl-code-table
))
1233 (insert (format ":%s" (aref ccl-code-table code
))))
1237 (defun ccl-dump-ex-cmd (rrr cc
)
1238 (let* ((RRR (logand cc ?\x7
))
1239 (Rrr (logand (ash cc -
3) ?\x7
))
1240 (ex-op (aref ccl-extended-code-table
(logand (ash cc -
6) ?
\x3fff
))))
1241 (insert (format "<%s> " ex-op
))
1242 (funcall (get ex-op
'ccl-dump-function
) rrr RRR Rrr
)))
1244 (defun ccl-dump-read-multibyte-character (rrr RRR Rrr
)
1245 (insert (format "read-multibyte-character r%d r%d\n" RRR rrr
)))
1247 (defun ccl-dump-write-multibyte-character (rrr RRR Rrr
)
1248 (insert (format "write-multibyte-character r%d r%d\n" RRR rrr
)))
1250 (defun ccl-dump-translate-character (rrr RRR Rrr
)
1251 (insert (format "translation table(r%d) r%d r%d\n" Rrr RRR rrr
)))
1253 (defun ccl-dump-translate-character-const-tbl (rrr RRR Rrr
)
1254 (let ((tbl (ccl-get-next-code)))
1255 (insert (format "translation table(%S) r%d r%d\n" tbl RRR rrr
))))
1257 (defun ccl-dump-iterate-multiple-map (rrr RRR Rrr
)
1258 (let ((notbl (ccl-get-next-code))
1260 (insert (format "iterate-multiple-map r%d r%d\n" RRR rrr
))
1261 (insert (format "\tnumber of maps is %d .\n\t [" notbl
))
1263 (setq id
(ccl-get-next-code))
1264 (insert (format "%S" id
))
1268 (defun ccl-dump-map-multiple (rrr RRR Rrr
)
1269 (let ((notbl (ccl-get-next-code))
1271 (insert (format "map-multiple r%d r%d\n" RRR rrr
))
1272 (insert (format "\tnumber of maps and separators is %d\n\t [" notbl
))
1274 (setq id
(ccl-get-next-code))
1277 (insert (format "%S " id
)))
1281 (defun ccl-dump-map-single (rrr RRR Rrr
)
1282 (let ((id (ccl-get-next-code)))
1283 (insert (format "map-single r%d r%d map(%S)\n" RRR rrr id
))))
1286 ;; CCL emulation staffs
1288 ;; Not yet implemented.
1290 ;; Auto-loaded functions.
1293 (defmacro declare-ccl-program
(name &optional vector
)
1294 "Declare NAME as a name of CCL program.
1296 This macro exists for backward compatibility. In the old version of
1297 Emacs, to compile a CCL program which calls another CCL program not
1298 yet defined, it must be declared as a CCL program in advance. But,
1299 now CCL program names are resolved not at compile time but before
1302 Optional arg VECTOR is a compiled CCL code of the CCL program."
1303 `(put ',name
'ccl-program-idx
(register-ccl-program ',name
,vector
)))
1306 (defmacro define-ccl-program
(name ccl-program
&optional doc
)
1307 "Set NAME the compiled code of CCL-PROGRAM.
1308 CCL-PROGRAM is `eval'ed before being handed to the CCL compiler `ccl-compile'.
1309 The compiled code is a vector of integers."
1310 `(let ((prog ,(ccl-compile (eval ccl-program
))))
1311 (defconst ,name prog
,doc
)
1312 (put ',name
'ccl-program-idx
(register-ccl-program ',name prog
))
1316 (defmacro check-ccl-program
(ccl-program &optional name
)
1317 "Check validity of CCL-PROGRAM.
1318 If CCL-PROGRAM is a symbol denoting a CCL program, return
1319 CCL-PROGRAM, else return nil.
1320 If CCL-PROGRAM is a vector and optional arg NAME (symbol) is supplied,
1321 register CCL-PROGRAM by name NAME, and return NAME."
1322 `(if (ccl-program-p ,ccl-program
)
1323 (if (vectorp ,ccl-program
)
1325 (register-ccl-program ,name
,ccl-program
)
1330 (defun ccl-execute-with-args (ccl-prog &rest args
)
1331 "Execute CCL-PROGRAM with registers initialized by the remaining args.
1332 The return value is a vector of resulting CCL registers."
1333 (let ((reg (make-vector 8 0))
1335 (while (and args
(< i
8))
1336 (if (not (integerp (car args
)))
1337 (error "Arguments should be integer"))
1338 (aset reg i
(car args
))
1339 (setq args
(cdr args
) i
(1+ i
)))
1340 (ccl-execute ccl-prog reg
)