(composition_compute_stop_pos): Limit the search of composition to
[bpt/emacs.git] / src / composite.c
1 /* Composite sequence support.
2 Copyright (C) 2001, 2002, 2003, 2004, 2005,
3 2006, 2007, 2008 Free Software Foundation, Inc.
4 Copyright (C) 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008
5 National Institute of Advanced Industrial Science and Technology (AIST)
6 Registration Number H14PRO021
7 Copyright (C) 2003, 2006
8 National Institute of Advanced Industrial Science and Technology (AIST)
9 Registration Number H13PRO009
10
11 This file is part of GNU Emacs.
12
13 GNU Emacs is free software: you can redistribute it and/or modify
14 it under the terms of the GNU General Public License as published by
15 the Free Software Foundation, either version 3 of the License, or
16 (at your option) any later version.
17
18 GNU Emacs is distributed in the hope that it will be useful,
19 but WITHOUT ANY WARRANTY; without even the implied warranty of
20 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
21 GNU General Public License for more details.
22
23 You should have received a copy of the GNU General Public License
24 along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>. */
25
26 #include <config.h>
27 #include "lisp.h"
28 #include "buffer.h"
29 #include "character.h"
30 #include "intervals.h"
31 #include "window.h"
32 #include "frame.h"
33 #include "dispextern.h"
34 #include "font.h"
35
36 /* Emacs uses special text property `composition' to support character
37 composition. A sequence of characters that have the same (i.e. eq)
38 `composition' property value is treated as a single composite
39 sequence (we call it just `composition' hereafter). Characters in
40 a composition are all composed somehow on the screen.
41
42 The property value has this form when the composition is made:
43 ((LENGTH . COMPONENTS) . MODIFICATION-FUNC)
44 then turns to this form:
45 (COMPOSITION-ID . (LENGTH COMPONENTS-VEC . MODIFICATION-FUNC))
46 when the composition is registered in composition_hash_table and
47 composition_table. These rather peculiar structures were designed
48 to make it easy to distinguish them quickly (we can do that by
49 checking only the first element) and to extract LENGTH (from the
50 former form) and COMPOSITION-ID (from the latter form).
51
52 We register a composition when it is displayed, or when the width
53 is required (for instance, to calculate columns).
54
55 LENGTH -- Length of the composition. This information is used to
56 check the validity of the composition.
57
58 COMPONENTS -- Character, string, vector, list, or nil.
59
60 If it is nil, characters in the text are composed relatively
61 according to their metrics in font glyphs.
62
63 If it is a character or a string, the character or characters
64 in the string are composed relatively.
65
66 If it is a vector or list of integers, the element is a
67 character or an encoded composition rule. The characters are
68 composed according to the rules. (2N)th elements are
69 characters to be composed and (2N+1)th elements are
70 composition rules to tell how to compose (2N+2)th element with
71 the previously composed 2N glyphs.
72
73 COMPONENTS-VEC -- Vector of integers. In relative composition, the
74 elements are characters to be composed. In rule-base
75 composition, the elements are characters or encoded
76 composition rules.
77
78 MODIFICATION-FUNC -- If non nil, it is a function to call when the
79 composition gets invalid after a modification in a buffer. If
80 it is nil, a function in `composition-function-table' of the
81 first character in the sequence is called.
82
83 COMPOSITION-ID --Identification number of the composition. It is
84 used as an index to composition_table for the composition.
85
86 When Emacs has to display a composition or has to know its
87 displaying width, the function get_composition_id is called. It
88 returns COMPOSITION-ID so that the caller can access the
89 information about the composition through composition_table. If a
90 COMPOSITION-ID has not yet been assigned to the composition,
91 get_composition_id checks the validity of `composition' property,
92 and, if valid, assigns a new ID, registers the information in
93 composition_hash_table and composition_table, and changes the form
94 of the property value. If the property is invalid, return -1
95 without changing the property value.
96
97 We use two tables to keep information about composition;
98 composition_hash_table and composition_table.
99
100 The former is a hash table in which keys are COMPONENTS-VECs and
101 values are the corresponding COMPOSITION-IDs. This hash table is
102 weak, but as each key (COMPONENTS-VEC) is also kept as a value of the
103 `composition' property, it won't be collected as garbage until all
104 bits of text that have the same COMPONENTS-VEC are deleted.
105
106 The latter is a table of pointers to `struct composition' indexed
107 by COMPOSITION-ID. This structure keeps the other information (see
108 composite.h).
109
110 In general, a text property holds information about individual
111 characters. But, a `composition' property holds information about
112 a sequence of characters (in this sense, it is like the `intangible'
113 property). That means that we should not share the property value
114 in adjacent compositions -- we can't distinguish them if they have the
115 same property. So, after any changes, we call
116 `update_compositions' and change a property of one of adjacent
117 compositions to a copy of it. This function also runs a proper
118 composition modification function to make a composition that gets
119 invalid by the change valid again.
120
121 As the value of the `composition' property holds information about a
122 specific range of text, the value gets invalid if we change the
123 text in the range. We treat the `composition' property as always
124 rear-nonsticky (currently by setting default-text-properties to
125 (rear-nonsticky (composition))) and we never make properties of
126 adjacent compositions identical. Thus, any such changes make the
127 range just shorter. So, we can check the validity of the `composition'
128 property by comparing LENGTH information with the actual length of
129 the composition.
130
131 */
132
133
134 Lisp_Object Qcomposition;
135
136 /* Table of pointers to the structure `composition' indexed by
137 COMPOSITION-ID. This structure is for storing information about
138 each composition except for COMPONENTS-VEC. */
139 struct composition **composition_table;
140
141 /* The current size of `composition_table'. */
142 static int composition_table_size;
143
144 /* Number of compositions currently made. */
145 int n_compositions;
146
147 /* Hash table for compositions. The key is COMPONENTS-VEC of
148 `composition' property. The value is the corresponding
149 COMPOSITION-ID. */
150 Lisp_Object composition_hash_table;
151
152 /* Function to call to adjust composition. */
153 Lisp_Object Vcompose_chars_after_function;
154
155 Lisp_Object Qauto_composed;
156 Lisp_Object Vauto_composition_function;
157 Lisp_Object Qauto_composition_function;
158 Lisp_Object Vcomposition_function_table;
159
160 EXFUN (Fremove_list_of_text_properties, 4);
161
162 /* Temporary variable used in macros COMPOSITION_XXX. */
163 Lisp_Object composition_temp;
164
165 \f
166 /* Return COMPOSITION-ID of a composition at buffer position
167 CHARPOS/BYTEPOS and length NCHARS. The `composition' property of
168 the sequence is PROP. STRING, if non-nil, is a string that
169 contains the composition instead of the current buffer.
170
171 If the composition is invalid, return -1. */
172
173 int
174 get_composition_id (charpos, bytepos, nchars, prop, string)
175 int charpos, bytepos, nchars;
176 Lisp_Object prop, string;
177 {
178 Lisp_Object id, length, components, key, *key_contents;
179 int glyph_len;
180 struct Lisp_Hash_Table *hash_table = XHASH_TABLE (composition_hash_table);
181 int hash_index;
182 unsigned hash_code;
183 struct composition *cmp;
184 int i, ch;
185
186 /* PROP should be
187 Form-A: ((LENGTH . COMPONENTS) . MODIFICATION-FUNC)
188 or
189 Form-B: (COMPOSITION-ID . (LENGTH COMPONENTS-VEC . MODIFICATION-FUNC))
190 */
191 if (nchars == 0 || !CONSP (prop))
192 goto invalid_composition;
193
194 id = XCAR (prop);
195 if (INTEGERP (id))
196 {
197 /* PROP should be Form-B. */
198 if (XINT (id) < 0 || XINT (id) >= n_compositions)
199 goto invalid_composition;
200 return XINT (id);
201 }
202
203 /* PROP should be Form-A.
204 Thus, ID should be (LENGTH . COMPONENTS). */
205 if (!CONSP (id))
206 goto invalid_composition;
207 length = XCAR (id);
208 if (!INTEGERP (length) || XINT (length) != nchars)
209 goto invalid_composition;
210
211 components = XCDR (id);
212
213 /* Check if the same composition has already been registered or not
214 by consulting composition_hash_table. The key for this table is
215 COMPONENTS (converted to a vector COMPONENTS-VEC) or, if it is
216 nil, vector of characters in the composition range. */
217 if (INTEGERP (components))
218 key = Fmake_vector (make_number (1), components);
219 else if (STRINGP (components) || CONSP (components))
220 key = Fvconcat (1, &components);
221 else if (VECTORP (components))
222 key = components;
223 else if (NILP (components))
224 {
225 key = Fmake_vector (make_number (nchars), Qnil);
226 if (STRINGP (string))
227 for (i = 0; i < nchars; i++)
228 {
229 FETCH_STRING_CHAR_ADVANCE (ch, string, charpos, bytepos);
230 XVECTOR (key)->contents[i] = make_number (ch);
231 }
232 else
233 for (i = 0; i < nchars; i++)
234 {
235 FETCH_CHAR_ADVANCE (ch, charpos, bytepos);
236 XVECTOR (key)->contents[i] = make_number (ch);
237 }
238 }
239 else
240 goto invalid_composition;
241
242 hash_index = hash_lookup (hash_table, key, &hash_code);
243 if (hash_index >= 0)
244 {
245 /* We have already registered the same composition. Change PROP
246 from Form-A above to Form-B while replacing COMPONENTS with
247 COMPONENTS-VEC stored in the hash table. We can directly
248 modify the cons cell of PROP because it is not shared. */
249 key = HASH_KEY (hash_table, hash_index);
250 id = HASH_VALUE (hash_table, hash_index);
251 XSETCAR (prop, id);
252 XSETCDR (prop, Fcons (make_number (nchars), Fcons (key, XCDR (prop))));
253 return XINT (id);
254 }
255
256 /* This composition is a new one. We must register it. */
257
258 /* Check if we have sufficient memory to store this information. */
259 if (composition_table_size == 0)
260 {
261 composition_table_size = 256;
262 composition_table
263 = (struct composition **) xmalloc (sizeof (composition_table[0])
264 * composition_table_size);
265 }
266 else if (composition_table_size <= n_compositions)
267 {
268 composition_table_size += 256;
269 composition_table
270 = (struct composition **) xrealloc (composition_table,
271 sizeof (composition_table[0])
272 * composition_table_size);
273 }
274
275 key_contents = XVECTOR (key)->contents;
276
277 /* Check if the contents of COMPONENTS are valid if COMPONENTS is a
278 vector or a list. It should be a sequence of:
279 char1 rule1 char2 rule2 char3 ... ruleN charN+1 */
280
281 if (VECTORP (components)
282 && ASIZE (components) >= 2
283 && VECTORP (AREF (components, 0)))
284 {
285 /* COMPONENTS is a glyph-string. */
286 int len = ASIZE (key);
287
288 for (i = 1; i < len; i++)
289 if (! VECTORP (AREF (key, i)))
290 goto invalid_composition;
291 }
292 else if (VECTORP (components) || CONSP (components))
293 {
294 int len = XVECTOR (key)->size;
295
296 /* The number of elements should be odd. */
297 if ((len % 2) == 0)
298 goto invalid_composition;
299 /* All elements should be integers (character or encoded
300 composition rule). */
301 for (i = 0; i < len; i++)
302 {
303 if (!INTEGERP (key_contents[i]))
304 goto invalid_composition;
305 }
306 }
307
308 /* Change PROP from Form-A above to Form-B. We can directly modify
309 the cons cell of PROP because it is not shared. */
310 XSETFASTINT (id, n_compositions);
311 XSETCAR (prop, id);
312 XSETCDR (prop, Fcons (make_number (nchars), Fcons (key, XCDR (prop))));
313
314 /* Register the composition in composition_hash_table. */
315 hash_index = hash_put (hash_table, key, id, hash_code);
316
317 /* Register the composition in composition_table. */
318 cmp = (struct composition *) xmalloc (sizeof (struct composition));
319
320 cmp->method = (NILP (components)
321 ? COMPOSITION_RELATIVE
322 : ((INTEGERP (components) || STRINGP (components))
323 ? COMPOSITION_WITH_ALTCHARS
324 : COMPOSITION_WITH_RULE_ALTCHARS));
325 cmp->hash_index = hash_index;
326 glyph_len = (cmp->method == COMPOSITION_WITH_RULE_ALTCHARS
327 ? (XVECTOR (key)->size + 1) / 2
328 : XVECTOR (key)->size);
329 cmp->glyph_len = glyph_len;
330 cmp->offsets = (short *) xmalloc (sizeof (short) * glyph_len * 2);
331 cmp->font = NULL;
332
333 if (cmp->method != COMPOSITION_WITH_RULE_ALTCHARS)
334 {
335 /* Relative composition. */
336 cmp->width = 0;
337 for (i = 0; i < glyph_len; i++)
338 {
339 int this_width;
340 ch = XINT (key_contents[i]);
341 this_width = (ch == '\t' ? 1 : CHAR_WIDTH (ch));
342 if (cmp->width < this_width)
343 cmp->width = this_width;
344 }
345 }
346 else
347 {
348 /* Rule-base composition. */
349 float leftmost = 0.0, rightmost;
350
351 ch = XINT (key_contents[0]);
352 rightmost = ch != '\t' ? CHAR_WIDTH (ch) : 1;
353
354 for (i = 1; i < glyph_len; i += 2)
355 {
356 int rule, gref, nref, xoff, yoff;
357 int this_width;
358 float this_left;
359
360 rule = XINT (key_contents[i]);
361 ch = XINT (key_contents[i + 1]);
362 this_width = ch != '\t' ? CHAR_WIDTH (ch) : 1;
363
364 /* A composition rule is specified by an integer value
365 that encodes global and new reference points (GREF and
366 NREF). GREF and NREF are specified by numbers as
367 below:
368 0---1---2 -- ascent
369 | |
370 | |
371 | |
372 9--10--11 -- center
373 | |
374 ---3---4---5--- baseline
375 | |
376 6---7---8 -- descent
377 */
378 COMPOSITION_DECODE_RULE (rule, gref, nref, xoff, yoff);
379 this_left = (leftmost
380 + (gref % 3) * (rightmost - leftmost) / 2.0
381 - (nref % 3) * this_width / 2.0);
382
383 if (this_left < leftmost)
384 leftmost = this_left;
385 if (this_left + this_width > rightmost)
386 rightmost = this_left + this_width;
387 }
388
389 cmp->width = rightmost - leftmost;
390 if (cmp->width < (rightmost - leftmost))
391 /* To get a ceiling integer value. */
392 cmp->width++;
393 }
394
395 composition_table[n_compositions] = cmp;
396
397 return n_compositions++;
398
399 invalid_composition:
400 /* Would it be better to remove this `composition' property? */
401 return -1;
402 }
403
404 \f
405 /* Find a static composition at or nearest to position POS of OBJECT
406 (buffer or string).
407
408 OBJECT defaults to the current buffer. If there's a composition at
409 POS, set *START and *END to the start and end of the sequence,
410 *PROP to the `composition' property, and return 1.
411
412 If there's no composition at POS and LIMIT is negative, return 0.
413
414 Otherwise, search for a composition forward (LIMIT > POS) or
415 backward (LIMIT < POS). In this case, LIMIT bounds the search.
416
417 If a composition is found, set *START, *END, and *PROP as above,
418 and return 1, else return 0.
419
420 This doesn't check the validity of composition. */
421
422 int
423 find_composition (pos, limit, start, end, prop, object)
424 int pos, limit;
425 EMACS_INT *start, *end;
426 Lisp_Object *prop, object;
427 {
428 Lisp_Object val;
429
430 if (get_property_and_range (pos, Qcomposition, prop, start, end, object))
431 return 1;
432
433 if (limit < 0 || limit == pos)
434 return 0;
435
436 if (limit > pos) /* search forward */
437 {
438 val = Fnext_single_property_change (make_number (pos), Qcomposition,
439 object, make_number (limit));
440 pos = XINT (val);
441 if (pos == limit)
442 return 0;
443 }
444 else /* search backward */
445 {
446 if (get_property_and_range (pos - 1, Qcomposition, prop, start, end,
447 object))
448 return 1;
449 val = Fprevious_single_property_change (make_number (pos), Qcomposition,
450 object, make_number (limit));
451 pos = XINT (val);
452 if (pos == limit)
453 return 0;
454 pos--;
455 }
456 get_property_and_range (pos, Qcomposition, prop, start, end, object);
457 return 1;
458 }
459
460 /* Run a proper function to adjust the composition sitting between
461 FROM and TO with property PROP. */
462
463 static void
464 run_composition_function (from, to, prop)
465 int from, to;
466 Lisp_Object prop;
467 {
468 Lisp_Object func;
469 EMACS_INT start, end;
470
471 func = COMPOSITION_MODIFICATION_FUNC (prop);
472 /* If an invalid composition precedes or follows, try to make them
473 valid too. */
474 if (from > BEGV
475 && find_composition (from - 1, -1, &start, &end, &prop, Qnil)
476 && !COMPOSITION_VALID_P (start, end, prop))
477 from = start;
478 if (to < ZV
479 && find_composition (to, -1, &start, &end, &prop, Qnil)
480 && !COMPOSITION_VALID_P (start, end, prop))
481 to = end;
482 if (!NILP (Ffboundp (func)))
483 call2 (func, make_number (from), make_number (to));
484 }
485
486 /* Make invalid compositions adjacent to or inside FROM and TO valid.
487 CHECK_MASK is bitwise `or' of mask bits defined by macros
488 CHECK_XXX (see the comment in composite.h).
489
490 It also resets the text-property `auto-composed' to a proper region
491 so that automatic character composition works correctly later while
492 displaying the region.
493
494 This function is called when a buffer text is changed. If the
495 change is deletion, FROM == TO. Otherwise, FROM < TO. */
496
497 void
498 update_compositions (from, to, check_mask)
499 EMACS_INT from, to;
500 int check_mask;
501 {
502 Lisp_Object prop;
503 EMACS_INT start, end;
504 /* The beginning and end of the region to set the property
505 `auto-composed' to nil. */
506 EMACS_INT min_pos = from, max_pos = to;
507
508 if (inhibit_modification_hooks)
509 return;
510
511 /* If FROM and TO are not in a valid range, do nothing. */
512 if (! (BEGV <= from && from <= to && to <= ZV))
513 return;
514
515 if (check_mask & CHECK_HEAD)
516 {
517 /* FROM should be at composition boundary. But, insertion or
518 deletion will make two compositions adjacent and
519 indistinguishable when they have same (eq) property. To
520 avoid it, in such a case, we change the property of the
521 latter to the copy of it. */
522 if (from > BEGV
523 && find_composition (from - 1, -1, &start, &end, &prop, Qnil)
524 && COMPOSITION_VALID_P (start, end, prop))
525 {
526 min_pos = start;
527 if (end > to)
528 max_pos = end;
529 if (from < end)
530 Fput_text_property (make_number (from), make_number (end),
531 Qcomposition,
532 Fcons (XCAR (prop), XCDR (prop)), Qnil);
533 run_composition_function (start, end, prop);
534 from = end;
535 }
536 else if (from < ZV
537 && find_composition (from, -1, &start, &from, &prop, Qnil)
538 && COMPOSITION_VALID_P (start, from, prop))
539 {
540 if (from > to)
541 max_pos = from;
542 run_composition_function (start, from, prop);
543 }
544 }
545
546 if (check_mask & CHECK_INSIDE)
547 {
548 /* In this case, we are sure that (check & CHECK_TAIL) is also
549 nonzero. Thus, here we should check only compositions before
550 (to - 1). */
551 while (from < to - 1
552 && find_composition (from, to, &start, &from, &prop, Qnil)
553 && COMPOSITION_VALID_P (start, from, prop)
554 && from < to - 1)
555 run_composition_function (start, from, prop);
556 }
557
558 if (check_mask & CHECK_TAIL)
559 {
560 if (from < to
561 && find_composition (to - 1, -1, &start, &end, &prop, Qnil)
562 && COMPOSITION_VALID_P (start, end, prop))
563 {
564 /* TO should be also at composition boundary. But,
565 insertion or deletion will make two compositions adjacent
566 and indistinguishable when they have same (eq) property.
567 To avoid it, in such a case, we change the property of
568 the former to the copy of it. */
569 if (to < end)
570 {
571 Fput_text_property (make_number (start), make_number (to),
572 Qcomposition,
573 Fcons (XCAR (prop), XCDR (prop)), Qnil);
574 max_pos = end;
575 }
576 run_composition_function (start, end, prop);
577 }
578 else if (to < ZV
579 && find_composition (to, -1, &start, &end, &prop, Qnil)
580 && COMPOSITION_VALID_P (start, end, prop))
581 {
582 run_composition_function (start, end, prop);
583 max_pos = end;
584 }
585 }
586 if (min_pos < max_pos)
587 {
588 int count = SPECPDL_INDEX ();
589
590 specbind (Qinhibit_read_only, Qt);
591 specbind (Qinhibit_modification_hooks, Qt);
592 specbind (Qinhibit_point_motion_hooks, Qt);
593 Fremove_list_of_text_properties (make_number (min_pos),
594 make_number (max_pos),
595 Fcons (Qauto_composed, Qnil), Qnil);
596 unbind_to (count, Qnil);
597 }
598 }
599
600
601 /* Modify composition property values in LIST destructively. LIST is
602 a list as returned from text_property_list. Change values to the
603 top-level copies of them so that none of them are `eq'. */
604
605 void
606 make_composition_value_copy (list)
607 Lisp_Object list;
608 {
609 Lisp_Object plist, val;
610
611 for (; CONSP (list); list = XCDR (list))
612 {
613 plist = XCAR (XCDR (XCDR (XCAR (list))));
614 while (CONSP (plist) && CONSP (XCDR (plist)))
615 {
616 if (EQ (XCAR (plist), Qcomposition)
617 && (val = XCAR (XCDR (plist)), CONSP (val)))
618 XSETCAR (XCDR (plist), Fcons (XCAR (val), XCDR (val)));
619 plist = XCDR (XCDR (plist));
620 }
621 }
622 }
623
624
625 /* Make text in the region between START and END a composition that
626 has COMPONENTS and MODIFICATION-FUNC.
627
628 If STRING is non-nil, then operate on characters contained between
629 indices START and END in STRING. */
630
631 void
632 compose_text (start, end, components, modification_func, string)
633 int start, end;
634 Lisp_Object components, modification_func, string;
635 {
636 Lisp_Object prop;
637
638 prop = Fcons (Fcons (make_number (end - start), components),
639 modification_func);
640 Fput_text_property (make_number (start), make_number (end),
641 Qcomposition, prop, string);
642 }
643
644
645 static Lisp_Object autocmp_chars P_ ((Lisp_Object, EMACS_INT, EMACS_INT,
646 EMACS_INT, struct window *,
647 struct face *, Lisp_Object));
648
649 \f
650 /* Lisp glyph-string handlers */
651
652 /* Hash table for automatic composition. The key is a header of a
653 lgstring (Lispy glyph-string), and the value is a body of a
654 lgstring. */
655
656 static Lisp_Object gstring_hash_table;
657
658 static Lisp_Object gstring_lookup_cache P_ ((Lisp_Object));
659
660 static Lisp_Object
661 gstring_lookup_cache (header)
662 Lisp_Object header;
663 {
664 struct Lisp_Hash_Table *h = XHASH_TABLE (gstring_hash_table);
665 int i = hash_lookup (h, header, NULL);
666
667 return (i >= 0 ? HASH_VALUE (h, i) : Qnil);
668 }
669
670 Lisp_Object
671 composition_gstring_put_cache (gstring, len)
672 Lisp_Object gstring;
673 int len;
674 {
675 struct Lisp_Hash_Table *h = XHASH_TABLE (gstring_hash_table);
676 unsigned hash;
677 Lisp_Object header, copy;
678 int i;
679
680 header = LGSTRING_HEADER (gstring);
681 hash = h->hashfn (h, header);
682 if (len < 0)
683 {
684 len = LGSTRING_GLYPH_LEN (gstring);
685 for (i = 0; i < len; i++)
686 if (NILP (LGSTRING_GLYPH (gstring, i)))
687 break;
688 len = i;
689 }
690
691 copy = Fmake_vector (make_number (len + 2), Qnil);
692 LGSTRING_SET_HEADER (copy, Fcopy_sequence (header));
693 for (i = 0; i < len; i++)
694 LGSTRING_SET_GLYPH (copy, i, Fcopy_sequence (LGSTRING_GLYPH (gstring, i)));
695 i = hash_put (h, LGSTRING_HEADER (copy), copy, hash);
696 LGSTRING_SET_ID (copy, make_number (i));
697 return copy;
698 }
699
700 Lisp_Object
701 composition_gstring_from_id (id)
702 int id;
703 {
704 struct Lisp_Hash_Table *h = XHASH_TABLE (gstring_hash_table);
705
706 return HASH_VALUE (h, id);
707 }
708
709 static Lisp_Object fill_gstring_header P_ ((Lisp_Object, Lisp_Object,
710 Lisp_Object, Lisp_Object,
711 Lisp_Object));
712
713 int
714 composition_gstring_p (gstring)
715 Lisp_Object gstring;
716 {
717 Lisp_Object header;
718 int i;
719
720 if (! VECTORP (gstring) || ASIZE (gstring) < 2)
721 return 0;
722 header = LGSTRING_HEADER (gstring);
723 if (! VECTORP (header) || ASIZE (header) < 2)
724 return 0;
725 if (! NILP (LGSTRING_FONT (gstring))
726 && ! FONT_OBJECT_P (LGSTRING_FONT (gstring)))
727 return 0;
728 for (i = 1; i < ASIZE (LGSTRING_HEADER (gstring)); i++)
729 if (! NATNUMP (AREF (LGSTRING_HEADER (gstring), i)))
730 return 0;
731 if (! NILP (LGSTRING_ID (gstring)) && ! NATNUMP (LGSTRING_ID (gstring)))
732 return 0;
733 for (i = 0; i < LGSTRING_GLYPH_LEN (gstring); i++)
734 {
735 Lisp_Object glyph = LGSTRING_GLYPH (gstring, i);
736 if (NILP (glyph))
737 break;
738 if (! VECTORP (glyph) || ASIZE (glyph) != LGLYPH_SIZE)
739 return 0;
740 }
741 return 1;
742 }
743
744 int
745 composition_gstring_width (gstring, from, to, metrics)
746 Lisp_Object gstring;
747 int from, to;
748 struct font_metrics *metrics;
749 {
750 Lisp_Object *glyph;
751 int width = 0;
752
753 if (metrics)
754 {
755 Lisp_Object font_object = LGSTRING_FONT (gstring);
756 struct font *font = XFONT_OBJECT (font_object);
757
758 metrics->ascent = font->ascent;
759 metrics->descent = font->descent;
760 metrics->width = metrics->lbearing = metrics->rbearing = 0;
761 }
762 for (glyph = &LGSTRING_GLYPH (gstring, from); from < to; from++, glyph++)
763 {
764 int x;
765
766 if (NILP (LGLYPH_ADJUSTMENT (*glyph)))
767 width += LGLYPH_WIDTH (*glyph);
768 else
769 width += LGLYPH_WADJUST (*glyph);
770 if (metrics)
771 {
772 x = metrics->width + LGLYPH_LBEARING (*glyph) + LGLYPH_XOFF (*glyph);
773 if (metrics->lbearing > x)
774 metrics->lbearing = x;
775 x = metrics->width + LGLYPH_RBEARING (*glyph) + LGLYPH_XOFF (*glyph);
776 if (metrics->rbearing < x)
777 metrics->rbearing = x;
778 metrics->width = width;
779 x = LGLYPH_ASCENT (*glyph) - LGLYPH_YOFF (*glyph);
780 if (metrics->ascent < x)
781 metrics->ascent = x;
782 x = LGLYPH_DESCENT (*glyph) - LGLYPH_YOFF (*glyph);
783 if (metrics->descent < x)
784 metrics->descent = x;
785 }
786 }
787 return width;
788 }
789
790
791 static Lisp_Object gstring_work;
792 static Lisp_Object gstring_work_headers;
793
794 static Lisp_Object
795 fill_gstring_header (header, start, end, font_object, string)
796 Lisp_Object header, start, end, font_object, string;
797 {
798 EMACS_INT from, to, from_byte;
799 EMACS_INT len, i;
800
801 if (NILP (string))
802 {
803 if (NILP (current_buffer->enable_multibyte_characters))
804 error ("Attempt to shape unibyte text");
805 validate_region (&start, &end);
806 from = XFASTINT (start);
807 to = XFASTINT (end);
808 from_byte = CHAR_TO_BYTE (from);
809 }
810 else
811 {
812 CHECK_STRING (string);
813 if (! STRING_MULTIBYTE (current_buffer->enable_multibyte_characters))
814 error ("Attempt to shape unibyte text");
815 CHECK_NATNUM (start);
816 from = XINT (start);
817 CHECK_NATNUM (end);
818 to = XINT (end);
819 if (from < 0 || from > to || to > SCHARS (string))
820 args_out_of_range_3 (string, start, end);
821 from_byte = string_char_to_byte (string, from);
822 }
823
824 len = to - from;
825 if (len == 0)
826 error ("Attempt to shape zero-length text");
827 if (VECTORP (header))
828 {
829 if (ASIZE (header) != len + 1)
830 args_out_of_range (header, make_number (len + 1));
831 }
832 else
833 {
834 if (len <= 8)
835 header = AREF (gstring_work_headers, len - 1);
836 else
837 header = Fmake_vector (make_number (len + 1), Qnil);
838 }
839
840 ASET (header, 0, font_object);
841 for (i = 0; i < len; i++)
842 {
843 int c;
844
845 if (NILP (string))
846 FETCH_CHAR_ADVANCE_NO_CHECK (c, from, from_byte);
847 else
848 FETCH_STRING_CHAR_ADVANCE_NO_CHECK (c, string, from, from_byte);
849 ASET (header, i + 1, make_number (c));
850 }
851 return header;
852 }
853
854 extern void font_fill_lglyph_metrics P_ ((Lisp_Object, Lisp_Object));
855
856 static void
857 fill_gstring_body (gstring)
858 Lisp_Object gstring;
859 {
860 Lisp_Object font_object = LGSTRING_FONT (gstring);
861 Lisp_Object header = AREF (gstring, 0);
862 EMACS_INT len = LGSTRING_CHAR_LEN (gstring);
863 EMACS_INT i;
864
865 for (i = 0; i < len; i++)
866 {
867 Lisp_Object g = LGSTRING_GLYPH (gstring, i);
868 EMACS_INT c = XINT (AREF (header, i + 1));
869
870 if (NILP (g))
871 {
872 g = LGLYPH_NEW ();
873 LGSTRING_SET_GLYPH (gstring, i, g);
874 }
875 LGLYPH_SET_FROM (g, i);
876 LGLYPH_SET_TO (g, i);
877 LGLYPH_SET_CHAR (g, c);
878 if (! NILP (font_object))
879 {
880 font_fill_lglyph_metrics (g, font_object);
881 }
882 else
883 {
884 int width = XFASTINT (CHAR_TABLE_REF (Vchar_width_table, c));
885
886 LGLYPH_SET_CODE (g, c);
887 LGLYPH_SET_LBEARING (g, 0);
888 LGLYPH_SET_RBEARING (g, width);
889 LGLYPH_SET_WIDTH (g, width);
890 LGLYPH_SET_ASCENT (g, 1);
891 LGLYPH_SET_DESCENT (g, 0);
892 }
893 LGLYPH_SET_ADJUSTMENT (g, Qnil);
894 }
895 if (i < LGSTRING_GLYPH_LEN (gstring))
896 LGSTRING_SET_GLYPH (gstring, i, Qnil);
897 }
898
899 EXFUN (Fre_search_forward, 4);
900
901 /* Try to compose the characters at CHARPOS according to CFT_ELEMENT
902 which is an element of composition-fucntion-table (which see).
903 LIMIT limits the characters to compose. STRING, if not nil, is a
904 target string. WIN is a window where the characters are being
905 displayed. */
906
907 static Lisp_Object
908 autocmp_chars (cft_element, charpos, bytepos, limit, win, face, string)
909 Lisp_Object cft_element;
910 EMACS_INT charpos, bytepos, limit;
911 struct window *win;
912 struct face *face;
913 Lisp_Object string;
914 {
915 int count = SPECPDL_INDEX ();
916 FRAME_PTR f = XFRAME (win->frame);
917 Lisp_Object pos = make_number (charpos);
918 EMACS_INT pt = PT, pt_byte = PT_BYTE;
919 int lookback;
920
921 record_unwind_save_match_data ();
922 for (lookback = -1; CONSP (cft_element); cft_element = XCDR (cft_element))
923 {
924 Lisp_Object elt = XCAR (cft_element);
925 Lisp_Object re;
926 Lisp_Object font_object = Qnil, gstring;
927 EMACS_INT to;
928
929 if (! VECTORP (elt) || ASIZE (elt) != 3)
930 continue;
931 if (lookback < 0)
932 lookback = XFASTINT (AREF (elt, 1));
933 else if (lookback != XFASTINT (AREF (elt, 1)))
934 break;
935 re = AREF (elt, 0);
936 if (NILP (string))
937 TEMP_SET_PT_BOTH (charpos, bytepos);
938 if (NILP (re)
939 || (STRINGP (re)
940 && (STRINGP (string)
941 ? EQ (Fstring_match (re, string, pos), pos)
942 : (! NILP (Fre_search_forward (re, make_number (limit), Qt, Qnil))
943 && EQ (Fmatch_beginning (make_number (0)), pos)))))
944 {
945 to = (NILP (re) ? charpos + 1 : XINT (Fmatch_end (make_number (0))));
946 #ifdef HAVE_WINDOW_SYSTEM
947 if (FRAME_WINDOW_P (f))
948 {
949 font_object = font_range (charpos, &to, win, face, string);
950 if (! FONT_OBJECT_P (font_object))
951 {
952 if (NILP (string))
953 TEMP_SET_PT_BOTH (pt, pt_byte);
954 return unbind_to (count, Qnil);
955 }
956 }
957 #endif /* not HAVE_WINDOW_SYSTEM */
958 gstring = Fcomposition_get_gstring (pos, make_number (to),
959 font_object, string);
960 if (NILP (LGSTRING_ID (gstring)))
961 {
962 Lisp_Object args[6];
963
964 args[0] = Vauto_composition_function;
965 args[1] = AREF (elt, 2);
966 args[2] = pos;
967 args[3] = make_number (to);
968 args[4] = font_object;
969 args[5] = string;
970 gstring = safe_call (6, args);
971 }
972 if (NILP (string))
973 TEMP_SET_PT_BOTH (pt, pt_byte);
974 return unbind_to (count, gstring);
975 }
976 }
977 if (NILP (string))
978 TEMP_SET_PT_BOTH (pt, pt_byte);
979 return unbind_to (count, Qnil);
980 }
981
982
983 /* Update cmp_it->stop_pos to the next position after CHARPOS (and
984 BYTEPOS) where character composition may happen. If BYTEPOS is
985 negative, compoute it. If it is a static composition, set
986 cmp_it->ch to -1. Otherwise, set cmp_it->ch to the character that
987 triggers a automatic composition. */
988
989 void
990 composition_compute_stop_pos (cmp_it, charpos, bytepos, endpos, string)
991 struct composition_it *cmp_it;
992 EMACS_INT charpos, bytepos, endpos;
993 Lisp_Object string;
994 {
995 EMACS_INT start, end, c;
996 Lisp_Object prop, val;
997 /* This is from forward_to_next_line_start in xdisp.c. */
998 const int MAX_NEWLINE_DISTANCE = 500;
999
1000 if (endpos > charpos + MAX_NEWLINE_DISTANCE)
1001 endpos = charpos + MAX_NEWLINE_DISTANCE;
1002 cmp_it->stop_pos = endpos;
1003 if (find_composition (charpos, endpos, &start, &end, &prop, string)
1004 && COMPOSITION_VALID_P (start, end, prop))
1005 {
1006 cmp_it->stop_pos = endpos = start;
1007 cmp_it->ch = -1;
1008 }
1009 if (NILP (current_buffer->enable_multibyte_characters)
1010 || ! FUNCTIONP (Vauto_composition_function))
1011 return;
1012 if (bytepos < 0)
1013 {
1014 if (STRINGP (string))
1015 bytepos = string_char_to_byte (string, charpos);
1016 else
1017 bytepos = CHAR_TO_BYTE (charpos);
1018 }
1019
1020 start = charpos;
1021 while (charpos < endpos)
1022 {
1023 if (STRINGP (string))
1024 FETCH_STRING_CHAR_ADVANCE (c, string, charpos, bytepos);
1025 else
1026 FETCH_CHAR_ADVANCE (c, charpos, bytepos);
1027 if (c == '\n')
1028 break;
1029 val = CHAR_TABLE_REF (Vcomposition_function_table, c);
1030 if (! NILP (val))
1031 {
1032 Lisp_Object elt;
1033
1034 for (; CONSP (val); val = XCDR (val))
1035 {
1036 elt = XCAR (val);
1037 if (VECTORP (elt) && ASIZE (elt) == 3 && NATNUMP (AREF (elt, 1))
1038 && charpos - 1 - XFASTINT (AREF (elt, 1)) >= start)
1039 break;
1040 }
1041 if (CONSP (val))
1042 {
1043 cmp_it->lookback = XFASTINT (AREF (elt, 1));
1044 cmp_it->stop_pos = charpos - 1 - cmp_it->lookback;
1045 cmp_it->ch = c;
1046 break;
1047 }
1048 }
1049 }
1050 if (charpos == endpos)
1051 {
1052 cmp_it->stop_pos = endpos;
1053 cmp_it->ch = -2;
1054 }
1055 }
1056
1057 /* Check if the character at CHARPOS (and BYTEPOS) is composed
1058 (possibly with the following charaters) on window W. ENDPOS limits
1059 characters to be composed. FACE, in non-NULL, is a base face of
1060 the character. If STRING is not nil, it is a string containing the
1061 character to check, and CHARPOS and BYTEPOS are indices in the
1062 string. In that case, FACE must not be NULL.
1063
1064 If the character is composed, setup members of CMP_IT (id, nglyphs,
1065 and from), and return 1. Otherwise, update CMP_IT->stop_pos, and
1066 return 0. */
1067
1068 int
1069 composition_reseat_it (cmp_it, charpos, bytepos, endpos, w, face, string)
1070 struct composition_it *cmp_it;
1071 EMACS_INT charpos, bytepos, endpos;
1072 struct window *w;
1073 struct face *face;
1074 Lisp_Object string;
1075 {
1076 if (cmp_it->ch == -2)
1077 {
1078 composition_compute_stop_pos (cmp_it, charpos, bytepos, endpos, string);
1079 if (cmp_it->ch == -2)
1080 return 0;
1081 }
1082
1083 if (cmp_it->ch < 0)
1084 {
1085 /* We are looking at a static composition. */
1086 EMACS_INT start, end;
1087 Lisp_Object prop;
1088
1089 find_composition (charpos, -1, &start, &end, &prop, string);
1090 cmp_it->id = get_composition_id (charpos, bytepos, end - start,
1091 prop, string);
1092 if (cmp_it->id < 0)
1093 goto no_composition;
1094 cmp_it->nchars = end - start;
1095 cmp_it->nglyphs = composition_table[cmp_it->id]->glyph_len;
1096 }
1097 else
1098 {
1099 Lisp_Object val, elt;
1100 int i;
1101
1102 val = CHAR_TABLE_REF (Vcomposition_function_table, cmp_it->ch);
1103 for (; CONSP (val); val = XCDR (val))
1104 {
1105 elt = XCAR (val);
1106 if (cmp_it->lookback == XFASTINT (AREF (elt, 1)))
1107 break;
1108 }
1109 if (NILP (val))
1110 goto no_composition;
1111
1112 val = autocmp_chars (val, charpos, bytepos, endpos, w, face, string);
1113 if (! composition_gstring_p (val))
1114 goto no_composition;
1115 if (NILP (LGSTRING_ID (val)))
1116 val = composition_gstring_put_cache (val, -1);
1117 cmp_it->id = XINT (LGSTRING_ID (val));
1118 for (i = 0; i < LGSTRING_GLYPH_LEN (val); i++)
1119 if (NILP (LGSTRING_GLYPH (val, i)))
1120 break;
1121 cmp_it->nglyphs = i;
1122 }
1123 cmp_it->from = 0;
1124 return 1;
1125
1126 no_composition:
1127 charpos++;
1128 if (STRINGP (string))
1129 bytepos += MULTIBYTE_LENGTH_NO_CHECK (SDATA (string) + bytepos);
1130 else
1131 INC_POS (bytepos);
1132 composition_compute_stop_pos (cmp_it, charpos, bytepos, endpos, string);
1133 return 0;
1134 }
1135
1136 int
1137 composition_update_it (cmp_it, charpos, bytepos, string)
1138 struct composition_it *cmp_it;
1139 EMACS_INT charpos, bytepos;
1140 Lisp_Object string;
1141 {
1142 int i, c;
1143
1144 if (cmp_it->ch < 0)
1145 {
1146 struct composition *cmp = composition_table[cmp_it->id];
1147
1148 cmp_it->to = cmp_it->nglyphs;
1149 if (cmp_it->nglyphs == 0)
1150 c = -1;
1151 else
1152 {
1153 for (i = 0; i < cmp->glyph_len; i++)
1154 if ((c = COMPOSITION_GLYPH (cmp, i)) != '\t')
1155 break;
1156 if (c == '\t')
1157 c = ' ';
1158 }
1159 cmp_it->width = cmp->width;
1160 }
1161 else
1162 {
1163 Lisp_Object gstring = composition_gstring_from_id (cmp_it->id);
1164
1165 if (cmp_it->nglyphs == 0)
1166 {
1167 c = -1;
1168 cmp_it->nchars = LGSTRING_CHAR_LEN (gstring);
1169 cmp_it->width = 0;
1170 }
1171 else
1172 {
1173 Lisp_Object glyph = LGSTRING_GLYPH (gstring, cmp_it->from);
1174 int from = LGLYPH_FROM (glyph);
1175
1176 c = XINT (LGSTRING_CHAR (gstring, from));
1177 cmp_it->nchars = LGLYPH_TO (glyph) - from + 1;
1178 cmp_it->width = (LGLYPH_WIDTH (glyph) > 0
1179 ? CHAR_WIDTH (LGLYPH_CHAR (glyph)) : 0);
1180 for (cmp_it->to = cmp_it->from + 1; cmp_it->to < cmp_it->nglyphs;
1181 cmp_it->to++)
1182 {
1183 glyph = LGSTRING_GLYPH (gstring, cmp_it->to);
1184 if (LGLYPH_FROM (glyph) != from)
1185 break;
1186 if (LGLYPH_WIDTH (glyph) > 0)
1187 cmp_it->width += CHAR_WIDTH (LGLYPH_CHAR (glyph));
1188 }
1189 }
1190 }
1191
1192 charpos += cmp_it->nchars;
1193 if (STRINGP (string))
1194 cmp_it->nbytes = string_char_to_byte (string, charpos) - bytepos;
1195 else
1196 cmp_it->nbytes = CHAR_TO_BYTE (charpos) - bytepos;
1197 return c;
1198 }
1199
1200
1201 struct position_record
1202 {
1203 EMACS_INT pos, pos_byte;
1204 unsigned char *p;
1205 };
1206
/* Update the members of POSITION to the next character boundary.
   POSITION is a struct position_record lvalue.  When the new
   character position equals STOP, the address and the byte position
   are reset to GAP_END_ADDR and GPT_BYTE instead of being advanced by
   the length of the character just passed.  */
#define FORWARD_CHAR(POSITION, STOP) \
  do { \
    (POSITION).pos++; \
    if ((POSITION).pos != (STOP)) \
      { \
        int forward_char_len_ = BYTES_BY_CHAR_HEAD (*((POSITION).p)); \
        (POSITION).pos_byte += forward_char_len_; \
        (POSITION).p += forward_char_len_; \
      } \
    else \
      { \
        (POSITION).p = GAP_END_ADDR; \
        (POSITION).pos_byte = GPT_BYTE; \
      } \
  } while (0)
1222
/* Update the members of POSITION to the previous character boundary.
   POSITION is a struct position_record lvalue.  If its character
   position equals STOP, the address is first reset to GPT_ADDR; then
   the address and the byte position are stepped back until the
   address points at a byte for which CHAR_HEAD_P is true.

   STOP is parenthesized, as in FORWARD_CHAR, so that an expression
   may be given as the argument.  */
#define BACKWARD_CHAR(POSITION, STOP) \
  do { \
    if ((POSITION).pos == (STOP)) \
      (POSITION).p = GPT_ADDR; \
    do { \
      (POSITION).pos_byte--; \
      (POSITION).p--; \
    } while (! CHAR_HEAD_P (*((POSITION).p))); \
    (POSITION).pos--; \
  } while (0)
1234
1235 static Lisp_Object _work_val;
1236 static int _work_char;
1237
1238 /* 1 iff the character C is composable. */
1239 #define CHAR_COMPOSABLE_P(C) \
1240 (_work_val = CHAR_TABLE_REF (Vunicode_category_table, (C)), \
1241 (SYMBOLP (_work_val) \
1242 && (_work_char = SDATA (SYMBOL_NAME (_work_val))[0]) != 'C' \
1243 && _work_char != 'Z'))
1244
1245 /* This is like find_composition, but find an automatic composition
1246 instead. If found, set *GSTRING to the glyph-string representing
1247 the composition, and return 1. Otherwise, return 0. */
1248
1249 static int
1250 find_automatic_composition (pos, limit, start, end, gstring, string)
1251 EMACS_INT pos, limit, *start, *end;
1252 Lisp_Object *gstring, string;
1253 {
1254 EMACS_INT head, tail, stop;
1255 struct position_record orig, cur, check, prev;
1256 Lisp_Object check_val, val, elt;
1257 int check_lookback;
1258 int c;
1259 struct window *w;
1260
1261 orig.pos = pos;
1262 if (NILP (string))
1263 {
1264 head = BEGV, tail = ZV, stop = GPT;
1265 orig.pos_byte = CHAR_TO_BYTE (orig.pos);
1266 orig.p = BYTE_POS_ADDR (orig.pos_byte);
1267 }
1268 else
1269 {
1270 head = 0, tail = SCHARS (string), stop = -1;
1271 orig.pos_byte = string_char_to_byte (string, orig.pos);
1272 orig.p = SDATA (string) + orig.pos_byte;
1273 }
1274 if (limit < pos)
1275 {
1276 head = max (head, limit);
1277 tail = min (tail, pos + 3);
1278 }
1279 else
1280 {
1281 tail = min (tail, limit + 3);
1282 }
1283 w = XWINDOW (selected_window);
1284 cur = orig;
1285
1286 retry:
1287 check_val = Qnil;
1288 /* At first, check if POS is compoable. */
1289 c = STRING_CHAR (cur.p, 0);
1290 if (! CHAR_COMPOSABLE_P (c))
1291 {
1292 if (limit < 0)
1293 return 0;
1294 if (limit >= cur.pos)
1295 goto search_forward;
1296 }
1297 else
1298 {
1299 val = CHAR_TABLE_REF (Vcomposition_function_table, c);
1300 if (! NILP (val))
1301 check_val = val, check = cur;
1302 else
1303 while (cur.pos + 1 < tail)
1304 {
1305 FORWARD_CHAR (cur, stop);
1306 c = STRING_CHAR (cur.p, 0);
1307 if (! CHAR_COMPOSABLE_P (c))
1308 break;
1309 val = CHAR_TABLE_REF (Vcomposition_function_table, c);
1310 if (NILP (val))
1311 continue;
1312 check_val = val, check = cur;
1313 break;
1314 }
1315 cur = orig;
1316 }
1317 /* Rewind back to the position where we can safely search forward
1318 for compositions. */
1319 while (cur.pos > head)
1320 {
1321 BACKWARD_CHAR (cur, stop);
1322 c = STRING_CHAR (cur.p, 0);
1323 if (! CHAR_COMPOSABLE_P (c))
1324 break;
1325 val = CHAR_TABLE_REF (Vcomposition_function_table, c);
1326 if (! NILP (val))
1327 check_val = val, check = cur;
1328 }
1329 prev = cur;
1330 /* Now search forward. */
1331 search_forward:
1332 *gstring = Qnil;
1333 if (! NILP (check_val) || limit >= orig.pos)
1334 {
1335 if (NILP (check_val))
1336 cur = orig;
1337 else
1338 cur = check;
1339 while (cur.pos < tail)
1340 {
1341 int need_adjustment = 0;
1342
1343 if (NILP (check_val))
1344 {
1345 c = STRING_CHAR (cur.p, 0);
1346 check_val = CHAR_TABLE_REF (Vcomposition_function_table, c);
1347 }
1348 for (; CONSP (check_val); check_val = XCDR (check_val))
1349 {
1350 elt = XCAR (check_val);
1351 if (VECTORP (elt) && ASIZE (elt) == 3 && NATNUMP (AREF (elt, 1))
1352 && cur.pos - XFASTINT (AREF (elt, 1)) >= head)
1353 {
1354 check.pos = cur.pos - XFASTINT (AREF (elt, 1));
1355 if (check.pos == cur.pos)
1356 check.pos_byte = cur.pos_byte;
1357 else
1358 check.pos_byte = CHAR_TO_BYTE (check.pos);
1359 val = autocmp_chars (check_val, check.pos, check.pos_byte,
1360 tail, w, NULL, string);
1361 need_adjustment = 1;
1362 if (! NILP (val))
1363 {
1364 *gstring = val;
1365 *start = check.pos;
1366 *end = check.pos + LGSTRING_CHAR_LEN (*gstring);
1367 if (*start <= orig.pos ? *end > orig.pos
1368 : limit >= orig.pos)
1369 return 1;
1370 cur.pos = *end;
1371 cur.pos_byte = CHAR_TO_BYTE (cur.pos);
1372 break;
1373 }
1374 }
1375 }
1376 if (need_adjustment)
1377 {
1378 /* As we have called Lisp, there's a possibilily that
1379 buffer/string is relocated. */
1380 if (NILP (string))
1381 cur.p = BYTE_POS_ADDR (cur.pos_byte);
1382 else
1383 cur.p = SDATA (string) + cur.pos_byte;
1384 }
1385 if (! CONSP (check_val))
1386 FORWARD_CHAR (cur, stop);
1387 check_val = Qnil;
1388 }
1389 }
1390 if (! NILP (*gstring))
1391 return (limit >= 0 || (*start <= orig.pos && *end > orig.pos));
1392 if (limit >= 0 && limit < orig.pos && prev.pos > head)
1393 {
1394 cur = prev;
1395 BACKWARD_CHAR (cur, stop);
1396 orig = cur;
1397 tail = orig.pos;
1398 goto retry;
1399 }
1400 return 0;
1401 }
1402
1403 int
1404 composition_adjust_point (last_pt)
1405 EMACS_INT last_pt;
1406 {
1407 EMACS_INT charpos, bytepos, startpos, beg, end, pos;
1408 Lisp_Object val;
1409 int i;
1410
1411 if (PT == BEGV || PT == ZV)
1412 return PT;
1413
1414 /* At first check the static composition. */
1415 if (get_property_and_range (PT, Qcomposition, &val, &beg, &end, Qnil)
1416 && COMPOSITION_VALID_P (beg, end, val)
1417 && beg < PT /* && end > PT <- It's always the case. */
1418 && (last_pt <= beg || last_pt >= end))
1419 return (PT < last_pt ? beg : end);
1420
1421 if (NILP (current_buffer->enable_multibyte_characters)
1422 || ! FUNCTIONP (Vauto_composition_function))
1423 return PT;
1424
1425 /* Next check the automatic composition. */
1426 if (! find_automatic_composition (PT, -1, &beg, &end, &val, Qnil)
1427 || beg == PT)
1428 return PT;
1429 for (i = 0; i < LGSTRING_GLYPH_LEN (val); i++)
1430 {
1431 Lisp_Object glyph = LGSTRING_GLYPH (val, i);
1432
1433 if (NILP (glyph))
1434 break;
1435 if (beg + LGLYPH_FROM (glyph) == PT)
1436 return PT;
1437 if (beg + LGLYPH_TO (glyph) >= PT)
1438 return (PT < last_pt
1439 ? beg + LGLYPH_FROM (glyph)
1440 : beg + LGLYPH_TO (glyph) + 1);
1441 }
1442 return PT;
1443 }
1444
1445 DEFUN ("composition-get-gstring", Fcomposition_get_gstring,
1446 Scomposition_get_gstring, 4, 4, 0,
1447 doc: /* Return a glyph-string for characters between FROM and TO.
1448 If the glhph string is for graphic display, FONT-OBJECT must be
1449 a font-object to use for those characters.
1450 Otherwise (for terminal display), FONT-OBJECT must be nil.
1451
1452 If the optional 4th argument STRING is not nil, it is a string
1453 containing the target characters between indices FROM and TO.
1454
1455 A glhph-string is a vector containing information about how to display
1456 specific character sequence. The format is:
1457 [HEADER ID GLYPH ...]
1458
1459 HEADER is a vector of this form:
1460 [FONT-OBJECT CHAR ...]
1461 where
1462 FONT-OBJECT is a font-object for all glyphs in the glyph-string,
1463 or nil if not yet decided.
1464 CHARs are characters to be composed by GLYPHs.
1465
1466 ID is an identification number of the glyph-string. It may be nil if
1467 not yet shaped.
1468
1469 GLYPH is a vector whose elements has this form:
1470 [ FROM-IDX TO-IDX C CODE WIDTH LBEARING RBEARING ASCENT DESCENT
1471 [ [X-OFF Y-OFF WADJUST] | nil] ]
1472 where
1473 FROM-IDX and TO-IDX are used internally and should not be touched.
1474 C is the character of the glyph.
1475 CODE is the glyph-code of C in FONT-OBJECT.
1476 WIDTH thru DESCENT are the metrics (in pixels) of the glyph.
1477 X-OFF and Y-OFF are offests to the base position for the glyph.
1478 WADJUST is the adjustment to the normal width of the glyph.
1479
1480 If GLYPH is nil, the remaining elements of the glhph-string vector
1481 must be ignore. */)
1482 (from, to, font_object, string)
1483 Lisp_Object font_object, from, to, string;
1484 {
1485 Lisp_Object gstring, header;
1486
1487 if (! NILP (font_object))
1488 CHECK_FONT_OBJECT (font_object);
1489 header = fill_gstring_header (Qnil, from, to, font_object, string);
1490 gstring = gstring_lookup_cache (header);
1491 if (! NILP (gstring))
1492 return gstring;
1493 LGSTRING_SET_HEADER (gstring_work, header);
1494 LGSTRING_SET_ID (gstring_work, Qnil);
1495 fill_gstring_body (gstring_work);
1496 return gstring_work;
1497 }
1498
1499 \f
1500 /* Emacs Lisp APIs. */
1501
1502 DEFUN ("compose-region-internal", Fcompose_region_internal,
1503 Scompose_region_internal, 2, 4, 0,
1504 doc: /* Internal use only.
1505
1506 Compose text in the region between START and END.
1507 Optional 3rd and 4th arguments are COMPONENTS and MODIFICATION-FUNC
1508 for the composition. See `compose-region' for more detail. */)
1509 (start, end, components, modification_func)
1510 Lisp_Object start, end, components, modification_func;
1511 {
1512 validate_region (&start, &end);
1513 if (!NILP (components)
1514 && !INTEGERP (components)
1515 && !CONSP (components)
1516 && !STRINGP (components))
1517 CHECK_VECTOR (components);
1518
1519 compose_text (XINT (start), XINT (end), components, modification_func, Qnil);
1520 return Qnil;
1521 }
1522
1523 DEFUN ("compose-string-internal", Fcompose_string_internal,
1524 Scompose_string_internal, 3, 5, 0,
1525 doc: /* Internal use only.
1526
1527 Compose text between indices START and END of STRING.
1528 Optional 4th and 5th arguments are COMPONENTS and MODIFICATION-FUNC
1529 for the composition. See `compose-string' for more detail. */)
1530 (string, start, end, components, modification_func)
1531 Lisp_Object string, start, end, components, modification_func;
1532 {
1533 CHECK_STRING (string);
1534 CHECK_NUMBER (start);
1535 CHECK_NUMBER (end);
1536
1537 if (XINT (start) < 0 ||
1538 XINT (start) > XINT (end)
1539 || XINT (end) > SCHARS (string))
1540 args_out_of_range (start, end);
1541
1542 compose_text (XINT (start), XINT (end), components, modification_func, string);
1543 return string;
1544 }
1545
1546 DEFUN ("find-composition-internal", Ffind_composition_internal,
1547 Sfind_composition_internal, 4, 4, 0,
1548 doc: /* Internal use only.
1549
1550 Return information about composition at or nearest to position POS.
1551 See `find-composition' for more detail. */)
1552 (pos, limit, string, detail_p)
1553 Lisp_Object pos, limit, string, detail_p;
1554 {
1555 Lisp_Object prop, tail, gstring;
1556 EMACS_INT start, end, from, to;
1557 int id;
1558
1559 CHECK_NUMBER_COERCE_MARKER (pos);
1560 from = XINT (pos);
1561 if (!NILP (limit))
1562 {
1563 CHECK_NUMBER_COERCE_MARKER (limit);
1564 to = XINT (limit);
1565 }
1566 else
1567 to = -1;
1568
1569 if (!NILP (string))
1570 {
1571 CHECK_STRING (string);
1572 if (XINT (pos) < 0 || XINT (pos) > SCHARS (string))
1573 args_out_of_range (string, pos);
1574 }
1575 else
1576 {
1577 if (XINT (pos) < BEGV || XINT (pos) > ZV)
1578 args_out_of_range (Fcurrent_buffer (), pos);
1579 }
1580
1581 if (!find_composition (from, to, &start, &end, &prop, string))
1582 {
1583 if (!NILP (current_buffer->enable_multibyte_characters)
1584 && FUNCTIONP (Vauto_composition_function)
1585 && find_automatic_composition (from, to, &start, &end, &gstring,
1586 string))
1587 return list3 (make_number (start), make_number (end), gstring);
1588 return Qnil;
1589 }
1590 if ((end <= XINT (pos) || start > XINT (pos)))
1591 {
1592 EMACS_INT s, e;
1593
1594 if (find_automatic_composition (from, to, &s, &e, &gstring, string)
1595 && (e <= XINT (pos) ? e > end : s < start))
1596 return list3 (make_number (start), make_number (end), gstring);
1597 }
1598 if (!COMPOSITION_VALID_P (start, end, prop))
1599 return Fcons (make_number (start), Fcons (make_number (end),
1600 Fcons (Qnil, Qnil)));
1601 if (NILP (detail_p))
1602 return Fcons (make_number (start), Fcons (make_number (end),
1603 Fcons (Qt, Qnil)));
1604
1605 if (COMPOSITION_REGISTERD_P (prop))
1606 id = COMPOSITION_ID (prop);
1607 else
1608 {
1609 int start_byte = (NILP (string)
1610 ? CHAR_TO_BYTE (start)
1611 : string_char_to_byte (string, start));
1612 id = get_composition_id (start, start_byte, end - start, prop, string);
1613 }
1614
1615 if (id >= 0)
1616 {
1617 Lisp_Object components, relative_p, mod_func;
1618 enum composition_method method = COMPOSITION_METHOD (prop);
1619 int width = composition_table[id]->width;
1620
1621 components = Fcopy_sequence (COMPOSITION_COMPONENTS (prop));
1622 relative_p = (method == COMPOSITION_WITH_RULE_ALTCHARS
1623 ? Qnil : Qt);
1624 mod_func = COMPOSITION_MODIFICATION_FUNC (prop);
1625 tail = Fcons (components,
1626 Fcons (relative_p,
1627 Fcons (mod_func,
1628 Fcons (make_number (width), Qnil))));
1629 }
1630 else
1631 tail = Qnil;
1632
1633 return Fcons (make_number (start), Fcons (make_number (end), tail));
1634 }
1635
1636 \f
1637 void
1638 syms_of_composite ()
1639 {
1640 int i;
1641
1642 Qcomposition = intern ("composition");
1643 staticpro (&Qcomposition);
1644
1645 /* Make a hash table for static composition. */
1646 {
1647 Lisp_Object args[6];
1648 extern Lisp_Object QCsize;
1649
1650 args[0] = QCtest;
1651 args[1] = Qequal;
1652 args[2] = QCweakness;
1653 /* We used to make the hash table weak so that unreferenced
1654 compositions can be garbage-collected. But, usually once
1655 created compositions are repeatedly used in an Emacs session,
1656 and thus it's not worth to save memory in such a way. So, we
1657 make the table not weak. */
1658 args[3] = Qnil;
1659 args[4] = QCsize;
1660 args[5] = make_number (311);
1661 composition_hash_table = Fmake_hash_table (6, args);
1662 staticpro (&composition_hash_table);
1663 }
1664
1665 /* Make a hash table for glyph-string. */
1666 {
1667 Lisp_Object args[6];
1668 extern Lisp_Object QCsize;
1669
1670 args[0] = QCtest;
1671 args[1] = Qequal;
1672 args[2] = QCweakness;
1673 args[3] = Qnil;
1674 args[4] = QCsize;
1675 args[5] = make_number (311);
1676 gstring_hash_table = Fmake_hash_table (6, args);
1677 staticpro (&gstring_hash_table);
1678 }
1679
1680 staticpro (&gstring_work_headers);
1681 gstring_work_headers = Fmake_vector (make_number (8), Qnil);
1682 for (i = 0; i < 8; i++)
1683 ASET (gstring_work_headers, i, Fmake_vector (make_number (i + 2), Qnil));
1684 staticpro (&gstring_work);
1685 gstring_work = Fmake_vector (make_number (10), Qnil);
1686
1687 /* Text property `composition' should be nonsticky by default. */
1688 Vtext_property_default_nonsticky
1689 = Fcons (Fcons (Qcomposition, Qt), Vtext_property_default_nonsticky);
1690
1691 DEFVAR_LISP ("compose-chars-after-function", &Vcompose_chars_after_function,
1692 doc: /* Function to adjust composition of buffer text.
1693
1694 The function is called with three arguments FROM, TO, and OBJECT.
1695 FROM and TO specify the range of text of which composition should be
1696 adjusted. OBJECT, if non-nil, is a string that contains the text.
1697
1698 This function is called after a text with `composition' property is
1699 inserted or deleted to keep `composition' property of buffer text
1700 valid.
1701
1702 The default value is the function `compose-chars-after'. */);
1703 Vcompose_chars_after_function = intern ("compose-chars-after");
1704
1705 Qauto_composed = intern ("auto-composed");
1706 staticpro (&Qauto_composed);
1707
1708 Qauto_composition_function = intern ("auto-composition-function");
1709 staticpro (&Qauto_composition_function);
1710
1711 DEFVAR_LISP ("auto-composition-function", &Vauto_composition_function,
1712 doc: /* Function to call to compose characters automatically.
1713 The function is called from the display routine with four arguments,
1714 FROM, TO, WINDOW, and STRING.
1715
1716 If STRING is nil, the function must compose characters in the region
1717 between FROM and TO in the current buffer.
1718
1719 Otherwise, STRING is a string, and FROM and TO are indices into the
1720 string. In this case, the function must compose characters in the
1721 string. */);
1722 Vauto_composition_function = Qnil;
1723
1724 DEFVAR_LISP ("composition-function-table", &Vcomposition_function_table,
1725 doc: /* Char-able of functions for automatic character composition.
1726 For each character that has to be composed automatically with
1727 preceding and/or following characters, this char-table contains
1728 a function to call to compose that character.
1729
1730 The element at index C in the table, if non-nil, is a list of
1731 this form: ([PATTERN PREV-CHARS FUNC] ...)
1732
1733 PATTERN is a regular expression with which C and the surrounding
1734 characters must match.
1735
1736 PREV-CHARS is a number of characters before C to check the
1737 matching with PATTERN. If it is 0, PATTERN must match with C and
1738 the following characters. If it is 1, PATTERN must match with a
1739 character before C and the following characters.
1740
1741 If PREV-CHARS is 0, PATTERN can be nil, which means that the
1742 single character C should be composed.
1743
1744 FUNC is a function to return a glyph-string representing a
1745 composition of the characters matching with PATTERN. It is
1746 called with one argument GSTRING.
1747
1748 GSTRING is a template of a glyph-string to return. It is already
1749 filled with a proper header for the characters to compose, and
1750 glyphs corresponding to those characters one by one. The
1751 function must return a new glyph-string of the same header as
1752 GSTRING, or modify GSTRING itself and return it.
1753
1754 See also the documentation of `auto-composition-mode'. */);
1755 Vcomposition_function_table = Fmake_char_table (Qnil, Qnil);
1756
1757 defsubr (&Scompose_region_internal);
1758 defsubr (&Scompose_string_internal);
1759 defsubr (&Sfind_composition_internal);
1760 defsubr (&Scomposition_get_gstring);
1761 }
1762
1763 /* arch-tag: 79cefaf8-ca48-4eed-97e5-d5afb290d272
1764 (do not change this comment) */