Fix typo in comment delimiter.
[bpt/emacs.git] / src / search.c
CommitLineData
ca1d1d23
JB
1/* String search routines for GNU Emacs.
2 Copyright (C) 1985, 1986, 1987, 1992 Free Software Foundation, Inc.
3
4This file is part of GNU Emacs.
5
6GNU Emacs is free software; you can redistribute it and/or modify
7it under the terms of the GNU General Public License as published by
8the Free Software Foundation; either version 1, or (at your option)
9any later version.
10
11GNU Emacs is distributed in the hope that it will be useful,
12but WITHOUT ANY WARRANTY; without even the implied warranty of
13MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14GNU General Public License for more details.
15
16You should have received a copy of the GNU General Public License
17along with GNU Emacs; see the file COPYING. If not, write to
18the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA. */
19
20
21#include "config.h"
22#include "lisp.h"
23#include "syntax.h"
24#include "buffer.h"
25#include "commands.h"
9ac0d9e0 26#include "blockinput.h"
4746118a 27
ca1d1d23
JB
28#include <sys/types.h>
29#include "regex.h"
30
31#define max(a, b) ((a) > (b) ? (a) : (b))
32#define min(a, b) ((a) < (b) ? (a) : (b))
33
34/* We compile regexps into this buffer and then use it for searching. */
35
36struct re_pattern_buffer searchbuf;
37
38char search_fastmap[0400];
39
40/* Last regexp we compiled */
41
42Lisp_Object last_regexp;
43
4746118a
JB
44/* Every call to re_match, etc., must pass &search_regs as the regs
45 argument unless you can show it is unnecessary (i.e., if re_match
46 is certainly going to be called again before region-around-match
47 can be called).
48
49 Since the registers are now dynamically allocated, we need to make
50 sure not to refer to the Nth register before checking that it has
1113d9db
JB
51 been allocated by checking search_regs.num_regs.
52
53 The regex code keeps track of whether it has allocated the search
54 buffer using bits in searchbuf. This means that whenever you
55 compile a new pattern, it completely forgets whether it has
56 allocated any registers, and will allocate new registers the next
57 time you call a searching or matching function. Therefore, we need
58 to call re_set_registers after compiling a new pattern or after
59 setting the match registers, so that the regex functions will be
60 able to free or re-allocate it properly. */
ca1d1d23
JB
61static struct re_registers search_regs;
62
daa37602
JB
63/* The buffer in which the last search was performed, or
64 Qt if the last search was done in a string;
65 Qnil if no searching has been done yet. */
66static Lisp_Object last_thing_searched;
ca1d1d23
JB
67
68/* error condition signalled when regexp compile_pattern fails */
69
70Lisp_Object Qinvalid_regexp;
71
72static void
73matcher_overflow ()
74{
75 error ("Stack overflow in regexp matcher");
76}
77
78#ifdef __STDC__
79#define CONST const
80#else
81#define CONST
82#endif
83
84/* Compile a regexp and signal a Lisp error if anything goes wrong. */
85
1113d9db 86compile_pattern (pattern, bufp, regp, translate)
ca1d1d23
JB
87 Lisp_Object pattern;
88 struct re_pattern_buffer *bufp;
1113d9db 89 struct re_registers *regp;
ca1d1d23
JB
90 char *translate;
91{
92 CONST char *val;
93 Lisp_Object dummy;
94
95 if (EQ (pattern, last_regexp)
96 && translate == bufp->translate)
97 return;
1113d9db 98
ca1d1d23
JB
99 last_regexp = Qnil;
100 bufp->translate = translate;
9ac0d9e0 101 BLOCK_INPUT;
ca1d1d23
JB
102 val = re_compile_pattern ((char *) XSTRING (pattern)->data,
103 XSTRING (pattern)->size,
104 bufp);
9ac0d9e0 105 UNBLOCK_INPUT;
ca1d1d23
JB
106 if (val)
107 {
108 dummy = build_string (val);
109 while (1)
110 Fsignal (Qinvalid_regexp, Fcons (dummy, Qnil));
111 }
1113d9db 112
ca1d1d23 113 last_regexp = pattern;
1113d9db
JB
114
115 /* Advise the searching functions about the space we have allocated
116 for register data. */
9ac0d9e0 117 BLOCK_INPUT;
ebb9e16f
JB
118 if (regp)
119 re_set_registers (bufp, regp, regp->num_regs, regp->start, regp->end);
9ac0d9e0 120 UNBLOCK_INPUT;
1113d9db 121
ca1d1d23
JB
122 return;
123}
124
125/* Error condition used for failing searches */
126Lisp_Object Qsearch_failed;
127
128Lisp_Object
129signal_failure (arg)
130 Lisp_Object arg;
131{
132 Fsignal (Qsearch_failed, Fcons (arg, Qnil));
133 return Qnil;
134}
135\f
136DEFUN ("looking-at", Flooking_at, Slooking_at, 1, 1, 0,
e065a56e
JB
137 "Return t if text after point matches regular expression PAT.\n\
138This function modifies the match data that `match-beginning',\n\
139`match-end' and `match-data' access; save and restore the match\n\
fe99283d 140data if you want to preserve them.")
ca1d1d23
JB
141 (string)
142 Lisp_Object string;
143{
144 Lisp_Object val;
145 unsigned char *p1, *p2;
146 int s1, s2;
147 register int i;
148
149 CHECK_STRING (string, 0);
1113d9db 150 compile_pattern (string, &searchbuf, &search_regs,
ca1d1d23
JB
151 !NILP (current_buffer->case_fold_search) ? DOWNCASE_TABLE : 0);
152
153 immediate_quit = 1;
154 QUIT; /* Do a pending quit right away, to avoid paradoxical behavior */
155
156 /* Get pointers and sizes of the two strings
157 that make up the visible portion of the buffer. */
158
159 p1 = BEGV_ADDR;
160 s1 = GPT - BEGV;
161 p2 = GAP_END_ADDR;
162 s2 = ZV - GPT;
163 if (s1 < 0)
164 {
165 p2 = p1;
166 s2 = ZV - BEGV;
167 s1 = 0;
168 }
169 if (s2 < 0)
170 {
171 s1 = ZV - BEGV;
172 s2 = 0;
173 }
174
9ac0d9e0 175 BLOCK_INPUT;
ca1d1d23
JB
176 i = re_match_2 (&searchbuf, (char *) p1, s1, (char *) p2, s2,
177 point - BEGV, &search_regs,
178 ZV - BEGV);
9ac0d9e0 179 UNBLOCK_INPUT;
ca1d1d23
JB
180 if (i == -2)
181 matcher_overflow ();
182
183 val = (0 <= i ? Qt : Qnil);
4746118a 184 for (i = 0; i < search_regs.num_regs; i++)
ca1d1d23
JB
185 if (search_regs.start[i] >= 0)
186 {
187 search_regs.start[i] += BEGV;
188 search_regs.end[i] += BEGV;
189 }
daa37602 190 XSET (last_thing_searched, Lisp_Buffer, current_buffer);
ca1d1d23
JB
191 immediate_quit = 0;
192 return val;
193}
194
195DEFUN ("string-match", Fstring_match, Sstring_match, 2, 3, 0,
196 "Return index of start of first match for REGEXP in STRING, or nil.\n\
197If third arg START is non-nil, start search at that index in STRING.\n\
198For index of first char beyond the match, do (match-end 0).\n\
199`match-end' and `match-beginning' also give indices of substrings\n\
200matched by parenthesis constructs in the pattern.")
201 (regexp, string, start)
202 Lisp_Object regexp, string, start;
203{
204 int val;
205 int s;
206
207 CHECK_STRING (regexp, 0);
208 CHECK_STRING (string, 1);
209
210 if (NILP (start))
211 s = 0;
212 else
213 {
214 int len = XSTRING (string)->size;
215
216 CHECK_NUMBER (start, 2);
217 s = XINT (start);
218 if (s < 0 && -s <= len)
219 s = len - s;
220 else if (0 > s || s > len)
221 args_out_of_range (string, start);
222 }
223
1113d9db 224 compile_pattern (regexp, &searchbuf, &search_regs,
ca1d1d23
JB
225 !NILP (current_buffer->case_fold_search) ? DOWNCASE_TABLE : 0);
226 immediate_quit = 1;
9ac0d9e0 227 BLOCK_INPUT;
ca1d1d23
JB
228 val = re_search (&searchbuf, (char *) XSTRING (string)->data,
229 XSTRING (string)->size, s, XSTRING (string)->size - s,
230 &search_regs);
9ac0d9e0 231 UNBLOCK_INPUT;
ca1d1d23 232 immediate_quit = 0;
daa37602 233 last_thing_searched = Qt;
ca1d1d23
JB
234 if (val == -2)
235 matcher_overflow ();
236 if (val < 0) return Qnil;
237 return make_number (val);
238}
e59a8453
RS
239
240/* Match REGEXP against STRING, searching all of STRING,
241 and return the index of the match, or negative on failure.
242 This does not clobber the match data. */
243
244int
245fast_string_match (regexp, string)
246 Lisp_Object regexp, string;
247{
248 int val;
249
250 compile_pattern (regexp, &searchbuf, 0, 0);
251 immediate_quit = 1;
9ac0d9e0 252 BLOCK_INPUT;
e59a8453
RS
253 val = re_search (&searchbuf, (char *) XSTRING (string)->data,
254 XSTRING (string)->size, 0, XSTRING (string)->size,
255 0);
9ac0d9e0 256 UNBLOCK_INPUT;
e59a8453
RS
257 immediate_quit = 0;
258 return val;
259}
ca1d1d23 260\f
ffd56f97
JB
261/* Search for COUNT instances of the character TARGET, starting at START.
262 If COUNT is negative, search backwards.
263
264 If we find COUNT instances, set *SHORTAGE to zero, and return the
5bfe95c9
RS
265 position after the COUNTth match. Note that for reverse motion
266 this is not the same as the usual convention for Emacs motion commands.
ffd56f97
JB
267
268 If we don't find COUNT instances before reaching the end of the
269 buffer (or the beginning, if scanning backwards), set *SHORTAGE to
270 the number of TARGETs left unfound, and return the end of the
271 buffer we bumped up against. */
272
273scan_buffer (target, start, count, shortage)
274 int *shortage, start;
275 register int count, target;
ca1d1d23 276{
ffd56f97
JB
277 int limit = ((count > 0) ? ZV - 1 : BEGV);
278 int direction = ((count > 0) ? 1 : -1);
279
280 register unsigned char *cursor;
ca1d1d23 281 unsigned char *base;
ffd56f97
JB
282
283 register int ceiling;
284 register unsigned char *ceiling_addr;
ca1d1d23
JB
285
286 if (shortage != 0)
287 *shortage = 0;
288
289 immediate_quit = 1;
290
ffd56f97
JB
291 if (count > 0)
292 while (start != limit + 1)
ca1d1d23 293 {
ffd56f97
JB
294 ceiling = BUFFER_CEILING_OF (start);
295 ceiling = min (limit, ceiling);
296 ceiling_addr = &FETCH_CHAR (ceiling) + 1;
297 base = (cursor = &FETCH_CHAR (start));
ca1d1d23
JB
298 while (1)
299 {
ffd56f97 300 while (*cursor != target && ++cursor != ceiling_addr)
ca1d1d23 301 ;
ffd56f97 302 if (cursor != ceiling_addr)
ca1d1d23 303 {
ffd56f97 304 if (--count == 0)
ca1d1d23
JB
305 {
306 immediate_quit = 0;
ffd56f97 307 return (start + cursor - base + 1);
ca1d1d23
JB
308 }
309 else
ffd56f97 310 if (++cursor == ceiling_addr)
ca1d1d23
JB
311 break;
312 }
313 else
314 break;
315 }
ffd56f97 316 start += cursor - base;
ca1d1d23
JB
317 }
318 else
319 {
ffd56f97
JB
320 start--; /* first character we scan */
321 while (start > limit - 1)
322 { /* we WILL scan under start */
323 ceiling = BUFFER_FLOOR_OF (start);
324 ceiling = max (limit, ceiling);
325 ceiling_addr = &FETCH_CHAR (ceiling) - 1;
326 base = (cursor = &FETCH_CHAR (start));
ca1d1d23
JB
327 cursor++;
328 while (1)
329 {
ffd56f97 330 while (--cursor != ceiling_addr && *cursor != target)
ca1d1d23 331 ;
ffd56f97 332 if (cursor != ceiling_addr)
ca1d1d23 333 {
ffd56f97 334 if (++count == 0)
ca1d1d23
JB
335 {
336 immediate_quit = 0;
ffd56f97 337 return (start + cursor - base + 1);
ca1d1d23
JB
338 }
339 }
340 else
341 break;
342 }
ffd56f97 343 start += cursor - base;
ca1d1d23
JB
344 }
345 }
346 immediate_quit = 0;
347 if (shortage != 0)
ffd56f97
JB
348 *shortage = count * direction;
349 return (start + ((direction == 1 ? 0 : 1)));
ca1d1d23
JB
350}
351
352int
353find_next_newline (from, cnt)
354 register int from, cnt;
355{
356 return (scan_buffer ('\n', from, cnt, (int *) 0));
357}
358\f
c1dc99a1
JB
359Lisp_Object skip_chars ();
360
ca1d1d23
JB
361DEFUN ("skip-chars-forward", Fskip_chars_forward, Sskip_chars_forward, 1, 2, 0,
362 "Move point forward, stopping before a char not in CHARS, or at position LIM.\n\
363CHARS is like the inside of a `[...]' in a regular expression\n\
364except that `]' is never special and `\\' quotes `^', `-' or `\\'.\n\
365Thus, with arg \"a-zA-Z\", this skips letters stopping before first nonletter.\n\
c1dc99a1
JB
366With arg \"^a-zA-Z\", skips nonletters stopping before first letter.\n\
367Returns the distance traveled, either zero or positive.")
ca1d1d23
JB
368 (string, lim)
369 Lisp_Object string, lim;
370{
17431c60 371 return skip_chars (1, 0, string, lim);
ca1d1d23
JB
372}
373
374DEFUN ("skip-chars-backward", Fskip_chars_backward, Sskip_chars_backward, 1, 2, 0,
375 "Move point backward, stopping after a char not in CHARS, or at position LIM.\n\
c1dc99a1
JB
376See `skip-chars-forward' for details.\n\
377Returns the distance traveled, either zero or negative.")
ca1d1d23
JB
378 (string, lim)
379 Lisp_Object string, lim;
380{
17431c60
RS
381 return skip_chars (0, 0, string, lim);
382}
383
384DEFUN ("skip-syntax-forward", Fskip_syntax_forward, Sskip_syntax_forward, 1, 2, 0,
385 "Move point forward across chars in specified syntax classes.\n\
386SYNTAX is a string of syntax code characters.\n\
387Stop before a char whose syntax is not in SYNTAX, or at position LIM.\n\
388If SYNTAX starts with ^, skip characters whose syntax is NOT in SYNTAX.\n\
389This function returns the distance traveled, either zero or positive.")
390 (syntax, lim)
391 Lisp_Object syntax, lim;
392{
393 return skip_chars (1, 1, syntax, lim);
394}
395
396DEFUN ("skip-syntax-backward", Fskip_syntax_backward, Sskip_syntax_backward, 1, 2, 0,
397 "Move point backward across chars in specified syntax classes.\n\
398SYNTAX is a string of syntax code characters.\n\
399Stop on reaching a char whose syntax is not in SYNTAX, or at position LIM.\n\
400If SYNTAX starts with ^, skip characters whose syntax is NOT in SYNTAX.\n\
401This function returns the distance traveled, either zero or negative.")
402 (syntax, lim)
403 Lisp_Object syntax, lim;
404{
405 return skip_chars (0, 1, syntax, lim);
ca1d1d23
JB
406}
407
c1dc99a1 408Lisp_Object
17431c60
RS
409skip_chars (forwardp, syntaxp, string, lim)
410 int forwardp, syntaxp;
ca1d1d23
JB
411 Lisp_Object string, lim;
412{
413 register unsigned char *p, *pend;
414 register unsigned char c;
415 unsigned char fastmap[0400];
416 int negate = 0;
417 register int i;
418
419 CHECK_STRING (string, 0);
420
421 if (NILP (lim))
422 XSET (lim, Lisp_Int, forwardp ? ZV : BEGV);
423 else
424 CHECK_NUMBER_COERCE_MARKER (lim, 1);
425
426#if 0 /* This breaks some things... jla. */
427 /* In any case, don't allow scan outside bounds of buffer. */
428 if (XFASTINT (lim) > ZV)
429 XFASTINT (lim) = ZV;
430 if (XFASTINT (lim) < BEGV)
431 XFASTINT (lim) = BEGV;
432#endif
433
434 p = XSTRING (string)->data;
435 pend = p + XSTRING (string)->size;
436 bzero (fastmap, sizeof fastmap);
437
438 if (p != pend && *p == '^')
439 {
440 negate = 1; p++;
441 }
442
17431c60
RS
443 /* Find the characters specified and set their elements of fastmap.
444 If syntaxp, each character counts as itself.
445 Otherwise, handle backslashes and ranges specially */
ca1d1d23
JB
446
447 while (p != pend)
448 {
449 c = *p++;
17431c60
RS
450 if (syntaxp)
451 fastmap[c] = 1;
452 else
ca1d1d23 453 {
17431c60 454 if (c == '\\')
ca1d1d23 455 {
17431c60
RS
456 if (p == pend) break;
457 c = *p++;
458 }
459 if (p != pend && *p == '-')
460 {
461 p++;
462 if (p == pend) break;
463 while (c <= *p)
464 {
465 fastmap[c] = 1;
466 c++;
467 }
468 p++;
ca1d1d23 469 }
17431c60
RS
470 else
471 fastmap[c] = 1;
ca1d1d23 472 }
ca1d1d23
JB
473 }
474
475 /* If ^ was the first character, complement the fastmap. */
476
477 if (negate)
478 for (i = 0; i < sizeof fastmap; i++)
479 fastmap[i] ^= 1;
480
c1dc99a1
JB
481 {
482 int start_point = point;
483
484 immediate_quit = 1;
17431c60 485 if (syntaxp)
c1dc99a1 486 {
17431c60
RS
487
488 if (forwardp)
489 {
490 while (point < XINT (lim)
491 && fastmap[(unsigned char) syntax_code_spec[(int) SYNTAX (FETCH_CHAR (point))]])
492 SET_PT (point + 1);
493 }
494 else
495 {
496 while (point > XINT (lim)
497 && fastmap[(unsigned char) syntax_code_spec[(int) SYNTAX (FETCH_CHAR (point - 1))]])
498 SET_PT (point - 1);
499 }
c1dc99a1
JB
500 }
501 else
502 {
17431c60
RS
503 if (forwardp)
504 {
505 while (point < XINT (lim) && fastmap[FETCH_CHAR (point)])
506 SET_PT (point + 1);
507 }
508 else
509 {
510 while (point > XINT (lim) && fastmap[FETCH_CHAR (point - 1)])
511 SET_PT (point - 1);
512 }
c1dc99a1
JB
513 }
514 immediate_quit = 0;
515
516 return make_number (point - start_point);
517 }
ca1d1d23
JB
518}
519\f
520/* Subroutines of Lisp buffer search functions. */
521
522static Lisp_Object
523search_command (string, bound, noerror, count, direction, RE)
524 Lisp_Object string, bound, noerror, count;
525 int direction;
526 int RE;
527{
528 register int np;
529 int lim;
530 int n = direction;
531
532 if (!NILP (count))
533 {
534 CHECK_NUMBER (count, 3);
535 n *= XINT (count);
536 }
537
538 CHECK_STRING (string, 0);
539 if (NILP (bound))
540 lim = n > 0 ? ZV : BEGV;
541 else
542 {
543 CHECK_NUMBER_COERCE_MARKER (bound, 1);
544 lim = XINT (bound);
545 if (n > 0 ? lim < point : lim > point)
546 error ("Invalid search bound (wrong side of point)");
547 if (lim > ZV)
548 lim = ZV;
549 if (lim < BEGV)
550 lim = BEGV;
551 }
552
553 np = search_buffer (string, point, lim, n, RE,
554 (!NILP (current_buffer->case_fold_search)
555 ? XSTRING (current_buffer->case_canon_table)->data : 0),
556 (!NILP (current_buffer->case_fold_search)
557 ? XSTRING (current_buffer->case_eqv_table)->data : 0));
558 if (np <= 0)
559 {
560 if (NILP (noerror))
561 return signal_failure (string);
562 if (!EQ (noerror, Qt))
563 {
564 if (lim < BEGV || lim > ZV)
565 abort ();
a5f217b8
RS
566 SET_PT (lim);
567 return Qnil;
568#if 0 /* This would be clean, but maybe programs depend on
569 a value of nil here. */
481399bf 570 np = lim;
a5f217b8 571#endif
ca1d1d23 572 }
481399bf
RS
573 else
574 return Qnil;
ca1d1d23
JB
575 }
576
577 if (np < BEGV || np > ZV)
578 abort ();
579
580 SET_PT (np);
581
582 return make_number (np);
583}
584\f
585/* search for the n'th occurrence of STRING in the current buffer,
586 starting at position POS and stopping at position LIM,
587 treating PAT as a literal string if RE is false or as
588 a regular expression if RE is true.
589
590 If N is positive, searching is forward and LIM must be greater than POS.
591 If N is negative, searching is backward and LIM must be less than POS.
592
593 Returns -x if only N-x occurrences found (x > 0),
594 or else the position at the beginning of the Nth occurrence
595 (if searching backward) or the end (if searching forward). */
596
597search_buffer (string, pos, lim, n, RE, trt, inverse_trt)
598 Lisp_Object string;
599 int pos;
600 int lim;
601 int n;
602 int RE;
603 register unsigned char *trt;
604 register unsigned char *inverse_trt;
605{
606 int len = XSTRING (string)->size;
607 unsigned char *base_pat = XSTRING (string)->data;
608 register int *BM_tab;
609 int *BM_tab_base;
610 register int direction = ((n > 0) ? 1 : -1);
611 register int dirlen;
612 int infinity, limit, k, stride_for_teases;
613 register unsigned char *pat, *cursor, *p_limit;
614 register int i, j;
615 unsigned char *p1, *p2;
616 int s1, s2;
617
618 /* Null string is found at starting position. */
619 if (!len)
620 return pos;
621
622 if (RE)
1113d9db 623 compile_pattern (string, &searchbuf, &search_regs, (char *) trt);
ca1d1d23
JB
624
625 if (RE /* Here we detect whether the */
626 /* generality of an RE search is */
627 /* really needed. */
628 /* first item is "exact match" */
4746118a 629 && *(searchbuf.buffer) == (char) RE_EXACTN_VALUE
ca1d1d23
JB
630 && searchbuf.buffer[1] + 2 == searchbuf.used) /*first is ONLY item */
631 {
632 RE = 0; /* can do straight (non RE) search */
633 pat = (base_pat = (unsigned char *) searchbuf.buffer + 2);
634 /* trt already applied */
635 len = searchbuf.used - 2;
636 }
637 else if (!RE)
638 {
639 pat = (unsigned char *) alloca (len);
640
641 for (i = len; i--;) /* Copy the pattern; apply trt */
642 *pat++ = (((int) trt) ? trt [*base_pat++] : *base_pat++);
643 pat -= len; base_pat = pat;
644 }
645
646 if (RE)
647 {
648 immediate_quit = 1; /* Quit immediately if user types ^G,
649 because letting this function finish
650 can take too long. */
651 QUIT; /* Do a pending quit right away,
652 to avoid paradoxical behavior */
653 /* Get pointers and sizes of the two strings
654 that make up the visible portion of the buffer. */
655
656 p1 = BEGV_ADDR;
657 s1 = GPT - BEGV;
658 p2 = GAP_END_ADDR;
659 s2 = ZV - GPT;
660 if (s1 < 0)
661 {
662 p2 = p1;
663 s2 = ZV - BEGV;
664 s1 = 0;
665 }
666 if (s2 < 0)
667 {
668 s1 = ZV - BEGV;
669 s2 = 0;
670 }
671 while (n < 0)
672 {
9ac0d9e0 673 BLOCK_INPUT;
ca1d1d23
JB
674 int val = re_search_2 (&searchbuf, (char *) p1, s1, (char *) p2, s2,
675 pos - BEGV, lim - pos, &search_regs,
676 /* Don't allow match past current point */
677 pos - BEGV);
9ac0d9e0 678 UNBLOCK_INPUT;
ca1d1d23
JB
679 if (val == -2)
680 matcher_overflow ();
681 if (val >= 0)
682 {
683 j = BEGV;
4746118a 684 for (i = 0; i < search_regs.num_regs; i++)
ca1d1d23
JB
685 if (search_regs.start[i] >= 0)
686 {
687 search_regs.start[i] += j;
688 search_regs.end[i] += j;
689 }
daa37602 690 XSET (last_thing_searched, Lisp_Buffer, current_buffer);
ca1d1d23
JB
691 /* Set pos to the new position. */
692 pos = search_regs.start[0];
693 }
694 else
695 {
696 immediate_quit = 0;
697 return (n);
698 }
699 n++;
700 }
701 while (n > 0)
702 {
9ac0d9e0 703 BLOCK_INPUT;
ca1d1d23
JB
704 int val = re_search_2 (&searchbuf, (char *) p1, s1, (char *) p2, s2,
705 pos - BEGV, lim - pos, &search_regs,
706 lim - BEGV);
9ac0d9e0 707 UNBLOCK_INPUT;
ca1d1d23
JB
708 if (val == -2)
709 matcher_overflow ();
710 if (val >= 0)
711 {
712 j = BEGV;
4746118a 713 for (i = 0; i < search_regs.num_regs; i++)
ca1d1d23
JB
714 if (search_regs.start[i] >= 0)
715 {
716 search_regs.start[i] += j;
717 search_regs.end[i] += j;
718 }
daa37602 719 XSET (last_thing_searched, Lisp_Buffer, current_buffer);
ca1d1d23
JB
720 pos = search_regs.end[0];
721 }
722 else
723 {
724 immediate_quit = 0;
725 return (0 - n);
726 }
727 n--;
728 }
729 immediate_quit = 0;
730 return (pos);
731 }
732 else /* non-RE case */
733 {
734#ifdef C_ALLOCA
735 int BM_tab_space[0400];
736 BM_tab = &BM_tab_space[0];
737#else
738 BM_tab = (int *) alloca (0400 * sizeof (int));
739#endif
740 /* The general approach is that we are going to maintain that we know */
741 /* the first (closest to the present position, in whatever direction */
742 /* we're searching) character that could possibly be the last */
743 /* (furthest from present position) character of a valid match. We */
744 /* advance the state of our knowledge by looking at that character */
745 /* and seeing whether it indeed matches the last character of the */
746 /* pattern. If it does, we take a closer look. If it does not, we */
747 /* move our pointer (to putative last characters) as far as is */
748 /* logically possible. This amount of movement, which I call a */
749 /* stride, will be the length of the pattern if the actual character */
750 /* appears nowhere in the pattern, otherwise it will be the distance */
751 /* from the last occurrence of that character to the end of the */
752 /* pattern. */
753 /* As a coding trick, an enormous stride is coded into the table for */
754 /* characters that match the last character. This allows use of only */
755 /* a single test, a test for having gone past the end of the */
756 /* permissible match region, to test for both possible matches (when */
757 /* the stride goes past the end immediately) and failure to */
758 /* match (where you get nudged past the end one stride at a time). */
759
760 /* Here we make a "mickey mouse" BM table. The stride of the search */
761 /* is determined only by the last character of the putative match. */
762 /* If that character does not match, we will stride the proper */
763 /* distance to propose a match that superimposes it on the last */
764 /* instance of a character that matches it (per trt), or misses */
765 /* it entirely if there is none. */
766
767 dirlen = len * direction;
768 infinity = dirlen - (lim + pos + len + len) * direction;
769 if (direction < 0)
770 pat = (base_pat += len - 1);
771 BM_tab_base = BM_tab;
772 BM_tab += 0400;
773 j = dirlen; /* to get it in a register */
774 /* A character that does not appear in the pattern induces a */
775 /* stride equal to the pattern length. */
776 while (BM_tab_base != BM_tab)
777 {
778 *--BM_tab = j;
779 *--BM_tab = j;
780 *--BM_tab = j;
781 *--BM_tab = j;
782 }
783 i = 0;
784 while (i != infinity)
785 {
786 j = pat[i]; i += direction;
787 if (i == dirlen) i = infinity;
788 if ((int) trt)
789 {
790 k = (j = trt[j]);
791 if (i == infinity)
792 stride_for_teases = BM_tab[j];
793 BM_tab[j] = dirlen - i;
794 /* A translation table is accompanied by its inverse -- see */
795 /* comment following downcase_table for details */
796 while ((j = inverse_trt[j]) != k)
797 BM_tab[j] = dirlen - i;
798 }
799 else
800 {
801 if (i == infinity)
802 stride_for_teases = BM_tab[j];
803 BM_tab[j] = dirlen - i;
804 }
805 /* stride_for_teases tells how much to stride if we get a */
806 /* match on the far character but are subsequently */
807 /* disappointed, by recording what the stride would have been */
808 /* for that character if the last character had been */
809 /* different. */
810 }
811 infinity = dirlen - infinity;
812 pos += dirlen - ((direction > 0) ? direction : 0);
813 /* loop invariant - pos points at where last char (first char if reverse)
814 of pattern would align in a possible match. */
815 while (n != 0)
816 {
817 if ((lim - pos - (direction > 0)) * direction < 0)
818 return (n * (0 - direction));
819 /* First we do the part we can by pointers (maybe nothing) */
820 QUIT;
821 pat = base_pat;
822 limit = pos - dirlen + direction;
823 limit = ((direction > 0)
824 ? BUFFER_CEILING_OF (limit)
825 : BUFFER_FLOOR_OF (limit));
826 /* LIMIT is now the last (not beyond-last!) value
827 POS can take on without hitting edge of buffer or the gap. */
828 limit = ((direction > 0)
829 ? min (lim - 1, min (limit, pos + 20000))
830 : max (lim, max (limit, pos - 20000)));
831 if ((limit - pos) * direction > 20)
832 {
833 p_limit = &FETCH_CHAR (limit);
834 p2 = (cursor = &FETCH_CHAR (pos));
835 /* In this loop, pos + cursor - p2 is the surrogate for pos */
836 while (1) /* use one cursor setting as long as i can */
837 {
838 if (direction > 0) /* worth duplicating */
839 {
840 /* Use signed comparison if appropriate
841 to make cursor+infinity sure to be > p_limit.
842 Assuming that the buffer lies in a range of addresses
843 that are all "positive" (as ints) or all "negative",
844 either kind of comparison will work as long
845 as we don't step by infinity. So pick the kind
846 that works when we do step by infinity. */
847 if ((int) (p_limit + infinity) > (int) p_limit)
848 while ((int) cursor <= (int) p_limit)
849 cursor += BM_tab[*cursor];
850 else
851 while ((unsigned int) cursor <= (unsigned int) p_limit)
852 cursor += BM_tab[*cursor];
853 }
854 else
855 {
856 if ((int) (p_limit + infinity) < (int) p_limit)
857 while ((int) cursor >= (int) p_limit)
858 cursor += BM_tab[*cursor];
859 else
860 while ((unsigned int) cursor >= (unsigned int) p_limit)
861 cursor += BM_tab[*cursor];
862 }
863/* If you are here, cursor is beyond the end of the searched region. */
864 /* This can happen if you match on the far character of the pattern, */
865 /* because the "stride" of that character is infinity, a number able */
866 /* to throw you well beyond the end of the search. It can also */
867 /* happen if you fail to match within the permitted region and would */
868 /* otherwise try a character beyond that region */
869 if ((cursor - p_limit) * direction <= len)
870 break; /* a small overrun is genuine */
871 cursor -= infinity; /* large overrun = hit */
872 i = dirlen - direction;
873 if ((int) trt)
874 {
875 while ((i -= direction) + direction != 0)
876 if (pat[i] != trt[*(cursor -= direction)])
877 break;
878 }
879 else
880 {
881 while ((i -= direction) + direction != 0)
882 if (pat[i] != *(cursor -= direction))
883 break;
884 }
885 cursor += dirlen - i - direction; /* fix cursor */
886 if (i + direction == 0)
887 {
888 cursor -= direction;
1113d9db
JB
889
890 /* Make sure we have registers in which to store
891 the match position. */
892 if (search_regs.num_regs == 0)
893 {
894 regoff_t *starts, *ends;
895
896 starts =
897 (regoff_t *) xmalloc (2 * sizeof (regoff_t));
898 ends =
899 (regoff_t *) xmalloc (2 * sizeof (regoff_t));
9ac0d9e0 900 BLOCK_INPUT;
1113d9db
JB
901 re_set_registers (&searchbuf,
902 &search_regs,
903 2, starts, ends);
9ac0d9e0 904 UNBLOCK_INPUT;
1113d9db
JB
905 }
906
ca1d1d23
JB
907 search_regs.start[0]
908 = pos + cursor - p2 + ((direction > 0)
909 ? 1 - len : 0);
910 search_regs.end[0] = len + search_regs.start[0];
daa37602 911 XSET (last_thing_searched, Lisp_Buffer, current_buffer);
ca1d1d23
JB
912 if ((n -= direction) != 0)
913 cursor += dirlen; /* to resume search */
914 else
915 return ((direction > 0)
916 ? search_regs.end[0] : search_regs.start[0]);
917 }
918 else
919 cursor += stride_for_teases; /* <sigh> we lose - */
920 }
921 pos += cursor - p2;
922 }
923 else
924 /* Now we'll pick up a clump that has to be done the hard */
925 /* way because it covers a discontinuity */
926 {
927 limit = ((direction > 0)
928 ? BUFFER_CEILING_OF (pos - dirlen + 1)
929 : BUFFER_FLOOR_OF (pos - dirlen - 1));
930 limit = ((direction > 0)
931 ? min (limit + len, lim - 1)
932 : max (limit - len, lim));
933 /* LIMIT is now the last value POS can have
934 and still be valid for a possible match. */
935 while (1)
936 {
937 /* This loop can be coded for space rather than */
938 /* speed because it will usually run only once. */
939 /* (the reach is at most len + 21, and typically */
940 /* does not exceed len) */
941 while ((limit - pos) * direction >= 0)
942 pos += BM_tab[FETCH_CHAR(pos)];
943 /* now run the same tests to distinguish going off the */
944 /* end, a match or a phoney match. */
945 if ((pos - limit) * direction <= len)
946 break; /* ran off the end */
947 /* Found what might be a match.
948 Set POS back to last (first if reverse) char pos. */
949 pos -= infinity;
950 i = dirlen - direction;
951 while ((i -= direction) + direction != 0)
952 {
953 pos -= direction;
954 if (pat[i] != (((int) trt)
955 ? trt[FETCH_CHAR(pos)]
956 : FETCH_CHAR (pos)))
957 break;
958 }
959 /* Above loop has moved POS part or all the way
960 back to the first char pos (last char pos if reverse).
961 Set it once again at the last (first if reverse) char. */
962 pos += dirlen - i- direction;
963 if (i + direction == 0)
964 {
965 pos -= direction;
1113d9db
JB
966
967 /* Make sure we have registers in which to store
968 the match position. */
969 if (search_regs.num_regs == 0)
970 {
971 regoff_t *starts, *ends;
972
973 starts =
974 (regoff_t *) xmalloc (2 * sizeof (regoff_t));
975 ends =
976 (regoff_t *) xmalloc (2 * sizeof (regoff_t));
9ac0d9e0 977 BLOCK_INPUT;
1113d9db
JB
978 re_set_registers (&searchbuf,
979 &search_regs,
980 2, starts, ends);
9ac0d9e0 981 UNBLOCK_INPUT;
1113d9db
JB
982 }
983
ca1d1d23
JB
984 search_regs.start[0]
985 = pos + ((direction > 0) ? 1 - len : 0);
986 search_regs.end[0] = len + search_regs.start[0];
daa37602 987 XSET (last_thing_searched, Lisp_Buffer, current_buffer);
ca1d1d23
JB
988 if ((n -= direction) != 0)
989 pos += dirlen; /* to resume search */
990 else
991 return ((direction > 0)
992 ? search_regs.end[0] : search_regs.start[0]);
993 }
994 else
995 pos += stride_for_teases;
996 }
997 }
998 /* We have done one clump. Can we continue? */
999 if ((lim - pos) * direction < 0)
1000 return ((0 - n) * direction);
1001 }
1002 return pos;
1003 }
1004}
1005\f
1006/* Given a string of words separated by word delimiters,
1007 compute a regexp that matches those exact words
1008 separated by arbitrary punctuation. */
1009
1010static Lisp_Object
1011wordify (string)
1012 Lisp_Object string;
1013{
1014 register unsigned char *p, *o;
1015 register int i, len, punct_count = 0, word_count = 0;
1016 Lisp_Object val;
1017
1018 CHECK_STRING (string, 0);
1019 p = XSTRING (string)->data;
1020 len = XSTRING (string)->size;
1021
1022 for (i = 0; i < len; i++)
1023 if (SYNTAX (p[i]) != Sword)
1024 {
1025 punct_count++;
1026 if (i > 0 && SYNTAX (p[i-1]) == Sword) word_count++;
1027 }
1028 if (SYNTAX (p[len-1]) == Sword) word_count++;
1029 if (!word_count) return build_string ("");
1030
1031 val = make_string (p, len - punct_count + 5 * (word_count - 1) + 4);
1032
1033 o = XSTRING (val)->data;
1034 *o++ = '\\';
1035 *o++ = 'b';
1036
1037 for (i = 0; i < len; i++)
1038 if (SYNTAX (p[i]) == Sword)
1039 *o++ = p[i];
1040 else if (i > 0 && SYNTAX (p[i-1]) == Sword && --word_count)
1041 {
1042 *o++ = '\\';
1043 *o++ = 'W';
1044 *o++ = '\\';
1045 *o++ = 'W';
1046 *o++ = '*';
1047 }
1048
1049 *o++ = '\\';
1050 *o++ = 'b';
1051
1052 return val;
1053}
1054\f
1055DEFUN ("search-backward", Fsearch_backward, Ssearch_backward, 1, 4,
1056 "sSearch backward: ",
1057 "Search backward from point for STRING.\n\
1058Set point to the beginning of the occurrence found, and return point.\n\
1059An optional second argument bounds the search; it is a buffer position.\n\
1060The match found must not extend before that position.\n\
1061Optional third argument, if t, means if fail just return nil (no error).\n\
1062 If not nil and not t, position at limit of search and return nil.\n\
1063Optional fourth argument is repeat count--search for successive occurrences.\n\
1064See also the functions `match-beginning', `match-end' and `replace-match'.")
1065 (string, bound, noerror, count)
1066 Lisp_Object string, bound, noerror, count;
1067{
1068 return search_command (string, bound, noerror, count, -1, 0);
1069}
1070
1071DEFUN ("search-forward", Fsearch_forward, Ssearch_forward, 1, 4, "sSearch: ",
1072 "Search forward from point for STRING.\n\
1073Set point to the end of the occurrence found, and return point.\n\
1074An optional second argument bounds the search; it is a buffer position.\n\
1075The match found must not extend after that position. nil is equivalent\n\
1076 to (point-max).\n\
1077Optional third argument, if t, means if fail just return nil (no error).\n\
1078 If not nil and not t, move to limit of search and return nil.\n\
1079Optional fourth argument is repeat count--search for successive occurrences.\n\
1080See also the functions `match-beginning', `match-end' and `replace-match'.")
1081 (string, bound, noerror, count)
1082 Lisp_Object string, bound, noerror, count;
1083{
1084 return search_command (string, bound, noerror, count, 1, 0);
1085}
1086
1087DEFUN ("word-search-backward", Fword_search_backward, Sword_search_backward, 1, 4,
1088 "sWord search backward: ",
1089 "Search backward from point for STRING, ignoring differences in punctuation.\n\
1090Set point to the beginning of the occurrence found, and return point.\n\
1091An optional second argument bounds the search; it is a buffer position.\n\
1092The match found must not extend before that position.\n\
1093Optional third argument, if t, means if fail just return nil (no error).\n\
1094 If not nil and not t, move to limit of search and return nil.\n\
1095Optional fourth argument is repeat count--search for successive occurrences.")
1096 (string, bound, noerror, count)
1097 Lisp_Object string, bound, noerror, count;
1098{
1099 return search_command (wordify (string), bound, noerror, count, -1, 1);
1100}
1101
1102DEFUN ("word-search-forward", Fword_search_forward, Sword_search_forward, 1, 4,
1103 "sWord search: ",
1104 "Search forward from point for STRING, ignoring differences in punctuation.\n\
1105Set point to the end of the occurrence found, and return point.\n\
1106An optional second argument bounds the search; it is a buffer position.\n\
1107The match found must not extend after that position.\n\
1108Optional third argument, if t, means if fail just return nil (no error).\n\
1109 If not nil and not t, move to limit of search and return nil.\n\
1110Optional fourth argument is repeat count--search for successive occurrences.")
1111 (string, bound, noerror, count)
1112 Lisp_Object string, bound, noerror, count;
1113{
1114 return search_command (wordify (string), bound, noerror, count, 1, 1);
1115}
1116
1117DEFUN ("re-search-backward", Fre_search_backward, Sre_search_backward, 1, 4,
1118 "sRE search backward: ",
1119 "Search backward from point for match for regular expression REGEXP.\n\
1120Set point to the beginning of the match, and return point.\n\
1121The match found is the one starting last in the buffer\n\
1122and yet ending before the place the origin of the search.\n\
1123An optional second argument bounds the search; it is a buffer position.\n\
1124The match found must start at or after that position.\n\
1125Optional third argument, if t, means if fail just return nil (no error).\n\
1126 If not nil and not t, move to limit of search and return nil.\n\
1127Optional fourth argument is repeat count--search for successive occurrences.\n\
1128See also the functions `match-beginning', `match-end' and `replace-match'.")
1129 (string, bound, noerror, count)
1130 Lisp_Object string, bound, noerror, count;
1131{
1132 return search_command (string, bound, noerror, count, -1, 1);
1133}
1134
1135DEFUN ("re-search-forward", Fre_search_forward, Sre_search_forward, 1, 4,
1136 "sRE search: ",
1137 "Search forward from point for regular expression REGEXP.\n\
1138Set point to the end of the occurrence found, and return point.\n\
1139An optional second argument bounds the search; it is a buffer position.\n\
1140The match found must not extend after that position.\n\
1141Optional third argument, if t, means if fail just return nil (no error).\n\
1142 If not nil and not t, move to limit of search and return nil.\n\
1143Optional fourth argument is repeat count--search for successive occurrences.\n\
1144See also the functions `match-beginning', `match-end' and `replace-match'.")
1145 (string, bound, noerror, count)
1146 Lisp_Object string, bound, noerror, count;
1147{
1148 return search_command (string, bound, noerror, count, 1, 1);
1149}
1150\f
1151DEFUN ("replace-match", Freplace_match, Sreplace_match, 1, 3, 0,
1152 "Replace text matched by last search with NEWTEXT.\n\
1153If second arg FIXEDCASE is non-nil, do not alter case of replacement text.\n\
1154Otherwise convert to all caps or cap initials, like replaced text.\n\
1155If third arg LITERAL is non-nil, insert NEWTEXT literally.\n\
1156Otherwise treat `\\' as special:\n\
1157 `\\&' in NEWTEXT means substitute original matched text.\n\
1158 `\\N' means substitute what matched the Nth `\\(...\\)'.\n\
1159 If Nth parens didn't match, substitute nothing.\n\
1160 `\\\\' means insert one `\\'.\n\
1113d9db 1161FIXEDCASE and LITERAL are optional arguments.\n\
ca1d1d23
JB
1162Leaves point at end of replacement text.")
1163 (string, fixedcase, literal)
1164 Lisp_Object string, fixedcase, literal;
1165{
1166 enum { nochange, all_caps, cap_initial } case_action;
1167 register int pos, last;
1168 int some_multiletter_word;
97832bd0
RS
1169 int some_lowercase;
1170 int some_uppercase_initial;
ca1d1d23
JB
1171 register int c, prevc;
1172 int inslen;
1173
1174 CHECK_STRING (string, 0);
1175
1176 case_action = nochange; /* We tried an initialization */
1177 /* but some C compilers blew it */
4746118a
JB
1178
1179 if (search_regs.num_regs <= 0)
1180 error ("replace-match called before any match found");
1181
ca1d1d23
JB
1182 if (search_regs.start[0] < BEGV
1183 || search_regs.start[0] > search_regs.end[0]
1184 || search_regs.end[0] > ZV)
97832bd0
RS
1185 args_out_of_range (make_number (search_regs.start[0]),
1186 make_number (search_regs.end[0]));
ca1d1d23
JB
1187
1188 if (NILP (fixedcase))
1189 {
1190 /* Decide how to casify by examining the matched text. */
1191
1192 last = search_regs.end[0];
1193 prevc = '\n';
1194 case_action = all_caps;
1195
1196 /* some_multiletter_word is set nonzero if any original word
1197 is more than one letter long. */
1198 some_multiletter_word = 0;
97832bd0
RS
1199 some_lowercase = 0;
1200 some_uppercase_initial = 0;
ca1d1d23
JB
1201
1202 for (pos = search_regs.start[0]; pos < last; pos++)
1203 {
1204 c = FETCH_CHAR (pos);
1205 if (LOWERCASEP (c))
1206 {
1207 /* Cannot be all caps if any original char is lower case */
1208
97832bd0 1209 some_lowercase = 1;
ca1d1d23 1210 if (SYNTAX (prevc) != Sword)
97832bd0 1211 ;
ca1d1d23
JB
1212 else
1213 some_multiletter_word = 1;
1214 }
1215 else if (!NOCASEP (c))
1216 {
97832bd0
RS
1217 if (SYNTAX (prevc) != Sword)
1218 some_uppercase_initial = 1;
1219 else
ca1d1d23
JB
1220 some_multiletter_word = 1;
1221 }
1222
1223 prevc = c;
1224 }
1225
97832bd0
RS
1226 /* Convert to all caps if the old text is all caps
1227 and has at least one multiletter word. */
1228 if (! some_lowercase && some_multiletter_word)
1229 case_action = all_caps;
1230 /* Capitalize each word, if the old text has a capitalized word. */
1231 else if (some_uppercase_initial)
ca1d1d23 1232 case_action = cap_initial;
97832bd0
RS
1233 else
1234 case_action = nochange;
ca1d1d23
JB
1235 }
1236
1237 SET_PT (search_regs.end[0]);
1238 if (!NILP (literal))
1239 Finsert (1, &string);
1240 else
1241 {
1242 struct gcpro gcpro1;
1243 GCPRO1 (string);
1244
1245 for (pos = 0; pos < XSTRING (string)->size; pos++)
1246 {
1247 c = XSTRING (string)->data[pos];
1248 if (c == '\\')
1249 {
1250 c = XSTRING (string)->data[++pos];
1251 if (c == '&')
1252 Finsert_buffer_substring (Fcurrent_buffer (),
1253 make_number (search_regs.start[0]),
1254 make_number (search_regs.end[0]));
4746118a 1255 else if (c >= '1' && c <= search_regs.num_regs + '0')
ca1d1d23
JB
1256 {
1257 if (search_regs.start[c - '0'] >= 1)
1258 Finsert_buffer_substring (Fcurrent_buffer (),
1259 make_number (search_regs.start[c - '0']),
1260 make_number (search_regs.end[c - '0']));
1261 }
1262 else
1263 insert_char (c);
1264 }
1265 else
1266 insert_char (c);
1267 }
1268 UNGCPRO;
1269 }
1270
1271 inslen = point - (search_regs.end[0]);
1272 del_range (search_regs.start[0], search_regs.end[0]);
1273
1274 if (case_action == all_caps)
1275 Fupcase_region (make_number (point - inslen), make_number (point));
1276 else if (case_action == cap_initial)
1277 upcase_initials_region (make_number (point - inslen), make_number (point));
1278 return Qnil;
1279}
1280\f
1281static Lisp_Object
1282match_limit (num, beginningp)
1283 Lisp_Object num;
1284 int beginningp;
1285{
1286 register int n;
1287
1288 CHECK_NUMBER (num, 0);
1289 n = XINT (num);
4746118a
JB
1290 if (n < 0 || n >= search_regs.num_regs)
1291 args_out_of_range (num, make_number (search_regs.num_regs));
1292 if (search_regs.num_regs <= 0
1293 || search_regs.start[n] < 0)
ca1d1d23
JB
1294 return Qnil;
1295 return (make_number ((beginningp) ? search_regs.start[n]
1296 : search_regs.end[n]));
1297}
1298
1299DEFUN ("match-beginning", Fmatch_beginning, Smatch_beginning, 1, 1, 0,
1300 "Return position of start of text matched by last search.\n\
1301ARG, a number, specifies which parenthesized expression in the last regexp.\n\
1302 Value is nil if ARGth pair didn't match, or there were less than ARG pairs.\n\
1303Zero means the entire text matched by the whole regexp or whole string.")
1304 (num)
1305 Lisp_Object num;
1306{
1307 return match_limit (num, 1);
1308}
1309
1310DEFUN ("match-end", Fmatch_end, Smatch_end, 1, 1, 0,
1311 "Return position of end of text matched by last search.\n\
1312ARG, a number, specifies which parenthesized expression in the last regexp.\n\
1313 Value is nil if ARGth pair didn't match, or there were less than ARG pairs.\n\
1314Zero means the entire text matched by the whole regexp or whole string.")
1315 (num)
1316 Lisp_Object num;
1317{
1318 return match_limit (num, 0);
1319}
1320
1321DEFUN ("match-data", Fmatch_data, Smatch_data, 0, 0, 0,
1322 "Return a list containing all info on what the last search matched.\n\
1323Element 2N is `(match-beginning N)'; element 2N + 1 is `(match-end N)'.\n\
1324All the elements are markers or nil (nil if the Nth pair didn't match)\n\
1325if the last match was on a buffer; integers or nil if a string was matched.\n\
1326Use `store-match-data' to reinstate the data in this list.")
1327 ()
1328{
4746118a 1329 Lisp_Object *data;
ca1d1d23
JB
1330 int i, len;
1331
daa37602
JB
1332 if (NILP (last_thing_searched))
1333 error ("match-data called before any match found");
1334
4746118a
JB
1335 data = (Lisp_Object *) alloca ((2 * search_regs.num_regs)
1336 * sizeof (Lisp_Object));
1337
ca1d1d23 1338 len = -1;
4746118a 1339 for (i = 0; i < search_regs.num_regs; i++)
ca1d1d23
JB
1340 {
1341 int start = search_regs.start[i];
1342 if (start >= 0)
1343 {
daa37602 1344 if (EQ (last_thing_searched, Qt))
ca1d1d23
JB
1345 {
1346 XFASTINT (data[2 * i]) = start;
1347 XFASTINT (data[2 * i + 1]) = search_regs.end[i];
1348 }
daa37602 1349 else if (XTYPE (last_thing_searched) == Lisp_Buffer)
ca1d1d23
JB
1350 {
1351 data[2 * i] = Fmake_marker ();
daa37602
JB
1352 Fset_marker (data[2 * i],
1353 make_number (start),
1354 last_thing_searched);
ca1d1d23
JB
1355 data[2 * i + 1] = Fmake_marker ();
1356 Fset_marker (data[2 * i + 1],
daa37602
JB
1357 make_number (search_regs.end[i]),
1358 last_thing_searched);
ca1d1d23 1359 }
daa37602
JB
1360 else
1361 /* last_thing_searched must always be Qt, a buffer, or Qnil. */
1362 abort ();
1363
ca1d1d23
JB
1364 len = i;
1365 }
1366 else
1367 data[2 * i] = data [2 * i + 1] = Qnil;
1368 }
1369 return Flist (2 * len + 2, data);
1370}
1371
1372
1373DEFUN ("store-match-data", Fstore_match_data, Sstore_match_data, 1, 1, 0,
1374 "Set internal data on last search match from elements of LIST.\n\
1375LIST should have been created by calling `match-data' previously.")
1376 (list)
1377 register Lisp_Object list;
1378{
1379 register int i;
1380 register Lisp_Object marker;
1381
1382 if (!CONSP (list) && !NILP (list))
b37902c8 1383 list = wrong_type_argument (Qconsp, list);
ca1d1d23 1384
daa37602
JB
1385 /* Unless we find a marker with a buffer in LIST, assume that this
1386 match data came from a string. */
1387 last_thing_searched = Qt;
1388
4746118a
JB
1389 /* Allocate registers if they don't already exist. */
1390 {
d084e942 1391 int length = XFASTINT (Flength (list)) / 2;
4746118a
JB
1392
1393 if (length > search_regs.num_regs)
1394 {
1113d9db
JB
1395 if (search_regs.num_regs == 0)
1396 {
1397 search_regs.start
1398 = (regoff_t *) xmalloc (length * sizeof (regoff_t));
1399 search_regs.end
1400 = (regoff_t *) xmalloc (length * sizeof (regoff_t));
1401 }
4746118a 1402 else
1113d9db
JB
1403 {
1404 search_regs.start
1405 = (regoff_t *) xrealloc (search_regs.start,
1406 length * sizeof (regoff_t));
1407 search_regs.end
1408 = (regoff_t *) xrealloc (search_regs.end,
1409 length * sizeof (regoff_t));
1410 }
4746118a 1411
9ac0d9e0 1412 BLOCK_INPUT;
1113d9db
JB
1413 re_set_registers (&searchbuf, &search_regs, length,
1414 search_regs.start, search_regs.end);
9ac0d9e0 1415 UNBLOCK_INPUT;
4746118a
JB
1416 }
1417 }
1418
1419 for (i = 0; i < search_regs.num_regs; i++)
ca1d1d23
JB
1420 {
1421 marker = Fcar (list);
1422 if (NILP (marker))
1423 {
1424 search_regs.start[i] = -1;
1425 list = Fcdr (list);
1426 }
1427 else
1428 {
daa37602
JB
1429 if (XTYPE (marker) == Lisp_Marker)
1430 {
1431 if (XMARKER (marker)->buffer == 0)
1432 XFASTINT (marker) = 0;
1433 else
1434 XSET (last_thing_searched, Lisp_Buffer,
1435 XMARKER (marker)->buffer);
1436 }
ca1d1d23
JB
1437
1438 CHECK_NUMBER_COERCE_MARKER (marker, 0);
1439 search_regs.start[i] = XINT (marker);
1440 list = Fcdr (list);
1441
1442 marker = Fcar (list);
1443 if (XTYPE (marker) == Lisp_Marker
1444 && XMARKER (marker)->buffer == 0)
1445 XFASTINT (marker) = 0;
1446
1447 CHECK_NUMBER_COERCE_MARKER (marker, 0);
1448 search_regs.end[i] = XINT (marker);
1449 }
1450 list = Fcdr (list);
1451 }
1452
1453 return Qnil;
1454}
1455
1456/* Quote a string to inactivate reg-expr chars */
1457
1458DEFUN ("regexp-quote", Fregexp_quote, Sregexp_quote, 1, 1, 0,
1459 "Return a regexp string which matches exactly STRING and nothing else.")
1460 (str)
1461 Lisp_Object str;
1462{
1463 register unsigned char *in, *out, *end;
1464 register unsigned char *temp;
1465
1466 CHECK_STRING (str, 0);
1467
1468 temp = (unsigned char *) alloca (XSTRING (str)->size * 2);
1469
1470 /* Now copy the data into the new string, inserting escapes. */
1471
1472 in = XSTRING (str)->data;
1473 end = in + XSTRING (str)->size;
1474 out = temp;
1475
1476 for (; in != end; in++)
1477 {
1478 if (*in == '[' || *in == ']'
1479 || *in == '*' || *in == '.' || *in == '\\'
1480 || *in == '?' || *in == '+'
1481 || *in == '^' || *in == '$')
1482 *out++ = '\\';
1483 *out++ = *in;
1484 }
1485
1486 return make_string (temp, out - temp);
1487}
1488\f
1489syms_of_search ()
1490{
1491 register int i;
1492
1493 searchbuf.allocated = 100;
8c0e7b73 1494 searchbuf.buffer = (unsigned char *) malloc (searchbuf.allocated);
ca1d1d23
JB
1495 searchbuf.fastmap = search_fastmap;
1496
1497 Qsearch_failed = intern ("search-failed");
1498 staticpro (&Qsearch_failed);
1499 Qinvalid_regexp = intern ("invalid-regexp");
1500 staticpro (&Qinvalid_regexp);
1501
1502 Fput (Qsearch_failed, Qerror_conditions,
1503 Fcons (Qsearch_failed, Fcons (Qerror, Qnil)));
1504 Fput (Qsearch_failed, Qerror_message,
1505 build_string ("Search failed"));
1506
1507 Fput (Qinvalid_regexp, Qerror_conditions,
1508 Fcons (Qinvalid_regexp, Fcons (Qerror, Qnil)));
1509 Fput (Qinvalid_regexp, Qerror_message,
1510 build_string ("Invalid regexp"));
1511
1512 last_regexp = Qnil;
1513 staticpro (&last_regexp);
1514
daa37602
JB
1515 last_thing_searched = Qnil;
1516 staticpro (&last_thing_searched);
1517
ca1d1d23
JB
1518 defsubr (&Sstring_match);
1519 defsubr (&Slooking_at);
1520 defsubr (&Sskip_chars_forward);
1521 defsubr (&Sskip_chars_backward);
17431c60
RS
1522 defsubr (&Sskip_syntax_forward);
1523 defsubr (&Sskip_syntax_backward);
ca1d1d23
JB
1524 defsubr (&Ssearch_forward);
1525 defsubr (&Ssearch_backward);
1526 defsubr (&Sword_search_forward);
1527 defsubr (&Sword_search_backward);
1528 defsubr (&Sre_search_forward);
1529 defsubr (&Sre_search_backward);
1530 defsubr (&Sreplace_match);
1531 defsubr (&Smatch_beginning);
1532 defsubr (&Smatch_end);
1533 defsubr (&Smatch_data);
1534 defsubr (&Sstore_match_data);
1535 defsubr (&Sregexp_quote);
1536}