(compute_motion): Initialize prev_hpos.
[bpt/emacs.git] / src / search.c
CommitLineData
ca1d1d23 1/* String search routines for GNU Emacs.
c6c5df7f 2 Copyright (C) 1985, 1986, 1987, 1993 Free Software Foundation, Inc.
ca1d1d23
JB
3
4This file is part of GNU Emacs.
5
6GNU Emacs is free software; you can redistribute it and/or modify
7it under the terms of the GNU General Public License as published by
8the Free Software Foundation; either version 1, or (at your option)
9any later version.
10
11GNU Emacs is distributed in the hope that it will be useful,
12but WITHOUT ANY WARRANTY; without even the implied warranty of
13MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14GNU General Public License for more details.
15
16You should have received a copy of the GNU General Public License
17along with GNU Emacs; see the file COPYING. If not, write to
18the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA. */
19
20
18160b98 21#include <config.h>
ca1d1d23
JB
22#include "lisp.h"
23#include "syntax.h"
24#include "buffer.h"
25#include "commands.h"
9ac0d9e0 26#include "blockinput.h"
4746118a 27
ca1d1d23
JB
28#include <sys/types.h>
29#include "regex.h"
30
31#define max(a, b) ((a) > (b) ? (a) : (b))
32#define min(a, b) ((a) < (b) ? (a) : (b))
33
34/* We compile regexps into this buffer and then use it for searching. */
35
36struct re_pattern_buffer searchbuf;
37
38char search_fastmap[0400];
39
40/* Last regexp we compiled */
41
42Lisp_Object last_regexp;
43
4746118a
JB
44/* Every call to re_match, etc., must pass &search_regs as the regs
45 argument unless you can show it is unnecessary (i.e., if re_match
46 is certainly going to be called again before region-around-match
47 can be called).
48
49 Since the registers are now dynamically allocated, we need to make
50 sure not to refer to the Nth register before checking that it has
1113d9db
JB
51 been allocated by checking search_regs.num_regs.
52
53 The regex code keeps track of whether it has allocated the search
54 buffer using bits in searchbuf. This means that whenever you
55 compile a new pattern, it completely forgets whether it has
56 allocated any registers, and will allocate new registers the next
57 time you call a searching or matching function. Therefore, we need
58 to call re_set_registers after compiling a new pattern or after
59 setting the match registers, so that the regex functions will be
60 able to free or re-allocate it properly. */
ca1d1d23
JB
61static struct re_registers search_regs;
62
daa37602
JB
63/* The buffer in which the last search was performed, or
64 Qt if the last search was done in a string;
65 Qnil if no searching has been done yet. */
66static Lisp_Object last_thing_searched;
ca1d1d23
JB
67
68/* error condition signalled when regexp compile_pattern fails */
69
70Lisp_Object Qinvalid_regexp;
71
ca325161
RS
72static void set_search_regs ();
73
ca1d1d23
JB
74static void
75matcher_overflow ()
76{
77 error ("Stack overflow in regexp matcher");
78}
79
80#ifdef __STDC__
81#define CONST const
82#else
83#define CONST
84#endif
85
86/* Compile a regexp and signal a Lisp error if anything goes wrong. */
87
1113d9db 88compile_pattern (pattern, bufp, regp, translate)
ca1d1d23
JB
89 Lisp_Object pattern;
90 struct re_pattern_buffer *bufp;
1113d9db 91 struct re_registers *regp;
ca1d1d23
JB
92 char *translate;
93{
94 CONST char *val;
95 Lisp_Object dummy;
96
97 if (EQ (pattern, last_regexp)
98 && translate == bufp->translate)
99 return;
1113d9db 100
ca1d1d23
JB
101 last_regexp = Qnil;
102 bufp->translate = translate;
9ac0d9e0 103 BLOCK_INPUT;
b90d9e80
RS
104 val = (CONST char *) re_compile_pattern ((char *) XSTRING (pattern)->data,
105 XSTRING (pattern)->size, bufp);
9ac0d9e0 106 UNBLOCK_INPUT;
ca1d1d23
JB
107 if (val)
108 {
109 dummy = build_string (val);
110 while (1)
111 Fsignal (Qinvalid_regexp, Fcons (dummy, Qnil));
112 }
1113d9db 113
ca1d1d23 114 last_regexp = pattern;
1113d9db
JB
115
116 /* Advise the searching functions about the space we have allocated
117 for register data. */
9ac0d9e0 118 BLOCK_INPUT;
ebb9e16f
JB
119 if (regp)
120 re_set_registers (bufp, regp, regp->num_regs, regp->start, regp->end);
9ac0d9e0 121 UNBLOCK_INPUT;
1113d9db 122
ca1d1d23
JB
123 return;
124}
125
126/* Error condition used for failing searches */
127Lisp_Object Qsearch_failed;
128
129Lisp_Object
130signal_failure (arg)
131 Lisp_Object arg;
132{
133 Fsignal (Qsearch_failed, Fcons (arg, Qnil));
134 return Qnil;
135}
136\f
137DEFUN ("looking-at", Flooking_at, Slooking_at, 1, 1, 0,
e065a56e
JB
138 "Return t if text after point matches regular expression PAT.\n\
139This function modifies the match data that `match-beginning',\n\
140`match-end' and `match-data' access; save and restore the match\n\
fe99283d 141data if you want to preserve them.")
ca1d1d23
JB
142 (string)
143 Lisp_Object string;
144{
145 Lisp_Object val;
146 unsigned char *p1, *p2;
147 int s1, s2;
148 register int i;
149
150 CHECK_STRING (string, 0);
1113d9db 151 compile_pattern (string, &searchbuf, &search_regs,
ca1d1d23
JB
152 !NILP (current_buffer->case_fold_search) ? DOWNCASE_TABLE : 0);
153
154 immediate_quit = 1;
155 QUIT; /* Do a pending quit right away, to avoid paradoxical behavior */
156
157 /* Get pointers and sizes of the two strings
158 that make up the visible portion of the buffer. */
159
160 p1 = BEGV_ADDR;
161 s1 = GPT - BEGV;
162 p2 = GAP_END_ADDR;
163 s2 = ZV - GPT;
164 if (s1 < 0)
165 {
166 p2 = p1;
167 s2 = ZV - BEGV;
168 s1 = 0;
169 }
170 if (s2 < 0)
171 {
172 s1 = ZV - BEGV;
173 s2 = 0;
174 }
175
176 i = re_match_2 (&searchbuf, (char *) p1, s1, (char *) p2, s2,
177 point - BEGV, &search_regs,
178 ZV - BEGV);
179 if (i == -2)
180 matcher_overflow ();
181
182 val = (0 <= i ? Qt : Qnil);
4746118a 183 for (i = 0; i < search_regs.num_regs; i++)
ca1d1d23
JB
184 if (search_regs.start[i] >= 0)
185 {
186 search_regs.start[i] += BEGV;
187 search_regs.end[i] += BEGV;
188 }
daa37602 189 XSET (last_thing_searched, Lisp_Buffer, current_buffer);
ca1d1d23
JB
190 immediate_quit = 0;
191 return val;
192}
193
194DEFUN ("string-match", Fstring_match, Sstring_match, 2, 3, 0,
195 "Return index of start of first match for REGEXP in STRING, or nil.\n\
196If third arg START is non-nil, start search at that index in STRING.\n\
197For index of first char beyond the match, do (match-end 0).\n\
198`match-end' and `match-beginning' also give indices of substrings\n\
199matched by parenthesis constructs in the pattern.")
200 (regexp, string, start)
201 Lisp_Object regexp, string, start;
202{
203 int val;
204 int s;
205
206 CHECK_STRING (regexp, 0);
207 CHECK_STRING (string, 1);
208
209 if (NILP (start))
210 s = 0;
211 else
212 {
213 int len = XSTRING (string)->size;
214
215 CHECK_NUMBER (start, 2);
216 s = XINT (start);
217 if (s < 0 && -s <= len)
218 s = len - s;
219 else if (0 > s || s > len)
220 args_out_of_range (string, start);
221 }
222
1113d9db 223 compile_pattern (regexp, &searchbuf, &search_regs,
ca1d1d23
JB
224 !NILP (current_buffer->case_fold_search) ? DOWNCASE_TABLE : 0);
225 immediate_quit = 1;
226 val = re_search (&searchbuf, (char *) XSTRING (string)->data,
227 XSTRING (string)->size, s, XSTRING (string)->size - s,
228 &search_regs);
229 immediate_quit = 0;
daa37602 230 last_thing_searched = Qt;
ca1d1d23
JB
231 if (val == -2)
232 matcher_overflow ();
233 if (val < 0) return Qnil;
234 return make_number (val);
235}
e59a8453
RS
236
237/* Match REGEXP against STRING, searching all of STRING,
238 and return the index of the match, or negative on failure.
239 This does not clobber the match data. */
240
241int
242fast_string_match (regexp, string)
243 Lisp_Object regexp, string;
244{
245 int val;
246
247 compile_pattern (regexp, &searchbuf, 0, 0);
248 immediate_quit = 1;
249 val = re_search (&searchbuf, (char *) XSTRING (string)->data,
250 XSTRING (string)->size, 0, XSTRING (string)->size,
251 0);
252 immediate_quit = 0;
253 return val;
254}
ca1d1d23 255\f
ffd56f97
JB
256/* Search for COUNT instances of the character TARGET, starting at START.
257 If COUNT is negative, search backwards.
258
259 If we find COUNT instances, set *SHORTAGE to zero, and return the
5bfe95c9
RS
260 position after the COUNTth match. Note that for reverse motion
261 this is not the same as the usual convention for Emacs motion commands.
ffd56f97
JB
262
263 If we don't find COUNT instances before reaching the end of the
264 buffer (or the beginning, if scanning backwards), set *SHORTAGE to
265 the number of TARGETs left unfound, and return the end of the
087a5f81 266 buffer we bumped up against.
ffd56f97 267
087a5f81
RS
268 If ALLOW_QUIT is non-zero, set immediate_quit. That's good to do
269 except when inside redisplay. */
270
271scan_buffer (target, start, count, shortage, allow_quit)
ffd56f97
JB
272 int *shortage, start;
273 register int count, target;
087a5f81 274 int allow_quit;
ca1d1d23 275{
ffd56f97
JB
276 int limit = ((count > 0) ? ZV - 1 : BEGV);
277 int direction = ((count > 0) ? 1 : -1);
278
279 register unsigned char *cursor;
ca1d1d23 280 unsigned char *base;
ffd56f97
JB
281
282 register int ceiling;
283 register unsigned char *ceiling_addr;
ca1d1d23
JB
284
285 if (shortage != 0)
286 *shortage = 0;
287
087a5f81 288 immediate_quit = allow_quit;
ca1d1d23 289
ffd56f97
JB
290 if (count > 0)
291 while (start != limit + 1)
ca1d1d23 292 {
ffd56f97
JB
293 ceiling = BUFFER_CEILING_OF (start);
294 ceiling = min (limit, ceiling);
295 ceiling_addr = &FETCH_CHAR (ceiling) + 1;
296 base = (cursor = &FETCH_CHAR (start));
ca1d1d23
JB
297 while (1)
298 {
ffd56f97 299 while (*cursor != target && ++cursor != ceiling_addr)
ca1d1d23 300 ;
ffd56f97 301 if (cursor != ceiling_addr)
ca1d1d23 302 {
ffd56f97 303 if (--count == 0)
ca1d1d23
JB
304 {
305 immediate_quit = 0;
ffd56f97 306 return (start + cursor - base + 1);
ca1d1d23
JB
307 }
308 else
ffd56f97 309 if (++cursor == ceiling_addr)
ca1d1d23
JB
310 break;
311 }
312 else
313 break;
314 }
ffd56f97 315 start += cursor - base;
ca1d1d23
JB
316 }
317 else
318 {
ffd56f97
JB
319 start--; /* first character we scan */
320 while (start > limit - 1)
321 { /* we WILL scan under start */
322 ceiling = BUFFER_FLOOR_OF (start);
323 ceiling = max (limit, ceiling);
324 ceiling_addr = &FETCH_CHAR (ceiling) - 1;
325 base = (cursor = &FETCH_CHAR (start));
ca1d1d23
JB
326 cursor++;
327 while (1)
328 {
ffd56f97 329 while (--cursor != ceiling_addr && *cursor != target)
ca1d1d23 330 ;
ffd56f97 331 if (cursor != ceiling_addr)
ca1d1d23 332 {
ffd56f97 333 if (++count == 0)
ca1d1d23
JB
334 {
335 immediate_quit = 0;
ffd56f97 336 return (start + cursor - base + 1);
ca1d1d23
JB
337 }
338 }
339 else
340 break;
341 }
ffd56f97 342 start += cursor - base;
ca1d1d23
JB
343 }
344 }
345 immediate_quit = 0;
346 if (shortage != 0)
ffd56f97
JB
347 *shortage = count * direction;
348 return (start + ((direction == 1 ? 0 : 1)));
ca1d1d23
JB
349}
350
351int
352find_next_newline (from, cnt)
353 register int from, cnt;
354{
087a5f81 355 return scan_buffer ('\n', from, cnt, (int *) 0, 1);
ca1d1d23
JB
356}
357\f
c1dc99a1
JB
358Lisp_Object skip_chars ();
359
ca1d1d23 360DEFUN ("skip-chars-forward", Fskip_chars_forward, Sskip_chars_forward, 1, 2, 0,
3acb9a69
RS
361 "Move point forward, stopping before a char not in STRING, or at pos LIM.\n\
362STRING is like the inside of a `[...]' in a regular expression\n\
ca1d1d23
JB
363except that `]' is never special and `\\' quotes `^', `-' or `\\'.\n\
364Thus, with arg \"a-zA-Z\", this skips letters stopping before first nonletter.\n\
c1dc99a1
JB
365With arg \"^a-zA-Z\", skips nonletters stopping before first letter.\n\
366Returns the distance traveled, either zero or positive.")
ca1d1d23
JB
367 (string, lim)
368 Lisp_Object string, lim;
369{
17431c60 370 return skip_chars (1, 0, string, lim);
ca1d1d23
JB
371}
372
373DEFUN ("skip-chars-backward", Fskip_chars_backward, Sskip_chars_backward, 1, 2, 0,
3acb9a69 374 "Move point backward, stopping after a char not in STRING, or at pos LIM.\n\
c1dc99a1
JB
375See `skip-chars-forward' for details.\n\
376Returns the distance traveled, either zero or negative.")
ca1d1d23
JB
377 (string, lim)
378 Lisp_Object string, lim;
379{
17431c60
RS
380 return skip_chars (0, 0, string, lim);
381}
382
383DEFUN ("skip-syntax-forward", Fskip_syntax_forward, Sskip_syntax_forward, 1, 2, 0,
384 "Move point forward across chars in specified syntax classes.\n\
385SYNTAX is a string of syntax code characters.\n\
386Stop before a char whose syntax is not in SYNTAX, or at position LIM.\n\
387If SYNTAX starts with ^, skip characters whose syntax is NOT in SYNTAX.\n\
388This function returns the distance traveled, either zero or positive.")
389 (syntax, lim)
390 Lisp_Object syntax, lim;
391{
392 return skip_chars (1, 1, syntax, lim);
393}
394
395DEFUN ("skip-syntax-backward", Fskip_syntax_backward, Sskip_syntax_backward, 1, 2, 0,
396 "Move point backward across chars in specified syntax classes.\n\
397SYNTAX is a string of syntax code characters.\n\
398Stop on reaching a char whose syntax is not in SYNTAX, or at position LIM.\n\
399If SYNTAX starts with ^, skip characters whose syntax is NOT in SYNTAX.\n\
400This function returns the distance traveled, either zero or negative.")
401 (syntax, lim)
402 Lisp_Object syntax, lim;
403{
404 return skip_chars (0, 1, syntax, lim);
ca1d1d23
JB
405}
406
c1dc99a1 407Lisp_Object
17431c60
RS
408skip_chars (forwardp, syntaxp, string, lim)
409 int forwardp, syntaxp;
ca1d1d23
JB
410 Lisp_Object string, lim;
411{
412 register unsigned char *p, *pend;
413 register unsigned char c;
414 unsigned char fastmap[0400];
415 int negate = 0;
416 register int i;
417
418 CHECK_STRING (string, 0);
419
420 if (NILP (lim))
421 XSET (lim, Lisp_Int, forwardp ? ZV : BEGV);
422 else
423 CHECK_NUMBER_COERCE_MARKER (lim, 1);
424
ca1d1d23 425 /* In any case, don't allow scan outside bounds of buffer. */
c5241910
RS
426 /* jla turned this off, for no known reason.
427 bfox turned the ZV part on, and rms turned the
428 BEGV part back on. */
429 if (XINT (lim) > ZV)
ca1d1d23 430 XFASTINT (lim) = ZV;
c5241910 431 if (XINT (lim) < BEGV)
ca1d1d23 432 XFASTINT (lim) = BEGV;
ca1d1d23
JB
433
434 p = XSTRING (string)->data;
435 pend = p + XSTRING (string)->size;
436 bzero (fastmap, sizeof fastmap);
437
438 if (p != pend && *p == '^')
439 {
440 negate = 1; p++;
441 }
442
17431c60
RS
443 /* Find the characters specified and set their elements of fastmap.
444 If syntaxp, each character counts as itself.
445 Otherwise, handle backslashes and ranges specially */
ca1d1d23
JB
446
447 while (p != pend)
448 {
449 c = *p++;
17431c60
RS
450 if (syntaxp)
451 fastmap[c] = 1;
452 else
ca1d1d23 453 {
17431c60 454 if (c == '\\')
ca1d1d23 455 {
17431c60
RS
456 if (p == pend) break;
457 c = *p++;
458 }
459 if (p != pend && *p == '-')
460 {
461 p++;
462 if (p == pend) break;
463 while (c <= *p)
464 {
465 fastmap[c] = 1;
466 c++;
467 }
468 p++;
ca1d1d23 469 }
17431c60
RS
470 else
471 fastmap[c] = 1;
ca1d1d23 472 }
ca1d1d23
JB
473 }
474
9239c6c1
RS
475 if (syntaxp && fastmap['-'] != 0)
476 fastmap[' '] = 1;
477
ca1d1d23
JB
478 /* If ^ was the first character, complement the fastmap. */
479
480 if (negate)
481 for (i = 0; i < sizeof fastmap; i++)
482 fastmap[i] ^= 1;
483
c1dc99a1
JB
484 {
485 int start_point = point;
486
487 immediate_quit = 1;
17431c60 488 if (syntaxp)
c1dc99a1 489 {
17431c60
RS
490
491 if (forwardp)
492 {
493 while (point < XINT (lim)
494 && fastmap[(unsigned char) syntax_code_spec[(int) SYNTAX (FETCH_CHAR (point))]])
495 SET_PT (point + 1);
496 }
497 else
498 {
499 while (point > XINT (lim)
500 && fastmap[(unsigned char) syntax_code_spec[(int) SYNTAX (FETCH_CHAR (point - 1))]])
501 SET_PT (point - 1);
502 }
c1dc99a1
JB
503 }
504 else
505 {
17431c60
RS
506 if (forwardp)
507 {
508 while (point < XINT (lim) && fastmap[FETCH_CHAR (point)])
509 SET_PT (point + 1);
510 }
511 else
512 {
513 while (point > XINT (lim) && fastmap[FETCH_CHAR (point - 1)])
514 SET_PT (point - 1);
515 }
c1dc99a1
JB
516 }
517 immediate_quit = 0;
518
519 return make_number (point - start_point);
520 }
ca1d1d23
JB
521}
522\f
523/* Subroutines of Lisp buffer search functions. */
524
525static Lisp_Object
526search_command (string, bound, noerror, count, direction, RE)
527 Lisp_Object string, bound, noerror, count;
528 int direction;
529 int RE;
530{
531 register int np;
532 int lim;
533 int n = direction;
534
535 if (!NILP (count))
536 {
537 CHECK_NUMBER (count, 3);
538 n *= XINT (count);
539 }
540
541 CHECK_STRING (string, 0);
542 if (NILP (bound))
543 lim = n > 0 ? ZV : BEGV;
544 else
545 {
546 CHECK_NUMBER_COERCE_MARKER (bound, 1);
547 lim = XINT (bound);
548 if (n > 0 ? lim < point : lim > point)
549 error ("Invalid search bound (wrong side of point)");
550 if (lim > ZV)
551 lim = ZV;
552 if (lim < BEGV)
553 lim = BEGV;
554 }
555
556 np = search_buffer (string, point, lim, n, RE,
557 (!NILP (current_buffer->case_fold_search)
558 ? XSTRING (current_buffer->case_canon_table)->data : 0),
559 (!NILP (current_buffer->case_fold_search)
560 ? XSTRING (current_buffer->case_eqv_table)->data : 0));
561 if (np <= 0)
562 {
563 if (NILP (noerror))
564 return signal_failure (string);
565 if (!EQ (noerror, Qt))
566 {
567 if (lim < BEGV || lim > ZV)
568 abort ();
a5f217b8
RS
569 SET_PT (lim);
570 return Qnil;
571#if 0 /* This would be clean, but maybe programs depend on
572 a value of nil here. */
481399bf 573 np = lim;
a5f217b8 574#endif
ca1d1d23 575 }
481399bf
RS
576 else
577 return Qnil;
ca1d1d23
JB
578 }
579
580 if (np < BEGV || np > ZV)
581 abort ();
582
583 SET_PT (np);
584
585 return make_number (np);
586}
587\f
ca325161 588/* Search for the n'th occurrence of STRING in the current buffer,
ca1d1d23
JB
589 starting at position POS and stopping at position LIM,
590 treating PAT as a literal string if RE is false or as
591 a regular expression if RE is true.
592
593 If N is positive, searching is forward and LIM must be greater than POS.
594 If N is negative, searching is backward and LIM must be less than POS.
595
596 Returns -x if only N-x occurrences found (x > 0),
597 or else the position at the beginning of the Nth occurrence
598 (if searching backward) or the end (if searching forward). */
599
600search_buffer (string, pos, lim, n, RE, trt, inverse_trt)
601 Lisp_Object string;
602 int pos;
603 int lim;
604 int n;
605 int RE;
606 register unsigned char *trt;
607 register unsigned char *inverse_trt;
608{
609 int len = XSTRING (string)->size;
610 unsigned char *base_pat = XSTRING (string)->data;
611 register int *BM_tab;
612 int *BM_tab_base;
613 register int direction = ((n > 0) ? 1 : -1);
614 register int dirlen;
615 int infinity, limit, k, stride_for_teases;
616 register unsigned char *pat, *cursor, *p_limit;
617 register int i, j;
618 unsigned char *p1, *p2;
619 int s1, s2;
620
621 /* Null string is found at starting position. */
3f57a499 622 if (len == 0)
ca325161
RS
623 {
624 set_search_regs (pos, 0);
625 return pos;
626 }
3f57a499
RS
627
628 /* Searching 0 times means don't move. */
629 if (n == 0)
ca1d1d23
JB
630 return pos;
631
632 if (RE)
1113d9db 633 compile_pattern (string, &searchbuf, &search_regs, (char *) trt);
ca1d1d23
JB
634
635 if (RE /* Here we detect whether the */
636 /* generality of an RE search is */
637 /* really needed. */
638 /* first item is "exact match" */
4746118a 639 && *(searchbuf.buffer) == (char) RE_EXACTN_VALUE
ca1d1d23
JB
640 && searchbuf.buffer[1] + 2 == searchbuf.used) /*first is ONLY item */
641 {
642 RE = 0; /* can do straight (non RE) search */
643 pat = (base_pat = (unsigned char *) searchbuf.buffer + 2);
644 /* trt already applied */
645 len = searchbuf.used - 2;
646 }
647 else if (!RE)
648 {
649 pat = (unsigned char *) alloca (len);
650
651 for (i = len; i--;) /* Copy the pattern; apply trt */
652 *pat++ = (((int) trt) ? trt [*base_pat++] : *base_pat++);
653 pat -= len; base_pat = pat;
654 }
655
656 if (RE)
657 {
658 immediate_quit = 1; /* Quit immediately if user types ^G,
659 because letting this function finish
660 can take too long. */
661 QUIT; /* Do a pending quit right away,
662 to avoid paradoxical behavior */
663 /* Get pointers and sizes of the two strings
664 that make up the visible portion of the buffer. */
665
666 p1 = BEGV_ADDR;
667 s1 = GPT - BEGV;
668 p2 = GAP_END_ADDR;
669 s2 = ZV - GPT;
670 if (s1 < 0)
671 {
672 p2 = p1;
673 s2 = ZV - BEGV;
674 s1 = 0;
675 }
676 if (s2 < 0)
677 {
678 s1 = ZV - BEGV;
679 s2 = 0;
680 }
681 while (n < 0)
682 {
42db823b 683 int val;
42db823b
RS
684 val = re_search_2 (&searchbuf, (char *) p1, s1, (char *) p2, s2,
685 pos - BEGV, lim - pos, &search_regs,
686 /* Don't allow match past current point */
687 pos - BEGV);
ca1d1d23
JB
688 if (val == -2)
689 matcher_overflow ();
690 if (val >= 0)
691 {
692 j = BEGV;
4746118a 693 for (i = 0; i < search_regs.num_regs; i++)
ca1d1d23
JB
694 if (search_regs.start[i] >= 0)
695 {
696 search_regs.start[i] += j;
697 search_regs.end[i] += j;
698 }
daa37602 699 XSET (last_thing_searched, Lisp_Buffer, current_buffer);
ca1d1d23
JB
700 /* Set pos to the new position. */
701 pos = search_regs.start[0];
702 }
703 else
704 {
705 immediate_quit = 0;
706 return (n);
707 }
708 n++;
709 }
710 while (n > 0)
711 {
42db823b 712 int val;
42db823b
RS
713 val = re_search_2 (&searchbuf, (char *) p1, s1, (char *) p2, s2,
714 pos - BEGV, lim - pos, &search_regs,
715 lim - BEGV);
ca1d1d23
JB
716 if (val == -2)
717 matcher_overflow ();
718 if (val >= 0)
719 {
720 j = BEGV;
4746118a 721 for (i = 0; i < search_regs.num_regs; i++)
ca1d1d23
JB
722 if (search_regs.start[i] >= 0)
723 {
724 search_regs.start[i] += j;
725 search_regs.end[i] += j;
726 }
daa37602 727 XSET (last_thing_searched, Lisp_Buffer, current_buffer);
ca1d1d23
JB
728 pos = search_regs.end[0];
729 }
730 else
731 {
732 immediate_quit = 0;
733 return (0 - n);
734 }
735 n--;
736 }
737 immediate_quit = 0;
738 return (pos);
739 }
740 else /* non-RE case */
741 {
742#ifdef C_ALLOCA
743 int BM_tab_space[0400];
744 BM_tab = &BM_tab_space[0];
745#else
746 BM_tab = (int *) alloca (0400 * sizeof (int));
747#endif
748 /* The general approach is that we are going to maintain that we know */
749 /* the first (closest to the present position, in whatever direction */
750 /* we're searching) character that could possibly be the last */
751 /* (furthest from present position) character of a valid match. We */
752 /* advance the state of our knowledge by looking at that character */
753 /* and seeing whether it indeed matches the last character of the */
754 /* pattern. If it does, we take a closer look. If it does not, we */
755 /* move our pointer (to putative last characters) as far as is */
756 /* logically possible. This amount of movement, which I call a */
757 /* stride, will be the length of the pattern if the actual character */
758 /* appears nowhere in the pattern, otherwise it will be the distance */
759 /* from the last occurrence of that character to the end of the */
760 /* pattern. */
761 /* As a coding trick, an enormous stride is coded into the table for */
762 /* characters that match the last character. This allows use of only */
763 /* a single test, a test for having gone past the end of the */
764 /* permissible match region, to test for both possible matches (when */
765 /* the stride goes past the end immediately) and failure to */
766 /* match (where you get nudged past the end one stride at a time). */
767
768 /* Here we make a "mickey mouse" BM table. The stride of the search */
769 /* is determined only by the last character of the putative match. */
770 /* If that character does not match, we will stride the proper */
771 /* distance to propose a match that superimposes it on the last */
772 /* instance of a character that matches it (per trt), or misses */
773 /* it entirely if there is none. */
774
775 dirlen = len * direction;
776 infinity = dirlen - (lim + pos + len + len) * direction;
777 if (direction < 0)
778 pat = (base_pat += len - 1);
779 BM_tab_base = BM_tab;
780 BM_tab += 0400;
781 j = dirlen; /* to get it in a register */
782 /* A character that does not appear in the pattern induces a */
783 /* stride equal to the pattern length. */
784 while (BM_tab_base != BM_tab)
785 {
786 *--BM_tab = j;
787 *--BM_tab = j;
788 *--BM_tab = j;
789 *--BM_tab = j;
790 }
791 i = 0;
792 while (i != infinity)
793 {
794 j = pat[i]; i += direction;
795 if (i == dirlen) i = infinity;
796 if ((int) trt)
797 {
798 k = (j = trt[j]);
799 if (i == infinity)
800 stride_for_teases = BM_tab[j];
801 BM_tab[j] = dirlen - i;
802 /* A translation table is accompanied by its inverse -- see */
803 /* comment following downcase_table for details */
804 while ((j = inverse_trt[j]) != k)
805 BM_tab[j] = dirlen - i;
806 }
807 else
808 {
809 if (i == infinity)
810 stride_for_teases = BM_tab[j];
811 BM_tab[j] = dirlen - i;
812 }
813 /* stride_for_teases tells how much to stride if we get a */
814 /* match on the far character but are subsequently */
815 /* disappointed, by recording what the stride would have been */
816 /* for that character if the last character had been */
817 /* different. */
818 }
819 infinity = dirlen - infinity;
820 pos += dirlen - ((direction > 0) ? direction : 0);
821 /* loop invariant - pos points at where last char (first char if reverse)
822 of pattern would align in a possible match. */
823 while (n != 0)
824 {
825 if ((lim - pos - (direction > 0)) * direction < 0)
826 return (n * (0 - direction));
827 /* First we do the part we can by pointers (maybe nothing) */
828 QUIT;
829 pat = base_pat;
830 limit = pos - dirlen + direction;
831 limit = ((direction > 0)
832 ? BUFFER_CEILING_OF (limit)
833 : BUFFER_FLOOR_OF (limit));
834 /* LIMIT is now the last (not beyond-last!) value
835 POS can take on without hitting edge of buffer or the gap. */
836 limit = ((direction > 0)
837 ? min (lim - 1, min (limit, pos + 20000))
838 : max (lim, max (limit, pos - 20000)));
839 if ((limit - pos) * direction > 20)
840 {
841 p_limit = &FETCH_CHAR (limit);
842 p2 = (cursor = &FETCH_CHAR (pos));
843 /* In this loop, pos + cursor - p2 is the surrogate for pos */
844 while (1) /* use one cursor setting as long as i can */
845 {
846 if (direction > 0) /* worth duplicating */
847 {
848 /* Use signed comparison if appropriate
849 to make cursor+infinity sure to be > p_limit.
850 Assuming that the buffer lies in a range of addresses
851 that are all "positive" (as ints) or all "negative",
852 either kind of comparison will work as long
853 as we don't step by infinity. So pick the kind
854 that works when we do step by infinity. */
855 if ((int) (p_limit + infinity) > (int) p_limit)
856 while ((int) cursor <= (int) p_limit)
857 cursor += BM_tab[*cursor];
858 else
859 while ((unsigned int) cursor <= (unsigned int) p_limit)
860 cursor += BM_tab[*cursor];
861 }
862 else
863 {
864 if ((int) (p_limit + infinity) < (int) p_limit)
865 while ((int) cursor >= (int) p_limit)
866 cursor += BM_tab[*cursor];
867 else
868 while ((unsigned int) cursor >= (unsigned int) p_limit)
869 cursor += BM_tab[*cursor];
870 }
871/* If you are here, cursor is beyond the end of the searched region. */
872 /* This can happen if you match on the far character of the pattern, */
873 /* because the "stride" of that character is infinity, a number able */
874 /* to throw you well beyond the end of the search. It can also */
875 /* happen if you fail to match within the permitted region and would */
876 /* otherwise try a character beyond that region */
877 if ((cursor - p_limit) * direction <= len)
878 break; /* a small overrun is genuine */
879 cursor -= infinity; /* large overrun = hit */
880 i = dirlen - direction;
881 if ((int) trt)
882 {
883 while ((i -= direction) + direction != 0)
884 if (pat[i] != trt[*(cursor -= direction)])
885 break;
886 }
887 else
888 {
889 while ((i -= direction) + direction != 0)
890 if (pat[i] != *(cursor -= direction))
891 break;
892 }
893 cursor += dirlen - i - direction; /* fix cursor */
894 if (i + direction == 0)
895 {
896 cursor -= direction;
1113d9db 897
ca325161
RS
898 set_search_regs (pos + cursor - p2 + ((direction > 0)
899 ? 1 - len : 0),
900 len);
901
ca1d1d23
JB
902 if ((n -= direction) != 0)
903 cursor += dirlen; /* to resume search */
904 else
905 return ((direction > 0)
906 ? search_regs.end[0] : search_regs.start[0]);
907 }
908 else
909 cursor += stride_for_teases; /* <sigh> we lose - */
910 }
911 pos += cursor - p2;
912 }
913 else
914 /* Now we'll pick up a clump that has to be done the hard */
915 /* way because it covers a discontinuity */
916 {
917 limit = ((direction > 0)
918 ? BUFFER_CEILING_OF (pos - dirlen + 1)
919 : BUFFER_FLOOR_OF (pos - dirlen - 1));
920 limit = ((direction > 0)
921 ? min (limit + len, lim - 1)
922 : max (limit - len, lim));
923 /* LIMIT is now the last value POS can have
924 and still be valid for a possible match. */
925 while (1)
926 {
927 /* This loop can be coded for space rather than */
928 /* speed because it will usually run only once. */
929 /* (the reach is at most len + 21, and typically */
930 /* does not exceed len) */
931 while ((limit - pos) * direction >= 0)
932 pos += BM_tab[FETCH_CHAR(pos)];
933 /* now run the same tests to distinguish going off the */
eb8c3be9 934 /* end, a match or a phony match. */
ca1d1d23
JB
935 if ((pos - limit) * direction <= len)
936 break; /* ran off the end */
937 /* Found what might be a match.
938 Set POS back to last (first if reverse) char pos. */
939 pos -= infinity;
940 i = dirlen - direction;
941 while ((i -= direction) + direction != 0)
942 {
943 pos -= direction;
944 if (pat[i] != (((int) trt)
945 ? trt[FETCH_CHAR(pos)]
946 : FETCH_CHAR (pos)))
947 break;
948 }
949 /* Above loop has moved POS part or all the way
950 back to the first char pos (last char pos if reverse).
951 Set it once again at the last (first if reverse) char. */
952 pos += dirlen - i- direction;
953 if (i + direction == 0)
954 {
955 pos -= direction;
1113d9db 956
ca325161
RS
957 set_search_regs (pos + ((direction > 0) ? 1 - len : 0),
958 len);
959
ca1d1d23
JB
960 if ((n -= direction) != 0)
961 pos += dirlen; /* to resume search */
962 else
963 return ((direction > 0)
964 ? search_regs.end[0] : search_regs.start[0]);
965 }
966 else
967 pos += stride_for_teases;
968 }
969 }
970 /* We have done one clump. Can we continue? */
971 if ((lim - pos) * direction < 0)
972 return ((0 - n) * direction);
973 }
974 return pos;
975 }
976}
ca325161
RS
977
978/* Record beginning BEG and end BEG + LEN
979 for a match just found in the current buffer. */
980
981static void
982set_search_regs (beg, len)
983 int beg, len;
984{
985 /* Make sure we have registers in which to store
986 the match position. */
987 if (search_regs.num_regs == 0)
988 {
989 regoff_t *starts, *ends;
990
991 starts = (regoff_t *) xmalloc (2 * sizeof (regoff_t));
992 ends = (regoff_t *) xmalloc (2 * sizeof (regoff_t));
993 BLOCK_INPUT;
994 re_set_registers (&searchbuf,
995 &search_regs,
996 2, starts, ends);
997 UNBLOCK_INPUT;
998 }
999
1000 search_regs.start[0] = beg;
1001 search_regs.end[0] = beg + len;
1002 XSET (last_thing_searched, Lisp_Buffer, current_buffer);
1003}
ca1d1d23
JB
1004\f
1005/* Given a string of words separated by word delimiters,
1006 compute a regexp that matches those exact words
1007 separated by arbitrary punctuation. */
1008
1009static Lisp_Object
1010wordify (string)
1011 Lisp_Object string;
1012{
1013 register unsigned char *p, *o;
1014 register int i, len, punct_count = 0, word_count = 0;
1015 Lisp_Object val;
1016
1017 CHECK_STRING (string, 0);
1018 p = XSTRING (string)->data;
1019 len = XSTRING (string)->size;
1020
1021 for (i = 0; i < len; i++)
1022 if (SYNTAX (p[i]) != Sword)
1023 {
1024 punct_count++;
1025 if (i > 0 && SYNTAX (p[i-1]) == Sword) word_count++;
1026 }
1027 if (SYNTAX (p[len-1]) == Sword) word_count++;
1028 if (!word_count) return build_string ("");
1029
1030 val = make_string (p, len - punct_count + 5 * (word_count - 1) + 4);
1031
1032 o = XSTRING (val)->data;
1033 *o++ = '\\';
1034 *o++ = 'b';
1035
1036 for (i = 0; i < len; i++)
1037 if (SYNTAX (p[i]) == Sword)
1038 *o++ = p[i];
1039 else if (i > 0 && SYNTAX (p[i-1]) == Sword && --word_count)
1040 {
1041 *o++ = '\\';
1042 *o++ = 'W';
1043 *o++ = '\\';
1044 *o++ = 'W';
1045 *o++ = '*';
1046 }
1047
1048 *o++ = '\\';
1049 *o++ = 'b';
1050
1051 return val;
1052}
1053\f
1054DEFUN ("search-backward", Fsearch_backward, Ssearch_backward, 1, 4,
1055 "sSearch backward: ",
1056 "Search backward from point for STRING.\n\
1057Set point to the beginning of the occurrence found, and return point.\n\
1058An optional second argument bounds the search; it is a buffer position.\n\
1059The match found must not extend before that position.\n\
1060Optional third argument, if t, means if fail just return nil (no error).\n\
1061 If not nil and not t, position at limit of search and return nil.\n\
1062Optional fourth argument is repeat count--search for successive occurrences.\n\
1063See also the functions `match-beginning', `match-end' and `replace-match'.")
1064 (string, bound, noerror, count)
1065 Lisp_Object string, bound, noerror, count;
1066{
1067 return search_command (string, bound, noerror, count, -1, 0);
1068}
1069
1070DEFUN ("search-forward", Fsearch_forward, Ssearch_forward, 1, 4, "sSearch: ",
1071 "Search forward from point for STRING.\n\
1072Set point to the end of the occurrence found, and return point.\n\
1073An optional second argument bounds the search; it is a buffer position.\n\
1074The match found must not extend after that position. nil is equivalent\n\
1075 to (point-max).\n\
1076Optional third argument, if t, means if fail just return nil (no error).\n\
1077 If not nil and not t, move to limit of search and return nil.\n\
1078Optional fourth argument is repeat count--search for successive occurrences.\n\
1079See also the functions `match-beginning', `match-end' and `replace-match'.")
1080 (string, bound, noerror, count)
1081 Lisp_Object string, bound, noerror, count;
1082{
1083 return search_command (string, bound, noerror, count, 1, 0);
1084}
1085
1086DEFUN ("word-search-backward", Fword_search_backward, Sword_search_backward, 1, 4,
1087 "sWord search backward: ",
1088 "Search backward from point for STRING, ignoring differences in punctuation.\n\
1089Set point to the beginning of the occurrence found, and return point.\n\
1090An optional second argument bounds the search; it is a buffer position.\n\
1091The match found must not extend before that position.\n\
1092Optional third argument, if t, means if fail just return nil (no error).\n\
1093 If not nil and not t, move to limit of search and return nil.\n\
1094Optional fourth argument is repeat count--search for successive occurrences.")
1095 (string, bound, noerror, count)
1096 Lisp_Object string, bound, noerror, count;
1097{
1098 return search_command (wordify (string), bound, noerror, count, -1, 1);
1099}
1100
1101DEFUN ("word-search-forward", Fword_search_forward, Sword_search_forward, 1, 4,
1102 "sWord search: ",
1103 "Search forward from point for STRING, ignoring differences in punctuation.\n\
1104Set point to the end of the occurrence found, and return point.\n\
1105An optional second argument bounds the search; it is a buffer position.\n\
1106The match found must not extend after that position.\n\
1107Optional third argument, if t, means if fail just return nil (no error).\n\
1108 If not nil and not t, move to limit of search and return nil.\n\
1109Optional fourth argument is repeat count--search for successive occurrences.")
1110 (string, bound, noerror, count)
1111 Lisp_Object string, bound, noerror, count;
1112{
1113 return search_command (wordify (string), bound, noerror, count, 1, 1);
1114}
1115
1116DEFUN ("re-search-backward", Fre_search_backward, Sre_search_backward, 1, 4,
1117 "sRE search backward: ",
1118 "Search backward from point for match for regular expression REGEXP.\n\
1119Set point to the beginning of the match, and return point.\n\
1120The match found is the one starting last in the buffer\n\
1121and yet ending before the place the origin of the search.\n\
1122An optional second argument bounds the search; it is a buffer position.\n\
1123The match found must start at or after that position.\n\
1124Optional third argument, if t, means if fail just return nil (no error).\n\
1125 If not nil and not t, move to limit of search and return nil.\n\
1126Optional fourth argument is repeat count--search for successive occurrences.\n\
1127See also the functions `match-beginning', `match-end' and `replace-match'.")
1128 (string, bound, noerror, count)
1129 Lisp_Object string, bound, noerror, count;
1130{
1131 return search_command (string, bound, noerror, count, -1, 1);
1132}
1133
1134DEFUN ("re-search-forward", Fre_search_forward, Sre_search_forward, 1, 4,
1135 "sRE search: ",
1136 "Search forward from point for regular expression REGEXP.\n\
1137Set point to the end of the occurrence found, and return point.\n\
1138An optional second argument bounds the search; it is a buffer position.\n\
1139The match found must not extend after that position.\n\
1140Optional third argument, if t, means if fail just return nil (no error).\n\
1141 If not nil and not t, move to limit of search and return nil.\n\
1142Optional fourth argument is repeat count--search for successive occurrences.\n\
1143See also the functions `match-beginning', `match-end' and `replace-match'.")
1144 (string, bound, noerror, count)
1145 Lisp_Object string, bound, noerror, count;
1146{
1147 return search_command (string, bound, noerror, count, 1, 1);
1148}
1149\f
1150DEFUN ("replace-match", Freplace_match, Sreplace_match, 1, 3, 0,
1151 "Replace text matched by last search with NEWTEXT.\n\
1152If second arg FIXEDCASE is non-nil, do not alter case of replacement text.\n\
1153Otherwise convert to all caps or cap initials, like replaced text.\n\
1154If third arg LITERAL is non-nil, insert NEWTEXT literally.\n\
1155Otherwise treat `\\' as special:\n\
1156 `\\&' in NEWTEXT means substitute original matched text.\n\
1157 `\\N' means substitute what matched the Nth `\\(...\\)'.\n\
1158 If Nth parens didn't match, substitute nothing.\n\
1159 `\\\\' means insert one `\\'.\n\
1113d9db 1160FIXEDCASE and LITERAL are optional arguments.\n\
ca1d1d23 1161Leaves point at end of replacement text.")
16fdc568
BF
1162 (newtext, fixedcase, literal)
1163 Lisp_Object newtext, fixedcase, literal;
ca1d1d23
JB
1164{
1165 enum { nochange, all_caps, cap_initial } case_action;
1166 register int pos, last;
1167 int some_multiletter_word;
97832bd0
RS
1168 int some_lowercase;
1169 int some_uppercase_initial;
ca1d1d23
JB
1170 register int c, prevc;
1171 int inslen;
1172
16fdc568 1173 CHECK_STRING (newtext, 0);
ca1d1d23
JB
1174
1175 case_action = nochange; /* We tried an initialization */
1176 /* but some C compilers blew it */
4746118a
JB
1177
1178 if (search_regs.num_regs <= 0)
1179 error ("replace-match called before any match found");
1180
ca1d1d23
JB
1181 if (search_regs.start[0] < BEGV
1182 || search_regs.start[0] > search_regs.end[0]
1183 || search_regs.end[0] > ZV)
97832bd0
RS
1184 args_out_of_range (make_number (search_regs.start[0]),
1185 make_number (search_regs.end[0]));
ca1d1d23
JB
1186
1187 if (NILP (fixedcase))
1188 {
1189 /* Decide how to casify by examining the matched text. */
1190
1191 last = search_regs.end[0];
1192 prevc = '\n';
1193 case_action = all_caps;
1194
1195 /* some_multiletter_word is set nonzero if any original word
1196 is more than one letter long. */
1197 some_multiletter_word = 0;
97832bd0
RS
1198 some_lowercase = 0;
1199 some_uppercase_initial = 0;
ca1d1d23
JB
1200
1201 for (pos = search_regs.start[0]; pos < last; pos++)
1202 {
1203 c = FETCH_CHAR (pos);
1204 if (LOWERCASEP (c))
1205 {
1206 /* Cannot be all caps if any original char is lower case */
1207
97832bd0 1208 some_lowercase = 1;
ca1d1d23 1209 if (SYNTAX (prevc) != Sword)
97832bd0 1210 ;
ca1d1d23
JB
1211 else
1212 some_multiletter_word = 1;
1213 }
1214 else if (!NOCASEP (c))
1215 {
97832bd0
RS
1216 if (SYNTAX (prevc) != Sword)
1217 some_uppercase_initial = 1;
1218 else
ca1d1d23
JB
1219 some_multiletter_word = 1;
1220 }
1221
1222 prevc = c;
1223 }
1224
97832bd0
RS
1225 /* Convert to all caps if the old text is all caps
1226 and has at least one multiletter word. */
1227 if (! some_lowercase && some_multiletter_word)
1228 case_action = all_caps;
1229 /* Capitalize each word, if the old text has a capitalized word. */
1230 else if (some_uppercase_initial)
ca1d1d23 1231 case_action = cap_initial;
97832bd0
RS
1232 else
1233 case_action = nochange;
ca1d1d23
JB
1234 }
1235
9a76659d
JB
1236 /* We insert the replacement text before the old text, and then
1237 delete the original text. This means that markers at the
1238 beginning or end of the original will float to the corresponding
1239 position in the replacement. */
1240 SET_PT (search_regs.start[0]);
ca1d1d23 1241 if (!NILP (literal))
16fdc568 1242 Finsert_and_inherit (1, &newtext);
ca1d1d23
JB
1243 else
1244 {
1245 struct gcpro gcpro1;
16fdc568 1246 GCPRO1 (newtext);
ca1d1d23 1247
16fdc568 1248 for (pos = 0; pos < XSTRING (newtext)->size; pos++)
ca1d1d23 1249 {
9a76659d
JB
1250 int offset = point - search_regs.start[0];
1251
16fdc568 1252 c = XSTRING (newtext)->data[pos];
ca1d1d23
JB
1253 if (c == '\\')
1254 {
16fdc568 1255 c = XSTRING (newtext)->data[++pos];
ca1d1d23 1256 if (c == '&')
9a76659d
JB
1257 Finsert_buffer_substring
1258 (Fcurrent_buffer (),
1259 make_number (search_regs.start[0] + offset),
1260 make_number (search_regs.end[0] + offset));
4746118a 1261 else if (c >= '1' && c <= search_regs.num_regs + '0')
ca1d1d23
JB
1262 {
1263 if (search_regs.start[c - '0'] >= 1)
9a76659d
JB
1264 Finsert_buffer_substring
1265 (Fcurrent_buffer (),
1266 make_number (search_regs.start[c - '0'] + offset),
1267 make_number (search_regs.end[c - '0'] + offset));
ca1d1d23
JB
1268 }
1269 else
1270 insert_char (c);
1271 }
1272 else
1273 insert_char (c);
1274 }
1275 UNGCPRO;
1276 }
1277
9a76659d
JB
1278 inslen = point - (search_regs.start[0]);
1279 del_range (search_regs.start[0] + inslen, search_regs.end[0] + inslen);
ca1d1d23
JB
1280
1281 if (case_action == all_caps)
1282 Fupcase_region (make_number (point - inslen), make_number (point));
1283 else if (case_action == cap_initial)
1284 upcase_initials_region (make_number (point - inslen), make_number (point));
1285 return Qnil;
1286}
1287\f
1288static Lisp_Object
1289match_limit (num, beginningp)
1290 Lisp_Object num;
1291 int beginningp;
1292{
1293 register int n;
1294
1295 CHECK_NUMBER (num, 0);
1296 n = XINT (num);
4746118a
JB
1297 if (n < 0 || n >= search_regs.num_regs)
1298 args_out_of_range (num, make_number (search_regs.num_regs));
1299 if (search_regs.num_regs <= 0
1300 || search_regs.start[n] < 0)
ca1d1d23
JB
1301 return Qnil;
1302 return (make_number ((beginningp) ? search_regs.start[n]
1303 : search_regs.end[n]));
1304}
1305
1306DEFUN ("match-beginning", Fmatch_beginning, Smatch_beginning, 1, 1, 0,
1307 "Return position of start of text matched by last search.\n\
16fdc568
BF
1308NUM specifies which parenthesized expression in the last regexp.\n\
1309 Value is nil if NUMth pair didn't match, or there were less than NUM pairs.\n\
ca1d1d23
JB
1310Zero means the entire text matched by the whole regexp or whole string.")
1311 (num)
1312 Lisp_Object num;
1313{
1314 return match_limit (num, 1);
1315}
1316
1317DEFUN ("match-end", Fmatch_end, Smatch_end, 1, 1, 0,
1318 "Return position of end of text matched by last search.\n\
1319ARG, a number, specifies which parenthesized expression in the last regexp.\n\
1320 Value is nil if ARGth pair didn't match, or there were less than ARG pairs.\n\
1321Zero means the entire text matched by the whole regexp or whole string.")
1322 (num)
1323 Lisp_Object num;
1324{
1325 return match_limit (num, 0);
1326}
1327
1328DEFUN ("match-data", Fmatch_data, Smatch_data, 0, 0, 0,
1329 "Return a list containing all info on what the last search matched.\n\
1330Element 2N is `(match-beginning N)'; element 2N + 1 is `(match-end N)'.\n\
1331All the elements are markers or nil (nil if the Nth pair didn't match)\n\
1332if the last match was on a buffer; integers or nil if a string was matched.\n\
1333Use `store-match-data' to reinstate the data in this list.")
1334 ()
1335{
4746118a 1336 Lisp_Object *data;
ca1d1d23
JB
1337 int i, len;
1338
daa37602
JB
1339 if (NILP (last_thing_searched))
1340 error ("match-data called before any match found");
1341
4746118a
JB
1342 data = (Lisp_Object *) alloca ((2 * search_regs.num_regs)
1343 * sizeof (Lisp_Object));
1344
ca1d1d23 1345 len = -1;
4746118a 1346 for (i = 0; i < search_regs.num_regs; i++)
ca1d1d23
JB
1347 {
1348 int start = search_regs.start[i];
1349 if (start >= 0)
1350 {
daa37602 1351 if (EQ (last_thing_searched, Qt))
ca1d1d23
JB
1352 {
1353 XFASTINT (data[2 * i]) = start;
1354 XFASTINT (data[2 * i + 1]) = search_regs.end[i];
1355 }
daa37602 1356 else if (XTYPE (last_thing_searched) == Lisp_Buffer)
ca1d1d23
JB
1357 {
1358 data[2 * i] = Fmake_marker ();
daa37602
JB
1359 Fset_marker (data[2 * i],
1360 make_number (start),
1361 last_thing_searched);
ca1d1d23
JB
1362 data[2 * i + 1] = Fmake_marker ();
1363 Fset_marker (data[2 * i + 1],
daa37602
JB
1364 make_number (search_regs.end[i]),
1365 last_thing_searched);
ca1d1d23 1366 }
daa37602
JB
1367 else
1368 /* last_thing_searched must always be Qt, a buffer, or Qnil. */
1369 abort ();
1370
ca1d1d23
JB
1371 len = i;
1372 }
1373 else
1374 data[2 * i] = data [2 * i + 1] = Qnil;
1375 }
1376 return Flist (2 * len + 2, data);
1377}
1378
1379
1380DEFUN ("store-match-data", Fstore_match_data, Sstore_match_data, 1, 1, 0,
1381 "Set internal data on last search match from elements of LIST.\n\
1382LIST should have been created by calling `match-data' previously.")
1383 (list)
1384 register Lisp_Object list;
1385{
1386 register int i;
1387 register Lisp_Object marker;
1388
1389 if (!CONSP (list) && !NILP (list))
b37902c8 1390 list = wrong_type_argument (Qconsp, list);
ca1d1d23 1391
daa37602
JB
1392 /* Unless we find a marker with a buffer in LIST, assume that this
1393 match data came from a string. */
1394 last_thing_searched = Qt;
1395
4746118a
JB
1396 /* Allocate registers if they don't already exist. */
1397 {
d084e942 1398 int length = XFASTINT (Flength (list)) / 2;
4746118a
JB
1399
1400 if (length > search_regs.num_regs)
1401 {
1113d9db
JB
1402 if (search_regs.num_regs == 0)
1403 {
1404 search_regs.start
1405 = (regoff_t *) xmalloc (length * sizeof (regoff_t));
1406 search_regs.end
1407 = (regoff_t *) xmalloc (length * sizeof (regoff_t));
1408 }
4746118a 1409 else
1113d9db
JB
1410 {
1411 search_regs.start
1412 = (regoff_t *) xrealloc (search_regs.start,
1413 length * sizeof (regoff_t));
1414 search_regs.end
1415 = (regoff_t *) xrealloc (search_regs.end,
1416 length * sizeof (regoff_t));
1417 }
4746118a 1418
9ac0d9e0 1419 BLOCK_INPUT;
1113d9db
JB
1420 re_set_registers (&searchbuf, &search_regs, length,
1421 search_regs.start, search_regs.end);
9ac0d9e0 1422 UNBLOCK_INPUT;
4746118a
JB
1423 }
1424 }
1425
1426 for (i = 0; i < search_regs.num_regs; i++)
ca1d1d23
JB
1427 {
1428 marker = Fcar (list);
1429 if (NILP (marker))
1430 {
1431 search_regs.start[i] = -1;
1432 list = Fcdr (list);
1433 }
1434 else
1435 {
daa37602
JB
1436 if (XTYPE (marker) == Lisp_Marker)
1437 {
1438 if (XMARKER (marker)->buffer == 0)
1439 XFASTINT (marker) = 0;
1440 else
1441 XSET (last_thing_searched, Lisp_Buffer,
1442 XMARKER (marker)->buffer);
1443 }
ca1d1d23
JB
1444
1445 CHECK_NUMBER_COERCE_MARKER (marker, 0);
1446 search_regs.start[i] = XINT (marker);
1447 list = Fcdr (list);
1448
1449 marker = Fcar (list);
1450 if (XTYPE (marker) == Lisp_Marker
1451 && XMARKER (marker)->buffer == 0)
1452 XFASTINT (marker) = 0;
1453
1454 CHECK_NUMBER_COERCE_MARKER (marker, 0);
1455 search_regs.end[i] = XINT (marker);
1456 }
1457 list = Fcdr (list);
1458 }
1459
1460 return Qnil;
1461}
1462
1463/* Quote a string to inactivate reg-expr chars */
1464
1465DEFUN ("regexp-quote", Fregexp_quote, Sregexp_quote, 1, 1, 0,
1466 "Return a regexp string which matches exactly STRING and nothing else.")
1467 (str)
1468 Lisp_Object str;
1469{
1470 register unsigned char *in, *out, *end;
1471 register unsigned char *temp;
1472
1473 CHECK_STRING (str, 0);
1474
1475 temp = (unsigned char *) alloca (XSTRING (str)->size * 2);
1476
1477 /* Now copy the data into the new string, inserting escapes. */
1478
1479 in = XSTRING (str)->data;
1480 end = in + XSTRING (str)->size;
1481 out = temp;
1482
1483 for (; in != end; in++)
1484 {
1485 if (*in == '[' || *in == ']'
1486 || *in == '*' || *in == '.' || *in == '\\'
1487 || *in == '?' || *in == '+'
1488 || *in == '^' || *in == '$')
1489 *out++ = '\\';
1490 *out++ = *in;
1491 }
1492
1493 return make_string (temp, out - temp);
1494}
1495\f
1496syms_of_search ()
1497{
1498 register int i;
1499
1500 searchbuf.allocated = 100;
8c0e7b73 1501 searchbuf.buffer = (unsigned char *) malloc (searchbuf.allocated);
ca1d1d23
JB
1502 searchbuf.fastmap = search_fastmap;
1503
1504 Qsearch_failed = intern ("search-failed");
1505 staticpro (&Qsearch_failed);
1506 Qinvalid_regexp = intern ("invalid-regexp");
1507 staticpro (&Qinvalid_regexp);
1508
1509 Fput (Qsearch_failed, Qerror_conditions,
1510 Fcons (Qsearch_failed, Fcons (Qerror, Qnil)));
1511 Fput (Qsearch_failed, Qerror_message,
1512 build_string ("Search failed"));
1513
1514 Fput (Qinvalid_regexp, Qerror_conditions,
1515 Fcons (Qinvalid_regexp, Fcons (Qerror, Qnil)));
1516 Fput (Qinvalid_regexp, Qerror_message,
1517 build_string ("Invalid regexp"));
1518
1519 last_regexp = Qnil;
1520 staticpro (&last_regexp);
1521
daa37602
JB
1522 last_thing_searched = Qnil;
1523 staticpro (&last_thing_searched);
1524
ca1d1d23
JB
1525 defsubr (&Sstring_match);
1526 defsubr (&Slooking_at);
1527 defsubr (&Sskip_chars_forward);
1528 defsubr (&Sskip_chars_backward);
17431c60
RS
1529 defsubr (&Sskip_syntax_forward);
1530 defsubr (&Sskip_syntax_backward);
ca1d1d23
JB
1531 defsubr (&Ssearch_forward);
1532 defsubr (&Ssearch_backward);
1533 defsubr (&Sword_search_forward);
1534 defsubr (&Sword_search_backward);
1535 defsubr (&Sre_search_forward);
1536 defsubr (&Sre_search_backward);
1537 defsubr (&Sreplace_match);
1538 defsubr (&Smatch_beginning);
1539 defsubr (&Smatch_end);
1540 defsubr (&Smatch_data);
1541 defsubr (&Sstore_match_data);
1542 defsubr (&Sregexp_quote);
1543}