* These changes add a @deffnx C function declaration and function
[bpt/guile.git] / libguile / sort.c
CommitLineData
726d810a 1/* Copyright (C) 1999,2000,2001 Free Software Foundation, Inc.
54e09076
MD
2 * This program is free software; you can redistribute it and/or modify
3 * it under the terms of the GNU General Public License as published by
4 * the Free Software Foundation; either version 2, or (at your option)
5 * any later version.
6 *
7 * This program is distributed in the hope that it will be useful,
8 * but WITHOUT ANY WARRANTY; without even the implied warranty of
9 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
10 * GNU General Public License for more details.
11 *
12 * You should have received a copy of the GNU General Public License
13 * along with this software; see the file COPYING. If not, write to
14 * the Free Software Foundation, Inc., 59 Temple Place, Suite 330,
15 * Boston, MA 02111-1307 USA
16 *
17 * As a special exception, the Free Software Foundation gives permission
18 * for additional uses of the text contained in its release of GUILE.
19 *
20 * The exception is that, if you link the GUILE library with other files
21 * to produce an executable, this does not by itself cause the
22 * resulting executable to be covered by the GNU General Public License.
23 * Your use of that executable is in no way restricted on account of
24 * linking the GUILE library code into it.
25 *
26 * This exception does not however invalidate any other reasons why
27 * the executable file might be covered by the GNU General Public License.
28 *
29 * This exception applies only to the code released by the
30 * Free Software Foundation under the name GUILE. If you copy
31 * code from other Free Software Foundation releases into a copy of
32 * GUILE, as the General Public License permits, the exception does
33 * not apply to the code that you add in this way. To avoid misleading
34 * anyone as to the status of such modified files, you must delete
35 * this exception notice from them.
36 *
37 * If you write modifications of your own for GUILE, it is your choice
38 * whether to permit this exception to apply to your modifications.
39 * If you do not wish that, delete this exception notice. */
40
1bbd0b84
GB
41
42
54e09076
MD
43/* Written in December 1998 by Roland Orre <orre@nada.kth.se>
44 * This implements the same sort interface as slib/sort.scm
45 * for lists and vectors where slib defines:
46 * sorted?, merge, merge!, sort, sort!
15d9c4e3 47 * For scsh compatibility sort-list and sort-list! are also defined.
54e09076 48 * In cases where a stable-sort is required use stable-sort or
15d9c4e3 49 * stable-sort!. An additional feature is
54e09076 50 * (restricted-vector-sort! vector less? startpos endpos)
15d9c4e3 51 * which allows you to sort part of a vector.
54e09076
MD
52 * Thanks to Aubrey Jaffer for the slib/sort.scm library.
53 * Thanks to Richard A. O'Keefe (based on Prolog code by D.H.D.Warren)
54 * for the merge sort inspiration.
55 * Thanks to Douglas C. Schmidt (schmidt@ics.uci.edu) for the
56 * quicksort code.
57 */
58
59/* We need this to get the definitions for HAVE_ALLOCA_H, etc. */
a0599745 60#include "libguile/scmconfig.h"
54e09076
MD
61
62/* AIX requires this to be the first thing in the file. The #pragma
63 directive is indented so pre-ANSI compilers will ignore it, rather
64 than choke on it. */
65#ifndef __GNUC__
66# if HAVE_ALLOCA_H
67# include <alloca.h>
68# else
69# ifdef _AIX
70 #pragma alloca
71# else
72# ifndef alloca /* predefined by HP cc +Olibcalls */
73char *alloca ();
74# endif
75# endif
76# endif
77#endif
78
783e7774 79#include <string.h>
a0599745 80#include "libguile/_scm.h"
54e09076 81
a0599745
MD
82#include "libguile/eval.h"
83#include "libguile/unif.h"
84#include "libguile/ramap.h"
85#include "libguile/alist.h"
86#include "libguile/feature.h"
fdc28395 87#include "libguile/root.h"
a0599745 88#include "libguile/vectors.h"
54e09076 89
a0599745
MD
90#include "libguile/validate.h"
91#include "libguile/sort.h"
54e09076
MD
92
93/* The routine quicksort was extracted from the GNU C Library qsort.c
94 written by Douglas C. Schmidt (schmidt@ics.uci.edu)
95 and adapted to guile by adding an extra pointer less
96 to quicksort by Roland Orre <orre@nada.kth.se>.
97
98 The reason to do this instead of using the library function qsort
99 was to avoid dependency of the ANSI-C extensions for local functions
100 and also to avoid obscure pool based solutions.
15d9c4e3
MD
101
102 This sorting routine is not much more efficient than the stable
103 version but doesn't consume extra memory.
54e09076
MD
104 */
105
/* Exchange the SIZE bytes at A with the SIZE bytes at B, one byte at a
   time.  A and B must be `char *' expressions; SIZE must be at least 1
   because the byte loop always runs once before testing the count.  */
#define SWAP(a, b, size)                                \
  do                                                    \
    {                                                   \
      size_t swap_left_ = (size);                       \
      char *swap_p_ = (a);                              \
      char *swap_q_ = (b);                              \
      do                                                \
        {                                               \
          char swap_byte_ = *swap_p_;                   \
          *swap_p_ = *swap_q_;                          \
          *swap_q_ = swap_byte_;                        \
          swap_p_++;                                    \
          swap_q_++;                                    \
          swap_left_--;                                 \
        }                                               \
      while (swap_left_ != 0);                          \
    }                                                   \
  while (0)

/* Partitions of at most this many items are not split any further by
   quicksort; they are left for the final insertion sort pass.  The
   value was tuned long ago on a Sun 4/260.  */
#define MAX_THRESH 4

/* One pending partition: pointers to its first and last item.  */
typedef struct
{
  char *lo;
  char *hi;
}
stack_node;

/* A minimal in-line stack of pending partitions.  The macros expect
   two variables in the enclosing scope: `stack', an array of
   stack_node, and `top', pointing at the next free slot of it.  */

/* Number of slots in the stack: one per bit of an unsigned long.  */
#define STACK_SIZE (8 * sizeof (unsigned long int))

/* Store the partition LOW..HIGH in the free slot and advance `top'.  */
#define PUSH(low, high) \
  ((void) ((top->lo = (low)), (top->hi = (high)), top++))

/* Step `top' back and load that slot into the lvalues LOW and HIGH.  */
#define POP(low, high) \
  ((void) (top--, (low = top->lo), (high = top->hi)))

/* True while at least one slot is in use.  */
#define STACK_NOT_EMPTY (top > stack)
137
138
139/* Order size using quicksort. This implementation incorporates
140 four optimizations discussed in Sedgewick:
141
142 1. Non-recursive, using an explicit stack of pointer that store the
143 next array partition to sort. To save time, this maximum amount
144 of space required to store an array of MAX_INT is allocated on the
145 stack. Assuming a 32-bit integer, this needs only 32 *
146 sizeof(stack_node) == 136 bits. Pretty cheap, actually.
147
148 2. Chose the pivot element using a median-of-three decision tree.
149 This reduces the probability of selecting a bad pivot value and
150 eliminates certain extraneous comparisons.
151
152 3. Only quicksorts TOTAL_ELEMS / MAX_THRESH partitions, leaving
153 insertion sort to order the MAX_THRESH items within each partition.
154 This is a big win, since insertion sort is faster for small, mostly
155 sorted array segments.
156
157 4. The larger of the two sub-partitions is always pushed onto the
158 stack first, with the algorithm then concentrating on the
159 smaller partition. This *guarantees* no more than log (n)
160 stack size is needed (actually O(1) in this case)! */
161
162typedef int (*cmp_fun_t) (SCM less,
163 const void*,
164 const void*);
165
a34af05e
MD
166static const char s_buggy_less[] = "buggy less predicate used when sorting";
167
54e09076
MD
168static void
169quicksort (void *const pbase,
170 size_t total_elems,
171 size_t size,
172 cmp_fun_t cmp,
173 SCM less)
174{
175 register char *base_ptr = (char *) pbase;
176
177 /* Allocating SIZE bytes for a pivot buffer facilitates a better
178 algorithm below since we can do comparisons directly on the pivot. */
179 char *pivot_buffer = (char *) alloca (size);
180 const size_t max_thresh = MAX_THRESH * size;
181
182 if (total_elems == 0)
183 /* Avoid lossage with unsigned arithmetic below. */
184 return;
185
186 if (total_elems > MAX_THRESH)
187 {
188 char *lo = base_ptr;
189 char *hi = &lo[size * (total_elems - 1)];
190 /* Largest size needed for 32-bit int!!! */
191 stack_node stack[STACK_SIZE];
192 stack_node *top = stack + 1;
193
194 while (STACK_NOT_EMPTY)
195 {
196 char *left_ptr;
197 char *right_ptr;
198
199 char *pivot = pivot_buffer;
200
201 /* Select median value from among LO, MID, and HI. Rearrange
202 LO and HI so the three values are sorted. This lowers the
203 probability of picking a pathological pivot value and
204 skips a comparison for both the LEFT_PTR and RIGHT_PTR. */
205
206 char *mid = lo + size * ((hi - lo) / size >> 1);
207
208 if ((*cmp) (less, (void *) mid, (void *) lo))
209 SWAP (mid, lo, size);
210 if ((*cmp) (less, (void *) hi, (void *) mid))
211 SWAP (mid, hi, size);
212 else
213 goto jump_over;
214 if ((*cmp) (less, (void *) mid, (void *) lo))
215 SWAP (mid, lo, size);
216 jump_over:;
217 memcpy (pivot, mid, size);
218 pivot = pivot_buffer;
219
220 left_ptr = lo + size;
221 right_ptr = hi - size;
222
223 /* Here's the famous ``collapse the walls'' section of quicksort.
224 Gotta like those tight inner loops! They are the main reason
225 that this algorithm runs much faster than others. */
226 do
227 {
228 while ((*cmp) (less, (void *) left_ptr, (void *) pivot))
a34af05e
MD
229 {
230 left_ptr += size;
231 /* The comparison predicate may be buggy */
232 if (left_ptr > hi)
5d2d2ffc 233 scm_misc_error (NULL, s_buggy_less, SCM_EOL);
a34af05e 234 }
54e09076
MD
235
236 while ((*cmp) (less, (void *) pivot, (void *) right_ptr))
a34af05e
MD
237 {
238 right_ptr -= size;
239 /* The comparison predicate may be buggy */
240 if (right_ptr < lo)
5d2d2ffc 241 scm_misc_error (NULL, s_buggy_less, SCM_EOL);
a34af05e 242 }
54e09076
MD
243
244 if (left_ptr < right_ptr)
245 {
246 SWAP (left_ptr, right_ptr, size);
247 left_ptr += size;
248 right_ptr -= size;
249 }
250 else if (left_ptr == right_ptr)
251 {
252 left_ptr += size;
253 right_ptr -= size;
254 break;
255 }
256 }
257 while (left_ptr <= right_ptr);
258
259 /* Set up pointers for next iteration. First determine whether
260 left and right partitions are below the threshold size. If so,
261 ignore one or both. Otherwise, push the larger partition's
262 bounds on the stack and continue sorting the smaller one. */
263
264 if ((size_t) (right_ptr - lo) <= max_thresh)
265 {
266 if ((size_t) (hi - left_ptr) <= max_thresh)
267 /* Ignore both small partitions. */
268 POP (lo, hi);
269 else
270 /* Ignore small left partition. */
271 lo = left_ptr;
272 }
273 else if ((size_t) (hi - left_ptr) <= max_thresh)
274 /* Ignore small right partition. */
275 hi = right_ptr;
276 else if ((right_ptr - lo) > (hi - left_ptr))
277 {
278 /* Push larger left partition indices. */
279 PUSH (lo, right_ptr);
280 lo = left_ptr;
281 }
282 else
283 {
284 /* Push larger right partition indices. */
285 PUSH (left_ptr, hi);
286 hi = right_ptr;
287 }
288 }
289 }
290
291 /* Once the BASE_PTR array is partially sorted by quicksort the rest
292 is completely sorted using insertion sort, since this is efficient
293 for partitions below MAX_THRESH size. BASE_PTR points to the beginning
294 of the array to sort, and END_PTR points at the very last element in
295 the array (*not* one beyond it!). */
296
297 {
298 char *const end_ptr = &base_ptr[size * (total_elems - 1)];
299 char *tmp_ptr = base_ptr;
300 char *thresh = min (end_ptr, base_ptr + max_thresh);
301 register char *run_ptr;
302
303 /* Find smallest element in first threshold and place it at the
304 array's beginning. This is the smallest array element,
305 and the operation speeds up insertion sort's inner loop. */
306
307 for (run_ptr = tmp_ptr + size; run_ptr <= thresh; run_ptr += size)
308 if ((*cmp) (less, (void *) run_ptr, (void *) tmp_ptr))
309 tmp_ptr = run_ptr;
310
311 if (tmp_ptr != base_ptr)
312 SWAP (tmp_ptr, base_ptr, size);
313
314 /* Insertion sort, running from left-hand-side up to right-hand-side. */
315
316 run_ptr = base_ptr + size;
317 while ((run_ptr += size) <= end_ptr)
318 {
319 tmp_ptr = run_ptr - size;
320 while ((*cmp) (less, (void *) run_ptr, (void *) tmp_ptr))
a34af05e
MD
321 {
322 tmp_ptr -= size;
323 /* The comparison predicate may be buggy */
324 if (tmp_ptr < base_ptr)
5d2d2ffc 325 scm_misc_error (NULL, s_buggy_less, SCM_EOL);
a34af05e 326 }
54e09076
MD
327
328 tmp_ptr += size;
329 if (tmp_ptr != run_ptr)
330 {
331 char *trav;
332
333 trav = run_ptr + size;
334 while (--trav >= run_ptr)
335 {
336 char c = *trav;
337 char *hi, *lo;
338
339 for (hi = lo = trav; (lo -= size) >= tmp_ptr; hi = lo)
340 *hi = *lo;
341 *hi = c;
342 }
343 }
344 }
345 }
346} /* quicksort */
347
348
349/* comparison routines */
350
351static int
352subr2less (SCM less, const void *a, const void *b)
353{
354 return SCM_NFALSEP (SCM_SUBRF (less) (*(SCM *) a, *(SCM *) b));
355} /* subr2less */
356
357static int
358subr2oless (SCM less, const void *a, const void *b)
359{
360 return SCM_NFALSEP (SCM_SUBRF (less) (*(SCM *) a,
361 *(SCM *) b,
362 SCM_UNDEFINED));
363} /* subr2oless */
364
365static int
366lsubrless (SCM less, const void *a, const void *b)
367{
368 return SCM_NFALSEP (SCM_SUBRF (less)
369 (scm_cons (*(SCM *) a,
370 scm_cons (*(SCM *) b, SCM_EOL))));
371} /* lsubrless */
372
373static int
374closureless (SCM code, const void *a, const void *b)
375{
726d810a 376 SCM env = SCM_EXTEND_ENV (SCM_CLOSURE_FORMALS (code),
4c6fe5fc
MD
377 scm_cons (*(SCM *) a,
378 scm_cons (*(SCM *) b, SCM_EOL)),
379 SCM_ENV (code));
54e09076 380 /* Evaluate the closure body */
34249025 381 return SCM_NFALSEP (scm_eval_body (SCM_CDR (SCM_CODE (code)), env));
54e09076
MD
382} /* closureless */
383
384static int
385applyless (SCM less, const void *a, const void *b)
386{
fdc28395 387 return SCM_NFALSEP (scm_call_2 (less, *(SCM *) a, *(SCM *) b));
54e09076
MD
388} /* applyless */
389
390static cmp_fun_t
391scm_cmp_function (SCM p)
392{
393 switch (SCM_TYP7 (p))
394 {
395 case scm_tc7_subr_2:
396 case scm_tc7_rpsubr:
397 case scm_tc7_asubr:
398 return subr2less;
399 case scm_tc7_subr_2o:
400 return subr2oless;
401 case scm_tc7_lsubr:
402 return lsubrless;
403 case scm_tcs_closures:
404 return closureless;
405 default:
406 return applyless;
407 }
408} /* scm_cmp_function */
409
54e09076
MD
410
411/* Question: Is there any need to make this a more general array sort?
412 It is probably enough to manage the vector type. */
413/* endpos equal as for substring, i.e. endpos is not included. */
da4a1dba 414/* More natural with length? */
1bbd0b84 415
a1ec6916 416SCM_DEFINE (scm_restricted_vector_sort_x, "restricted-vector-sort!", 4, 0, 0,
1bbd0b84 417 (SCM vec, SCM less, SCM startpos, SCM endpos),
e3239868
DH
418 "Sort the vector @var{vec}, using @var{less} for comparing\n"
419 "the vector elements. @var{startpos} and @var{endpos} delimit\n"
420 "the range of the vector which gets sorted. The return value\n"
421 "is not specified.")
1bbd0b84 422#define FUNC_NAME s_scm_restricted_vector_sort_x
54e09076
MD
423{
424 size_t vlen, spos, len, size = sizeof (SCM);
425 SCM *vp;
426
b5c2579a 427 SCM_VALIDATE_VECTOR (1,vec);
6b5a304f 428 SCM_VALIDATE_NIM (2,less);
b5c2579a 429
54e09076 430 vp = SCM_VELTS (vec); /* vector pointer */
b5c2579a 431 vlen = SCM_VECTOR_LENGTH (vec);
54e09076 432
729dbac3
DH
433 SCM_VALIDATE_INUM_MIN_COPY (3, startpos, 0, spos);
434 SCM_ASSERT_RANGE (3,startpos, spos <= vlen);
3b3b36dd 435 SCM_VALIDATE_INUM_RANGE (4,endpos,0,vlen+1);
54e09076
MD
436 len = SCM_INUM (endpos) - spos;
437
438 quicksort (&vp[spos], len, size, scm_cmp_function (less), less);
439 return SCM_UNSPECIFIED;
440 /* return vec; */
1bbd0b84
GB
441}
442#undef FUNC_NAME
54e09076
MD
443
444/* (sorted? sequence less?)
445 * is true when sequence is a list (x0 x1 ... xm) or a vector #(x0 ... xm)
446 * such that for all 1 <= i <= m,
447 * (not (less? (list-ref list i) (list-ref list (- i 1)))). */
a1ec6916 448SCM_DEFINE (scm_sorted_p, "sorted?", 2, 0, 0,
1bbd0b84 449 (SCM items, SCM less),
e3239868
DH
450 "Return @code{#t} iff @var{items} is a list or a vector such that\n"
451 "for all 1 <= i <= m, the predicate @var{less} returns true when\n"
452 "applied to all elements i - 1 and i")
1bbd0b84 453#define FUNC_NAME s_scm_sorted_p
54e09076 454{
c014a02e 455 long len, j; /* list/vector length, temp j */
54e09076
MD
456 SCM item, rest; /* rest of items loop variable */
457 SCM *vp;
458 cmp_fun_t cmp = scm_cmp_function (less);
459
460 if (SCM_NULLP (items))
461 return SCM_BOOL_T;
1bbd0b84 462
6b5a304f 463 SCM_VALIDATE_NIM (2,less);
54e09076
MD
464
465 if (SCM_CONSP (items))
466 {
467 len = scm_ilength (items); /* also checks that it's a pure list */
1bbd0b84 468 SCM_ASSERT_RANGE (1,items,len >= 0);
54e09076
MD
469 if (len <= 1)
470 return SCM_BOOL_T;
471
472 item = SCM_CAR (items);
473 rest = SCM_CDR (items);
474 j = len - 1;
475 while (j > 0)
476 {
4b479d98 477 if ((*cmp) (less, SCM_CARLOC(rest), &item))
54e09076
MD
478 return SCM_BOOL_F;
479 else
480 {
481 item = SCM_CAR (rest);
482 rest = SCM_CDR (rest);
483 j--;
484 }
485 }
486 return SCM_BOOL_T;
487 }
488 else
489 {
b5c2579a
DH
490 SCM_VALIDATE_VECTOR (1, items);
491
492 vp = SCM_VELTS (items); /* vector pointer */
493 len = SCM_VECTOR_LENGTH (items);
494 j = len - 1;
495 while (j > 0)
54e09076 496 {
b5c2579a
DH
497 if ((*cmp) (less, &vp[1], vp))
498 return SCM_BOOL_F;
499 else
500 {
501 vp++;
502 j--;
503 }
54e09076 504 }
b5c2579a 505 return SCM_BOOL_T;
54e09076 506 }
b5c2579a 507
54e09076 508 return SCM_BOOL_F;
1bbd0b84
GB
509}
510#undef FUNC_NAME
54e09076
MD
511
512/* (merge a b less?)
513 takes two lists a and b such that (sorted? a less?) and (sorted? b less?)
514 and returns a new list in which the elements of a and b have been stably
515 interleaved so that (sorted? (merge a b less?) less?).
516 Note: this does _not_ accept vectors. */
a1ec6916 517SCM_DEFINE (scm_merge, "merge", 3, 0, 0,
1bbd0b84 518 (SCM alist, SCM blist, SCM less),
e3239868
DH
519 "Takes two lists @var{alist} and @var{blist} such that\n"
520 "@code{(sorted? alist less?)} and @code{(sorted? blist less?)} and\n"
521 "returns a new list in which the elements of @var{alist} and\n"
522 "@var{blist} have been stably interleaved so that\n"
523 "@code{(sorted? (merge alist blist less?) less?)}.\n"
524 "Note: this does _not_ accept vectors.")
1bbd0b84 525#define FUNC_NAME s_scm_merge
54e09076 526{
c014a02e 527 long alen, blen; /* list lengths */
54e09076
MD
528 SCM build, last;
529 cmp_fun_t cmp = scm_cmp_function (less);
6b5a304f 530 SCM_VALIDATE_NIM (3,less);
54e09076
MD
531
532 if (SCM_NULLP (alist))
533 return blist;
534 else if (SCM_NULLP (blist))
535 return alist;
536 else
537 {
3b3b36dd
GB
538 SCM_VALIDATE_NONEMPTYLIST_COPYLEN (1,alist,alen);
539 SCM_VALIDATE_NONEMPTYLIST_COPYLEN (2,blist,blen);
4b479d98 540 if ((*cmp) (less, SCM_CARLOC (blist), SCM_CARLOC (alist)))
54e09076
MD
541 {
542 build = scm_cons (SCM_CAR (blist), SCM_EOL);
543 blist = SCM_CDR (blist);
544 blen--;
545 }
c56cc3c8
MD
546 else
547 {
548 build = scm_cons (SCM_CAR (alist), SCM_EOL);
549 alist = SCM_CDR (alist);
550 alen--;
551 }
54e09076
MD
552 last = build;
553 while ((alen > 0) && (blen > 0))
554 {
4b479d98 555 if ((*cmp) (less, SCM_CARLOC (blist), SCM_CARLOC (alist)))
54e09076
MD
556 {
557 SCM_SETCDR (last, scm_cons (SCM_CAR (blist), SCM_EOL));
558 blist = SCM_CDR (blist);
559 blen--;
560 }
c56cc3c8
MD
561 else
562 {
563 SCM_SETCDR (last, scm_cons (SCM_CAR (alist), SCM_EOL));
564 alist = SCM_CDR (alist);
565 alen--;
566 }
54e09076
MD
567 last = SCM_CDR (last);
568 }
569 if ((alen > 0) && (blen == 0))
570 SCM_SETCDR (last, alist);
571 else if ((alen == 0) && (blen > 0))
572 SCM_SETCDR (last, blist);
573 }
574 return build;
1bbd0b84
GB
575}
576#undef FUNC_NAME
577
54e09076
MD
578
579static SCM
580scm_merge_list_x (SCM alist, SCM blist,
581 long alen, long blen,
582 cmp_fun_t cmp, SCM less)
583{
584 SCM build, last;
585
586 if (SCM_NULLP (alist))
587 return blist;
588 else if (SCM_NULLP (blist))
589 return alist;
590 else
591 {
4b479d98 592 if ((*cmp) (less, SCM_CARLOC (blist), SCM_CARLOC (alist)))
54e09076
MD
593 {
594 build = blist;
595 blist = SCM_CDR (blist);
596 blen--;
597 }
c56cc3c8
MD
598 else
599 {
600 build = alist;
601 alist = SCM_CDR (alist);
602 alen--;
603 }
54e09076
MD
604 last = build;
605 while ((alen > 0) && (blen > 0))
606 {
4b479d98 607 if ((*cmp) (less, SCM_CARLOC (blist), SCM_CARLOC (alist)))
54e09076
MD
608 {
609 SCM_SETCDR (last, blist);
610 blist = SCM_CDR (blist);
611 blen--;
612 }
c56cc3c8
MD
613 else
614 {
615 SCM_SETCDR (last, alist);
616 alist = SCM_CDR (alist);
617 alen--;
618 }
54e09076
MD
619 last = SCM_CDR (last);
620 }
621 if ((alen > 0) && (blen == 0))
622 SCM_SETCDR (last, alist);
623 else if ((alen == 0) && (blen > 0))
624 SCM_SETCDR (last, blist);
625 }
626 return build;
627} /* scm_merge_list_x */
628
a1ec6916 629SCM_DEFINE (scm_merge_x, "merge!", 3, 0, 0,
1bbd0b84 630 (SCM alist, SCM blist, SCM less),
e3239868
DH
631 "Takes two lists @var{alist} and @var{blist} such that\n"
632 "@code{(sorted? alist less?)} and @code{(sorted? blist less?)} and\n"
633 "returns a new list in which the elements of @var{alist} and\n"
634 "@var{blist} have been stably interleaved so that\n"
635 " @code{(sorted? (merge alist blist less?) less?)}.\n"
636 "This is the destructive variant of @code{merge}\n"
637 "Note: this does _not_ accept vectors.")
1bbd0b84 638#define FUNC_NAME s_scm_merge_x
54e09076 639{
c014a02e 640 long alen, blen; /* list lengths */
54e09076 641
6b5a304f 642 SCM_VALIDATE_NIM (3,less);
54e09076
MD
643 if (SCM_NULLP (alist))
644 return blist;
645 else if (SCM_NULLP (blist))
646 return alist;
647 else
648 {
3b3b36dd
GB
649 SCM_VALIDATE_NONEMPTYLIST_COPYLEN (1,alist,alen);
650 SCM_VALIDATE_NONEMPTYLIST_COPYLEN (2,blist,blen);
54e09076
MD
651 return scm_merge_list_x (alist, blist,
652 alen, blen,
653 scm_cmp_function (less),
654 less);
655 }
1bbd0b84
GB
656}
657#undef FUNC_NAME
54e09076
MD
658
659/* This merge sort algorithm is same as slib's by Richard A. O'Keefe.
660 The algorithm is stable. We also tried to use the algorithm used by
661 scsh's merge-sort but that algorithm showed to not be stable, even
662 though it claimed to be.
663*/
664static SCM
665scm_merge_list_step (SCM * seq,
666 cmp_fun_t cmp,
667 SCM less,
c014a02e 668 long n)
54e09076 669{
c56cc3c8
MD
670 SCM a, b;
671
54e09076
MD
672 if (n > 2)
673 {
c014a02e 674 long mid = n / 2;
c56cc3c8
MD
675 a = scm_merge_list_step (seq, cmp, less, mid);
676 b = scm_merge_list_step (seq, cmp, less, n - mid);
677 return scm_merge_list_x (a, b, mid, n - mid, cmp, less);
54e09076
MD
678 }
679 else if (n == 2)
680 {
681 SCM p = *seq;
682 SCM rest = SCM_CDR (*seq);
683 SCM x = SCM_CAR (*seq);
684 SCM y = SCM_CAR (SCM_CDR (*seq));
685 *seq = SCM_CDR (rest);
686 SCM_SETCDR (rest, SCM_EOL);
687 if ((*cmp) (less, &y, &x))
688 {
4b479d98
DH
689 SCM_SETCAR (p, y);
690 SCM_SETCAR (rest, x);
54e09076
MD
691 }
692 return p;
693 }
694 else if (n == 1)
695 {
696 SCM p = *seq;
697 *seq = SCM_CDR (p);
698 SCM_SETCDR (p, SCM_EOL);
699 return p;
700 }
701 else
702 return SCM_EOL;
703} /* scm_merge_list_step */
704
705
54e09076 706/* scm_sort_x manages lists and vectors, not stable sort */
a1ec6916 707SCM_DEFINE (scm_sort_x, "sort!", 2, 0, 0,
1bbd0b84 708 (SCM items, SCM less),
e3239868
DH
709 "Sort the sequence @var{items}, which may be a list or a\n"
710 "vector. @var{less} is used for comparing the sequence\n"
711 "elements. The sorting is destructive, that means that the\n"
712 "input sequence is modified to produce the sorted result.\n"
713 "This is not a stable sort.")
1bbd0b84 714#define FUNC_NAME s_scm_sort_x
54e09076 715{
c014a02e 716 long len; /* list/vector length */
54e09076
MD
717 if (SCM_NULLP(items))
718 return SCM_EOL;
b5c2579a 719
6b5a304f 720 SCM_VALIDATE_NIM (2,less);
54e09076
MD
721
722 if (SCM_CONSP (items))
723 {
3b3b36dd 724 SCM_VALIDATE_LIST_COPYLEN (1,items,len);
54e09076
MD
725 return scm_merge_list_step (&items, scm_cmp_function (less), less, len);
726 }
727 else if (SCM_VECTORP (items))
728 {
b5c2579a 729 len = SCM_VECTOR_LENGTH (items);
54e09076
MD
730 scm_restricted_vector_sort_x (items,
731 less,
732 SCM_MAKINUM (0L),
733 SCM_MAKINUM (len));
734 return items;
735 }
736 else
276dd677 737 SCM_WRONG_TYPE_ARG (1, items);
1bbd0b84 738}
0f981281 739#undef FUNC_NAME
54e09076
MD
740
741/* scm_sort manages lists and vectors, not stable sort */
1bbd0b84 742
a1ec6916 743SCM_DEFINE (scm_sort, "sort", 2, 0, 0,
1bbd0b84 744 (SCM items, SCM less),
e3239868
DH
745 "Sort the sequence @var{items}, which may be a list or a\n"
746 "vector. @var{less} is used for comparing the sequence\n"
747 "elements. This is not a stable sort.")
1bbd0b84 748#define FUNC_NAME s_scm_sort
54e09076 749{
54e09076
MD
750 if (SCM_NULLP(items))
751 return SCM_EOL;
b5c2579a 752
6b5a304f 753 SCM_VALIDATE_NIM (2,less);
54e09076
MD
754 if (SCM_CONSP (items))
755 {
c014a02e 756 long len;
e9e225e5 757
3b3b36dd 758 SCM_VALIDATE_LIST_COPYLEN (1,items,len);
54e09076
MD
759 items = scm_list_copy (items);
760 return scm_merge_list_step (&items, scm_cmp_function (less), less, len);
761 }
afe5177e
GH
762#ifdef HAVE_ARRAYS
763 /* support ordinary vectors even if arrays not available? */
54e09076
MD
764 else if (SCM_VECTORP (items))
765 {
c014a02e 766 long len = SCM_VECTOR_LENGTH (items);
e9e225e5
GH
767 SCM sortvec = scm_make_uve (len, scm_array_prototype (items));
768
54e09076
MD
769 scm_array_copy_x (items, sortvec);
770 scm_restricted_vector_sort_x (sortvec,
771 less,
772 SCM_MAKINUM (0L),
773 SCM_MAKINUM (len));
774 return sortvec;
775 }
afe5177e 776#endif
54e09076 777 else
276dd677 778 SCM_WRONG_TYPE_ARG (1, items);
1bbd0b84 779}
0f981281 780#undef FUNC_NAME
54e09076
MD
781
782static void
783scm_merge_vector_x (void *const vecbase,
784 void *const tempbase,
785 cmp_fun_t cmp,
786 SCM less,
c014a02e
ML
787 long low,
788 long mid,
789 long high)
54e09076
MD
790{
791 register SCM *vp = (SCM *) vecbase;
792 register SCM *temp = (SCM *) tempbase;
c014a02e
ML
793 long it; /* Index for temp vector */
794 long i1 = low; /* Index for lower vector segment */
795 long i2 = mid + 1; /* Index for upper vector segment */
54e09076
MD
796
797 /* Copy while both segments contain more characters */
798 for (it = low; (i1 <= mid) && (i2 <= high); ++it)
799 if ((*cmp) (less, &vp[i2], &vp[i1]))
800 temp[it] = vp[i2++];
801 else
802 temp[it] = vp[i1++];
803
804 /* Copy while first segment contains more characters */
805 while (i1 <= mid)
806 temp[it++] = vp[i1++];
807
808 /* Copy while second segment contains more characters */
809 while (i2 <= high)
810 temp[it++] = vp[i2++];
811
812 /* Copy back from temp to vp */
813 for (it = low; it <= high; ++it)
814 vp[it] = temp[it];
815} /* scm_merge_vector_x */
816
817static void
818scm_merge_vector_step (void *const vp,
819 void *const temp,
820 cmp_fun_t cmp,
821 SCM less,
c014a02e
ML
822 long low,
823 long high)
54e09076
MD
824{
825 if (high > low)
826 {
c014a02e 827 long mid = (low + high) / 2;
54e09076
MD
828 scm_merge_vector_step (vp, temp, cmp, less, low, mid);
829 scm_merge_vector_step (vp, temp, cmp, less, mid+1, high);
830 scm_merge_vector_x (vp, temp, cmp, less, low, mid, high);
831 }
832} /* scm_merge_vector_step */
833
834
54e09076
MD
835/* stable-sort! manages lists and vectors */
836
a1ec6916 837SCM_DEFINE (scm_stable_sort_x, "stable-sort!", 2, 0, 0,
1bbd0b84 838 (SCM items, SCM less),
e3239868
DH
839 "Sort the sequence @var{items}, which may be a list or a\n"
840 "vector. @var{less} is used for comparing the sequence elements.\n"
841 "The sorting is destructive, that means that the input sequence\n"
842 "is modified to produce the sorted result.\n"
843 "This is a stable sort.")
1bbd0b84 844#define FUNC_NAME s_scm_stable_sort_x
54e09076 845{
c014a02e 846 long len; /* list/vector length */
54e09076
MD
847
848 if (SCM_NULLP (items))
849 return SCM_EOL;
b5c2579a 850
6b5a304f 851 SCM_VALIDATE_NIM (2,less);
54e09076
MD
852 if (SCM_CONSP (items))
853 {
3b3b36dd 854 SCM_VALIDATE_LIST_COPYLEN (1,items,len);
54e09076
MD
855 return scm_merge_list_step (&items, scm_cmp_function (less), less, len);
856 }
857 else if (SCM_VECTORP (items))
858 {
859 SCM *temp, *vp;
b5c2579a 860 len = SCM_VECTOR_LENGTH (items);
54e09076
MD
861 temp = malloc (len * sizeof(SCM));
862 vp = SCM_VELTS (items);
863 scm_merge_vector_step (vp,
864 temp,
865 scm_cmp_function (less),
866 less,
867 0,
868 len - 1);
869 free(temp);
870 return items;
871 }
872 else
276dd677 873 SCM_WRONG_TYPE_ARG (1, items);
1bbd0b84 874}
0f981281 875#undef FUNC_NAME
54e09076
MD
876
877/* stable_sort manages lists and vectors */
1bbd0b84 878
a1ec6916 879SCM_DEFINE (scm_stable_sort, "stable-sort", 2, 0, 0,
1bbd0b84 880 (SCM items, SCM less),
e3239868
DH
881 "Sort the sequence @var{items}, which may be a list or a\n"
882 "vector. @var{less} is used for comparing the sequence elements.\n"
883 "This is a stable sort.")
1bbd0b84 884#define FUNC_NAME s_scm_stable_sort
54e09076 885{
c014a02e 886 long len; /* list/vector length */
54e09076
MD
887 if (SCM_NULLP (items))
888 return SCM_EOL;
b5c2579a 889
6b5a304f 890 SCM_VALIDATE_NIM (2,less);
54e09076
MD
891 if (SCM_CONSP (items))
892 {
3b3b36dd 893 SCM_VALIDATE_LIST_COPYLEN (1,items,len);
54e09076
MD
894 items = scm_list_copy (items);
895 return scm_merge_list_step (&items, scm_cmp_function (less), less, len);
896 }
afe5177e
GH
897#ifdef HAVE_ARRAYS
898 /* support ordinary vectors even if arrays not available? */
54e09076
MD
899 else if (SCM_VECTORP (items))
900 {
901 SCM retvec;
902 SCM *temp, *vp;
b5c2579a 903 len = SCM_VECTOR_LENGTH (items);
54e09076
MD
904 retvec = scm_make_uve (len, scm_array_prototype (items));
905 scm_array_copy_x (items, retvec);
906 temp = malloc (len * sizeof (SCM));
907 vp = SCM_VELTS (retvec);
908 scm_merge_vector_step (vp,
909 temp,
910 scm_cmp_function (less),
911 less,
912 0,
913 len - 1);
914 free (temp);
915 return retvec;
916 }
afe5177e 917#endif
54e09076 918 else
276dd677 919 SCM_WRONG_TYPE_ARG (1, items);
1bbd0b84 920}
0f981281 921#undef FUNC_NAME
54e09076 922
1bbd0b84 923/* stable */
a1ec6916 924SCM_DEFINE (scm_sort_list_x, "sort-list!", 2, 0, 0,
1bbd0b84 925 (SCM items, SCM less),
e3239868
DH
926 "Sort the list @var{items}, using @var{less} for comparing the\n"
927 "list elements. The sorting is destructive, that means that the\n"
928 "input list is modified to produce the sorted result.\n"
929 "This is a stable sort.")
1bbd0b84 930#define FUNC_NAME s_scm_sort_list_x
54e09076 931{
c014a02e 932 long len;
3b3b36dd 933 SCM_VALIDATE_LIST_COPYLEN (1,items,len);
6b5a304f 934 SCM_VALIDATE_NIM (2,less);
54e09076 935 return scm_merge_list_step (&items, scm_cmp_function (less), less, len);
1bbd0b84 936}
0f981281 937#undef FUNC_NAME
54e09076 938
1bbd0b84 939/* stable */
a1ec6916 940SCM_DEFINE (scm_sort_list, "sort-list", 2, 0, 0,
e3239868
DH
941 (SCM items, SCM less),
942 "Sort the list @var{items}, using @var{less} for comparing the\n"
943 "list elements. This is a stable sort.")
1bbd0b84 944#define FUNC_NAME s_scm_sort_list
54e09076 945{
c014a02e 946 long len;
3b3b36dd 947 SCM_VALIDATE_LIST_COPYLEN (1,items,len);
6b5a304f 948 SCM_VALIDATE_NIM (2,less);
54e09076
MD
949 items = scm_list_copy (items);
950 return scm_merge_list_step (&items, scm_cmp_function (less), less, len);
1bbd0b84 951}
0f981281 952#undef FUNC_NAME
54e09076
MD
953
/* Module initialisation: pulls in "libguile/sort.x" (skipped while
   SCM_MAGIC_SNARFER is defined) and then adds the feature "sort".
   NOTE(review): sort.x is presumably the snarfer-generated
   registration code for the SCM_DEFINE forms in this file -- confirm
   against the build.  */
void
scm_init_sort ()
{
#ifndef SCM_MAGIC_SNARFER
#include "libguile/sort.x"
#endif

  scm_add_feature ("sort");
}
89e00824
ML
963
964/*
965 Local Variables:
966 c-file-style: "gnu"
967 End:
968*/