1 /* srfi-14.c --- SRFI-14 procedures for Guile
3 * Copyright (C) 2001 Free Software Foundation, Inc.
5 * This library is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU Lesser General Public
7 * License as published by the Free Software Foundation; either
8 * version 2.1 of the License, or (at your option) any later version.
10 * This library is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * Lesser General Public License for more details.
15 * You should have received a copy of the GNU Lesser General Public
16 * License along with this library; if not, write to the Free Software
17 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
/* Bitmap helpers for charset smobs.  SCM_CHARSET_SET turns on bit IDX
   in the array of longs held as the smob data of CS.  BYTES_PER_CHARSET
   and LONGS_PER_CHARSET express SCM_CHARSET_SIZE (a count of bits) in
   bytes and in longs; the byte form hard-codes 8 bits per byte.  */
28 #define SCM_CHARSET_SET(cs, idx) \
29 (((long *) SCM_SMOB_DATA (cs))[(idx) / SCM_BITS_PER_LONG] |= \
30 (1L << ((idx) % SCM_BITS_PER_LONG)))
32 #define BYTES_PER_CHARSET (SCM_CHARSET_SIZE / 8)
33 #define LONGS_PER_CHARSET (SCM_CHARSET_SIZE / SCM_BITS_PER_LONG)
36 /* Smob type code for character sets. */
/* Starts out as 0; scm_c_init_srfi_14 stores the value returned by
   scm_make_smob_type here.  */
37 int scm_tc16_charset
= 0;
40 /* Smob print hook for character sets. */
/* Writes "#<charset {" to PORT, scans every index below
   SCM_CHARSET_SIZE and scm_write's the character for each index that
   is a member of CHARSET, then writes "}>".  PSTATE is unused.
   NOTE(review): the return type, locals, any separator output between
   members and the return statement are not visible in this listing.  */
42 charset_print (SCM charset
, SCM port
, scm_print_state
*pstate SCM_UNUSED
)
47 scm_puts ("#<charset {", port
);
48 for (i
= 0; i
< SCM_CHARSET_SIZE
; i
++)
49 if (SCM_CHARSET_GET (charset
, i
))
55 scm_write (SCM_MAKE_CHAR (i
), port
);
57 scm_puts ("}>", port
);
62 /* Smob free hook for character sets. */
/* Hands CHARSET to scm_smob_free and returns whatever that returns.  */
64 charset_free (SCM charset
)
66 return scm_smob_free (charset
);
70 /* Create a new, empty character set. */
/* Obtains BYTES_PER_CHARSET bytes from scm_gc_malloc (tagged
   "character-set"), zeroes them so that no membership bit is set, and
   returns a new smob of type scm_tc16_charset whose data is that
   buffer.  FUNC_NAME is not referenced by the visible statements.  */
72 make_char_set (const char * func_name
)
76 p
= scm_gc_malloc (BYTES_PER_CHARSET
, "character-set");
77 memset (p
, 0, BYTES_PER_CHARSET
);
78 SCM_RETURN_NEWSMOB (scm_tc16_charset
, p
);
/* Scheme `char-set?': returns the boolean form of SCM_SMOB_PREDICATE
   for scm_tc16_charset applied to OBJ, i.e. whether OBJ is a charset
   smob.  */
82 SCM_DEFINE (scm_char_set_p
, "char-set?", 1, 0, 0,
84 "Return @code{#t} if @var{obj} is a character set, @code{#f}\n"
86 #define FUNC_NAME s_scm_char_set_p
88 return SCM_BOOL (SCM_SMOB_PREDICATE (scm_tc16_charset
, obj
));
/* Scheme `char-set=', taking only rest arguments.  Every element of
   CHAR_SETS is validated as a charset smob (position argnum).  The
   bitmap pointer cs1_data starts as NULL; when it is non-NULL the
   current bitmap is compared against it with memcmp over
   BYTES_PER_CHARSET bytes.
   NOTE(review): the branch bodies (presumably recording the first
   bitmap and returning false on a mismatch) and the final return are
   not visible in this listing.  */
93 SCM_DEFINE (scm_char_set_eq
, "char-set=", 0, 0, 1,
95 "Return @code{#t} if all given character sets are equal.")
96 #define FUNC_NAME s_scm_char_set_eq
99 long *cs1_data
= NULL
;
101 SCM_VALIDATE_REST_ARGUMENT (char_sets
);
103 while (!SCM_NULLP (char_sets
))
105 SCM csi
= SCM_CAR (char_sets
);
108 SCM_VALIDATE_SMOB (argnum
, csi
, charset
);
110 csi_data
= (long *) SCM_SMOB_DATA (csi
);
111 if (cs1_data
== NULL
)
113 else if (memcmp (cs1_data
, csi_data
, BYTES_PER_CHARSET
) != 0)
115 char_sets
= SCM_CDR (char_sets
);
/* Scheme `char-set<=', taking only rest arguments.  Each element of
   CHAR_SETS is validated as a charset smob.  The word loop tests
   (prev & cur) != prev, which is true exactly when the previous set
   has a bit that the current set lacks; afterwards prev_data is moved
   to the current set's bitmap.
   NOTE(review): prev_data starts as NULL, so a guard around the word
   loop for the first argument is presumably on a line missing from
   this listing, as are the statements that produce the result.  */
122 SCM_DEFINE (scm_char_set_leq
, "char-set<=", 0, 0, 1,
124 "Return @code{#t} if every character set @var{cs}i is a subset\n"
125 "of character set @var{cs}i+1.")
126 #define FUNC_NAME s_scm_char_set_leq
129 long *prev_data
= NULL
;
131 SCM_VALIDATE_REST_ARGUMENT (char_sets
);
133 while (!SCM_NULLP (char_sets
))
135 SCM csi
= SCM_CAR (char_sets
);
138 SCM_VALIDATE_SMOB (argnum
, csi
, charset
);
140 csi_data
= (long *) SCM_SMOB_DATA (csi
);
145 for (k
= 0; k
< LONGS_PER_CHARSET
; k
++)
147 if ((prev_data
[k
] & csi_data
[k
]) != prev_data
[k
])
151 prev_data
= csi_data
;
152 char_sets
= SCM_CDR (char_sets
);
/* Scheme `char-set-hash' with an optional BOUND.  CS is validated as a
   charset smob.  When BOUND is supplied it is validated as a fixnum
   >= 0 and copied into bnd.  The hash folds the bitmap words as
   val = word + (val << 1) in unsigned long arithmetic, and the result
   is val % bnd as a fixnum.
   NOTE(review): default_bnd (871) is presumably assigned to bnd when
   BOUND is unbound or zero; those assignments are on lines missing
   from this listing.  */
159 SCM_DEFINE (scm_char_set_hash
, "char-set-hash", 1, 1, 0,
161 "Compute a hash value for the character set @var{cs}. If\n"
162 "@var{bound} is given and non-zero, it restricts the\n"
163 "returned value to the range 0 @dots{} @var{bound - 1}.")
164 #define FUNC_NAME s_scm_char_set_hash
166 const int default_bnd
= 871;
169 unsigned long val
= 0;
172 SCM_VALIDATE_SMOB (1, cs
, charset
);
174 if (SCM_UNBNDP (bound
))
178 SCM_VALIDATE_INUM_MIN_COPY (2, bound
, 0, bnd
);
183 p
= (long *) SCM_SMOB_DATA (cs
);
184 for (k
= 0; k
< LONGS_PER_CHARSET
; k
++)
187 val
= p
[k
] + (val
<< 1);
189 return SCM_MAKINUM (val
% bnd
);
/* Scheme `char-set-cursor'.  Validates CS as a charset smob, scans
   indices upward from 0 testing membership, and returns idx as a
   fixnum; a cursor is therefore a plain character-code index.
   NOTE(review): the statement run when a member is found is not
   visible; presumably it leaves the loop so idx is the first member,
   or SCM_CHARSET_SIZE for an empty set.  */
194 SCM_DEFINE (scm_char_set_cursor
, "char-set-cursor", 1, 0, 0,
196 "Return a cursor into the character set @var{cs}.")
197 #define FUNC_NAME s_scm_char_set_cursor
201 SCM_VALIDATE_SMOB (1, cs
, charset
);
202 for (idx
= 0; idx
< SCM_CHARSET_SIZE
; idx
++)
204 if (SCM_CHARSET_GET (cs
, idx
))
207 return SCM_MAKINUM (idx
);
/* Scheme `char-set-ref'.  Validates CS as a charset smob and CURSOR as
   a fixnum >= 0.  Signals a misc error when the cursor is at or beyond
   SCM_CHARSET_SIZE or does not index a member of CS; otherwise returns
   the character whose code equals the cursor.  */
212 SCM_DEFINE (scm_char_set_ref
, "char-set-ref", 2, 0, 0,
213 (SCM cs
, SCM cursor
),
214 "Return the character at the current cursor position\n"
215 "@var{cursor} in the character set @var{cs}. It is an error to\n"
216 "pass a cursor for which @code{end-of-char-set?} returns true.")
217 #define FUNC_NAME s_scm_char_set_ref
221 SCM_VALIDATE_SMOB (1, cs
, charset
);
222 SCM_VALIDATE_INUM_MIN_COPY (2, cursor
, 0, ccursor
);
224 if (ccursor
>= SCM_CHARSET_SIZE
|| !SCM_CHARSET_GET (cs
, ccursor
))
225 SCM_MISC_ERROR ("invalid character set cursor: ~A", scm_list_1 (cursor
));
226 return SCM_MAKE_CHAR (ccursor
);
/* Scheme `char-set-cursor-next'.  Applies the same argument checks as
   char-set-ref (charset smob, fixnum cursor >= 0, cursor must index a
   member), then steps ccursor upward from the following index while
   testing membership, and returns ccursor as a fixnum.
   NOTE(review): the statement run when the next member is found is
   not visible; presumably it leaves the loop, so the result is the
   next member or SCM_CHARSET_SIZE when there is none.  */
231 SCM_DEFINE (scm_char_set_cursor_next
, "char-set-cursor-next", 2, 0, 0,
232 (SCM cs
, SCM cursor
),
233 "Advance the character set cursor @var{cursor} to the next\n"
234 "character in the character set @var{cs}. It is an error if the\n"
235 "cursor given satisfies @code{end-of-char-set?}.")
236 #define FUNC_NAME s_scm_char_set_cursor_next
240 SCM_VALIDATE_SMOB (1, cs
, charset
);
241 SCM_VALIDATE_INUM_MIN_COPY (2, cursor
, 0, ccursor
);
243 if (ccursor
>= SCM_CHARSET_SIZE
|| !SCM_CHARSET_GET (cs
, ccursor
))
244 SCM_MISC_ERROR ("invalid character set cursor: ~A", scm_list_1 (cursor
));
245 for (ccursor
++; ccursor
< SCM_CHARSET_SIZE
; ccursor
++)
247 if (SCM_CHARSET_GET (cs
, ccursor
))
250 return SCM_MAKINUM (ccursor
);
/* Scheme `end-of-char-set?'.  Validates CURSOR as a fixnum >= 0 and
   returns true exactly when it is at or beyond SCM_CHARSET_SIZE.  */
255 SCM_DEFINE (scm_end_of_char_set_p
, "end-of-char-set?", 1, 0, 0,
257 "Return @code{#t} if @var{cursor} has reached the end of a\n"
258 "character set, @code{#f} otherwise.")
259 #define FUNC_NAME s_scm_end_of_char_set_p
263 SCM_VALIDATE_INUM_MIN_COPY (1, cursor
, 0, ccursor
);
264 return SCM_BOOL (ccursor
>= SCM_CHARSET_SIZE
);
/* Scheme `char-set-fold'.  Validates KONS as a procedure and CS as a
   charset smob.  For every member of CS, in ascending character-code
   order, calls (kons char knil) and stores the result back in KNIL.
   NOTE(review): the return statement is not visible; presumably the
   final KNIL is returned.  */
269 SCM_DEFINE (scm_char_set_fold
, "char-set-fold", 3, 0, 0,
270 (SCM kons
, SCM knil
, SCM cs
),
271 "Fold the procedure @var{kons} over the character set @var{cs},\n"
272 "initializing it with @var{knil}.")
273 #define FUNC_NAME s_scm_char_set_fold
277 SCM_VALIDATE_PROC (1, kons
);
278 SCM_VALIDATE_SMOB (3, cs
, charset
);
280 for (k
= 0; k
< SCM_CHARSET_SIZE
; k
++)
281 if (SCM_CHARSET_GET (cs
, k
))
283 knil
= scm_call_2 (kons
, SCM_MAKE_CHAR (k
), knil
);
/* Scheme `char-set-unfold' with an optional BASE_CS.  P, F and G are
   validated as procedures.  The result is a copy of BASE_CS when that
   is supplied (after smob validation); make_char_set provides a fresh
   empty set, presumably in the else branch that this listing omits.
   While (p seed) is false: ch = (f seed), the character of ch is
   added to the result, and seed becomes (g seed).
   NOTE(review): the misc-error call is presumably guarded by a
   character check on ch, and the result is presumably returned; both
   are on lines missing from this listing.  */
290 SCM_DEFINE (scm_char_set_unfold
, "char-set-unfold", 4, 1, 0,
291 (SCM p
, SCM f
, SCM g
, SCM seed
, SCM base_cs
),
292 "This is a fundamental constructor for character sets.\n"
294 "@item @var{g} is used to generate a series of ``seed'' values\n"
295 "from the initial seed: @var{seed}, (@var{g} @var{seed}),\n"
296 "(@var{g}^2 @var{seed}), (@var{g}^3 @var{seed}), @dots{}\n"
297 "@item @var{p} tells us when to stop -- when it returns true\n"
298 "when applied to one of the seed values.\n"
299 "@item @var{f} maps each seed value to a character. These\n"
300 "characters are added to the base character set @var{base_cs} to\n"
301 "form the result; @var{base_cs} defaults to the empty set.\n"
303 #define FUNC_NAME s_scm_char_set_unfold
307 SCM_VALIDATE_PROC (1, p
);
308 SCM_VALIDATE_PROC (2, f
);
309 SCM_VALIDATE_PROC (3, g
);
310 if (!SCM_UNBNDP (base_cs
))
312 SCM_VALIDATE_SMOB (5, base_cs
, charset
);
313 result
= scm_char_set_copy (base_cs
);
316 result
= make_char_set (FUNC_NAME
);
318 tmp
= scm_call_1 (p
, seed
);
319 while (SCM_FALSEP (tmp
))
321 SCM ch
= scm_call_1 (f
, seed
);
323 SCM_MISC_ERROR ("procedure ~S returned non-char", scm_list_1 (f
));
324 SCM_CHARSET_SET (result
, SCM_CHAR (ch
));
326 seed
= scm_call_1 (g
, seed
);
327 tmp
= scm_call_1 (p
, seed
);
/* Scheme `char-set-unfold!'.  P, F and G are validated as procedures
   and BASE_CS as a charset smob.  While (p seed) is false:
   ch = (f seed), the character of ch is set directly in BASE_CS, and
   seed becomes (g seed).
   NOTE(review): BASE_CS is a required argument here (5 required, 0
   optional), so the docstring's "defaults to the empty set" does not
   match the signature.  The character check guarding the misc-error
   call and the return are on lines missing from this listing.  */
334 SCM_DEFINE (scm_char_set_unfold_x
, "char-set-unfold!", 5, 0, 0,
335 (SCM p
, SCM f
, SCM g
, SCM seed
, SCM base_cs
),
336 "This is a fundamental constructor for character sets.\n"
338 "@item @var{g} is used to generate a series of ``seed'' values\n"
339 "from the initial seed: @var{seed}, (@var{g} @var{seed}),\n"
340 "(@var{g}^2 @var{seed}), (@var{g}^3 @var{seed}), @dots{}\n"
341 "@item @var{p} tells us when to stop -- when it returns true\n"
342 "when applied to one of the seed values.\n"
343 "@item @var{f} maps each seed value to a character. These\n"
344 "characters are added to the base character set @var{base_cs} to\n"
345 "form the result; @var{base_cs} defaults to the empty set.\n"
347 #define FUNC_NAME s_scm_char_set_unfold_x
351 SCM_VALIDATE_PROC (1, p
);
352 SCM_VALIDATE_PROC (2, f
);
353 SCM_VALIDATE_PROC (3, g
);
354 SCM_VALIDATE_SMOB (5, base_cs
, charset
);
356 tmp
= scm_call_1 (p
, seed
);
357 while (SCM_FALSEP (tmp
))
359 SCM ch
= scm_call_1 (f
, seed
);
361 SCM_MISC_ERROR ("procedure ~S returned non-char", scm_list_1 (f
));
362 SCM_CHARSET_SET (base_cs
, SCM_CHAR (ch
));
364 seed
= scm_call_1 (g
, seed
);
365 tmp
= scm_call_1 (p
, seed
);
/* Scheme `char-set-for-each'.  Validates PROC as a procedure and CS as
   a charset smob, calls PROC on each member of CS in ascending
   character-code order, discards the results and returns
   SCM_UNSPECIFIED.  */
372 SCM_DEFINE (scm_char_set_for_each
, "char-set-for-each", 2, 0, 0,
374 "Apply @var{proc} to every character in the character set\n"
375 "@var{cs}. The return value is not specified.")
376 #define FUNC_NAME s_scm_char_set_for_each
380 SCM_VALIDATE_PROC (1, proc
);
381 SCM_VALIDATE_SMOB (2, cs
, charset
);
383 for (k
= 0; k
< SCM_CHARSET_SIZE
; k
++)
384 if (SCM_CHARSET_GET (cs
, k
))
385 scm_call_1 (proc
, SCM_MAKE_CHAR (k
));
386 return SCM_UNSPECIFIED
;
/* Scheme `char-set-map'.  Validates PROC as a procedure and CS as a
   charset smob, creates a fresh empty set, and for each member of CS
   calls PROC and adds the returned character to the new set.
   NOTE(review): the character check guarding the misc-error call and
   the return of the new set are on lines missing from this listing.  */
391 SCM_DEFINE (scm_char_set_map
, "char-set-map", 2, 0, 0,
393 "Map the procedure @var{proc} over every character in @var{cs}.\n"
394 "@var{proc} must be a character -> character procedure.")
395 #define FUNC_NAME s_scm_char_set_map
400 SCM_VALIDATE_PROC (1, proc
);
401 SCM_VALIDATE_SMOB (2, cs
, charset
);
403 result
= make_char_set (FUNC_NAME
);
404 for (k
= 0; k
< SCM_CHARSET_SIZE
; k
++)
405 if (SCM_CHARSET_GET (cs
, k
))
407 SCM ch
= scm_call_1 (proc
, SCM_MAKE_CHAR (k
));
409 SCM_MISC_ERROR ("procedure ~S returned non-char", scm_list_1 (proc
));
410 SCM_CHARSET_SET (result
, SCM_CHAR (ch
));
/* Scheme `char-set-copy'.  Validates CS as a charset smob, allocates a
   fresh set with make_char_set, and takes the bitmap pointers of the
   source (p1) and the new set (p2) before looping over
   LONGS_PER_CHARSET words.
   NOTE(review): the loop body (presumably a word-by-word copy from p1
   to p2) and the return are on lines missing from this listing.  */
417 SCM_DEFINE (scm_char_set_copy
, "char-set-copy", 1, 0, 0,
419 "Return a newly allocated character set containing all\n"
420 "characters in @var{cs}.")
421 #define FUNC_NAME s_scm_char_set_copy
427 SCM_VALIDATE_SMOB (1, cs
, charset
);
428 ret
= make_char_set (FUNC_NAME
);
429 p1
= (long *) SCM_SMOB_DATA (cs
);
430 p2
= (long *) SCM_SMOB_DATA (ret
);
431 for (k
= 0; k
< LONGS_PER_CHARSET
; k
++)
/* Scheme `char-set', taking only rest arguments.  Creates a fresh
   empty set, then for each element of REST validates it as a
   character (position argnum), copies its code into c and sets bit c
   in the new set's bitmap.
   NOTE(review): the update of argnum and the return of the new set
   are on lines missing from this listing.  */
438 SCM_DEFINE (scm_char_set
, "char-set", 0, 0, 1,
440 "Return a character set containing all given characters.")
441 #define FUNC_NAME s_scm_char_set
447 SCM_VALIDATE_REST_ARGUMENT (rest
);
448 cs
= make_char_set (FUNC_NAME
);
449 p
= (long *) SCM_SMOB_DATA (cs
);
450 while (!SCM_NULLP (rest
))
454 SCM_VALIDATE_CHAR_COPY (argnum
, SCM_CAR (rest
), c
);
456 rest
= SCM_CDR (rest
);
457 p
[c
/ SCM_BITS_PER_LONG
] |= 1L << (c
% SCM_BITS_PER_LONG
);
/* Scheme `list->char-set' with an optional BASE_CS.  LIST is validated
   as a list.  The working set is a fresh empty set when BASE_CS is
   unbound; the validate-and-copy of BASE_CS is presumably the else
   branch.  Each list element is validated as a character (position 0)
   and its bit is set in the working set.
   NOTE(review): the docstring's "the character in this set" should
   read "the characters in this set".  The return is on a line missing
   from this listing.  */
464 SCM_DEFINE (scm_list_to_char_set
, "list->char-set", 1, 1, 0,
465 (SCM list
, SCM base_cs
),
466 "Convert the character list @var{list} to a character set. If\n"
467 "the character set @var{base_cs} is given, the character in this\n"
468 "set are also included in the result.")
469 #define FUNC_NAME s_scm_list_to_char_set
474 SCM_VALIDATE_LIST (1, list
);
475 if (SCM_UNBNDP (base_cs
))
476 cs
= make_char_set (FUNC_NAME
);
479 SCM_VALIDATE_SMOB (2, base_cs
, charset
);
480 cs
= scm_char_set_copy (base_cs
);
482 p
= (long *) SCM_SMOB_DATA (cs
);
483 while (!SCM_NULLP (list
))
485 SCM chr
= SCM_CAR (list
);
488 SCM_VALIDATE_CHAR_COPY (0, chr
, c
);
489 list
= SCM_CDR (list
);
491 p
[c
/ SCM_BITS_PER_LONG
] |= 1L << (c
% SCM_BITS_PER_LONG
);
/* Scheme `list->char-set!'.  Validates LIST as a list and BASE_CS as a
   charset smob, then validates each list element as a character
   (position 0) and sets its bit directly in BASE_CS's bitmap.
   NOTE(review): the end of the docstring and the return are on lines
   missing from this listing.  */
498 SCM_DEFINE (scm_list_to_char_set_x
, "list->char-set!", 2, 0, 0,
499 (SCM list
, SCM base_cs
),
500 "Convert the character list @var{list} to a character set. The\n"
501 "characters are added to @var{base_cs} and @var{base_cs} is\n"
503 #define FUNC_NAME s_scm_list_to_char_set_x
507 SCM_VALIDATE_LIST (1, list
);
508 SCM_VALIDATE_SMOB (2, base_cs
, charset
);
509 p
= (long *) SCM_SMOB_DATA (base_cs
);
510 while (!SCM_NULLP (list
))
512 SCM chr
= SCM_CAR (list
);
515 SCM_VALIDATE_CHAR_COPY (0, chr
, c
);
516 list
= SCM_CDR (list
);
518 p
[c
/ SCM_BITS_PER_LONG
] |= 1L << (c
% SCM_BITS_PER_LONG
);
/* Scheme `string->char-set' with an optional BASE_CS.  STR is
   validated as a string.  The working set is a fresh empty set when
   BASE_CS is unbound; the validate-and-copy of BASE_CS is presumably
   the else branch.  The loop runs while k is below the string length
   and sets bit c in the working set.
   NOTE(review): the initialisation of k, the statement that reads c
   from the string data s, and the return are on lines missing from
   this listing.  */
525 SCM_DEFINE (scm_string_to_char_set
, "string->char-set", 1, 1, 0,
526 (SCM str
, SCM base_cs
),
527 "Convert the string @var{str} to a character set. If the\n"
528 "character set @var{base_cs} is given, the characters in this\n"
529 "set are also included in the result.")
530 #define FUNC_NAME s_scm_string_to_char_set
537 SCM_VALIDATE_STRING (1, str
);
538 if (SCM_UNBNDP (base_cs
))
539 cs
= make_char_set (FUNC_NAME
);
542 SCM_VALIDATE_SMOB (2, base_cs
, charset
);
543 cs
= scm_char_set_copy (base_cs
);
545 p
= (long *) SCM_SMOB_DATA (cs
);
546 s
= SCM_STRING_CHARS (str
);
547 while (k
< SCM_STRING_LENGTH (str
))
550 p
[c
/ SCM_BITS_PER_LONG
] |= 1L << (c
% SCM_BITS_PER_LONG
);
/* Scheme `string->char-set!'.  Validates STR as a string and BASE_CS
   as a charset smob, then loops while k is below the string length,
   setting bit c directly in BASE_CS's bitmap.
   NOTE(review): the initialisation of k, the statement that reads c
   from the string data s, and the return are on lines missing from
   this listing.  */
557 SCM_DEFINE (scm_string_to_char_set_x
, "string->char-set!", 2, 0, 0,
558 (SCM str
, SCM base_cs
),
559 "Convert the string @var{str} to a character set. The\n"
560 "characters from the string are added to @var{base_cs}, and\n"
561 "@var{base_cs} is returned.")
562 #define FUNC_NAME s_scm_string_to_char_set_x
568 SCM_VALIDATE_STRING (1, str
);
569 SCM_VALIDATE_SMOB (2, base_cs
, charset
);
570 p
= (long *) SCM_SMOB_DATA (base_cs
);
571 s
= SCM_STRING_CHARS (str
);
572 while (k
< SCM_STRING_LENGTH (str
))
575 p
[c
/ SCM_BITS_PER_LONG
] |= 1L << (c
% SCM_BITS_PER_LONG
);
/* Scheme `char-set-filter' with an optional BASE_CS.  Validates PRED
   as a procedure and CS as a charset smob.  The result is a copy of
   BASE_CS when that is supplied (after smob validation);
   make_char_set provides a fresh empty set, presumably in the else
   branch.  For every member of CS, PRED is called on the character
   and, when the answer is not false, that character's bit is set in
   the result.
   NOTE(review): the return is on a line missing from this listing.  */
582 SCM_DEFINE (scm_char_set_filter
, "char-set-filter", 2, 1, 0,
583 (SCM pred
, SCM cs
, SCM base_cs
),
584 "Return a character set containing every character from @var{cs}\n"
585 "so that it satisfies @var{pred}. If provided, the characters\n"
586 "from @var{base_cs} are added to the result.")
587 #define FUNC_NAME s_scm_char_set_filter
593 SCM_VALIDATE_PROC (1, pred
);
594 SCM_VALIDATE_SMOB (2, cs
, charset
);
595 if (!SCM_UNBNDP (base_cs
))
597 SCM_VALIDATE_SMOB (3, base_cs
, charset
);
598 ret
= scm_char_set_copy (base_cs
);
601 ret
= make_char_set (FUNC_NAME
);
602 p
= (long *) SCM_SMOB_DATA (ret
);
603 for (k
= 0; k
< SCM_CHARSET_SIZE
; k
++)
605 if (SCM_CHARSET_GET (cs
, k
))
607 SCM res
= scm_call_1 (pred
, SCM_MAKE_CHAR (k
));
609 if (!SCM_FALSEP (res
))
610 p
[k
/ SCM_BITS_PER_LONG
] |= 1L << (k
% SCM_BITS_PER_LONG
);
/* Scheme `char-set-filter!'.  Validates PRED as a procedure and both
   CS and BASE_CS as charset smobs.  For every member of CS, PRED is
   called on the character and, when the answer is not false, that
   character's bit is set directly in BASE_CS's bitmap.
   NOTE(review): the return is on a line missing from this listing.  */
618 SCM_DEFINE (scm_char_set_filter_x
, "char-set-filter!", 3, 0, 0,
619 (SCM pred
, SCM cs
, SCM base_cs
),
620 "Return a character set containing every character from @var{cs}\n"
621 "so that it satisfies @var{pred}. The characters are added to\n"
622 "@var{base_cs} and @var{base_cs} is returned.")
623 #define FUNC_NAME s_scm_char_set_filter_x
628 SCM_VALIDATE_PROC (1, pred
);
629 SCM_VALIDATE_SMOB (2, cs
, charset
);
630 SCM_VALIDATE_SMOB (3, base_cs
, charset
);
631 p
= (long *) SCM_SMOB_DATA (base_cs
);
632 for (k
= 0; k
< SCM_CHARSET_SIZE
; k
++)
634 if (SCM_CHARSET_GET (cs
, k
))
636 SCM res
= scm_call_1 (pred
, SCM_MAKE_CHAR (k
));
638 if (!SCM_FALSEP (res
))
639 p
[k
/ SCM_BITS_PER_LONG
] |= 1L << (k
% SCM_BITS_PER_LONG
);
647 SCM_DEFINE (scm_ucs_range_to_char_set
, "ucs-range->char-set", 2, 2, 0,
648 (SCM lower
, SCM upper
, SCM error
, SCM base_cs
),
649 "Return a character set containing all characters whose\n"
650 "character codes lie in the half-open range\n"
651 "[@var{lower},@var{upper}).\n"
653 "If @var{error} is a true value, an error is signalled if the\n"
654 "specified range contains characters which are not contained in\n"
655 "the implemented character range. If @var{error} is @code{#f},\n"
656 "these characters are silently left out of the resultung\n"
659 "The characters in @var{base_cs} are added to the result, if\n"
661 #define FUNC_NAME s_scm_ucs_range_to_char_set
667 SCM_VALIDATE_INUM_COPY (1, lower
, clower
);
668 SCM_VALIDATE_INUM_COPY (2, upper
, cupper
);
669 SCM_ASSERT_RANGE (1, lower
, clower
>= 0);
670 SCM_ASSERT_RANGE (2, upper
, cupper
>= 0 && cupper
>= clower
);
671 if (!SCM_UNBNDP (error
))
673 if (!SCM_FALSEP (error
))
675 SCM_ASSERT_RANGE (1, lower
, clower
<= SCM_CHARSET_SIZE
);
676 SCM_ASSERT_RANGE (2, upper
, cupper
<= SCM_CHARSET_SIZE
);
679 if (clower
> SCM_CHARSET_SIZE
)
680 clower
= SCM_CHARSET_SIZE
;
681 if (cupper
> SCM_CHARSET_SIZE
)
682 cupper
= SCM_CHARSET_SIZE
;
683 if (SCM_UNBNDP (base_cs
))
684 cs
= make_char_set (FUNC_NAME
);
687 SCM_VALIDATE_SMOB (2, base_cs
, charset
);
688 cs
= scm_char_set_copy (base_cs
);
690 p
= (long *) SCM_SMOB_DATA (cs
);
691 while (clower
< cupper
)
693 p
[clower
/ SCM_BITS_PER_LONG
] |= 1L << (clower
% SCM_BITS_PER_LONG
);
701 SCM_DEFINE (scm_ucs_range_to_char_set_x
, "ucs-range->char-set!", 4, 0, 0,
702 (SCM lower
, SCM upper
, SCM error
, SCM base_cs
),
703 "Return a character set containing all characters whose\n"
704 "character codes lie in the half-open range\n"
705 "[@var{lower},@var{upper}).\n"
707 "If @var{error} is a true value, an error is signalled if the\n"
708 "specified range contains characters which are not contained in\n"
709 "the implemented character range. If @var{error} is @code{#f},\n"
710 "these characters are silently left out of the resultung\n"
713 "The characters are added to @var{base_cs} and @var{base_cs} is\n"
715 #define FUNC_NAME s_scm_ucs_range_to_char_set_x
720 SCM_VALIDATE_INUM_COPY (1, lower
, clower
);
721 SCM_VALIDATE_INUM_COPY (2, upper
, cupper
);
722 SCM_ASSERT_RANGE (1, lower
, clower
>= 0);
723 SCM_ASSERT_RANGE (2, upper
, cupper
>= 0 && cupper
>= clower
);
724 if (!SCM_FALSEP (error
))
726 SCM_ASSERT_RANGE (1, lower
, clower
<= SCM_CHARSET_SIZE
);
727 SCM_ASSERT_RANGE (2, upper
, cupper
<= SCM_CHARSET_SIZE
);
729 if (clower
> SCM_CHARSET_SIZE
)
730 clower
= SCM_CHARSET_SIZE
;
731 if (cupper
> SCM_CHARSET_SIZE
)
732 cupper
= SCM_CHARSET_SIZE
;
733 p
= (long *) SCM_SMOB_DATA (base_cs
);
734 while (clower
< cupper
)
736 p
[clower
/ SCM_BITS_PER_LONG
] |= 1L << (clower
% SCM_BITS_PER_LONG
);
/* Scheme `char-set-size'.  Validates CS as a charset smob, tests every
   index below SCM_CHARSET_SIZE for membership, and returns count as a
   fixnum.
   NOTE(review): the declaration of count and the statement that
   updates it for each member are on lines missing from this listing.  */
744 SCM_DEFINE (scm_char_set_size
, "char-set-size", 1, 0, 0,
746 "Return the number of elements in character set @var{cs}.")
747 #define FUNC_NAME s_scm_char_set_size
751 SCM_VALIDATE_SMOB (1, cs
, charset
);
752 for (k
= 0; k
< SCM_CHARSET_SIZE
; k
++)
753 if (SCM_CHARSET_GET (cs
, k
))
755 return SCM_MAKINUM (count
);
/* Scheme `char-set-count'.  Validates PRED as a procedure and CS as a
   charset smob, calls PRED on every member of CS, tests the answer
   for non-false, and returns count as a fixnum.
   NOTE(review): the docstring's "int the character set" should read
   "in the character set".  The declaration of count and the statement
   that updates it are on lines missing from this listing.  */
760 SCM_DEFINE (scm_char_set_count
, "char-set-count", 2, 0, 0,
762 "Return the number of the elements int the character set\n"
763 "@var{cs} which satisfy the predicate @var{pred}.")
764 #define FUNC_NAME s_scm_char_set_count
768 SCM_VALIDATE_PROC (1, pred
);
769 SCM_VALIDATE_SMOB (2, cs
, charset
);
771 for (k
= 0; k
< SCM_CHARSET_SIZE
; k
++)
772 if (SCM_CHARSET_GET (cs
, k
))
774 SCM res
= scm_call_1 (pred
, SCM_MAKE_CHAR (k
));
775 if (!SCM_FALSEP (res
))
778 return SCM_MAKINUM (count
);
/* Scheme `char-set->list'.  Validates CS as a charset smob and walks k
   from SCM_CHARSET_SIZE down to 1, consing the character with code
   k - 1 onto the front of result for each member.  Because the scan
   runs downward and conses at the front, the list comes out in
   ascending character-code order.
   NOTE(review): the end of the docstring and the return are on lines
   missing from this listing.  */
783 SCM_DEFINE (scm_char_set_to_list
, "char-set->list", 1, 0, 0,
785 "Return a list containing the elements of the character set\n"
787 #define FUNC_NAME s_scm_char_set_to_list
790 SCM result
= SCM_EOL
;
792 SCM_VALIDATE_SMOB (1, cs
, charset
);
793 for (k
= SCM_CHARSET_SIZE
; k
> 0; k
--)
794 if (SCM_CHARSET_GET (cs
, k
- 1))
795 result
= scm_cons (SCM_MAKE_CHAR (k
- 1), result
);
/* Scheme `char-set->string'.  Validates CS as a charset smob and makes
   two passes over all indices: one before allocating a string of
   count characters, one after obtaining the string's character buffer
   p.
   NOTE(review): both loop bodies are on lines missing from this
   listing; presumably the first counts the members and the second
   stores each member into p.  The return is missing as well.  */
801 SCM_DEFINE (scm_char_set_to_string
, "char-set->string", 1, 0, 0,
803 "Return a string containing the elements of the character set\n"
804 "@var{cs}. The order in which the characters are placed in the\n"
805 "string is not defined.")
806 #define FUNC_NAME s_scm_char_set_to_string
814 SCM_VALIDATE_SMOB (1, cs
, charset
);
815 for (k
= 0; k
< SCM_CHARSET_SIZE
; k
++)
816 if (SCM_CHARSET_GET (cs
, k
))
818 result
= scm_allocate_string (count
);
819 p
= SCM_STRING_CHARS (result
);
820 for (k
= 0; k
< SCM_CHARSET_SIZE
; k
++)
821 if (SCM_CHARSET_GET (cs
, k
))
/* Scheme `char-set-contains?'.  Validates CS as a charset smob and CH
   as a character, then returns the boolean of the membership test for
   CH's character code.  */
828 SCM_DEFINE (scm_char_set_contains_p
, "char-set-contains?", 2, 0, 0,
830 "Return @code{#t} iff the character @var{ch} is contained in the\n"
831 "character set @var{cs}.")
832 #define FUNC_NAME s_scm_char_set_contains_p
834 SCM_VALIDATE_SMOB (1, cs
, charset
);
835 SCM_VALIDATE_CHAR (2, ch
);
836 return SCM_BOOL (SCM_CHARSET_GET (cs
, SCM_CHAR (ch
)));
/* Scheme `char-set-every'.  Validates PRED as a procedure and CS as a
   charset smob.  res starts as SCM_BOOL_T and is overwritten with the
   answer of PRED for each member of CS in turn; each answer is tested
   for false.
   NOTE(review): the action taken on a false answer and the final
   return are on lines missing from this listing.  */
841 SCM_DEFINE (scm_char_set_every
, "char-set-every", 2, 0, 0,
843 "Return a true value if every character in the character set\n"
844 "@var{cs} satisfies the predicate @var{pred}.")
845 #define FUNC_NAME s_scm_char_set_every
848 SCM res
= SCM_BOOL_T
;
850 SCM_VALIDATE_PROC (1, pred
);
851 SCM_VALIDATE_SMOB (2, cs
, charset
);
853 for (k
= 0; k
< SCM_CHARSET_SIZE
; k
++)
854 if (SCM_CHARSET_GET (cs
, k
))
856 res
= scm_call_1 (pred
, SCM_MAKE_CHAR (k
));
857 if (SCM_FALSEP (res
))
/* Scheme `char-set-any'.  Validates PRED as a procedure and CS as a
   charset smob, calls PRED on each member of CS in ascending
   character-code order, and tests each answer for non-false.
   NOTE(review): the action taken on a true answer and the final
   return are on lines missing from this listing.  */
865 SCM_DEFINE (scm_char_set_any
, "char-set-any", 2, 0, 0,
867 "Return a true value if any character in the character set\n"
868 "@var{cs} satisfies the predicate @var{pred}.")
869 #define FUNC_NAME s_scm_char_set_any
873 SCM_VALIDATE_PROC (1, pred
);
874 SCM_VALIDATE_SMOB (2, cs
, charset
);
876 for (k
= 0; k
< SCM_CHARSET_SIZE
; k
++)
877 if (SCM_CHARSET_GET (cs
, k
))
879 SCM res
= scm_call_1 (pred
, SCM_MAKE_CHAR (k
));
880 if (!SCM_FALSEP (res
))
/* Scheme `char-set-adjoin'.  Validates CS as a charset smob, then
   rebinds cs to a copy so the caller's set is left untouched.  Each
   element of REST is validated as a character and its bit is set in
   the copy.
   NOTE(review): every character is validated with argument position
   1, which is the position of CS itself; the position reported for a
   bad character looks wrong.  The return is on a line missing from
   this listing.  */
888 SCM_DEFINE (scm_char_set_adjoin
, "char-set-adjoin", 1, 0, 1,
890 "Add all character arguments to the first argument, which must\n"
891 "be a character set.")
892 #define FUNC_NAME s_scm_char_set_adjoin
896 SCM_VALIDATE_SMOB (1, cs
, charset
);
897 SCM_VALIDATE_REST_ARGUMENT (rest
);
898 cs
= scm_char_set_copy (cs
);
900 p
= (long *) SCM_SMOB_DATA (cs
);
901 while (!SCM_NULLP (rest
))
903 SCM chr
= SCM_CAR (rest
);
906 SCM_VALIDATE_CHAR_COPY (1, chr
, c
);
907 rest
= SCM_CDR (rest
);
909 p
[c
/ SCM_BITS_PER_LONG
] |= 1L << (c
% SCM_BITS_PER_LONG
);
/* Scheme `char-set-delete'.  Validates CS as a charset smob, then
   rebinds cs to a copy so the caller's set is left untouched.  Each
   element of REST is validated as a character and its bit is cleared
   in the copy.
   NOTE(review): every character is validated with argument position
   1, which is the position of CS itself; the position reported for a
   bad character looks wrong.  The return is on a line missing from
   this listing.  */
916 SCM_DEFINE (scm_char_set_delete
, "char-set-delete", 1, 0, 1,
918 "Delete all character arguments from the first argument, which\n"
919 "must be a character set.")
920 #define FUNC_NAME s_scm_char_set_delete
924 SCM_VALIDATE_SMOB (1, cs
, charset
);
925 SCM_VALIDATE_REST_ARGUMENT (rest
);
926 cs
= scm_char_set_copy (cs
);
928 p
= (long *) SCM_SMOB_DATA (cs
);
929 while (!SCM_NULLP (rest
))
931 SCM chr
= SCM_CAR (rest
);
934 SCM_VALIDATE_CHAR_COPY (1, chr
, c
);
935 rest
= SCM_CDR (rest
);
937 p
[c
/ SCM_BITS_PER_LONG
] &= ~(1L << (c
% SCM_BITS_PER_LONG
));
/* Scheme `char-set-adjoin!'.  Validates CS as a charset smob and sets
   the bit of each character in REST directly in CS's bitmap; no copy
   is made.
   NOTE(review): every character is validated with argument position
   1, which is the position of CS itself; the position reported for a
   bad character looks wrong.  The return is on a line missing from
   this listing.  */
944 SCM_DEFINE (scm_char_set_adjoin_x
, "char-set-adjoin!", 1, 0, 1,
946 "Add all character arguments to the first argument, which must\n"
947 "be a character set.")
948 #define FUNC_NAME s_scm_char_set_adjoin_x
952 SCM_VALIDATE_SMOB (1, cs
, charset
);
953 SCM_VALIDATE_REST_ARGUMENT (rest
);
955 p
= (long *) SCM_SMOB_DATA (cs
);
956 while (!SCM_NULLP (rest
))
958 SCM chr
= SCM_CAR (rest
);
961 SCM_VALIDATE_CHAR_COPY (1, chr
, c
);
962 rest
= SCM_CDR (rest
);
964 p
[c
/ SCM_BITS_PER_LONG
] |= 1L << (c
% SCM_BITS_PER_LONG
);
/* Scheme `char-set-delete!'.  Validates CS as a charset smob and
   clears the bit of each character in REST directly in CS's bitmap;
   no copy is made.
   NOTE(review): every character is validated with argument position
   1, which is the position of CS itself; the position reported for a
   bad character looks wrong.  The return is on a line missing from
   this listing.  */
971 SCM_DEFINE (scm_char_set_delete_x
, "char-set-delete!", 1, 0, 1,
973 "Delete all character arguments from the first argument, which\n"
974 "must be a character set.")
975 #define FUNC_NAME s_scm_char_set_delete_x
979 SCM_VALIDATE_SMOB (1, cs
, charset
);
980 SCM_VALIDATE_REST_ARGUMENT (rest
);
982 p
= (long *) SCM_SMOB_DATA (cs
);
983 while (!SCM_NULLP (rest
))
985 SCM chr
= SCM_CAR (rest
);
988 SCM_VALIDATE_CHAR_COPY (1, chr
, c
);
989 rest
= SCM_CDR (rest
);
991 p
[c
/ SCM_BITS_PER_LONG
] &= ~(1L << (c
% SCM_BITS_PER_LONG
));
/* Scheme `char-set-complement'.  Validates CS as a charset smob,
   creates a fresh set, and takes the bitmap pointers of the new set
   (p) and of CS (q) before looping over LONGS_PER_CHARSET words.
   NOTE(review): the loop body (presumably storing the bitwise
   complement of each word of q into p) and the return are on lines
   missing from this listing.  */
998 SCM_DEFINE (scm_char_set_complement
, "char-set-complement", 1, 0, 0,
1000 "Return the complement of the character set @var{cs}.")
1001 #define FUNC_NAME s_scm_char_set_complement
1007 SCM_VALIDATE_SMOB (1, cs
, charset
);
1009 res
= make_char_set (FUNC_NAME
);
1010 p
= (long *) SCM_SMOB_DATA (res
);
1011 q
= (long *) SCM_SMOB_DATA (cs
);
1012 for (k
= 0; k
< LONGS_PER_CHARSET
; k
++)
/* Scheme `char-set-union', taking only rest arguments.  Starts from a
   fresh empty set and, for each element of REST (validated as a
   charset smob at position c), ORs that set's bitmap words into the
   result.  With no arguments the result is therefore the empty set.
   NOTE(review): the update of c and the return are on lines missing
   from this listing.  */
1019 SCM_DEFINE (scm_char_set_union
, "char-set-union", 0, 0, 1,
1021 "Return the union of all argument character sets.")
1022 #define FUNC_NAME s_scm_char_set_union
1028 SCM_VALIDATE_REST_ARGUMENT (rest
);
1030 res
= make_char_set (FUNC_NAME
);
1031 p
= (long *) SCM_SMOB_DATA (res
);
1032 while (!SCM_NULLP (rest
))
1035 SCM cs
= SCM_CAR (rest
);
1036 SCM_VALIDATE_SMOB (c
, cs
, charset
);
1038 rest
= SCM_CDR (rest
);
1040 for (k
= 0; k
< LONGS_PER_CHARSET
; k
++)
1041 p
[k
] |= ((long *) SCM_SMOB_DATA (cs
))[k
];
/* Scheme `char-set-intersection', taking only rest arguments.  With no
   arguments the result is a fresh empty set.  Otherwise the result
   starts as a copy of the first argument and each remaining argument
   is validated as a charset smob (position argnum) and combined with
   it word by word.
   NOTE(review): SRFI-14 appears to specify the full character set for
   the zero-argument case, not the empty set; confirm against the
   specification.  The word-loop body (presumably an AND with cs_data)
   and the return are on lines missing from this listing.  */
1048 SCM_DEFINE (scm_char_set_intersection
, "char-set-intersection", 0, 0, 1,
1050 "Return the intersection of all argument character sets.")
1051 #define FUNC_NAME s_scm_char_set_intersection
1055 SCM_VALIDATE_REST_ARGUMENT (rest
);
1057 if (SCM_NULLP (rest
))
1058 res
= make_char_set (FUNC_NAME
);
1064 res
= scm_char_set_copy (SCM_CAR (rest
));
1065 p
= (long *) SCM_SMOB_DATA (res
);
1066 rest
= SCM_CDR (rest
);
1068 while (SCM_CONSP (rest
))
1071 SCM cs
= SCM_CAR (rest
);
1074 SCM_VALIDATE_SMOB (argnum
, cs
, charset
);
1076 cs_data
= (long *) SCM_SMOB_DATA (cs
);
1077 rest
= SCM_CDR (rest
);
1078 for (k
= 0; k
< LONGS_PER_CHARSET
; k
++)
/* Scheme `char-set-difference'.  Validates CS1 as a charset smob and
   copies it; then, for each element of REST (validated as a charset
   smob at position c), clears from the copy every bit that is set in
   that element.  CS1 itself is not modified.
   NOTE(review): the update of c and the return are on lines missing
   from this listing.  */
1088 SCM_DEFINE (scm_char_set_difference
, "char-set-difference", 1, 0, 1,
1089 (SCM cs1
, SCM rest
),
1090 "Return the difference of all argument character sets.")
1091 #define FUNC_NAME s_scm_char_set_difference
1097 SCM_VALIDATE_SMOB (1, cs1
, charset
);
1098 SCM_VALIDATE_REST_ARGUMENT (rest
);
1100 res
= scm_char_set_copy (cs1
);
1101 p
= (long *) SCM_SMOB_DATA (res
);
1102 while (!SCM_NULLP (rest
))
1105 SCM cs
= SCM_CAR (rest
);
1106 SCM_VALIDATE_SMOB (c
, cs
, charset
);
1108 rest
= SCM_CDR (rest
);
1110 for (k
= 0; k
< LONGS_PER_CHARSET
; k
++)
1111 p
[k
] &= ~((long *) SCM_SMOB_DATA (cs
))[k
];
/* Scheme `char-set-xor', taking only rest arguments.  With no
   arguments the result is a fresh empty set.  Otherwise the result
   starts as a copy of the first argument and each remaining argument
   is validated as a charset smob (position argnum) and combined with
   it word by word.
   NOTE(review): the word-loop body (presumably an exclusive-or with
   cs_data) and the return are on lines missing from this listing.  */
1118 SCM_DEFINE (scm_char_set_xor
, "char-set-xor", 0, 0, 1,
1120 "Return the exclusive-or of all argument character sets.")
1121 #define FUNC_NAME s_scm_char_set_xor
1125 SCM_VALIDATE_REST_ARGUMENT (rest
);
1127 if (SCM_NULLP (rest
))
1128 res
= make_char_set (FUNC_NAME
);
1134 res
= scm_char_set_copy (SCM_CAR (rest
));
1135 p
= (long *) SCM_SMOB_DATA (res
);
1136 rest
= SCM_CDR (rest
);
1138 while (SCM_CONSP (rest
))
1140 SCM cs
= SCM_CAR (rest
);
1144 SCM_VALIDATE_SMOB (argnum
, cs
, charset
);
1146 cs_data
= (long *) SCM_SMOB_DATA (cs
);
1147 rest
= SCM_CDR (rest
);
1149 for (k
= 0; k
< LONGS_PER_CHARSET
; k
++)
/* Scheme `char-set-diff+intersection'.  Validates CS1 as a charset
   smob.  res1 starts as a copy of CS1 (bitmap p) and res2 as a fresh
   empty set (bitmap q).  For each element of REST (validated as a
   charset smob at position c, bitmap r), the bits common to p and r
   are ORed into q.  The two sets are returned as multiple values,
   res1 first.
   NOTE(review): the statement that removes r's bits from p
   (presumably following the visible one in the word loop), the update
   of c, and the end of the docstring are on lines missing from this
   listing.  */
1158 SCM_DEFINE (scm_char_set_diff_plus_intersection
, "char-set-diff+intersection", 1, 0, 1,
1159 (SCM cs1
, SCM rest
),
1160 "Return the difference and the intersection of all argument\n"
1162 #define FUNC_NAME s_scm_char_set_diff_plus_intersection
1168 SCM_VALIDATE_SMOB (1, cs1
, charset
);
1169 SCM_VALIDATE_REST_ARGUMENT (rest
);
1171 res1
= scm_char_set_copy (cs1
);
1172 res2
= make_char_set (FUNC_NAME
);
1173 p
= (long *) SCM_SMOB_DATA (res1
);
1174 q
= (long *) SCM_SMOB_DATA (res2
);
1175 while (!SCM_NULLP (rest
))
1178 SCM cs
= SCM_CAR (rest
);
1181 SCM_VALIDATE_SMOB (c
, cs
, charset
);
1183 r
= (long *) SCM_SMOB_DATA (cs
);
1185 for (k
= 0; k
< LONGS_PER_CHARSET
; k
++)
1187 q
[k
] |= p
[k
] & r
[k
];
1190 rest
= SCM_CDR (rest
);
1192 return scm_values (scm_list_2 (res1
, res2
));
/* Scheme `char-set-complement!'.  Validates CS as a charset smob and
   takes its bitmap pointer before looping over LONGS_PER_CHARSET
   words.
   NOTE(review): the loop body (presumably inverting each word in
   place) and the return are on lines missing from this listing.  */
1197 SCM_DEFINE (scm_char_set_complement_x
, "char-set-complement!", 1, 0, 0,
1199 "Return the complement of the character set @var{cs}.")
1200 #define FUNC_NAME s_scm_char_set_complement_x
1205 SCM_VALIDATE_SMOB (1, cs
, charset
);
1206 p
= (long *) SCM_SMOB_DATA (cs
);
1207 for (k
= 0; k
< LONGS_PER_CHARSET
; k
++)
/* Scheme `char-set-union!'.  Validates CS1 as a charset smob and, for
   each element of REST (validated as a charset smob at position c),
   ORs that set's bitmap words directly into CS1's bitmap.
   NOTE(review): the update of c and the return are on lines missing
   from this listing.  */
1214 SCM_DEFINE (scm_char_set_union_x
, "char-set-union!", 1, 0, 1,
1215 (SCM cs1
, SCM rest
),
1216 "Return the union of all argument character sets.")
1217 #define FUNC_NAME s_scm_char_set_union_x
1222 SCM_VALIDATE_SMOB (1, cs1
, charset
);
1223 SCM_VALIDATE_REST_ARGUMENT (rest
);
1225 p
= (long *) SCM_SMOB_DATA (cs1
);
1226 while (!SCM_NULLP (rest
))
1229 SCM cs
= SCM_CAR (rest
);
1230 SCM_VALIDATE_SMOB (c
, cs
, charset
);
1232 rest
= SCM_CDR (rest
);
1234 for (k
= 0; k
< LONGS_PER_CHARSET
; k
++)
1235 p
[k
] |= ((long *) SCM_SMOB_DATA (cs
))[k
];
/* Scheme `char-set-intersection!'.  Validates CS1 as a charset smob
   and, for each element of REST (validated as a charset smob at
   position c), ANDs that set's bitmap words directly into CS1's
   bitmap.
   NOTE(review): the update of c and the return are on lines missing
   from this listing.  */
1242 SCM_DEFINE (scm_char_set_intersection_x
, "char-set-intersection!", 1, 0, 1,
1243 (SCM cs1
, SCM rest
),
1244 "Return the intersection of all argument character sets.")
1245 #define FUNC_NAME s_scm_char_set_intersection_x
1250 SCM_VALIDATE_SMOB (1, cs1
, charset
);
1251 SCM_VALIDATE_REST_ARGUMENT (rest
);
1253 p
= (long *) SCM_SMOB_DATA (cs1
);
1254 while (!SCM_NULLP (rest
))
1257 SCM cs
= SCM_CAR (rest
);
1258 SCM_VALIDATE_SMOB (c
, cs
, charset
);
1260 rest
= SCM_CDR (rest
);
1262 for (k
= 0; k
< LONGS_PER_CHARSET
; k
++)
1263 p
[k
] &= ((long *) SCM_SMOB_DATA (cs
))[k
];
/* Scheme `char-set-difference!'.  Validates CS1 as a charset smob and,
   for each element of REST (validated as a charset smob at position
   c), clears from CS1's bitmap every bit that is set in that element.
   NOTE(review): the update of c and the return are on lines missing
   from this listing.  */
1270 SCM_DEFINE (scm_char_set_difference_x
, "char-set-difference!", 1, 0, 1,
1271 (SCM cs1
, SCM rest
),
1272 "Return the difference of all argument character sets.")
1273 #define FUNC_NAME s_scm_char_set_difference_x
1278 SCM_VALIDATE_SMOB (1, cs1
, charset
);
1279 SCM_VALIDATE_REST_ARGUMENT (rest
);
1281 p
= (long *) SCM_SMOB_DATA (cs1
);
1282 while (!SCM_NULLP (rest
))
1285 SCM cs
= SCM_CAR (rest
);
1286 SCM_VALIDATE_SMOB (c
, cs
, charset
);
1288 rest
= SCM_CDR (rest
);
1290 for (k
= 0; k
< LONGS_PER_CHARSET
; k
++)
1291 p
[k
] ^= ((long *) SCM_SMOB_DATA (cs
))[k
];
/* Scheme `char-set-xor!'.  Two implementations are visible.  The first
   conses CS1 onto REST and returns the result of the non-destructive
   scm_char_set_xor, so that (char-set-xor! a a a) agrees with
   (char-set-xor a a a).  The second validates CS1 and each element of
   REST as charset smobs and XORs each element's words into CS1's
   bitmap in place; the in-source remark says it would yield the empty
   set for (char-set-xor! a a a).
   NOTE(review): the preprocessor lines that choose between the two,
   and the terminator of the first in-source comment, are missing from
   this listing; presumably only the first implementation is
   compiled.  */
1298 SCM_DEFINE (scm_char_set_xor_x
, "char-set-xor!", 1, 0, 1,
1299 (SCM cs1
, SCM rest
),
1300 "Return the exclusive-or of all argument character sets.")
1301 #define FUNC_NAME s_scm_char_set_xor_x
1303 /* a side-effecting variant should presumably give consistent results:
1304 (define a (char-set #\a))
1305 (char-set-xor a a a) -> char set #\a
1306 (char-set-xor! a a a) -> char set #\a
1308 return scm_char_set_xor (scm_cons (cs1
, rest
));
1311 /* this would give (char-set-xor! a a a) -> empty char set. */
1315 SCM_VALIDATE_SMOB (1, cs1
, charset
);
1316 SCM_VALIDATE_REST_ARGUMENT (rest
);
1318 p
= (long *) SCM_SMOB_DATA (cs1
);
1319 while (!SCM_NULLP (rest
))
1322 SCM cs
= SCM_CAR (rest
);
1323 SCM_VALIDATE_SMOB (c
, cs
, charset
);
1325 rest
= SCM_CDR (rest
);
1327 for (k
= 0; k
< LONGS_PER_CHARSET
; k
++)
1328 p
[k
] ^= ((long *) SCM_SMOB_DATA (cs
))[k
];
/* Scheme `char-set-diff+intersection!'.  Validates CS1 and CS2 as
   charset smobs and takes their bitmaps as p and q.  One visible path
   returns the pair of values (fresh empty set, CS1); per the
   in-source remark this handles the two sets sharing storage.  The
   general path runs a word loop over p and q, then for each element
   of REST (validated as a charset smob at position c, bitmap r) ORs
   the bits common to p and r into q, and finally returns CS1 and CS2
   as multiple values.
   NOTE(review): the condition guarding the early return, the body of
   the first word loop, the statement that removes r's bits from p,
   the update of c, and the end of the docstring and of the in-source
   comment are on lines missing from this listing.  */
1336 SCM_DEFINE (scm_char_set_diff_plus_intersection_x
, "char-set-diff+intersection!", 2, 0, 1,
1337 (SCM cs1
, SCM cs2
, SCM rest
),
1338 "Return the difference and the intersection of all argument\n"
1340 #define FUNC_NAME s_scm_char_set_diff_plus_intersection_x
1346 SCM_VALIDATE_SMOB (1, cs1
, charset
);
1347 SCM_VALIDATE_SMOB (2, cs2
, charset
);
1348 SCM_VALIDATE_REST_ARGUMENT (rest
);
1350 p
= (long *) SCM_SMOB_DATA (cs1
);
1351 q
= (long *) SCM_SMOB_DATA (cs2
);
1354 /* (char-set-diff+intersection! a a ...): can't share storage,
1355 but we know the answer without checking for further
1357 return scm_values (scm_list_2 (make_char_set (FUNC_NAME
), cs1
));
1359 for (k
= 0; k
< LONGS_PER_CHARSET
; k
++)
1366 while (!SCM_NULLP (rest
))
1368 SCM cs
= SCM_CAR (rest
);
1371 SCM_VALIDATE_SMOB (c
, cs
, charset
);
1373 r
= (long *) SCM_SMOB_DATA (cs
);
1375 for (k
= 0; k
< LONGS_PER_CHARSET
; k
++)
1377 q
[k
] |= p
[k
] & r
[k
];
1380 rest
= SCM_CDR (rest
);
1382 return scm_values (scm_list_2 (cs1
, cs2
));
1387 /* Create the charset smob type. */
/* Registers a smob type named "character-set", stores its type code in
   scm_tc16_charset, and installs charset_free and charset_print as the
   free and print hooks.
   NOTE(review): the test and update of the static `initialized' flag,
   and the remaining arguments of scm_make_smob_type, are on lines
   missing from this listing.  */
1389 scm_c_init_srfi_14 (void)
1391 /* Charset smob creation is protected by this variable because this
1392 function can be both called from the SRFI-13 and SRFI-14
1393 initialization functions. This is because the SRFI-13 procedures
1394 access the charset smob type code. */
1395 static int initialized
= 0;
1399 scm_tc16_charset
= scm_make_smob_type ("character-set",
1401 scm_set_smob_free (scm_tc16_charset
, charset_free
);
1402 scm_set_smob_print (scm_tc16_charset
, charset_print
);
1408 /* Initialize the SRFI-14 module. This function will be called by the
1409 loading Scheme module. */
/* Runs the smob type initialisation through scm_c_init_srfi_14 and
   then pulls in "srfi/srfi-14.x" to install the primitives.
   NOTE(review): the three fprintf calls print the charset size
   constants to stderr; they are presumably wrapped in a disabled
   preprocessor block whose lines are missing from this listing.  */
1411 scm_init_srfi_14 (void)
1414 fprintf(stderr
, "bytes-per-charset: %d\n", BYTES_PER_CHARSET
);
1415 fprintf(stderr
, "bits-per-long: %d\n", SCM_BITS_PER_LONG
);
1416 fprintf(stderr
, "longs-per-charset: %d\n", LONGS_PER_CHARSET
);
1420 /* Do the smob type initialization. */
1421 scm_c_init_srfi_14 ();
1423 /* Install the charset primitives. */
1424 #include "srfi/srfi-14.x"
1427 /* End of srfi-14.c. */