Optimize 'string-hash'.
[bpt/guile.git] / libguile / tags.h
1 /* classes: h_files */
2
3 #ifndef SCM_TAGS_H
4 #define SCM_TAGS_H
5
6 /* Copyright (C) 1995,1996,1997,1998,1999,2000,2001,2002,2003,2004,2008,2009,2010,2012
7 * Free Software Foundation, Inc.
8 *
9 * This library is free software; you can redistribute it and/or
10 * modify it under the terms of the GNU Lesser General Public License
11 * as published by the Free Software Foundation; either version 3 of
12 * the License, or (at your option) any later version.
13 *
14 * This library is distributed in the hope that it will be useful, but
15 * WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
17 * Lesser General Public License for more details.
18 *
19 * You should have received a copy of the GNU Lesser General Public
20 * License along with this library; if not, write to the Free Software
21 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
22 * 02110-1301 USA
23 */
24
25 \f
26
27 /** This file defines the format of SCM values and cons pairs.
28 ** It is here that tag bits are assigned for various purposes.
29 **/
30
31 /* picks up scmconfig.h too */
32 #include "libguile/__scm.h"
33
34 \f
35
36 /* In the beginning was the Word:
37 *
38 * For the representation of scheme objects and their handling, Guile provides
39 * two types: scm_t_bits and SCM.
40 *
41 * - scm_t_bits values can hold bit patterns of non-objects and objects:
42 *
43 * Non-objects -- in this case the value may not be changed into a SCM value
44 * in any way.
45 *
46 * Objects -- in this case the value may be changed into a SCM value using
47 * the SCM_PACK macro.
48 *
49 * - SCM values can hold proper scheme objects only. They can be changed into
50 * a scm_t_bits value using the SCM_UNPACK macro.
51 *
52 * When working in the domain of scm_t_bits values, programmers must keep
53 * track of any scm_t_bits value they create that is not a proper scheme
54 * object. This makes sure that in the domain of SCM values developers can
55 * rely on the fact that they are dealing with proper scheme objects only.
56 * Thus, the distinction between scm_t_bits and SCM values helps to identify
57 * those parts of the code where special care has to be taken not to create
58 * bad SCM values.
59 */
60
61 /* For dealing with the bit level representation of scheme objects we define
62 * scm_t_bits:
63 */
64
65 typedef scm_t_intptr scm_t_signed_bits;
66 typedef scm_t_uintptr scm_t_bits;
67
68 #define SCM_T_SIGNED_BITS_MAX SCM_T_INTPTR_MAX
69 #define SCM_T_SIGNED_BITS_MIN SCM_T_INTPTR_MIN
70 #define SCM_T_BITS_MAX SCM_T_UINTPTR_MAX
71
72
73 /* But as external interface, we define SCM, which may, according to the
74 * desired level of type checking, be defined in several ways:
75 */
76 #if (SCM_DEBUG_TYPING_STRICTNESS == 2)
77 typedef union SCM { struct { scm_t_bits n; } n; } SCM;
78 # define SCM_UNPACK(x) ((x).n.n)
79 # define SCM_PACK(x) ((SCM) { { (scm_t_bits) (x) } })
80 #elif (SCM_DEBUG_TYPING_STRICTNESS == 1)
81 /* This is the default, which provides an intermediate level of compile time
82 * type checking while still resulting in very efficient code.
83 */
84 typedef struct scm_unused_struct { char scm_unused_field; } *SCM;
85
86 /*
87 The 0?: constructions makes sure that the code is never executed,
88 and that there is no performance hit. However, the alternative is
89 compiled, and does generate a warning when used with the wrong
90 pointer type. We use a volatile pointer type to avoid warnings
91 from clang.
92
93 The Tru64 and ia64-hp-hpux11.23 compilers fail on `case (0?0=0:x)'
94 statements, so for them type-checking is disabled. */
95 #if defined __DECC || defined __HP_cc
96 # define SCM_UNPACK(x) ((scm_t_bits) (x))
97 #else
98 # define SCM_UNPACK(x) ((scm_t_bits) (0? (*(volatile SCM *)0=(x)): x))
99 #endif
100
101 /*
102 There is no typechecking on SCM_PACK, since all kinds of types
103 (unsigned long, void*) go in SCM_PACK
104 */
105 # define SCM_PACK(x) ((SCM) (x))
106
107 #else
108 /* This should be used as a fall back solution for machines on which casting
109 * to a pointer may lead to loss of bit information, e. g. in the three least
110 * significant bits.
111 */
112 typedef scm_t_bits SCM;
113 # define SCM_UNPACK(x) (x)
114 # define SCM_PACK(x) ((SCM) (x))
115 #endif
116
117
118 /* SCM values can not be compared by using the operator ==. Use the following
119 * macro instead, which is the equivalent of the scheme predicate 'eq?'.
120 */
121 #define scm_is_eq(x, y) (SCM_UNPACK (x) == SCM_UNPACK (y))
122
123 \f
124
125 /* Representation of scheme objects:
126 *
127 * Guile's type system is designed to work on systems where scm_t_bits and SCM
128 * variables consist of at least 32 bits. The objects that a SCM variable can
129 * represent belong to one of the following two major categories:
130 *
131 * - Immediates -- meaning that the SCM variable contains an entire Scheme
132 * object. That means, all the object's data (including the type tagging
133 * information that is required to identify the object's type) must fit into
134 * 32 bits.
135 *
136 * - Non-immediates -- meaning that the SCM variable holds a pointer into the
137 * heap of cells (see below). On systems where a pointer needs more than 32
138 * bits this means that scm_t_bits and SCM variables need to be large enough
139 * to hold such pointers. In contrast to immediates, the object's data of
140 * a non-immediate can consume arbitrary amounts of memory: The heap cell
141 * being pointed to consists of at least two scm_t_bits variables and thus
142 * can be used to hold pointers to malloc'ed memory of any size.
143 *
144 * The 'heap' is the memory area that is under control of Guile's garbage
145 * collector. It holds 'single-cells' or 'double-cells', which consist of
146 * either two or four scm_t_bits variables, respectively. It is guaranteed
147 * that the address of a cell on the heap is 8-byte aligned. That is, since
148 * non-immediates hold a cell address, the three least significant bits of a
149 * non-immediate can be used to store additional information. The bits are
150 * used to store information about the object's type and thus are called
151 * tc3-bits, where tc stands for type-code.
152 *
153 * For a given SCM value, the distinction whether it holds an immediate or
154 * non-immediate object is based on the tc3-bits (see above) of its scm_t_bits
155 * equivalent: If the tc3-bits equal #b000, then the SCM value holds a
156 * non-immediate, and the scm_t_bits variable's value is just the pointer to
157 * the heap cell.
158 *
159 * Summarized, the data of a scheme object that is represented by a SCM
160 * variable consists of a) the SCM variable itself, b) in case of
161 * non-immediates the data of the single-cell or double-cell the SCM object
162 * points to, c) in case of non-immediates potentially additional data outside
163 * of the heap (like for example malloc'ed data), and d) in case of
164 * non-immediates potentially additional data inside of the heap, since data
165 * stored in b) and c) may hold references to other cells.
166 *
167 *
168 * Immediates
169 *
170 * Operations on immediate objects can typically be processed faster than on
171 * non-immediates. The reason is that the object's data can be extracted
172 * directly from the SCM variable (or rather a corresponding scm_t_bits
173 * variable), instead of having to perform additional memory accesses to
174 * obtain the object's data from the heap. In order to get the best possible
175 * performance frequently used data types should be realized as immediates.
176 * This is, as has been mentioned above, only possible if the objects can be
177 * represented with 32 bits (including type tagging).
178 *
179 * In Guile, the following data types and special objects are realized as
180 * immediates: booleans, characters, small integers (see below), the empty
181 * list, the end of file object, the 'unspecified' object (which is delivered
182 * as a return value by functions for which the return value is unspecified),
183 * a 'nil' object used in the elisp-compatibility mode and certain other
184 * 'special' objects which are only used internally in Guile.
185 *
186 * Integers in Guile can be arbitrarily large. On the other hand, integers
187 * are one of the most frequently used data types. Especially integers with
188 * less than 32 bits are commonly used. Thus, internally and transparently
189 * for application code guile distinguishes between small and large integers.
190 * Whether an integer is a large or a small integer depends on the number of
191 * bits needed to represent its value. Small integers are those which can be
192 * represented as immediates. Since they don't require more than a fixed
193 * number of bits for their representation, they are also known as 'fixnums'.
194 *
195 * The tc3-combinations #b010 and #b110 are used to represent small integers,
196 * which allows to use the most significant bit of the tc3-bits to be part of
197 * the integer value being represented. This means that all integers with up
198 * to 30 bits (including one bit for the sign) can be represented as
199 * immediates. On systems where SCM and scm_t_bits variables hold more than
200 * 32 bits, the amount of bits usable for small integers will even be larger.
201 * The tc3-code #b100 is shared among booleans, characters and the other
202 * special objects listed above.
203 *
204 *
205 * Non-Immediates
206 *
207 * All object types not mentioned above in the list of immedate objects are
208 * represented as non-immediates. Whether a non-immediate scheme object is
209 * represented by a single-cell or a double-cell depends on the object's type,
210 * namely on the set of attributes that have to be stored with objects of that
211 * type. Every non-immediate type is allowed to define its own layout and
212 * interpretation of the data stored in its cell (with some restrictions, see
213 * below).
214 *
215 * One of the design goals of guile's type system is to make it possible to
216 * store a scheme pair with as little memory usage as possible. The minimum
217 * amount of memory that is required to store two scheme objects (car and cdr
218 * of a pair) is the amount of memory required by two scm_t_bits or SCM
219 * variables. Therefore pairs in guile are stored in single-cells.
220 *
221 * Another design goal for the type system is to store procedure objects
222 * created by lambda expresssions (closures) and class instances (goops
223 * objects) with as little memory usage as possible. Closures are represented
224 * by a reference to the function code and a reference to the closure's
225 * environment. Class instances are represented by a reference to the
226 * instance's class definition and a reference to the instance's data. Thus,
227 * closures as well as class instances also can be stored in single-cells.
228 *
229 * Certain other non-immediate types also store their data in single-cells.
230 * By design decision, the heap is split into areas for single-cells and
231 * double-cells, but not into areas for single-cells-holding-pairs and areas
232 * for single-cells-holding-non-pairs. Any single-cell on the heap therefore
233 * can hold pairs (consisting of two scm_t_bits variables representing two
234 * scheme objects - the car and cdr of the pair) and non-pairs (consisting of
235 * two scm_t_bits variables that hold bit patterns as defined by the layout of
236 * the corresponding object's type).
237 *
238 *
239 * Garbage collection
240 *
241 * During garbage collection, unreachable cells on the heap will be freed.
242 * That is, the garbage collector will detect cells which have no SCM variable
243 * pointing towards them. In order to properly release all memory belonging
244 * to the object to which a cell belongs, the gc needs to be able to interpret
245 * the cell contents in the correct way. That means that the gc needs to be
246 * able to determine the object type associated with a cell only from the cell
247 * itself.
248 *
249 * Consequently, if the gc detects an unreachable single-cell, those two
250 * scm_t_bits variables must provide enough information to determine whether
251 * they belong to a pair (i. e. both scm_t_bits variables represent valid
252 * scheme objects), to a closure, a class instance or if they belong to any
253 * other non-immediate. Guile's type system is designed to make it possible
254 * to determine a the type to which a cell belongs in the majority of cases
255 * from the cell's first scm_t_bits variable. (Given a SCM variable X holding
256 * a non-immediate object, the macro SCM_CELL_TYPE(X) will deliver the
257 * corresponding cell's first scm_t_bits variable.)
258 *
259 * If the cell holds a scheme pair, then we already know that the first
260 * scm_t_bits variable of the cell will hold a scheme object with one of the
261 * following tc3-codes: #b000 (non-immediate), #b010 (small integer), #b110
262 * (small integer), #b100 (non-integer immediate). All these tc3-codes have
263 * in common, that their least significant bit is #b0. This fact is used by
264 * the garbage collector to identify cells that hold pairs. The remaining
265 * tc3-codes are assigned as follows: #b001 (class instance or, more
266 * precisely, a struct, of which a class instance is a special case), #b011
267 * (closure), #b101/#b111 (all remaining non-immediate types).
268 *
269 *
270 * Summary of type codes of scheme objects (SCM variables)
271 *
272 * Here is a summary of tagging bits as they might occur in a scheme object.
273 * The notation is as follows: tc stands for type code as before, tc<n> with n
274 * being a number indicates a type code formed by the n least significant bits
275 * of the SCM variables corresponding scm_t_bits value.
276 *
277 * Note that (as has been explained above) tc1==1 can only occur in the first
278 * scm_t_bits variable of a cell belonging to a non-immediate object that is
279 * not a pair. For an explanation of the tc tags with tc1==1, see the next
280 * section with the summary of the type codes on the heap.
281 *
282 * tc1:
283 * 0: For scheme objects, tc1==0 must be fulfilled.
284 * (1: This can never be the case for a scheme object.)
285 *
286 * tc2:
287 * 00: Either a non-immediate or some non-integer immediate
288 * (01: This can never be the case for a scheme object.)
289 * 10: Small integer
290 * (11: This can never be the case for a scheme object.)
291 *
292 * tc3:
293 * 000: a non-immediate object (pair, closure, class instance etc.)
294 * (001: This can never be the case for a scheme object.)
295 * 010: an even small integer (least significant bit is 0).
296 * (011: This can never be the case for a scheme object.)
297 * 100: Non-integer immediate
298 * (101: This can never be the case for a scheme object.)
299 * 110: an odd small integer (least significant bit is 1).
300 * (111: This can never be the case for a scheme object.)
301 *
302 * The remaining bits of the non-immediate objects form the pointer to the
303 * heap cell. The remaining bits of the small integers form the integer's
304 * value and sign. Thus, the only scheme objects for which a further
305 * subdivision is of interest are the ones with tc3==100.
306 *
307 * tc8 (for objects with tc3==100):
308 * 00000-100: special objects ('flags')
309 * 00001-100: characters
310 * 00010-100: unused
311 * 00011-100: unused
312 *
313 *
314 * Summary of type codes on the heap
315 *
316 * Here is a summary of tagging in scm_t_bits values as they might occur in
317 * the first scm_t_bits variable of a heap cell.
318 *
319 * tc1:
320 * 0: the cell belongs to a pair.
321 * 1: the cell belongs to a non-pair.
322 *
323 * tc2:
324 * 00: the cell belongs to a pair with no short integer in its car.
325 * 01: the cell belongs to a non-pair (struct or some other non-immediate).
326 * 10: the cell belongs to a pair with a short integer in its car.
327 * 11: the cell belongs to a non-pair (closure or some other non-immediate).
328 *
329 * tc3:
330 * 000: the cell belongs to a pair with a non-immediate in its car.
331 * 001: the cell belongs to a struct
332 * 010: the cell belongs to a pair with an even short integer in its car.
333 * 011: the cell belongs to a closure
334 * 100: the cell belongs to a pair with a non-integer immediate in its car.
335 * 101: the cell belongs to some other non-immediate.
336 * 110: the cell belongs to a pair with an odd short integer in its car.
337 * 111: the cell belongs to some other non-immediate.
338 *
339 * tc7 (for tc3==1x1):
340 * See below for the list of types. Note the special case of scm_tc7_vector
341 * and scm_tc7_wvect: vectors and weak vectors are treated the same in many
342 * cases. Thus, their tc7-codes are chosen to only differ in one bit. This
343 * makes it possible to check an object at the same time for being a vector
344 * or a weak vector by comparing its tc7 code with that bit masked (using
345 * the TYP7S macro). Three more special tc7-codes are of interest:
346 * numbers, ports and smobs in fact each represent collections of types,
347 * which are subdivided using tc16-codes.
348 *
349 * tc16 (for tc7==scm_tc7_smob):
350 * The largest part of the space of smob types is not subdivided in a
351 * predefined way, since smobs can be added arbitrarily by user C code.
352 */
353
354 \f
355
356 /* Checking if a SCM variable holds an immediate or a non-immediate object:
357 * This check can either be performed by checking for tc3==000 or tc3==00x,
358 * since for a SCM variable it is known that tc1==0. */
359 #define SCM_IMP(x) (6 & SCM_UNPACK (x))
360 #define SCM_NIMP(x) (!SCM_IMP (x))
361
362 /* Checking if a SCM variable holds an immediate integer: See numbers.h for
363 * the definition of the following macros: SCM_I_FIXNUM_BIT,
364 * SCM_MOST_POSITIVE_FIXNUM, SCM_I_INUMP, SCM_I_MAKINUM, SCM_I_INUM. */
365
366 /* Checking if a SCM variable holds a pair (for historical reasons, in Guile
367 * also known as a cons-cell): This is done by first checking that the SCM
368 * variable holds a non-immediate, and second, by checking that tc1==0 holds
369 * for the SCM_CELL_TYPE of the SCM variable.
370 */
371
372 #define SCM_I_CONSP(x) (!SCM_IMP (x) && ((1 & SCM_CELL_TYPE (x)) == 0))
373
374 \f
375
376 /* Definitions for tc2: */
377
378 #define scm_tc2_int 2
379
380
381 /* Definitions for tc3: */
382
383 #define SCM_ITAG3(x) (7 & SCM_UNPACK (x))
384 #define SCM_TYP3(x) (7 & SCM_CELL_TYPE (x))
385
386 #define scm_tc3_cons 0
387 #define scm_tc3_struct 1
388 #define scm_tc3_int_1 (scm_tc2_int + 0)
389 #define scm_tc3_unused 3
390 #define scm_tc3_imm24 4
391 #define scm_tc3_tc7_1 5
392 #define scm_tc3_int_2 (scm_tc2_int + 4)
393 #define scm_tc3_tc7_2 7
394
395
396 /* Definitions for tc7: */
397
398 #define SCM_ITAG7(x) (127 & SCM_UNPACK (x))
399 #define SCM_TYP7(x) (0x7f & SCM_CELL_TYPE (x))
400 #define SCM_TYP7S(x) ((0x7f & ~2) & SCM_CELL_TYPE (x))
401
402 #define scm_tc7_symbol 5
403 #define scm_tc7_variable 7
404
405 /* couple */
406 #define scm_tc7_vector 13
407 #define scm_tc7_wvect 15
408
409 #define scm_tc7_string 21
410 #define scm_tc7_number 23
411 #define scm_tc7_stringbuf 39
412 #define scm_tc7_bytevector 77
413
414 #define scm_tc7_pointer 31
415 #define scm_tc7_hashtable 29
416 #define scm_tc7_fluid 37
417 #define scm_tc7_dynamic_state 45
418
419 #define scm_tc7_frame 47
420 #define scm_tc7_objcode 53
421 #define scm_tc7_vm 55
422 #define scm_tc7_vm_cont 71
423
424 #define scm_tc7_prompt 61
425 #define scm_tc7_with_fluids 63
426 #define scm_tc7_unused_19 69
427 #define scm_tc7_program 79
428 #define scm_tc7_array 85
429 #define scm_tc7_bitvector 87
430 #define scm_tc7_unused_20 93
431 #define scm_tc7_unused_11 95
432 #define scm_tc7_unused_12 101
433 #define scm_tc7_unused_18 103
434 #define scm_tc7_unused_13 109
435 #define scm_tc7_unused_14 111
436 #define scm_tc7_unused_15 117
437 #define scm_tc7_unused_16 119
438
439 /* There are 256 port subtypes. */
440 #define scm_tc7_port 125
441
442 /* There are 256 smob subtypes. [**] If you change scm_tc7_smob, you must
443 * also change the places it is hard coded in this file and possibly others.
444 * Dirk:FIXME:: Any hard coded reference to scm_tc7_smob must be replaced by a
445 * symbolic reference. */
446 #define scm_tc7_smob 127 /* DO NOT CHANGE [**] */
447
448
449 /* Definitions for tc16: */
450 #define SCM_TYP16(x) (0xffff & SCM_CELL_TYPE (x))
451 #define SCM_TYP16_PREDICATE(tag, x) (!SCM_IMP (x) && SCM_TYP16 (x) == (tag))
452
453
454 \f
455
456 /* {Immediate Values}
457 */
458
459 enum scm_tc8_tags
460 {
461 scm_tc8_flag = scm_tc3_imm24 + 0x00, /* special objects ('flags') */
462 scm_tc8_char = scm_tc3_imm24 + 0x08, /* characters */
463 scm_tc8_unused_0 = scm_tc3_imm24 + 0x10,
464 scm_tc8_unused_1 = scm_tc3_imm24 + 0x18
465 };
466
467 #define SCM_ITAG8(X) (SCM_UNPACK (X) & 0xff)
468 #define SCM_MAKE_ITAG8_BITS(X, TAG) (((X) << 8) + TAG)
469 #define SCM_MAKE_ITAG8(X, TAG) (SCM_PACK (SCM_MAKE_ITAG8_BITS (X, TAG)))
470 #define SCM_ITAG8_DATA(X) (SCM_UNPACK (X) >> 8)
471
472 \f
473
474 /* Flags (special objects). The indices of the flags must agree with the
475 * declarations in print.c: iflagnames. */
476
477 #define SCM_IFLAGP(n) (SCM_ITAG8 (n) == scm_tc8_flag)
478 #define SCM_MAKIFLAG_BITS(n) (SCM_MAKE_ITAG8_BITS ((n), scm_tc8_flag))
479 #define SCM_IFLAGNUM(n) (SCM_ITAG8_DATA (n))
480
481 /*
482 * IMPORTANT NOTE regarding IFLAG numbering!!!
483 *
484 * Several macros depend upon careful IFLAG numbering of SCM_BOOL_F,
485 * SCM_BOOL_T, SCM_ELISP_NIL, SCM_EOL, and the two SCM_XXX_*_DONT_USE
486 * constants. In particular:
487 *
488 * - SCM_BOOL_F and SCM_BOOL_T must differ in exactly one bit position.
489 * (used to implement scm_is_bool_and_not_nil, aka scm_is_bool)
490 *
491 * - SCM_ELISP_NIL and SCM_BOOL_F must differ in exactly one bit position.
492 * (used to implement scm_is_false_or_nil and
493 * scm_is_true_and_not_nil)
494 *
495 * - SCM_ELISP_NIL and SCM_EOL must differ in exactly one bit position.
496 * (used to implement scm_is_null_or_nil)
497 *
498 * - SCM_ELISP_NIL, SCM_BOOL_F, SCM_EOL, SCM_XXX_ANOTHER_LISP_FALSE_DONT_USE
499 * must all be equal except for two bit positions.
500 * (used to implement scm_is_lisp_false)
501 *
502 * - SCM_ELISP_NIL, SCM_BOOL_F, SCM_BOOL_T, SCM_XXX_ANOTHER_BOOLEAN_DONT_USE_0
503 * must all be equal except for two bit positions.
504 * (used to implement scm_is_bool_or_nil)
505 *
506 * These properties allow the aforementioned macros to be implemented
507 * by bitwise ANDing with a mask and then comparing with a constant,
508 * using as a common basis the macro SCM_MATCHES_BITS_IN_COMMON,
509 * defined below. The properties are checked at compile-time using
510 * `verify' macros near the top of boolean.c and pairs.c.
511 */
512 #define SCM_BOOL_F_BITS SCM_MAKIFLAG_BITS (0)
513 #define SCM_ELISP_NIL_BITS SCM_MAKIFLAG_BITS (1)
514
515 #define SCM_BOOL_F SCM_PACK (SCM_BOOL_F_BITS)
516 #define SCM_ELISP_NIL SCM_PACK (SCM_ELISP_NIL_BITS)
517
518 #ifdef BUILDING_LIBGUILE
519 #define SCM_XXX_ANOTHER_LISP_FALSE_DONT_USE SCM_MAKIFLAG_BITS (2)
520 #endif
521
522 #define SCM_EOL_BITS SCM_MAKIFLAG_BITS (3)
523 #define SCM_BOOL_T_BITS SCM_MAKIFLAG_BITS (4)
524
525 #define SCM_EOL SCM_PACK (SCM_EOL_BITS)
526 #define SCM_BOOL_T SCM_PACK (SCM_BOOL_T_BITS)
527
528 #ifdef BUILDING_LIBGUILE
529 #define SCM_XXX_ANOTHER_BOOLEAN_DONT_USE_0 SCM_MAKIFLAG_BITS (5)
530 #define SCM_XXX_ANOTHER_BOOLEAN_DONT_USE_1 SCM_MAKIFLAG_BITS (6)
531 #define SCM_XXX_ANOTHER_BOOLEAN_DONT_USE_2 SCM_MAKIFLAG_BITS (7)
532 #endif
533
534 #define SCM_UNSPECIFIED_BITS SCM_MAKIFLAG_BITS (8)
535 #define SCM_UNDEFINED_BITS SCM_MAKIFLAG_BITS (9)
536 #define SCM_EOF_VAL_BITS SCM_MAKIFLAG_BITS (10)
537
538 #define SCM_UNSPECIFIED SCM_PACK (SCM_UNSPECIFIED_BITS)
539 #define SCM_UNDEFINED SCM_PACK (SCM_UNDEFINED_BITS)
540 #define SCM_EOF_VAL SCM_PACK (SCM_EOF_VAL_BITS)
541
542 /* When a variable is unbound this is marked by the SCM_UNDEFINED
543 * value. The following is an unbound value which can be handled on
544 * the Scheme level, i.e., it can be stored in and retrieved from a
545 * Scheme variable. This value is only intended to mark an unbound
546 * slot in GOOPS. It is needed now, but we should probably rewrite
547 * the code which handles this value in C so that SCM_UNDEFINED can be
548 * used instead. It is not ideal to let this kind of unique and
549 * strange values loose on the Scheme level. */
550 #define SCM_UNBOUND_BITS SCM_MAKIFLAG_BITS (11)
551 #define SCM_UNBOUND SCM_PACK (SCM_UNBOUND_BITS)
552
553 #define SCM_UNBNDP(x) (scm_is_eq ((x), SCM_UNDEFINED))
554
555 /*
556 * SCM_MATCHES_BITS_IN_COMMON(x,a,b) returns 1 if and only if x
557 * matches both a and b in every bit position where a and b are equal;
558 * otherwise it returns 0. Bit positions where a and b differ are
559 * ignored.
560 *
561 * This is used to efficiently compare against two values which differ
562 * in exactly one bit position, or against four values which differ in
563 * exactly two bit positions. It is the basis for the following
564 * macros:
565 *
566 * scm_is_null_or_nil,
567 * scm_is_false_or_nil,
568 * scm_is_true_and_not_nil,
569 * scm_is_lisp_false,
570 * scm_is_lisp_true,
571 * scm_is_bool_and_not_nil (aka scm_is_bool)
572 * scm_is_bool_or_nil.
573 */
574 #define SCM_MATCHES_BITS_IN_COMMON(x,a,b) \
575 ((SCM_UNPACK(x) & ~(SCM_UNPACK(a) ^ SCM_UNPACK(b))) == \
576 (SCM_UNPACK(a) & SCM_UNPACK(b)))
577
578 /*
579 * These macros are used for compile-time verification that the
580 * constants have the properties needed for the above macro to work
581 * properly.
582 */
583 #ifdef BUILDING_LIBGUILE
584 #define SCM_WITH_LEAST_SIGNIFICANT_1_BIT_CLEARED(x) ((x) & ((x)-1))
585 #define SCM_HAS_EXACTLY_ONE_BIT_SET(x) \
586 ((x) != 0 && SCM_WITH_LEAST_SIGNIFICANT_1_BIT_CLEARED (x) == 0)
587 #define SCM_HAS_EXACTLY_TWO_BITS_SET(x) \
588 (SCM_HAS_EXACTLY_ONE_BIT_SET (SCM_WITH_LEAST_SIGNIFICANT_1_BIT_CLEARED (x)))
589
590 #define SCM_BITS_DIFFER_IN_EXACTLY_ONE_BIT_POSITION(a,b) \
591 (SCM_HAS_EXACTLY_ONE_BIT_SET ((a) ^ (b)))
592 #define SCM_BITS_DIFFER_IN_EXACTLY_TWO_BIT_POSITIONS(a,b,c,d) \
593 (SCM_HAS_EXACTLY_TWO_BITS_SET (((a) ^ (b)) | \
594 ((b) ^ (c)) | \
595 ((c) ^ (d))))
596 #endif /* BUILDING_LIBGUILE */
597 \f
598
599 /* Dispatching aids:
600
601 When switching on SCM_TYP7 of a SCM value, use these fake case
602 labels to catch types that use fewer than 7 bits for tagging. */
603
604 /* For cons pairs with immediate values in the CAR
605 */
606
607 #define scm_tcs_cons_imcar \
608 scm_tc2_int + 0: case scm_tc2_int + 4: case scm_tc3_imm24 + 0:\
609 case scm_tc2_int + 8: case scm_tc2_int + 12: case scm_tc3_imm24 + 8:\
610 case scm_tc2_int + 16: case scm_tc2_int + 20: case scm_tc3_imm24 + 16:\
611 case scm_tc2_int + 24: case scm_tc2_int + 28: case scm_tc3_imm24 + 24:\
612 case scm_tc2_int + 32: case scm_tc2_int + 36: case scm_tc3_imm24 + 32:\
613 case scm_tc2_int + 40: case scm_tc2_int + 44: case scm_tc3_imm24 + 40:\
614 case scm_tc2_int + 48: case scm_tc2_int + 52: case scm_tc3_imm24 + 48:\
615 case scm_tc2_int + 56: case scm_tc2_int + 60: case scm_tc3_imm24 + 56:\
616 case scm_tc2_int + 64: case scm_tc2_int + 68: case scm_tc3_imm24 + 64:\
617 case scm_tc2_int + 72: case scm_tc2_int + 76: case scm_tc3_imm24 + 72:\
618 case scm_tc2_int + 80: case scm_tc2_int + 84: case scm_tc3_imm24 + 80:\
619 case scm_tc2_int + 88: case scm_tc2_int + 92: case scm_tc3_imm24 + 88:\
620 case scm_tc2_int + 96: case scm_tc2_int + 100: case scm_tc3_imm24 + 96:\
621 case scm_tc2_int + 104: case scm_tc2_int + 108: case scm_tc3_imm24 + 104:\
622 case scm_tc2_int + 112: case scm_tc2_int + 116: case scm_tc3_imm24 + 112:\
623 case scm_tc2_int + 120: case scm_tc2_int + 124: case scm_tc3_imm24 + 120
624
625 /* For cons pairs with non-immediate values in the SCM_CAR
626 */
627 #define scm_tcs_cons_nimcar \
628 scm_tc3_cons + 0:\
629 case scm_tc3_cons + 8:\
630 case scm_tc3_cons + 16:\
631 case scm_tc3_cons + 24:\
632 case scm_tc3_cons + 32:\
633 case scm_tc3_cons + 40:\
634 case scm_tc3_cons + 48:\
635 case scm_tc3_cons + 56:\
636 case scm_tc3_cons + 64:\
637 case scm_tc3_cons + 72:\
638 case scm_tc3_cons + 80:\
639 case scm_tc3_cons + 88:\
640 case scm_tc3_cons + 96:\
641 case scm_tc3_cons + 104:\
642 case scm_tc3_cons + 112:\
643 case scm_tc3_cons + 120
644
645 /* For structs
646 */
647 #define scm_tcs_struct \
648 scm_tc3_struct + 0:\
649 case scm_tc3_struct + 8:\
650 case scm_tc3_struct + 16:\
651 case scm_tc3_struct + 24:\
652 case scm_tc3_struct + 32:\
653 case scm_tc3_struct + 40:\
654 case scm_tc3_struct + 48:\
655 case scm_tc3_struct + 56:\
656 case scm_tc3_struct + 64:\
657 case scm_tc3_struct + 72:\
658 case scm_tc3_struct + 80:\
659 case scm_tc3_struct + 88:\
660 case scm_tc3_struct + 96:\
661 case scm_tc3_struct + 104:\
662 case scm_tc3_struct + 112:\
663 case scm_tc3_struct + 120
664
665 \f
666
667 #if (SCM_ENABLE_DEPRECATED == 1)
668
669 #define SCM_CELLP(x) (((sizeof (scm_t_cell) - 1) & SCM_UNPACK (x)) == 0)
670 #define SCM_NCELLP(x) (!SCM_CELLP (x))
671
672 #endif
673
674 #endif /* SCM_TAGS_H */
675
676 /*
677 Local Variables:
678 c-file-style: "gnu"
679 End:
680 */