Merge remote-tracking branch 'origin/stable-2.0'
[bpt/guile.git] / libguile / gc.c
1 /* Copyright (C) 1995,1996,1997,1998,1999,2000,2001, 2002, 2003, 2006, 2008, 2009, 2010, 2011 Free Software Foundation, Inc.
2 *
3 * This library is free software; you can redistribute it and/or
4 * modify it under the terms of the GNU Lesser General Public License
5 * as published by the Free Software Foundation; either version 3 of
6 * the License, or (at your option) any later version.
7 *
8 * This library is distributed in the hope that it will be useful, but
9 * WITHOUT ANY WARRANTY; without even the implied warranty of
10 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
11 * Lesser General Public License for more details.
12 *
13 * You should have received a copy of the GNU Lesser General Public
14 * License along with this library; if not, write to the Free Software
15 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
16 * 02110-1301 USA
17 */
18
19 /* #define DEBUGINFO */
20
21 #ifdef HAVE_CONFIG_H
22 # include <config.h>
23 #endif
24
25 #include "libguile/gen-scmconfig.h"
26
27 #include <stdio.h>
28 #include <errno.h>
29 #include <string.h>
30 #include <math.h>
31
32 #ifdef __ia64__
33 #include <ucontext.h>
34 extern unsigned long * __libc_ia64_register_backing_store_base;
35 #endif
36
37 #include "libguile/_scm.h"
38 #include "libguile/eval.h"
39 #include "libguile/stime.h"
40 #include "libguile/stackchk.h"
41 #include "libguile/struct.h"
42 #include "libguile/smob.h"
43 #include "libguile/arrays.h"
44 #include "libguile/async.h"
45 #include "libguile/ports.h"
46 #include "libguile/root.h"
47 #include "libguile/strings.h"
48 #include "libguile/vectors.h"
49 #include "libguile/hashtab.h"
50 #include "libguile/tags.h"
51
52 #include "libguile/private-gc.h"
53 #include "libguile/validate.h"
54 #include "libguile/deprecation.h"
55 #include "libguile/gc.h"
56 #include "libguile/dynwind.h"
57
58 #include "libguile/bdw-gc.h"
59
60 /* For GC_set_start_callback. */
61 #include <gc/gc_mark.h>
62
63 #ifdef GUILE_DEBUG_MALLOC
64 #include "libguile/debug-malloc.h"
65 #endif
66
67 #ifdef HAVE_MALLOC_H
68 #include <malloc.h>
69 #endif
70
71 #ifdef HAVE_UNISTD_H
72 #include <unistd.h>
73 #endif
74
75 /* Set this to != 0 if every cell that is accessed shall be checked:
76 */
77 int scm_debug_cell_accesses_p = 0;
78 int scm_expensive_debug_cell_accesses_p = 0;
79
80 /* Set this to 0 if no additional gc's shall be performed, otherwise set it to
81 * the number of cell accesses after which a gc shall be called.
82 */
83 int scm_debug_cells_gc_interval = 0;
84
85 /* Hash table that keeps a reference to objects the user wants to protect from
86 garbage collection. */
87 static SCM scm_protects;
88
89
90 #if (SCM_DEBUG_CELL_ACCESSES == 1)
91
92
93 /*
94
95 Assert that the given object is a valid reference to a valid cell. This
96 test involves to determine whether the object is a cell pointer, whether
97 this pointer actually points into a heap segment and whether the cell
98 pointed to is not a free cell. Further, additional garbage collections may
99 get executed after a user defined number of cell accesses. This helps to
100 find places in the C code where references are dropped for extremely short
101 periods.
102
103 */
104 void
105 scm_i_expensive_validation_check (SCM cell)
106 {
107 /* If desired, perform additional garbage collections after a user
108 * defined number of cell accesses.
109 */
110 if (scm_debug_cells_gc_interval)
111 {
112 static unsigned int counter = 0;
113
114 if (counter != 0)
115 {
116 --counter;
117 }
118 else
119 {
120 counter = scm_debug_cells_gc_interval;
121 scm_gc ();
122 }
123 }
124 }
125
126 /* Whether cell validation is already running. */
127 static int scm_i_cell_validation_already_running = 0;
128
129 void
130 scm_assert_cell_valid (SCM cell)
131 {
132 if (!scm_i_cell_validation_already_running && scm_debug_cell_accesses_p)
133 {
134 scm_i_cell_validation_already_running = 1; /* set to avoid recursion */
135
136 /*
137 During GC, no user-code should be run, and the guile core
138 should use non-protected accessors.
139 */
140 if (scm_gc_running_p)
141 return;
142
143 /*
144 Only scm_in_heap_p and rescanning the heap is wildly
145 expensive.
146 */
147 if (scm_expensive_debug_cell_accesses_p)
148 scm_i_expensive_validation_check (cell);
149
150 scm_i_cell_validation_already_running = 0; /* re-enable */
151 }
152 }
153
154
155
156 SCM_DEFINE (scm_set_debug_cell_accesses_x, "set-debug-cell-accesses!", 1, 0, 0,
157 (SCM flag),
158 "If @var{flag} is @code{#f}, cell access checking is disabled.\n"
159 "If @var{flag} is @code{#t}, cheap cell access checking is enabled,\n"
160 "but no additional calls to garbage collection are issued.\n"
161 "If @var{flag} is a number, strict cell access checking is enabled,\n"
162 "with an additional garbage collection after the given\n"
163 "number of cell accesses.\n"
164 "This procedure only exists when the compile-time flag\n"
165 "@code{SCM_DEBUG_CELL_ACCESSES} was set to 1.")
166 #define FUNC_NAME s_scm_set_debug_cell_accesses_x
167 {
168 if (scm_is_false (flag))
169 {
170 scm_debug_cell_accesses_p = 0;
171 }
172 else if (scm_is_eq (flag, SCM_BOOL_T))
173 {
174 scm_debug_cells_gc_interval = 0;
175 scm_debug_cell_accesses_p = 1;
176 scm_expensive_debug_cell_accesses_p = 0;
177 }
178 else
179 {
180 scm_debug_cells_gc_interval = scm_to_signed_integer (flag, 0, INT_MAX);
181 scm_debug_cell_accesses_p = 1;
182 scm_expensive_debug_cell_accesses_p = 1;
183 }
184 return SCM_UNSPECIFIED;
185 }
186 #undef FUNC_NAME
187
188
189 #endif /* SCM_DEBUG_CELL_ACCESSES == 1 */
190
191 \f
192
193 /* Compatibility. */
194
195 #ifndef HAVE_GC_GET_HEAP_USAGE_SAFE
196 static void
197 GC_get_heap_usage_safe (GC_word *pheap_size, GC_word *pfree_bytes,
198 GC_word *punmapped_bytes, GC_word *pbytes_since_gc,
199 GC_word *ptotal_bytes)
200 {
201 *pheap_size = GC_get_heap_size ();
202 *pfree_bytes = GC_get_free_bytes ();
203 *punmapped_bytes = GC_get_unmapped_bytes ();
204 *pbytes_since_gc = GC_get_bytes_since_gc ();
205 *ptotal_bytes = GC_get_total_bytes ();
206 }
207 #endif
208
209 #ifndef HAVE_GC_GET_FREE_SPACE_DIVISOR
210 static GC_word
211 GC_get_free_space_divisor (void)
212 {
213 return GC_free_space_divisor;
214 }
215 #endif
216
217 \f
218 /* Hooks. */
219 scm_t_c_hook scm_before_gc_c_hook;
220 scm_t_c_hook scm_before_mark_c_hook;
221 scm_t_c_hook scm_before_sweep_c_hook;
222 scm_t_c_hook scm_after_sweep_c_hook;
223 scm_t_c_hook scm_after_gc_c_hook;
224
225
226 static void
227 run_before_gc_c_hook (void)
228 {
229 scm_c_hook_run (&scm_before_gc_c_hook, NULL);
230 }
231
232
233 /* GC Statistics Keeping
234 */
235 unsigned long scm_gc_ports_collected = 0;
236 static long gc_time_taken = 0;
237 static long gc_start_time = 0;
238
239 static unsigned long free_space_divisor;
240 static unsigned long minimum_free_space_divisor;
241 static double target_free_space_divisor;
242
243 static unsigned long protected_obj_count = 0;
244
245
246 SCM_SYMBOL (sym_gc_time_taken, "gc-time-taken");
247 SCM_SYMBOL (sym_heap_size, "heap-size");
248 SCM_SYMBOL (sym_heap_free_size, "heap-free-size");
249 SCM_SYMBOL (sym_heap_total_allocated, "heap-total-allocated");
250 SCM_SYMBOL (sym_heap_allocated_since_gc, "heap-allocated-since-gc");
251 SCM_SYMBOL (sym_protected_objects, "protected-objects");
252 SCM_SYMBOL (sym_times, "gc-times");
253
254
255 /* {Scheme Interface to GC}
256 */
257 static SCM
258 tag_table_to_type_alist (void *closure, SCM key, SCM val, SCM acc)
259 {
260 if (scm_is_integer (key))
261 {
262 int c_tag = scm_to_int (key);
263
264 char const * name = scm_i_tag_name (c_tag);
265 if (name != NULL)
266 {
267 key = scm_from_locale_string (name);
268 }
269 else
270 {
271 char s[100];
272 sprintf (s, "tag %d", c_tag);
273 key = scm_from_locale_string (s);
274 }
275 }
276
277 return scm_cons (scm_cons (key, val), acc);
278 }
279
280 SCM_DEFINE (scm_gc_live_object_stats, "gc-live-object-stats", 0, 0, 0,
281 (),
282 "Return an alist of statistics of the current live objects. ")
283 #define FUNC_NAME s_scm_gc_live_object_stats
284 {
285 SCM tab = scm_make_hash_table (scm_from_int (57));
286 SCM alist;
287
288 alist
289 = scm_internal_hash_fold (&tag_table_to_type_alist, NULL, SCM_EOL, tab);
290
291 return alist;
292 }
293 #undef FUNC_NAME
294
295 extern int scm_gc_malloc_yield_percentage;
296 SCM_DEFINE (scm_gc_stats, "gc-stats", 0, 0, 0,
297 (),
298 "Return an association list of statistics about Guile's current\n"
299 "use of storage.\n")
300 #define FUNC_NAME s_scm_gc_stats
301 {
302 SCM answer;
303 GC_word heap_size, free_bytes, unmapped_bytes, bytes_since_gc, total_bytes;
304 size_t gc_times;
305
306 GC_get_heap_usage_safe (&heap_size, &free_bytes, &unmapped_bytes,
307 &bytes_since_gc, &total_bytes);
308 gc_times = GC_gc_no;
309
310 answer =
311 scm_list_n (scm_cons (sym_gc_time_taken, scm_from_long (gc_time_taken)),
312 scm_cons (sym_heap_size, scm_from_size_t (heap_size)),
313 scm_cons (sym_heap_free_size, scm_from_size_t (free_bytes)),
314 scm_cons (sym_heap_total_allocated,
315 scm_from_size_t (total_bytes)),
316 scm_cons (sym_heap_allocated_since_gc,
317 scm_from_size_t (bytes_since_gc)),
318 scm_cons (sym_protected_objects,
319 scm_from_ulong (protected_obj_count)),
320 scm_cons (sym_times, scm_from_size_t (gc_times)),
321 SCM_UNDEFINED);
322
323 return answer;
324 }
325 #undef FUNC_NAME
326
327
328 SCM_DEFINE (scm_gc_dump, "gc-dump", 0, 0, 0,
329 (void),
330 "Dump information about the garbage collector's internal data "
331 "structures and memory usage to the standard output.")
332 #define FUNC_NAME s_scm_gc_dump
333 {
334 GC_dump ();
335
336 return SCM_UNSPECIFIED;
337 }
338 #undef FUNC_NAME
339
340
341 SCM_DEFINE (scm_object_address, "object-address", 1, 0, 0,
342 (SCM obj),
343 "Return an integer that for the lifetime of @var{obj} is uniquely\n"
344 "returned by this function for @var{obj}")
345 #define FUNC_NAME s_scm_object_address
346 {
347 return scm_from_ulong (SCM_UNPACK (obj));
348 }
349 #undef FUNC_NAME
350
351
352 SCM_DEFINE (scm_gc_disable, "gc-disable", 0, 0, 0,
353 (),
354 "Disables the garbage collector. Nested calls are permitted. "
355 "GC is re-enabled once @code{gc-enable} has been called the "
356 "same number of times @code{gc-disable} was called.")
357 #define FUNC_NAME s_scm_gc_disable
358 {
359 GC_disable ();
360 return SCM_UNSPECIFIED;
361 }
362 #undef FUNC_NAME
363
364 SCM_DEFINE (scm_gc_enable, "gc-enable", 0, 0, 0,
365 (),
366 "Enables the garbage collector.")
367 #define FUNC_NAME s_scm_gc_enable
368 {
369 GC_enable ();
370 return SCM_UNSPECIFIED;
371 }
372 #undef FUNC_NAME
373
374
375 SCM_DEFINE (scm_gc, "gc", 0, 0, 0,
376 (),
377 "Scans all of SCM objects and reclaims for further use those that are\n"
378 "no longer accessible.")
379 #define FUNC_NAME s_scm_gc
380 {
381 scm_i_gc ("call");
382 return SCM_UNSPECIFIED;
383 }
384 #undef FUNC_NAME
385
386 void
387 scm_i_gc (const char *what)
388 {
389 #ifndef HAVE_GC_SET_START_CALLBACK
390 run_before_gc_c_hook ();
391 #endif
392 GC_gcollect ();
393 }
394
395
396 \f
397 /* {GC Protection Helper Functions}
398 */
399
400
401 /*
402 * If within a function you need to protect one or more scheme objects from
403 * garbage collection, pass them as parameters to one of the
404 * scm_remember_upto_here* functions below. These functions don't do
405 * anything, but since the compiler does not know that they are actually
406 * no-ops, it will generate code that calls these functions with the given
407 * parameters. Therefore, you can be sure that the compiler will keep those
408 * scheme values alive (on the stack or in a register) up to the point where
409 * scm_remember_upto_here* is called. In other words, place the call to
410 * scm_remember_upto_here* _behind_ the last code in your function, that
411 * depends on the scheme object to exist.
412 *
413 * Example: We want to make sure that the string object str does not get
414 * garbage collected during the execution of 'some_function' in the code
415 * below, because otherwise the characters belonging to str would be freed and
416 * 'some_function' might access freed memory. To make sure that the compiler
417 * keeps str alive on the stack or in a register such that it is visible to
418 * the conservative gc we add the call to scm_remember_upto_here_1 _after_ the
419 * call to 'some_function'. Note that this would not be necessary if str was
420 * used anyway after the call to 'some_function'.
421 * char *chars = scm_i_string_chars (str);
422 * some_function (chars);
423 * scm_remember_upto_here_1 (str); // str will be alive up to this point.
424 */
425
426 /* Remove any macro versions of these while defining the functions.
427 Functions are always included in the library, for upward binary
428 compatibility and in case combinations of GCC and non-GCC are used. */
429 #undef scm_remember_upto_here_1
430 #undef scm_remember_upto_here_2
431
432 void
433 scm_remember_upto_here_1 (SCM obj SCM_UNUSED)
434 {
435 /* Empty. Protects a single object from garbage collection. */
436 }
437
438 void
439 scm_remember_upto_here_2 (SCM obj1 SCM_UNUSED, SCM obj2 SCM_UNUSED)
440 {
441 /* Empty. Protects two objects from garbage collection. */
442 }
443
444 void
445 scm_remember_upto_here (SCM obj SCM_UNUSED, ...)
446 {
447 /* Empty. Protects any number of objects from garbage collection. */
448 }
449
450 /*
451 These crazy functions prevent garbage collection
452 of arguments after the first argument by
453 ensuring they remain live throughout the
454 function because they are used in the last
455 line of the code block.
456 It'd be better to have a nice compiler hint to
457 aid the conservative stack-scanning GC. --03/09/00 gjb */
458 SCM
459 scm_return_first (SCM elt, ...)
460 {
461 return elt;
462 }
463
464 int
465 scm_return_first_int (int i, ...)
466 {
467 return i;
468 }
469
470
471 SCM
472 scm_permanent_object (SCM obj)
473 {
474 return (scm_gc_protect_object (obj));
475 }
476
477
478 /* Protect OBJ from the garbage collector. OBJ will not be freed, even if all
479 other references are dropped, until the object is unprotected by calling
480 scm_gc_unprotect_object (OBJ). Calls to scm_gc_protect/unprotect_object nest,
481 i. e. it is possible to protect the same object several times, but it is
482 necessary to unprotect the object the same number of times to actually get
483 the object unprotected. It is an error to unprotect an object more often
484 than it has been protected before. The function scm_protect_object returns
485 OBJ.
486 */
487
488 /* Implementation note: For every object X, there is a counter which
489 scm_gc_protect_object (X) increments and scm_gc_unprotect_object (X) decrements.
490 */
491
492
493
494 SCM
495 scm_gc_protect_object (SCM obj)
496 {
497 SCM handle;
498
499 /* This critical section barrier will be replaced by a mutex. */
500 /* njrev: Indeed; if my comment above is correct, there is the same
501 critsec/mutex inconsistency here. */
502 SCM_CRITICAL_SECTION_START;
503
504 handle = scm_hashq_create_handle_x (scm_protects, obj, scm_from_int (0));
505 SCM_SETCDR (handle, scm_sum (SCM_CDR (handle), scm_from_int (1)));
506
507 protected_obj_count ++;
508
509 SCM_CRITICAL_SECTION_END;
510
511 return obj;
512 }
513
514
515 /* Remove any protection for OBJ established by a prior call to
516 scm_protect_object. This function returns OBJ.
517
518 See scm_protect_object for more information. */
519 SCM
520 scm_gc_unprotect_object (SCM obj)
521 {
522 SCM handle;
523
524 /* This critical section barrier will be replaced by a mutex. */
525 /* njrev: and again. */
526 SCM_CRITICAL_SECTION_START;
527
528 if (scm_gc_running_p)
529 {
530 fprintf (stderr, "scm_unprotect_object called during GC.\n");
531 abort ();
532 }
533
534 handle = scm_hashq_get_handle (scm_protects, obj);
535
536 if (scm_is_false (handle))
537 {
538 fprintf (stderr, "scm_unprotect_object called on unprotected object\n");
539 abort ();
540 }
541 else
542 {
543 SCM count = scm_difference (SCM_CDR (handle), scm_from_int (1));
544 if (scm_is_eq (count, scm_from_int (0)))
545 scm_hashq_remove_x (scm_protects, obj);
546 else
547 SCM_SETCDR (handle, count);
548 }
549 protected_obj_count --;
550
551 SCM_CRITICAL_SECTION_END;
552
553 return obj;
554 }
555
556 void
557 scm_gc_register_root (SCM *p)
558 {
559 /* Nothing. */
560 }
561
562 void
563 scm_gc_unregister_root (SCM *p)
564 {
565 /* Nothing. */
566 }
567
568 void
569 scm_gc_register_roots (SCM *b, unsigned long n)
570 {
571 SCM *p = b;
572 for (; p < b + n; ++p)
573 scm_gc_register_root (p);
574 }
575
576 void
577 scm_gc_unregister_roots (SCM *b, unsigned long n)
578 {
579 SCM *p = b;
580 for (; p < b + n; ++p)
581 scm_gc_unregister_root (p);
582 }
583
584 \f
585
586
587 /*
588 MOVE THIS FUNCTION. IT DOES NOT HAVE ANYTHING TODO WITH GC.
589 */
590
591 /* Get an integer from an environment variable. */
592 int
593 scm_getenv_int (const char *var, int def)
594 {
595 char *end = 0;
596 char *val = getenv (var);
597 long res = def;
598 if (!val)
599 return def;
600 res = strtol (val, &end, 10);
601 if (end == val)
602 return def;
603 return res;
604 }
605
606 void
607 scm_storage_prehistory ()
608 {
609 GC_all_interior_pointers = 0;
610 free_space_divisor = scm_getenv_int ("GC_FREE_SPACE_DIVISOR", 3);
611 minimum_free_space_divisor = free_space_divisor;
612 target_free_space_divisor = free_space_divisor;
613 GC_set_free_space_divisor (free_space_divisor);
614
615 GC_INIT ();
616
617 #if (! ((defined GC_VERSION_MAJOR) && (GC_VERSION_MAJOR >= 7))) \
618 && (defined SCM_I_GSC_USE_PTHREAD_THREADS)
619 /* When using GC 6.8, this call is required to initialize thread-local
620 freelists (shouldn't be necessary with GC 7.0). */
621 GC_init ();
622 #endif
623
624 GC_expand_hp (SCM_DEFAULT_INIT_HEAP_SIZE_2);
625
626 /* We only need to register a displacement for those types for which the
627 higher bits of the type tag are used to store a pointer (that is, a
628 pointer to an 8-octet aligned region). For `scm_tc3_struct', this is
629 handled in `scm_alloc_struct ()'. */
630 GC_REGISTER_DISPLACEMENT (scm_tc3_cons);
631 /* GC_REGISTER_DISPLACEMENT (scm_tc3_unused); */
632
633 /* Sanity check. */
634 if (!GC_is_visible (&scm_protects))
635 abort ();
636
637 scm_c_hook_init (&scm_before_gc_c_hook, 0, SCM_C_HOOK_NORMAL);
638 scm_c_hook_init (&scm_before_mark_c_hook, 0, SCM_C_HOOK_NORMAL);
639 scm_c_hook_init (&scm_before_sweep_c_hook, 0, SCM_C_HOOK_NORMAL);
640 scm_c_hook_init (&scm_after_sweep_c_hook, 0, SCM_C_HOOK_NORMAL);
641 scm_c_hook_init (&scm_after_gc_c_hook, 0, SCM_C_HOOK_NORMAL);
642 }
643
644 scm_i_pthread_mutex_t scm_i_gc_admin_mutex = SCM_I_PTHREAD_MUTEX_INITIALIZER;
645
646 void
647 scm_init_gc_protect_object ()
648 {
649 scm_protects = scm_c_make_hash_table (31);
650
651 #if 0
652 /* We can't have a cleanup handler since we have no thread to run it
653 in. */
654
655 #ifdef HAVE_ATEXIT
656 atexit (cleanup);
657 #else
658 #ifdef HAVE_ON_EXIT
659 on_exit (cleanup, 0);
660 #endif
661 #endif
662
663 #endif
664 }
665
666 \f
667
668 SCM scm_after_gc_hook;
669
670 static SCM after_gc_async_cell;
671
672 /* The function after_gc_async_thunk causes the execution of the
673 * after-gc-hook. It is run after the gc, as soon as the asynchronous
674 * events are handled by the evaluator.
675 */
676 static SCM
677 after_gc_async_thunk (void)
678 {
679 /* Fun, no? Hook-run *and* run-hook? */
680 scm_c_hook_run (&scm_after_gc_c_hook, NULL);
681 scm_c_run_hook (scm_after_gc_hook, SCM_EOL);
682 return SCM_UNSPECIFIED;
683 }
684
685
686 /* The function queue_after_gc_hook is run by the scm_before_gc_c_hook
687 * at the end of the garbage collection. The only purpose of this
688 * function is to mark the after_gc_async (which will eventually lead to
689 * the execution of the after_gc_async_thunk).
690 */
691 static void *
692 queue_after_gc_hook (void * hook_data SCM_UNUSED,
693 void *fn_data SCM_UNUSED,
694 void *data SCM_UNUSED)
695 {
696 /* If cell access debugging is enabled, the user may choose to perform
697 * additional garbage collections after an arbitrary number of cell
698 * accesses. We don't want the scheme level after-gc-hook to be performed
699 * for each of these garbage collections for the following reason: The
700 * execution of the after-gc-hook causes cell accesses itself. Thus, if the
701 * after-gc-hook was performed with every gc, and if the gc was performed
702 * after a very small number of cell accesses, then the number of cell
703 * accesses during the execution of the after-gc-hook will suffice to cause
704 * the execution of the next gc. Then, guile would keep executing the
705 * after-gc-hook over and over again, and would never come to do other
706 * things.
707 *
708 * To overcome this problem, if cell access debugging with additional
709 * garbage collections is enabled, the after-gc-hook is never run by the
710 * garbage collecter. When running guile with cell access debugging and the
711 * execution of the after-gc-hook is desired, then it is necessary to run
712 * the hook explicitly from the user code. This has the effect, that from
713 * the scheme level point of view it seems that garbage collection is
714 * performed with a much lower frequency than it actually is. Obviously,
715 * this will not work for code that depends on a fixed one to one
716 * relationship between the execution counts of the C level garbage
717 * collection hooks and the execution count of the scheme level
718 * after-gc-hook.
719 */
720
721 #if (SCM_DEBUG_CELL_ACCESSES == 1)
722 if (scm_debug_cells_gc_interval == 0)
723 #endif
724 {
725 scm_i_thread *t = SCM_I_CURRENT_THREAD;
726
727 if (scm_is_false (SCM_CDR (after_gc_async_cell)))
728 {
729 SCM_SETCDR (after_gc_async_cell, t->active_asyncs);
730 t->active_asyncs = after_gc_async_cell;
731 t->pending_asyncs = 1;
732 }
733 }
734
735 return NULL;
736 }
737
738 \f
739
740 static void *
741 start_gc_timer (void * hook_data SCM_UNUSED,
742 void *fn_data SCM_UNUSED,
743 void *data SCM_UNUSED)
744 {
745 if (!gc_start_time)
746 gc_start_time = scm_c_get_internal_run_time ();
747
748 return NULL;
749 }
750
751 static void *
752 accumulate_gc_timer (void * hook_data SCM_UNUSED,
753 void *fn_data SCM_UNUSED,
754 void *data SCM_UNUSED)
755 {
756 if (gc_start_time)
757 {
758 long now = scm_c_get_internal_run_time ();
759 gc_time_taken += now - gc_start_time;
760 gc_start_time = 0;
761 }
762
763 return NULL;
764 }
765
766 /* Return some idea of the memory footprint of a process, in bytes.
767 Currently only works on Linux systems. */
768 static size_t
769 get_image_size (void)
770 {
771 unsigned long size, resident, share;
772 size_t ret = 0;
773
774 FILE *fp = fopen ("/proc/self/statm", "r");
775
776 if (fp && fscanf (fp, "%lu %lu %lu", &size, &resident, &share) == 3)
777 ret = resident * 4096;
778
779 if (fp)
780 fclose (fp);
781
782 return ret;
783 }
784
785 /* These are discussed later. */
786 static size_t bytes_until_gc;
787 static scm_i_pthread_mutex_t bytes_until_gc_lock = SCM_I_PTHREAD_MUTEX_INITIALIZER;
788
789 /* Make GC run more frequently when the process image size is growing,
790 measured against the number of bytes allocated through the GC.
791
792 If Guile is allocating at a GC-managed heap size H, libgc will tend
793 to limit the process image size to H*N. But if at the same time the
794 user program is mallocating at a rate M bytes per GC-allocated byte,
795 then the process stabilizes at H*N*M -- assuming that collecting data
796 will result in malloc'd data being freed. It doesn't take a very
797 large M for this to be a bad situation. To limit the image size,
798 Guile should GC more often -- the bigger the M, the more often.
799
800 Numeric functions that produce bigger and bigger integers are
801 pessimal, because M is an increasing function of time. Here is an
802 example of such a function:
803
804 (define (factorial n)
805 (define (fac n acc)
806 (if (<= n 1)
807 acc
808 (fac (1- n) (* n acc))))
809 (fac n 1))
810
811 It is possible for a process to grow for reasons that will not be
812 solved by faster GC. In that case M will be estimated as
813 artificially high for a while, and so GC will happen more often on
814 the Guile side. But when it stabilizes, Guile can ease back the GC
815 frequency.
816
817 The key is to measure process image growth, not mallocation rate.
818 For maximum effectiveness, Guile reacts quickly to process growth,
819 and exponentially backs down when the process stops growing.
820
821 See http://thread.gmane.org/gmane.lisp.guile.devel/12552/focus=12936
822 for further discussion.
823 */
824 static void *
825 adjust_gc_frequency (void * hook_data SCM_UNUSED,
826 void *fn_data SCM_UNUSED,
827 void *data SCM_UNUSED)
828 {
829 static size_t prev_image_size = 0;
830 static size_t prev_bytes_alloced = 0;
831 size_t image_size;
832 size_t bytes_alloced;
833
834 scm_i_pthread_mutex_lock (&bytes_until_gc_lock);
835 bytes_until_gc = GC_get_heap_size ();
836 scm_i_pthread_mutex_unlock (&bytes_until_gc_lock);
837
838 image_size = get_image_size ();
839 bytes_alloced = GC_get_total_bytes ();
840
841 #define HEURISTICS_DEBUG 0
842
843 #if HEURISTICS_DEBUG
844 fprintf (stderr, "prev image / alloced: %lu / %lu\n", prev_image_size, prev_bytes_alloced);
845 fprintf (stderr, " image / alloced: %lu / %lu\n", image_size, bytes_alloced);
846 fprintf (stderr, "divisor %lu / %f\n", free_space_divisor, target_free_space_divisor);
847 #endif
848
849 if (prev_image_size && bytes_alloced != prev_bytes_alloced)
850 {
851 double growth_rate, new_target_free_space_divisor;
852 double decay_factor = 0.5;
853 double hysteresis = 0.1;
854
855 growth_rate = ((double) image_size - prev_image_size)
856 / ((double)bytes_alloced - prev_bytes_alloced);
857
858 #if HEURISTICS_DEBUG
859 fprintf (stderr, "growth rate %f\n", growth_rate);
860 #endif
861
862 new_target_free_space_divisor = minimum_free_space_divisor;
863
864 if (growth_rate > 0)
865 new_target_free_space_divisor *= 1.0 + growth_rate;
866
867 #if HEURISTICS_DEBUG
868 fprintf (stderr, "new divisor %f\n", new_target_free_space_divisor);
869 #endif
870
871 if (new_target_free_space_divisor < target_free_space_divisor)
872 /* Decay down. */
873 target_free_space_divisor =
874 (decay_factor * target_free_space_divisor
875 + (1.0 - decay_factor) * new_target_free_space_divisor);
876 else
877 /* Jump up. */
878 target_free_space_divisor = new_target_free_space_divisor;
879
880 #if HEURISTICS_DEBUG
881 fprintf (stderr, "new target divisor %f\n", target_free_space_divisor);
882 #endif
883
884 if (free_space_divisor + 0.5 + hysteresis < target_free_space_divisor
885 || free_space_divisor - 0.5 - hysteresis > target_free_space_divisor)
886 {
887 free_space_divisor = lround (target_free_space_divisor);
888 #if HEURISTICS_DEBUG
889 fprintf (stderr, "new divisor %lu\n", free_space_divisor);
890 #endif
891 GC_set_free_space_divisor (free_space_divisor);
892 }
893 }
894
895 prev_image_size = image_size;
896 prev_bytes_alloced = bytes_alloced;
897
898 return NULL;
899 }
900
901 /* The adjust_gc_frequency routine handles transients in the process
902 image size. It can't handle instense non-GC-managed steady-state
903 allocation though, as it decays the FSD at steady-state down to its
904 minimum value.
905
906 The only real way to handle continuous, high non-GC allocation is to
907 let the GC know about it. This routine can handle non-GC allocation
908 rates that are similar in size to the GC-managed heap size.
909 */
910
911 void
912 scm_gc_register_allocation (size_t size)
913 {
914 scm_i_pthread_mutex_lock (&bytes_until_gc_lock);
915 if (bytes_until_gc - size > bytes_until_gc)
916 {
917 bytes_until_gc = GC_get_heap_size ();
918 scm_i_pthread_mutex_unlock (&bytes_until_gc_lock);
919 GC_gcollect ();
920 }
921 else
922 {
923 bytes_until_gc -= size;
924 scm_i_pthread_mutex_unlock (&bytes_until_gc_lock);
925 }
926 }
927
928
929 \f
930
931 char const *
932 scm_i_tag_name (scm_t_bits tag)
933 {
934 switch (tag & 0x7f) /* 7 bits */
935 {
936 case scm_tcs_struct:
937 return "struct";
938 case scm_tcs_cons_imcar:
939 return "cons (immediate car)";
940 case scm_tcs_cons_nimcar:
941 return "cons (non-immediate car)";
942 case scm_tc7_pointer:
943 return "foreign";
944 case scm_tc7_hashtable:
945 return "hashtable";
946 case scm_tc7_weak_set:
947 return "weak-set";
948 case scm_tc7_weak_table:
949 return "weak-table";
950 case scm_tc7_fluid:
951 return "fluid";
952 case scm_tc7_dynamic_state:
953 return "dynamic state";
954 case scm_tc7_frame:
955 return "frame";
956 case scm_tc7_objcode:
957 return "objcode";
958 case scm_tc7_vm:
959 return "vm";
960 case scm_tc7_vm_cont:
961 return "vm continuation";
962 case scm_tc7_wvect:
963 return "weak vector";
964 case scm_tc7_vector:
965 return "vector";
966 case scm_tc7_number:
967 switch (tag)
968 {
969 case scm_tc16_real:
970 return "real";
971 break;
972 case scm_tc16_big:
973 return "bignum";
974 break;
975 case scm_tc16_complex:
976 return "complex number";
977 break;
978 case scm_tc16_fraction:
979 return "fraction";
980 break;
981 }
982 break;
983 case scm_tc7_string:
984 return "string";
985 break;
986 case scm_tc7_stringbuf:
987 return "string buffer";
988 break;
989 case scm_tc7_symbol:
990 return "symbol";
991 break;
992 case scm_tc7_variable:
993 return "variable";
994 break;
995 case scm_tc7_port:
996 return "port";
997 break;
998 case scm_tc7_smob:
999 {
1000 int k = 0xff & (tag >> 8);
1001 return (scm_smobs[k].name);
1002 }
1003 break;
1004 }
1005
1006 return NULL;
1007 }
1008
1009
1010
1011 \f
1012 void
1013 scm_init_gc ()
1014 {
1015 /* `GC_INIT ()' was invoked in `scm_storage_prehistory ()'. */
1016
1017 scm_after_gc_hook = scm_make_hook (SCM_INUM0);
1018 scm_c_define ("after-gc-hook", scm_after_gc_hook);
1019
1020 /* When the async is to run, the cdr of the gc_async pair gets set to
1021 the asyncs queue of the current thread. */
1022 after_gc_async_cell = scm_cons (scm_c_make_gsubr ("%after-gc-thunk", 0, 0, 0,
1023 after_gc_async_thunk),
1024 SCM_BOOL_F);
1025
1026 scm_c_hook_add (&scm_before_gc_c_hook, queue_after_gc_hook, NULL, 0);
1027 scm_c_hook_add (&scm_before_gc_c_hook, start_gc_timer, NULL, 0);
1028 scm_c_hook_add (&scm_after_gc_c_hook, accumulate_gc_timer, NULL, 0);
1029
1030 #if HAVE_GC_GET_HEAP_USAGE_SAFE
1031 /* GC_get_heap_usage does not take a lock, and so can run in the GC
1032 start hook. */
1033 scm_c_hook_add (&scm_before_gc_c_hook, adjust_gc_frequency, NULL, 0);
1034 #else
1035 /* GC_get_heap_usage might take a lock (and did from 7.2alpha1 to
1036 7.2alpha7), so call it in the after_gc_hook. */
1037 scm_c_hook_add (&scm_after_gc_c_hook, adjust_gc_frequency, NULL, 0);
1038 #endif
1039
1040 #ifdef HAVE_GC_SET_START_CALLBACK
1041 GC_set_start_callback (run_before_gc_c_hook);
1042 #endif
1043
1044 #include "libguile/gc.x"
1045 }
1046
1047
1048 void
1049 scm_gc_sweep (void)
1050 #define FUNC_NAME "scm_gc_sweep"
1051 {
1052 /* FIXME */
1053 fprintf (stderr, "%s: doing nothing\n", FUNC_NAME);
1054 }
1055 #undef FUNC_NAME
1056
1057 /*
1058 Local Variables:
1059 c-file-style: "gnu"
1060 End:
1061 */