Merge remote-tracking branch 'origin/stable-2.0'
[bpt/guile.git] / libguile / gc.c
1 /* Copyright (C) 1995,1996,1997,1998,1999,2000,2001, 2002, 2003, 2006, 2008, 2009, 2010, 2011 Free Software Foundation, Inc.
2 *
3 * This library is free software; you can redistribute it and/or
4 * modify it under the terms of the GNU Lesser General Public License
5 * as published by the Free Software Foundation; either version 3 of
6 * the License, or (at your option) any later version.
7 *
8 * This library is distributed in the hope that it will be useful, but
9 * WITHOUT ANY WARRANTY; without even the implied warranty of
10 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
11 * Lesser General Public License for more details.
12 *
13 * You should have received a copy of the GNU Lesser General Public
14 * License along with this library; if not, write to the Free Software
15 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
16 * 02110-1301 USA
17 */
18
19 /* #define DEBUGINFO */
20
21 #ifdef HAVE_CONFIG_H
22 # include <config.h>
23 #endif
24
25 #include "libguile/gen-scmconfig.h"
26
27 #include <stdio.h>
28 #include <errno.h>
29 #include <string.h>
30 #include <math.h>
31
32 #ifdef __ia64__
33 #include <ucontext.h>
34 extern unsigned long * __libc_ia64_register_backing_store_base;
35 #endif
36
37 #include "libguile/_scm.h"
38 #include "libguile/eval.h"
39 #include "libguile/stime.h"
40 #include "libguile/stackchk.h"
41 #include "libguile/struct.h"
42 #include "libguile/smob.h"
43 #include "libguile/arrays.h"
44 #include "libguile/async.h"
45 #include "libguile/ports.h"
46 #include "libguile/root.h"
47 #include "libguile/strings.h"
48 #include "libguile/vectors.h"
49 #include "libguile/hashtab.h"
50 #include "libguile/tags.h"
51
52 #include "libguile/private-gc.h"
53 #include "libguile/validate.h"
54 #include "libguile/deprecation.h"
55 #include "libguile/gc.h"
56 #include "libguile/dynwind.h"
57
58 #include "libguile/bdw-gc.h"
59
60 /* For GC_set_start_callback. */
61 #include <gc/gc_mark.h>
62
63 #ifdef GUILE_DEBUG_MALLOC
64 #include "libguile/debug-malloc.h"
65 #endif
66
67 #ifdef HAVE_MALLOC_H
68 #include <malloc.h>
69 #endif
70
71 #ifdef HAVE_UNISTD_H
72 #include <unistd.h>
73 #endif
74
75 /* Set this to != 0 if every cell that is accessed shall be checked:
76 */
77 int scm_debug_cell_accesses_p = 0;
78 int scm_expensive_debug_cell_accesses_p = 0;
79
80 /* Set this to 0 if no additional gc's shall be performed, otherwise set it to
81 * the number of cell accesses after which a gc shall be called.
82 */
83 int scm_debug_cells_gc_interval = 0;
84
85 /* Hash table that keeps a reference to objects the user wants to protect from
86 garbage collection. */
87 static SCM scm_protects;
88
89
90 #if (SCM_DEBUG_CELL_ACCESSES == 1)
91
92
93 /*
94
95 Assert that the given object is a valid reference to a valid cell. This
96 test involves to determine whether the object is a cell pointer, whether
97 this pointer actually points into a heap segment and whether the cell
98 pointed to is not a free cell. Further, additional garbage collections may
99 get executed after a user defined number of cell accesses. This helps to
100 find places in the C code where references are dropped for extremely short
101 periods.
102
103 */
104 void
105 scm_i_expensive_validation_check (SCM cell)
106 {
107 /* If desired, perform additional garbage collections after a user
108 * defined number of cell accesses.
109 */
110 if (scm_debug_cells_gc_interval)
111 {
112 static unsigned int counter = 0;
113
114 if (counter != 0)
115 {
116 --counter;
117 }
118 else
119 {
120 counter = scm_debug_cells_gc_interval;
121 scm_gc ();
122 }
123 }
124 }
125
126 /* Whether cell validation is already running. */
127 static int scm_i_cell_validation_already_running = 0;
128
129 void
130 scm_assert_cell_valid (SCM cell)
131 {
132 if (!scm_i_cell_validation_already_running && scm_debug_cell_accesses_p)
133 {
134 scm_i_cell_validation_already_running = 1; /* set to avoid recursion */
135
136 /*
137 During GC, no user-code should be run, and the guile core
138 should use non-protected accessors.
139 */
140 if (scm_gc_running_p)
141 return;
142
143 /*
144 Only scm_in_heap_p and rescanning the heap is wildly
145 expensive.
146 */
147 if (scm_expensive_debug_cell_accesses_p)
148 scm_i_expensive_validation_check (cell);
149
150 scm_i_cell_validation_already_running = 0; /* re-enable */
151 }
152 }
153
154
155
156 SCM_DEFINE (scm_set_debug_cell_accesses_x, "set-debug-cell-accesses!", 1, 0, 0,
157 (SCM flag),
158 "If @var{flag} is @code{#f}, cell access checking is disabled.\n"
159 "If @var{flag} is @code{#t}, cheap cell access checking is enabled,\n"
160 "but no additional calls to garbage collection are issued.\n"
161 "If @var{flag} is a number, strict cell access checking is enabled,\n"
162 "with an additional garbage collection after the given\n"
163 "number of cell accesses.\n"
164 "This procedure only exists when the compile-time flag\n"
165 "@code{SCM_DEBUG_CELL_ACCESSES} was set to 1.")
166 #define FUNC_NAME s_scm_set_debug_cell_accesses_x
167 {
168 if (scm_is_false (flag))
169 {
170 scm_debug_cell_accesses_p = 0;
171 }
172 else if (scm_is_eq (flag, SCM_BOOL_T))
173 {
174 scm_debug_cells_gc_interval = 0;
175 scm_debug_cell_accesses_p = 1;
176 scm_expensive_debug_cell_accesses_p = 0;
177 }
178 else
179 {
180 scm_debug_cells_gc_interval = scm_to_signed_integer (flag, 0, INT_MAX);
181 scm_debug_cell_accesses_p = 1;
182 scm_expensive_debug_cell_accesses_p = 1;
183 }
184 return SCM_UNSPECIFIED;
185 }
186 #undef FUNC_NAME
187
188
189 #endif /* SCM_DEBUG_CELL_ACCESSES == 1 */
190
191 \f
192
193 /* Compatibility. */
194
195 #ifndef HAVE_GC_GET_HEAP_USAGE_SAFE
196 static void
197 GC_get_heap_usage_safe (GC_word *pheap_size, GC_word *pfree_bytes,
198 GC_word *punmapped_bytes, GC_word *pbytes_since_gc,
199 GC_word *ptotal_bytes)
200 {
201 *pheap_size = GC_get_heap_size ();
202 *pfree_bytes = GC_get_free_bytes ();
203 #ifdef HAVE_GC_GET_UNMAPPED_BYTES
204 *punmapped_bytes = GC_get_unmapped_bytes ();
205 #else
206 *punmapped_bytes = 0;
207 #endif
208 *pbytes_since_gc = GC_get_bytes_since_gc ();
209 *ptotal_bytes = GC_get_total_bytes ();
210 }
211 #endif
212
213 #ifndef HAVE_GC_GET_FREE_SPACE_DIVISOR
214 static GC_word
215 GC_get_free_space_divisor (void)
216 {
217 return GC_free_space_divisor;
218 }
219 #endif
220
221 \f
222 /* Hooks. */
223 scm_t_c_hook scm_before_gc_c_hook;
224 scm_t_c_hook scm_before_mark_c_hook;
225 scm_t_c_hook scm_before_sweep_c_hook;
226 scm_t_c_hook scm_after_sweep_c_hook;
227 scm_t_c_hook scm_after_gc_c_hook;
228
229
230 static void
231 run_before_gc_c_hook (void)
232 {
233 scm_c_hook_run (&scm_before_gc_c_hook, NULL);
234 }
235
236
237 /* GC Statistics Keeping
238 */
239 unsigned long scm_gc_ports_collected = 0;
240 static long gc_time_taken = 0;
241 static long gc_start_time = 0;
242
243 static unsigned long free_space_divisor;
244 static unsigned long minimum_free_space_divisor;
245 static double target_free_space_divisor;
246
247 static unsigned long protected_obj_count = 0;
248
249
250 SCM_SYMBOL (sym_gc_time_taken, "gc-time-taken");
251 SCM_SYMBOL (sym_heap_size, "heap-size");
252 SCM_SYMBOL (sym_heap_free_size, "heap-free-size");
253 SCM_SYMBOL (sym_heap_total_allocated, "heap-total-allocated");
254 SCM_SYMBOL (sym_heap_allocated_since_gc, "heap-allocated-since-gc");
255 SCM_SYMBOL (sym_protected_objects, "protected-objects");
256 SCM_SYMBOL (sym_times, "gc-times");
257
258
259 /* {Scheme Interface to GC}
260 */
261 static SCM
262 tag_table_to_type_alist (void *closure, SCM key, SCM val, SCM acc)
263 {
264 if (scm_is_integer (key))
265 {
266 int c_tag = scm_to_int (key);
267
268 char const * name = scm_i_tag_name (c_tag);
269 if (name != NULL)
270 {
271 key = scm_from_locale_string (name);
272 }
273 else
274 {
275 char s[100];
276 sprintf (s, "tag %d", c_tag);
277 key = scm_from_locale_string (s);
278 }
279 }
280
281 return scm_cons (scm_cons (key, val), acc);
282 }
283
284 SCM_DEFINE (scm_gc_live_object_stats, "gc-live-object-stats", 0, 0, 0,
285 (),
286 "Return an alist of statistics of the current live objects. ")
287 #define FUNC_NAME s_scm_gc_live_object_stats
288 {
289 SCM tab = scm_make_hash_table (scm_from_int (57));
290 SCM alist;
291
292 alist
293 = scm_internal_hash_fold (&tag_table_to_type_alist, NULL, SCM_EOL, tab);
294
295 return alist;
296 }
297 #undef FUNC_NAME
298
299 extern int scm_gc_malloc_yield_percentage;
300 SCM_DEFINE (scm_gc_stats, "gc-stats", 0, 0, 0,
301 (),
302 "Return an association list of statistics about Guile's current\n"
303 "use of storage.\n")
304 #define FUNC_NAME s_scm_gc_stats
305 {
306 SCM answer;
307 GC_word heap_size, free_bytes, unmapped_bytes, bytes_since_gc, total_bytes;
308 size_t gc_times;
309
310 GC_get_heap_usage_safe (&heap_size, &free_bytes, &unmapped_bytes,
311 &bytes_since_gc, &total_bytes);
312 gc_times = GC_gc_no;
313
314 answer =
315 scm_list_n (scm_cons (sym_gc_time_taken, scm_from_long (gc_time_taken)),
316 scm_cons (sym_heap_size, scm_from_size_t (heap_size)),
317 scm_cons (sym_heap_free_size, scm_from_size_t (free_bytes)),
318 scm_cons (sym_heap_total_allocated,
319 scm_from_size_t (total_bytes)),
320 scm_cons (sym_heap_allocated_since_gc,
321 scm_from_size_t (bytes_since_gc)),
322 scm_cons (sym_protected_objects,
323 scm_from_ulong (protected_obj_count)),
324 scm_cons (sym_times, scm_from_size_t (gc_times)),
325 SCM_UNDEFINED);
326
327 return answer;
328 }
329 #undef FUNC_NAME
330
331
332 SCM_DEFINE (scm_gc_dump, "gc-dump", 0, 0, 0,
333 (void),
334 "Dump information about the garbage collector's internal data "
335 "structures and memory usage to the standard output.")
336 #define FUNC_NAME s_scm_gc_dump
337 {
338 GC_dump ();
339
340 return SCM_UNSPECIFIED;
341 }
342 #undef FUNC_NAME
343
344
345 SCM_DEFINE (scm_object_address, "object-address", 1, 0, 0,
346 (SCM obj),
347 "Return an integer that for the lifetime of @var{obj} is uniquely\n"
348 "returned by this function for @var{obj}")
349 #define FUNC_NAME s_scm_object_address
350 {
351 return scm_from_ulong (SCM_UNPACK (obj));
352 }
353 #undef FUNC_NAME
354
355
356 SCM_DEFINE (scm_gc_disable, "gc-disable", 0, 0, 0,
357 (),
358 "Disables the garbage collector. Nested calls are permitted. "
359 "GC is re-enabled once @code{gc-enable} has been called the "
360 "same number of times @code{gc-disable} was called.")
361 #define FUNC_NAME s_scm_gc_disable
362 {
363 GC_disable ();
364 return SCM_UNSPECIFIED;
365 }
366 #undef FUNC_NAME
367
368 SCM_DEFINE (scm_gc_enable, "gc-enable", 0, 0, 0,
369 (),
370 "Enables the garbage collector.")
371 #define FUNC_NAME s_scm_gc_enable
372 {
373 GC_enable ();
374 return SCM_UNSPECIFIED;
375 }
376 #undef FUNC_NAME
377
378
379 SCM_DEFINE (scm_gc, "gc", 0, 0, 0,
380 (),
381 "Scans all of SCM objects and reclaims for further use those that are\n"
382 "no longer accessible.")
383 #define FUNC_NAME s_scm_gc
384 {
385 scm_i_gc ("call");
386 return SCM_UNSPECIFIED;
387 }
388 #undef FUNC_NAME
389
390 void
391 scm_i_gc (const char *what)
392 {
393 #ifndef HAVE_GC_SET_START_CALLBACK
394 run_before_gc_c_hook ();
395 #endif
396 GC_gcollect ();
397 }
398
399
400 \f
401 /* {GC Protection Helper Functions}
402 */
403
404
405 /*
406 * If within a function you need to protect one or more scheme objects from
407 * garbage collection, pass them as parameters to one of the
408 * scm_remember_upto_here* functions below. These functions don't do
409 * anything, but since the compiler does not know that they are actually
410 * no-ops, it will generate code that calls these functions with the given
411 * parameters. Therefore, you can be sure that the compiler will keep those
412 * scheme values alive (on the stack or in a register) up to the point where
413 * scm_remember_upto_here* is called. In other words, place the call to
414 * scm_remember_upto_here* _behind_ the last code in your function, that
415 * depends on the scheme object to exist.
416 *
417 * Example: We want to make sure that the string object str does not get
418 * garbage collected during the execution of 'some_function' in the code
419 * below, because otherwise the characters belonging to str would be freed and
420 * 'some_function' might access freed memory. To make sure that the compiler
421 * keeps str alive on the stack or in a register such that it is visible to
422 * the conservative gc we add the call to scm_remember_upto_here_1 _after_ the
423 * call to 'some_function'. Note that this would not be necessary if str was
424 * used anyway after the call to 'some_function'.
425 * char *chars = scm_i_string_chars (str);
426 * some_function (chars);
427 * scm_remember_upto_here_1 (str); // str will be alive up to this point.
428 */
429
430 /* Remove any macro versions of these while defining the functions.
431 Functions are always included in the library, for upward binary
432 compatibility and in case combinations of GCC and non-GCC are used. */
433 #undef scm_remember_upto_here_1
434 #undef scm_remember_upto_here_2
435
436 void
437 scm_remember_upto_here_1 (SCM obj SCM_UNUSED)
438 {
439 /* Empty. Protects a single object from garbage collection. */
440 }
441
442 void
443 scm_remember_upto_here_2 (SCM obj1 SCM_UNUSED, SCM obj2 SCM_UNUSED)
444 {
445 /* Empty. Protects two objects from garbage collection. */
446 }
447
448 void
449 scm_remember_upto_here (SCM obj SCM_UNUSED, ...)
450 {
451 /* Empty. Protects any number of objects from garbage collection. */
452 }
453
454 /*
455 These crazy functions prevent garbage collection
456 of arguments after the first argument by
457 ensuring they remain live throughout the
458 function because they are used in the last
459 line of the code block.
460 It'd be better to have a nice compiler hint to
461 aid the conservative stack-scanning GC. --03/09/00 gjb */
462 SCM
463 scm_return_first (SCM elt, ...)
464 {
465 return elt;
466 }
467
468 int
469 scm_return_first_int (int i, ...)
470 {
471 return i;
472 }
473
474
475 SCM
476 scm_permanent_object (SCM obj)
477 {
478 return (scm_gc_protect_object (obj));
479 }
480
481
482 /* Protect OBJ from the garbage collector. OBJ will not be freed, even if all
483 other references are dropped, until the object is unprotected by calling
484 scm_gc_unprotect_object (OBJ). Calls to scm_gc_protect/unprotect_object nest,
485 i. e. it is possible to protect the same object several times, but it is
486 necessary to unprotect the object the same number of times to actually get
487 the object unprotected. It is an error to unprotect an object more often
488 than it has been protected before. The function scm_protect_object returns
489 OBJ.
490 */
491
492 /* Implementation note: For every object X, there is a counter which
493 scm_gc_protect_object (X) increments and scm_gc_unprotect_object (X) decrements.
494 */
495
496
497
498 SCM
499 scm_gc_protect_object (SCM obj)
500 {
501 SCM handle;
502
503 /* This critical section barrier will be replaced by a mutex. */
504 /* njrev: Indeed; if my comment above is correct, there is the same
505 critsec/mutex inconsistency here. */
506 SCM_CRITICAL_SECTION_START;
507
508 handle = scm_hashq_create_handle_x (scm_protects, obj, scm_from_int (0));
509 SCM_SETCDR (handle, scm_sum (SCM_CDR (handle), scm_from_int (1)));
510
511 protected_obj_count ++;
512
513 SCM_CRITICAL_SECTION_END;
514
515 return obj;
516 }
517
518
519 /* Remove any protection for OBJ established by a prior call to
520 scm_protect_object. This function returns OBJ.
521
522 See scm_protect_object for more information. */
523 SCM
524 scm_gc_unprotect_object (SCM obj)
525 {
526 SCM handle;
527
528 /* This critical section barrier will be replaced by a mutex. */
529 /* njrev: and again. */
530 SCM_CRITICAL_SECTION_START;
531
532 if (scm_gc_running_p)
533 {
534 fprintf (stderr, "scm_unprotect_object called during GC.\n");
535 abort ();
536 }
537
538 handle = scm_hashq_get_handle (scm_protects, obj);
539
540 if (scm_is_false (handle))
541 {
542 fprintf (stderr, "scm_unprotect_object called on unprotected object\n");
543 abort ();
544 }
545 else
546 {
547 SCM count = scm_difference (SCM_CDR (handle), scm_from_int (1));
548 if (scm_is_eq (count, scm_from_int (0)))
549 scm_hashq_remove_x (scm_protects, obj);
550 else
551 SCM_SETCDR (handle, count);
552 }
553 protected_obj_count --;
554
555 SCM_CRITICAL_SECTION_END;
556
557 return obj;
558 }
559
560 void
561 scm_gc_register_root (SCM *p)
562 {
563 /* Nothing. */
564 }
565
566 void
567 scm_gc_unregister_root (SCM *p)
568 {
569 /* Nothing. */
570 }
571
572 void
573 scm_gc_register_roots (SCM *b, unsigned long n)
574 {
575 SCM *p = b;
576 for (; p < b + n; ++p)
577 scm_gc_register_root (p);
578 }
579
580 void
581 scm_gc_unregister_roots (SCM *b, unsigned long n)
582 {
583 SCM *p = b;
584 for (; p < b + n; ++p)
585 scm_gc_unregister_root (p);
586 }
587
588 \f
589
590
591 /*
592 MOVE THIS FUNCTION. IT DOES NOT HAVE ANYTHING TODO WITH GC.
593 */
594
595 /* Get an integer from an environment variable. */
596 int
597 scm_getenv_int (const char *var, int def)
598 {
599 char *end = 0;
600 char *val = getenv (var);
601 long res = def;
602 if (!val)
603 return def;
604 res = strtol (val, &end, 10);
605 if (end == val)
606 return def;
607 return res;
608 }
609
610 void
611 scm_storage_prehistory ()
612 {
613 GC_all_interior_pointers = 0;
614 free_space_divisor = scm_getenv_int ("GC_FREE_SPACE_DIVISOR", 3);
615 minimum_free_space_divisor = free_space_divisor;
616 target_free_space_divisor = free_space_divisor;
617 GC_set_free_space_divisor (free_space_divisor);
618
619 GC_INIT ();
620
621 #if (! ((defined GC_VERSION_MAJOR) && (GC_VERSION_MAJOR >= 7))) \
622 && (defined SCM_I_GSC_USE_PTHREAD_THREADS)
623 /* When using GC 6.8, this call is required to initialize thread-local
624 freelists (shouldn't be necessary with GC 7.0). */
625 GC_init ();
626 #endif
627
628 GC_expand_hp (SCM_DEFAULT_INIT_HEAP_SIZE_2);
629
630 /* We only need to register a displacement for those types for which the
631 higher bits of the type tag are used to store a pointer (that is, a
632 pointer to an 8-octet aligned region). For `scm_tc3_struct', this is
633 handled in `scm_alloc_struct ()'. */
634 GC_REGISTER_DISPLACEMENT (scm_tc3_cons);
635 /* GC_REGISTER_DISPLACEMENT (scm_tc3_unused); */
636
637 /* Sanity check. */
638 if (!GC_is_visible (&scm_protects))
639 abort ();
640
641 scm_c_hook_init (&scm_before_gc_c_hook, 0, SCM_C_HOOK_NORMAL);
642 scm_c_hook_init (&scm_before_mark_c_hook, 0, SCM_C_HOOK_NORMAL);
643 scm_c_hook_init (&scm_before_sweep_c_hook, 0, SCM_C_HOOK_NORMAL);
644 scm_c_hook_init (&scm_after_sweep_c_hook, 0, SCM_C_HOOK_NORMAL);
645 scm_c_hook_init (&scm_after_gc_c_hook, 0, SCM_C_HOOK_NORMAL);
646 }
647
648 scm_i_pthread_mutex_t scm_i_gc_admin_mutex = SCM_I_PTHREAD_MUTEX_INITIALIZER;
649
650 void
651 scm_init_gc_protect_object ()
652 {
653 scm_protects = scm_c_make_hash_table (31);
654
655 #if 0
656 /* We can't have a cleanup handler since we have no thread to run it
657 in. */
658
659 #ifdef HAVE_ATEXIT
660 atexit (cleanup);
661 #else
662 #ifdef HAVE_ON_EXIT
663 on_exit (cleanup, 0);
664 #endif
665 #endif
666
667 #endif
668 }
669
670 \f
671
672 SCM scm_after_gc_hook;
673
674 static SCM after_gc_async_cell;
675
676 /* The function after_gc_async_thunk causes the execution of the
677 * after-gc-hook. It is run after the gc, as soon as the asynchronous
678 * events are handled by the evaluator.
679 */
680 static SCM
681 after_gc_async_thunk (void)
682 {
683 /* Fun, no? Hook-run *and* run-hook? */
684 scm_c_hook_run (&scm_after_gc_c_hook, NULL);
685 scm_c_run_hook (scm_after_gc_hook, SCM_EOL);
686 return SCM_UNSPECIFIED;
687 }
688
689
690 /* The function queue_after_gc_hook is run by the scm_before_gc_c_hook
691 * at the end of the garbage collection. The only purpose of this
692 * function is to mark the after_gc_async (which will eventually lead to
693 * the execution of the after_gc_async_thunk).
694 */
695 static void *
696 queue_after_gc_hook (void * hook_data SCM_UNUSED,
697 void *fn_data SCM_UNUSED,
698 void *data SCM_UNUSED)
699 {
700 /* If cell access debugging is enabled, the user may choose to perform
701 * additional garbage collections after an arbitrary number of cell
702 * accesses. We don't want the scheme level after-gc-hook to be performed
703 * for each of these garbage collections for the following reason: The
704 * execution of the after-gc-hook causes cell accesses itself. Thus, if the
705 * after-gc-hook was performed with every gc, and if the gc was performed
706 * after a very small number of cell accesses, then the number of cell
707 * accesses during the execution of the after-gc-hook will suffice to cause
708 * the execution of the next gc. Then, guile would keep executing the
709 * after-gc-hook over and over again, and would never come to do other
710 * things.
711 *
712 * To overcome this problem, if cell access debugging with additional
713 * garbage collections is enabled, the after-gc-hook is never run by the
714 * garbage collecter. When running guile with cell access debugging and the
715 * execution of the after-gc-hook is desired, then it is necessary to run
716 * the hook explicitly from the user code. This has the effect, that from
717 * the scheme level point of view it seems that garbage collection is
718 * performed with a much lower frequency than it actually is. Obviously,
719 * this will not work for code that depends on a fixed one to one
720 * relationship between the execution counts of the C level garbage
721 * collection hooks and the execution count of the scheme level
722 * after-gc-hook.
723 */
724
725 #if (SCM_DEBUG_CELL_ACCESSES == 1)
726 if (scm_debug_cells_gc_interval == 0)
727 #endif
728 {
729 scm_i_thread *t = SCM_I_CURRENT_THREAD;
730
731 if (scm_is_false (SCM_CDR (after_gc_async_cell)))
732 {
733 SCM_SETCDR (after_gc_async_cell, t->active_asyncs);
734 t->active_asyncs = after_gc_async_cell;
735 t->pending_asyncs = 1;
736 }
737 }
738
739 return NULL;
740 }
741
742 \f
743
744 static void *
745 start_gc_timer (void * hook_data SCM_UNUSED,
746 void *fn_data SCM_UNUSED,
747 void *data SCM_UNUSED)
748 {
749 if (!gc_start_time)
750 gc_start_time = scm_c_get_internal_run_time ();
751
752 return NULL;
753 }
754
755 static void *
756 accumulate_gc_timer (void * hook_data SCM_UNUSED,
757 void *fn_data SCM_UNUSED,
758 void *data SCM_UNUSED)
759 {
760 if (gc_start_time)
761 {
762 long now = scm_c_get_internal_run_time ();
763 gc_time_taken += now - gc_start_time;
764 gc_start_time = 0;
765 }
766
767 return NULL;
768 }
769
770 /* Return some idea of the memory footprint of a process, in bytes.
771 Currently only works on Linux systems. */
772 static size_t
773 get_image_size (void)
774 {
775 unsigned long size, resident, share;
776 size_t ret = 0;
777
778 FILE *fp = fopen ("/proc/self/statm", "r");
779
780 if (fp && fscanf (fp, "%lu %lu %lu", &size, &resident, &share) == 3)
781 ret = resident * 4096;
782
783 if (fp)
784 fclose (fp);
785
786 return ret;
787 }
788
789 /* These are discussed later. */
790 static size_t bytes_until_gc;
791 static scm_i_pthread_mutex_t bytes_until_gc_lock = SCM_I_PTHREAD_MUTEX_INITIALIZER;
792
793 /* Make GC run more frequently when the process image size is growing,
794 measured against the number of bytes allocated through the GC.
795
796 If Guile is allocating at a GC-managed heap size H, libgc will tend
797 to limit the process image size to H*N. But if at the same time the
798 user program is mallocating at a rate M bytes per GC-allocated byte,
799 then the process stabilizes at H*N*M -- assuming that collecting data
800 will result in malloc'd data being freed. It doesn't take a very
801 large M for this to be a bad situation. To limit the image size,
802 Guile should GC more often -- the bigger the M, the more often.
803
804 Numeric functions that produce bigger and bigger integers are
805 pessimal, because M is an increasing function of time. Here is an
806 example of such a function:
807
808 (define (factorial n)
809 (define (fac n acc)
810 (if (<= n 1)
811 acc
812 (fac (1- n) (* n acc))))
813 (fac n 1))
814
815 It is possible for a process to grow for reasons that will not be
816 solved by faster GC. In that case M will be estimated as
817 artificially high for a while, and so GC will happen more often on
818 the Guile side. But when it stabilizes, Guile can ease back the GC
819 frequency.
820
821 The key is to measure process image growth, not mallocation rate.
822 For maximum effectiveness, Guile reacts quickly to process growth,
823 and exponentially backs down when the process stops growing.
824
825 See http://thread.gmane.org/gmane.lisp.guile.devel/12552/focus=12936
826 for further discussion.
827 */
828 static void *
829 adjust_gc_frequency (void * hook_data SCM_UNUSED,
830 void *fn_data SCM_UNUSED,
831 void *data SCM_UNUSED)
832 {
833 static size_t prev_image_size = 0;
834 static size_t prev_bytes_alloced = 0;
835 size_t image_size;
836 size_t bytes_alloced;
837
838 scm_i_pthread_mutex_lock (&bytes_until_gc_lock);
839 bytes_until_gc = GC_get_heap_size ();
840 scm_i_pthread_mutex_unlock (&bytes_until_gc_lock);
841
842 image_size = get_image_size ();
843 bytes_alloced = GC_get_total_bytes ();
844
845 #define HEURISTICS_DEBUG 0
846
847 #if HEURISTICS_DEBUG
848 fprintf (stderr, "prev image / alloced: %lu / %lu\n", prev_image_size, prev_bytes_alloced);
849 fprintf (stderr, " image / alloced: %lu / %lu\n", image_size, bytes_alloced);
850 fprintf (stderr, "divisor %lu / %f\n", free_space_divisor, target_free_space_divisor);
851 #endif
852
853 if (prev_image_size && bytes_alloced != prev_bytes_alloced)
854 {
855 double growth_rate, new_target_free_space_divisor;
856 double decay_factor = 0.5;
857 double hysteresis = 0.1;
858
859 growth_rate = ((double) image_size - prev_image_size)
860 / ((double)bytes_alloced - prev_bytes_alloced);
861
862 #if HEURISTICS_DEBUG
863 fprintf (stderr, "growth rate %f\n", growth_rate);
864 #endif
865
866 new_target_free_space_divisor = minimum_free_space_divisor;
867
868 if (growth_rate > 0)
869 new_target_free_space_divisor *= 1.0 + growth_rate;
870
871 #if HEURISTICS_DEBUG
872 fprintf (stderr, "new divisor %f\n", new_target_free_space_divisor);
873 #endif
874
875 if (new_target_free_space_divisor < target_free_space_divisor)
876 /* Decay down. */
877 target_free_space_divisor =
878 (decay_factor * target_free_space_divisor
879 + (1.0 - decay_factor) * new_target_free_space_divisor);
880 else
881 /* Jump up. */
882 target_free_space_divisor = new_target_free_space_divisor;
883
884 #if HEURISTICS_DEBUG
885 fprintf (stderr, "new target divisor %f\n", target_free_space_divisor);
886 #endif
887
888 if (free_space_divisor + 0.5 + hysteresis < target_free_space_divisor
889 || free_space_divisor - 0.5 - hysteresis > target_free_space_divisor)
890 {
891 free_space_divisor = lround (target_free_space_divisor);
892 #if HEURISTICS_DEBUG
893 fprintf (stderr, "new divisor %lu\n", free_space_divisor);
894 #endif
895 GC_set_free_space_divisor (free_space_divisor);
896 }
897 }
898
899 prev_image_size = image_size;
900 prev_bytes_alloced = bytes_alloced;
901
902 return NULL;
903 }
904
905 /* The adjust_gc_frequency routine handles transients in the process
906 image size. It can't handle instense non-GC-managed steady-state
907 allocation though, as it decays the FSD at steady-state down to its
908 minimum value.
909
910 The only real way to handle continuous, high non-GC allocation is to
911 let the GC know about it. This routine can handle non-GC allocation
912 rates that are similar in size to the GC-managed heap size.
913 */
914
915 void
916 scm_gc_register_allocation (size_t size)
917 {
918 scm_i_pthread_mutex_lock (&bytes_until_gc_lock);
919 if (bytes_until_gc - size > bytes_until_gc)
920 {
921 bytes_until_gc = GC_get_heap_size ();
922 scm_i_pthread_mutex_unlock (&bytes_until_gc_lock);
923 GC_gcollect ();
924 }
925 else
926 {
927 bytes_until_gc -= size;
928 scm_i_pthread_mutex_unlock (&bytes_until_gc_lock);
929 }
930 }
931
932
933 \f
934
935 char const *
936 scm_i_tag_name (scm_t_bits tag)
937 {
938 switch (tag & 0x7f) /* 7 bits */
939 {
940 case scm_tcs_struct:
941 return "struct";
942 case scm_tcs_cons_imcar:
943 return "cons (immediate car)";
944 case scm_tcs_cons_nimcar:
945 return "cons (non-immediate car)";
946 case scm_tc7_pointer:
947 return "foreign";
948 case scm_tc7_hashtable:
949 return "hashtable";
950 case scm_tc7_weak_set:
951 return "weak-set";
952 case scm_tc7_weak_table:
953 return "weak-table";
954 case scm_tc7_fluid:
955 return "fluid";
956 case scm_tc7_dynamic_state:
957 return "dynamic state";
958 case scm_tc7_frame:
959 return "frame";
960 case scm_tc7_objcode:
961 return "objcode";
962 case scm_tc7_vm:
963 return "vm";
964 case scm_tc7_vm_cont:
965 return "vm continuation";
966 case scm_tc7_wvect:
967 return "weak vector";
968 case scm_tc7_vector:
969 return "vector";
970 case scm_tc7_number:
971 switch (tag)
972 {
973 case scm_tc16_real:
974 return "real";
975 break;
976 case scm_tc16_big:
977 return "bignum";
978 break;
979 case scm_tc16_complex:
980 return "complex number";
981 break;
982 case scm_tc16_fraction:
983 return "fraction";
984 break;
985 }
986 break;
987 case scm_tc7_string:
988 return "string";
989 break;
990 case scm_tc7_stringbuf:
991 return "string buffer";
992 break;
993 case scm_tc7_symbol:
994 return "symbol";
995 break;
996 case scm_tc7_variable:
997 return "variable";
998 break;
999 case scm_tc7_port:
1000 return "port";
1001 break;
1002 case scm_tc7_smob:
1003 {
1004 int k = 0xff & (tag >> 8);
1005 return (scm_smobs[k].name);
1006 }
1007 break;
1008 }
1009
1010 return NULL;
1011 }
1012
1013
1014
1015 \f
1016 void
1017 scm_init_gc ()
1018 {
1019 /* `GC_INIT ()' was invoked in `scm_storage_prehistory ()'. */
1020
1021 scm_after_gc_hook = scm_make_hook (SCM_INUM0);
1022 scm_c_define ("after-gc-hook", scm_after_gc_hook);
1023
1024 /* When the async is to run, the cdr of the gc_async pair gets set to
1025 the asyncs queue of the current thread. */
1026 after_gc_async_cell = scm_cons (scm_c_make_gsubr ("%after-gc-thunk", 0, 0, 0,
1027 after_gc_async_thunk),
1028 SCM_BOOL_F);
1029
1030 scm_c_hook_add (&scm_before_gc_c_hook, queue_after_gc_hook, NULL, 0);
1031 scm_c_hook_add (&scm_before_gc_c_hook, start_gc_timer, NULL, 0);
1032 scm_c_hook_add (&scm_after_gc_c_hook, accumulate_gc_timer, NULL, 0);
1033
1034 #if HAVE_GC_GET_HEAP_USAGE_SAFE
1035 /* GC_get_heap_usage does not take a lock, and so can run in the GC
1036 start hook. */
1037 scm_c_hook_add (&scm_before_gc_c_hook, adjust_gc_frequency, NULL, 0);
1038 #else
1039 /* GC_get_heap_usage might take a lock (and did from 7.2alpha1 to
1040 7.2alpha7), so call it in the after_gc_hook. */
1041 scm_c_hook_add (&scm_after_gc_c_hook, adjust_gc_frequency, NULL, 0);
1042 #endif
1043
1044 #ifdef HAVE_GC_SET_START_CALLBACK
1045 GC_set_start_callback (run_before_gc_c_hook);
1046 #endif
1047
1048 #include "libguile/gc.x"
1049 }
1050
1051
1052 void
1053 scm_gc_sweep (void)
1054 #define FUNC_NAME "scm_gc_sweep"
1055 {
1056 /* FIXME */
1057 fprintf (stderr, "%s: doing nothing\n", FUNC_NAME);
1058 }
1059 #undef FUNC_NAME
1060
1061 /*
1062 Local Variables:
1063 c-file-style: "gnu"
1064 End:
1065 */