Merge commit 'fb7dd00169304a5922838e4d2f25253640a35def'
[bpt/guile.git] / libguile / print.c
1 /* Copyright (C) 1995-1999, 2000, 2001, 2002, 2003, 2004, 2006, 2008,
2 * 2009, 2010, 2011, 2012, 2013, 2014 Free Software Foundation, Inc.
3 *
4 * This library is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU Lesser General Public License
6 * as published by the Free Software Foundation; either version 3 of
7 * the License, or (at your option) any later version.
8 *
9 * This library is distributed in the hope that it will be useful, but
10 * WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 * Lesser General Public License for more details.
13 *
14 * You should have received a copy of the GNU Lesser General Public
15 * License along with this library; if not, write to the Free Software
16 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
17 * 02110-1301 USA
18 */
19
20
21 \f
22 #ifdef HAVE_CONFIG_H
23 # include <config.h>
24 #endif
25
26 #include <errno.h>
27 #include <iconv.h>
28 #include <stdio.h>
29 #include <assert.h>
30
31 #include <uniconv.h>
32 #include <unictype.h>
33
34 #include "libguile/_scm.h"
35 #include "libguile/chars.h"
36 #include "libguile/continuations.h"
37 #include "libguile/smob.h"
38 #include "libguile/control.h"
39 #include "libguile/eval.h"
40 #include "libguile/macros.h"
41 #include "libguile/procprop.h"
42 #include "libguile/read.h"
43 #include "libguile/programs.h"
44 #include "libguile/alist.h"
45 #include "libguile/struct.h"
46 #include "libguile/ports.h"
47 #include "libguile/ports-internal.h"
48 #include "libguile/root.h"
49 #include "libguile/strings.h"
50 #include "libguile/strports.h"
51 #include "libguile/vectors.h"
52 #include "libguile/numbers.h"
53 #include "libguile/vm.h"
54
55 #include "libguile/validate.h"
56 #include "libguile/print.h"
57
58 #include "libguile/private-options.h"
59
60 \f
61
62 /* Character printers. */
63
/* Expand to the `ilseq_handler' field of PORT's port-table entry, i.e.
   the failed-conversion strategy the printers in this file pass to
   `display_string' and `display_character'.  The expansion is wrapped in
   parentheses so that it always behaves as a single expression,
   whatever operators surround the use site.  */
#define PORT_CONVERSION_HANDLER(port) \
  (SCM_PTAB_ENTRY (port)->ilseq_handler)
66
/* Forward declarations of the character and string printers that are
   used by the symbol and object printers before their definitions.  */

/* Arguments, in order: the codepoints, a narrow-string flag, the number
   of codepoints, the output port and the failed-conversion strategy.
   Returns the number of codepoints displayed.  */
static size_t display_string (const void *, int, size_t, SCM,
                              scm_t_string_failed_conversion_handler);

/* Displays a single codepoint; returns non-zero on success.  */
static int display_character (scm_t_wchar, SCM,
                              scm_t_string_failed_conversion_handler);

/* NOTE(review): the definition is not visible in this part of the file;
   callers pass the character, the port, and 1 when the character is
   part of a string being written, 0 otherwise.  */
static void write_character (scm_t_wchar, SCM, int);

/* Arguments, in order: the codepoint, a flag selecting the in-string
   escape syntax, and the output port.  */
static void write_character_escaped (scm_t_wchar, int, SCM);
76
77 \f
78
79 /* {Names of immediate symbols}
80 *
81 * This table must agree with the declarations in scm.h: {Immediate Symbols}.
82 */
83
/* Printed representation of each immediate flag, indexed by flag
   number.  This table must agree with the list of flags in tags.h.

   Both the strings and the array of pointers are `const': the table is
   never modified at run time, so the whole object can live in read-only
   storage.  */
static const char *const iflagnames[] =
{
  "#f",
  "#nil",  /* Elisp nil value. Should print from elisp as symbol `nil'. */
  "#<XXX UNUSED LISP FALSE -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
  "()",
  "#t",
  "#<XXX UNUSED BOOLEAN 0 -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
  "#<XXX UNUSED BOOLEAN 1 -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
  "#<XXX UNUSED BOOLEAN 2 -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
  "#<unspecified>",
  "#<undefined>",
  "#<eof>",

  /* Unbound slot marker for GOOPS.  For internal use in GOOPS only.  */
  "#<unbound>",
};
102
/* The symbol `reader'.  `quote_keywordish_symbols' compares the
   `quote-keywordish-symbols' option against it.  */
SCM_SYMBOL (sym_reader, "reader");

/* Table of print options handed to `scm_options' by the
   `print-options-interface' procedure.  Each entry lists the option
   kind, the option name, an initial value and a documentation string;
   the final `{ 0 }' entry terminates the table.  */
scm_t_option scm_print_opts[] = {
  { SCM_OPTION_SCM, "highlight-prefix", (scm_t_bits)SCM_BOOL_F_BITS,
    "The string to print before highlighted values." },
  { SCM_OPTION_SCM, "highlight-suffix", (scm_t_bits)SCM_BOOL_F_BITS,
    "The string to print after highlighted values." },
  { SCM_OPTION_SCM, "quote-keywordish-symbols", (scm_t_bits)SCM_BOOL_F_BITS,
    "How to print symbols that have a colon as their first or last character. "
    "The value '#f' does not quote the colons; '#t' quotes them; "
    "'reader' quotes them when the reader option 'keywords' is not '#f'." },
  { SCM_OPTION_BOOLEAN, "escape-newlines", 1,
    "Render newlines as \\n when printing using `write'." },
  { SCM_OPTION_BOOLEAN, "r7rs-symbols", 0,
    "Escape symbols using R7RS |...| symbol notation." },
  { 0 },
};
120
121 SCM_DEFINE (scm_print_options, "print-options-interface", 0, 1, 0,
122 (SCM setting),
123 "Option interface for the print options. Instead of using\n"
124 "this procedure directly, use the procedures\n"
125 "@code{print-enable}, @code{print-disable}, @code{print-set!}\n"
126 "and @code{print-options}.")
127 #define FUNC_NAME s_scm_print_options
128 {
129 SCM ans = scm_options (setting,
130 scm_print_opts,
131 FUNC_NAME);
132 return ans;
133 }
134 #undef FUNC_NAME
135
136 \f
137 /* {Printing of Scheme Objects}
138 */
139
/* Detection of circular references.
 *
 * Due to other constraints in the implementation, this code has bad
 * time complexity (O (depth * N)).  The printer code could be
 * rewritten to be O (N).
 */
/* Push OBJ on top of PSTATE's reference stack, then grow the stack with
   `grow_ref_stack' if it has just become full.

   PSTATE is evaluated several times, so it must have no side effects.
   Every argument is parenthesized in the expansion so that arbitrary
   expressions can be passed safely.  */
#define PUSH_REF(pstate, obj) \
  do \
    { \
      PSTATE_STACK_SET ((pstate), (pstate)->top, (obj)); \
      (pstate)->top++; \
      if ((pstate)->top == (pstate)->ceiling) \
        grow_ref_stack ((pstate)); \
    } \
  while (0)
154
/* Called before printing the contents of the compound object OBJ.

   - If OBJ is already on PSTATE's reference stack, jump to LABEL (the
     caller's circular-reference handler).
   - Otherwise, if PSTATE is in fancy mode and the nesting depth
     (`top - list_offset') has reached `level', print `#' and RETURN
     from the enclosing function.
   - Otherwise push OBJ on the reference stack.

   The expansion relies on a variable named `port' being in scope at the
   use site, and may only be used inside a function returning `void'.
   PSTATE and OBJ are evaluated several times.  The loop index has a
   name of its own so that it cannot capture an `i' appearing in the
   caller's OBJ expression.  */
#define ENTER_NESTED_DATA(pstate, obj, label) \
  do \
    { \
      unsigned long nested_idx; \
      for (nested_idx = 0; nested_idx < (pstate)->top; ++nested_idx) \
        if (scm_is_eq (PSTATE_STACK_REF ((pstate), nested_idx), (obj))) \
          goto label; \
      if ((pstate)->fancyp) \
        { \
          if ((pstate)->top - (pstate)->list_offset >= (pstate)->level) \
            { \
              scm_putc_unlocked ('#', port); \
              return; \
            } \
        } \
      PUSH_REF ((pstate), (obj)); \
    } \
  while (0)
172
/* Undo the push done by ENTER_NESTED_DATA: pop the top of PSTATE's
   reference stack and overwrite the vacated slot with SCM_UNDEFINED.
   PSTATE is evaluated several times and is parenthesized in the
   expansion.  */
#define EXIT_NESTED_DATA(pstate) \
  do \
    { \
      --(pstate)->top; \
      PSTATE_STACK_SET ((pstate), (pstate)->top, SCM_UNDEFINED); \
    } \
  while (0)
180
/* Vtable passed to `scm_make_struct' when a print state is created.
   It starts out as #f -- NOTE(review): presumably assigned during
   initialization elsewhere in this file; confirm.  */
SCM scm_print_state_vtable = SCM_BOOL_F;
/* List of print states that are currently unused and can be handed out
   again.  */
static SCM print_state_pool = SCM_EOL;
/* Taken by the allocation and release paths in this file while they
   update `print_state_pool'.  */
scm_i_pthread_mutex_t print_state_mutex = SCM_I_PTHREAD_MUTEX_INITIALIZER;
184
#ifdef GUILE_DEBUG /* Used for debugging purposes */

/* Debugging aid: expose the first pooled print state, or #f when the
   pool is empty.  The pool is read without taking the pool mutex.  */
SCM_DEFINE (scm_current_pstate, "current-pstate", 0, 0, 0,
            (),
            "Return the current-pstate -- the car of the\n"
            "@code{print_state_pool}. @code{current-pstate} is only\n"
            "included in @code{--enable-guile-debug} builds.")
#define FUNC_NAME s_scm_current_pstate
{
  return scm_is_null (print_state_pool)
    ? SCM_BOOL_F
    : SCM_CAR (print_state_pool);
}
#undef FUNC_NAME

#endif
202
203 #define PSTATE_SIZE 50L
204
205 static SCM
206 make_print_state (void)
207 {
208 SCM print_state
209 = scm_make_struct (scm_print_state_vtable, SCM_INUM0, SCM_EOL);
210 scm_print_state *pstate = SCM_PRINT_STATE (print_state);
211 pstate->ref_vect = scm_c_make_vector (PSTATE_SIZE, SCM_UNDEFINED);
212 pstate->ceiling = SCM_SIMPLE_VECTOR_LENGTH (pstate->ref_vect);
213 pstate->highlight_objects = SCM_EOL;
214 return print_state;
215 }
216
217 SCM
218 scm_make_print_state ()
219 {
220 SCM answer = SCM_BOOL_F;
221
222 /* First try to allocate a print state from the pool */
223 scm_i_pthread_mutex_lock (&print_state_mutex);
224 if (!scm_is_null (print_state_pool))
225 {
226 answer = SCM_CAR (print_state_pool);
227 print_state_pool = SCM_CDR (print_state_pool);
228 }
229 scm_i_pthread_mutex_unlock (&print_state_mutex);
230
231 return scm_is_false (answer) ? make_print_state () : answer;
232 }
233
234 void
235 scm_free_print_state (SCM print_state)
236 {
237 SCM handle;
238 scm_print_state *pstate = SCM_PRINT_STATE (print_state);
239 /* Cleanup before returning print state to pool.
240 * It is better to do it here. Doing it in scm_prin1
241 * would cost more since that function is called much more
242 * often.
243 */
244 pstate->fancyp = 0;
245 pstate->revealed = 0;
246 pstate->highlight_objects = SCM_EOL;
247 scm_i_pthread_mutex_lock (&print_state_mutex);
248 handle = scm_cons (print_state, print_state_pool);
249 print_state_pool = handle;
250 scm_i_pthread_mutex_unlock (&print_state_mutex);
251 }
252
253 SCM
254 scm_i_port_with_print_state (SCM port, SCM print_state)
255 {
256 if (SCM_UNBNDP (print_state))
257 {
258 if (SCM_PORT_WITH_PS_P (port))
259 return port;
260 else
261 print_state = scm_make_print_state ();
262 /* port does not need to be coerced since it doesn't have ps */
263 }
264 else
265 port = SCM_COERCE_OUTPORT (port);
266 SCM_RETURN_NEWSMOB (scm_tc16_port_with_ps,
267 SCM_UNPACK (scm_cons (port, print_state)));
268 }
269
270 static void
271 grow_ref_stack (scm_print_state *pstate)
272 {
273 SCM old_vect = pstate->ref_vect;
274 size_t old_size = SCM_SIMPLE_VECTOR_LENGTH (old_vect);
275 size_t new_size = 2 * pstate->ceiling;
276 SCM new_vect = scm_c_make_vector (new_size, SCM_UNDEFINED);
277 unsigned long int i;
278
279 for (i = 0; i != old_size; ++i)
280 SCM_SIMPLE_VECTOR_SET (new_vect, i, SCM_SIMPLE_VECTOR_REF (old_vect, i));
281
282 pstate->ref_vect = new_vect;
283 pstate->ceiling = new_size;
284 }
285
/* Read, respectively write, slot I of the reference stack (`ref_vect')
   of the print state P.  */
#define PSTATE_STACK_REF(p,i)   SCM_SIMPLE_VECTOR_REF((p)->ref_vect, (i))
#define PSTATE_STACK_SET(p,i,v) SCM_SIMPLE_VECTOR_SET((p)->ref_vect, (i), (v))
288
289 static void
290 print_circref (SCM port, scm_print_state *pstate, SCM ref)
291 {
292 register long i;
293 long self = pstate->top - 1;
294 i = pstate->top - 1;
295 if (scm_is_pair (PSTATE_STACK_REF (pstate, i)))
296 {
297 while (i > 0)
298 {
299 if (!scm_is_pair (PSTATE_STACK_REF (pstate, i-1))
300 || !scm_is_eq (SCM_CDR (PSTATE_STACK_REF (pstate, i-1)),
301 SCM_CDR (PSTATE_STACK_REF (pstate, i))))
302 break;
303 --i;
304 }
305 self = i;
306 }
307 for (i = pstate->top - 1; 1; --i)
308 if (scm_is_eq (PSTATE_STACK_REF(pstate, i), ref))
309 break;
310 scm_putc_unlocked ('#', port);
311 scm_intprint (i - self, 10, port);
312 scm_putc_unlocked ('#', port);
313 }
314
315 /* Print the name of a symbol. */
316
317 static int
318 quote_keywordish_symbols (void)
319 {
320 SCM option = SCM_PRINT_KEYWORD_STYLE;
321
322 if (scm_is_false (option))
323 return 0;
324 if (scm_is_eq (option, sym_reader))
325 return scm_is_true (SCM_PACK (SCM_KEYWORD_STYLE));
326 return 1;
327 }
328
/* Unicode general categories that `symbol_has_extended_read_syntax'
   accepts for the first character of a symbol printed as a bare
   identifier.  */
#define INITIAL_IDENTIFIER_MASK                                      \
  (UC_CATEGORY_MASK_Lu | UC_CATEGORY_MASK_Ll | UC_CATEGORY_MASK_Lt   \
   | UC_CATEGORY_MASK_Lm | UC_CATEGORY_MASK_Lo | UC_CATEGORY_MASK_Mn \
   | UC_CATEGORY_MASK_Nl | UC_CATEGORY_MASK_No | UC_CATEGORY_MASK_Pd \
   | UC_CATEGORY_MASK_Pc | UC_CATEGORY_MASK_Po | UC_CATEGORY_MASK_Sc \
   | UC_CATEGORY_MASK_Sm | UC_CATEGORY_MASK_Sk | UC_CATEGORY_MASK_So \
   | UC_CATEGORY_MASK_Co)

/* Categories accepted for the second and later characters: everything
   allowed initially, plus decimal digits (Nd) and the spacing and
   enclosing marks (Mc, Me).  */
#define SUBSEQUENT_IDENTIFIER_MASK                                    \
  (INITIAL_IDENTIFIER_MASK                                            \
   | UC_CATEGORY_MASK_Nd | UC_CATEGORY_MASK_Mc | UC_CATEGORY_MASK_Me)
340
341 /* FIXME: Cache this information on the symbol, somehow. */
342 static int
343 symbol_has_extended_read_syntax (SCM sym)
344 {
345 size_t pos, len = scm_i_symbol_length (sym);
346 scm_t_wchar c;
347
348 /* The empty symbol. */
349 if (len == 0)
350 return 1;
351
352 c = scm_i_symbol_ref (sym, 0);
353
354 switch (c)
355 {
356 case '\'':
357 case '`':
358 case ',':
359 case '"':
360 case ';':
361 case '#':
362 /* Some initial-character constraints. */
363 return 1;
364
365 case '|':
366 case '\\':
367 /* R7RS allows neither '|' nor '\' in bare symbols. */
368 if (SCM_PRINT_R7RS_SYMBOLS_P)
369 return 1;
370 break;
371
372 case ':':
373 /* Symbols that look like keywords. */
374 return quote_keywordish_symbols ();
375
376 case '.':
377 /* Single dot conflicts with dotted-pair notation. */
378 if (len == 1)
379 return 1;
380 /* Fall through to check numbers. */
381 case '+':
382 case '-':
383 case '0':
384 case '1':
385 case '2':
386 case '3':
387 case '4':
388 case '5':
389 case '6':
390 case '7':
391 case '8':
392 case '9':
393 /* Number-ish symbols. Numbers with radixes already caught be #
394 above. */
395 if (scm_is_true (scm_i_string_to_number (scm_symbol_to_string (sym), 10)))
396 return 1;
397 break;
398
399 default:
400 break;
401 }
402
403 /* Other disallowed first characters. */
404 if (!uc_is_general_category_withtable (c, INITIAL_IDENTIFIER_MASK))
405 return 1;
406
407 /* Keywords can be identified by trailing colons too. */
408 if (scm_i_symbol_ref (sym, len - 1) == ':')
409 return quote_keywordish_symbols ();
410
411 /* Otherwise, any character that's in the identifier category mask is
412 fine to pass through as-is, provided it's not one of the ASCII
413 delimiters like `;'. */
414 for (pos = 1; pos < len; pos++)
415 {
416 c = scm_i_symbol_ref (sym, pos);
417 if (!uc_is_general_category_withtable (c, SUBSEQUENT_IDENTIFIER_MASK))
418 return 1;
419 else if (c == '"' || c == ';' || c == '#')
420 return 1;
421 else if ((c == '|' || c == '\\') && SCM_PRINT_R7RS_SYMBOLS_P)
422 /* R7RS allows neither '|' nor '\' in bare symbols. */
423 return 1;
424 }
425
426 return 0;
427 }
428
429 static void
430 print_normal_symbol (SCM sym, SCM port)
431 {
432 size_t len;
433 scm_t_string_failed_conversion_handler strategy;
434
435 len = scm_i_symbol_length (sym);
436 strategy = SCM_PTAB_ENTRY (port)->ilseq_handler;
437
438 if (scm_i_is_narrow_symbol (sym))
439 display_string (scm_i_symbol_chars (sym), 1, len, port, strategy);
440 else
441 display_string (scm_i_symbol_wide_chars (sym), 0, len, port, strategy);
442 }
443
444 static void
445 print_extended_symbol (SCM sym, SCM port)
446 {
447 size_t pos, len;
448 scm_t_string_failed_conversion_handler strategy;
449
450 len = scm_i_symbol_length (sym);
451 strategy = PORT_CONVERSION_HANDLER (port);
452
453 scm_lfwrite_unlocked ("#{", 2, port);
454
455 for (pos = 0; pos < len; pos++)
456 {
457 scm_t_wchar c = scm_i_symbol_ref (sym, pos);
458
459 if (uc_is_general_category_withtable (c,
460 SUBSEQUENT_IDENTIFIER_MASK
461 | UC_CATEGORY_MASK_Zs))
462 {
463 if (!display_character (c, port, strategy)
464 || (c == '\\' && !display_character (c, port, strategy)))
465 scm_encoding_error ("print_extended_symbol", errno,
466 "cannot convert to output locale",
467 port, SCM_MAKE_CHAR (c));
468 }
469 else
470 {
471 scm_lfwrite_unlocked ("\\x", 2, port);
472 scm_intprint (c, 16, port);
473 scm_putc_unlocked (';', port);
474 }
475 }
476
477 scm_lfwrite_unlocked ("}#", 2, port);
478 }
479
480 static void
481 print_r7rs_extended_symbol (SCM sym, SCM port)
482 {
483 size_t pos, len;
484 scm_t_string_failed_conversion_handler strategy;
485
486 len = scm_i_symbol_length (sym);
487 strategy = PORT_CONVERSION_HANDLER (port);
488
489 scm_putc_unlocked ('|', port);
490
491 for (pos = 0; pos < len; pos++)
492 {
493 scm_t_wchar c = scm_i_symbol_ref (sym, pos);
494
495 switch (c)
496 {
497 case '\a': scm_lfwrite_unlocked ("\\a", 2, port); break;
498 case '\b': scm_lfwrite_unlocked ("\\b", 2, port); break;
499 case '\t': scm_lfwrite_unlocked ("\\t", 2, port); break;
500 case '\n': scm_lfwrite_unlocked ("\\n", 2, port); break;
501 case '\r': scm_lfwrite_unlocked ("\\r", 2, port); break;
502 case '|': scm_lfwrite_unlocked ("\\|", 2, port); break;
503 case '\\': scm_lfwrite_unlocked ("\\x5c;", 5, port); break;
504 default:
505 if (uc_is_general_category_withtable (c,
506 UC_CATEGORY_MASK_L
507 | UC_CATEGORY_MASK_M
508 | UC_CATEGORY_MASK_N
509 | UC_CATEGORY_MASK_P
510 | UC_CATEGORY_MASK_S)
511 || (c == ' '))
512 {
513 if (!display_character (c, port, strategy))
514 scm_encoding_error ("print_r7rs_extended_symbol", errno,
515 "cannot convert to output locale",
516 port, SCM_MAKE_CHAR (c));
517 }
518 else
519 {
520 scm_lfwrite_unlocked ("\\x", 2, port);
521 scm_intprint (c, 16, port);
522 scm_putc_unlocked (';', port);
523 }
524 break;
525 }
526 }
527
528 scm_putc_unlocked ('|', port);
529 }
530
531 /* FIXME: allow R6RS hex escapes instead of #{...}# or |...|. */
532 static void
533 print_symbol (SCM sym, SCM port)
534 {
535 if (!symbol_has_extended_read_syntax (sym))
536 print_normal_symbol (sym, port);
537 else if (SCM_PRINT_R7RS_SYMBOLS_P)
538 print_r7rs_extended_symbol (sym, port);
539 else
540 print_extended_symbol (sym, port);
541 }
542
543 void
544 scm_print_symbol_name (const char *str, size_t len, SCM port)
545 {
546 SCM symbol = scm_from_utf8_symboln (str, len);
547 print_symbol (symbol, port);
548 }
549
/* Print generally.  Handles both write and display according to PSTATE.
 */

/* Declarations for the `write' and `display' procedures.  The last
   macro argument names the variable (`g_write', `g_display') that
   `iprin1' calls to print GOOPS instances.  */
SCM_GPROC(s_write, "write", 1, 1, 0, scm_write, g_write);
SCM_GPROC(s_display, "display", 1, 1, 0, scm_display, g_display);

/* The object printer proper; `scm_iprin1' wraps it to add
   highlighting.  */
static void iprin1 (SCM exp, SCM port, scm_print_state *pstate);
556
557
/* Print the number I on PORT as the digits of a character escape: `x'
   followed by I in hexadecimal when R6RS escapes are enabled, I in
   octal otherwise.  */
#define PRINT_CHAR_ESCAPE(i, port) \
  do \
    { \
      if (SCM_R6RS_ESCAPES_P) \
        { \
          scm_puts_unlocked ("x", port); \
          scm_intprint (i, 16, port); \
        } \
      else \
        scm_intprint (i, 8, port); \
    } \
  while (0)
571
572
573 void
574 scm_iprin1 (SCM exp, SCM port, scm_print_state *pstate)
575 {
576 if (pstate->fancyp
577 && scm_is_true (scm_memq (exp, pstate->highlight_objects)))
578 {
579 scm_display (SCM_PRINT_HIGHLIGHT_PREFIX, port);
580 iprin1 (exp, port, pstate);
581 scm_display (SCM_PRINT_HIGHLIGHT_SUFFIX, port);
582 }
583 else
584 iprin1 (exp, port, pstate);
585 }
586
587 static void
588 iprin1 (SCM exp, SCM port, scm_print_state *pstate)
589 {
590 switch (SCM_ITAG3 (exp))
591 {
592 case scm_tc3_tc7_1:
593 case scm_tc3_tc7_2:
594 /* These tc3 tags should never occur in an immediate value. They are
595 * only used in cell types of non-immediates, i. e. the value returned
596 * by SCM_CELL_TYPE (exp) can use these tags.
597 */
598 scm_ipruk ("immediate", exp, port);
599 break;
600 case scm_tc3_int_1:
601 case scm_tc3_int_2:
602 scm_intprint (SCM_I_INUM (exp), 10, port);
603 break;
604 case scm_tc3_imm24:
605 if (SCM_CHARP (exp))
606 {
607 if (SCM_WRITINGP (pstate))
608 write_character (SCM_CHAR (exp), port, 0);
609 else
610 {
611 if (!display_character (SCM_CHAR (exp), port,
612 PORT_CONVERSION_HANDLER (port)))
613 scm_encoding_error (__func__, errno,
614 "cannot convert to output locale",
615 port, exp);
616 }
617 }
618 else if (SCM_IFLAGP (exp)
619 && ((size_t) SCM_IFLAGNUM (exp) < (sizeof iflagnames / sizeof (char *))))
620 {
621 scm_puts_unlocked (iflagnames [SCM_IFLAGNUM (exp)], port);
622 }
623 else
624 {
625 /* unknown immediate value */
626 scm_ipruk ("immediate", exp, port);
627 }
628 break;
629 case scm_tc3_cons:
630 switch (SCM_TYP7 (exp))
631 {
632 case scm_tcs_struct:
633 {
634 ENTER_NESTED_DATA (pstate, exp, circref);
635 if (SCM_OBJ_CLASS_FLAGS (exp) & SCM_CLASSF_GOOPS)
636 {
637 SCM pwps, print = pstate->writingp ? g_write : g_display;
638 if (SCM_UNPACK (print) == 0)
639 goto print_struct;
640 pwps = scm_i_port_with_print_state (port, pstate->handle);
641 pstate->revealed = 1;
642 scm_call_2 (print, exp, pwps);
643 }
644 else
645 {
646 print_struct:
647 scm_print_struct (exp, port, pstate);
648 }
649 EXIT_NESTED_DATA (pstate);
650 }
651 break;
652 case scm_tcs_cons_imcar:
653 case scm_tcs_cons_nimcar:
654 ENTER_NESTED_DATA (pstate, exp, circref);
655 scm_iprlist ("(", exp, ')', port, pstate);
656 EXIT_NESTED_DATA (pstate);
657 break;
658 circref:
659 print_circref (port, pstate, exp);
660 break;
661 case scm_tc7_number:
662 switch SCM_TYP16 (exp) {
663 case scm_tc16_big:
664 scm_bigprint (exp, port, pstate);
665 break;
666 case scm_tc16_real:
667 scm_print_real (exp, port, pstate);
668 break;
669 case scm_tc16_complex:
670 scm_print_complex (exp, port, pstate);
671 break;
672 case scm_tc16_fraction:
673 scm_i_print_fraction (exp, port, pstate);
674 break;
675 }
676 break;
677 case scm_tc7_stringbuf:
678 scm_i_print_stringbuf (exp, port, pstate);
679 break;
680 case scm_tc7_string:
681 if (SCM_WRITINGP (pstate))
682 {
683 size_t len, i;
684
685 display_character ('"', port, iconveh_question_mark);
686 len = scm_i_string_length (exp);
687 for (i = 0; i < len; ++i)
688 write_character (scm_i_string_ref (exp, i), port, 1);
689
690 display_character ('"', port, iconveh_question_mark);
691 scm_remember_upto_here_1 (exp);
692 }
693 else
694 {
695 size_t len, printed;
696
697 len = scm_i_string_length (exp);
698 printed = display_string (scm_i_string_data (exp),
699 scm_i_is_narrow_string (exp),
700 len, port,
701 PORT_CONVERSION_HANDLER (port));
702 if (SCM_UNLIKELY (printed < len))
703 scm_encoding_error (__func__, errno,
704 "cannot convert to output locale",
705 port, scm_c_string_ref (exp, printed));
706 }
707
708 scm_remember_upto_here_1 (exp);
709 break;
710 case scm_tc7_symbol:
711 if (scm_i_symbol_is_interned (exp))
712 {
713 print_symbol (exp, port);
714 scm_remember_upto_here_1 (exp);
715 }
716 else
717 {
718 scm_puts_unlocked ("#<uninterned-symbol ", port);
719 print_symbol (exp, port);
720 scm_putc_unlocked (' ', port);
721 scm_uintprint (SCM_UNPACK (exp), 16, port);
722 scm_putc_unlocked ('>', port);
723 }
724 break;
725 case scm_tc7_variable:
726 scm_i_variable_print (exp, port, pstate);
727 break;
728 case scm_tc7_program:
729 scm_i_program_print (exp, port, pstate);
730 break;
731 case scm_tc7_pointer:
732 scm_i_pointer_print (exp, port, pstate);
733 break;
734 case scm_tc7_hashtable:
735 scm_i_hashtable_print (exp, port, pstate);
736 break;
737 case scm_tc7_weak_set:
738 scm_i_weak_set_print (exp, port, pstate);
739 break;
740 case scm_tc7_weak_table:
741 scm_i_weak_table_print (exp, port, pstate);
742 break;
743 case scm_tc7_fluid:
744 scm_i_fluid_print (exp, port, pstate);
745 break;
746 case scm_tc7_dynamic_state:
747 scm_i_dynamic_state_print (exp, port, pstate);
748 break;
749 case scm_tc7_frame:
750 scm_i_frame_print (exp, port, pstate);
751 break;
752 case scm_tc7_vm_cont:
753 scm_i_vm_cont_print (exp, port, pstate);
754 break;
755 case scm_tc7_array:
756 ENTER_NESTED_DATA (pstate, exp, circref);
757 scm_i_print_array (exp, port, pstate);
758 EXIT_NESTED_DATA (pstate);
759 break;
760 case scm_tc7_bytevector:
761 scm_i_print_bytevector (exp, port, pstate);
762 break;
763 case scm_tc7_bitvector:
764 scm_i_print_bitvector (exp, port, pstate);
765 break;
766 case scm_tc7_wvect:
767 ENTER_NESTED_DATA (pstate, exp, circref);
768 scm_puts_unlocked ("#w(", port);
769 goto common_vector_printer;
770 case scm_tc7_vector:
771 ENTER_NESTED_DATA (pstate, exp, circref);
772 scm_puts_unlocked ("#(", port);
773 common_vector_printer:
774 {
775 register long i;
776 long last = SCM_SIMPLE_VECTOR_LENGTH (exp) - 1;
777 int cutp = 0;
778 if (pstate->fancyp
779 && SCM_SIMPLE_VECTOR_LENGTH (exp) > pstate->length)
780 {
781 last = pstate->length - 1;
782 cutp = 1;
783 }
784 for (i = 0; i < last; ++i)
785 {
786 scm_iprin1 (scm_c_vector_ref (exp, i), port, pstate);
787 scm_putc_unlocked (' ', port);
788 }
789 if (i == last)
790 {
791 /* CHECK_INTS; */
792 scm_iprin1 (scm_c_vector_ref (exp, i), port, pstate);
793 }
794 if (cutp)
795 scm_puts_unlocked (" ...", port);
796 scm_putc_unlocked (')', port);
797 }
798 EXIT_NESTED_DATA (pstate);
799 break;
800 case scm_tc7_port:
801 {
802 scm_t_ptob_descriptor *ptob = SCM_PORT_DESCRIPTOR (exp);
803 if (ptob->print && ptob->print (exp, port, pstate))
804 break;
805 goto punk;
806 }
807 case scm_tc7_smob:
808 ENTER_NESTED_DATA (pstate, exp, circref);
809 SCM_SMOB_DESCRIPTOR (exp).print (exp, port, pstate);
810 EXIT_NESTED_DATA (pstate);
811 break;
812 default:
813 /* case scm_tcs_closures: */
814 punk:
815 scm_ipruk ("type", exp, port);
816 }
817 }
818 }
819
820 /* Print states are necessary for circular reference safe printing.
821 * They are also expensive to allocate. Therefore print states are
822 * kept in a pool so that they can be reused.
823 */
824
825 /* The PORT argument can also be a print-state/port pair, which will
826 * then be used instead of allocating a new print state. This is
827 * useful for continuing a chain of print calls from Scheme. */
828
829 void
830 scm_prin1 (SCM exp, SCM port, int writingp)
831 {
832 SCM handle = SCM_BOOL_F; /* Will GC protect the handle whilst unlinked */
833 SCM pstate_scm;
834 scm_print_state *pstate;
835 int old_writingp;
836
837 /* If PORT is a print-state/port pair, use that. Else create a new
838 print-state. */
839
840 if (SCM_PORT_WITH_PS_P (port))
841 {
842 pstate_scm = SCM_PORT_WITH_PS_PS (port);
843 port = SCM_PORT_WITH_PS_PORT (port);
844 }
845 else
846 {
847 /* First try to allocate a print state from the pool */
848 scm_i_pthread_mutex_lock (&print_state_mutex);
849 if (!scm_is_null (print_state_pool))
850 {
851 handle = print_state_pool;
852 print_state_pool = SCM_CDR (print_state_pool);
853 }
854 scm_i_pthread_mutex_unlock (&print_state_mutex);
855 if (scm_is_false (handle))
856 handle = scm_list_1 (make_print_state ());
857 pstate_scm = SCM_CAR (handle);
858 }
859
860 pstate = SCM_PRINT_STATE (pstate_scm);
861 old_writingp = pstate->writingp;
862 pstate->writingp = writingp;
863 scm_iprin1 (exp, port, pstate);
864 pstate->writingp = old_writingp;
865
866 /* Return print state to pool if it has been created above and
867 hasn't escaped to Scheme. */
868
869 if (scm_is_true (handle) && !pstate->revealed)
870 {
871 scm_i_pthread_mutex_lock (&print_state_mutex);
872 SCM_SETCDR (handle, print_state_pool);
873 print_state_pool = handle;
874 scm_i_pthread_mutex_unlock (&print_state_mutex);
875 }
876 }
877
878 /* Convert codepoint CH to UTF-8 and store the result in UTF8. Return
879 the number of bytes of the UTF-8-encoded string. */
880 static size_t
881 codepoint_to_utf8 (scm_t_wchar ch, scm_t_uint8 utf8[4])
882 {
883 size_t len;
884 scm_t_uint32 codepoint;
885
886 codepoint = (scm_t_uint32) ch;
887
888 if (codepoint <= 0x7f)
889 {
890 len = 1;
891 utf8[0] = (scm_t_uint8) codepoint;
892 }
893 else if (codepoint <= 0x7ffUL)
894 {
895 len = 2;
896 utf8[0] = 0xc0 | (codepoint >> 6);
897 utf8[1] = 0x80 | (codepoint & 0x3f);
898 }
899 else if (codepoint <= 0xffffUL)
900 {
901 len = 3;
902 utf8[0] = 0xe0 | (codepoint >> 12);
903 utf8[1] = 0x80 | ((codepoint >> 6) & 0x3f);
904 utf8[2] = 0x80 | (codepoint & 0x3f);
905 }
906 else
907 {
908 len = 4;
909 utf8[0] = 0xf0 | (codepoint >> 18);
910 utf8[1] = 0x80 | ((codepoint >> 12) & 0x3f);
911 utf8[2] = 0x80 | ((codepoint >> 6) & 0x3f);
912 utf8[3] = 0x80 | (codepoint & 0x3f);
913 }
914
915 return len;
916 }
917
/* Fetch codepoint number X of the string data S.  The expansion reads a
   variable named `narrow_p' that must be in scope at the use site: when
   it is non-zero S is indexed as an array of `unsigned char', otherwise
   as an array of `scm_t_wchar'.  */
#define STR_REF(s, x)                           \
  (narrow_p                                     \
   ? (scm_t_wchar) ((unsigned char *) (s))[x]   \
   : ((scm_t_wchar *) (s))[x])
922
923 /* Write STR to PORT as UTF-8. STR is a LEN-codepoint string; it is
924 narrow if NARROW_P is true, wide otherwise. Return LEN. */
925 static size_t
926 display_string_as_utf8 (const void *str, int narrow_p, size_t len,
927 SCM port)
928 {
929 size_t printed = 0;
930
931 while (len > printed)
932 {
933 size_t utf8_len, i;
934 char *input, utf8_buf[256];
935
936 /* Convert STR to UTF-8. */
937 for (i = printed, utf8_len = 0, input = utf8_buf;
938 i < len && utf8_len + 4 < sizeof (utf8_buf);
939 i++)
940 {
941 utf8_len += codepoint_to_utf8 (STR_REF (str, i),
942 (scm_t_uint8 *) input);
943 input = utf8_buf + utf8_len;
944 }
945
946 /* INPUT was successfully converted, entirely; print the
947 result. */
948 scm_lfwrite_unlocked (utf8_buf, utf8_len, port);
949 printed += i - printed;
950 }
951
952 assert (printed == len);
953
954 return len;
955 }
956
957 /* Write STR to PORT as ISO-8859-1. STR is a LEN-codepoint string; it
958 is narrow if NARROW_P is true, wide otherwise. Return LEN. */
959 static size_t
960 display_string_as_latin1 (const void *str, int narrow_p, size_t len,
961 SCM port,
962 scm_t_string_failed_conversion_handler strategy)
963 {
964 size_t printed = 0;
965
966 if (narrow_p)
967 {
968 scm_lfwrite_unlocked (str, len, port);
969 return len;
970 }
971
972 while (printed < len)
973 {
974 char buf[256];
975 size_t i;
976
977 for (i = 0; i < sizeof(buf) && printed < len; i++, printed++)
978 {
979 scm_t_wchar c = STR_REF (str, printed);
980
981 if (c < 256)
982 buf[i] = c;
983 else
984 break;
985 }
986
987 scm_lfwrite_unlocked (buf, i, port);
988
989 if (i < sizeof(buf) && printed < len)
990 {
991 if (strategy == SCM_FAILED_CONVERSION_ERROR)
992 break;
993 else if (strategy == SCM_FAILED_CONVERSION_ESCAPE_SEQUENCE)
994 write_character_escaped (STR_REF (str, printed), 1, port);
995 else
996 /* STRATEGY is `SCM_FAILED_CONVERSION_QUESTION_MARK'. */
997 display_string ("?", 1, 1, port, strategy);
998 printed++;
999 }
1000 }
1001
1002 return printed;
1003 }
1004
1005 /* Convert STR through PORT's output conversion descriptor and write the
1006 output to PORT. Return the number of codepoints written. */
1007 static size_t
1008 display_string_using_iconv (const void *str, int narrow_p, size_t len,
1009 SCM port,
1010 scm_t_string_failed_conversion_handler strategy)
1011 {
1012 size_t printed;
1013 scm_t_iconv_descriptors *id;
1014 scm_t_port_internal *pti = SCM_PORT_GET_INTERNAL (port);
1015
1016 id = scm_i_port_iconv_descriptors (port, SCM_PORT_WRITE);
1017
1018 if (SCM_UNLIKELY (pti->at_stream_start_for_bom_write && len > 0))
1019 {
1020 scm_t_port *pt = SCM_PTAB_ENTRY (port);
1021
1022 /* Record that we're no longer at stream start. */
1023 pti->at_stream_start_for_bom_write = 0;
1024 if (pt->rw_random)
1025 pti->at_stream_start_for_bom_read = 0;
1026
1027 /* Write a BOM if appropriate. */
1028 if (SCM_UNLIKELY (strcmp(pt->encoding, "UTF-16") == 0
1029 || strcmp(pt->encoding, "UTF-32") == 0))
1030 display_character (SCM_UNICODE_BOM, port, iconveh_error);
1031 }
1032
1033 printed = 0;
1034
1035 while (len > printed)
1036 {
1037 size_t done, utf8_len, input_left, output_left, i;
1038 size_t codepoints_read, output_len;
1039 char *input, *output;
1040 char utf8_buf[256], encoded_output[256];
1041 size_t offsets[256];
1042
1043 /* Convert STR to UTF-8. */
1044 for (i = printed, utf8_len = 0, input = utf8_buf;
1045 i < len && utf8_len + 4 < sizeof (utf8_buf);
1046 i++)
1047 {
1048 offsets[utf8_len] = i;
1049 utf8_len += codepoint_to_utf8 (STR_REF (str, i),
1050 (scm_t_uint8 *) input);
1051 input = utf8_buf + utf8_len;
1052 }
1053
1054 input = utf8_buf;
1055 input_left = utf8_len;
1056
1057 output = encoded_output;
1058 output_left = sizeof (encoded_output);
1059
1060 done = iconv (id->output_cd, &input, &input_left,
1061 &output, &output_left);
1062
1063 output_len = sizeof (encoded_output) - output_left;
1064
1065 if (SCM_UNLIKELY (done == (size_t) -1))
1066 {
1067 int errno_save = errno;
1068
1069 /* Reset the `iconv' state. */
1070 iconv (id->output_cd, NULL, NULL, NULL, NULL);
1071
1072 /* Print the OUTPUT_LEN bytes successfully converted. */
1073 scm_lfwrite_unlocked (encoded_output, output_len, port);
1074
1075 /* See how many input codepoints these OUTPUT_LEN bytes
1076 corresponds to. */
1077 codepoints_read = offsets[input - utf8_buf] - printed;
1078 printed += codepoints_read;
1079
1080 if (errno_save == EILSEQ &&
1081 strategy != SCM_FAILED_CONVERSION_ERROR)
1082 {
1083 /* Conversion failed somewhere in INPUT and we want to
1084 escape or substitute the offending input character. */
1085
1086 if (strategy == SCM_FAILED_CONVERSION_ESCAPE_SEQUENCE)
1087 {
1088 scm_t_wchar ch;
1089
1090 /* Find CH, the offending codepoint, and escape it. */
1091 ch = STR_REF (str, offsets[input - utf8_buf]);
1092 write_character_escaped (ch, 1, port);
1093 }
1094 else
1095 /* STRATEGY is `SCM_FAILED_CONVERSION_QUESTION_MARK'. */
1096 display_string ("?", 1, 1, port, strategy);
1097
1098 printed++;
1099 }
1100 else
1101 /* Something bad happened that we can't handle: bail out. */
1102 break;
1103 }
1104 else
1105 {
1106 /* INPUT was successfully converted, entirely; print the
1107 result. */
1108 scm_lfwrite_unlocked (encoded_output, output_len, port);
1109 codepoints_read = i - printed;
1110 printed += codepoints_read;
1111 }
1112 }
1113
1114 return printed;
1115 }
1116
1117 #undef STR_REF
1118
1119 /* Display the LEN codepoints in STR to PORT according to STRATEGY;
1120 return the number of codepoints successfully displayed. If NARROW_P,
1121 then STR is interpreted as a sequence of `char', denoting a Latin-1
1122 string; otherwise it's interpreted as a sequence of
1123 `scm_t_wchar'. */
1124 static size_t
1125 display_string (const void *str, int narrow_p,
1126 size_t len, SCM port,
1127 scm_t_string_failed_conversion_handler strategy)
1128 {
1129 scm_t_port_internal *pti;
1130
1131 pti = SCM_PORT_GET_INTERNAL (port);
1132
1133 if (pti->encoding_mode == SCM_PORT_ENCODING_MODE_UTF8)
1134 return display_string_as_utf8 (str, narrow_p, len, port);
1135 else if (pti->encoding_mode == SCM_PORT_ENCODING_MODE_LATIN1)
1136 return display_string_as_latin1 (str, narrow_p, len, port, strategy);
1137 else
1138 return display_string_using_iconv (str, narrow_p, len, port, strategy);
1139 }
1140
1141 /* Attempt to display CH to PORT according to STRATEGY. Return non-zero
1142 if CH was successfully displayed, zero otherwise (e.g., if it was not
1143 representable in PORT's encoding.) */
1144 static int
1145 display_character (scm_t_wchar ch, SCM port,
1146 scm_t_string_failed_conversion_handler strategy)
1147 {
1148 return display_string (&ch, 0, 1, port, strategy) == 1;
1149 }
1150
1151 /* Attempt to pretty-print CH, a combining character, to PORT. Return
1152 zero upon failure, non-zero otherwise. The idea is to print CH above
1153 a dotted circle to make it more visible. */
1154 static int
1155 write_combining_character (scm_t_wchar ch, SCM port)
1156 {
1157 scm_t_wchar str[2];
1158
1159 str[0] = SCM_CODEPOINT_DOTTED_CIRCLE;
1160 str[1] = ch;
1161
1162 return display_string (str, 0, 2, port, iconveh_error) == 2;
1163 }
1164
1165 /* Write CH to PORT in its escaped form, using the string escape syntax
1166 if STRING_ESCAPES_P is non-zero. */
1167 static void
1168 write_character_escaped (scm_t_wchar ch, int string_escapes_p, SCM port)
1169 {
1170 if (string_escapes_p)
1171 {
1172 /* Represent CH using the in-string escape syntax. */
1173
1174 static const char hex[] = "0123456789abcdef";
1175 static const char escapes[7] = "abtnvfr";
1176 char buf[9];
1177
1178 if (ch >= 0x07 && ch <= 0x0D && ch != 0x0A)
1179 {
1180 /* Use special escapes for some C0 controls. */
1181 buf[0] = '\\';
1182 buf[1] = escapes[ch - 0x07];
1183 scm_lfwrite_unlocked (buf, 2, port);
1184 }
1185 else if (!SCM_R6RS_ESCAPES_P)
1186 {
1187 if (ch <= 0xFF)
1188 {
1189 buf[0] = '\\';
1190 buf[1] = 'x';
1191 buf[2] = hex[ch / 16];
1192 buf[3] = hex[ch % 16];
1193 scm_lfwrite_unlocked (buf, 4, port);
1194 }
1195 else if (ch <= 0xFFFF)
1196 {
1197 buf[0] = '\\';
1198 buf[1] = 'u';
1199 buf[2] = hex[(ch & 0xF000) >> 12];
1200 buf[3] = hex[(ch & 0xF00) >> 8];
1201 buf[4] = hex[(ch & 0xF0) >> 4];
1202 buf[5] = hex[(ch & 0xF)];
1203 scm_lfwrite_unlocked (buf, 6, port);
1204 }
1205 else if (ch > 0xFFFF)
1206 {
1207 buf[0] = '\\';
1208 buf[1] = 'U';
1209 buf[2] = hex[(ch & 0xF00000) >> 20];
1210 buf[3] = hex[(ch & 0xF0000) >> 16];
1211 buf[4] = hex[(ch & 0xF000) >> 12];
1212 buf[5] = hex[(ch & 0xF00) >> 8];
1213 buf[6] = hex[(ch & 0xF0) >> 4];
1214 buf[7] = hex[(ch & 0xF)];
1215 scm_lfwrite_unlocked (buf, 8, port);
1216 }
1217 }
1218 else
1219 {
1220 /* Print an R6RS variable-length hex escape: "\xNNNN;". */
1221 scm_t_wchar ch2 = ch;
1222
1223 int i = 8;
1224 buf[i] = ';';
1225 i --;
1226 if (ch == 0)
1227 buf[i--] = '0';
1228 else
1229 while (ch2 > 0)
1230 {
1231 buf[i] = hex[ch2 & 0xF];
1232 ch2 >>= 4;
1233 i --;
1234 }
1235 buf[i] = 'x';
1236 i --;
1237 buf[i] = '\\';
1238 scm_lfwrite_unlocked (buf + i, 9 - i, port);
1239 }
1240 }
1241 else
1242 {
1243 /* Represent CH using the character escape syntax. */
1244 const char *name;
1245
1246 name = scm_i_charname (SCM_MAKE_CHAR (ch));
1247 if (name != NULL)
1248 scm_puts_unlocked (name, port);
1249 else
1250 PRINT_CHAR_ESCAPE (ch, port);
1251 }
1252 }
1253
1254 /* Write CH to PORT, escaping it if it's non-graphic or not
1255 representable in PORT's encoding. If STRING_ESCAPES_P is true and CH
1256 needs to be escaped, it is escaped using the in-string escape syntax;
1257 otherwise the character escape syntax is used. */
1258 static void
1259 write_character (scm_t_wchar ch, SCM port, int string_escapes_p)
1260 {
1261 int printed = 0;
1262 scm_t_string_failed_conversion_handler strategy;
1263
1264 strategy = PORT_CONVERSION_HANDLER (port);
1265
1266 if (string_escapes_p)
1267 {
1268 /* Check if CH deserves special treatment. */
1269 if (ch == '"' || ch == '\\')
1270 {
1271 display_character ('\\', port, iconveh_question_mark);
1272 display_character (ch, port, strategy);
1273 printed = 1;
1274 }
1275 else if (ch == '\n' && SCM_PRINT_ESCAPE_NEWLINES_P)
1276 {
1277 display_character ('\\', port, iconveh_question_mark);
1278 display_character ('n', port, strategy);
1279 printed = 1;
1280 }
1281 else if (ch == ' ' || ch == '\n')
1282 {
1283 display_character (ch, port, strategy);
1284 printed = 1;
1285 }
1286 }
1287 else
1288 {
1289 display_string ("#\\", 1, 2, port, iconveh_question_mark);
1290
1291 if (uc_combining_class (ch) != UC_CCC_NR)
1292 /* Character is a combining character, so attempt to
1293 pretty-print it. */
1294 printed = write_combining_character (ch, port);
1295 }
1296
1297 if (!printed
1298 && uc_is_general_category_withtable (ch,
1299 UC_CATEGORY_MASK_L |
1300 UC_CATEGORY_MASK_M |
1301 UC_CATEGORY_MASK_N |
1302 UC_CATEGORY_MASK_P |
1303 UC_CATEGORY_MASK_S))
1304 /* CH is graphic; attempt to display it. */
1305 printed = display_character (ch, port, iconveh_error);
1306
1307 if (!printed)
1308 /* CH isn't graphic or cannot be represented in PORT's encoding. */
1309 write_character_escaped (ch, string_escapes_p, port);
1310 }
1311
1312 /* Display STR to PORT from START inclusive to END exclusive. */
1313 void
1314 scm_i_display_substring (SCM str, size_t start, size_t end, SCM port)
1315 {
1316 int narrow_p;
1317 const char *buf;
1318 size_t len, printed;
1319
1320 buf = scm_i_string_data (str);
1321 len = end - start;
1322 narrow_p = scm_i_is_narrow_string (str);
1323 buf += start * (narrow_p ? sizeof (char) : sizeof (scm_t_wchar));
1324
1325 printed = display_string (buf, narrow_p, end - start, port,
1326 PORT_CONVERSION_HANDLER (port));
1327
1328 if (SCM_UNLIKELY (printed < len))
1329 scm_encoding_error (__func__, errno,
1330 "cannot convert to output locale",
1331 port, scm_c_string_ref (str, printed + start));
1332 }
1333
1334 \f
1335 /* Print an integer.
1336 */
1337
1338 void
1339 scm_intprint (scm_t_intmax n, int radix, SCM port)
1340 {
1341 char num_buf[SCM_INTBUFLEN];
1342 scm_lfwrite_unlocked (num_buf, scm_iint2str (n, radix, num_buf), port);
1343 }
1344
1345 void
1346 scm_uintprint (scm_t_uintmax n, int radix, SCM port)
1347 {
1348 char num_buf[SCM_INTBUFLEN];
1349 scm_lfwrite_unlocked (num_buf, scm_iuint2str (n, radix, num_buf), port);
1350 }
1351
1352 /* Print an object of unrecognized type.
1353 */
1354
1355 void
1356 scm_ipruk (char *hdr, SCM ptr, SCM port)
1357 {
1358 scm_puts_unlocked ("#<unknown-", port);
1359 scm_puts_unlocked (hdr, port);
1360 if (1) /* (scm_in_heap_p (ptr)) */ /* FIXME */
1361 {
1362 scm_puts_unlocked (" (0x", port);
1363 scm_uintprint (SCM_CELL_WORD_0 (ptr), 16, port);
1364 scm_puts_unlocked (" . 0x", port);
1365 scm_uintprint (SCM_CELL_WORD_1 (ptr), 16, port);
1366 scm_puts_unlocked (") @", port);
1367 }
1368 scm_puts_unlocked (" 0x", port);
1369 scm_uintprint (SCM_UNPACK (ptr), 16, port);
1370 scm_putc_unlocked ('>', port);
1371 }
1372
1373
1374 /* Print a list.
1375 */
1376 void
1377 scm_iprlist (char *hdr, SCM exp, int tlr, SCM port, scm_print_state *pstate)
1378 {
1379 register SCM hare, tortoise;
1380 long floor = pstate->top - 2;
1381 scm_puts_unlocked (hdr, port);
1382 /* CHECK_INTS; */
1383 if (pstate->fancyp)
1384 goto fancy_printing;
1385
1386 /* Run a hare and tortoise so that total time complexity will be
1387 O(depth * N) instead of O(N^2). */
1388 hare = SCM_CDR (exp);
1389 tortoise = exp;
1390 while (scm_is_pair (hare))
1391 {
1392 if (scm_is_eq (hare, tortoise))
1393 goto fancy_printing;
1394 hare = SCM_CDR (hare);
1395 if (!scm_is_pair (hare))
1396 break;
1397 hare = SCM_CDR (hare);
1398 tortoise = SCM_CDR (tortoise);
1399 }
1400
1401 /* No cdr cycles intrinsic to this list */
1402 scm_iprin1 (SCM_CAR (exp), port, pstate);
1403 for (exp = SCM_CDR (exp); scm_is_pair (exp); exp = SCM_CDR (exp))
1404 {
1405 register long i;
1406
1407 for (i = floor; i >= 0; --i)
1408 if (scm_is_eq (PSTATE_STACK_REF(pstate, i), exp))
1409 goto circref;
1410 PUSH_REF (pstate, exp);
1411 scm_putc_unlocked (' ', port);
1412 /* CHECK_INTS; */
1413 scm_iprin1 (SCM_CAR (exp), port, pstate);
1414 }
1415 if (!SCM_NULL_OR_NIL_P (exp))
1416 {
1417 scm_puts_unlocked (" . ", port);
1418 scm_iprin1 (exp, port, pstate);
1419 }
1420
1421 end:
1422 scm_putc_unlocked (tlr, port);
1423 pstate->top = floor + 2;
1424 return;
1425
1426 fancy_printing:
1427 {
1428 long n = pstate->length;
1429
1430 scm_iprin1 (SCM_CAR (exp), port, pstate);
1431 exp = SCM_CDR (exp); --n;
1432 for (; scm_is_pair (exp); exp = SCM_CDR (exp))
1433 {
1434 register unsigned long i;
1435
1436 for (i = 0; i < pstate->top; ++i)
1437 if (scm_is_eq (PSTATE_STACK_REF(pstate, i), exp))
1438 goto fancy_circref;
1439 if (pstate->fancyp)
1440 {
1441 if (n == 0)
1442 {
1443 scm_puts_unlocked (" ...", port);
1444 goto skip_tail;
1445 }
1446 else
1447 --n;
1448 }
1449 PUSH_REF(pstate, exp);
1450 ++pstate->list_offset;
1451 scm_putc_unlocked (' ', port);
1452 /* CHECK_INTS; */
1453 scm_iprin1 (SCM_CAR (exp), port, pstate);
1454 }
1455 }
1456 if (!SCM_NULL_OR_NIL_P (exp))
1457 {
1458 scm_puts_unlocked (" . ", port);
1459 scm_iprin1 (exp, port, pstate);
1460 }
1461 skip_tail:
1462 pstate->list_offset -= pstate->top - floor - 2;
1463 goto end;
1464
1465 fancy_circref:
1466 pstate->list_offset -= pstate->top - floor - 2;
1467
1468 circref:
1469 scm_puts_unlocked (" . ", port);
1470 print_circref (port, pstate, exp);
1471 goto end;
1472 }
1473
1474 \f
1475
1476 int
1477 scm_valid_oport_value_p (SCM val)
1478 {
1479 return (SCM_OPOUTPORTP (val)
1480 || (SCM_PORT_WITH_PS_P (val)
1481 && SCM_OPOUTPORTP (SCM_PORT_WITH_PS_PORT (val))));
1482 }
1483
1484 /* SCM_GPROC(s_write, "write", 1, 1, 0, scm_write, g_write); */
1485
1486 SCM
1487 scm_write (SCM obj, SCM port)
1488 {
1489 if (SCM_UNBNDP (port))
1490 port = scm_current_output_port ();
1491
1492 SCM_ASSERT (scm_valid_oport_value_p (port), port, SCM_ARG2, s_write);
1493
1494 scm_dynwind_begin (0);
1495 scm_dynwind_lock_port (SCM_COERCE_OUTPORT (port));
1496 scm_prin1 (obj, port, 1);
1497 scm_dynwind_end ();
1498
1499 return SCM_UNSPECIFIED;
1500 }
1501
1502
1503 /* SCM_GPROC(s_display, "display", 1, 1, 0, scm_display, g_display); */
1504
1505 SCM
1506 scm_display (SCM obj, SCM port)
1507 {
1508 if (SCM_UNBNDP (port))
1509 port = scm_current_output_port ();
1510
1511 SCM_ASSERT (scm_valid_oport_value_p (port), port, SCM_ARG2, s_display);
1512
1513 scm_dynwind_begin (0);
1514 scm_dynwind_lock_port (SCM_COERCE_OUTPORT (port));
1515 scm_prin1 (obj, port, 0);
1516 scm_dynwind_end ();
1517
1518 return SCM_UNSPECIFIED;
1519 }
1520
1521
1522 SCM_DEFINE (scm_simple_format, "simple-format", 2, 0, 1,
1523 (SCM destination, SCM message, SCM args),
1524 "Write @var{message} to @var{destination}, defaulting to\n"
1525 "the current output port.\n"
1526 "@var{message} can contain @code{~A} (was @code{%s}) and\n"
1527 "@code{~S} (was @code{%S}) escapes. When printed,\n"
1528 "the escapes are replaced with corresponding members of\n"
1529 "@var{args}:\n"
1530 "@code{~A} formats using @code{display} and @code{~S} formats\n"
1531 "using @code{write}.\n"
1532 "If @var{destination} is @code{#t}, then use the current output\n"
1533 "port, if @var{destination} is @code{#f}, then return a string\n"
1534 "containing the formatted text. Does not add a trailing newline.")
1535 #define FUNC_NAME s_scm_simple_format
1536 {
1537 SCM port, answer = SCM_UNSPECIFIED;
1538 int fReturnString = 0;
1539 int writingp;
1540 size_t start, p, end;
1541
1542 if (scm_is_eq (destination, SCM_BOOL_T))
1543 {
1544 destination = port = scm_current_output_port ();
1545 }
1546 else if (scm_is_false (destination))
1547 {
1548 fReturnString = 1;
1549 port = scm_mkstrport (SCM_INUM0, SCM_BOOL_F,
1550 SCM_OPN | SCM_WRTNG,
1551 FUNC_NAME);
1552 destination = port;
1553 }
1554 else
1555 {
1556 SCM_VALIDATE_OPORT_VALUE (1, destination);
1557 port = SCM_COERCE_OUTPORT (destination);
1558 }
1559 SCM_VALIDATE_STRING (2, message);
1560 SCM_VALIDATE_REST_ARGUMENT (args);
1561
1562 p = 0;
1563 start = 0;
1564 end = scm_i_string_length (message);
1565 for (p = start; p != end; ++p)
1566 if (scm_i_string_ref (message, p) == '~')
1567 {
1568 if (++p == end)
1569 break;
1570
1571 switch (scm_i_string_ref (message, p))
1572 {
1573 case 'A': case 'a':
1574 writingp = 0;
1575 break;
1576 case 'S': case 's':
1577 writingp = 1;
1578 break;
1579 case '~':
1580 scm_lfwrite_substr (message, start, p, port);
1581 start = p + 1;
1582 continue;
1583 case '%':
1584 scm_lfwrite_substr (message, start, p - 1, port);
1585 scm_newline (port);
1586 start = p + 1;
1587 continue;
1588 default:
1589 SCM_MISC_ERROR ("FORMAT: Unsupported format option ~~~A - use (ice-9 format) instead",
1590 scm_list_1 (SCM_MAKE_CHAR (scm_i_string_ref (message, p))));
1591
1592 }
1593
1594
1595 if (!scm_is_pair (args))
1596 SCM_MISC_ERROR ("FORMAT: Missing argument for ~~~A",
1597 scm_list_1 (SCM_MAKE_CHAR (scm_i_string_ref (message, p))));
1598
1599 scm_lfwrite_substr (message, start, p - 1, port);
1600 /* we pass destination here */
1601 scm_prin1 (SCM_CAR (args), destination, writingp);
1602 args = SCM_CDR (args);
1603 start = p + 1;
1604 }
1605
1606 scm_lfwrite_substr (message, start, p, port);
1607 if (!scm_is_eq (args, SCM_EOL))
1608 SCM_MISC_ERROR ("FORMAT: ~A superfluous arguments",
1609 scm_list_1 (scm_length (args)));
1610
1611 if (fReturnString)
1612 answer = scm_strport_to_string (destination);
1613
1614 return scm_return_first (answer, message);
1615 }
1616 #undef FUNC_NAME
1617
1618
1619 SCM_DEFINE (scm_newline, "newline", 0, 1, 0,
1620 (SCM port),
1621 "Send a newline to @var{port}.\n"
1622 "If @var{port} is omitted, send to the current output port.")
1623 #define FUNC_NAME s_scm_newline
1624 {
1625 if (SCM_UNBNDP (port))
1626 port = scm_current_output_port ();
1627
1628 SCM_VALIDATE_OPORT_VALUE (1, port);
1629
1630 scm_putc_unlocked ('\n', SCM_COERCE_OUTPORT (port));
1631 return SCM_UNSPECIFIED;
1632 }
1633 #undef FUNC_NAME
1634
1635 SCM_DEFINE (scm_write_char, "write-char", 1, 1, 0,
1636 (SCM chr, SCM port),
1637 "Send character @var{chr} to @var{port}.")
1638 #define FUNC_NAME s_scm_write_char
1639 {
1640 if (SCM_UNBNDP (port))
1641 port = scm_current_output_port ();
1642
1643 SCM_VALIDATE_CHAR (1, chr);
1644 SCM_VALIDATE_OPORT_VALUE (2, port);
1645
1646 port = SCM_COERCE_OUTPORT (port);
1647 if (!display_character (SCM_CHAR (chr), port,
1648 PORT_CONVERSION_HANDLER (port)))
1649 scm_encoding_error (__func__, errno,
1650 "cannot convert to output locale",
1651 port, chr);
1652
1653 return SCM_UNSPECIFIED;
1654 }
1655 #undef FUNC_NAME
1656
1657 \f
1658
1659 /* Call back to Scheme code to do the printing of special objects
1660 * (like structs). SCM_PRINTER_APPLY applies PROC to EXP and a smob
1661 * containing PORT and PSTATE. This object can be used as the port for
1662 * display/write etc to continue the current print chain. The REVEALED
1663 * field of PSTATE is set to true to indicate that the print state has
1664 * escaped to Scheme and thus has to be freed by the GC.
1665 */
1666
1667 scm_t_bits scm_tc16_port_with_ps;
1668
1669 /* Print exactly as the port itself would */
1670
1671 static int
1672 port_with_ps_print (SCM obj, SCM port, scm_print_state *pstate)
1673 {
1674 obj = SCM_PORT_WITH_PS_PORT (obj);
1675 return SCM_PORT_DESCRIPTOR (obj)->print (obj, port, pstate);
1676 }
1677
1678 SCM
1679 scm_printer_apply (SCM proc, SCM exp, SCM port, scm_print_state *pstate)
1680 {
1681 pstate->revealed = 1;
1682 return scm_call_2 (proc, exp,
1683 scm_i_port_with_print_state (port, pstate->handle));
1684 }
1685
1686 SCM_DEFINE (scm_port_with_print_state, "port-with-print-state", 1, 1, 0,
1687 (SCM port, SCM pstate),
1688 "Create a new port which behaves like @var{port}, but with an\n"
1689 "included print state @var{pstate}. @var{pstate} is optional.\n"
1690 "If @var{pstate} isn't supplied and @var{port} already has\n"
1691 "a print state, the old print state is reused.")
1692 #define FUNC_NAME s_scm_port_with_print_state
1693 {
1694 SCM_VALIDATE_OPORT_VALUE (1, port);
1695 if (!SCM_UNBNDP (pstate))
1696 SCM_VALIDATE_PRINTSTATE (2, pstate);
1697 return scm_i_port_with_print_state (port, pstate);
1698 }
1699 #undef FUNC_NAME
1700
1701 SCM_DEFINE (scm_get_print_state, "get-print-state", 1, 0, 0,
1702 (SCM port),
1703 "Return the print state of the port @var{port}. If @var{port}\n"
1704 "has no associated print state, @code{#f} is returned.")
1705 #define FUNC_NAME s_scm_get_print_state
1706 {
1707 if (SCM_PORT_WITH_PS_P (port))
1708 return SCM_PORT_WITH_PS_PS (port);
1709 if (SCM_OUTPUT_PORT_P (port))
1710 return SCM_BOOL_F;
1711 SCM_WRONG_TYPE_ARG (1, port);
1712 }
1713 #undef FUNC_NAME
1714
1715 \f
1716
1717 void
1718 scm_init_print ()
1719 {
1720 SCM type;
1721
1722 type = scm_make_vtable (scm_from_locale_string (SCM_PRINT_STATE_LAYOUT),
1723 SCM_BOOL_F);
1724 scm_set_struct_vtable_name_x (type, scm_from_latin1_symbol ("print-state"));
1725 scm_print_state_vtable = type;
1726
1727 /* Don't want to bind a wrapper class in GOOPS, so pass 0 as arg1. */
1728 scm_tc16_port_with_ps = scm_make_smob_type (0, 0);
1729 scm_set_smob_print (scm_tc16_port_with_ps, port_with_ps_print);
1730
1731 #include "libguile/print.x"
1732
1733 scm_init_opts (scm_print_options, scm_print_opts);
1734 scm_print_opts[SCM_PRINT_HIGHLIGHT_PREFIX_I].val =
1735 SCM_UNPACK (scm_from_locale_string ("{"));
1736 scm_print_opts[SCM_PRINT_HIGHLIGHT_SUFFIX_I].val =
1737 SCM_UNPACK (scm_from_locale_string ("}"));
1738 scm_print_opts[SCM_PRINT_KEYWORD_STYLE_I].val = SCM_UNPACK (sym_reader);
1739 }
1740
1741 /*
1742 Local Variables:
1743 c-file-style: "gnu"
1744 End:
1745 */