print: Support R7RS |...| symbol notation.
[bpt/guile.git] / libguile / print.c
1 /* Copyright (C) 1995-1999, 2000, 2001, 2002, 2003, 2004, 2006, 2008,
2 * 2009, 2010, 2011, 2012, 2013, 2014 Free Software Foundation, Inc.
3 *
4 * This library is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU Lesser General Public License
6 * as published by the Free Software Foundation; either version 3 of
7 * the License, or (at your option) any later version.
8 *
9 * This library is distributed in the hope that it will be useful, but
10 * WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 * Lesser General Public License for more details.
13 *
14 * You should have received a copy of the GNU Lesser General Public
15 * License along with this library; if not, write to the Free Software
16 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
17 * 02110-1301 USA
18 */
19
20
21 \f
22 #ifdef HAVE_CONFIG_H
23 # include <config.h>
24 #endif
25
26 #include <errno.h>
27 #include <iconv.h>
28 #include <stdio.h>
29 #include <assert.h>
30
31 #include <uniconv.h>
32 #include <unictype.h>
33 #include <c-strcase.h>
34
35 #include "libguile/_scm.h"
36 #include "libguile/chars.h"
37 #include "libguile/continuations.h"
38 #include "libguile/smob.h"
39 #include "libguile/control.h"
40 #include "libguile/eval.h"
41 #include "libguile/macros.h"
42 #include "libguile/procprop.h"
43 #include "libguile/read.h"
44 #include "libguile/weaks.h"
45 #include "libguile/programs.h"
46 #include "libguile/alist.h"
47 #include "libguile/struct.h"
48 #include "libguile/ports.h"
49 #include "libguile/ports-internal.h"
50 #include "libguile/root.h"
51 #include "libguile/strings.h"
52 #include "libguile/strports.h"
53 #include "libguile/vectors.h"
54 #include "libguile/numbers.h"
55 #include "libguile/vm.h"
56
57 #include "libguile/validate.h"
58 #include "libguile/print.h"
59
60 #include "libguile/private-options.h"
61
62 \f
63
64 /* Character printers. */
65
/* Expand to the `ilseq_handler' field of PORT's port-table entry, i.e.
   the failed-conversion strategy the printers below pass around as
   STRATEGY.  Note that the expansion is not parenthesized.  */
66 #define PORT_CONVERSION_HANDLER(port) \
67 SCM_PTAB_ENTRY (port)->ilseq_handler
68
/* Forward declarations: these helpers are defined near the end of the
   file but are used by the symbol and object printers that come
   first.  */
69 static size_t display_string (const void *, int, size_t, SCM,
70 scm_t_string_failed_conversion_handler);
71
72 static int display_character (scm_t_wchar, SCM,
73 scm_t_string_failed_conversion_handler);
74
75 static void write_character (scm_t_wchar, SCM, int);
76
77 static void write_character_escaped (scm_t_wchar, int, SCM);
78
79 \f
80
81 /* {Names of immediate symbols}
82 *
83 * This table must agree with the declarations in scm.h: {Immediate Symbols}.
84 */
85
86 /* This table must agree with the list of flags in tags.h. */
/* Printed representation of each immediate flag.  `iprin1' indexes this
   array with SCM_IFLAGNUM (exp) after bounds-checking against the
   element count, so the order of the entries is significant.  */
87 static const char *iflagnames[] =
88 {
89 "#f",
90 "#nil", /* Elisp nil value. Should print from elisp as symbol `nil'. */
91 "#<XXX UNUSED LISP FALSE -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
92 "()",
93 "#t",
94 "#<XXX UNUSED BOOLEAN 0 -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
95 "#<XXX UNUSED BOOLEAN 1 -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
96 "#<XXX UNUSED BOOLEAN 2 -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
97 "#<unspecified>",
98 "#<undefined>",
99 "#<eof>",
100
101 /* Unbound slot marker for GOOPS. For internal use in GOOPS only. */
102 "#<unbound>",
103 };
104
/* The symbol `reader'; compared against the `quote-keywordish-symbols'
   option value in quote_keywordish_symbols ().  */
105 SCM_SYMBOL (sym_reader, "reader");
106
/* Table of print options handed to scm_options () by
   `print-options-interface'.  Each entry is { type, name, default,
   documentation }; the all-zero entry terminates the table.
   NOTE(review): the SCM_PRINT_* accessor macros presumably index this
   table by position, so new options should be appended -- confirm
   against private-options.h.  */
107 scm_t_option scm_print_opts[] = {
108 { SCM_OPTION_SCM, "highlight-prefix", (scm_t_bits)SCM_BOOL_F_BITS,
109 "The string to print before highlighted values." },
110 { SCM_OPTION_SCM, "highlight-suffix", (scm_t_bits)SCM_BOOL_F_BITS,
111 "The string to print after highlighted values." },
112 { SCM_OPTION_SCM, "quote-keywordish-symbols", (scm_t_bits)SCM_BOOL_F_BITS,
113 "How to print symbols that have a colon as their first or last character. "
114 "The value '#f' does not quote the colons; '#t' quotes them; "
115 "'reader' quotes them when the reader option 'keywords' is not '#f'." },
116 { SCM_OPTION_BOOLEAN, "escape-newlines", 1,
117 "Render newlines as \\n when printing using `write'." },
118 { SCM_OPTION_BOOLEAN, "r7rs-symbols", 0,
119 "Escape symbols using R7RS |...| symbol notation." },
120 { 0 },
121 };
122
123 SCM_DEFINE (scm_print_options, "print-options-interface", 0, 1, 0,
124 (SCM setting),
125 "Option interface for the print options. Instead of using\n"
126 "this procedure directly, use the procedures\n"
127 "@code{print-enable}, @code{print-disable}, @code{print-set!}\n"
128 "and @code{print-options}.")
129 #define FUNC_NAME s_scm_print_options
130 {
131 SCM ans = scm_options (setting,
132 scm_print_opts,
133 FUNC_NAME);
134 return ans;
135 }
136 #undef FUNC_NAME
137
138 \f
139 /* {Printing of Scheme Objects}
140 */
141
142 /* Detection of circular references.
143 *
144 * Due to other constraints in the implementation, this code has bad
145 * time complexity (O (depth * N)). The printer code could be
146 * rewritten to be O(N).
147 */
/* Push OBJ on PSTATE's reference stack: store it at index `top', bump
   `top', and grow the backing vector once `top' reaches `ceiling'.  */
148 #define PUSH_REF(pstate, obj) \
149 do \
150 { \
151 PSTATE_STACK_SET (pstate, pstate->top, obj); \
152 pstate->top++; \
153 if (pstate->top == pstate->ceiling) \
154 grow_ref_stack (pstate); \
155 } while(0)
156
/* Call before printing the contents of compound object OBJ.
   - If OBJ is already on the reference stack, jump to LABEL (which the
     caller must define in the enclosing function).
   - Otherwise, when PSTATE is in fancy mode and the nesting depth
     (top - list_offset) has reached `level', write `#' and RETURN from
     the enclosing function.
   - Otherwise push OBJ.
   `port' is not a macro parameter: it is taken from the scope where
   the macro is expanded.  */
157 #define ENTER_NESTED_DATA(pstate, obj, label) \
158 do \
159 { \
160 register unsigned long i; \
161 for (i = 0; i < pstate->top; ++i) \
162 if (scm_is_eq (PSTATE_STACK_REF (pstate, i), (obj))) \
163 goto label; \
164 if (pstate->fancyp) \
165 { \
166 if (pstate->top - pstate->list_offset >= pstate->level) \
167 { \
168 scm_putc ('#', port); \
169 return; \
170 } \
171 } \
172 PUSH_REF(pstate, obj); \
173 } while(0)
174
/* Undo the push done by ENTER_NESTED_DATA: pop the top entry and
   overwrite the vacated slot with SCM_UNDEFINED.  */
175 #define EXIT_NESTED_DATA(pstate) \
176 do \
177 { \
178 --pstate->top; \
179 PSTATE_STACK_SET (pstate, pstate->top, SCM_UNDEFINED); \
180 } \
181 while (0)
182
/* Vtable passed to scm_make_struct () when creating print states;
   starts out as #f here.  */
183 SCM scm_print_state_vtable = SCM_BOOL_F;
/* List of print states available for reuse.  */
184 static SCM print_state_pool = SCM_EOL;
/* Held around the pool accesses in scm_make_print_state (),
   scm_free_print_state () and scm_prin1 ().  */
185 scm_i_pthread_mutex_t print_state_mutex = SCM_I_PTHREAD_MUTEX_INITIALIZER;
186
#ifdef GUILE_DEBUG /* Used for debugging purposes */

SCM_DEFINE (scm_current_pstate, "current-pstate", 0, 0, 0,
            (),
            "Return the current-pstate -- the car of the\n"
            "@code{print_state_pool}. @code{current-pstate} is only\n"
            "included in @code{--enable-guile-debug} builds.")
#define FUNC_NAME s_scm_current_pstate
{
  /* With an empty pool there is nothing to report.  */
  if (scm_is_null (print_state_pool))
    return SCM_BOOL_F;

  return SCM_CAR (print_state_pool);
}
#undef FUNC_NAME

#endif
204
205 #define PSTATE_SIZE 50L
206
207 static SCM
208 make_print_state (void)
209 {
210 SCM print_state
211 = scm_make_struct (scm_print_state_vtable, SCM_INUM0, SCM_EOL);
212 scm_print_state *pstate = SCM_PRINT_STATE (print_state);
213 pstate->ref_vect = scm_c_make_vector (PSTATE_SIZE, SCM_UNDEFINED);
214 pstate->ceiling = SCM_SIMPLE_VECTOR_LENGTH (pstate->ref_vect);
215 pstate->highlight_objects = SCM_EOL;
216 return print_state;
217 }
218
219 SCM
220 scm_make_print_state ()
221 {
222 SCM answer = SCM_BOOL_F;
223
224 /* First try to allocate a print state from the pool */
225 scm_i_pthread_mutex_lock (&print_state_mutex);
226 if (!scm_is_null (print_state_pool))
227 {
228 answer = SCM_CAR (print_state_pool);
229 print_state_pool = SCM_CDR (print_state_pool);
230 }
231 scm_i_pthread_mutex_unlock (&print_state_mutex);
232
233 return scm_is_false (answer) ? make_print_state () : answer;
234 }
235
236 void
237 scm_free_print_state (SCM print_state)
238 {
239 SCM handle;
240 scm_print_state *pstate = SCM_PRINT_STATE (print_state);
241 /* Cleanup before returning print state to pool.
242 * It is better to do it here. Doing it in scm_prin1
243 * would cost more since that function is called much more
244 * often.
245 */
246 pstate->fancyp = 0;
247 pstate->revealed = 0;
248 pstate->highlight_objects = SCM_EOL;
249 scm_i_pthread_mutex_lock (&print_state_mutex);
250 handle = scm_cons (print_state, print_state_pool);
251 print_state_pool = handle;
252 scm_i_pthread_mutex_unlock (&print_state_mutex);
253 }
254
255 SCM
256 scm_i_port_with_print_state (SCM port, SCM print_state)
257 {
258 if (SCM_UNBNDP (print_state))
259 {
260 if (SCM_PORT_WITH_PS_P (port))
261 return port;
262 else
263 print_state = scm_make_print_state ();
264 /* port does not need to be coerced since it doesn't have ps */
265 }
266 else
267 port = SCM_COERCE_OUTPORT (port);
268 SCM_RETURN_NEWSMOB (scm_tc16_port_with_ps,
269 SCM_UNPACK (scm_cons (port, print_state)));
270 }
271
272 static void
273 grow_ref_stack (scm_print_state *pstate)
274 {
275 SCM old_vect = pstate->ref_vect;
276 size_t old_size = SCM_SIMPLE_VECTOR_LENGTH (old_vect);
277 size_t new_size = 2 * pstate->ceiling;
278 SCM new_vect = scm_c_make_vector (new_size, SCM_UNDEFINED);
279 unsigned long int i;
280
281 for (i = 0; i != old_size; ++i)
282 SCM_SIMPLE_VECTOR_SET (new_vect, i, SCM_SIMPLE_VECTOR_REF (old_vect, i));
283
284 pstate->ref_vect = new_vect;
285 pstate->ceiling = new_size;
286 }
287
/* Read, respectively write, slot I of print state P's reference stack,
   which is stored in the simple vector `ref_vect'.  */
288 #define PSTATE_STACK_REF(p,i) SCM_SIMPLE_VECTOR_REF((p)->ref_vect, (i))
289 #define PSTATE_STACK_SET(p,i,v) SCM_SIMPLE_VECTOR_SET((p)->ref_vect, (i), (v))
290
291 static void
292 print_circref (SCM port, scm_print_state *pstate, SCM ref)
293 {
294 register long i;
295 long self = pstate->top - 1;
296 i = pstate->top - 1;
297 if (scm_is_pair (PSTATE_STACK_REF (pstate, i)))
298 {
299 while (i > 0)
300 {
301 if (!scm_is_pair (PSTATE_STACK_REF (pstate, i-1))
302 || !scm_is_eq (SCM_CDR (PSTATE_STACK_REF (pstate, i-1)),
303 SCM_CDR (PSTATE_STACK_REF (pstate, i))))
304 break;
305 --i;
306 }
307 self = i;
308 }
309 for (i = pstate->top - 1; 1; --i)
310 if (scm_is_eq (PSTATE_STACK_REF(pstate, i), ref))
311 break;
312 scm_putc ('#', port);
313 scm_intprint (i - self, 10, port);
314 scm_putc ('#', port);
315 }
316
317 /* Print the name of a symbol. */
318
319 static int
320 quote_keywordish_symbols (void)
321 {
322 SCM option = SCM_PRINT_KEYWORD_STYLE;
323
324 if (scm_is_false (option))
325 return 0;
326 if (scm_is_eq (option, sym_reader))
327 return scm_is_true (SCM_PACK (SCM_KEYWORD_STYLE));
328 return 1;
329 }
330
/* Unicode general categories accepted for the first character of a
   symbol printed without quoting (see
   symbol_has_extended_read_syntax ()).  */
331 #define INITIAL_IDENTIFIER_MASK \
332 (UC_CATEGORY_MASK_Lu | UC_CATEGORY_MASK_Ll | UC_CATEGORY_MASK_Lt \
333 | UC_CATEGORY_MASK_Lm | UC_CATEGORY_MASK_Lo | UC_CATEGORY_MASK_Mn \
334 | UC_CATEGORY_MASK_Nl | UC_CATEGORY_MASK_No | UC_CATEGORY_MASK_Pd \
335 | UC_CATEGORY_MASK_Pc | UC_CATEGORY_MASK_Po | UC_CATEGORY_MASK_Sc \
336 | UC_CATEGORY_MASK_Sm | UC_CATEGORY_MASK_Sk | UC_CATEGORY_MASK_So \
337 | UC_CATEGORY_MASK_Co)
338
/* Categories accepted for the remaining characters: everything allowed
   initially, plus decimal digits (Nd) and spacing/enclosing marks
   (Mc, Me).  */
339 #define SUBSEQUENT_IDENTIFIER_MASK \
340 (INITIAL_IDENTIFIER_MASK \
341 | UC_CATEGORY_MASK_Nd | UC_CATEGORY_MASK_Mc | UC_CATEGORY_MASK_Me)
342
343 static int
344 symbol_has_extended_read_syntax (SCM sym)
345 {
346 size_t pos, len = scm_i_symbol_length (sym);
347 scm_t_wchar c;
348
349 /* The empty symbol. */
350 if (len == 0)
351 return 1;
352
353 c = scm_i_symbol_ref (sym, 0);
354
355 /* Single dot; conflicts with dotted-pair notation. */
356 if (len == 1 && c == '.')
357 return 1;
358
359 /* Other initial-character constraints. */
360 if (c == '\'' || c == '`' || c == ',' || c == '"' || c == ';' || c == '#')
361 return 1;
362
363 /* R7RS allows neither '|' nor '\' in bare symbols. */
364 if ((c == '|' || c == '\\') && SCM_PRINT_R7RS_SYMBOLS_P)
365 return 1;
366
367 /* Keywords can be identified by trailing colons too. */
368 if (c == ':' || scm_i_symbol_ref (sym, len - 1) == ':')
369 return quote_keywordish_symbols ();
370
371 /* Number-ish symbols. */
372 if (scm_is_true (scm_i_string_to_number (scm_symbol_to_string (sym), 10)))
373 return 1;
374
375 /* Other disallowed first characters. */
376 if (!uc_is_general_category_withtable (c, INITIAL_IDENTIFIER_MASK))
377 return 1;
378
379 /* Otherwise, any character that's in the identifier category mask is
380 fine to pass through as-is, provided it's not one of the ASCII
381 delimiters like `;'. */
382 for (pos = 1; pos < len; pos++)
383 {
384 c = scm_i_symbol_ref (sym, pos);
385 if (!uc_is_general_category_withtable (c, SUBSEQUENT_IDENTIFIER_MASK))
386 return 1;
387 else if (c == '"' || c == ';' || c == '#')
388 return 1;
389 else if ((c == '|' || c == '\\') && SCM_PRINT_R7RS_SYMBOLS_P)
390 /* R7RS allows neither '|' nor '\' in bare symbols. */
391 return 1;
392 }
393
394 return 0;
395 }
396
397 static void
398 print_normal_symbol (SCM sym, SCM port)
399 {
400 scm_display (scm_symbol_to_string (sym), port);
401 }
402
403 static void
404 print_extended_symbol (SCM sym, SCM port)
405 {
406 size_t pos, len;
407 scm_t_string_failed_conversion_handler strategy;
408
409 len = scm_i_symbol_length (sym);
410 strategy = PORT_CONVERSION_HANDLER (port);
411
412 scm_lfwrite ("#{", 2, port);
413
414 for (pos = 0; pos < len; pos++)
415 {
416 scm_t_wchar c = scm_i_symbol_ref (sym, pos);
417
418 if (uc_is_general_category_withtable (c,
419 SUBSEQUENT_IDENTIFIER_MASK
420 | UC_CATEGORY_MASK_Zs))
421 {
422 if (!display_character (c, port, strategy)
423 || (c == '\\' && !display_character (c, port, strategy)))
424 scm_encoding_error ("print_extended_symbol", errno,
425 "cannot convert to output locale",
426 port, SCM_MAKE_CHAR (c));
427 }
428 else
429 {
430 scm_lfwrite ("\\x", 2, port);
431 scm_intprint (c, 16, port);
432 scm_putc (';', port);
433 }
434 }
435
436 scm_lfwrite ("}#", 2, port);
437 }
438
439 static void
440 print_r7rs_extended_symbol (SCM sym, SCM port)
441 {
442 size_t pos, len;
443 scm_t_string_failed_conversion_handler strategy;
444
445 len = scm_i_symbol_length (sym);
446 strategy = PORT_CONVERSION_HANDLER (port);
447
448 scm_putc ('|', port);
449
450 for (pos = 0; pos < len; pos++)
451 {
452 scm_t_wchar c = scm_i_symbol_ref (sym, pos);
453
454 switch (c)
455 {
456 case '\a': scm_lfwrite ("\\a", 2, port); break;
457 case '\b': scm_lfwrite ("\\b", 2, port); break;
458 case '\t': scm_lfwrite ("\\t", 2, port); break;
459 case '\n': scm_lfwrite ("\\n", 2, port); break;
460 case '\r': scm_lfwrite ("\\r", 2, port); break;
461 case '|': scm_lfwrite ("\\|", 2, port); break;
462 case '\\': scm_lfwrite ("\\x5c;", 5, port); break;
463 default:
464 if (uc_is_general_category_withtable (c,
465 SUBSEQUENT_IDENTIFIER_MASK
466 | UC_CATEGORY_MASK_Zs))
467 {
468 if (!display_character (c, port, strategy))
469 scm_encoding_error ("print_r7rs_extended_symbol", errno,
470 "cannot convert to output locale",
471 port, SCM_MAKE_CHAR (c));
472 }
473 else
474 {
475 scm_lfwrite ("\\x", 2, port);
476 scm_intprint (c, 16, port);
477 scm_putc (';', port);
478 }
479 break;
480 }
481 }
482
483 scm_putc ('|', port);
484 }
485
486 /* FIXME: allow R6RS hex escapes instead of #{...}# or |...|. */
487 void
488 scm_i_print_symbol_name (SCM sym, SCM port)
489 {
490 if (!symbol_has_extended_read_syntax (sym))
491 print_normal_symbol (sym, port);
492 else if (SCM_PRINT_R7RS_SYMBOLS_P)
493 print_r7rs_extended_symbol (sym, port);
494 else
495 print_extended_symbol (sym, port);
496 }
497
498 void
499 scm_print_symbol_name (const char *str, size_t len, SCM port)
500 {
501 SCM symbol = scm_from_locale_symboln (str, len);
502 scm_i_print_symbol_name (symbol, port);
503 }
504
505 /* Print generally. Handles both write and display according to PSTATE.
506 */
/* The `write' and `display' primitives, with their generic-function
   hooks g_write and g_display; iprin1 () dispatches GOOPS instances
   through those hooks.  */
507 SCM_GPROC(s_write, "write", 1, 1, 0, scm_write, g_write);
508 SCM_GPROC(s_display, "display", 1, 1, 0, scm_display, g_display);
509
/* The type-dispatching printer proper; scm_iprin1 () wraps it to add
   highlighting.  */
510 static void iprin1 (SCM exp, SCM port, scm_print_state *pstate);
511
512
513 /* Print a character as an octal or hex escape. */
/* I is written in octal unless SCM_R6RS_ESCAPES_P is set, in which case
   it is written as `x' followed by hexadecimal digits.  Any leading
   prefix such as `#\' is left to the caller.  */
514 #define PRINT_CHAR_ESCAPE(i, port) \
515 do \
516 { \
517 if (!SCM_R6RS_ESCAPES_P) \
518 scm_intprint (i, 8, port); \
519 else \
520 { \
521 scm_puts ("x", port); \
522 scm_intprint (i, 16, port); \
523 } \
524 } \
525 while (0)
526
527
528 void
529 scm_iprin1 (SCM exp, SCM port, scm_print_state *pstate)
530 {
531 if (pstate->fancyp
532 && scm_is_true (scm_memq (exp, pstate->highlight_objects)))
533 {
534 scm_display (SCM_PRINT_HIGHLIGHT_PREFIX, port);
535 iprin1 (exp, port, pstate);
536 scm_display (SCM_PRINT_HIGHLIGHT_SUFFIX, port);
537 }
538 else
539 iprin1 (exp, port, pstate);
540 }
541
/* Print EXP to PORT, dispatching first on its 3-bit tag and then, for
   heap objects, on its 7-bit type code.  PSTATE selects `write' versus
   `display' behaviour and carries the reference stack used to detect
   circular structure.

   Control-flow notes:
   - ENTER_NESTED_DATA may jump to the `circref' label below, or may
     return from this function outright after writing `#' when the
     depth limit of a fancy print state is reached.
   - The `circref', `print_struct', `common_vector_printer' and `punk'
     labels are shared between several cases of the inner switch.  */
542 static void
543 iprin1 (SCM exp, SCM port, scm_print_state *pstate)
544 {
545 switch (SCM_ITAG3 (exp))
546 {
547 case scm_tc3_tc7_1:
548 case scm_tc3_tc7_2:
549 /* These tc3 tags should never occur in an immediate value. They are
550 * only used in cell types of non-immediates, i. e. the value returned
551 * by SCM_CELL_TYPE (exp) can use these tags.
552 */
553 scm_ipruk ("immediate", exp, port);
554 break;
555 case scm_tc3_int_1:
556 case scm_tc3_int_2:
/* Fixnums are printed in decimal.  */
557 scm_intprint (SCM_I_INUM (exp), 10, port);
558 break;
559 case scm_tc3_imm24:
560 if (SCM_CHARP (exp))
561 {
/* `write' uses the character escape syntax; `display' emits the
   character itself and signals an error if it cannot be encoded.  */
562 if (SCM_WRITINGP (pstate))
563 write_character (SCM_CHAR (exp), port, 0);
564 else
565 {
566 if (!display_character (SCM_CHAR (exp), port,
567 PORT_CONVERSION_HANDLER (port)))
568 scm_encoding_error (__func__, errno,
569 "cannot convert to output locale",
570 port, exp);
571 }
572 }
/* Immediate flags are looked up by number in `iflagnames', after
   checking that the number is within the table.  */
573 else if (SCM_IFLAGP (exp)
574 && ((size_t) SCM_IFLAGNUM (exp) < (sizeof iflagnames / sizeof (char *))))
575 {
576 scm_puts (iflagnames [SCM_IFLAGNUM (exp)], port);
577 }
578 else
579 {
580 /* unknown immediate value */
581 scm_ipruk ("immediate", exp, port);
582 }
583 break;
584 case scm_tc3_cons:
585 switch (SCM_TYP7 (exp))
586 {
587 case scm_tcs_struct:
588 {
589 ENTER_NESTED_DATA (pstate, exp, circref);
/* GOOPS instances go through the `write' or `display' generic when it
   is set (non-zero); the print state is passed along wrapped with the
   port and marked as revealed.  All other structs, and GOOPS
   instances when the generic is unset, use scm_print_struct ().  */
590 if (SCM_OBJ_CLASS_FLAGS (exp) & SCM_CLASSF_GOOPS)
591 {
592 SCM pwps, print = pstate->writingp ? g_write : g_display;
593 if (SCM_UNPACK (print) == 0)
594 goto print_struct;
595 pwps = scm_i_port_with_print_state (port, pstate->handle);
596 pstate->revealed = 1;
597 scm_call_generic_2 (print, exp, pwps);
598 }
599 else
600 {
601 print_struct:
602 scm_print_struct (exp, port, pstate);
603 }
604 EXIT_NESTED_DATA (pstate);
605 }
606 break;
607 case scm_tcs_cons_imcar:
608 case scm_tcs_cons_nimcar:
609 ENTER_NESTED_DATA (pstate, exp, circref);
610 scm_iprlist ("(", exp, ')', port, pstate);
611 EXIT_NESTED_DATA (pstate);
612 break;
/* Target of ENTER_NESTED_DATA when EXP is already being printed further
   up the reference stack.  */
613 circref:
614 print_circref (port, pstate, exp);
615 break;
616 case scm_tc7_number:
/* Note: no default case; a number with any other 16-bit type code
   prints nothing.  */
617 switch SCM_TYP16 (exp) {
618 case scm_tc16_big:
619 scm_bigprint (exp, port, pstate);
620 break;
621 case scm_tc16_real:
622 scm_print_real (exp, port, pstate);
623 break;
624 case scm_tc16_complex:
625 scm_print_complex (exp, port, pstate);
626 break;
627 case scm_tc16_fraction:
628 scm_i_print_fraction (exp, port, pstate);
629 break;
630 }
631 break;
632 case scm_tc7_string:
633 if (SCM_WRITINGP (pstate))
634 {
/* `write': double quotes around the string, each character going
   through write_character () with string escapes enabled.  */
635 size_t len, i;
636
637 display_character ('"', port, iconveh_question_mark);
638 len = scm_i_string_length (exp);
639 for (i = 0; i < len; ++i)
640 write_character (scm_i_string_ref (exp, i), port, 1);
641
642 display_character ('"', port, iconveh_question_mark);
643 scm_remember_upto_here_1 (exp);
644 }
645 else
646 {
/* `display': emit the raw characters; if fewer than LEN could be
   converted, report the first character that was not printed.  */
647 size_t len, printed;
648
649 len = scm_i_string_length (exp);
650 printed = display_string (scm_i_string_data (exp),
651 scm_i_is_narrow_string (exp),
652 len, port,
653 PORT_CONVERSION_HANDLER (port));
654 if (SCM_UNLIKELY (printed < len))
655 scm_encoding_error (__func__, errno,
656 "cannot convert to output locale",
657 port, scm_c_string_ref (exp, printed));
658 }
659
660 scm_remember_upto_here_1 (exp);
661 break;
662 case scm_tc7_symbol:
663 if (scm_i_symbol_is_interned (exp))
664 {
665 scm_i_print_symbol_name (exp, port);
666 scm_remember_upto_here_1 (exp);
667 }
668 else
669 {
/* Uninterned symbols print as `#<uninterned-symbol NAME BITS>', where
   BITS is the object's raw value in hexadecimal.  */
670 scm_puts ("#<uninterned-symbol ", port);
671 scm_i_print_symbol_name (exp, port);
672 scm_putc (' ', port);
673 scm_uintprint (SCM_UNPACK (exp), 16, port);
674 scm_putc ('>', port);
675 }
676 break;
/* The following types each delegate to their own printer.  */
677 case scm_tc7_variable:
678 scm_i_variable_print (exp, port, pstate);
679 break;
680 case scm_tc7_program:
681 scm_i_program_print (exp, port, pstate);
682 break;
683 case scm_tc7_pointer:
684 scm_i_pointer_print (exp, port, pstate);
685 break;
686 case scm_tc7_hashtable:
687 scm_i_hashtable_print (exp, port, pstate);
688 break;
689 case scm_tc7_fluid:
690 scm_i_fluid_print (exp, port, pstate);
691 break;
692 case scm_tc7_dynamic_state:
693 scm_i_dynamic_state_print (exp, port, pstate);
694 break;
695 case scm_tc7_frame:
696 scm_i_frame_print (exp, port, pstate);
697 break;
698 case scm_tc7_objcode:
699 scm_i_objcode_print (exp, port, pstate);
700 break;
701 case scm_tc7_vm:
702 scm_i_vm_print (exp, port, pstate);
703 break;
704 case scm_tc7_vm_cont:
705 scm_i_vm_cont_print (exp, port, pstate);
706 break;
707 case scm_tc7_prompt:
708 scm_i_prompt_print (exp, port, pstate);
709 break;
710 case scm_tc7_with_fluids:
711 scm_i_with_fluids_print (exp, port, pstate);
712 break;
713 case scm_tc7_array:
714 ENTER_NESTED_DATA (pstate, exp, circref);
715 scm_i_print_array (exp, port, pstate);
716 EXIT_NESTED_DATA (pstate);
717 break;
718 case scm_tc7_bytevector:
719 scm_i_print_bytevector (exp, port, pstate);
720 break;
721 case scm_tc7_bitvector:
722 scm_i_print_bitvector (exp, port, pstate);
723 break;
724 case scm_tc7_wvect:
/* Weak vectors differ from ordinary vectors only in their opening
   token; the elements are printed by the shared code below.  */
725 ENTER_NESTED_DATA (pstate, exp, circref);
726 if (SCM_IS_WHVEC (exp))
727 scm_puts ("#wh(", port);
728 else
729 scm_puts ("#w(", port);
730 goto common_vector_printer;
731 case scm_tc7_vector:
732 ENTER_NESTED_DATA (pstate, exp, circref);
733 scm_puts ("#(", port);
734 common_vector_printer:
735 {
/* LAST is the index of the final element to print.  In fancy mode a
   vector longer than pstate->length is cut short and followed by
   " ...".  */
736 register long i;
737 long last = SCM_SIMPLE_VECTOR_LENGTH (exp) - 1;
738 int cutp = 0;
739 if (pstate->fancyp
740 && SCM_SIMPLE_VECTOR_LENGTH (exp) > pstate->length)
741 {
742 last = pstate->length - 1;
743 cutp = 1;
744 }
745 if (SCM_I_WVECTP (exp))
746 {
747 /* Elements of weak vectors may not be accessed via the
748 `SIMPLE_VECTOR_REF ()' macro. */
749 for (i = 0; i < last; ++i)
750 {
751 scm_iprin1 (scm_c_vector_ref (exp, i),
752 port, pstate);
753 scm_putc (' ', port);
754 }
755 }
756 else
757 {
758 for (i = 0; i < last; ++i)
759 {
760 scm_iprin1 (SCM_SIMPLE_VECTOR_REF (exp, i), port, pstate);
761 scm_putc (' ', port);
762 }
763 }
764
/* The loops above print every element but the last, each followed by a
   space; the last one is printed here without a trailing space.  When
   LAST is negative (nothing to print), I is still 0 and this is
   skipped.  */
765 if (i == last)
766 {
767 /* CHECK_INTS; */
768 scm_iprin1 (scm_c_vector_ref (exp, i), port, pstate);
769 }
770 if (cutp)
771 scm_puts (" ...", port);
772 scm_putc (')', port);
773 }
774 EXIT_NESTED_DATA (pstate);
775 break;
776 case scm_tc7_port:
777 {
/* Use the port type's own printer when the type number is valid, a
   printer is installed, and the printer returns non-zero; otherwise
   fall back to the generic "unknown" output.  */
778 register long i = SCM_PTOBNUM (exp);
779 if (i < scm_numptob
780 && scm_ptobs[i].print
781 && (scm_ptobs[i].print) (exp, port, pstate))
782 break;
783 goto punk;
784 }
785 case scm_tc7_smob:
786 ENTER_NESTED_DATA (pstate, exp, circref);
787 SCM_SMOB_DESCRIPTOR (exp).print (exp, port, pstate);
788 EXIT_NESTED_DATA (pstate);
789 break;
790 default:
791 /* case scm_tcs_closures: */
792 punk:
793 scm_ipruk ("type", exp, port);
794 }
795 }
796 }
797
798 /* Print states are necessary for circular reference safe printing.
799 * They are also expensive to allocate. Therefore print states are
800 * kept in a pool so that they can be reused.
801 */
802
803 /* The PORT argument can also be a print-state/port pair, which will
804 * then be used instead of allocating a new print state. This is
805 * useful for continuing a chain of print calls from Scheme. */
806
807 void
808 scm_prin1 (SCM exp, SCM port, int writingp)
809 {
810 SCM handle = SCM_BOOL_F; /* Will GC protect the handle whilst unlinked */
811 SCM pstate_scm;
812 scm_print_state *pstate;
813 int old_writingp;
814
815 /* If PORT is a print-state/port pair, use that. Else create a new
816 print-state. */
817
818 if (SCM_PORT_WITH_PS_P (port))
819 {
820 pstate_scm = SCM_PORT_WITH_PS_PS (port);
821 port = SCM_PORT_WITH_PS_PORT (port);
822 }
823 else
824 {
825 /* First try to allocate a print state from the pool */
826 scm_i_pthread_mutex_lock (&print_state_mutex);
827 if (!scm_is_null (print_state_pool))
828 {
829 handle = print_state_pool;
830 print_state_pool = SCM_CDR (print_state_pool);
831 }
832 scm_i_pthread_mutex_unlock (&print_state_mutex);
833 if (scm_is_false (handle))
834 handle = scm_list_1 (make_print_state ());
835 pstate_scm = SCM_CAR (handle);
836 }
837
838 pstate = SCM_PRINT_STATE (pstate_scm);
839 old_writingp = pstate->writingp;
840 pstate->writingp = writingp;
841 scm_iprin1 (exp, port, pstate);
842 pstate->writingp = old_writingp;
843
844 /* Return print state to pool if it has been created above and
845 hasn't escaped to Scheme. */
846
847 if (scm_is_true (handle) && !pstate->revealed)
848 {
849 scm_i_pthread_mutex_lock (&print_state_mutex);
850 SCM_SETCDR (handle, print_state_pool);
851 print_state_pool = handle;
852 scm_i_pthread_mutex_unlock (&print_state_mutex);
853 }
854 }
855
856 /* Convert codepoint CH to UTF-8 and store the result in UTF8. Return
857 the number of bytes of the UTF-8-encoded string. */
858 static size_t
859 codepoint_to_utf8 (scm_t_wchar ch, scm_t_uint8 utf8[4])
860 {
861 size_t len;
862 scm_t_uint32 codepoint;
863
864 codepoint = (scm_t_uint32) ch;
865
866 if (codepoint <= 0x7f)
867 {
868 len = 1;
869 utf8[0] = (scm_t_uint8) codepoint;
870 }
871 else if (codepoint <= 0x7ffUL)
872 {
873 len = 2;
874 utf8[0] = 0xc0 | (codepoint >> 6);
875 utf8[1] = 0x80 | (codepoint & 0x3f);
876 }
877 else if (codepoint <= 0xffffUL)
878 {
879 len = 3;
880 utf8[0] = 0xe0 | (codepoint >> 12);
881 utf8[1] = 0x80 | ((codepoint >> 6) & 0x3f);
882 utf8[2] = 0x80 | (codepoint & 0x3f);
883 }
884 else
885 {
886 len = 4;
887 utf8[0] = 0xf0 | (codepoint >> 18);
888 utf8[1] = 0x80 | ((codepoint >> 12) & 0x3f);
889 utf8[2] = 0x80 | ((codepoint >> 6) & 0x3f);
890 utf8[3] = 0x80 | (codepoint & 0x3f);
891 }
892
893 return len;
894 }
895
/* Fetch codepoint X of string data S: S is read as an array of
   `unsigned char' when `narrow_p' is true and as an array of
   `scm_t_wchar' otherwise.  `narrow_p' is not a macro parameter; it
   must be in scope at the point of use.  The macro is #undef'd after
   display_string_using_iconv ().  */
896 #define STR_REF(s, x) \
897 (narrow_p \
898 ? (scm_t_wchar) ((unsigned char *) (s))[x] \
899 : ((scm_t_wchar *) (s))[x])
900
901 /* Write STR to PORT as UTF-8. STR is a LEN-codepoint string; it is
902 narrow if NARROW_P is true, wide otherwise. Return LEN. */
903 static size_t
904 display_string_as_utf8 (const void *str, int narrow_p, size_t len,
905 SCM port)
906 {
907 size_t printed = 0;
908
909 while (len > printed)
910 {
911 size_t utf8_len, i;
912 char *input, utf8_buf[256];
913
914 /* Convert STR to UTF-8. */
915 for (i = printed, utf8_len = 0, input = utf8_buf;
916 i < len && utf8_len + 4 < sizeof (utf8_buf);
917 i++)
918 {
919 utf8_len += codepoint_to_utf8 (STR_REF (str, i),
920 (scm_t_uint8 *) input);
921 input = utf8_buf + utf8_len;
922 }
923
924 /* INPUT was successfully converted, entirely; print the
925 result. */
926 scm_lfwrite (utf8_buf, utf8_len, port);
927 printed += i - printed;
928 }
929
930 assert (printed == len);
931
932 return len;
933 }
934
935 /* Convert STR through PORT's output conversion descriptor and write the
936 output to PORT. Return the number of codepoints written. */
/* STR holds LEN codepoints, narrow or wide according to NARROW_P (see
   STR_REF).  STRATEGY decides what happens to a codepoint that the
   target encoding cannot represent (EILSEQ): with
   SCM_FAILED_CONVERSION_ESCAPE_SEQUENCE it is written as an escape,
   with the question-mark strategy it is replaced by `?', and with
   SCM_FAILED_CONVERSION_ERROR the function stops and returns the count
   written so far, which is then smaller than LEN.  Any other iconv
   failure also stops the loop early.  */
937 static size_t
938 display_string_using_iconv (const void *str, int narrow_p, size_t len,
939 SCM port,
940 scm_t_string_failed_conversion_handler strategy)
941 {
942 size_t printed;
943 scm_t_iconv_descriptors *id;
944 scm_t_port_internal *pti = SCM_PORT_GET_INTERNAL (port);
945
946 id = scm_i_port_iconv_descriptors (port, SCM_PORT_WRITE);
947
/* First non-empty write on this port: clear the "at stream start"
   flags and emit a byte-order mark for UTF-16 and UTF-32.  The flag is
   cleared before the BOM is displayed, so the nested call does not
   come back here.  */
948 if (SCM_UNLIKELY (pti->at_stream_start_for_bom_write && len > 0))
949 {
950 scm_t_port *pt = SCM_PTAB_ENTRY (port);
951
952 /* Record that we're no longer at stream start. */
953 pti->at_stream_start_for_bom_write = 0;
954 if (pt->rw_random)
955 pti->at_stream_start_for_bom_read = 0;
956
957 /* Write a BOM if appropriate. */
958 if (SCM_UNLIKELY (c_strcasecmp(pt->encoding, "UTF-16") == 0
959 || c_strcasecmp(pt->encoding, "UTF-32") == 0))
960 display_character (SCM_UNICODE_BOM, port, iconveh_error);
961 }
962
963 printed = 0;
964
/* Each iteration converts one chunk: codepoints -> UTF-8 in UTF8_BUF ->
   port encoding in ENCODED_OUTPUT.  */
965 while (len > printed)
966 {
967 size_t done, utf8_len, input_left, output_left, i;
968 size_t codepoints_read, output_len;
969 char *input, *output;
970 char utf8_buf[256], encoded_output[256];
/* offsets[B] is the index in STR of the codepoint whose UTF-8 encoding
   starts at byte B of UTF8_BUF; only those start positions are
   filled in.  */
971 size_t offsets[256];
972
973 /* Convert STR to UTF-8. */
974 for (i = printed, utf8_len = 0, input = utf8_buf;
975 i < len && utf8_len + 4 < sizeof (utf8_buf);
976 i++)
977 {
978 offsets[utf8_len] = i;
979 utf8_len += codepoint_to_utf8 (STR_REF (str, i),
980 (scm_t_uint8 *) input);
981 input = utf8_buf + utf8_len;
982 }
983
984 input = utf8_buf;
985 input_left = utf8_len;
986
987 output = encoded_output;
988 output_left = sizeof (encoded_output);
989
/* iconv advances INPUT/OUTPUT and decrements the *_LEFT counters as it
   converts.  */
990 done = iconv (id->output_cd, &input, &input_left,
991 &output, &output_left);
992
993 output_len = sizeof (encoded_output) - output_left;
994
995 if (SCM_UNLIKELY (done == (size_t) -1))
996 {
/* Save errno right away: the calls below may overwrite it.  */
997 int errno_save = errno;
998
999 /* Reset the `iconv' state. */
1000 iconv (id->output_cd, NULL, NULL, NULL, NULL);
1001
1002 /* Print the OUTPUT_LEN bytes successfully converted. */
1003 scm_lfwrite (encoded_output, output_len, port);
1004
1005 /* See how many input codepoints these OUTPUT_LEN bytes
1006 correspond to. */
/* INPUT now points at the first unconverted byte, i.e. at the start of
   the codepoint on which iconv stopped.  */
1007 codepoints_read = offsets[input - utf8_buf] - printed;
1008 printed += codepoints_read;
1009
1010 if (errno_save == EILSEQ &&
1011 strategy != SCM_FAILED_CONVERSION_ERROR)
1012 {
1013 /* Conversion failed somewhere in INPUT and we want to
1014 escape or substitute the offending input character. */
1015
1016 if (strategy == SCM_FAILED_CONVERSION_ESCAPE_SEQUENCE)
1017 {
1018 scm_t_wchar ch;
1019
1020 /* Find CH, the offending codepoint, and escape it. */
1021 ch = STR_REF (str, offsets[input - utf8_buf]);
1022 write_character_escaped (ch, 1, port);
1023 }
1024 else
1025 /* STRATEGY is `SCM_FAILED_CONVERSION_QUESTION_MARK'. */
1026 display_string ("?", 1, 1, port, strategy);
1027
/* Count the escaped or substituted codepoint as handled and go round
   the loop again for the rest of the string.  */
1028 printed++;
1029 }
1030 else
1031 /* Something bad happened that we can't handle: bail out. */
/* NOTE(review): ENCODED_OUTPUT is no larger than UTF8_BUF, so an
   encoding that expands the data could presumably make iconv fail
   with E2BIG, which ends up here and stops printing part-way --
   confirm whether that case should loop instead.  */
1032 break;
1033 }
1034 else
1035 {
1036 /* INPUT was successfully converted, entirely; print the
1037 result. */
1038 scm_lfwrite (encoded_output, output_len, port);
1039 codepoints_read = i - printed;
1040 printed += codepoints_read;
1041 }
1042 }
1043
1044 return printed;
1045 }
1046
1047 #undef STR_REF
1048
1049 /* Display the LEN codepoints in STR to PORT according to STRATEGY;
1050 return the number of codepoints successfully displayed. If NARROW_P,
1051 then STR is interpreted as a sequence of `char', denoting a Latin-1
1052 string; otherwise it's interpreted as a sequence of
1053 `scm_t_wchar'. */
1054 static size_t
1055 display_string (const void *str, int narrow_p,
1056 size_t len, SCM port,
1057 scm_t_string_failed_conversion_handler strategy)
1058
1059 {
1060 scm_t_port_internal *pti;
1061
1062 pti = SCM_PORT_GET_INTERNAL (port);
1063
1064 if (pti->encoding_mode == SCM_PORT_ENCODING_MODE_UTF8)
1065 return display_string_as_utf8 (str, narrow_p, len, port);
1066 else
1067 return display_string_using_iconv (str, narrow_p, len,
1068 port, strategy);
1069 }
1070
1071 /* Attempt to display CH to PORT according to STRATEGY. Return non-zero
1072 if CH was successfully displayed, zero otherwise (e.g., if it was not
1073 representable in PORT's encoding.) */
1074 static int
1075 display_character (scm_t_wchar ch, SCM port,
1076 scm_t_string_failed_conversion_handler strategy)
1077 {
1078 return display_string (&ch, 0, 1, port, strategy) == 1;
1079 }
1080
1081 /* Attempt to pretty-print CH, a combining character, to PORT. Return
1082 zero upon failure, non-zero otherwise. The idea is to print CH above
1083 a dotted circle to make it more visible. */
1084 static int
1085 write_combining_character (scm_t_wchar ch, SCM port)
1086 {
1087 scm_t_wchar str[2];
1088
1089 str[0] = SCM_CODEPOINT_DOTTED_CIRCLE;
1090 str[1] = ch;
1091
1092 return display_string (str, 0, 2, port, iconveh_error) == 2;
1093 }
1094
1095 /* Write CH to PORT in its escaped form, using the string escape syntax
1096 if STRING_ESCAPES_P is non-zero. */
1097 static void
1098 write_character_escaped (scm_t_wchar ch, int string_escapes_p, SCM port)
1099 {
1100 if (string_escapes_p)
1101 {
1102 /* Represent CH using the in-string escape syntax. */
1103
1104 static const char hex[] = "0123456789abcdef";
1105 static const char escapes[7] = "abtnvfr";
1106 char buf[9];
1107
1108 if (ch >= 0x07 && ch <= 0x0D && ch != 0x0A)
1109 {
1110 /* Use special escapes for some C0 controls. */
1111 buf[0] = '\\';
1112 buf[1] = escapes[ch - 0x07];
1113 scm_lfwrite (buf, 2, port);
1114 }
1115 else if (!SCM_R6RS_ESCAPES_P)
1116 {
1117 if (ch <= 0xFF)
1118 {
1119 buf[0] = '\\';
1120 buf[1] = 'x';
1121 buf[2] = hex[ch / 16];
1122 buf[3] = hex[ch % 16];
1123 scm_lfwrite (buf, 4, port);
1124 }
1125 else if (ch <= 0xFFFF)
1126 {
1127 buf[0] = '\\';
1128 buf[1] = 'u';
1129 buf[2] = hex[(ch & 0xF000) >> 12];
1130 buf[3] = hex[(ch & 0xF00) >> 8];
1131 buf[4] = hex[(ch & 0xF0) >> 4];
1132 buf[5] = hex[(ch & 0xF)];
1133 scm_lfwrite (buf, 6, port);
1134 }
1135 else if (ch > 0xFFFF)
1136 {
1137 buf[0] = '\\';
1138 buf[1] = 'U';
1139 buf[2] = hex[(ch & 0xF00000) >> 20];
1140 buf[3] = hex[(ch & 0xF0000) >> 16];
1141 buf[4] = hex[(ch & 0xF000) >> 12];
1142 buf[5] = hex[(ch & 0xF00) >> 8];
1143 buf[6] = hex[(ch & 0xF0) >> 4];
1144 buf[7] = hex[(ch & 0xF)];
1145 scm_lfwrite (buf, 8, port);
1146 }
1147 }
1148 else
1149 {
1150 /* Print an R6RS variable-length hex escape: "\xNNNN;". */
1151 scm_t_wchar ch2 = ch;
1152
1153 int i = 8;
1154 buf[i] = ';';
1155 i --;
1156 if (ch == 0)
1157 buf[i--] = '0';
1158 else
1159 while (ch2 > 0)
1160 {
1161 buf[i] = hex[ch2 & 0xF];
1162 ch2 >>= 4;
1163 i --;
1164 }
1165 buf[i] = 'x';
1166 i --;
1167 buf[i] = '\\';
1168 scm_lfwrite (buf + i, 9 - i, port);
1169 }
1170 }
1171 else
1172 {
1173 /* Represent CH using the character escape syntax. */
1174 const char *name;
1175
1176 name = scm_i_charname (SCM_MAKE_CHAR (ch));
1177 if (name != NULL)
1178 scm_puts (name, port);
1179 else
1180 PRINT_CHAR_ESCAPE (ch, port);
1181 }
1182 }
1183
1184 /* Write CH to PORT, escaping it if it's non-graphic or not
1185 representable in PORT's encoding. If STRING_ESCAPES_P is true and CH
1186 needs to be escaped, it is escaped using the in-string escape syntax;
1187 otherwise the character escape syntax is used. */
1188 static void
1189 write_character (scm_t_wchar ch, SCM port, int string_escapes_p)
1190 {
1191 int printed = 0;
1192 scm_t_string_failed_conversion_handler strategy;
1193
1194 strategy = PORT_CONVERSION_HANDLER (port);
1195
1196 if (string_escapes_p)
1197 {
1198 /* Check if CH deserves special treatment. */
1199 if (ch == '"' || ch == '\\')
1200 {
1201 display_character ('\\', port, iconveh_question_mark);
1202 display_character (ch, port, strategy);
1203 printed = 1;
1204 }
1205 else if (ch == '\n' && SCM_PRINT_ESCAPE_NEWLINES_P)
1206 {
1207 display_character ('\\', port, iconveh_question_mark);
1208 display_character ('n', port, strategy);
1209 printed = 1;
1210 }
1211 else if (ch == ' ' || ch == '\n')
1212 {
1213 display_character (ch, port, strategy);
1214 printed = 1;
1215 }
1216 }
1217 else
1218 {
1219 display_string ("#\\", 1, 2, port, iconveh_question_mark);
1220
1221 if (uc_combining_class (ch) != UC_CCC_NR)
1222 /* Character is a combining character, so attempt to
1223 pretty-print it. */
1224 printed = write_combining_character (ch, port);
1225 }
1226
1227 if (!printed
1228 && uc_is_general_category_withtable (ch,
1229 UC_CATEGORY_MASK_L |
1230 UC_CATEGORY_MASK_M |
1231 UC_CATEGORY_MASK_N |
1232 UC_CATEGORY_MASK_P |
1233 UC_CATEGORY_MASK_S))
1234 /* CH is graphic; attempt to display it. */
1235 printed = display_character (ch, port, iconveh_error);
1236
1237 if (!printed)
1238 /* CH isn't graphic or cannot be represented in PORT's encoding. */
1239 write_character_escaped (ch, string_escapes_p, port);
1240 }
1241
1242 /* Display STR to PORT from START inclusive to END exclusive. */
1243 void
1244 scm_i_display_substring (SCM str, size_t start, size_t end, SCM port)
1245 {
1246 int narrow_p;
1247 const char *buf;
1248 size_t len, printed;
1249
1250 buf = scm_i_string_data (str);
1251 len = end - start;
1252 narrow_p = scm_i_is_narrow_string (str);
1253 buf += start * (narrow_p ? sizeof (char) : sizeof (scm_t_wchar));
1254
1255 printed = display_string (buf, narrow_p, end - start, port,
1256 PORT_CONVERSION_HANDLER (port));
1257
1258 if (SCM_UNLIKELY (printed < len))
1259 scm_encoding_error (__func__, errno,
1260 "cannot convert to output locale",
1261 port, scm_c_string_ref (str, printed + start));
1262 }
1263
1264 \f
1265 /* Print an integer.
1266 */
1267
1268 void
1269 scm_intprint (scm_t_intmax n, int radix, SCM port)
1270 {
1271 char num_buf[SCM_INTBUFLEN];
1272 scm_lfwrite (num_buf, scm_iint2str (n, radix, num_buf), port);
1273 }
1274
1275 void
1276 scm_uintprint (scm_t_uintmax n, int radix, SCM port)
1277 {
1278 char num_buf[SCM_INTBUFLEN];
1279 scm_lfwrite (num_buf, scm_iuint2str (n, radix, num_buf), port);
1280 }
1281
1282 /* Print an object of unrecognized type.
1283 */
1284
1285 void
1286 scm_ipruk (char *hdr, SCM ptr, SCM port)
1287 {
1288 scm_puts ("#<unknown-", port);
1289 scm_puts (hdr, port);
1290 if (1) /* (scm_in_heap_p (ptr)) */ /* FIXME */
1291 {
1292 scm_puts (" (0x", port);
1293 scm_uintprint (SCM_CELL_WORD_0 (ptr), 16, port);
1294 scm_puts (" . 0x", port);
1295 scm_uintprint (SCM_CELL_WORD_1 (ptr), 16, port);
1296 scm_puts (") @", port);
1297 }
1298 scm_puts (" 0x", port);
1299 scm_uintprint (SCM_UNPACK (ptr), 16, port);
1300 scm_putc ('>', port);
1301 }
1302
1303
1304 /* Print a list.
1305 */
1306 void
1307 scm_iprlist (char *hdr, SCM exp, int tlr, SCM port, scm_print_state *pstate)
1308 {
1309 register SCM hare, tortoise;
1310 long floor = pstate->top - 2;
1311 scm_puts (hdr, port);
1312 /* CHECK_INTS; */
1313 if (pstate->fancyp)
1314 goto fancy_printing;
1315
1316 /* Run a hare and tortoise so that total time complexity will be
1317 O(depth * N) instead of O(N^2). */
1318 hare = SCM_CDR (exp);
1319 tortoise = exp;
1320 while (scm_is_pair (hare))
1321 {
1322 if (scm_is_eq (hare, tortoise))
1323 goto fancy_printing;
1324 hare = SCM_CDR (hare);
1325 if (!scm_is_pair (hare))
1326 break;
1327 hare = SCM_CDR (hare);
1328 tortoise = SCM_CDR (tortoise);
1329 }
1330
1331 /* No cdr cycles intrinsic to this list */
1332 scm_iprin1 (SCM_CAR (exp), port, pstate);
1333 for (exp = SCM_CDR (exp); scm_is_pair (exp); exp = SCM_CDR (exp))
1334 {
1335 register long i;
1336
1337 for (i = floor; i >= 0; --i)
1338 if (scm_is_eq (PSTATE_STACK_REF(pstate, i), exp))
1339 goto circref;
1340 PUSH_REF (pstate, exp);
1341 scm_putc (' ', port);
1342 /* CHECK_INTS; */
1343 scm_iprin1 (SCM_CAR (exp), port, pstate);
1344 }
1345 if (!SCM_NULL_OR_NIL_P (exp))
1346 {
1347 scm_puts (" . ", port);
1348 scm_iprin1 (exp, port, pstate);
1349 }
1350
1351 end:
1352 scm_putc (tlr, port);
1353 pstate->top = floor + 2;
1354 return;
1355
1356 fancy_printing:
1357 {
1358 long n = pstate->length;
1359
1360 scm_iprin1 (SCM_CAR (exp), port, pstate);
1361 exp = SCM_CDR (exp); --n;
1362 for (; scm_is_pair (exp); exp = SCM_CDR (exp))
1363 {
1364 register unsigned long i;
1365
1366 for (i = 0; i < pstate->top; ++i)
1367 if (scm_is_eq (PSTATE_STACK_REF(pstate, i), exp))
1368 goto fancy_circref;
1369 if (pstate->fancyp)
1370 {
1371 if (n == 0)
1372 {
1373 scm_puts (" ...", port);
1374 goto skip_tail;
1375 }
1376 else
1377 --n;
1378 }
1379 PUSH_REF(pstate, exp);
1380 ++pstate->list_offset;
1381 scm_putc (' ', port);
1382 /* CHECK_INTS; */
1383 scm_iprin1 (SCM_CAR (exp), port, pstate);
1384 }
1385 }
1386 if (!SCM_NULL_OR_NIL_P (exp))
1387 {
1388 scm_puts (" . ", port);
1389 scm_iprin1 (exp, port, pstate);
1390 }
1391 skip_tail:
1392 pstate->list_offset -= pstate->top - floor - 2;
1393 goto end;
1394
1395 fancy_circref:
1396 pstate->list_offset -= pstate->top - floor - 2;
1397
1398 circref:
1399 scm_puts (" . ", port);
1400 print_circref (port, pstate, exp);
1401 goto end;
1402 }
1403
1404 \f
1405
1406 int
1407 scm_valid_oport_value_p (SCM val)
1408 {
1409 return (SCM_OPOUTPORTP (val)
1410 || (SCM_PORT_WITH_PS_P (val)
1411 && SCM_OPOUTPORTP (SCM_PORT_WITH_PS_PORT (val))));
1412 }
1413
1414 /* SCM_GPROC(s_write, "write", 1, 1, 0, scm_write, g_write); */
1415
1416 SCM
1417 scm_write (SCM obj, SCM port)
1418 {
1419 if (SCM_UNBNDP (port))
1420 port = scm_current_output_port ();
1421
1422 SCM_ASSERT (scm_valid_oport_value_p (port), port, SCM_ARG2, s_write);
1423
1424 scm_prin1 (obj, port, 1);
1425 return SCM_UNSPECIFIED;
1426 }
1427
1428
1429 /* SCM_GPROC(s_display, "display", 1, 1, 0, scm_display, g_display); */
1430
1431 SCM
1432 scm_display (SCM obj, SCM port)
1433 {
1434 if (SCM_UNBNDP (port))
1435 port = scm_current_output_port ();
1436
1437 SCM_ASSERT (scm_valid_oport_value_p (port), port, SCM_ARG2, s_display);
1438
1439 scm_prin1 (obj, port, 0);
1440 return SCM_UNSPECIFIED;
1441 }
1442
1443
1444 SCM_DEFINE (scm_simple_format, "simple-format", 2, 0, 1,
1445 (SCM destination, SCM message, SCM args),
1446 "Write @var{message} to @var{destination}, defaulting to\n"
1447 "the current output port.\n"
1448 "@var{message} can contain @code{~A} (was @code{%s}) and\n"
1449 "@code{~S} (was @code{%S}) escapes. When printed,\n"
1450 "the escapes are replaced with corresponding members of\n"
1451 "@var{args}:\n"
1452 "@code{~A} formats using @code{display} and @code{~S} formats\n"
1453 "using @code{write}.\n"
1454 "If @var{destination} is @code{#t}, then use the current output\n"
1455 "port, if @var{destination} is @code{#f}, then return a string\n"
1456 "containing the formatted text. Does not add a trailing newline.")
1457 #define FUNC_NAME s_scm_simple_format
1458 {
1459 SCM port, answer = SCM_UNSPECIFIED;
1460 int fReturnString = 0;
1461 int writingp;
1462 size_t start, p, end;
1463
1464 if (scm_is_eq (destination, SCM_BOOL_T))
1465 {
1466 destination = port = scm_current_output_port ();
1467 }
1468 else if (scm_is_false (destination))
1469 {
1470 fReturnString = 1;
1471 port = scm_mkstrport (SCM_INUM0, SCM_BOOL_F,
1472 SCM_OPN | SCM_WRTNG,
1473 FUNC_NAME);
1474 destination = port;
1475 }
1476 else
1477 {
1478 SCM_VALIDATE_OPORT_VALUE (1, destination);
1479 port = SCM_COERCE_OUTPORT (destination);
1480 }
1481 SCM_VALIDATE_STRING (2, message);
1482 SCM_VALIDATE_REST_ARGUMENT (args);
1483
1484 p = 0;
1485 start = 0;
1486 end = scm_i_string_length (message);
1487 for (p = start; p != end; ++p)
1488 if (scm_i_string_ref (message, p) == '~')
1489 {
1490 if (++p == end)
1491 break;
1492
1493 switch (scm_i_string_ref (message, p))
1494 {
1495 case 'A': case 'a':
1496 writingp = 0;
1497 break;
1498 case 'S': case 's':
1499 writingp = 1;
1500 break;
1501 case '~':
1502 scm_lfwrite_substr (message, start, p, port);
1503 start = p + 1;
1504 continue;
1505 case '%':
1506 scm_lfwrite_substr (message, start, p - 1, port);
1507 scm_newline (port);
1508 start = p + 1;
1509 continue;
1510 default:
1511 SCM_MISC_ERROR ("FORMAT: Unsupported format option ~~~A - use (ice-9 format) instead",
1512 scm_list_1 (SCM_MAKE_CHAR (scm_i_string_ref (message, p))));
1513
1514 }
1515
1516
1517 if (!scm_is_pair (args))
1518 SCM_MISC_ERROR ("FORMAT: Missing argument for ~~~A",
1519 scm_list_1 (SCM_MAKE_CHAR (scm_i_string_ref (message, p))));
1520
1521 scm_lfwrite_substr (message, start, p - 1, port);
1522 /* we pass destination here */
1523 scm_prin1 (SCM_CAR (args), destination, writingp);
1524 args = SCM_CDR (args);
1525 start = p + 1;
1526 }
1527
1528 scm_lfwrite_substr (message, start, p, port);
1529 if (!scm_is_eq (args, SCM_EOL))
1530 SCM_MISC_ERROR ("FORMAT: ~A superfluous arguments",
1531 scm_list_1 (scm_length (args)));
1532
1533 if (fReturnString)
1534 answer = scm_strport_to_string (destination);
1535
1536 return scm_return_first (answer, message);
1537 }
1538 #undef FUNC_NAME
1539
1540
1541 SCM_DEFINE (scm_newline, "newline", 0, 1, 0,
1542 (SCM port),
1543 "Send a newline to @var{port}.\n"
1544 "If @var{port} is omitted, send to the current output port.")
1545 #define FUNC_NAME s_scm_newline
1546 {
1547 if (SCM_UNBNDP (port))
1548 port = scm_current_output_port ();
1549
1550 SCM_VALIDATE_OPORT_VALUE (1, port);
1551
1552 scm_putc ('\n', SCM_COERCE_OUTPORT (port));
1553 return SCM_UNSPECIFIED;
1554 }
1555 #undef FUNC_NAME
1556
1557 SCM_DEFINE (scm_write_char, "write-char", 1, 1, 0,
1558 (SCM chr, SCM port),
1559 "Send character @var{chr} to @var{port}.")
1560 #define FUNC_NAME s_scm_write_char
1561 {
1562 if (SCM_UNBNDP (port))
1563 port = scm_current_output_port ();
1564
1565 SCM_VALIDATE_CHAR (1, chr);
1566 SCM_VALIDATE_OPORT_VALUE (2, port);
1567
1568 port = SCM_COERCE_OUTPORT (port);
1569 if (!display_character (SCM_CHAR (chr), port,
1570 PORT_CONVERSION_HANDLER (port)))
1571 scm_encoding_error (__func__, errno,
1572 "cannot convert to output locale",
1573 port, chr);
1574
1575 return SCM_UNSPECIFIED;
1576 }
1577 #undef FUNC_NAME
1578
1579 \f
1580
1581 /* Call back to Scheme code to do the printing of special objects
1582 * (like structs). SCM_PRINTER_APPLY applies PROC to EXP and a smob
1583 * containing PORT and PSTATE. This object can be used as the port for
1584 * display/write etc to continue the current print chain. The REVEALED
1585 * field of PSTATE is set to true to indicate that the print state has
1586 * escaped to Scheme and thus has to be freed by the GC.
1587 */
1588
1589 scm_t_bits scm_tc16_port_with_ps;
1590
1591 /* Print exactly as the port itself would */
1592
1593 static int
1594 port_with_ps_print (SCM obj, SCM port, scm_print_state *pstate)
1595 {
1596 obj = SCM_PORT_WITH_PS_PORT (obj);
1597 return scm_ptobs[SCM_PTOBNUM (obj)].print (obj, port, pstate);
1598 }
1599
1600 SCM
1601 scm_printer_apply (SCM proc, SCM exp, SCM port, scm_print_state *pstate)
1602 {
1603 pstate->revealed = 1;
1604 return scm_call_2 (proc, exp,
1605 scm_i_port_with_print_state (port, pstate->handle));
1606 }
1607
1608 SCM_DEFINE (scm_port_with_print_state, "port-with-print-state", 1, 1, 0,
1609 (SCM port, SCM pstate),
1610 "Create a new port which behaves like @var{port}, but with an\n"
1611 "included print state @var{pstate}. @var{pstate} is optional.\n"
1612 "If @var{pstate} isn't supplied and @var{port} already has\n"
1613 "a print state, the old print state is reused.")
1614 #define FUNC_NAME s_scm_port_with_print_state
1615 {
1616 SCM_VALIDATE_OPORT_VALUE (1, port);
1617 if (!SCM_UNBNDP (pstate))
1618 SCM_VALIDATE_PRINTSTATE (2, pstate);
1619 return scm_i_port_with_print_state (port, pstate);
1620 }
1621 #undef FUNC_NAME
1622
1623 SCM_DEFINE (scm_get_print_state, "get-print-state", 1, 0, 0,
1624 (SCM port),
1625 "Return the print state of the port @var{port}. If @var{port}\n"
1626 "has no associated print state, @code{#f} is returned.")
1627 #define FUNC_NAME s_scm_get_print_state
1628 {
1629 if (SCM_PORT_WITH_PS_P (port))
1630 return SCM_PORT_WITH_PS_PS (port);
1631 if (SCM_OUTPUT_PORT_P (port))
1632 return SCM_BOOL_F;
1633 SCM_WRONG_TYPE_ARG (1, port);
1634 }
1635 #undef FUNC_NAME
1636
1637 \f
1638
1639 void
1640 scm_init_print ()
1641 {
1642 SCM type;
1643
1644 scm_gc_register_root (&print_state_pool);
1645 scm_gc_register_root (&scm_print_state_vtable);
1646 type = scm_make_vtable (scm_from_locale_string (SCM_PRINT_STATE_LAYOUT),
1647 SCM_BOOL_F);
1648 scm_set_struct_vtable_name_x (type, scm_from_latin1_symbol ("print-state"));
1649 scm_print_state_vtable = type;
1650
1651 /* Don't want to bind a wrapper class in GOOPS, so pass 0 as arg1. */
1652 scm_tc16_port_with_ps = scm_make_smob_type (0, 0);
1653 scm_set_smob_print (scm_tc16_port_with_ps, port_with_ps_print);
1654
1655 #include "libguile/print.x"
1656
1657 scm_init_opts (scm_print_options, scm_print_opts);
1658 scm_print_opts[SCM_PRINT_HIGHLIGHT_PREFIX_I].val =
1659 SCM_UNPACK (scm_from_locale_string ("{"));
1660 scm_print_opts[SCM_PRINT_HIGHLIGHT_SUFFIX_I].val =
1661 SCM_UNPACK (scm_from_locale_string ("}"));
1662 scm_print_opts[SCM_PRINT_KEYWORD_STYLE_I].val = SCM_UNPACK (sym_reader);
1663 }
1664
1665 /*
1666 Local Variables:
1667 c-file-style: "gnu"
1668 End:
1669 */