Print the faulty object upon invalid-keyword errors.
[bpt/guile.git] / libguile / print.c
CommitLineData
f4bc4e59 1/* Copyright (C) 1995-1999, 2000, 2001, 2002, 2003, 2004, 2006, 2008,
e4598559 2 * 2009, 2010, 2011, 2012, 2013 Free Software Foundation, Inc.
f4bc4e59 3 *
73be1d9e 4 * This library is free software; you can redistribute it and/or
53befeb7
NJ
5 * modify it under the terms of the GNU Lesser General Public License
6 * as published by the Free Software Foundation; either version 3 of
7 * the License, or (at your option) any later version.
0f2d19dd 8 *
53befeb7
NJ
9 * This library is distributed in the hope that it will be useful, but
10 * WITHOUT ANY WARRANTY; without even the implied warranty of
73be1d9e
MV
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 * Lesser General Public License for more details.
0f2d19dd 13 *
73be1d9e
MV
14 * You should have received a copy of the GNU Lesser General Public
15 * License along with this library; if not, write to the Free Software
53befeb7
NJ
16 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
17 * 02110-1301 USA
73be1d9e 18 */
1bbd0b84 19
1bbd0b84 20
0f2d19dd 21\f
dbb605f5
LC
22#ifdef HAVE_CONFIG_H
23# include <config.h>
24#endif
0f2d19dd 25
e6e2e95a 26#include <errno.h>
f4bc4e59
LC
27#include <iconv.h>
28#include <stdio.h>
29#include <assert.h>
30
eca29b02 31#include <uniconv.h>
904a78f1 32#include <unictype.h>
96965a6e 33#include <c-strcase.h>
e6e2e95a 34
a0599745
MD
35#include "libguile/_scm.h"
36#include "libguile/chars.h"
a002f1a2 37#include "libguile/continuations.h"
a0599745 38#include "libguile/smob.h"
bbb2ecd1 39#include "libguile/control.h"
a0599745
MD
40#include "libguile/eval.h"
41#include "libguile/macros.h"
42#include "libguile/procprop.h"
43#include "libguile/read.h"
44#include "libguile/weaks.h"
2fb924f6 45#include "libguile/programs.h"
a0599745
MD
46#include "libguile/alist.h"
47#include "libguile/struct.h"
a0599745 48#include "libguile/ports.h"
e4598559 49#include "libguile/ports-internal.h"
a0599745
MD
50#include "libguile/root.h"
51#include "libguile/strings.h"
52#include "libguile/strports.h"
53#include "libguile/vectors.h"
327967ef 54#include "libguile/numbers.h"
6f3b0cc2 55#include "libguile/vm.h"
a0599745
MD
56
57#include "libguile/validate.h"
58#include "libguile/print.h"
22fc179a
HWN
59
60#include "libguile/private-options.h"
61
0f2d19dd
JB
62\f
63
07f49ac7
LC
64/* Character printers. */
65
478848cb
LC
66#define PORT_CONVERSION_HANDLER(port) \
67 SCM_PTAB_ENTRY (port)->ilseq_handler
68
f4bc4e59
LC
69static size_t display_string (const void *, int, size_t, SCM,
70 scm_t_string_failed_conversion_handler);
71
07f49ac7
LC
72static int display_character (scm_t_wchar, SCM,
73 scm_t_string_failed_conversion_handler);
f4bc4e59 74
07f49ac7
LC
75static void write_character (scm_t_wchar, SCM, int);
76
f4bc4e59
LC
77static void write_character_escaped (scm_t_wchar, int, SCM);
78
07f49ac7
LC
79\f
80
0f2d19dd
JB
81/* {Names of immediate symbols}
82 *
83 * This table must agree with the declarations in scm.h: {Immediate Symbols}.
84 */
85
e17d318f
DH
/* Printed representations of the immediate flags.  The printer indexes
   this table with SCM_IFLAGNUM, so its order must agree with the list
   of flags in tags.h.  */
#define UNUSED_IFLAG(what) \
  "#<XXX UNUSED " what " -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>"

static const char *iflagnames[] =
{
  "#f",
  "#nil",  /* Elisp nil value.  Should print from elisp as symbol `nil'.  */
  UNUSED_IFLAG ("LISP FALSE"),
  "()",
  "#t",
  UNUSED_IFLAG ("BOOLEAN 0"),
  UNUSED_IFLAG ("BOOLEAN 1"),
  UNUSED_IFLAG ("BOOLEAN 2"),
  "#<unspecified>",
  "#<undefined>",
  "#<eof>",

  /* Unbound slot marker for GOOPS.  For internal use in GOOPS only.  */
  "#<unbound>",
};

#undef UNUSED_IFLAG
104
475fa9a5
MV
105SCM_SYMBOL (sym_reader, "reader");
106
92c2555f 107scm_t_option scm_print_opts[] = {
210c0325 108 { SCM_OPTION_SCM, "highlight-prefix", (scm_t_bits)SCM_BOOL_F_BITS,
81ae25da 109 "The string to print before highlighted values." },
210c0325 110 { SCM_OPTION_SCM, "highlight-suffix", (scm_t_bits)SCM_BOOL_F_BITS,
475fa9a5 111 "The string to print after highlighted values." },
210c0325 112 { SCM_OPTION_SCM, "quote-keywordish-symbols", (scm_t_bits)SCM_BOOL_F_BITS,
475fa9a5
MV
113 "How to print symbols that have a colon as their first or last character. "
114 "The value '#f' does not quote the colons; '#t' quotes them; "
8500b186
AW
115 "'reader' quotes them when the reader option 'keywords' is not '#f'." },
116 { SCM_OPTION_BOOLEAN, "escape-newlines", 1,
117 "Render newlines as \\n when printing using `write'." },
62560650 118 { 0 },
e6e4c9af
MD
119};
120
a1ec6916 121SCM_DEFINE (scm_print_options, "print-options-interface", 0, 1, 0,
1bbd0b84 122 (SCM setting),
71331188 123 "Option interface for the print options. Instead of using\n"
1dd05fd8
MG
124 "this procedure directly, use the procedures\n"
125 "@code{print-enable}, @code{print-disable}, @code{print-set!}\n"
126 "and @code{print-options}.")
1bbd0b84 127#define FUNC_NAME s_scm_print_options
e6e4c9af 128{
a51ea417 129 SCM ans = scm_options (setting,
b7ff98dd 130 scm_print_opts,
1bbd0b84 131 FUNC_NAME);
e6e4c9af
MD
132 return ans;
133}
1bbd0b84 134#undef FUNC_NAME
e6e4c9af 135
0f2d19dd
JB
136\f
137/* {Printing of Scheme Objects}
138 */
139
a51ea417 140/* Detection of circular references.
c62fbfe1
MD
 *
 * Due to other constraints in the implementation, this code has bad
 * time complexity (O (depth * N)).  The printer code can be
 * rewritten to be O (N).
a51ea417 145 */
dbb5de29
NJ
/* Push OBJ onto PSTATE's stack of objects currently being printed and
   grow the stack as soon as it becomes full.  The macro parameters are
   parenthesized so that any pointer-valued expression may be passed as
   PSTATE.  */
#define PUSH_REF(pstate, obj)                                   \
  do                                                            \
    {                                                           \
      PSTATE_STACK_SET ((pstate), (pstate)->top, (obj));        \
      (pstate)->top++;                                          \
      if ((pstate)->top == (pstate)->ceiling)                   \
        grow_ref_stack (pstate);                                \
    }                                                           \
  while (0)
a51ea417 154
dbb5de29
NJ
/* Begin printing the nested object OBJ.

   If OBJ is already on PSTATE's reference stack, jump to LABEL.
   Otherwise, when PSTATE is in fancy mode and the current nesting
   depth (top - list_offset) has reached PSTATE's `level', write `#' and
   return from the enclosing function.  In all other cases push OBJ on
   the reference stack.

   Caveats: the expansion uses a variable named `port' from the
   enclosing scope and contains a bare `return', so it may only be used
   inside a function returning void.  The loop variable has a
   deliberately unusual name so that it cannot capture an identifier
   appearing in the OBJ or PSTATE arguments.  */
#define ENTER_NESTED_DATA(pstate, obj, label)                                 \
  do                                                                          \
    {                                                                         \
      register unsigned long enter_nested_i_;                                 \
      for (enter_nested_i_ = 0;                                               \
           enter_nested_i_ < (pstate)->top;                                   \
           ++enter_nested_i_)                                                 \
        if (scm_is_eq (PSTATE_STACK_REF ((pstate), enter_nested_i_), (obj)))  \
          goto label;                                                         \
      if ((pstate)->fancyp)                                                   \
        {                                                                     \
          if ((pstate)->top - (pstate)->list_offset >= (pstate)->level)       \
            {                                                                 \
              scm_putc ('#', port);                                           \
              return;                                                         \
            }                                                                 \
        }                                                                     \
      PUSH_REF ((pstate), (obj));                                             \
    }                                                                         \
  while (0)
a51ea417 172
dbb5de29
NJ
/* Finish printing a nested object: pop the top entry of PSTATE's
   reference stack and overwrite the vacated slot with SCM_UNDEFINED.
   PSTATE is parenthesized so that any pointer-valued expression may be
   passed.  */
#define EXIT_NESTED_DATA(pstate)                                        \
  do                                                                    \
    {                                                                   \
      --(pstate)->top;                                                  \
      PSTATE_STACK_SET ((pstate), (pstate)->top, SCM_UNDEFINED);        \
    }                                                                   \
  while (0)
c62fbfe1 180
d5cf5324
DH
/* Vtable passed to scm_make_struct when creating print states.  It is
   SCM_BOOL_F here; presumably it is set up during initialization
   elsewhere in this file -- TODO confirm.  */
181SCM scm_print_state_vtable = SCM_BOOL_F;
/* List of print states available for reuse.  scm_make_print_state,
   scm_free_print_state and scm_prin1 modify it with print_state_mutex
   held.  */
182static SCM print_state_pool = SCM_EOL;
/* Mutex taken around updates of print_state_pool.  */
9de87eea 183scm_i_pthread_mutex_t print_state_mutex = SCM_I_PTHREAD_MUTEX_INITIALIZER;
c4f37e80 184
f843a84c 185#ifdef GUILE_DEBUG /* Used for debugging purposes */
1cc91f1b 186
3b3b36dd 187SCM_DEFINE (scm_current_pstate, "current-pstate", 0, 0, 0,
1bbd0b84 188 (),
d5cf5324 189 "Return the current-pstate -- the car of the\n"
5352393c
MG
190 "@code{print_state_pool}. @code{current-pstate} is only\n"
191 "included in @code{--enable-guile-debug} builds.")
1bbd0b84 192#define FUNC_NAME s_scm_current_pstate
c62fbfe1 193{
d2e53ed6 194 if (!scm_is_null (print_state_pool))
d5cf5324 195 return SCM_CAR (print_state_pool);
a0adfbf0 196 else
0a284a4e 197 return SCM_BOOL_F;
c62fbfe1 198}
1bbd0b84
GB
199#undef FUNC_NAME
200
c62fbfe1
MD
201#endif
202
203#define PSTATE_SIZE 50L
204
698c0295 205static SCM
1bbd0b84 206make_print_state (void)
698c0295 207{
d5cf5324
DH
208 SCM print_state
209 = scm_make_struct (scm_print_state_vtable, SCM_INUM0, SCM_EOL);
bf685b6d 210 scm_print_state *pstate = SCM_PRINT_STATE (print_state);
00ffa0e7 211 pstate->ref_vect = scm_c_make_vector (PSTATE_SIZE, SCM_UNDEFINED);
4057a3e0 212 pstate->ceiling = SCM_SIMPLE_VECTOR_LENGTH (pstate->ref_vect);
d232520a 213 pstate->highlight_objects = SCM_EOL;
698c0295
MD
214 return print_state;
215}
1cc91f1b 216
c62fbfe1
MD
217SCM
218scm_make_print_state ()
c62fbfe1 219{
230d095f 220 SCM answer = SCM_BOOL_F;
698c0295
MD
221
222 /* First try to allocate a print state from the pool */
9de87eea 223 scm_i_pthread_mutex_lock (&print_state_mutex);
d2e53ed6 224 if (!scm_is_null (print_state_pool))
698c0295 225 {
d5cf5324
DH
226 answer = SCM_CAR (print_state_pool);
227 print_state_pool = SCM_CDR (print_state_pool);
698c0295 228 }
9de87eea 229 scm_i_pthread_mutex_unlock (&print_state_mutex);
698c0295 230
7888309b 231 return scm_is_false (answer) ? make_print_state () : answer;
c62fbfe1 232}
a51ea417 233
698c0295 234void
6e8d25a6 235scm_free_print_state (SCM print_state)
698c0295
MD
236{
237 SCM handle;
238 scm_print_state *pstate = SCM_PRINT_STATE (print_state);
239 /* Cleanup before returning print state to pool.
240 * It is better to do it here. Doing it in scm_prin1
241 * would cost more since that function is called much more
242 * often.
243 */
244 pstate->fancyp = 0;
bb35f315 245 pstate->revealed = 0;
d232520a 246 pstate->highlight_objects = SCM_EOL;
9de87eea 247 scm_i_pthread_mutex_lock (&print_state_mutex);
16d4699b 248 handle = scm_cons (print_state, print_state_pool);
d5cf5324 249 print_state_pool = handle;
9de87eea 250 scm_i_pthread_mutex_unlock (&print_state_mutex);
dfd03fb9
MD
251}
252
253SCM
254scm_i_port_with_print_state (SCM port, SCM print_state)
255{
256 if (SCM_UNBNDP (print_state))
257 {
258 if (SCM_PORT_WITH_PS_P (port))
259 return port;
260 else
261 print_state = scm_make_print_state ();
262 /* port does not need to be coerced since it doesn't have ps */
263 }
264 else
265 port = SCM_COERCE_OUTPORT (port);
266 SCM_RETURN_NEWSMOB (scm_tc16_port_with_ps,
267 SCM_UNPACK (scm_cons (port, print_state)));
698c0295 268}
1cc91f1b 269
a51ea417 270static void
1bbd0b84 271grow_ref_stack (scm_print_state *pstate)
a51ea417 272{
4057a3e0
MV
273 SCM old_vect = pstate->ref_vect;
274 size_t old_size = SCM_SIMPLE_VECTOR_LENGTH (old_vect);
275 size_t new_size = 2 * pstate->ceiling;
00ffa0e7 276 SCM new_vect = scm_c_make_vector (new_size, SCM_UNDEFINED);
b17004b8
DH
277 unsigned long int i;
278
279 for (i = 0; i != old_size; ++i)
4057a3e0 280 SCM_SIMPLE_VECTOR_SET (new_vect, i, SCM_SIMPLE_VECTOR_REF (old_vect, i));
b17004b8
DH
281
282 pstate->ref_vect = new_vect;
bf685b6d 283 pstate->ceiling = new_size;
a51ea417
MD
284}
285
509759dd
MV
/* Read (PSTATE_STACK_REF) or write (PSTATE_STACK_SET) slot I of the
   reference stack of print state P; the stack lives in the simple
   vector P->ref_vect.  */
286#define PSTATE_STACK_REF(p,i) SCM_SIMPLE_VECTOR_REF((p)->ref_vect, (i))
287#define PSTATE_STACK_SET(p,i,v) SCM_SIMPLE_VECTOR_SET((p)->ref_vect, (i), (v))
1cc91f1b 288
a51ea417 289static void
34d19ef6 290print_circref (SCM port, scm_print_state *pstate, SCM ref)
a51ea417 291{
c014a02e
ML
292 register long i;
293 long self = pstate->top - 1;
c62fbfe1 294 i = pstate->top - 1;
509759dd 295 if (scm_is_pair (PSTATE_STACK_REF (pstate, i)))
c62fbfe1
MD
296 {
297 while (i > 0)
298 {
509759dd
MV
299 if (!scm_is_pair (PSTATE_STACK_REF (pstate, i-1))
300 || !scm_is_eq (SCM_CDR (PSTATE_STACK_REF (pstate, i-1)),
301 SCM_CDR (PSTATE_STACK_REF (pstate, i))))
c62fbfe1
MD
302 break;
303 --i;
304 }
305 self = i;
306 }
307 for (i = pstate->top - 1; 1; --i)
509759dd 308 if (scm_is_eq (PSTATE_STACK_REF(pstate, i), ref))
c62fbfe1 309 break;
b7f3516f 310 scm_putc ('#', port);
c62fbfe1 311 scm_intprint (i - self, 10, port);
b7f3516f 312 scm_putc ('#', port);
a51ea417
MD
313}
314
6662998f
MV
315/* Print the name of a symbol. */
316
475fa9a5 317static int
15671c6e 318quote_keywordish_symbols (void)
475fa9a5 319{
15671c6e 320 SCM option = SCM_PRINT_KEYWORD_STYLE;
475fa9a5 321
475fa9a5
MV
322 if (scm_is_false (option))
323 return 0;
324 if (scm_is_eq (option, sym_reader))
325 return scm_is_true (SCM_PACK (SCM_KEYWORD_STYLE));
326 return 1;
327}
328
2e9fc9fc
AW
/* Unicode general categories accepted for the first character of a
   symbol printed without the extended `#{...}#' syntax: the letter
   categories (Lu Ll Lt Lm Lo), Mn, the number categories Nl and No, the
   punctuation categories Pd Pc Po, the symbol categories Sc Sm Sk So,
   and Co.  */
#define INITIAL_IDENTIFIER_MASK                                         \
  (UC_CATEGORY_MASK_Lu | UC_CATEGORY_MASK_Ll | UC_CATEGORY_MASK_Lt     \
   | UC_CATEGORY_MASK_Lm | UC_CATEGORY_MASK_Lo                          \
   | UC_CATEGORY_MASK_Mn                                                \
   | UC_CATEGORY_MASK_Nl | UC_CATEGORY_MASK_No                          \
   | UC_CATEGORY_MASK_Pd | UC_CATEGORY_MASK_Pc | UC_CATEGORY_MASK_Po   \
   | UC_CATEGORY_MASK_Sc | UC_CATEGORY_MASK_Sm | UC_CATEGORY_MASK_Sk   \
   | UC_CATEGORY_MASK_So                                                \
   | UC_CATEGORY_MASK_Co)

/* Categories accepted for the remaining characters: everything allowed
   initially, plus Nd, Mc and Me.  */
#define SUBSEQUENT_IDENTIFIER_MASK                                      \
  (INITIAL_IDENTIFIER_MASK                                              \
   | UC_CATEGORY_MASK_Nd | UC_CATEGORY_MASK_Mc | UC_CATEGORY_MASK_Me)
340
15671c6e
AW
341static int
342symbol_has_extended_read_syntax (SCM sym)
6662998f 343{
15671c6e
AW
344 size_t pos, len = scm_i_symbol_length (sym);
345 scm_t_wchar c;
346
347 /* The empty symbol. */
348 if (len == 0)
349 return 1;
350
351 c = scm_i_symbol_ref (sym, 0);
352
353 /* Single dot; conflicts with dotted-pair notation. */
354 if (len == 1 && c == '.')
355 return 1;
356
357 /* Other initial-character constraints. */
2e9fc9fc 358 if (c == '\'' || c == '`' || c == ',' || c == '"' || c == ';' || c == '#')
15671c6e
AW
359 return 1;
360
361 /* Keywords can be identified by trailing colons too. */
362 if (c == ':' || scm_i_symbol_ref (sym, len - 1) == ':')
363 return quote_keywordish_symbols ();
364
365 /* Number-ish symbols. */
366 if (scm_is_true (scm_i_string_to_number (scm_symbol_to_string (sym), 10)))
367 return 1;
368
2e9fc9fc
AW
369 /* Other disallowed first characters. */
370 if (!uc_is_general_category_withtable (c, INITIAL_IDENTIFIER_MASK))
371 return 1;
372
373 /* Otherwise, any character that's in the identifier category mask is
374 fine to pass through as-is, provided it's not one of the ASCII
375 delimiters like `;'. */
376 for (pos = 1; pos < len; pos++)
6662998f 377 {
2e9fc9fc
AW
378 c = scm_i_symbol_ref (sym, pos);
379 if (!uc_is_general_category_withtable (c, SUBSEQUENT_IDENTIFIER_MASK))
380 return 1;
381 else if (c == '"' || c == ';' || c == '#')
382 return 1;
6662998f 383 }
c6b49e89 384
15671c6e
AW
385 return 0;
386}
387
388static void
389print_normal_symbol (SCM sym, SCM port)
390{
391 scm_display (scm_symbol_to_string (sym), port);
392}
393
15671c6e
AW
394static void
395print_extended_symbol (SCM sym, SCM port)
396{
397 size_t pos, len;
398 scm_t_string_failed_conversion_handler strategy;
399
400 len = scm_i_symbol_length (sym);
478848cb 401 strategy = PORT_CONVERSION_HANDLER (port);
15671c6e
AW
402
403 scm_lfwrite ("#{", 2, port);
404
405 for (pos = 0; pos < len; pos++)
406 {
407 scm_t_wchar c = scm_i_symbol_ref (sym, pos);
408
2e9fc9fc
AW
409 if (uc_is_general_category_withtable (c,
410 SUBSEQUENT_IDENTIFIER_MASK
411 | UC_CATEGORY_MASK_Zs))
15671c6e 412 {
15671c6e
AW
413 if (!display_character (c, port, strategy))
414 scm_encoding_error ("print_extended_symbol", errno,
415 "cannot convert to output locale",
416 port, SCM_MAKE_CHAR (c));
2e9fc9fc
AW
417 }
418 else
419 {
420 display_string ("\\x", 1, 2, port, iconveh_question_mark);
421 scm_intprint (c, 16, port);
422 display_character (';', port, iconveh_question_mark);
15671c6e
AW
423 }
424 }
425
426 scm_lfwrite ("}#", 2, port);
427}
428
429/* FIXME: allow R6RS hex escapes instead of #{...}#. */
430void
431scm_i_print_symbol_name (SCM sym, SCM port)
432{
433 if (symbol_has_extended_read_syntax (sym))
434 print_extended_symbol (sym, port);
435 else
436 print_normal_symbol (sym, port);
6662998f
MV
437}
438
e23106d5
MG
439void
440scm_print_symbol_name (const char *str, size_t len, SCM port)
441{
442 SCM symbol = scm_from_locale_symboln (str, len);
ab33782c 443 scm_i_print_symbol_name (symbol, port);
e23106d5
MG
444}
445
c62fbfe1 446/* Print generally. Handles both write and display according to PSTATE.
0f2d19dd 447 */
8b840115
MD
/* Declare the Scheme procedures `write' and `display' (C functions
   scm_write and scm_display) together with g_write and g_display.
   iprin1 below calls g_write / g_display through scm_call_generic_2
   when printing GOOPS instances.  NOTE(review): the numeric arguments
   look like the required/optional/rest argument counts -- confirm
   against the SCM_GPROC definition.  */
448SCM_GPROC(s_write, "write", 1, 1, 0, scm_write, g_write);
449SCM_GPROC(s_display, "display", 1, 1, 0, scm_display, g_display);
1cc91f1b 450
d232520a
MV
451static void iprin1 (SCM exp, SCM port, scm_print_state *pstate);
452
dea901d6
MG
453
/* Print the code I to PORT as the digits of a character escape: `x'
   followed by hexadecimal digits when R6RS escapes are enabled, plain
   octal digits otherwise.  */
#define PRINT_CHAR_ESCAPE(i, port)              \
  do                                            \
    {                                           \
      if (SCM_R6RS_ESCAPES_P)                   \
        {                                       \
          scm_puts ("x", port);                 \
          scm_intprint (i, 16, port);           \
        }                                       \
      else                                      \
        scm_intprint (i, 8, port);              \
    }                                           \
  while (0)
467
468
0f2d19dd 469void
1bbd0b84 470scm_iprin1 (SCM exp, SCM port, scm_print_state *pstate)
d232520a
MV
471{
472 if (pstate->fancyp
473 && scm_is_true (scm_memq (exp, pstate->highlight_objects)))
474 {
81ae25da 475 scm_display (SCM_PRINT_HIGHLIGHT_PREFIX, port);
d232520a 476 iprin1 (exp, port, pstate);
81ae25da 477 scm_display (SCM_PRINT_HIGHLIGHT_SUFFIX, port);
d232520a
MV
478 }
479 else
480 iprin1 (exp, port, pstate);
481}
482
/* Print EXP to PORT according to PSTATE; this is the worker behind
   scm_iprin1.  It dispatches first on the 3-bit tag of EXP and, for
   non-immediates, on the 7-bit type code.  Container-like objects
   (structs, pairs, arrays, vectors, smobs) are bracketed by
   ENTER_NESTED_DATA / EXIT_NESTED_DATA; ENTER_NESTED_DATA jumps to the
   `circref' label when EXP is already being printed and may return
   early after printing `#' when the depth limit is reached.  */
483static void
484iprin1 (SCM exp, SCM port, scm_print_state *pstate)
0f2d19dd 485{
54778cd3 486 switch (SCM_ITAG3 (exp))
0f2d19dd 487 {
e34f941a
DH
488 case scm_tc3_tc7_1:
489 case scm_tc3_tc7_2:
490 /* These tc3 tags should never occur in an immediate value. They are
491 * only used in cell types of non-immediates, i. e. the value returned
492 * by SCM_CELL_TYPE (exp) can use these tags.
493 */
494 scm_ipruk ("immediate", exp, port);
495 break;
/* Fixnums are printed in decimal.  */
496 case scm_tc3_int_1:
497 case scm_tc3_int_2:
e11e83f3 498 scm_intprint (SCM_I_INUM (exp), 10, port);
0f2d19dd 499 break;
/* Other immediates: characters and the flags listed in iflagnames.  */
e34f941a 500 case scm_tc3_imm24:
7866a09b 501 if (SCM_CHARP (exp))
0f2d19dd 502 {
/* `write' uses the character syntax; `display' emits the character
   itself and raises an encoding error if that fails.  */
b7f3516f 503 if (SCM_WRITINGP (pstate))
07f49ac7
LC
504 write_character (SCM_CHAR (exp), port, 0);
505 else
b7f3516f 506 {
07f49ac7 507 if (!display_character (SCM_CHAR (exp), port,
478848cb 508 PORT_CONVERSION_HANDLER (port)))
07f49ac7
LC
509 scm_encoding_error (__func__, errno,
510 "cannot convert to output locale",
6851d3be 511 port, exp);
b7f3516f 512 }
0f2d19dd 513 }
/* Flags whose number is within the bounds of the iflagnames table.  */
a51ea417 514 else if (SCM_IFLAGP (exp)
e17d318f
DH
515 && ((size_t) SCM_IFLAGNUM (exp) < (sizeof iflagnames / sizeof (char *))))
516 {
517 scm_puts (iflagnames [SCM_IFLAGNUM (exp)], port);
518 }
0f2d19dd 519 else
e34f941a
DH
520 {
521 /* unknown immediate value */
522 scm_ipruk ("immediate", exp, port);
523 }
0f2d19dd 524 break;
/* Non-immediates: dispatch on the 7-bit type code.  */
e34f941a 525 case scm_tc3_cons:
0f2d19dd
JB
526 switch (SCM_TYP7 (exp))
527 {
904a077d
MV
528 case scm_tcs_struct:
529 {
530 ENTER_NESTED_DATA (pstate, exp, circref);
/* GOOPS instances are printed by calling the `write' or `display'
   generic with a port that carries the print state; the print state is
   marked as revealed before the call.  When the generic is not set
   (its bits are 0), fall back to scm_print_struct.  */
531 if (SCM_OBJ_CLASS_FLAGS (exp) & SCM_CLASSF_GOOPS)
532 {
533 SCM pwps, print = pstate->writingp ? g_write : g_display;
b2b33168 534 if (SCM_UNPACK (print) == 0)
904a077d 535 goto print_struct;
dfd03fb9 536 pwps = scm_i_port_with_print_state (port, pstate->handle);
7663c008 537 pstate->revealed = 1;
904a077d
MV
538 scm_call_generic_2 (print, exp, pwps);
539 }
540 else
541 {
542 print_struct:
543 scm_print_struct (exp, port, pstate);
544 }
545 EXIT_NESTED_DATA (pstate);
546 }
547 break;
0f2d19dd
JB
548 case scm_tcs_cons_imcar:
549 case scm_tcs_cons_nimcar:
c62fbfe1
MD
550 ENTER_NESTED_DATA (pstate, exp, circref);
551 scm_iprlist ("(", exp, ')', port, pstate);
552 EXIT_NESTED_DATA (pstate);
a51ea417
MD
553 break;
/* Target of every ENTER_NESTED_DATA in this function: EXP is already
   on the reference stack, so print a `#N#' marker instead.  */
554 circref:
c62fbfe1 555 print_circref (port, pstate, exp);
0f2d19dd 556 break;
/* Heap-allocated numbers; there is no default case, so any other
   16-bit type code prints nothing.  */
534c55a9
DH
557 case scm_tc7_number:
558 switch SCM_TYP16 (exp) {
559 case scm_tc16_big:
560 scm_bigprint (exp, port, pstate);
561 break;
562 case scm_tc16_real:
563 scm_print_real (exp, port, pstate);
564 break;
565 case scm_tc16_complex:
566 scm_print_complex (exp, port, pstate);
567 break;
f92e85f7
MV
568 case scm_tc16_fraction:
569 scm_i_print_fraction (exp, port, pstate);
570 break;
534c55a9
DH
571 }
572 break;
/* Strings: `write' puts the string between double quotes and passes
   each character to write_character with its last argument set to 1;
   `display' sends the characters through display_string and raises an
   encoding error if fewer than LEN of them could be printed.  */
9c44cd45
MG
573 case scm_tc7_string:
574 if (SCM_WRITINGP (pstate))
575 {
07f49ac7 576 size_t len, i;
9c44cd45 577
f4bc4e59 578 display_character ('"', port, iconveh_question_mark);
9c44cd45
MG
579 len = scm_i_string_length (exp);
580 for (i = 0; i < len; ++i)
07f49ac7
LC
581 write_character (scm_i_string_ref (exp, i), port, 1);
582
f4bc4e59 583 display_character ('"', port, iconveh_question_mark);
9c44cd45
MG
584 scm_remember_upto_here_1 (exp);
585 }
586 else
f4bc4e59
LC
587 {
588 size_t len, printed;
589
590 len = scm_i_string_length (exp);
591 printed = display_string (scm_i_string_data (exp),
592 scm_i_is_narrow_string (exp),
593 len, port,
478848cb 594 PORT_CONVERSION_HANDLER (port));
f4bc4e59 595 if (SCM_UNLIKELY (printed < len))
f4bc4e59
LC
596 scm_encoding_error (__func__, errno,
597 "cannot convert to output locale",
6851d3be 598 port, scm_c_string_ref (exp, printed));
f4bc4e59
LC
599 }
600
9c44cd45
MG
601 scm_remember_upto_here_1 (exp);
602 break;
/* Symbols: interned ones print as their name; uninterned ones as
   `#<uninterned-symbol NAME HEX>' where HEX is the object's bits.  */
28b06554 603 case scm_tc7_symbol:
cc95e00a 604 if (scm_i_symbol_is_interned (exp))
9ff28a13 605 {
e23106d5 606 scm_i_print_symbol_name (exp, port);
9ff28a13
MV
607 scm_remember_upto_here_1 (exp);
608 }
609 else
610 {
611 scm_puts ("#<uninterned-symbol ", port);
e23106d5 612 scm_i_print_symbol_name (exp, port);
9ff28a13 613 scm_putc (' ', port);
0345e278 614 scm_uintprint (SCM_UNPACK (exp), 16, port);
9ff28a13
MV
615 scm_putc ('>', port);
616 }
6662998f 617 break;
/* The following types each delegate to their own print function.  */
e5aca4b5
MV
618 case scm_tc7_variable:
619 scm_i_variable_print (exp, port, pstate);
620 break;
2fb924f6
AW
621 case scm_tc7_program:
622 scm_i_program_print (exp, port, pstate);
623 break;
5b46a8c2
LC
624 case scm_tc7_pointer:
625 scm_i_pointer_print (exp, port, pstate);
e2c2a699 626 break;
c99de5aa
AW
627 case scm_tc7_hashtable:
628 scm_i_hashtable_print (exp, port, pstate);
629 break;
9ea31741
AW
630 case scm_tc7_fluid:
631 scm_i_fluid_print (exp, port, pstate);
632 break;
45cf2428
AW
633 case scm_tc7_dynamic_state:
634 scm_i_dynamic_state_print (exp, port, pstate);
635 break;
6f3b0cc2
AW
636 case scm_tc7_frame:
637 scm_i_frame_print (exp, port, pstate);
638 break;
639 case scm_tc7_objcode:
640 scm_i_objcode_print (exp, port, pstate);
641 break;
642 case scm_tc7_vm:
643 scm_i_vm_print (exp, port, pstate);
644 break;
645 case scm_tc7_vm_cont:
646 scm_i_vm_cont_print (exp, port, pstate);
647 break;
bbb2ecd1
AW
648 case scm_tc7_prompt:
649 scm_i_prompt_print (exp, port, pstate);
650 break;
651 case scm_tc7_with_fluids:
652 scm_i_with_fluids_print (exp, port, pstate);
653 break;
b2637c98
AW
654 case scm_tc7_array:
655 ENTER_NESTED_DATA (pstate, exp, circref);
656 scm_i_print_array (exp, port, pstate);
88c0a1d5 657 EXIT_NESTED_DATA (pstate);
b2637c98
AW
658 break;
659 case scm_tc7_bytevector:
660 scm_i_print_bytevector (exp, port, pstate);
661 break;
ff1feca9
AW
662 case scm_tc7_bitvector:
663 scm_i_print_bitvector (exp, port, pstate);
664 break;
/* Weak vectors and vectors differ only in their opening token
   ("#wh(", "#w(" or "#("); the elements are printed by the shared code
   at `common_vector_printer'.  */
0f2d19dd 665 case scm_tc7_wvect:
c62fbfe1 666 ENTER_NESTED_DATA (pstate, exp, circref);
0f2d19dd 667 if (SCM_IS_WHVEC (exp))
b7f3516f 668 scm_puts ("#wh(", port);
0f2d19dd 669 else
b7f3516f 670 scm_puts ("#w(", port);
0f2d19dd 671 goto common_vector_printer;
0f2d19dd 672 case scm_tc7_vector:
c62fbfe1 673 ENTER_NESTED_DATA (pstate, exp, circref);
b7f3516f 674 scm_puts ("#(", port);
0f2d19dd 675 common_vector_printer:
9fbaf27c 676 {
c014a02e 677 register long i;
/* LAST is the index of the last element to print.  In fancy mode a
   vector longer than PSTATE's length limit is cut there and followed
   by " ...".  */
4057a3e0 678 long last = SCM_SIMPLE_VECTOR_LENGTH (exp) - 1;
9fbaf27c 679 int cutp = 0;
4057a3e0
MV
680 if (pstate->fancyp
681 && SCM_SIMPLE_VECTOR_LENGTH (exp) > pstate->length)
9fbaf27c
MD
682 {
683 last = pstate->length - 1;
684 cutp = 1;
685 }
/* Print every element before LAST, each followed by a space.  */
c367c4b4 686 if (SCM_I_WVECTP (exp))
9fbaf27c 687 {
c367c4b4
LC
688 /* Elements of weak vectors may not be accessed via the
689 `SIMPLE_VECTOR_REF ()' macro. */
690 for (i = 0; i < last; ++i)
691 {
692 scm_iprin1 (scm_c_vector_ref (exp, i),
693 port, pstate);
694 scm_putc (' ', port);
695 }
9fbaf27c 696 }
c367c4b4
LC
697 else
698 {
699 for (i = 0; i < last; ++i)
700 {
701 scm_iprin1 (SCM_SIMPLE_VECTOR_REF (exp, i), port, pstate);
702 scm_putc (' ', port);
703 }
704 }
705
/* Print the element at LAST without a trailing space.  When LAST is
   negative, I is still 0 here and nothing is printed.  */
9fbaf27c
MD
706 if (i == last)
707 {
708 /* CHECK_INTS; */
c367c4b4 709 scm_iprin1 (scm_c_vector_ref (exp, i), port, pstate);
9fbaf27c
MD
710 }
711 if (cutp)
b7f3516f
TT
712 scm_puts (" ...", port);
713 scm_putc (')', port);
9fbaf27c 714 }
c62fbfe1 715 EXIT_NESTED_DATA (pstate);
0f2d19dd 716 break;
/* Ports: use the print function of the port type when there is one and
   it returns non-zero; otherwise treat the object as unknown.  */
0f2d19dd 717 case scm_tc7_port:
5ca6dc39
JB
718 {
719 register long i = SCM_PTOBNUM (exp);
720 if (i < scm_numptob
721 && scm_ptobs[i].print
722 && (scm_ptobs[i].print) (exp, port, pstate))
a51ea417 723 break;
5ca6dc39
JB
724 goto punk;
725 }
/* Smobs are printed by the print function of their descriptor.  */
726 case scm_tc7_smob:
7a7f7c53
DH
727 ENTER_NESTED_DATA (pstate, exp, circref);
728 SCM_SMOB_DESCRIPTOR (exp).print (exp, port, pstate);
729 EXIT_NESTED_DATA (pstate);
730 break;
/* Anything else is reported through scm_ipruk as an unknown "type".  */
0f2d19dd 731 default:
314b8716 732 /* case scm_tcs_closures: */
a51ea417
MD
733 punk:
734 scm_ipruk ("type", exp, port);
0f2d19dd
JB
735 }
736 }
737}
738
c62fbfe1
MD
739/* Print states are necessary for circular reference safe printing.
740 * They are also expensive to allocate. Therefore print states are
741 * kept in a pool so that they can be reused.
742 */
1cc91f1b 743
bb35f315
MV
744/* The PORT argument can also be a print-state/port pair, which will
745 * then be used instead of allocating a new print state. This is
746 * useful for continuing a chain of print calls from Scheme. */
747
a51ea417 748void
1bbd0b84 749scm_prin1 (SCM exp, SCM port, int writingp)
a51ea417 750{
c4f37e80
MV
751 SCM handle = SCM_BOOL_F; /* Will GC protect the handle whilst unlinked */
752 SCM pstate_scm;
c62fbfe1 753 scm_print_state *pstate;
15635be5 754 int old_writingp;
c62fbfe1 755
bb35f315
MV
756 /* If PORT is a print-state/port pair, use that. Else create a new
757 print-state. */
c4f37e80 758
0c95b57d 759 if (SCM_PORT_WITH_PS_P (port))
bb35f315 760 {
52235e71
MD
761 pstate_scm = SCM_PORT_WITH_PS_PS (port);
762 port = SCM_PORT_WITH_PS_PORT (port);
bb35f315
MV
763 }
764 else
c62fbfe1 765 {
c4f37e80 766 /* First try to allocate a print state from the pool */
9de87eea 767 scm_i_pthread_mutex_lock (&print_state_mutex);
d2e53ed6 768 if (!scm_is_null (print_state_pool))
c4f37e80 769 {
d5cf5324
DH
770 handle = print_state_pool;
771 print_state_pool = SCM_CDR (print_state_pool);
c4f37e80 772 }
9de87eea 773 scm_i_pthread_mutex_unlock (&print_state_mutex);
7888309b 774 if (scm_is_false (handle))
d5cf5324 775 handle = scm_list_1 (make_print_state ());
c4f37e80 776 pstate_scm = SCM_CAR (handle);
c62fbfe1 777 }
c62fbfe1 778
c4f37e80 779 pstate = SCM_PRINT_STATE (pstate_scm);
15635be5 780 old_writingp = pstate->writingp;
c62fbfe1
MD
781 pstate->writingp = writingp;
782 scm_iprin1 (exp, port, pstate);
15635be5 783 pstate->writingp = old_writingp;
c62fbfe1 784
bb35f315
MV
785 /* Return print state to pool if it has been created above and
786 hasn't escaped to Scheme. */
787
7888309b 788 if (scm_is_true (handle) && !pstate->revealed)
c4f37e80 789 {
9de87eea 790 scm_i_pthread_mutex_lock (&print_state_mutex);
d5cf5324
DH
791 SCM_SETCDR (handle, print_state_pool);
792 print_state_pool = handle;
9de87eea 793 scm_i_pthread_mutex_unlock (&print_state_mutex);
c4f37e80 794 }
a51ea417
MD
795}
796
f4bc4e59
LC
797/* Convert codepoint CH to UTF-8 and store the result in UTF8. Return
798 the number of bytes of the UTF-8-encoded string. */
799static size_t
800codepoint_to_utf8 (scm_t_wchar ch, scm_t_uint8 utf8[4])
9c44cd45 801{
f4bc4e59
LC
802 size_t len;
803 scm_t_uint32 codepoint;
804
805 codepoint = (scm_t_uint32) ch;
07f49ac7 806
f4bc4e59 807 if (codepoint <= 0x7f)
07f49ac7 808 {
f4bc4e59
LC
809 len = 1;
810 utf8[0] = (scm_t_uint8) codepoint;
811 }
812 else if (codepoint <= 0x7ffUL)
813 {
814 len = 2;
815 utf8[0] = 0xc0 | (codepoint >> 6);
816 utf8[1] = 0x80 | (codepoint & 0x3f);
817 }
818 else if (codepoint <= 0xffffUL)
819 {
820 len = 3;
821 utf8[0] = 0xe0 | (codepoint >> 12);
822 utf8[1] = 0x80 | ((codepoint >> 6) & 0x3f);
823 utf8[2] = 0x80 | (codepoint & 0x3f);
07f49ac7
LC
824 }
825 else
826 {
f4bc4e59
LC
827 len = 4;
828 utf8[0] = 0xf0 | (codepoint >> 18);
829 utf8[1] = 0x80 | ((codepoint >> 12) & 0x3f);
830 utf8[2] = 0x80 | ((codepoint >> 6) & 0x3f);
831 utf8[3] = 0x80 | (codepoint & 0x3f);
832 }
833
834 return len;
835}
836
f4bc4e59
LC
/* Fetch codepoint number X of the string data S.  Relies on a variable
   named `narrow_p' being in scope at the point of use: when it is true
   S is read as an array of `unsigned char', otherwise as an array of
   `scm_t_wchar'.  The index is parenthesized so that any expression
   may be passed as X.  */
#define STR_REF(s, x)                                   \
  (narrow_p                                             \
   ? (scm_t_wchar) ((unsigned char *) (s))[(x)]         \
   : ((scm_t_wchar *) (s))[(x)])
841
7b292a9d
LC
842/* Write STR to PORT as UTF-8. STR is a LEN-codepoint string; it is
843 narrow if NARROW_P is true, wide otherwise. Return LEN. */
844static size_t
845display_string_as_utf8 (const void *str, int narrow_p, size_t len,
846 SCM port)
847{
848 size_t printed = 0;
849
850 while (len > printed)
851 {
852 size_t utf8_len, i;
853 char *input, utf8_buf[256];
854
855 /* Convert STR to UTF-8. */
856 for (i = printed, utf8_len = 0, input = utf8_buf;
857 i < len && utf8_len + 4 < sizeof (utf8_buf);
858 i++)
859 {
860 utf8_len += codepoint_to_utf8 (STR_REF (str, i),
861 (scm_t_uint8 *) input);
862 input = utf8_buf + utf8_len;
863 }
864
865 /* INPUT was successfully converted, entirely; print the
866 result. */
867 scm_lfwrite (utf8_buf, utf8_len, port);
868 printed += i - printed;
869 }
870
871 assert (printed == len);
872
873 return len;
874}
875
876/* Convert STR through PORT's output conversion descriptor and write the
877 output to PORT. Return the number of codepoints written. */
878static size_t
879display_string_using_iconv (const void *str, int narrow_p, size_t len,
880 SCM port,
881 scm_t_string_failed_conversion_handler strategy)
882{
f4bc4e59 883 size_t printed;
337edc59 884 scm_t_iconv_descriptors *id;
cdd3d6c9 885 scm_t_port_internal *pti = SCM_PORT_GET_INTERNAL (port);
f4bc4e59 886
cdd3d6c9
MW
887 id = scm_i_port_iconv_descriptors (port, SCM_PORT_WRITE);
888
889 if (SCM_UNLIKELY (pti->at_stream_start_for_bom_write && len > 0))
890 {
891 scm_t_port *pt = SCM_PTAB_ENTRY (port);
892
893 /* Record that we're no longer at stream start. */
894 pti->at_stream_start_for_bom_write = 0;
895 if (pt->rw_random)
896 pti->at_stream_start_for_bom_read = 0;
897
898 /* Write a BOM if appropriate. */
96965a6e
MW
899 if (SCM_UNLIKELY (c_strcasecmp(pt->encoding, "UTF-16") == 0
900 || c_strcasecmp(pt->encoding, "UTF-32") == 0))
cdd3d6c9
MW
901 display_character (SCM_UNICODE_BOM, port, iconveh_error);
902 }
f4bc4e59 903
f4bc4e59
LC
904 printed = 0;
905
906 while (len > printed)
907 {
908 size_t done, utf8_len, input_left, output_left, i;
909 size_t codepoints_read, output_len;
910 char *input, *output;
911 char utf8_buf[256], encoded_output[256];
912 size_t offsets[256];
913
914 /* Convert STR to UTF-8. */
915 for (i = printed, utf8_len = 0, input = utf8_buf;
916 i < len && utf8_len + 4 < sizeof (utf8_buf);
917 i++)
07f49ac7 918 {
f4bc4e59
LC
919 offsets[utf8_len] = i;
920 utf8_len += codepoint_to_utf8 (STR_REF (str, i),
921 (scm_t_uint8 *) input);
922 input = utf8_buf + utf8_len;
923 }
924
925 input = utf8_buf;
926 input_left = utf8_len;
927
928 output = encoded_output;
929 output_left = sizeof (encoded_output);
930
337edc59 931 done = iconv (id->output_cd, &input, &input_left,
f4bc4e59 932 &output, &output_left);
07f49ac7 933
f4bc4e59
LC
934 output_len = sizeof (encoded_output) - output_left;
935
936 if (SCM_UNLIKELY (done == (size_t) -1))
937 {
b2548e23
AW
938 int errno_save = errno;
939
f4bc4e59 940 /* Reset the `iconv' state. */
337edc59 941 iconv (id->output_cd, NULL, NULL, NULL, NULL);
f4bc4e59 942
7174bc08
LC
943 /* Print the OUTPUT_LEN bytes successfully converted. */
944 scm_lfwrite (encoded_output, output_len, port);
945
946 /* See how many input codepoints these OUTPUT_LEN bytes
947 corresponds to. */
948 codepoints_read = offsets[input - utf8_buf] - printed;
949 printed += codepoints_read;
950
b2548e23 951 if (errno_save == EILSEQ &&
f4bc4e59 952 strategy != SCM_FAILED_CONVERSION_ERROR)
07f49ac7 953 {
f4bc4e59
LC
954 /* Conversion failed somewhere in INPUT and we want to
955 escape or substitute the offending input character. */
956
f4bc4e59 957 if (strategy == SCM_FAILED_CONVERSION_ESCAPE_SEQUENCE)
f1ee6d54 958 {
f4bc4e59
LC
959 scm_t_wchar ch;
960
961 /* Find CH, the offending codepoint, and escape it. */
962 ch = STR_REF (str, offsets[input - utf8_buf]);
963 write_character_escaped (ch, 1, port);
f1ee6d54 964 }
07f49ac7 965 else
f4bc4e59
LC
966 /* STRATEGY is `SCM_FAILED_CONVERSION_QUESTION_MARK'. */
967 display_string ("?", 1, 1, port, strategy);
9c44cd45 968
f4bc4e59
LC
969 printed++;
970 }
971 else
972 /* Something bad happened that we can't handle: bail out. */
973 break;
07f49ac7
LC
974 }
975 else
f4bc4e59
LC
976 {
977 /* INPUT was successfully converted, entirely; print the
978 result. */
979 scm_lfwrite (encoded_output, output_len, port);
980 codepoints_read = i - printed;
981 printed += codepoints_read;
982 }
07f49ac7
LC
983 }
984
985 return printed;
7b292a9d
LC
986}
987
f4bc4e59 988#undef STR_REF
7b292a9d
LC
989
990/* Display the LEN codepoints in STR to PORT according to STRATEGY;
991 return the number of codepoints successfully displayed. If NARROW_P,
992 then STR is interpreted as a sequence of `char', denoting a Latin-1
993 string; otherwise it's interpreted as a sequence of
994 `scm_t_wchar'. */
995static size_t
996display_string (const void *str, int narrow_p,
997 size_t len, SCM port,
998 scm_t_string_failed_conversion_handler strategy)
999
1000{
e4598559 1001 scm_t_port_internal *pti;
7b292a9d 1002
e4598559 1003 pti = SCM_PORT_GET_INTERNAL (port);
7b292a9d 1004
337edc59 1005 if (pti->encoding_mode == SCM_PORT_ENCODING_MODE_UTF8)
7b292a9d
LC
1006 return display_string_as_utf8 (str, narrow_p, len, port);
1007 else
1008 return display_string_using_iconv (str, narrow_p, len,
1009 port, strategy);
f4bc4e59
LC
1010}
1011
1012/* Attempt to display CH to PORT according to STRATEGY. Return non-zero
1013 if CH was successfully displayed, zero otherwise (e.g., if it was not
1014 representable in PORT's encoding.) */
1015static int
1016display_character (scm_t_wchar ch, SCM port,
1017 scm_t_string_failed_conversion_handler strategy)
1018{
1019 return display_string (&ch, 0, 1, port, strategy) == 1;
07f49ac7
LC
1020}
1021
33d92fe6
LC
1022/* Attempt to pretty-print CH, a combining character, to PORT. Return
1023 zero upon failure, non-zero otherwise. The idea is to print CH above
1024 a dotted circle to make it more visible. */
1025static int
1026write_combining_character (scm_t_wchar ch, SCM port)
1027{
f4bc4e59
LC
1028 scm_t_wchar str[2];
1029
1030 str[0] = SCM_CODEPOINT_DOTTED_CIRCLE;
1031 str[1] = ch;
1032
1033 return display_string (str, 0, 2, port, iconveh_error) == 2;
1034}
33d92fe6 1035
f4bc4e59
LC
1036/* Write CH to PORT in its escaped form, using the string escape syntax
1037 if STRING_ESCAPES_P is non-zero. */
1038static void
1039write_character_escaped (scm_t_wchar ch, int string_escapes_p, SCM port)
1040{
1041 if (string_escapes_p)
33d92fe6 1042 {
f4bc4e59
LC
1043 /* Represent CH using the in-string escape syntax. */
1044
1045 static const char hex[] = "0123456789abcdef";
1046 static const char escapes[7] = "abtnvfr";
1047 char buf[9];
1048
1049 if (ch >= 0x07 && ch <= 0x0D && ch != 0x0A)
33d92fe6 1050 {
f4bc4e59
LC
1051 /* Use special escapes for some C0 controls. */
1052 buf[0] = '\\';
1053 buf[1] = escapes[ch - 0x07];
1054 scm_lfwrite (buf, 2, port);
1055 }
1056 else if (!SCM_R6RS_ESCAPES_P)
1057 {
1058 if (ch <= 0xFF)
1059 {
1060 buf[0] = '\\';
1061 buf[1] = 'x';
1062 buf[2] = hex[ch / 16];
1063 buf[3] = hex[ch % 16];
1064 scm_lfwrite (buf, 4, port);
1065 }
1066 else if (ch <= 0xFFFF)
1067 {
1068 buf[0] = '\\';
1069 buf[1] = 'u';
1070 buf[2] = hex[(ch & 0xF000) >> 12];
1071 buf[3] = hex[(ch & 0xF00) >> 8];
1072 buf[4] = hex[(ch & 0xF0) >> 4];
1073 buf[5] = hex[(ch & 0xF)];
1074 scm_lfwrite (buf, 6, port);
1075 }
1076 else if (ch > 0xFFFF)
1077 {
1078 buf[0] = '\\';
1079 buf[1] = 'U';
1080 buf[2] = hex[(ch & 0xF00000) >> 20];
1081 buf[3] = hex[(ch & 0xF0000) >> 16];
1082 buf[4] = hex[(ch & 0xF000) >> 12];
1083 buf[5] = hex[(ch & 0xF00) >> 8];
1084 buf[6] = hex[(ch & 0xF0) >> 4];
1085 buf[7] = hex[(ch & 0xF)];
1086 scm_lfwrite (buf, 8, port);
1087 }
33d92fe6
LC
1088 }
1089 else
f4bc4e59
LC
1090 {
1091 /* Print an R6RS variable-length hex escape: "\xNNNN;". */
1092 scm_t_wchar ch2 = ch;
1093
1094 int i = 8;
1095 buf[i] = ';';
1096 i --;
1097 if (ch == 0)
1098 buf[i--] = '0';
1099 else
1100 while (ch2 > 0)
1101 {
1102 buf[i] = hex[ch2 & 0xF];
1103 ch2 >>= 4;
1104 i --;
1105 }
1106 buf[i] = 'x';
1107 i --;
1108 buf[i] = '\\';
1109 scm_lfwrite (buf + i, 9 - i, port);
1110 }
33d92fe6
LC
1111 }
1112 else
f4bc4e59
LC
1113 {
1114 /* Represent CH using the character escape syntax. */
1115 const char *name;
33d92fe6 1116
f4bc4e59
LC
1117 name = scm_i_charname (SCM_MAKE_CHAR (ch));
1118 if (name != NULL)
1119 scm_puts (name, port);
1120 else
1121 PRINT_CHAR_ESCAPE (ch, port);
1122 }
33d92fe6
LC
1123}
1124
07f49ac7
LC
1125/* Write CH to PORT, escaping it if it's non-graphic or not
1126 representable in PORT's encoding. If STRING_ESCAPES_P is true and CH
1127 needs to be escaped, it is escaped using the in-string escape syntax;
1128 otherwise the character escape syntax is used. */
1129static void
1130write_character (scm_t_wchar ch, SCM port, int string_escapes_p)
1131{
1132 int printed = 0;
f4bc4e59
LC
1133 scm_t_string_failed_conversion_handler strategy;
1134
478848cb 1135 strategy = PORT_CONVERSION_HANDLER (port);
07f49ac7
LC
1136
1137 if (string_escapes_p)
1138 {
1139 /* Check if CH deserves special treatment. */
1140 if (ch == '"' || ch == '\\')
1141 {
f4bc4e59
LC
1142 display_character ('\\', port, iconveh_question_mark);
1143 display_character (ch, port, strategy);
07f49ac7
LC
1144 printed = 1;
1145 }
8500b186
AW
1146 else if (ch == '\n' && SCM_PRINT_ESCAPE_NEWLINES_P)
1147 {
1148 display_character ('\\', port, iconveh_question_mark);
1149 display_character ('n', port, strategy);
1150 printed = 1;
1151 }
07f49ac7
LC
1152 else if (ch == ' ' || ch == '\n')
1153 {
f4bc4e59 1154 display_character (ch, port, strategy);
07f49ac7
LC
1155 printed = 1;
1156 }
1157 }
1158 else
33d92fe6 1159 {
f4bc4e59 1160 display_string ("#\\", 1, 2, port, iconveh_question_mark);
33d92fe6
LC
1161
1162 if (uc_combining_class (ch) != UC_CCC_NR)
1163 /* Character is a combining character, so attempt to
1164 pretty-print it. */
1165 printed = write_combining_character (ch, port);
1166 }
07f49ac7
LC
1167
1168 if (!printed
1169 && uc_is_general_category_withtable (ch,
1170 UC_CATEGORY_MASK_L |
1171 UC_CATEGORY_MASK_M |
1172 UC_CATEGORY_MASK_N |
1173 UC_CATEGORY_MASK_P |
1174 UC_CATEGORY_MASK_S))
1175 /* CH is graphic; attempt to display it. */
1176 printed = display_character (ch, port, iconveh_error);
1177
1178 if (!printed)
f4bc4e59
LC
1179 /* CH isn't graphic or cannot be represented in PORT's encoding. */
1180 write_character_escaped (ch, string_escapes_p, port);
9c44cd45 1181}
0f2d19dd 1182
b908768a
LC
1183/* Display STR to PORT from START inclusive to END exclusive. */
1184void
1185scm_i_display_substring (SCM str, size_t start, size_t end, SCM port)
1186{
1187 int narrow_p;
1188 const char *buf;
1189 size_t len, printed;
1190
1191 buf = scm_i_string_data (str);
1192 len = end - start;
1193 narrow_p = scm_i_is_narrow_string (str);
1194 buf += start * (narrow_p ? sizeof (char) : sizeof (scm_t_wchar));
1195
1196 printed = display_string (buf, narrow_p, end - start, port,
1197 PORT_CONVERSION_HANDLER (port));
1198
1199 if (SCM_UNLIKELY (printed < len))
1200 scm_encoding_error (__func__, errno,
1201 "cannot convert to output locale",
1202 port, scm_c_string_ref (str, printed + start));
1203}
1204
1205\f
0f2d19dd
JB
1206/* Print an integer.
1207 */
1cc91f1b 1208
0f2d19dd 1209void
a406c9e9 1210scm_intprint (scm_t_intmax n, int radix, SCM port)
0f2d19dd
JB
1211{
1212 char num_buf[SCM_INTBUFLEN];
b7f3516f 1213 scm_lfwrite (num_buf, scm_iint2str (n, radix, num_buf), port);
0f2d19dd
JB
1214}
1215
a406c9e9
MV
1216void
1217scm_uintprint (scm_t_uintmax n, int radix, SCM port)
1218{
1219 char num_buf[SCM_INTBUFLEN];
1220 scm_lfwrite (num_buf, scm_iuint2str (n, radix, num_buf), port);
1221}
1222
0f2d19dd
JB
1223/* Print an object of unrecognized type.
1224 */
1cc91f1b 1225
0f2d19dd 1226void
1bbd0b84 1227scm_ipruk (char *hdr, SCM ptr, SCM port)
0f2d19dd 1228{
b7f3516f
TT
1229 scm_puts ("#<unknown-", port);
1230 scm_puts (hdr, port);
26224b3f 1231 if (1) /* (scm_in_heap_p (ptr)) */ /* FIXME */
0f2d19dd 1232 {
b7f3516f 1233 scm_puts (" (0x", port);
0345e278 1234 scm_uintprint (SCM_CELL_WORD_0 (ptr), 16, port);
b7f3516f 1235 scm_puts (" . 0x", port);
0345e278 1236 scm_uintprint (SCM_CELL_WORD_1 (ptr), 16, port);
b7f3516f 1237 scm_puts (") @", port);
0f2d19dd 1238 }
b7f3516f 1239 scm_puts (" 0x", port);
0345e278 1240 scm_uintprint (SCM_UNPACK (ptr), 16, port);
b7f3516f 1241 scm_putc ('>', port);
0f2d19dd
JB
1242}
1243
1cc91f1b 1244
904a077d 1245/* Print a list.
22a52da1 1246 */
0f2d19dd 1247void
34d19ef6 1248scm_iprlist (char *hdr, SCM exp, int tlr, SCM port, scm_print_state *pstate)
0f2d19dd 1249{
c62fbfe1 1250 register SCM hare, tortoise;
c014a02e 1251 long floor = pstate->top - 2;
b7f3516f 1252 scm_puts (hdr, port);
0f2d19dd 1253 /* CHECK_INTS; */
c62fbfe1
MD
1254 if (pstate->fancyp)
1255 goto fancy_printing;
1256
1257 /* Run a hare and tortoise so that total time complexity will be
1258 O(depth * N) instead of O(N^2). */
1259 hare = SCM_CDR (exp);
1260 tortoise = exp;
d2e53ed6 1261 while (scm_is_pair (hare))
c62fbfe1 1262 {
bc36d050 1263 if (scm_is_eq (hare, tortoise))
c62fbfe1
MD
1264 goto fancy_printing;
1265 hare = SCM_CDR (hare);
d2e53ed6 1266 if (!scm_is_pair (hare))
c62fbfe1
MD
1267 break;
1268 hare = SCM_CDR (hare);
1269 tortoise = SCM_CDR (tortoise);
1270 }
1271
1272 /* No cdr cycles intrinsic to this list */
1273 scm_iprin1 (SCM_CAR (exp), port, pstate);
d2e53ed6 1274 for (exp = SCM_CDR (exp); scm_is_pair (exp); exp = SCM_CDR (exp))
0f2d19dd 1275 {
c014a02e 1276 register long i;
5ca6dc39 1277
c62fbfe1 1278 for (i = floor; i >= 0; --i)
509759dd 1279 if (scm_is_eq (PSTATE_STACK_REF(pstate, i), exp))
c62fbfe1
MD
1280 goto circref;
1281 PUSH_REF (pstate, exp);
b7f3516f 1282 scm_putc (' ', port);
0f2d19dd 1283 /* CHECK_INTS; */
c62fbfe1 1284 scm_iprin1 (SCM_CAR (exp), port, pstate);
0f2d19dd 1285 }
c96d76b8 1286 if (!SCM_NULL_OR_NIL_P (exp))
0f2d19dd 1287 {
b7f3516f 1288 scm_puts (" . ", port);
c62fbfe1 1289 scm_iprin1 (exp, port, pstate);
0f2d19dd 1290 }
c62fbfe1 1291
a51ea417 1292end:
b7f3516f 1293 scm_putc (tlr, port);
c62fbfe1 1294 pstate->top = floor + 2;
a51ea417 1295 return;
c62fbfe1
MD
1296
1297fancy_printing:
1298 {
c014a02e 1299 long n = pstate->length;
c62fbfe1
MD
1300
1301 scm_iprin1 (SCM_CAR (exp), port, pstate);
1302 exp = SCM_CDR (exp); --n;
d2e53ed6 1303 for (; scm_is_pair (exp); exp = SCM_CDR (exp))
c62fbfe1 1304 {
c014a02e 1305 register unsigned long i;
5ca6dc39 1306
c62fbfe1 1307 for (i = 0; i < pstate->top; ++i)
509759dd 1308 if (scm_is_eq (PSTATE_STACK_REF(pstate, i), exp))
c62fbfe1
MD
1309 goto fancy_circref;
1310 if (pstate->fancyp)
1311 {
1312 if (n == 0)
1313 {
b7f3516f 1314 scm_puts (" ...", port);
c62fbfe1
MD
1315 goto skip_tail;
1316 }
1317 else
1318 --n;
1319 }
1320 PUSH_REF(pstate, exp);
1321 ++pstate->list_offset;
b7f3516f 1322 scm_putc (' ', port);
c62fbfe1
MD
1323 /* CHECK_INTS; */
1324 scm_iprin1 (SCM_CAR (exp), port, pstate);
1325 }
1326 }
c96d76b8 1327 if (!SCM_NULL_OR_NIL_P (exp))
c62fbfe1 1328 {
b7f3516f 1329 scm_puts (" . ", port);
c62fbfe1
MD
1330 scm_iprin1 (exp, port, pstate);
1331 }
1332skip_tail:
1333 pstate->list_offset -= pstate->top - floor - 2;
a51ea417 1334 goto end;
a51ea417 1335
c62fbfe1
MD
1336fancy_circref:
1337 pstate->list_offset -= pstate->top - floor - 2;
1338
1339circref:
b7f3516f 1340 scm_puts (" . ", port);
c62fbfe1
MD
1341 print_circref (port, pstate, exp);
1342 goto end;
0f2d19dd
JB
1343}
1344
1345\f
1346
bb35f315
MV
1347int
1348scm_valid_oport_value_p (SCM val)
1349{
368cf54d
GB
1350 return (SCM_OPOUTPORTP (val)
1351 || (SCM_PORT_WITH_PS_P (val)
1352 && SCM_OPOUTPORTP (SCM_PORT_WITH_PS_PORT (val))));
bb35f315
MV
1353}
1354
8b840115 1355/* SCM_GPROC(s_write, "write", 1, 1, 0, scm_write, g_write); */
1cc91f1b 1356
0f2d19dd 1357SCM
1bbd0b84 1358scm_write (SCM obj, SCM port)
0f2d19dd
JB
1359{
1360 if (SCM_UNBNDP (port))
9de87eea 1361 port = scm_current_output_port ();
3eb7e6ee
JB
1362
1363 SCM_ASSERT (scm_valid_oport_value_p (port), port, SCM_ARG2, s_write);
bb35f315 1364
a51ea417 1365 scm_prin1 (obj, port, 1);
0f2d19dd
JB
1366 return SCM_UNSPECIFIED;
1367}
1368
1369
8b840115 1370/* SCM_GPROC(s_display, "display", 1, 1, 0, scm_display, g_display); */
1cc91f1b 1371
0f2d19dd 1372SCM
1bbd0b84 1373scm_display (SCM obj, SCM port)
0f2d19dd
JB
1374{
1375 if (SCM_UNBNDP (port))
9de87eea 1376 port = scm_current_output_port ();
3eb7e6ee
JB
1377
1378 SCM_ASSERT (scm_valid_oport_value_p (port), port, SCM_ARG2, s_display);
bb35f315 1379
a51ea417 1380 scm_prin1 (obj, port, 0);
0f2d19dd
JB
1381 return SCM_UNSPECIFIED;
1382}
1383
70d63753
GB
1384
1385SCM_DEFINE (scm_simple_format, "simple-format", 2, 0, 1,
1386 (SCM destination, SCM message, SCM args),
eca65e90
MG
1387 "Write @var{message} to @var{destination}, defaulting to\n"
1388 "the current output port.\n"
1389 "@var{message} can contain @code{~A} (was @code{%s}) and\n"
1390 "@code{~S} (was @code{%S}) escapes. When printed,\n"
1391 "the escapes are replaced with corresponding members of\n"
b7e64f8b 1392 "@var{args}:\n"
eca65e90
MG
1393 "@code{~A} formats using @code{display} and @code{~S} formats\n"
1394 "using @code{write}.\n"
1395 "If @var{destination} is @code{#t}, then use the current output\n"
1396 "port, if @var{destination} is @code{#f}, then return a string\n"
1397 "containing the formatted text. Does not add a trailing newline.")
70d63753
GB
1398#define FUNC_NAME s_scm_simple_format
1399{
dfd03fb9 1400 SCM port, answer = SCM_UNSPECIFIED;
70d63753
GB
1401 int fReturnString = 0;
1402 int writingp;
889975e5 1403 size_t start, p, end;
70d63753 1404
bc36d050 1405 if (scm_is_eq (destination, SCM_BOOL_T))
daba1a71 1406 {
9de87eea 1407 destination = port = scm_current_output_port ();
daba1a71 1408 }
7888309b 1409 else if (scm_is_false (destination))
daba1a71
MD
1410 {
1411 fReturnString = 1;
0b2c2ba3 1412 port = scm_mkstrport (SCM_INUM0, SCM_BOOL_F,
dfd03fb9
MD
1413 SCM_OPN | SCM_WRTNG,
1414 FUNC_NAME);
1415 destination = port;
daba1a71
MD
1416 }
1417 else
1418 {
1419 SCM_VALIDATE_OPORT_VALUE (1, destination);
dfd03fb9 1420 port = SCM_COERCE_OUTPORT (destination);
daba1a71
MD
1421 }
1422 SCM_VALIDATE_STRING (2, message);
af45e3b0 1423 SCM_VALIDATE_REST_ARGUMENT (args);
70d63753 1424
889975e5
MG
1425 p = 0;
1426 start = 0;
1427 end = scm_i_string_length (message);
b24b5e13 1428 for (p = start; p != end; ++p)
889975e5 1429 if (scm_i_string_ref (message, p) == '~')
70d63753 1430 {
b24b5e13 1431 if (++p == end)
6662998f
MV
1432 break;
1433
889975e5 1434 switch (scm_i_string_ref (message, p))
6662998f
MV
1435 {
1436 case 'A': case 'a':
1437 writingp = 0;
1438 break;
1439 case 'S': case 's':
1440 writingp = 1;
1441 break;
1442 case '~':
889975e5 1443 scm_lfwrite_substr (message, start, p, port);
6662998f
MV
1444 start = p + 1;
1445 continue;
1446 case '%':
889975e5 1447 scm_lfwrite_substr (message, start, p - 1, port);
dfd03fb9 1448 scm_newline (port);
6662998f
MV
1449 start = p + 1;
1450 continue;
1451 default:
1afff620 1452 SCM_MISC_ERROR ("FORMAT: Unsupported format option ~~~A - use (ice-9 format) instead",
889975e5 1453 scm_list_1 (SCM_MAKE_CHAR (scm_i_string_ref (message, p))));
6662998f
MV
1454
1455 }
70d63753 1456
6662998f 1457
d2e53ed6 1458 if (!scm_is_pair (args))
1afff620 1459 SCM_MISC_ERROR ("FORMAT: Missing argument for ~~~A",
889975e5 1460 scm_list_1 (SCM_MAKE_CHAR (scm_i_string_ref (message, p))));
6662998f 1461
889975e5 1462 scm_lfwrite_substr (message, start, p - 1, port);
dfd03fb9 1463 /* we pass destination here */
70d63753
GB
1464 scm_prin1 (SCM_CAR (args), destination, writingp);
1465 args = SCM_CDR (args);
1466 start = p + 1;
1467 }
6662998f 1468
889975e5 1469 scm_lfwrite_substr (message, start, p, port);
bc36d050 1470 if (!scm_is_eq (args, SCM_EOL))
1afff620
KN
1471 SCM_MISC_ERROR ("FORMAT: ~A superfluous arguments",
1472 scm_list_1 (scm_length (args)));
70d63753
GB
1473
1474 if (fReturnString)
1475 answer = scm_strport_to_string (destination);
1476
daba1a71 1477 return scm_return_first (answer, message);
70d63753
GB
1478}
1479#undef FUNC_NAME
1480
1481
3b3b36dd 1482SCM_DEFINE (scm_newline, "newline", 0, 1, 0,
b450f070 1483 (SCM port),
8f85c0c6
NJ
1484 "Send a newline to @var{port}.\n"
1485 "If @var{port} is omitted, send to the current output port.")
1bbd0b84 1486#define FUNC_NAME s_scm_newline
0f2d19dd
JB
1487{
1488 if (SCM_UNBNDP (port))
9de87eea 1489 port = scm_current_output_port ();
3eb7e6ee 1490
34d19ef6 1491 SCM_VALIDATE_OPORT_VALUE (1, port);
bb35f315 1492
0ef4ae82 1493 scm_putc ('\n', SCM_COERCE_OUTPORT (port));
0f2d19dd
JB
1494 return SCM_UNSPECIFIED;
1495}
1bbd0b84 1496#undef FUNC_NAME
0f2d19dd 1497
3b3b36dd 1498SCM_DEFINE (scm_write_char, "write-char", 1, 1, 0,
b450f070 1499 (SCM chr, SCM port),
eca65e90 1500 "Send character @var{chr} to @var{port}.")
1bbd0b84 1501#define FUNC_NAME s_scm_write_char
0f2d19dd
JB
1502{
1503 if (SCM_UNBNDP (port))
9de87eea 1504 port = scm_current_output_port ();
3eb7e6ee 1505
34d19ef6
HWN
1506 SCM_VALIDATE_CHAR (1, chr);
1507 SCM_VALIDATE_OPORT_VALUE (2, port);
07f49ac7
LC
1508
1509 port = SCM_COERCE_OUTPORT (port);
1510 if (!display_character (SCM_CHAR (chr), port,
478848cb 1511 PORT_CONVERSION_HANDLER (port)))
07f49ac7
LC
1512 scm_encoding_error (__func__, errno,
1513 "cannot convert to output locale",
6851d3be 1514 port, chr);
07f49ac7 1515
0f2d19dd
JB
1516 return SCM_UNSPECIFIED;
1517}
1bbd0b84 1518#undef FUNC_NAME
0f2d19dd 1519
0f2d19dd
JB
1520\f
1521
bb35f315 1522/* Call back to Scheme code to do the printing of special objects
c19bc088
MD
1523 * (like structs). SCM_PRINTER_APPLY applies PROC to EXP and a smob
1524 * containing PORT and PSTATE. This object can be used as the port for
1525 * display/write etc to continue the current print chain. The REVEALED
1526 * field of PSTATE is set to true to indicate that the print state has
1527 * escaped to Scheme and thus has to be freed by the GC.
1528 */
1529
92c2555f 1530scm_t_bits scm_tc16_port_with_ps;
c19bc088
MD
1531
1532/* Print exactly as the port itself would */
1533
1534static int
e841c3e0 1535port_with_ps_print (SCM obj, SCM port, scm_print_state *pstate)
c19bc088
MD
1536{
1537 obj = SCM_PORT_WITH_PS_PORT (obj);
1538 return scm_ptobs[SCM_PTOBNUM (obj)].print (obj, port, pstate);
1539}
c4f37e80
MV
1540
1541SCM
1bbd0b84 1542scm_printer_apply (SCM proc, SCM exp, SCM port, scm_print_state *pstate)
c4f37e80 1543{
bb35f315 1544 pstate->revealed = 1;
dfd03fb9
MD
1545 return scm_call_2 (proc, exp,
1546 scm_i_port_with_print_state (port, pstate->handle));
c19bc088
MD
1547}
1548
dfd03fb9 1549SCM_DEFINE (scm_port_with_print_state, "port-with-print-state", 1, 1, 0,
1bbd0b84 1550 (SCM port, SCM pstate),
71331188 1551 "Create a new port which behaves like @var{port}, but with an\n"
dfd03fb9
MD
1552 "included print state @var{pstate}. @var{pstate} is optional.\n"
1553 "If @var{pstate} isn't supplied and @var{port} already has\n"
1554 "a print state, the old print state is reused.")
1bbd0b84 1555#define FUNC_NAME s_scm_port_with_print_state
c19bc088 1556{
34d19ef6 1557 SCM_VALIDATE_OPORT_VALUE (1, port);
dfd03fb9
MD
1558 if (!SCM_UNBNDP (pstate))
1559 SCM_VALIDATE_PRINTSTATE (2, pstate);
1560 return scm_i_port_with_print_state (port, pstate);
c19bc088 1561}
1bbd0b84 1562#undef FUNC_NAME
c19bc088 1563
a1ec6916 1564SCM_DEFINE (scm_get_print_state, "get-print-state", 1, 0, 0,
1bbd0b84 1565 (SCM port),
71331188
MG
1566 "Return the print state of the port @var{port}. If @var{port}\n"
1567 "has no associated print state, @code{#f} is returned.")
1bbd0b84 1568#define FUNC_NAME s_scm_get_print_state
c19bc088 1569{
368cf54d
GB
1570 if (SCM_PORT_WITH_PS_P (port))
1571 return SCM_PORT_WITH_PS_PS (port);
f5f2dcff 1572 if (SCM_OUTPUT_PORT_P (port))
368cf54d 1573 return SCM_BOOL_F;
276dd677 1574 SCM_WRONG_TYPE_ARG (1, port);
c4f37e80 1575}
1bbd0b84 1576#undef FUNC_NAME
bb35f315 1577
c4f37e80 1578\f
1cc91f1b 1579
0f2d19dd
JB
1580void
1581scm_init_print ()
0f2d19dd 1582{
66b1dbf6 1583 SCM type;
d5cf5324 1584
d5cf5324
DH
1585 scm_gc_register_root (&print_state_pool);
1586 scm_gc_register_root (&scm_print_state_vtable);
66b1dbf6
AW
1587 type = scm_make_vtable (scm_from_locale_string (SCM_PRINT_STATE_LAYOUT),
1588 SCM_BOOL_F);
4a655e50 1589 scm_set_struct_vtable_name_x (type, scm_from_latin1_symbol ("print-state"));
bb35f315 1590 scm_print_state_vtable = type;
c4f37e80 1591
c19bc088
MD
1592 /* Don't want to bind a wrapper class in GOOPS, so pass 0 as arg1. */
1593 scm_tc16_port_with_ps = scm_make_smob_type (0, 0);
e841c3e0 1594 scm_set_smob_print (scm_tc16_port_with_ps, port_with_ps_print);
81ae25da 1595
a0599745 1596#include "libguile/print.x"
475fa9a5 1597
8500b186
AW
1598 scm_init_opts (scm_print_options, scm_print_opts);
1599 scm_print_opts[SCM_PRINT_HIGHLIGHT_PREFIX_I].val =
1600 SCM_UNPACK (scm_from_locale_string ("{"));
1601 scm_print_opts[SCM_PRINT_HIGHLIGHT_SUFFIX_I].val =
1602 SCM_UNPACK (scm_from_locale_string ("}"));
475fa9a5 1603 scm_print_opts[SCM_PRINT_KEYWORD_STYLE_I].val = SCM_UNPACK (sym_reader);
0f2d19dd 1604}
89e00824
ML
1605
1606/*
1607 Local Variables:
1608 c-file-style: "gnu"
1609 End:
1610*/