read: Support R7RS |...| symbol notation.
[bpt/guile.git] / libguile / print.c
CommitLineData
f4bc4e59 1/* Copyright (C) 1995-1999, 2000, 2001, 2002, 2003, 2004, 2006, 2008,
e4598559 2 * 2009, 2010, 2011, 2012, 2013 Free Software Foundation, Inc.
f4bc4e59 3 *
73be1d9e 4 * This library is free software; you can redistribute it and/or
53befeb7
NJ
5 * modify it under the terms of the GNU Lesser General Public License
6 * as published by the Free Software Foundation; either version 3 of
7 * the License, or (at your option) any later version.
0f2d19dd 8 *
53befeb7
NJ
9 * This library is distributed in the hope that it will be useful, but
10 * WITHOUT ANY WARRANTY; without even the implied warranty of
73be1d9e
MV
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 * Lesser General Public License for more details.
0f2d19dd 13 *
73be1d9e
MV
14 * You should have received a copy of the GNU Lesser General Public
15 * License along with this library; if not, write to the Free Software
53befeb7
NJ
16 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
17 * 02110-1301 USA
73be1d9e 18 */
1bbd0b84 19
1bbd0b84 20
0f2d19dd 21\f
dbb605f5
LC
22#ifdef HAVE_CONFIG_H
23# include <config.h>
24#endif
0f2d19dd 25
e6e2e95a 26#include <errno.h>
f4bc4e59
LC
27#include <iconv.h>
28#include <stdio.h>
29#include <assert.h>
30
eca29b02 31#include <uniconv.h>
904a78f1 32#include <unictype.h>
96965a6e 33#include <c-strcase.h>
e6e2e95a 34
a0599745
MD
35#include "libguile/_scm.h"
36#include "libguile/chars.h"
a002f1a2 37#include "libguile/continuations.h"
a0599745 38#include "libguile/smob.h"
bbb2ecd1 39#include "libguile/control.h"
a0599745
MD
40#include "libguile/eval.h"
41#include "libguile/macros.h"
42#include "libguile/procprop.h"
43#include "libguile/read.h"
44#include "libguile/weaks.h"
2fb924f6 45#include "libguile/programs.h"
a0599745
MD
46#include "libguile/alist.h"
47#include "libguile/struct.h"
a0599745 48#include "libguile/ports.h"
e4598559 49#include "libguile/ports-internal.h"
a0599745
MD
50#include "libguile/root.h"
51#include "libguile/strings.h"
52#include "libguile/strports.h"
53#include "libguile/vectors.h"
327967ef 54#include "libguile/numbers.h"
6f3b0cc2 55#include "libguile/vm.h"
a0599745
MD
56
57#include "libguile/validate.h"
58#include "libguile/print.h"
22fc179a
HWN
59
60#include "libguile/private-options.h"
61
0f2d19dd
JB
62\f
63
07f49ac7
LC
64/* Character printers. */
65
478848cb
LC
66#define PORT_CONVERSION_HANDLER(port) \
67 SCM_PTAB_ENTRY (port)->ilseq_handler
68
f4bc4e59
LC
69static size_t display_string (const void *, int, size_t, SCM,
70 scm_t_string_failed_conversion_handler);
71
07f49ac7
LC
72static int display_character (scm_t_wchar, SCM,
73 scm_t_string_failed_conversion_handler);
f4bc4e59 74
07f49ac7
LC
75static void write_character (scm_t_wchar, SCM, int);
76
f4bc4e59
LC
77static void write_character_escaped (scm_t_wchar, int, SCM);
78
07f49ac7
LC
79\f
80
0f2d19dd
JB
81/* {Names of immediate symbols}
82 *
83 * This table must agree with the declarations in scm.h: {Immediate Symbols}.
84 */
85
e17d318f
DH
/* Printed names of the immediate flag values.  iprin1 indexes this
   table with SCM_IFLAGNUM, so the order of the entries must agree with
   the list of flags in tags.h.  */
static const char *iflagnames[] =
{
  "#f",

  /* Elisp nil value.  Should print from elisp as symbol `nil'.  */
  "#nil",

  "#<XXX UNUSED LISP FALSE -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
  "()",
  "#t",
  "#<XXX UNUSED BOOLEAN 0 -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
  "#<XXX UNUSED BOOLEAN 1 -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
  "#<XXX UNUSED BOOLEAN 2 -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
  "#<unspecified>",
  "#<undefined>",
  "#<eof>",

  /* Unbound slot marker for GOOPS.  For internal use in GOOPS only.  */
  "#<unbound>",
};
104
475fa9a5
MV
105SCM_SYMBOL (sym_reader, "reader");
106
92c2555f 107scm_t_option scm_print_opts[] = {
210c0325 108 { SCM_OPTION_SCM, "highlight-prefix", (scm_t_bits)SCM_BOOL_F_BITS,
81ae25da 109 "The string to print before highlighted values." },
210c0325 110 { SCM_OPTION_SCM, "highlight-suffix", (scm_t_bits)SCM_BOOL_F_BITS,
475fa9a5 111 "The string to print after highlighted values." },
210c0325 112 { SCM_OPTION_SCM, "quote-keywordish-symbols", (scm_t_bits)SCM_BOOL_F_BITS,
475fa9a5
MV
113 "How to print symbols that have a colon as their first or last character. "
114 "The value '#f' does not quote the colons; '#t' quotes them; "
8500b186
AW
115 "'reader' quotes them when the reader option 'keywords' is not '#f'." },
116 { SCM_OPTION_BOOLEAN, "escape-newlines", 1,
117 "Render newlines as \\n when printing using `write'." },
62560650 118 { 0 },
e6e4c9af
MD
119};
120
a1ec6916 121SCM_DEFINE (scm_print_options, "print-options-interface", 0, 1, 0,
1bbd0b84 122 (SCM setting),
71331188 123 "Option interface for the print options. Instead of using\n"
1dd05fd8
MG
124 "this procedure directly, use the procedures\n"
125 "@code{print-enable}, @code{print-disable}, @code{print-set!}\n"
126 "and @code{print-options}.")
1bbd0b84 127#define FUNC_NAME s_scm_print_options
e6e4c9af 128{
a51ea417 129 SCM ans = scm_options (setting,
b7ff98dd 130 scm_print_opts,
1bbd0b84 131 FUNC_NAME);
e6e4c9af
MD
132 return ans;
133}
1bbd0b84 134#undef FUNC_NAME
e6e4c9af 135
0f2d19dd
JB
136\f
137/* {Printing of Scheme Objects}
138 */
139
/* Detection of circular references.
 *
 * Due to other constraints in the implementation, this code has bad
 * time complexity (O (depth * N)).  The printer code could be
 * rewritten to be O (N).
 */
dbb5de29
NJ
/* Push OBJ onto the reference stack of PSTATE, growing the stack when
   the new top reaches the ceiling.  The macro parameters are
   parenthesized so that arbitrary expressions can be passed safely.  */
#define PUSH_REF(pstate, obj)                                   \
  do                                                            \
    {                                                           \
      PSTATE_STACK_SET ((pstate), (pstate)->top, (obj));        \
      (pstate)->top++;                                          \
      if ((pstate)->top == (pstate)->ceiling)                   \
        grow_ref_stack (pstate);                                \
    }                                                           \
  while (0)
a51ea417 154
dbb5de29
NJ
/* Register OBJ as being printed.  If OBJ is already on the reference
   stack of PSTATE (i.e. we are in a cycle), jump to LABEL.  Otherwise,
   when fancy printing is on and the nesting depth has reached
   PSTATE's level limit, write `#' and return from the enclosing
   function; else push OBJ.

   This macro expects a variable named `port' in the enclosing scope
   and can only be used in functions returning void.  The loop index
   has a reserved-looking name so that it cannot capture an identifier
   used in the OBJ expression.  */
#define ENTER_NESTED_DATA(pstate, obj, label)                           \
  do                                                                    \
    {                                                                   \
      unsigned long enter_idx_;                                         \
      for (enter_idx_ = 0; enter_idx_ < (pstate)->top; ++enter_idx_)    \
        if (scm_is_eq (PSTATE_STACK_REF ((pstate), enter_idx_), (obj))) \
          goto label;                                                   \
      if ((pstate)->fancyp)                                             \
        {                                                               \
          if ((pstate)->top - (pstate)->list_offset >= (pstate)->level) \
            {                                                           \
              scm_putc ('#', port);                                     \
              return;                                                   \
            }                                                           \
        }                                                               \
      PUSH_REF ((pstate), (obj));                                       \
    }                                                                   \
  while (0)
a51ea417 172
dbb5de29
NJ
/* Pop the top entry of PSTATE's reference stack and overwrite the
   vacated slot with SCM_UNDEFINED.  */
#define EXIT_NESTED_DATA(pstate)                                        \
  do                                                                    \
    {                                                                   \
      --(pstate)->top;                                                  \
      PSTATE_STACK_SET ((pstate), (pstate)->top, SCM_UNDEFINED);        \
    }                                                                   \
  while (0)
c62fbfe1 180
d5cf5324
DH
181SCM scm_print_state_vtable = SCM_BOOL_F;
182static SCM print_state_pool = SCM_EOL;
9de87eea 183scm_i_pthread_mutex_t print_state_mutex = SCM_I_PTHREAD_MUTEX_INITIALIZER;
c4f37e80 184
#ifdef GUILE_DEBUG /* Used for debugging purposes */

/* Debugging aid: return the first print state in the pool, or #f when
   the pool is empty.  */
SCM_DEFINE (scm_current_pstate, "current-pstate", 0, 0, 0,
            (),
            "Return the current-pstate -- the car of the\n"
            "@code{print_state_pool}. @code{current-pstate} is only\n"
            "included in @code{--enable-guile-debug} builds.")
#define FUNC_NAME s_scm_current_pstate
{
  if (scm_is_null (print_state_pool))
    return SCM_BOOL_F;

  return SCM_CAR (print_state_pool);
}
#undef FUNC_NAME

#endif
202
203#define PSTATE_SIZE 50L
204
698c0295 205static SCM
1bbd0b84 206make_print_state (void)
698c0295 207{
d5cf5324
DH
208 SCM print_state
209 = scm_make_struct (scm_print_state_vtable, SCM_INUM0, SCM_EOL);
bf685b6d 210 scm_print_state *pstate = SCM_PRINT_STATE (print_state);
00ffa0e7 211 pstate->ref_vect = scm_c_make_vector (PSTATE_SIZE, SCM_UNDEFINED);
4057a3e0 212 pstate->ceiling = SCM_SIMPLE_VECTOR_LENGTH (pstate->ref_vect);
d232520a 213 pstate->highlight_objects = SCM_EOL;
698c0295
MD
214 return print_state;
215}
1cc91f1b 216
c62fbfe1
MD
217SCM
218scm_make_print_state ()
c62fbfe1 219{
230d095f 220 SCM answer = SCM_BOOL_F;
698c0295
MD
221
222 /* First try to allocate a print state from the pool */
9de87eea 223 scm_i_pthread_mutex_lock (&print_state_mutex);
d2e53ed6 224 if (!scm_is_null (print_state_pool))
698c0295 225 {
d5cf5324
DH
226 answer = SCM_CAR (print_state_pool);
227 print_state_pool = SCM_CDR (print_state_pool);
698c0295 228 }
9de87eea 229 scm_i_pthread_mutex_unlock (&print_state_mutex);
698c0295 230
7888309b 231 return scm_is_false (answer) ? make_print_state () : answer;
c62fbfe1 232}
a51ea417 233
698c0295 234void
6e8d25a6 235scm_free_print_state (SCM print_state)
698c0295
MD
236{
237 SCM handle;
238 scm_print_state *pstate = SCM_PRINT_STATE (print_state);
239 /* Cleanup before returning print state to pool.
240 * It is better to do it here. Doing it in scm_prin1
241 * would cost more since that function is called much more
242 * often.
243 */
244 pstate->fancyp = 0;
bb35f315 245 pstate->revealed = 0;
d232520a 246 pstate->highlight_objects = SCM_EOL;
9de87eea 247 scm_i_pthread_mutex_lock (&print_state_mutex);
16d4699b 248 handle = scm_cons (print_state, print_state_pool);
d5cf5324 249 print_state_pool = handle;
9de87eea 250 scm_i_pthread_mutex_unlock (&print_state_mutex);
dfd03fb9
MD
251}
252
253SCM
254scm_i_port_with_print_state (SCM port, SCM print_state)
255{
256 if (SCM_UNBNDP (print_state))
257 {
258 if (SCM_PORT_WITH_PS_P (port))
259 return port;
260 else
261 print_state = scm_make_print_state ();
262 /* port does not need to be coerced since it doesn't have ps */
263 }
264 else
265 port = SCM_COERCE_OUTPORT (port);
266 SCM_RETURN_NEWSMOB (scm_tc16_port_with_ps,
267 SCM_UNPACK (scm_cons (port, print_state)));
698c0295 268}
1cc91f1b 269
a51ea417 270static void
1bbd0b84 271grow_ref_stack (scm_print_state *pstate)
a51ea417 272{
4057a3e0
MV
273 SCM old_vect = pstate->ref_vect;
274 size_t old_size = SCM_SIMPLE_VECTOR_LENGTH (old_vect);
275 size_t new_size = 2 * pstate->ceiling;
00ffa0e7 276 SCM new_vect = scm_c_make_vector (new_size, SCM_UNDEFINED);
b17004b8
DH
277 unsigned long int i;
278
279 for (i = 0; i != old_size; ++i)
4057a3e0 280 SCM_SIMPLE_VECTOR_SET (new_vect, i, SCM_SIMPLE_VECTOR_REF (old_vect, i));
b17004b8
DH
281
282 pstate->ref_vect = new_vect;
bf685b6d 283 pstate->ceiling = new_size;
a51ea417
MD
284}
285
509759dd
MV
/* Accessors for slot I of the reference stack of print state P, which
   is stored in the simple vector P->ref_vect.  */
#define PSTATE_STACK_REF(p,i) \
  SCM_SIMPLE_VECTOR_REF((p)->ref_vect, (i))
#define PSTATE_STACK_SET(p,i,v) \
  SCM_SIMPLE_VECTOR_SET((p)->ref_vect, (i), (v))
1cc91f1b 288
a51ea417 289static void
34d19ef6 290print_circref (SCM port, scm_print_state *pstate, SCM ref)
a51ea417 291{
c014a02e
ML
292 register long i;
293 long self = pstate->top - 1;
c62fbfe1 294 i = pstate->top - 1;
509759dd 295 if (scm_is_pair (PSTATE_STACK_REF (pstate, i)))
c62fbfe1
MD
296 {
297 while (i > 0)
298 {
509759dd
MV
299 if (!scm_is_pair (PSTATE_STACK_REF (pstate, i-1))
300 || !scm_is_eq (SCM_CDR (PSTATE_STACK_REF (pstate, i-1)),
301 SCM_CDR (PSTATE_STACK_REF (pstate, i))))
c62fbfe1
MD
302 break;
303 --i;
304 }
305 self = i;
306 }
307 for (i = pstate->top - 1; 1; --i)
509759dd 308 if (scm_is_eq (PSTATE_STACK_REF(pstate, i), ref))
c62fbfe1 309 break;
b7f3516f 310 scm_putc ('#', port);
c62fbfe1 311 scm_intprint (i - self, 10, port);
b7f3516f 312 scm_putc ('#', port);
a51ea417
MD
313}
314
6662998f
MV
315/* Print the name of a symbol. */
316
475fa9a5 317static int
15671c6e 318quote_keywordish_symbols (void)
475fa9a5 319{
15671c6e 320 SCM option = SCM_PRINT_KEYWORD_STYLE;
475fa9a5 321
475fa9a5
MV
322 if (scm_is_false (option))
323 return 0;
324 if (scm_is_eq (option, sym_reader))
325 return scm_is_true (SCM_PACK (SCM_KEYWORD_STYLE));
326 return 1;
327}
328
2e9fc9fc
AW
/* Unicode general categories accepted for the first character of a
   symbol that is printed without the extended syntax.  */
#define INITIAL_IDENTIFIER_MASK                                         \
  (/* Letters.  */                                                      \
   UC_CATEGORY_MASK_Lu | UC_CATEGORY_MASK_Ll | UC_CATEGORY_MASK_Lt      \
   | UC_CATEGORY_MASK_Lm | UC_CATEGORY_MASK_Lo                          \
   /* Marks and numbers.  */                                            \
   | UC_CATEGORY_MASK_Mn | UC_CATEGORY_MASK_Nl | UC_CATEGORY_MASK_No    \
   /* Punctuation.  */                                                  \
   | UC_CATEGORY_MASK_Pd | UC_CATEGORY_MASK_Pc | UC_CATEGORY_MASK_Po    \
   /* Symbols.  */                                                      \
   | UC_CATEGORY_MASK_Sc | UC_CATEGORY_MASK_Sm | UC_CATEGORY_MASK_Sk    \
   | UC_CATEGORY_MASK_So                                                \
   /* Private use.  */                                                  \
   | UC_CATEGORY_MASK_Co)

/* Categories accepted for the remaining characters: everything
   allowed initially plus the Nd, Mc and Me categories.  */
#define SUBSEQUENT_IDENTIFIER_MASK                                      \
  (INITIAL_IDENTIFIER_MASK                                              \
   | UC_CATEGORY_MASK_Nd | UC_CATEGORY_MASK_Mc | UC_CATEGORY_MASK_Me)
340
15671c6e
AW
341static int
342symbol_has_extended_read_syntax (SCM sym)
6662998f 343{
15671c6e
AW
344 size_t pos, len = scm_i_symbol_length (sym);
345 scm_t_wchar c;
346
347 /* The empty symbol. */
348 if (len == 0)
349 return 1;
350
351 c = scm_i_symbol_ref (sym, 0);
352
353 /* Single dot; conflicts with dotted-pair notation. */
354 if (len == 1 && c == '.')
355 return 1;
356
357 /* Other initial-character constraints. */
2e9fc9fc 358 if (c == '\'' || c == '`' || c == ',' || c == '"' || c == ';' || c == '#')
15671c6e
AW
359 return 1;
360
361 /* Keywords can be identified by trailing colons too. */
362 if (c == ':' || scm_i_symbol_ref (sym, len - 1) == ':')
363 return quote_keywordish_symbols ();
364
365 /* Number-ish symbols. */
366 if (scm_is_true (scm_i_string_to_number (scm_symbol_to_string (sym), 10)))
367 return 1;
368
2e9fc9fc
AW
369 /* Other disallowed first characters. */
370 if (!uc_is_general_category_withtable (c, INITIAL_IDENTIFIER_MASK))
371 return 1;
372
373 /* Otherwise, any character that's in the identifier category mask is
374 fine to pass through as-is, provided it's not one of the ASCII
375 delimiters like `;'. */
376 for (pos = 1; pos < len; pos++)
6662998f 377 {
2e9fc9fc
AW
378 c = scm_i_symbol_ref (sym, pos);
379 if (!uc_is_general_category_withtable (c, SUBSEQUENT_IDENTIFIER_MASK))
380 return 1;
381 else if (c == '"' || c == ';' || c == '#')
382 return 1;
6662998f 383 }
c6b49e89 384
15671c6e
AW
385 return 0;
386}
387
388static void
389print_normal_symbol (SCM sym, SCM port)
390{
391 scm_display (scm_symbol_to_string (sym), port);
392}
393
15671c6e
AW
394static void
395print_extended_symbol (SCM sym, SCM port)
396{
397 size_t pos, len;
398 scm_t_string_failed_conversion_handler strategy;
399
400 len = scm_i_symbol_length (sym);
478848cb 401 strategy = PORT_CONVERSION_HANDLER (port);
15671c6e
AW
402
403 scm_lfwrite ("#{", 2, port);
404
405 for (pos = 0; pos < len; pos++)
406 {
407 scm_t_wchar c = scm_i_symbol_ref (sym, pos);
408
2e9fc9fc
AW
409 if (uc_is_general_category_withtable (c,
410 SUBSEQUENT_IDENTIFIER_MASK
411 | UC_CATEGORY_MASK_Zs))
15671c6e 412 {
b4a09988
DK
413 if (!display_character (c, port, strategy)
414 || (c == '\\' && !display_character (c, port, strategy)))
15671c6e
AW
415 scm_encoding_error ("print_extended_symbol", errno,
416 "cannot convert to output locale",
417 port, SCM_MAKE_CHAR (c));
2e9fc9fc
AW
418 }
419 else
420 {
421 display_string ("\\x", 1, 2, port, iconveh_question_mark);
422 scm_intprint (c, 16, port);
423 display_character (';', port, iconveh_question_mark);
15671c6e
AW
424 }
425 }
426
427 scm_lfwrite ("}#", 2, port);
428}
429
430/* FIXME: allow R6RS hex escapes instead of #{...}#. */
431void
432scm_i_print_symbol_name (SCM sym, SCM port)
433{
434 if (symbol_has_extended_read_syntax (sym))
435 print_extended_symbol (sym, port);
436 else
437 print_normal_symbol (sym, port);
6662998f
MV
438}
439
e23106d5
MG
440void
441scm_print_symbol_name (const char *str, size_t len, SCM port)
442{
443 SCM symbol = scm_from_locale_symboln (str, len);
ab33782c 444 scm_i_print_symbol_name (symbol, port);
e23106d5
MG
445}
446
c62fbfe1 447/* Print generally. Handles both write and display according to PSTATE.
0f2d19dd 448 */
8b840115
MD
449SCM_GPROC(s_write, "write", 1, 1, 0, scm_write, g_write);
450SCM_GPROC(s_display, "display", 1, 1, 0, scm_display, g_display);
1cc91f1b 451
d232520a
MV
452static void iprin1 (SCM exp, SCM port, scm_print_state *pstate);
453
dea901d6
MG
454
/* Print the character code I to PORT as the body of an escape: `x'
   followed by hexadecimal digits when R6RS escapes are enabled, octal
   digits otherwise.  */
#define PRINT_CHAR_ESCAPE(i, port)              \
  do                                            \
    {                                           \
      if (SCM_R6RS_ESCAPES_P)                   \
        {                                       \
          scm_puts ("x", port);                 \
          scm_intprint (i, 16, port);           \
        }                                       \
      else                                      \
        scm_intprint (i, 8, port);              \
    }                                           \
  while (0)
468
469
0f2d19dd 470void
1bbd0b84 471scm_iprin1 (SCM exp, SCM port, scm_print_state *pstate)
d232520a
MV
472{
473 if (pstate->fancyp
474 && scm_is_true (scm_memq (exp, pstate->highlight_objects)))
475 {
81ae25da 476 scm_display (SCM_PRINT_HIGHLIGHT_PREFIX, port);
d232520a 477 iprin1 (exp, port, pstate);
81ae25da 478 scm_display (SCM_PRINT_HIGHLIGHT_SUFFIX, port);
d232520a
MV
479 }
480 else
481 iprin1 (exp, port, pstate);
482}
483
484static void
485iprin1 (SCM exp, SCM port, scm_print_state *pstate)
0f2d19dd 486{
54778cd3 487 switch (SCM_ITAG3 (exp))
0f2d19dd 488 {
e34f941a
DH
489 case scm_tc3_tc7_1:
490 case scm_tc3_tc7_2:
491 /* These tc3 tags should never occur in an immediate value. They are
492 * only used in cell types of non-immediates, i. e. the value returned
493 * by SCM_CELL_TYPE (exp) can use these tags.
494 */
495 scm_ipruk ("immediate", exp, port);
496 break;
497 case scm_tc3_int_1:
498 case scm_tc3_int_2:
e11e83f3 499 scm_intprint (SCM_I_INUM (exp), 10, port);
0f2d19dd 500 break;
e34f941a 501 case scm_tc3_imm24:
7866a09b 502 if (SCM_CHARP (exp))
0f2d19dd 503 {
b7f3516f 504 if (SCM_WRITINGP (pstate))
07f49ac7
LC
505 write_character (SCM_CHAR (exp), port, 0);
506 else
b7f3516f 507 {
07f49ac7 508 if (!display_character (SCM_CHAR (exp), port,
478848cb 509 PORT_CONVERSION_HANDLER (port)))
07f49ac7
LC
510 scm_encoding_error (__func__, errno,
511 "cannot convert to output locale",
6851d3be 512 port, exp);
b7f3516f 513 }
0f2d19dd 514 }
a51ea417 515 else if (SCM_IFLAGP (exp)
e17d318f
DH
516 && ((size_t) SCM_IFLAGNUM (exp) < (sizeof iflagnames / sizeof (char *))))
517 {
518 scm_puts (iflagnames [SCM_IFLAGNUM (exp)], port);
519 }
0f2d19dd 520 else
e34f941a
DH
521 {
522 /* unknown immediate value */
523 scm_ipruk ("immediate", exp, port);
524 }
0f2d19dd 525 break;
e34f941a 526 case scm_tc3_cons:
0f2d19dd
JB
527 switch (SCM_TYP7 (exp))
528 {
904a077d
MV
529 case scm_tcs_struct:
530 {
531 ENTER_NESTED_DATA (pstate, exp, circref);
532 if (SCM_OBJ_CLASS_FLAGS (exp) & SCM_CLASSF_GOOPS)
533 {
534 SCM pwps, print = pstate->writingp ? g_write : g_display;
b2b33168 535 if (SCM_UNPACK (print) == 0)
904a077d 536 goto print_struct;
dfd03fb9 537 pwps = scm_i_port_with_print_state (port, pstate->handle);
7663c008 538 pstate->revealed = 1;
904a077d
MV
539 scm_call_generic_2 (print, exp, pwps);
540 }
541 else
542 {
543 print_struct:
544 scm_print_struct (exp, port, pstate);
545 }
546 EXIT_NESTED_DATA (pstate);
547 }
548 break;
0f2d19dd
JB
549 case scm_tcs_cons_imcar:
550 case scm_tcs_cons_nimcar:
c62fbfe1
MD
551 ENTER_NESTED_DATA (pstate, exp, circref);
552 scm_iprlist ("(", exp, ')', port, pstate);
553 EXIT_NESTED_DATA (pstate);
a51ea417
MD
554 break;
555 circref:
c62fbfe1 556 print_circref (port, pstate, exp);
0f2d19dd 557 break;
534c55a9
DH
558 case scm_tc7_number:
559 switch SCM_TYP16 (exp) {
560 case scm_tc16_big:
561 scm_bigprint (exp, port, pstate);
562 break;
563 case scm_tc16_real:
564 scm_print_real (exp, port, pstate);
565 break;
566 case scm_tc16_complex:
567 scm_print_complex (exp, port, pstate);
568 break;
f92e85f7
MV
569 case scm_tc16_fraction:
570 scm_i_print_fraction (exp, port, pstate);
571 break;
534c55a9
DH
572 }
573 break;
9c44cd45
MG
574 case scm_tc7_string:
575 if (SCM_WRITINGP (pstate))
576 {
07f49ac7 577 size_t len, i;
9c44cd45 578
f4bc4e59 579 display_character ('"', port, iconveh_question_mark);
9c44cd45
MG
580 len = scm_i_string_length (exp);
581 for (i = 0; i < len; ++i)
07f49ac7
LC
582 write_character (scm_i_string_ref (exp, i), port, 1);
583
f4bc4e59 584 display_character ('"', port, iconveh_question_mark);
9c44cd45
MG
585 scm_remember_upto_here_1 (exp);
586 }
587 else
f4bc4e59
LC
588 {
589 size_t len, printed;
590
591 len = scm_i_string_length (exp);
592 printed = display_string (scm_i_string_data (exp),
593 scm_i_is_narrow_string (exp),
594 len, port,
478848cb 595 PORT_CONVERSION_HANDLER (port));
f4bc4e59 596 if (SCM_UNLIKELY (printed < len))
f4bc4e59
LC
597 scm_encoding_error (__func__, errno,
598 "cannot convert to output locale",
6851d3be 599 port, scm_c_string_ref (exp, printed));
f4bc4e59
LC
600 }
601
9c44cd45
MG
602 scm_remember_upto_here_1 (exp);
603 break;
28b06554 604 case scm_tc7_symbol:
cc95e00a 605 if (scm_i_symbol_is_interned (exp))
9ff28a13 606 {
e23106d5 607 scm_i_print_symbol_name (exp, port);
9ff28a13
MV
608 scm_remember_upto_here_1 (exp);
609 }
610 else
611 {
612 scm_puts ("#<uninterned-symbol ", port);
e23106d5 613 scm_i_print_symbol_name (exp, port);
9ff28a13 614 scm_putc (' ', port);
0345e278 615 scm_uintprint (SCM_UNPACK (exp), 16, port);
9ff28a13
MV
616 scm_putc ('>', port);
617 }
6662998f 618 break;
e5aca4b5
MV
619 case scm_tc7_variable:
620 scm_i_variable_print (exp, port, pstate);
621 break;
2fb924f6
AW
622 case scm_tc7_program:
623 scm_i_program_print (exp, port, pstate);
624 break;
5b46a8c2
LC
625 case scm_tc7_pointer:
626 scm_i_pointer_print (exp, port, pstate);
e2c2a699 627 break;
c99de5aa
AW
628 case scm_tc7_hashtable:
629 scm_i_hashtable_print (exp, port, pstate);
630 break;
9ea31741
AW
631 case scm_tc7_fluid:
632 scm_i_fluid_print (exp, port, pstate);
633 break;
45cf2428
AW
634 case scm_tc7_dynamic_state:
635 scm_i_dynamic_state_print (exp, port, pstate);
636 break;
6f3b0cc2
AW
637 case scm_tc7_frame:
638 scm_i_frame_print (exp, port, pstate);
639 break;
640 case scm_tc7_objcode:
641 scm_i_objcode_print (exp, port, pstate);
642 break;
643 case scm_tc7_vm:
644 scm_i_vm_print (exp, port, pstate);
645 break;
646 case scm_tc7_vm_cont:
647 scm_i_vm_cont_print (exp, port, pstate);
648 break;
bbb2ecd1
AW
649 case scm_tc7_prompt:
650 scm_i_prompt_print (exp, port, pstate);
651 break;
652 case scm_tc7_with_fluids:
653 scm_i_with_fluids_print (exp, port, pstate);
654 break;
b2637c98
AW
655 case scm_tc7_array:
656 ENTER_NESTED_DATA (pstate, exp, circref);
657 scm_i_print_array (exp, port, pstate);
88c0a1d5 658 EXIT_NESTED_DATA (pstate);
b2637c98
AW
659 break;
660 case scm_tc7_bytevector:
661 scm_i_print_bytevector (exp, port, pstate);
662 break;
ff1feca9
AW
663 case scm_tc7_bitvector:
664 scm_i_print_bitvector (exp, port, pstate);
665 break;
0f2d19dd 666 case scm_tc7_wvect:
c62fbfe1 667 ENTER_NESTED_DATA (pstate, exp, circref);
0f2d19dd 668 if (SCM_IS_WHVEC (exp))
b7f3516f 669 scm_puts ("#wh(", port);
0f2d19dd 670 else
b7f3516f 671 scm_puts ("#w(", port);
0f2d19dd 672 goto common_vector_printer;
0f2d19dd 673 case scm_tc7_vector:
c62fbfe1 674 ENTER_NESTED_DATA (pstate, exp, circref);
b7f3516f 675 scm_puts ("#(", port);
0f2d19dd 676 common_vector_printer:
9fbaf27c 677 {
c014a02e 678 register long i;
4057a3e0 679 long last = SCM_SIMPLE_VECTOR_LENGTH (exp) - 1;
9fbaf27c 680 int cutp = 0;
4057a3e0
MV
681 if (pstate->fancyp
682 && SCM_SIMPLE_VECTOR_LENGTH (exp) > pstate->length)
9fbaf27c
MD
683 {
684 last = pstate->length - 1;
685 cutp = 1;
686 }
c367c4b4 687 if (SCM_I_WVECTP (exp))
9fbaf27c 688 {
c367c4b4
LC
689 /* Elements of weak vectors may not be accessed via the
690 `SIMPLE_VECTOR_REF ()' macro. */
691 for (i = 0; i < last; ++i)
692 {
693 scm_iprin1 (scm_c_vector_ref (exp, i),
694 port, pstate);
695 scm_putc (' ', port);
696 }
9fbaf27c 697 }
c367c4b4
LC
698 else
699 {
700 for (i = 0; i < last; ++i)
701 {
702 scm_iprin1 (SCM_SIMPLE_VECTOR_REF (exp, i), port, pstate);
703 scm_putc (' ', port);
704 }
705 }
706
9fbaf27c
MD
707 if (i == last)
708 {
709 /* CHECK_INTS; */
c367c4b4 710 scm_iprin1 (scm_c_vector_ref (exp, i), port, pstate);
9fbaf27c
MD
711 }
712 if (cutp)
b7f3516f
TT
713 scm_puts (" ...", port);
714 scm_putc (')', port);
9fbaf27c 715 }
c62fbfe1 716 EXIT_NESTED_DATA (pstate);
0f2d19dd 717 break;
0f2d19dd 718 case scm_tc7_port:
5ca6dc39
JB
719 {
720 register long i = SCM_PTOBNUM (exp);
721 if (i < scm_numptob
722 && scm_ptobs[i].print
723 && (scm_ptobs[i].print) (exp, port, pstate))
a51ea417 724 break;
5ca6dc39
JB
725 goto punk;
726 }
727 case scm_tc7_smob:
7a7f7c53
DH
728 ENTER_NESTED_DATA (pstate, exp, circref);
729 SCM_SMOB_DESCRIPTOR (exp).print (exp, port, pstate);
730 EXIT_NESTED_DATA (pstate);
731 break;
0f2d19dd 732 default:
314b8716 733 /* case scm_tcs_closures: */
a51ea417
MD
734 punk:
735 scm_ipruk ("type", exp, port);
0f2d19dd
JB
736 }
737 }
738}
739
c62fbfe1
MD
740/* Print states are necessary for circular reference safe printing.
741 * They are also expensive to allocate. Therefore print states are
742 * kept in a pool so that they can be reused.
743 */
1cc91f1b 744
bb35f315
MV
745/* The PORT argument can also be a print-state/port pair, which will
746 * then be used instead of allocating a new print state. This is
747 * useful for continuing a chain of print calls from Scheme. */
748
a51ea417 749void
1bbd0b84 750scm_prin1 (SCM exp, SCM port, int writingp)
a51ea417 751{
c4f37e80
MV
752 SCM handle = SCM_BOOL_F; /* Will GC protect the handle whilst unlinked */
753 SCM pstate_scm;
c62fbfe1 754 scm_print_state *pstate;
15635be5 755 int old_writingp;
c62fbfe1 756
bb35f315
MV
757 /* If PORT is a print-state/port pair, use that. Else create a new
758 print-state. */
c4f37e80 759
0c95b57d 760 if (SCM_PORT_WITH_PS_P (port))
bb35f315 761 {
52235e71
MD
762 pstate_scm = SCM_PORT_WITH_PS_PS (port);
763 port = SCM_PORT_WITH_PS_PORT (port);
bb35f315
MV
764 }
765 else
c62fbfe1 766 {
c4f37e80 767 /* First try to allocate a print state from the pool */
9de87eea 768 scm_i_pthread_mutex_lock (&print_state_mutex);
d2e53ed6 769 if (!scm_is_null (print_state_pool))
c4f37e80 770 {
d5cf5324
DH
771 handle = print_state_pool;
772 print_state_pool = SCM_CDR (print_state_pool);
c4f37e80 773 }
9de87eea 774 scm_i_pthread_mutex_unlock (&print_state_mutex);
7888309b 775 if (scm_is_false (handle))
d5cf5324 776 handle = scm_list_1 (make_print_state ());
c4f37e80 777 pstate_scm = SCM_CAR (handle);
c62fbfe1 778 }
c62fbfe1 779
c4f37e80 780 pstate = SCM_PRINT_STATE (pstate_scm);
15635be5 781 old_writingp = pstate->writingp;
c62fbfe1
MD
782 pstate->writingp = writingp;
783 scm_iprin1 (exp, port, pstate);
15635be5 784 pstate->writingp = old_writingp;
c62fbfe1 785
bb35f315
MV
786 /* Return print state to pool if it has been created above and
787 hasn't escaped to Scheme. */
788
7888309b 789 if (scm_is_true (handle) && !pstate->revealed)
c4f37e80 790 {
9de87eea 791 scm_i_pthread_mutex_lock (&print_state_mutex);
d5cf5324
DH
792 SCM_SETCDR (handle, print_state_pool);
793 print_state_pool = handle;
9de87eea 794 scm_i_pthread_mutex_unlock (&print_state_mutex);
c4f37e80 795 }
a51ea417
MD
796}
797
f4bc4e59
LC
798/* Convert codepoint CH to UTF-8 and store the result in UTF8. Return
799 the number of bytes of the UTF-8-encoded string. */
800static size_t
801codepoint_to_utf8 (scm_t_wchar ch, scm_t_uint8 utf8[4])
9c44cd45 802{
f4bc4e59
LC
803 size_t len;
804 scm_t_uint32 codepoint;
805
806 codepoint = (scm_t_uint32) ch;
07f49ac7 807
f4bc4e59 808 if (codepoint <= 0x7f)
07f49ac7 809 {
f4bc4e59
LC
810 len = 1;
811 utf8[0] = (scm_t_uint8) codepoint;
812 }
813 else if (codepoint <= 0x7ffUL)
814 {
815 len = 2;
816 utf8[0] = 0xc0 | (codepoint >> 6);
817 utf8[1] = 0x80 | (codepoint & 0x3f);
818 }
819 else if (codepoint <= 0xffffUL)
820 {
821 len = 3;
822 utf8[0] = 0xe0 | (codepoint >> 12);
823 utf8[1] = 0x80 | ((codepoint >> 6) & 0x3f);
824 utf8[2] = 0x80 | (codepoint & 0x3f);
07f49ac7
LC
825 }
826 else
827 {
f4bc4e59
LC
828 len = 4;
829 utf8[0] = 0xf0 | (codepoint >> 18);
830 utf8[1] = 0x80 | ((codepoint >> 12) & 0x3f);
831 utf8[2] = 0x80 | ((codepoint >> 6) & 0x3f);
832 utf8[3] = 0x80 | (codepoint & 0x3f);
833 }
834
835 return len;
836}
837
f4bc4e59
LC
/* Fetch codepoint X of the string data S.  A variable named
   `narrow_p' must be in scope at the point of use: when it is true S
   is read as an array of bytes, otherwise as an array of
   `scm_t_wchar'.  */
#define STR_REF(s, x)                                   \
  (narrow_p                                             \
   ? (scm_t_wchar) ((unsigned char *) (s))[x]           \
   : ((scm_t_wchar *) (s))[x])
842
7b292a9d
LC
843/* Write STR to PORT as UTF-8. STR is a LEN-codepoint string; it is
844 narrow if NARROW_P is true, wide otherwise. Return LEN. */
845static size_t
846display_string_as_utf8 (const void *str, int narrow_p, size_t len,
847 SCM port)
848{
849 size_t printed = 0;
850
851 while (len > printed)
852 {
853 size_t utf8_len, i;
854 char *input, utf8_buf[256];
855
856 /* Convert STR to UTF-8. */
857 for (i = printed, utf8_len = 0, input = utf8_buf;
858 i < len && utf8_len + 4 < sizeof (utf8_buf);
859 i++)
860 {
861 utf8_len += codepoint_to_utf8 (STR_REF (str, i),
862 (scm_t_uint8 *) input);
863 input = utf8_buf + utf8_len;
864 }
865
866 /* INPUT was successfully converted, entirely; print the
867 result. */
868 scm_lfwrite (utf8_buf, utf8_len, port);
869 printed += i - printed;
870 }
871
872 assert (printed == len);
873
874 return len;
875}
876
877/* Convert STR through PORT's output conversion descriptor and write the
878 output to PORT. Return the number of codepoints written. */
879static size_t
880display_string_using_iconv (const void *str, int narrow_p, size_t len,
881 SCM port,
882 scm_t_string_failed_conversion_handler strategy)
883{
f4bc4e59 884 size_t printed;
337edc59 885 scm_t_iconv_descriptors *id;
cdd3d6c9 886 scm_t_port_internal *pti = SCM_PORT_GET_INTERNAL (port);
f4bc4e59 887
cdd3d6c9
MW
888 id = scm_i_port_iconv_descriptors (port, SCM_PORT_WRITE);
889
890 if (SCM_UNLIKELY (pti->at_stream_start_for_bom_write && len > 0))
891 {
892 scm_t_port *pt = SCM_PTAB_ENTRY (port);
893
894 /* Record that we're no longer at stream start. */
895 pti->at_stream_start_for_bom_write = 0;
896 if (pt->rw_random)
897 pti->at_stream_start_for_bom_read = 0;
898
899 /* Write a BOM if appropriate. */
96965a6e
MW
900 if (SCM_UNLIKELY (c_strcasecmp(pt->encoding, "UTF-16") == 0
901 || c_strcasecmp(pt->encoding, "UTF-32") == 0))
cdd3d6c9
MW
902 display_character (SCM_UNICODE_BOM, port, iconveh_error);
903 }
f4bc4e59 904
f4bc4e59
LC
905 printed = 0;
906
907 while (len > printed)
908 {
909 size_t done, utf8_len, input_left, output_left, i;
910 size_t codepoints_read, output_len;
911 char *input, *output;
912 char utf8_buf[256], encoded_output[256];
913 size_t offsets[256];
914
915 /* Convert STR to UTF-8. */
916 for (i = printed, utf8_len = 0, input = utf8_buf;
917 i < len && utf8_len + 4 < sizeof (utf8_buf);
918 i++)
07f49ac7 919 {
f4bc4e59
LC
920 offsets[utf8_len] = i;
921 utf8_len += codepoint_to_utf8 (STR_REF (str, i),
922 (scm_t_uint8 *) input);
923 input = utf8_buf + utf8_len;
924 }
925
926 input = utf8_buf;
927 input_left = utf8_len;
928
929 output = encoded_output;
930 output_left = sizeof (encoded_output);
931
337edc59 932 done = iconv (id->output_cd, &input, &input_left,
f4bc4e59 933 &output, &output_left);
07f49ac7 934
f4bc4e59
LC
935 output_len = sizeof (encoded_output) - output_left;
936
937 if (SCM_UNLIKELY (done == (size_t) -1))
938 {
b2548e23
AW
939 int errno_save = errno;
940
f4bc4e59 941 /* Reset the `iconv' state. */
337edc59 942 iconv (id->output_cd, NULL, NULL, NULL, NULL);
f4bc4e59 943
7174bc08
LC
944 /* Print the OUTPUT_LEN bytes successfully converted. */
945 scm_lfwrite (encoded_output, output_len, port);
946
947 /* See how many input codepoints these OUTPUT_LEN bytes
948 corresponds to. */
949 codepoints_read = offsets[input - utf8_buf] - printed;
950 printed += codepoints_read;
951
b2548e23 952 if (errno_save == EILSEQ &&
f4bc4e59 953 strategy != SCM_FAILED_CONVERSION_ERROR)
07f49ac7 954 {
f4bc4e59
LC
955 /* Conversion failed somewhere in INPUT and we want to
956 escape or substitute the offending input character. */
957
f4bc4e59 958 if (strategy == SCM_FAILED_CONVERSION_ESCAPE_SEQUENCE)
f1ee6d54 959 {
f4bc4e59
LC
960 scm_t_wchar ch;
961
962 /* Find CH, the offending codepoint, and escape it. */
963 ch = STR_REF (str, offsets[input - utf8_buf]);
964 write_character_escaped (ch, 1, port);
f1ee6d54 965 }
07f49ac7 966 else
f4bc4e59
LC
967 /* STRATEGY is `SCM_FAILED_CONVERSION_QUESTION_MARK'. */
968 display_string ("?", 1, 1, port, strategy);
9c44cd45 969
f4bc4e59
LC
970 printed++;
971 }
972 else
973 /* Something bad happened that we can't handle: bail out. */
974 break;
07f49ac7
LC
975 }
976 else
f4bc4e59
LC
977 {
978 /* INPUT was successfully converted, entirely; print the
979 result. */
980 scm_lfwrite (encoded_output, output_len, port);
981 codepoints_read = i - printed;
982 printed += codepoints_read;
983 }
07f49ac7
LC
984 }
985
986 return printed;
7b292a9d
LC
987}
988
f4bc4e59 989#undef STR_REF
7b292a9d
LC
990
991/* Display the LEN codepoints in STR to PORT according to STRATEGY;
992 return the number of codepoints successfully displayed. If NARROW_P,
993 then STR is interpreted as a sequence of `char', denoting a Latin-1
994 string; otherwise it's interpreted as a sequence of
995 `scm_t_wchar'. */
996static size_t
997display_string (const void *str, int narrow_p,
998 size_t len, SCM port,
999 scm_t_string_failed_conversion_handler strategy)
1000
1001{
e4598559 1002 scm_t_port_internal *pti;
7b292a9d 1003
e4598559 1004 pti = SCM_PORT_GET_INTERNAL (port);
7b292a9d 1005
337edc59 1006 if (pti->encoding_mode == SCM_PORT_ENCODING_MODE_UTF8)
7b292a9d
LC
1007 return display_string_as_utf8 (str, narrow_p, len, port);
1008 else
1009 return display_string_using_iconv (str, narrow_p, len,
1010 port, strategy);
f4bc4e59
LC
1011}
1012
1013/* Attempt to display CH to PORT according to STRATEGY. Return non-zero
1014 if CH was successfully displayed, zero otherwise (e.g., if it was not
1015 representable in PORT's encoding.) */
1016static int
1017display_character (scm_t_wchar ch, SCM port,
1018 scm_t_string_failed_conversion_handler strategy)
1019{
1020 return display_string (&ch, 0, 1, port, strategy) == 1;
07f49ac7
LC
1021}
1022
33d92fe6
LC
1023/* Attempt to pretty-print CH, a combining character, to PORT. Return
1024 zero upon failure, non-zero otherwise. The idea is to print CH above
1025 a dotted circle to make it more visible. */
1026static int
1027write_combining_character (scm_t_wchar ch, SCM port)
1028{
f4bc4e59
LC
1029 scm_t_wchar str[2];
1030
1031 str[0] = SCM_CODEPOINT_DOTTED_CIRCLE;
1032 str[1] = ch;
1033
1034 return display_string (str, 0, 2, port, iconveh_error) == 2;
1035}
33d92fe6 1036
f4bc4e59
LC
1037/* Write CH to PORT in its escaped form, using the string escape syntax
1038 if STRING_ESCAPES_P is non-zero. */
1039static void
1040write_character_escaped (scm_t_wchar ch, int string_escapes_p, SCM port)
1041{
1042 if (string_escapes_p)
33d92fe6 1043 {
f4bc4e59
LC
1044 /* Represent CH using the in-string escape syntax. */
1045
1046 static const char hex[] = "0123456789abcdef";
1047 static const char escapes[7] = "abtnvfr";
1048 char buf[9];
1049
1050 if (ch >= 0x07 && ch <= 0x0D && ch != 0x0A)
33d92fe6 1051 {
f4bc4e59
LC
1052 /* Use special escapes for some C0 controls. */
1053 buf[0] = '\\';
1054 buf[1] = escapes[ch - 0x07];
1055 scm_lfwrite (buf, 2, port);
1056 }
1057 else if (!SCM_R6RS_ESCAPES_P)
1058 {
1059 if (ch <= 0xFF)
1060 {
1061 buf[0] = '\\';
1062 buf[1] = 'x';
1063 buf[2] = hex[ch / 16];
1064 buf[3] = hex[ch % 16];
1065 scm_lfwrite (buf, 4, port);
1066 }
1067 else if (ch <= 0xFFFF)
1068 {
1069 buf[0] = '\\';
1070 buf[1] = 'u';
1071 buf[2] = hex[(ch & 0xF000) >> 12];
1072 buf[3] = hex[(ch & 0xF00) >> 8];
1073 buf[4] = hex[(ch & 0xF0) >> 4];
1074 buf[5] = hex[(ch & 0xF)];
1075 scm_lfwrite (buf, 6, port);
1076 }
1077 else if (ch > 0xFFFF)
1078 {
1079 buf[0] = '\\';
1080 buf[1] = 'U';
1081 buf[2] = hex[(ch & 0xF00000) >> 20];
1082 buf[3] = hex[(ch & 0xF0000) >> 16];
1083 buf[4] = hex[(ch & 0xF000) >> 12];
1084 buf[5] = hex[(ch & 0xF00) >> 8];
1085 buf[6] = hex[(ch & 0xF0) >> 4];
1086 buf[7] = hex[(ch & 0xF)];
1087 scm_lfwrite (buf, 8, port);
1088 }
33d92fe6
LC
1089 }
1090 else
f4bc4e59
LC
1091 {
1092 /* Print an R6RS variable-length hex escape: "\xNNNN;". */
1093 scm_t_wchar ch2 = ch;
1094
1095 int i = 8;
1096 buf[i] = ';';
1097 i --;
1098 if (ch == 0)
1099 buf[i--] = '0';
1100 else
1101 while (ch2 > 0)
1102 {
1103 buf[i] = hex[ch2 & 0xF];
1104 ch2 >>= 4;
1105 i --;
1106 }
1107 buf[i] = 'x';
1108 i --;
1109 buf[i] = '\\';
1110 scm_lfwrite (buf + i, 9 - i, port);
1111 }
33d92fe6
LC
1112 }
1113 else
f4bc4e59
LC
1114 {
1115 /* Represent CH using the character escape syntax. */
1116 const char *name;
33d92fe6 1117
f4bc4e59
LC
1118 name = scm_i_charname (SCM_MAKE_CHAR (ch));
1119 if (name != NULL)
1120 scm_puts (name, port);
1121 else
1122 PRINT_CHAR_ESCAPE (ch, port);
1123 }
33d92fe6
LC
1124}
1125
07f49ac7
LC
1126/* Write CH to PORT, escaping it if it's non-graphic or not
1127 representable in PORT's encoding. If STRING_ESCAPES_P is true and CH
1128 needs to be escaped, it is escaped using the in-string escape syntax;
1129 otherwise the character escape syntax is used. */
1130static void
1131write_character (scm_t_wchar ch, SCM port, int string_escapes_p)
1132{
1133 int printed = 0;
f4bc4e59
LC
1134 scm_t_string_failed_conversion_handler strategy;
1135
478848cb 1136 strategy = PORT_CONVERSION_HANDLER (port);
07f49ac7
LC
1137
1138 if (string_escapes_p)
1139 {
1140 /* Check if CH deserves special treatment. */
1141 if (ch == '"' || ch == '\\')
1142 {
f4bc4e59
LC
1143 display_character ('\\', port, iconveh_question_mark);
1144 display_character (ch, port, strategy);
07f49ac7
LC
1145 printed = 1;
1146 }
8500b186
AW
1147 else if (ch == '\n' && SCM_PRINT_ESCAPE_NEWLINES_P)
1148 {
1149 display_character ('\\', port, iconveh_question_mark);
1150 display_character ('n', port, strategy);
1151 printed = 1;
1152 }
07f49ac7
LC
1153 else if (ch == ' ' || ch == '\n')
1154 {
f4bc4e59 1155 display_character (ch, port, strategy);
07f49ac7
LC
1156 printed = 1;
1157 }
1158 }
1159 else
33d92fe6 1160 {
f4bc4e59 1161 display_string ("#\\", 1, 2, port, iconveh_question_mark);
33d92fe6
LC
1162
1163 if (uc_combining_class (ch) != UC_CCC_NR)
1164 /* Character is a combining character, so attempt to
1165 pretty-print it. */
1166 printed = write_combining_character (ch, port);
1167 }
07f49ac7
LC
1168
1169 if (!printed
1170 && uc_is_general_category_withtable (ch,
1171 UC_CATEGORY_MASK_L |
1172 UC_CATEGORY_MASK_M |
1173 UC_CATEGORY_MASK_N |
1174 UC_CATEGORY_MASK_P |
1175 UC_CATEGORY_MASK_S))
1176 /* CH is graphic; attempt to display it. */
1177 printed = display_character (ch, port, iconveh_error);
1178
1179 if (!printed)
f4bc4e59
LC
1180 /* CH isn't graphic or cannot be represented in PORT's encoding. */
1181 write_character_escaped (ch, string_escapes_p, port);
9c44cd45 1182}
0f2d19dd 1183
b908768a
LC
1184/* Display STR to PORT from START inclusive to END exclusive. */
1185void
1186scm_i_display_substring (SCM str, size_t start, size_t end, SCM port)
1187{
1188 int narrow_p;
1189 const char *buf;
1190 size_t len, printed;
1191
1192 buf = scm_i_string_data (str);
1193 len = end - start;
1194 narrow_p = scm_i_is_narrow_string (str);
1195 buf += start * (narrow_p ? sizeof (char) : sizeof (scm_t_wchar));
1196
1197 printed = display_string (buf, narrow_p, end - start, port,
1198 PORT_CONVERSION_HANDLER (port));
1199
1200 if (SCM_UNLIKELY (printed < len))
1201 scm_encoding_error (__func__, errno,
1202 "cannot convert to output locale",
1203 port, scm_c_string_ref (str, printed + start));
1204}
1205
1206\f
0f2d19dd
JB
1207/* Print an integer.
1208 */
1cc91f1b 1209
0f2d19dd 1210void
a406c9e9 1211scm_intprint (scm_t_intmax n, int radix, SCM port)
0f2d19dd
JB
1212{
1213 char num_buf[SCM_INTBUFLEN];
b7f3516f 1214 scm_lfwrite (num_buf, scm_iint2str (n, radix, num_buf), port);
0f2d19dd
JB
1215}
1216
a406c9e9
MV
1217void
1218scm_uintprint (scm_t_uintmax n, int radix, SCM port)
1219{
1220 char num_buf[SCM_INTBUFLEN];
1221 scm_lfwrite (num_buf, scm_iuint2str (n, radix, num_buf), port);
1222}
1223
0f2d19dd
JB
1224/* Print an object of unrecognized type.
1225 */
1cc91f1b 1226
0f2d19dd 1227void
1bbd0b84 1228scm_ipruk (char *hdr, SCM ptr, SCM port)
0f2d19dd 1229{
b7f3516f
TT
1230 scm_puts ("#<unknown-", port);
1231 scm_puts (hdr, port);
26224b3f 1232 if (1) /* (scm_in_heap_p (ptr)) */ /* FIXME */
0f2d19dd 1233 {
b7f3516f 1234 scm_puts (" (0x", port);
0345e278 1235 scm_uintprint (SCM_CELL_WORD_0 (ptr), 16, port);
b7f3516f 1236 scm_puts (" . 0x", port);
0345e278 1237 scm_uintprint (SCM_CELL_WORD_1 (ptr), 16, port);
b7f3516f 1238 scm_puts (") @", port);
0f2d19dd 1239 }
b7f3516f 1240 scm_puts (" 0x", port);
0345e278 1241 scm_uintprint (SCM_UNPACK (ptr), 16, port);
b7f3516f 1242 scm_putc ('>', port);
0f2d19dd
JB
1243}
1244
1cc91f1b 1245
904a077d 1246/* Print a list.
22a52da1 1247 */
0f2d19dd 1248void
34d19ef6 1249scm_iprlist (char *hdr, SCM exp, int tlr, SCM port, scm_print_state *pstate)
0f2d19dd 1250{
c62fbfe1 1251 register SCM hare, tortoise;
c014a02e 1252 long floor = pstate->top - 2;
b7f3516f 1253 scm_puts (hdr, port);
0f2d19dd 1254 /* CHECK_INTS; */
c62fbfe1
MD
1255 if (pstate->fancyp)
1256 goto fancy_printing;
1257
1258 /* Run a hare and tortoise so that total time complexity will be
1259 O(depth * N) instead of O(N^2). */
1260 hare = SCM_CDR (exp);
1261 tortoise = exp;
d2e53ed6 1262 while (scm_is_pair (hare))
c62fbfe1 1263 {
bc36d050 1264 if (scm_is_eq (hare, tortoise))
c62fbfe1
MD
1265 goto fancy_printing;
1266 hare = SCM_CDR (hare);
d2e53ed6 1267 if (!scm_is_pair (hare))
c62fbfe1
MD
1268 break;
1269 hare = SCM_CDR (hare);
1270 tortoise = SCM_CDR (tortoise);
1271 }
1272
1273 /* No cdr cycles intrinsic to this list */
1274 scm_iprin1 (SCM_CAR (exp), port, pstate);
d2e53ed6 1275 for (exp = SCM_CDR (exp); scm_is_pair (exp); exp = SCM_CDR (exp))
0f2d19dd 1276 {
c014a02e 1277 register long i;
5ca6dc39 1278
c62fbfe1 1279 for (i = floor; i >= 0; --i)
509759dd 1280 if (scm_is_eq (PSTATE_STACK_REF(pstate, i), exp))
c62fbfe1
MD
1281 goto circref;
1282 PUSH_REF (pstate, exp);
b7f3516f 1283 scm_putc (' ', port);
0f2d19dd 1284 /* CHECK_INTS; */
c62fbfe1 1285 scm_iprin1 (SCM_CAR (exp), port, pstate);
0f2d19dd 1286 }
c96d76b8 1287 if (!SCM_NULL_OR_NIL_P (exp))
0f2d19dd 1288 {
b7f3516f 1289 scm_puts (" . ", port);
c62fbfe1 1290 scm_iprin1 (exp, port, pstate);
0f2d19dd 1291 }
c62fbfe1 1292
a51ea417 1293end:
b7f3516f 1294 scm_putc (tlr, port);
c62fbfe1 1295 pstate->top = floor + 2;
a51ea417 1296 return;
c62fbfe1
MD
1297
1298fancy_printing:
1299 {
c014a02e 1300 long n = pstate->length;
c62fbfe1
MD
1301
1302 scm_iprin1 (SCM_CAR (exp), port, pstate);
1303 exp = SCM_CDR (exp); --n;
d2e53ed6 1304 for (; scm_is_pair (exp); exp = SCM_CDR (exp))
c62fbfe1 1305 {
c014a02e 1306 register unsigned long i;
5ca6dc39 1307
c62fbfe1 1308 for (i = 0; i < pstate->top; ++i)
509759dd 1309 if (scm_is_eq (PSTATE_STACK_REF(pstate, i), exp))
c62fbfe1
MD
1310 goto fancy_circref;
1311 if (pstate->fancyp)
1312 {
1313 if (n == 0)
1314 {
b7f3516f 1315 scm_puts (" ...", port);
c62fbfe1
MD
1316 goto skip_tail;
1317 }
1318 else
1319 --n;
1320 }
1321 PUSH_REF(pstate, exp);
1322 ++pstate->list_offset;
b7f3516f 1323 scm_putc (' ', port);
c62fbfe1
MD
1324 /* CHECK_INTS; */
1325 scm_iprin1 (SCM_CAR (exp), port, pstate);
1326 }
1327 }
c96d76b8 1328 if (!SCM_NULL_OR_NIL_P (exp))
c62fbfe1 1329 {
b7f3516f 1330 scm_puts (" . ", port);
c62fbfe1
MD
1331 scm_iprin1 (exp, port, pstate);
1332 }
1333skip_tail:
1334 pstate->list_offset -= pstate->top - floor - 2;
a51ea417 1335 goto end;
a51ea417 1336
c62fbfe1
MD
1337fancy_circref:
1338 pstate->list_offset -= pstate->top - floor - 2;
1339
1340circref:
b7f3516f 1341 scm_puts (" . ", port);
c62fbfe1
MD
1342 print_circref (port, pstate, exp);
1343 goto end;
0f2d19dd
JB
1344}
1345
1346\f
1347
bb35f315
MV
1348int
1349scm_valid_oport_value_p (SCM val)
1350{
368cf54d
GB
1351 return (SCM_OPOUTPORTP (val)
1352 || (SCM_PORT_WITH_PS_P (val)
1353 && SCM_OPOUTPORTP (SCM_PORT_WITH_PS_PORT (val))));
bb35f315
MV
1354}
1355
8b840115 1356/* SCM_GPROC(s_write, "write", 1, 1, 0, scm_write, g_write); */
1cc91f1b 1357
0f2d19dd 1358SCM
1bbd0b84 1359scm_write (SCM obj, SCM port)
0f2d19dd
JB
1360{
1361 if (SCM_UNBNDP (port))
9de87eea 1362 port = scm_current_output_port ();
3eb7e6ee
JB
1363
1364 SCM_ASSERT (scm_valid_oport_value_p (port), port, SCM_ARG2, s_write);
bb35f315 1365
a51ea417 1366 scm_prin1 (obj, port, 1);
0f2d19dd
JB
1367 return SCM_UNSPECIFIED;
1368}
1369
1370
8b840115 1371/* SCM_GPROC(s_display, "display", 1, 1, 0, scm_display, g_display); */
1cc91f1b 1372
0f2d19dd 1373SCM
1bbd0b84 1374scm_display (SCM obj, SCM port)
0f2d19dd
JB
1375{
1376 if (SCM_UNBNDP (port))
9de87eea 1377 port = scm_current_output_port ();
3eb7e6ee
JB
1378
1379 SCM_ASSERT (scm_valid_oport_value_p (port), port, SCM_ARG2, s_display);
bb35f315 1380
a51ea417 1381 scm_prin1 (obj, port, 0);
0f2d19dd
JB
1382 return SCM_UNSPECIFIED;
1383}
1384
70d63753
GB
1385
1386SCM_DEFINE (scm_simple_format, "simple-format", 2, 0, 1,
1387 (SCM destination, SCM message, SCM args),
eca65e90
MG
1388 "Write @var{message} to @var{destination}, defaulting to\n"
1389 "the current output port.\n"
1390 "@var{message} can contain @code{~A} (was @code{%s}) and\n"
1391 "@code{~S} (was @code{%S}) escapes. When printed,\n"
1392 "the escapes are replaced with corresponding members of\n"
b7e64f8b 1393 "@var{args}:\n"
eca65e90
MG
1394 "@code{~A} formats using @code{display} and @code{~S} formats\n"
1395 "using @code{write}.\n"
1396 "If @var{destination} is @code{#t}, then use the current output\n"
1397 "port, if @var{destination} is @code{#f}, then return a string\n"
1398 "containing the formatted text. Does not add a trailing newline.")
70d63753
GB
1399#define FUNC_NAME s_scm_simple_format
1400{
dfd03fb9 1401 SCM port, answer = SCM_UNSPECIFIED;
70d63753
GB
1402 int fReturnString = 0;
1403 int writingp;
889975e5 1404 size_t start, p, end;
70d63753 1405
bc36d050 1406 if (scm_is_eq (destination, SCM_BOOL_T))
daba1a71 1407 {
9de87eea 1408 destination = port = scm_current_output_port ();
daba1a71 1409 }
7888309b 1410 else if (scm_is_false (destination))
daba1a71
MD
1411 {
1412 fReturnString = 1;
0b2c2ba3 1413 port = scm_mkstrport (SCM_INUM0, SCM_BOOL_F,
dfd03fb9
MD
1414 SCM_OPN | SCM_WRTNG,
1415 FUNC_NAME);
1416 destination = port;
daba1a71
MD
1417 }
1418 else
1419 {
1420 SCM_VALIDATE_OPORT_VALUE (1, destination);
dfd03fb9 1421 port = SCM_COERCE_OUTPORT (destination);
daba1a71
MD
1422 }
1423 SCM_VALIDATE_STRING (2, message);
af45e3b0 1424 SCM_VALIDATE_REST_ARGUMENT (args);
70d63753 1425
889975e5
MG
1426 p = 0;
1427 start = 0;
1428 end = scm_i_string_length (message);
b24b5e13 1429 for (p = start; p != end; ++p)
889975e5 1430 if (scm_i_string_ref (message, p) == '~')
70d63753 1431 {
b24b5e13 1432 if (++p == end)
6662998f
MV
1433 break;
1434
889975e5 1435 switch (scm_i_string_ref (message, p))
6662998f
MV
1436 {
1437 case 'A': case 'a':
1438 writingp = 0;
1439 break;
1440 case 'S': case 's':
1441 writingp = 1;
1442 break;
1443 case '~':
889975e5 1444 scm_lfwrite_substr (message, start, p, port);
6662998f
MV
1445 start = p + 1;
1446 continue;
1447 case '%':
889975e5 1448 scm_lfwrite_substr (message, start, p - 1, port);
dfd03fb9 1449 scm_newline (port);
6662998f
MV
1450 start = p + 1;
1451 continue;
1452 default:
1afff620 1453 SCM_MISC_ERROR ("FORMAT: Unsupported format option ~~~A - use (ice-9 format) instead",
889975e5 1454 scm_list_1 (SCM_MAKE_CHAR (scm_i_string_ref (message, p))));
6662998f
MV
1455
1456 }
70d63753 1457
6662998f 1458
d2e53ed6 1459 if (!scm_is_pair (args))
1afff620 1460 SCM_MISC_ERROR ("FORMAT: Missing argument for ~~~A",
889975e5 1461 scm_list_1 (SCM_MAKE_CHAR (scm_i_string_ref (message, p))));
6662998f 1462
889975e5 1463 scm_lfwrite_substr (message, start, p - 1, port);
dfd03fb9 1464 /* we pass destination here */
70d63753
GB
1465 scm_prin1 (SCM_CAR (args), destination, writingp);
1466 args = SCM_CDR (args);
1467 start = p + 1;
1468 }
6662998f 1469
889975e5 1470 scm_lfwrite_substr (message, start, p, port);
bc36d050 1471 if (!scm_is_eq (args, SCM_EOL))
1afff620
KN
1472 SCM_MISC_ERROR ("FORMAT: ~A superfluous arguments",
1473 scm_list_1 (scm_length (args)));
70d63753
GB
1474
1475 if (fReturnString)
1476 answer = scm_strport_to_string (destination);
1477
daba1a71 1478 return scm_return_first (answer, message);
70d63753
GB
1479}
1480#undef FUNC_NAME
1481
1482
3b3b36dd 1483SCM_DEFINE (scm_newline, "newline", 0, 1, 0,
b450f070 1484 (SCM port),
8f85c0c6
NJ
1485 "Send a newline to @var{port}.\n"
1486 "If @var{port} is omitted, send to the current output port.")
1bbd0b84 1487#define FUNC_NAME s_scm_newline
0f2d19dd
JB
1488{
1489 if (SCM_UNBNDP (port))
9de87eea 1490 port = scm_current_output_port ();
3eb7e6ee 1491
34d19ef6 1492 SCM_VALIDATE_OPORT_VALUE (1, port);
bb35f315 1493
0ef4ae82 1494 scm_putc ('\n', SCM_COERCE_OUTPORT (port));
0f2d19dd
JB
1495 return SCM_UNSPECIFIED;
1496}
1bbd0b84 1497#undef FUNC_NAME
0f2d19dd 1498
3b3b36dd 1499SCM_DEFINE (scm_write_char, "write-char", 1, 1, 0,
b450f070 1500 (SCM chr, SCM port),
eca65e90 1501 "Send character @var{chr} to @var{port}.")
1bbd0b84 1502#define FUNC_NAME s_scm_write_char
0f2d19dd
JB
1503{
1504 if (SCM_UNBNDP (port))
9de87eea 1505 port = scm_current_output_port ();
3eb7e6ee 1506
34d19ef6
HWN
1507 SCM_VALIDATE_CHAR (1, chr);
1508 SCM_VALIDATE_OPORT_VALUE (2, port);
07f49ac7
LC
1509
1510 port = SCM_COERCE_OUTPORT (port);
1511 if (!display_character (SCM_CHAR (chr), port,
478848cb 1512 PORT_CONVERSION_HANDLER (port)))
07f49ac7
LC
1513 scm_encoding_error (__func__, errno,
1514 "cannot convert to output locale",
6851d3be 1515 port, chr);
07f49ac7 1516
0f2d19dd
JB
1517 return SCM_UNSPECIFIED;
1518}
1bbd0b84 1519#undef FUNC_NAME
0f2d19dd 1520
0f2d19dd
JB
1521\f
1522
bb35f315 1523/* Call back to Scheme code to do the printing of special objects
c19bc088
MD
1524 * (like structs). SCM_PRINTER_APPLY applies PROC to EXP and a smob
1525 * containing PORT and PSTATE. This object can be used as the port for
1526 * display/write etc to continue the current print chain. The REVEALED
1527 * field of PSTATE is set to true to indicate that the print state has
1528 * escaped to Scheme and thus has to be freed by the GC.
1529 */
1530
92c2555f 1531scm_t_bits scm_tc16_port_with_ps;
c19bc088
MD
1532
1533/* Print exactly as the port itself would */
1534
1535static int
e841c3e0 1536port_with_ps_print (SCM obj, SCM port, scm_print_state *pstate)
c19bc088
MD
1537{
1538 obj = SCM_PORT_WITH_PS_PORT (obj);
1539 return scm_ptobs[SCM_PTOBNUM (obj)].print (obj, port, pstate);
1540}
c4f37e80
MV
1541
1542SCM
1bbd0b84 1543scm_printer_apply (SCM proc, SCM exp, SCM port, scm_print_state *pstate)
c4f37e80 1544{
bb35f315 1545 pstate->revealed = 1;
dfd03fb9
MD
1546 return scm_call_2 (proc, exp,
1547 scm_i_port_with_print_state (port, pstate->handle));
c19bc088
MD
1548}
1549
dfd03fb9 1550SCM_DEFINE (scm_port_with_print_state, "port-with-print-state", 1, 1, 0,
1bbd0b84 1551 (SCM port, SCM pstate),
71331188 1552 "Create a new port which behaves like @var{port}, but with an\n"
dfd03fb9
MD
1553 "included print state @var{pstate}. @var{pstate} is optional.\n"
1554 "If @var{pstate} isn't supplied and @var{port} already has\n"
1555 "a print state, the old print state is reused.")
1bbd0b84 1556#define FUNC_NAME s_scm_port_with_print_state
c19bc088 1557{
34d19ef6 1558 SCM_VALIDATE_OPORT_VALUE (1, port);
dfd03fb9
MD
1559 if (!SCM_UNBNDP (pstate))
1560 SCM_VALIDATE_PRINTSTATE (2, pstate);
1561 return scm_i_port_with_print_state (port, pstate);
c19bc088 1562}
1bbd0b84 1563#undef FUNC_NAME
c19bc088 1564
a1ec6916 1565SCM_DEFINE (scm_get_print_state, "get-print-state", 1, 0, 0,
1bbd0b84 1566 (SCM port),
71331188
MG
1567 "Return the print state of the port @var{port}. If @var{port}\n"
1568 "has no associated print state, @code{#f} is returned.")
1bbd0b84 1569#define FUNC_NAME s_scm_get_print_state
c19bc088 1570{
368cf54d
GB
1571 if (SCM_PORT_WITH_PS_P (port))
1572 return SCM_PORT_WITH_PS_PS (port);
f5f2dcff 1573 if (SCM_OUTPUT_PORT_P (port))
368cf54d 1574 return SCM_BOOL_F;
276dd677 1575 SCM_WRONG_TYPE_ARG (1, port);
c4f37e80 1576}
1bbd0b84 1577#undef FUNC_NAME
bb35f315 1578
c4f37e80 1579\f
1cc91f1b 1580
0f2d19dd
JB
1581void
1582scm_init_print ()
0f2d19dd 1583{
66b1dbf6 1584 SCM type;
d5cf5324 1585
d5cf5324
DH
1586 scm_gc_register_root (&print_state_pool);
1587 scm_gc_register_root (&scm_print_state_vtable);
66b1dbf6
AW
1588 type = scm_make_vtable (scm_from_locale_string (SCM_PRINT_STATE_LAYOUT),
1589 SCM_BOOL_F);
4a655e50 1590 scm_set_struct_vtable_name_x (type, scm_from_latin1_symbol ("print-state"));
bb35f315 1591 scm_print_state_vtable = type;
c4f37e80 1592
c19bc088
MD
1593 /* Don't want to bind a wrapper class in GOOPS, so pass 0 as arg1. */
1594 scm_tc16_port_with_ps = scm_make_smob_type (0, 0);
e841c3e0 1595 scm_set_smob_print (scm_tc16_port_with_ps, port_with_ps_print);
81ae25da 1596
a0599745 1597#include "libguile/print.x"
475fa9a5 1598
8500b186
AW
1599 scm_init_opts (scm_print_options, scm_print_opts);
1600 scm_print_opts[SCM_PRINT_HIGHLIGHT_PREFIX_I].val =
1601 SCM_UNPACK (scm_from_locale_string ("{"));
1602 scm_print_opts[SCM_PRINT_HIGHLIGHT_SUFFIX_I].val =
1603 SCM_UNPACK (scm_from_locale_string ("}"));
475fa9a5 1604 scm_print_opts[SCM_PRINT_KEYWORD_STYLE_I].val = SCM_UNPACK (sym_reader);
0f2d19dd 1605}
89e00824
ML
1606
1607/*
1608 Local Variables:
1609 c-file-style: "gnu"
1610 End:
1611*/