Add internal-only port structure and move iconv descriptors there.
[bpt/guile.git] / libguile / print.c
CommitLineData
f4bc4e59 1/* Copyright (C) 1995-1999, 2000, 2001, 2002, 2003, 2004, 2006, 2008,
e4598559 2 * 2009, 2010, 2011, 2012, 2013 Free Software Foundation, Inc.
f4bc4e59 3 *
73be1d9e 4 * This library is free software; you can redistribute it and/or
53befeb7
NJ
5 * modify it under the terms of the GNU Lesser General Public License
6 * as published by the Free Software Foundation; either version 3 of
7 * the License, or (at your option) any later version.
0f2d19dd 8 *
53befeb7
NJ
9 * This library is distributed in the hope that it will be useful, but
10 * WITHOUT ANY WARRANTY; without even the implied warranty of
73be1d9e
MV
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 * Lesser General Public License for more details.
0f2d19dd 13 *
73be1d9e
MV
14 * You should have received a copy of the GNU Lesser General Public
15 * License along with this library; if not, write to the Free Software
53befeb7
NJ
16 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
17 * 02110-1301 USA
73be1d9e 18 */
1bbd0b84 19
1bbd0b84 20
0f2d19dd 21\f
dbb605f5
LC
22#ifdef HAVE_CONFIG_H
23# include <config.h>
24#endif
0f2d19dd 25
e6e2e95a 26#include <errno.h>
f4bc4e59
LC
27#include <iconv.h>
28#include <stdio.h>
29#include <assert.h>
30
eca29b02 31#include <uniconv.h>
904a78f1 32#include <unictype.h>
e6e2e95a 33
a0599745
MD
34#include "libguile/_scm.h"
35#include "libguile/chars.h"
a002f1a2 36#include "libguile/continuations.h"
a0599745 37#include "libguile/smob.h"
bbb2ecd1 38#include "libguile/control.h"
a0599745
MD
39#include "libguile/eval.h"
40#include "libguile/macros.h"
41#include "libguile/procprop.h"
42#include "libguile/read.h"
43#include "libguile/weaks.h"
2fb924f6 44#include "libguile/programs.h"
a0599745
MD
45#include "libguile/alist.h"
46#include "libguile/struct.h"
a0599745 47#include "libguile/ports.h"
e4598559 48#include "libguile/ports-internal.h"
a0599745
MD
49#include "libguile/root.h"
50#include "libguile/strings.h"
51#include "libguile/strports.h"
52#include "libguile/vectors.h"
327967ef 53#include "libguile/numbers.h"
6f3b0cc2 54#include "libguile/vm.h"
a0599745
MD
55
56#include "libguile/validate.h"
57#include "libguile/print.h"
22fc179a
HWN
58
59#include "libguile/private-options.h"
60
0f2d19dd
JB
61\f
62
07f49ac7
LC
63/* Character printers. */
64
478848cb
LC
65#define PORT_CONVERSION_HANDLER(port) \
66 SCM_PTAB_ENTRY (port)->ilseq_handler
67
f4bc4e59
LC
68static size_t display_string (const void *, int, size_t, SCM,
69 scm_t_string_failed_conversion_handler);
70
07f49ac7
LC
71static int display_character (scm_t_wchar, SCM,
72 scm_t_string_failed_conversion_handler);
f4bc4e59 73
07f49ac7
LC
74static void write_character (scm_t_wchar, SCM, int);
75
f4bc4e59
LC
76static void write_character_escaped (scm_t_wchar, int, SCM);
77
07f49ac7
LC
78\f
79
0f2d19dd
JB
80/* {Names of immediate symbols}
81 *
82 * This table must agree with the declarations in scm.h: {Immediate Symbols}.
83 */
84
e17d318f
DH
/* Printed representations of the immediate flags, indexed by the value
   of SCM_IFLAGNUM.  The order of the entries must agree with the list
   of flags in tags.h.  */
static const char *iflagnames[] =
{
  "#f",

  /* Elisp nil value.  Should print from elisp as symbol `nil'.  */
  "#nil",

  "#<XXX UNUSED LISP FALSE -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
  "()",
  "#t",
  "#<XXX UNUSED BOOLEAN 0 -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
  "#<XXX UNUSED BOOLEAN 1 -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
  "#<XXX UNUSED BOOLEAN 2 -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
  "#<unspecified>",
  "#<undefined>",
  "#<eof>",

  /* Unbound slot marker for GOOPS.  For internal use in GOOPS only.  */
  "#<unbound>",
};
103
475fa9a5
MV
104SCM_SYMBOL (sym_reader, "reader");
105
92c2555f 106scm_t_option scm_print_opts[] = {
210c0325 107 { SCM_OPTION_SCM, "highlight-prefix", (scm_t_bits)SCM_BOOL_F_BITS,
81ae25da 108 "The string to print before highlighted values." },
210c0325 109 { SCM_OPTION_SCM, "highlight-suffix", (scm_t_bits)SCM_BOOL_F_BITS,
475fa9a5 110 "The string to print after highlighted values." },
210c0325 111 { SCM_OPTION_SCM, "quote-keywordish-symbols", (scm_t_bits)SCM_BOOL_F_BITS,
475fa9a5
MV
112 "How to print symbols that have a colon as their first or last character. "
113 "The value '#f' does not quote the colons; '#t' quotes them; "
8500b186
AW
114 "'reader' quotes them when the reader option 'keywords' is not '#f'." },
115 { SCM_OPTION_BOOLEAN, "escape-newlines", 1,
116 "Render newlines as \\n when printing using `write'." },
62560650 117 { 0 },
e6e4c9af
MD
118};
119
a1ec6916 120SCM_DEFINE (scm_print_options, "print-options-interface", 0, 1, 0,
1bbd0b84 121 (SCM setting),
71331188 122 "Option interface for the print options. Instead of using\n"
1dd05fd8
MG
123 "this procedure directly, use the procedures\n"
124 "@code{print-enable}, @code{print-disable}, @code{print-set!}\n"
125 "and @code{print-options}.")
1bbd0b84 126#define FUNC_NAME s_scm_print_options
e6e4c9af 127{
a51ea417 128 SCM ans = scm_options (setting,
b7ff98dd 129 scm_print_opts,
1bbd0b84 130 FUNC_NAME);
e6e4c9af
MD
131 return ans;
132}
1bbd0b84 133#undef FUNC_NAME
e6e4c9af 134
0f2d19dd
JB
135\f
136/* {Printing of Scheme Objects}
137 */
138
a51ea417 139/* Detection of circular references.
c62fbfe1
MD
140 *
141 * Due to other constraints in the implementation, this code has bad
5d46ebe3
MD
142 * time complexity (O (depth * N)).  The printer code can be
143 * rewritten to be O(N).
a51ea417 144 */
dbb5de29
NJ
/* Record OBJ on top of PSTATE's stack of objects being printed, and
   enlarge the stack (see grow_ref_stack) as soon as it becomes full.
   PSTATE is evaluated several times.  */
#define PUSH_REF(pstate, obj)                                   \
  do                                                            \
    {                                                           \
      PSTATE_STACK_SET (pstate, (pstate)->top, obj);            \
      (pstate)->top++;                                          \
      if ((pstate)->top == (pstate)->ceiling)                   \
        grow_ref_stack (pstate);                                \
    }                                                           \
  while (0)
a51ea417 153
dbb5de29
NJ
/* Called before printing the compound object OBJ.

   If OBJ is already on PSTATE's reference stack (i.e. it is being
   printed right now), jump to LABEL so the caller can print a circular
   reference.  Otherwise, when fancy printing is enabled and the nesting
   limit has been reached, print `#' and return from the enclosing
   function.  Otherwise push OBJ on the stack.

   The expansion refers to a variable named `port' that must be in
   scope, and it may `return;', so it can only be used in functions
   returning void.  */
#define ENTER_NESTED_DATA(pstate, obj, label)                           \
  do                                                                    \
    {                                                                   \
      register unsigned long ref_idx;                                   \
                                                                        \
      for (ref_idx = 0; ref_idx < (pstate)->top; ++ref_idx)             \
        if (scm_is_eq (PSTATE_STACK_REF (pstate, ref_idx), (obj)))      \
          goto label;                                                   \
                                                                        \
      if ((pstate)->fancyp                                              \
          && (pstate)->top - (pstate)->list_offset >= (pstate)->level)  \
        {                                                               \
          scm_putc ('#', port);                                         \
          return;                                                       \
        }                                                               \
                                                                        \
      PUSH_REF (pstate, obj);                                           \
    }                                                                   \
  while (0)
a51ea417 171
dbb5de29
NJ
/* Counterpart of ENTER_NESTED_DATA: pop the top entry of PSTATE's
   reference stack and overwrite the freed slot with SCM_UNDEFINED.  */
#define EXIT_NESTED_DATA(pstate)                                        \
  do                                                                    \
    {                                                                   \
      (pstate)->top--;                                                  \
      PSTATE_STACK_SET (pstate, (pstate)->top, SCM_UNDEFINED);          \
    }                                                                   \
  while (0)
c62fbfe1 179
d5cf5324
DH
180SCM scm_print_state_vtable = SCM_BOOL_F;
181static SCM print_state_pool = SCM_EOL;
9de87eea 182scm_i_pthread_mutex_t print_state_mutex = SCM_I_PTHREAD_MUTEX_INITIALIZER;
c4f37e80 183
#ifdef GUILE_DEBUG /* Used for debugging purposes */

SCM_DEFINE (scm_current_pstate, "current-pstate", 0, 0, 0,
            (),
            "Return the current-pstate -- the car of the\n"
            "@code{print_state_pool}. @code{current-pstate} is only\n"
            "included in @code{--enable-guile-debug} builds.")
#define FUNC_NAME s_scm_current_pstate
{
  /* An empty pool is reported as #f.  Note that the pool is inspected
     here without taking print_state_mutex.  */
  return scm_is_null (print_state_pool)
    ? SCM_BOOL_F
    : SCM_CAR (print_state_pool);
}
#undef FUNC_NAME

#endif
201
202#define PSTATE_SIZE 50L
203
698c0295 204static SCM
1bbd0b84 205make_print_state (void)
698c0295 206{
d5cf5324
DH
207 SCM print_state
208 = scm_make_struct (scm_print_state_vtable, SCM_INUM0, SCM_EOL);
bf685b6d 209 scm_print_state *pstate = SCM_PRINT_STATE (print_state);
00ffa0e7 210 pstate->ref_vect = scm_c_make_vector (PSTATE_SIZE, SCM_UNDEFINED);
4057a3e0 211 pstate->ceiling = SCM_SIMPLE_VECTOR_LENGTH (pstate->ref_vect);
d232520a 212 pstate->highlight_objects = SCM_EOL;
698c0295
MD
213 return print_state;
214}
1cc91f1b 215
c62fbfe1
MD
216SCM
217scm_make_print_state ()
c62fbfe1 218{
230d095f 219 SCM answer = SCM_BOOL_F;
698c0295
MD
220
221 /* First try to allocate a print state from the pool */
9de87eea 222 scm_i_pthread_mutex_lock (&print_state_mutex);
d2e53ed6 223 if (!scm_is_null (print_state_pool))
698c0295 224 {
d5cf5324
DH
225 answer = SCM_CAR (print_state_pool);
226 print_state_pool = SCM_CDR (print_state_pool);
698c0295 227 }
9de87eea 228 scm_i_pthread_mutex_unlock (&print_state_mutex);
698c0295 229
7888309b 230 return scm_is_false (answer) ? make_print_state () : answer;
c62fbfe1 231}
a51ea417 232
698c0295 233void
6e8d25a6 234scm_free_print_state (SCM print_state)
698c0295
MD
235{
236 SCM handle;
237 scm_print_state *pstate = SCM_PRINT_STATE (print_state);
238 /* Cleanup before returning print state to pool.
239 * It is better to do it here. Doing it in scm_prin1
240 * would cost more since that function is called much more
241 * often.
242 */
243 pstate->fancyp = 0;
bb35f315 244 pstate->revealed = 0;
d232520a 245 pstate->highlight_objects = SCM_EOL;
9de87eea 246 scm_i_pthread_mutex_lock (&print_state_mutex);
16d4699b 247 handle = scm_cons (print_state, print_state_pool);
d5cf5324 248 print_state_pool = handle;
9de87eea 249 scm_i_pthread_mutex_unlock (&print_state_mutex);
dfd03fb9
MD
250}
251
252SCM
253scm_i_port_with_print_state (SCM port, SCM print_state)
254{
255 if (SCM_UNBNDP (print_state))
256 {
257 if (SCM_PORT_WITH_PS_P (port))
258 return port;
259 else
260 print_state = scm_make_print_state ();
261 /* port does not need to be coerced since it doesn't have ps */
262 }
263 else
264 port = SCM_COERCE_OUTPORT (port);
265 SCM_RETURN_NEWSMOB (scm_tc16_port_with_ps,
266 SCM_UNPACK (scm_cons (port, print_state)));
698c0295 267}
1cc91f1b 268
a51ea417 269static void
1bbd0b84 270grow_ref_stack (scm_print_state *pstate)
a51ea417 271{
4057a3e0
MV
272 SCM old_vect = pstate->ref_vect;
273 size_t old_size = SCM_SIMPLE_VECTOR_LENGTH (old_vect);
274 size_t new_size = 2 * pstate->ceiling;
00ffa0e7 275 SCM new_vect = scm_c_make_vector (new_size, SCM_UNDEFINED);
b17004b8
DH
276 unsigned long int i;
277
278 for (i = 0; i != old_size; ++i)
4057a3e0 279 SCM_SIMPLE_VECTOR_SET (new_vect, i, SCM_SIMPLE_VECTOR_REF (old_vect, i));
b17004b8
DH
280
281 pstate->ref_vect = new_vect;
bf685b6d 282 pstate->ceiling = new_size;
a51ea417
MD
283}
284
509759dd
MV
/* Accessors for slot I of the reference stack of print state P, which
   is stored in the simple vector P->ref_vect.  */
#define PSTATE_STACK_REF(p, i) \
  SCM_SIMPLE_VECTOR_REF ((p)->ref_vect, (i))
#define PSTATE_STACK_SET(p, i, v) \
  SCM_SIMPLE_VECTOR_SET ((p)->ref_vect, (i), (v))
1cc91f1b 287
a51ea417 288static void
34d19ef6 289print_circref (SCM port, scm_print_state *pstate, SCM ref)
a51ea417 290{
c014a02e
ML
291 register long i;
292 long self = pstate->top - 1;
c62fbfe1 293 i = pstate->top - 1;
509759dd 294 if (scm_is_pair (PSTATE_STACK_REF (pstate, i)))
c62fbfe1
MD
295 {
296 while (i > 0)
297 {
509759dd
MV
298 if (!scm_is_pair (PSTATE_STACK_REF (pstate, i-1))
299 || !scm_is_eq (SCM_CDR (PSTATE_STACK_REF (pstate, i-1)),
300 SCM_CDR (PSTATE_STACK_REF (pstate, i))))
c62fbfe1
MD
301 break;
302 --i;
303 }
304 self = i;
305 }
306 for (i = pstate->top - 1; 1; --i)
509759dd 307 if (scm_is_eq (PSTATE_STACK_REF(pstate, i), ref))
c62fbfe1 308 break;
b7f3516f 309 scm_putc ('#', port);
c62fbfe1 310 scm_intprint (i - self, 10, port);
b7f3516f 311 scm_putc ('#', port);
a51ea417
MD
312}
313
6662998f
MV
314/* Print the name of a symbol. */
315
475fa9a5 316static int
15671c6e 317quote_keywordish_symbols (void)
475fa9a5 318{
15671c6e 319 SCM option = SCM_PRINT_KEYWORD_STYLE;
475fa9a5 320
475fa9a5
MV
321 if (scm_is_false (option))
322 return 0;
323 if (scm_is_eq (option, sym_reader))
324 return scm_is_true (SCM_PACK (SCM_KEYWORD_STYLE));
325 return 1;
326}
327
2e9fc9fc
AW
/* Unicode general categories accepted for the first character of a
   symbol that is printed without the extended `#{...}#' syntax.  */
#define INITIAL_IDENTIFIER_MASK                                 \
  (UC_CATEGORY_MASK_Lu                                          \
   | UC_CATEGORY_MASK_Ll                                        \
   | UC_CATEGORY_MASK_Lt                                        \
   | UC_CATEGORY_MASK_Lm                                        \
   | UC_CATEGORY_MASK_Lo                                        \
   | UC_CATEGORY_MASK_Mn                                        \
   | UC_CATEGORY_MASK_Nl                                        \
   | UC_CATEGORY_MASK_No                                        \
   | UC_CATEGORY_MASK_Pd                                        \
   | UC_CATEGORY_MASK_Pc                                        \
   | UC_CATEGORY_MASK_Po                                        \
   | UC_CATEGORY_MASK_Sc                                        \
   | UC_CATEGORY_MASK_Sm                                        \
   | UC_CATEGORY_MASK_Sk                                        \
   | UC_CATEGORY_MASK_So                                        \
   | UC_CATEGORY_MASK_Co)

/* Categories accepted for the characters after the first one: the
   initial ones plus decimal digits and spacing/enclosing marks.  */
#define SUBSEQUENT_IDENTIFIER_MASK                              \
  (INITIAL_IDENTIFIER_MASK                                      \
   | UC_CATEGORY_MASK_Nd                                        \
   | UC_CATEGORY_MASK_Mc                                        \
   | UC_CATEGORY_MASK_Me)
339
15671c6e
AW
340static int
341symbol_has_extended_read_syntax (SCM sym)
6662998f 342{
15671c6e
AW
343 size_t pos, len = scm_i_symbol_length (sym);
344 scm_t_wchar c;
345
346 /* The empty symbol. */
347 if (len == 0)
348 return 1;
349
350 c = scm_i_symbol_ref (sym, 0);
351
352 /* Single dot; conflicts with dotted-pair notation. */
353 if (len == 1 && c == '.')
354 return 1;
355
356 /* Other initial-character constraints. */
2e9fc9fc 357 if (c == '\'' || c == '`' || c == ',' || c == '"' || c == ';' || c == '#')
15671c6e
AW
358 return 1;
359
360 /* Keywords can be identified by trailing colons too. */
361 if (c == ':' || scm_i_symbol_ref (sym, len - 1) == ':')
362 return quote_keywordish_symbols ();
363
364 /* Number-ish symbols. */
365 if (scm_is_true (scm_i_string_to_number (scm_symbol_to_string (sym), 10)))
366 return 1;
367
2e9fc9fc
AW
368 /* Other disallowed first characters. */
369 if (!uc_is_general_category_withtable (c, INITIAL_IDENTIFIER_MASK))
370 return 1;
371
372 /* Otherwise, any character that's in the identifier category mask is
373 fine to pass through as-is, provided it's not one of the ASCII
374 delimiters like `;'. */
375 for (pos = 1; pos < len; pos++)
6662998f 376 {
2e9fc9fc
AW
377 c = scm_i_symbol_ref (sym, pos);
378 if (!uc_is_general_category_withtable (c, SUBSEQUENT_IDENTIFIER_MASK))
379 return 1;
380 else if (c == '"' || c == ';' || c == '#')
381 return 1;
6662998f 382 }
c6b49e89 383
15671c6e
AW
384 return 0;
385}
386
387static void
388print_normal_symbol (SCM sym, SCM port)
389{
390 scm_display (scm_symbol_to_string (sym), port);
391}
392
15671c6e
AW
393static void
394print_extended_symbol (SCM sym, SCM port)
395{
396 size_t pos, len;
397 scm_t_string_failed_conversion_handler strategy;
398
399 len = scm_i_symbol_length (sym);
478848cb 400 strategy = PORT_CONVERSION_HANDLER (port);
15671c6e
AW
401
402 scm_lfwrite ("#{", 2, port);
403
404 for (pos = 0; pos < len; pos++)
405 {
406 scm_t_wchar c = scm_i_symbol_ref (sym, pos);
407
2e9fc9fc
AW
408 if (uc_is_general_category_withtable (c,
409 SUBSEQUENT_IDENTIFIER_MASK
410 | UC_CATEGORY_MASK_Zs))
15671c6e 411 {
15671c6e
AW
412 if (!display_character (c, port, strategy))
413 scm_encoding_error ("print_extended_symbol", errno,
414 "cannot convert to output locale",
415 port, SCM_MAKE_CHAR (c));
2e9fc9fc
AW
416 }
417 else
418 {
419 display_string ("\\x", 1, 2, port, iconveh_question_mark);
420 scm_intprint (c, 16, port);
421 display_character (';', port, iconveh_question_mark);
15671c6e
AW
422 }
423 }
424
425 scm_lfwrite ("}#", 2, port);
426}
427
428/* FIXME: allow R6RS hex escapes instead of #{...}#. */
429void
430scm_i_print_symbol_name (SCM sym, SCM port)
431{
432 if (symbol_has_extended_read_syntax (sym))
433 print_extended_symbol (sym, port);
434 else
435 print_normal_symbol (sym, port);
6662998f
MV
436}
437
e23106d5
MG
438void
439scm_print_symbol_name (const char *str, size_t len, SCM port)
440{
441 SCM symbol = scm_from_locale_symboln (str, len);
ab33782c 442 scm_i_print_symbol_name (symbol, port);
e23106d5
MG
443}
444
c62fbfe1 445/* Print generally. Handles both write and display according to PSTATE.
0f2d19dd 446 */
8b840115
MD
447SCM_GPROC(s_write, "write", 1, 1, 0, scm_write, g_write);
448SCM_GPROC(s_display, "display", 1, 1, 0, scm_display, g_display);
1cc91f1b 449
d232520a
MV
450static void iprin1 (SCM exp, SCM port, scm_print_state *pstate);
451
dea901d6
MG
452
/* Print the character code I on PORT as the body of an escape: `x'
   followed by hexadecimal digits when R6RS escapes are enabled, octal
   digits otherwise.  */
#define PRINT_CHAR_ESCAPE(i, port)              \
  do                                            \
    {                                           \
      if (SCM_R6RS_ESCAPES_P)                   \
        {                                       \
          scm_puts ("x", port);                 \
          scm_intprint (i, 16, port);           \
        }                                       \
      else                                      \
        scm_intprint (i, 8, port);              \
    }                                           \
  while (0)
466
467
0f2d19dd 468void
1bbd0b84 469scm_iprin1 (SCM exp, SCM port, scm_print_state *pstate)
d232520a
MV
470{
471 if (pstate->fancyp
472 && scm_is_true (scm_memq (exp, pstate->highlight_objects)))
473 {
81ae25da 474 scm_display (SCM_PRINT_HIGHLIGHT_PREFIX, port);
d232520a 475 iprin1 (exp, port, pstate);
81ae25da 476 scm_display (SCM_PRINT_HIGHLIGHT_SUFFIX, port);
d232520a
MV
477 }
478 else
479 iprin1 (exp, port, pstate);
480}
481
482static void
483iprin1 (SCM exp, SCM port, scm_print_state *pstate)
0f2d19dd 484{
54778cd3 485 switch (SCM_ITAG3 (exp))
0f2d19dd 486 {
e34f941a
DH
487 case scm_tc3_tc7_1:
488 case scm_tc3_tc7_2:
489 /* These tc3 tags should never occur in an immediate value. They are
490 * only used in cell types of non-immediates, i. e. the value returned
491 * by SCM_CELL_TYPE (exp) can use these tags.
492 */
493 scm_ipruk ("immediate", exp, port);
494 break;
495 case scm_tc3_int_1:
496 case scm_tc3_int_2:
e11e83f3 497 scm_intprint (SCM_I_INUM (exp), 10, port);
0f2d19dd 498 break;
e34f941a 499 case scm_tc3_imm24:
7866a09b 500 if (SCM_CHARP (exp))
0f2d19dd 501 {
b7f3516f 502 if (SCM_WRITINGP (pstate))
07f49ac7
LC
503 write_character (SCM_CHAR (exp), port, 0);
504 else
b7f3516f 505 {
07f49ac7 506 if (!display_character (SCM_CHAR (exp), port,
478848cb 507 PORT_CONVERSION_HANDLER (port)))
07f49ac7
LC
508 scm_encoding_error (__func__, errno,
509 "cannot convert to output locale",
6851d3be 510 port, exp);
b7f3516f 511 }
0f2d19dd 512 }
a51ea417 513 else if (SCM_IFLAGP (exp)
e17d318f
DH
514 && ((size_t) SCM_IFLAGNUM (exp) < (sizeof iflagnames / sizeof (char *))))
515 {
516 scm_puts (iflagnames [SCM_IFLAGNUM (exp)], port);
517 }
0f2d19dd 518 else
e34f941a
DH
519 {
520 /* unknown immediate value */
521 scm_ipruk ("immediate", exp, port);
522 }
0f2d19dd 523 break;
e34f941a 524 case scm_tc3_cons:
0f2d19dd
JB
525 switch (SCM_TYP7 (exp))
526 {
904a077d
MV
527 case scm_tcs_struct:
528 {
529 ENTER_NESTED_DATA (pstate, exp, circref);
530 if (SCM_OBJ_CLASS_FLAGS (exp) & SCM_CLASSF_GOOPS)
531 {
532 SCM pwps, print = pstate->writingp ? g_write : g_display;
b2b33168 533 if (SCM_UNPACK (print) == 0)
904a077d 534 goto print_struct;
dfd03fb9 535 pwps = scm_i_port_with_print_state (port, pstate->handle);
7663c008 536 pstate->revealed = 1;
904a077d
MV
537 scm_call_generic_2 (print, exp, pwps);
538 }
539 else
540 {
541 print_struct:
542 scm_print_struct (exp, port, pstate);
543 }
544 EXIT_NESTED_DATA (pstate);
545 }
546 break;
0f2d19dd
JB
547 case scm_tcs_cons_imcar:
548 case scm_tcs_cons_nimcar:
c62fbfe1
MD
549 ENTER_NESTED_DATA (pstate, exp, circref);
550 scm_iprlist ("(", exp, ')', port, pstate);
551 EXIT_NESTED_DATA (pstate);
a51ea417
MD
552 break;
553 circref:
c62fbfe1 554 print_circref (port, pstate, exp);
0f2d19dd 555 break;
534c55a9
DH
556 case scm_tc7_number:
557 switch SCM_TYP16 (exp) {
558 case scm_tc16_big:
559 scm_bigprint (exp, port, pstate);
560 break;
561 case scm_tc16_real:
562 scm_print_real (exp, port, pstate);
563 break;
564 case scm_tc16_complex:
565 scm_print_complex (exp, port, pstate);
566 break;
f92e85f7
MV
567 case scm_tc16_fraction:
568 scm_i_print_fraction (exp, port, pstate);
569 break;
534c55a9
DH
570 }
571 break;
9c44cd45
MG
572 case scm_tc7_string:
573 if (SCM_WRITINGP (pstate))
574 {
07f49ac7 575 size_t len, i;
9c44cd45 576
f4bc4e59 577 display_character ('"', port, iconveh_question_mark);
9c44cd45
MG
578 len = scm_i_string_length (exp);
579 for (i = 0; i < len; ++i)
07f49ac7
LC
580 write_character (scm_i_string_ref (exp, i), port, 1);
581
f4bc4e59 582 display_character ('"', port, iconveh_question_mark);
9c44cd45
MG
583 scm_remember_upto_here_1 (exp);
584 }
585 else
f4bc4e59
LC
586 {
587 size_t len, printed;
588
589 len = scm_i_string_length (exp);
590 printed = display_string (scm_i_string_data (exp),
591 scm_i_is_narrow_string (exp),
592 len, port,
478848cb 593 PORT_CONVERSION_HANDLER (port));
f4bc4e59 594 if (SCM_UNLIKELY (printed < len))
f4bc4e59
LC
595 scm_encoding_error (__func__, errno,
596 "cannot convert to output locale",
6851d3be 597 port, scm_c_string_ref (exp, printed));
f4bc4e59
LC
598 }
599
9c44cd45
MG
600 scm_remember_upto_here_1 (exp);
601 break;
28b06554 602 case scm_tc7_symbol:
cc95e00a 603 if (scm_i_symbol_is_interned (exp))
9ff28a13 604 {
e23106d5 605 scm_i_print_symbol_name (exp, port);
9ff28a13
MV
606 scm_remember_upto_here_1 (exp);
607 }
608 else
609 {
610 scm_puts ("#<uninterned-symbol ", port);
e23106d5 611 scm_i_print_symbol_name (exp, port);
9ff28a13 612 scm_putc (' ', port);
0345e278 613 scm_uintprint (SCM_UNPACK (exp), 16, port);
9ff28a13
MV
614 scm_putc ('>', port);
615 }
6662998f 616 break;
e5aca4b5
MV
617 case scm_tc7_variable:
618 scm_i_variable_print (exp, port, pstate);
619 break;
2fb924f6
AW
620 case scm_tc7_program:
621 scm_i_program_print (exp, port, pstate);
622 break;
5b46a8c2
LC
623 case scm_tc7_pointer:
624 scm_i_pointer_print (exp, port, pstate);
e2c2a699 625 break;
c99de5aa
AW
626 case scm_tc7_hashtable:
627 scm_i_hashtable_print (exp, port, pstate);
628 break;
9ea31741
AW
629 case scm_tc7_fluid:
630 scm_i_fluid_print (exp, port, pstate);
631 break;
45cf2428
AW
632 case scm_tc7_dynamic_state:
633 scm_i_dynamic_state_print (exp, port, pstate);
634 break;
6f3b0cc2
AW
635 case scm_tc7_frame:
636 scm_i_frame_print (exp, port, pstate);
637 break;
638 case scm_tc7_objcode:
639 scm_i_objcode_print (exp, port, pstate);
640 break;
641 case scm_tc7_vm:
642 scm_i_vm_print (exp, port, pstate);
643 break;
644 case scm_tc7_vm_cont:
645 scm_i_vm_cont_print (exp, port, pstate);
646 break;
bbb2ecd1
AW
647 case scm_tc7_prompt:
648 scm_i_prompt_print (exp, port, pstate);
649 break;
650 case scm_tc7_with_fluids:
651 scm_i_with_fluids_print (exp, port, pstate);
652 break;
b2637c98
AW
653 case scm_tc7_array:
654 ENTER_NESTED_DATA (pstate, exp, circref);
655 scm_i_print_array (exp, port, pstate);
88c0a1d5 656 EXIT_NESTED_DATA (pstate);
b2637c98
AW
657 break;
658 case scm_tc7_bytevector:
659 scm_i_print_bytevector (exp, port, pstate);
660 break;
ff1feca9
AW
661 case scm_tc7_bitvector:
662 scm_i_print_bitvector (exp, port, pstate);
663 break;
0f2d19dd 664 case scm_tc7_wvect:
c62fbfe1 665 ENTER_NESTED_DATA (pstate, exp, circref);
0f2d19dd 666 if (SCM_IS_WHVEC (exp))
b7f3516f 667 scm_puts ("#wh(", port);
0f2d19dd 668 else
b7f3516f 669 scm_puts ("#w(", port);
0f2d19dd 670 goto common_vector_printer;
0f2d19dd 671 case scm_tc7_vector:
c62fbfe1 672 ENTER_NESTED_DATA (pstate, exp, circref);
b7f3516f 673 scm_puts ("#(", port);
0f2d19dd 674 common_vector_printer:
9fbaf27c 675 {
c014a02e 676 register long i;
4057a3e0 677 long last = SCM_SIMPLE_VECTOR_LENGTH (exp) - 1;
9fbaf27c 678 int cutp = 0;
4057a3e0
MV
679 if (pstate->fancyp
680 && SCM_SIMPLE_VECTOR_LENGTH (exp) > pstate->length)
9fbaf27c
MD
681 {
682 last = pstate->length - 1;
683 cutp = 1;
684 }
c367c4b4 685 if (SCM_I_WVECTP (exp))
9fbaf27c 686 {
c367c4b4
LC
687 /* Elements of weak vectors may not be accessed via the
688 `SIMPLE_VECTOR_REF ()' macro. */
689 for (i = 0; i < last; ++i)
690 {
691 scm_iprin1 (scm_c_vector_ref (exp, i),
692 port, pstate);
693 scm_putc (' ', port);
694 }
9fbaf27c 695 }
c367c4b4
LC
696 else
697 {
698 for (i = 0; i < last; ++i)
699 {
700 scm_iprin1 (SCM_SIMPLE_VECTOR_REF (exp, i), port, pstate);
701 scm_putc (' ', port);
702 }
703 }
704
9fbaf27c
MD
705 if (i == last)
706 {
707 /* CHECK_INTS; */
c367c4b4 708 scm_iprin1 (scm_c_vector_ref (exp, i), port, pstate);
9fbaf27c
MD
709 }
710 if (cutp)
b7f3516f
TT
711 scm_puts (" ...", port);
712 scm_putc (')', port);
9fbaf27c 713 }
c62fbfe1 714 EXIT_NESTED_DATA (pstate);
0f2d19dd 715 break;
0f2d19dd 716 case scm_tc7_port:
5ca6dc39
JB
717 {
718 register long i = SCM_PTOBNUM (exp);
719 if (i < scm_numptob
720 && scm_ptobs[i].print
721 && (scm_ptobs[i].print) (exp, port, pstate))
a51ea417 722 break;
5ca6dc39
JB
723 goto punk;
724 }
725 case scm_tc7_smob:
7a7f7c53
DH
726 ENTER_NESTED_DATA (pstate, exp, circref);
727 SCM_SMOB_DESCRIPTOR (exp).print (exp, port, pstate);
728 EXIT_NESTED_DATA (pstate);
729 break;
0f2d19dd 730 default:
314b8716 731 /* case scm_tcs_closures: */
a51ea417
MD
732 punk:
733 scm_ipruk ("type", exp, port);
0f2d19dd
JB
734 }
735 }
736}
737
c62fbfe1
MD
738/* Print states are necessary for circular reference safe printing.
739 * They are also expensive to allocate. Therefore print states are
740 * kept in a pool so that they can be reused.
741 */
1cc91f1b 742
bb35f315
MV
743/* The PORT argument can also be a print-state/port pair, which will
744 * then be used instead of allocating a new print state. This is
745 * useful for continuing a chain of print calls from Scheme. */
746
a51ea417 747void
1bbd0b84 748scm_prin1 (SCM exp, SCM port, int writingp)
a51ea417 749{
c4f37e80
MV
750 SCM handle = SCM_BOOL_F; /* Will GC protect the handle whilst unlinked */
751 SCM pstate_scm;
c62fbfe1 752 scm_print_state *pstate;
15635be5 753 int old_writingp;
c62fbfe1 754
bb35f315
MV
755 /* If PORT is a print-state/port pair, use that. Else create a new
756 print-state. */
c4f37e80 757
0c95b57d 758 if (SCM_PORT_WITH_PS_P (port))
bb35f315 759 {
52235e71
MD
760 pstate_scm = SCM_PORT_WITH_PS_PS (port);
761 port = SCM_PORT_WITH_PS_PORT (port);
bb35f315
MV
762 }
763 else
c62fbfe1 764 {
c4f37e80 765 /* First try to allocate a print state from the pool */
9de87eea 766 scm_i_pthread_mutex_lock (&print_state_mutex);
d2e53ed6 767 if (!scm_is_null (print_state_pool))
c4f37e80 768 {
d5cf5324
DH
769 handle = print_state_pool;
770 print_state_pool = SCM_CDR (print_state_pool);
c4f37e80 771 }
9de87eea 772 scm_i_pthread_mutex_unlock (&print_state_mutex);
7888309b 773 if (scm_is_false (handle))
d5cf5324 774 handle = scm_list_1 (make_print_state ());
c4f37e80 775 pstate_scm = SCM_CAR (handle);
c62fbfe1 776 }
c62fbfe1 777
c4f37e80 778 pstate = SCM_PRINT_STATE (pstate_scm);
15635be5 779 old_writingp = pstate->writingp;
c62fbfe1
MD
780 pstate->writingp = writingp;
781 scm_iprin1 (exp, port, pstate);
15635be5 782 pstate->writingp = old_writingp;
c62fbfe1 783
bb35f315
MV
784 /* Return print state to pool if it has been created above and
785 hasn't escaped to Scheme. */
786
7888309b 787 if (scm_is_true (handle) && !pstate->revealed)
c4f37e80 788 {
9de87eea 789 scm_i_pthread_mutex_lock (&print_state_mutex);
d5cf5324
DH
790 SCM_SETCDR (handle, print_state_pool);
791 print_state_pool = handle;
9de87eea 792 scm_i_pthread_mutex_unlock (&print_state_mutex);
c4f37e80 793 }
a51ea417
MD
794}
795
f4bc4e59
LC
796/* Convert codepoint CH to UTF-8 and store the result in UTF8. Return
797 the number of bytes of the UTF-8-encoded string. */
798static size_t
799codepoint_to_utf8 (scm_t_wchar ch, scm_t_uint8 utf8[4])
9c44cd45 800{
f4bc4e59
LC
801 size_t len;
802 scm_t_uint32 codepoint;
803
804 codepoint = (scm_t_uint32) ch;
07f49ac7 805
f4bc4e59 806 if (codepoint <= 0x7f)
07f49ac7 807 {
f4bc4e59
LC
808 len = 1;
809 utf8[0] = (scm_t_uint8) codepoint;
810 }
811 else if (codepoint <= 0x7ffUL)
812 {
813 len = 2;
814 utf8[0] = 0xc0 | (codepoint >> 6);
815 utf8[1] = 0x80 | (codepoint & 0x3f);
816 }
817 else if (codepoint <= 0xffffUL)
818 {
819 len = 3;
820 utf8[0] = 0xe0 | (codepoint >> 12);
821 utf8[1] = 0x80 | ((codepoint >> 6) & 0x3f);
822 utf8[2] = 0x80 | (codepoint & 0x3f);
07f49ac7
LC
823 }
824 else
825 {
f4bc4e59
LC
826 len = 4;
827 utf8[0] = 0xf0 | (codepoint >> 18);
828 utf8[1] = 0x80 | ((codepoint >> 12) & 0x3f);
829 utf8[2] = 0x80 | ((codepoint >> 6) & 0x3f);
830 utf8[3] = 0x80 | (codepoint & 0x3f);
831 }
832
833 return len;
834}
835
f4bc4e59
LC
/* Return codepoint number X of the string data S.  A variable named
   `narrow_p' must be in scope at the point of use: when it is true S is
   read as an array of `unsigned char', otherwise as an array of
   `scm_t_wchar'.  */
#define STR_REF(s, x)                                   \
  (narrow_p                                             \
   ? (scm_t_wchar) ((unsigned char *) (s))[x]           \
   : ((scm_t_wchar *) (s))[x])
840
7b292a9d
LC
841/* Write STR to PORT as UTF-8. STR is a LEN-codepoint string; it is
842 narrow if NARROW_P is true, wide otherwise. Return LEN. */
843static size_t
844display_string_as_utf8 (const void *str, int narrow_p, size_t len,
845 SCM port)
846{
847 size_t printed = 0;
848
849 while (len > printed)
850 {
851 size_t utf8_len, i;
852 char *input, utf8_buf[256];
853
854 /* Convert STR to UTF-8. */
855 for (i = printed, utf8_len = 0, input = utf8_buf;
856 i < len && utf8_len + 4 < sizeof (utf8_buf);
857 i++)
858 {
859 utf8_len += codepoint_to_utf8 (STR_REF (str, i),
860 (scm_t_uint8 *) input);
861 input = utf8_buf + utf8_len;
862 }
863
864 /* INPUT was successfully converted, entirely; print the
865 result. */
866 scm_lfwrite (utf8_buf, utf8_len, port);
867 printed += i - printed;
868 }
869
870 assert (printed == len);
871
872 return len;
873}
874
875/* Convert STR through PORT's output conversion descriptor and write the
876 output to PORT. Return the number of codepoints written. */
877static size_t
878display_string_using_iconv (const void *str, int narrow_p, size_t len,
879 SCM port,
880 scm_t_string_failed_conversion_handler strategy)
881{
f4bc4e59 882 size_t printed;
e4598559 883 scm_t_port_internal *pti;
f4bc4e59 884
e4598559 885 pti = SCM_PORT_GET_INTERNAL (port);
f4bc4e59 886
f4bc4e59
LC
887 printed = 0;
888
889 while (len > printed)
890 {
891 size_t done, utf8_len, input_left, output_left, i;
892 size_t codepoints_read, output_len;
893 char *input, *output;
894 char utf8_buf[256], encoded_output[256];
895 size_t offsets[256];
896
897 /* Convert STR to UTF-8. */
898 for (i = printed, utf8_len = 0, input = utf8_buf;
899 i < len && utf8_len + 4 < sizeof (utf8_buf);
900 i++)
07f49ac7 901 {
f4bc4e59
LC
902 offsets[utf8_len] = i;
903 utf8_len += codepoint_to_utf8 (STR_REF (str, i),
904 (scm_t_uint8 *) input);
905 input = utf8_buf + utf8_len;
906 }
907
908 input = utf8_buf;
909 input_left = utf8_len;
910
911 output = encoded_output;
912 output_left = sizeof (encoded_output);
913
e4598559 914 done = iconv (pti->output_cd, &input, &input_left,
f4bc4e59 915 &output, &output_left);
07f49ac7 916
f4bc4e59
LC
917 output_len = sizeof (encoded_output) - output_left;
918
919 if (SCM_UNLIKELY (done == (size_t) -1))
920 {
b2548e23
AW
921 int errno_save = errno;
922
f4bc4e59 923 /* Reset the `iconv' state. */
e4598559 924 iconv (pti->output_cd, NULL, NULL, NULL, NULL);
f4bc4e59 925
7174bc08
LC
926 /* Print the OUTPUT_LEN bytes successfully converted. */
927 scm_lfwrite (encoded_output, output_len, port);
928
929 /* See how many input codepoints these OUTPUT_LEN bytes
930 corresponds to. */
931 codepoints_read = offsets[input - utf8_buf] - printed;
932 printed += codepoints_read;
933
b2548e23 934 if (errno_save == EILSEQ &&
f4bc4e59 935 strategy != SCM_FAILED_CONVERSION_ERROR)
07f49ac7 936 {
f4bc4e59
LC
937 /* Conversion failed somewhere in INPUT and we want to
938 escape or substitute the offending input character. */
939
f4bc4e59 940 if (strategy == SCM_FAILED_CONVERSION_ESCAPE_SEQUENCE)
f1ee6d54 941 {
f4bc4e59
LC
942 scm_t_wchar ch;
943
944 /* Find CH, the offending codepoint, and escape it. */
945 ch = STR_REF (str, offsets[input - utf8_buf]);
946 write_character_escaped (ch, 1, port);
f1ee6d54 947 }
07f49ac7 948 else
f4bc4e59
LC
949 /* STRATEGY is `SCM_FAILED_CONVERSION_QUESTION_MARK'. */
950 display_string ("?", 1, 1, port, strategy);
9c44cd45 951
f4bc4e59
LC
952 printed++;
953 }
954 else
955 /* Something bad happened that we can't handle: bail out. */
956 break;
07f49ac7
LC
957 }
958 else
f4bc4e59
LC
959 {
960 /* INPUT was successfully converted, entirely; print the
961 result. */
962 scm_lfwrite (encoded_output, output_len, port);
963 codepoints_read = i - printed;
964 printed += codepoints_read;
965 }
07f49ac7
LC
966 }
967
968 return printed;
7b292a9d
LC
969}
970
f4bc4e59 971#undef STR_REF
7b292a9d
LC
972
973/* Display the LEN codepoints in STR to PORT according to STRATEGY;
974 return the number of codepoints successfully displayed. If NARROW_P,
975 then STR is interpreted as a sequence of `char', denoting a Latin-1
976 string; otherwise it's interpreted as a sequence of
977 `scm_t_wchar'. */
978static size_t
979display_string (const void *str, int narrow_p,
980 size_t len, SCM port,
981 scm_t_string_failed_conversion_handler strategy)
982
983{
984 scm_t_port *pt;
e4598559 985 scm_t_port_internal *pti;
7b292a9d
LC
986
987 pt = SCM_PTAB_ENTRY (port);
e4598559 988 pti = SCM_PORT_GET_INTERNAL (port);
7b292a9d 989
e4598559 990 if (pti->output_cd == (iconv_t) -1)
7b292a9d
LC
991 /* Initialize the conversion descriptors, if needed. */
992 scm_i_set_port_encoding_x (port, pt->encoding);
993
994 /* FIXME: In 2.1, add a flag to determine whether a port is UTF-8. */
e4598559 995 if (pti->output_cd == (iconv_t) -1)
7b292a9d
LC
996 return display_string_as_utf8 (str, narrow_p, len, port);
997 else
998 return display_string_using_iconv (str, narrow_p, len,
999 port, strategy);
f4bc4e59
LC
1000}
1001
1002/* Attempt to display CH to PORT according to STRATEGY. Return non-zero
1003 if CH was successfully displayed, zero otherwise (e.g., if it was not
1004 representable in PORT's encoding.) */
1005static int
1006display_character (scm_t_wchar ch, SCM port,
1007 scm_t_string_failed_conversion_handler strategy)
1008{
1009 return display_string (&ch, 0, 1, port, strategy) == 1;
07f49ac7
LC
1010}
1011
33d92fe6
LC
1012/* Attempt to pretty-print CH, a combining character, to PORT. Return
1013 zero upon failure, non-zero otherwise. The idea is to print CH above
1014 a dotted circle to make it more visible. */
1015static int
1016write_combining_character (scm_t_wchar ch, SCM port)
1017{
f4bc4e59
LC
1018 scm_t_wchar str[2];
1019
1020 str[0] = SCM_CODEPOINT_DOTTED_CIRCLE;
1021 str[1] = ch;
1022
1023 return display_string (str, 0, 2, port, iconveh_error) == 2;
1024}
33d92fe6 1025
f4bc4e59
LC
1026/* Write CH to PORT in its escaped form, using the string escape syntax
1027 if STRING_ESCAPES_P is non-zero. */
1028static void
1029write_character_escaped (scm_t_wchar ch, int string_escapes_p, SCM port)
1030{
1031 if (string_escapes_p)
33d92fe6 1032 {
f4bc4e59
LC
1033 /* Represent CH using the in-string escape syntax. */
1034
1035 static const char hex[] = "0123456789abcdef";
1036 static const char escapes[7] = "abtnvfr";
1037 char buf[9];
1038
1039 if (ch >= 0x07 && ch <= 0x0D && ch != 0x0A)
33d92fe6 1040 {
f4bc4e59
LC
1041 /* Use special escapes for some C0 controls. */
1042 buf[0] = '\\';
1043 buf[1] = escapes[ch - 0x07];
1044 scm_lfwrite (buf, 2, port);
1045 }
1046 else if (!SCM_R6RS_ESCAPES_P)
1047 {
1048 if (ch <= 0xFF)
1049 {
1050 buf[0] = '\\';
1051 buf[1] = 'x';
1052 buf[2] = hex[ch / 16];
1053 buf[3] = hex[ch % 16];
1054 scm_lfwrite (buf, 4, port);
1055 }
1056 else if (ch <= 0xFFFF)
1057 {
1058 buf[0] = '\\';
1059 buf[1] = 'u';
1060 buf[2] = hex[(ch & 0xF000) >> 12];
1061 buf[3] = hex[(ch & 0xF00) >> 8];
1062 buf[4] = hex[(ch & 0xF0) >> 4];
1063 buf[5] = hex[(ch & 0xF)];
1064 scm_lfwrite (buf, 6, port);
1065 }
1066 else if (ch > 0xFFFF)
1067 {
1068 buf[0] = '\\';
1069 buf[1] = 'U';
1070 buf[2] = hex[(ch & 0xF00000) >> 20];
1071 buf[3] = hex[(ch & 0xF0000) >> 16];
1072 buf[4] = hex[(ch & 0xF000) >> 12];
1073 buf[5] = hex[(ch & 0xF00) >> 8];
1074 buf[6] = hex[(ch & 0xF0) >> 4];
1075 buf[7] = hex[(ch & 0xF)];
1076 scm_lfwrite (buf, 8, port);
1077 }
33d92fe6
LC
1078 }
1079 else
f4bc4e59
LC
1080 {
1081 /* Print an R6RS variable-length hex escape: "\xNNNN;". */
1082 scm_t_wchar ch2 = ch;
1083
1084 int i = 8;
1085 buf[i] = ';';
1086 i --;
1087 if (ch == 0)
1088 buf[i--] = '0';
1089 else
1090 while (ch2 > 0)
1091 {
1092 buf[i] = hex[ch2 & 0xF];
1093 ch2 >>= 4;
1094 i --;
1095 }
1096 buf[i] = 'x';
1097 i --;
1098 buf[i] = '\\';
1099 scm_lfwrite (buf + i, 9 - i, port);
1100 }
33d92fe6
LC
1101 }
1102 else
f4bc4e59
LC
1103 {
1104 /* Represent CH using the character escape syntax. */
1105 const char *name;
33d92fe6 1106
f4bc4e59
LC
1107 name = scm_i_charname (SCM_MAKE_CHAR (ch));
1108 if (name != NULL)
1109 scm_puts (name, port);
1110 else
1111 PRINT_CHAR_ESCAPE (ch, port);
1112 }
33d92fe6
LC
1113}
1114
07f49ac7
LC
1115/* Write CH to PORT, escaping it if it's non-graphic or not
1116 representable in PORT's encoding. If STRING_ESCAPES_P is true and CH
1117 needs to be escaped, it is escaped using the in-string escape syntax;
1118 otherwise the character escape syntax is used. */
1119static void
1120write_character (scm_t_wchar ch, SCM port, int string_escapes_p)
1121{
1122 int printed = 0;
f4bc4e59
LC
1123 scm_t_string_failed_conversion_handler strategy;
1124
478848cb 1125 strategy = PORT_CONVERSION_HANDLER (port);
07f49ac7
LC
1126
1127 if (string_escapes_p)
1128 {
1129 /* Check if CH deserves special treatment. */
1130 if (ch == '"' || ch == '\\')
1131 {
f4bc4e59
LC
1132 display_character ('\\', port, iconveh_question_mark);
1133 display_character (ch, port, strategy);
07f49ac7
LC
1134 printed = 1;
1135 }
8500b186
AW
1136 else if (ch == '\n' && SCM_PRINT_ESCAPE_NEWLINES_P)
1137 {
1138 display_character ('\\', port, iconveh_question_mark);
1139 display_character ('n', port, strategy);
1140 printed = 1;
1141 }
07f49ac7
LC
1142 else if (ch == ' ' || ch == '\n')
1143 {
f4bc4e59 1144 display_character (ch, port, strategy);
07f49ac7
LC
1145 printed = 1;
1146 }
1147 }
1148 else
33d92fe6 1149 {
f4bc4e59 1150 display_string ("#\\", 1, 2, port, iconveh_question_mark);
33d92fe6
LC
1151
1152 if (uc_combining_class (ch) != UC_CCC_NR)
1153 /* Character is a combining character, so attempt to
1154 pretty-print it. */
1155 printed = write_combining_character (ch, port);
1156 }
07f49ac7
LC
1157
1158 if (!printed
1159 && uc_is_general_category_withtable (ch,
1160 UC_CATEGORY_MASK_L |
1161 UC_CATEGORY_MASK_M |
1162 UC_CATEGORY_MASK_N |
1163 UC_CATEGORY_MASK_P |
1164 UC_CATEGORY_MASK_S))
1165 /* CH is graphic; attempt to display it. */
1166 printed = display_character (ch, port, iconveh_error);
1167
1168 if (!printed)
f4bc4e59
LC
1169 /* CH isn't graphic or cannot be represented in PORT's encoding. */
1170 write_character_escaped (ch, string_escapes_p, port);
9c44cd45 1171}
0f2d19dd 1172
b908768a
LC
1173/* Display STR to PORT from START inclusive to END exclusive. */
1174void
1175scm_i_display_substring (SCM str, size_t start, size_t end, SCM port)
1176{
1177 int narrow_p;
1178 const char *buf;
1179 size_t len, printed;
1180
1181 buf = scm_i_string_data (str);
1182 len = end - start;
1183 narrow_p = scm_i_is_narrow_string (str);
1184 buf += start * (narrow_p ? sizeof (char) : sizeof (scm_t_wchar));
1185
1186 printed = display_string (buf, narrow_p, end - start, port,
1187 PORT_CONVERSION_HANDLER (port));
1188
1189 if (SCM_UNLIKELY (printed < len))
1190 scm_encoding_error (__func__, errno,
1191 "cannot convert to output locale",
1192 port, scm_c_string_ref (str, printed + start));
1193}
1194
1195\f
0f2d19dd
JB
1196/* Print an integer.
1197 */
1cc91f1b 1198
0f2d19dd 1199void
a406c9e9 1200scm_intprint (scm_t_intmax n, int radix, SCM port)
0f2d19dd
JB
1201{
1202 char num_buf[SCM_INTBUFLEN];
b7f3516f 1203 scm_lfwrite (num_buf, scm_iint2str (n, radix, num_buf), port);
0f2d19dd
JB
1204}
1205
a406c9e9
MV
1206void
1207scm_uintprint (scm_t_uintmax n, int radix, SCM port)
1208{
1209 char num_buf[SCM_INTBUFLEN];
1210 scm_lfwrite (num_buf, scm_iuint2str (n, radix, num_buf), port);
1211}
1212
0f2d19dd
JB
1213/* Print an object of unrecognized type.
1214 */
1cc91f1b 1215
0f2d19dd 1216void
1bbd0b84 1217scm_ipruk (char *hdr, SCM ptr, SCM port)
0f2d19dd 1218{
b7f3516f
TT
1219 scm_puts ("#<unknown-", port);
1220 scm_puts (hdr, port);
26224b3f 1221 if (1) /* (scm_in_heap_p (ptr)) */ /* FIXME */
0f2d19dd 1222 {
b7f3516f 1223 scm_puts (" (0x", port);
0345e278 1224 scm_uintprint (SCM_CELL_WORD_0 (ptr), 16, port);
b7f3516f 1225 scm_puts (" . 0x", port);
0345e278 1226 scm_uintprint (SCM_CELL_WORD_1 (ptr), 16, port);
b7f3516f 1227 scm_puts (") @", port);
0f2d19dd 1228 }
b7f3516f 1229 scm_puts (" 0x", port);
0345e278 1230 scm_uintprint (SCM_UNPACK (ptr), 16, port);
b7f3516f 1231 scm_putc ('>', port);
0f2d19dd
JB
1232}
1233
1cc91f1b 1234
904a077d 1235/* Print a list.
22a52da1 1236 */
0f2d19dd 1237void
34d19ef6 1238scm_iprlist (char *hdr, SCM exp, int tlr, SCM port, scm_print_state *pstate)
0f2d19dd 1239{
c62fbfe1 1240 register SCM hare, tortoise;
c014a02e 1241 long floor = pstate->top - 2;
b7f3516f 1242 scm_puts (hdr, port);
0f2d19dd 1243 /* CHECK_INTS; */
c62fbfe1
MD
1244 if (pstate->fancyp)
1245 goto fancy_printing;
1246
1247 /* Run a hare and tortoise so that total time complexity will be
1248 O(depth * N) instead of O(N^2). */
1249 hare = SCM_CDR (exp);
1250 tortoise = exp;
d2e53ed6 1251 while (scm_is_pair (hare))
c62fbfe1 1252 {
bc36d050 1253 if (scm_is_eq (hare, tortoise))
c62fbfe1
MD
1254 goto fancy_printing;
1255 hare = SCM_CDR (hare);
d2e53ed6 1256 if (!scm_is_pair (hare))
c62fbfe1
MD
1257 break;
1258 hare = SCM_CDR (hare);
1259 tortoise = SCM_CDR (tortoise);
1260 }
1261
1262 /* No cdr cycles intrinsic to this list */
1263 scm_iprin1 (SCM_CAR (exp), port, pstate);
d2e53ed6 1264 for (exp = SCM_CDR (exp); scm_is_pair (exp); exp = SCM_CDR (exp))
0f2d19dd 1265 {
c014a02e 1266 register long i;
5ca6dc39 1267
c62fbfe1 1268 for (i = floor; i >= 0; --i)
509759dd 1269 if (scm_is_eq (PSTATE_STACK_REF(pstate, i), exp))
c62fbfe1
MD
1270 goto circref;
1271 PUSH_REF (pstate, exp);
b7f3516f 1272 scm_putc (' ', port);
0f2d19dd 1273 /* CHECK_INTS; */
c62fbfe1 1274 scm_iprin1 (SCM_CAR (exp), port, pstate);
0f2d19dd 1275 }
c96d76b8 1276 if (!SCM_NULL_OR_NIL_P (exp))
0f2d19dd 1277 {
b7f3516f 1278 scm_puts (" . ", port);
c62fbfe1 1279 scm_iprin1 (exp, port, pstate);
0f2d19dd 1280 }
c62fbfe1 1281
a51ea417 1282end:
b7f3516f 1283 scm_putc (tlr, port);
c62fbfe1 1284 pstate->top = floor + 2;
a51ea417 1285 return;
c62fbfe1
MD
1286
1287fancy_printing:
1288 {
c014a02e 1289 long n = pstate->length;
c62fbfe1
MD
1290
1291 scm_iprin1 (SCM_CAR (exp), port, pstate);
1292 exp = SCM_CDR (exp); --n;
d2e53ed6 1293 for (; scm_is_pair (exp); exp = SCM_CDR (exp))
c62fbfe1 1294 {
c014a02e 1295 register unsigned long i;
5ca6dc39 1296
c62fbfe1 1297 for (i = 0; i < pstate->top; ++i)
509759dd 1298 if (scm_is_eq (PSTATE_STACK_REF(pstate, i), exp))
c62fbfe1
MD
1299 goto fancy_circref;
1300 if (pstate->fancyp)
1301 {
1302 if (n == 0)
1303 {
b7f3516f 1304 scm_puts (" ...", port);
c62fbfe1
MD
1305 goto skip_tail;
1306 }
1307 else
1308 --n;
1309 }
1310 PUSH_REF(pstate, exp);
1311 ++pstate->list_offset;
b7f3516f 1312 scm_putc (' ', port);
c62fbfe1
MD
1313 /* CHECK_INTS; */
1314 scm_iprin1 (SCM_CAR (exp), port, pstate);
1315 }
1316 }
c96d76b8 1317 if (!SCM_NULL_OR_NIL_P (exp))
c62fbfe1 1318 {
b7f3516f 1319 scm_puts (" . ", port);
c62fbfe1
MD
1320 scm_iprin1 (exp, port, pstate);
1321 }
1322skip_tail:
1323 pstate->list_offset -= pstate->top - floor - 2;
a51ea417 1324 goto end;
a51ea417 1325
c62fbfe1
MD
1326fancy_circref:
1327 pstate->list_offset -= pstate->top - floor - 2;
1328
1329circref:
b7f3516f 1330 scm_puts (" . ", port);
c62fbfe1
MD
1331 print_circref (port, pstate, exp);
1332 goto end;
0f2d19dd
JB
1333}
1334
1335\f
1336
bb35f315
MV
1337int
1338scm_valid_oport_value_p (SCM val)
1339{
368cf54d
GB
1340 return (SCM_OPOUTPORTP (val)
1341 || (SCM_PORT_WITH_PS_P (val)
1342 && SCM_OPOUTPORTP (SCM_PORT_WITH_PS_PORT (val))));
bb35f315
MV
1343}
1344
8b840115 1345/* SCM_GPROC(s_write, "write", 1, 1, 0, scm_write, g_write); */
1cc91f1b 1346
0f2d19dd 1347SCM
1bbd0b84 1348scm_write (SCM obj, SCM port)
0f2d19dd
JB
1349{
1350 if (SCM_UNBNDP (port))
9de87eea 1351 port = scm_current_output_port ();
3eb7e6ee
JB
1352
1353 SCM_ASSERT (scm_valid_oport_value_p (port), port, SCM_ARG2, s_write);
bb35f315 1354
a51ea417 1355 scm_prin1 (obj, port, 1);
0f2d19dd
JB
1356 return SCM_UNSPECIFIED;
1357}
1358
1359
8b840115 1360/* SCM_GPROC(s_display, "display", 1, 1, 0, scm_display, g_display); */
1cc91f1b 1361
0f2d19dd 1362SCM
1bbd0b84 1363scm_display (SCM obj, SCM port)
0f2d19dd
JB
1364{
1365 if (SCM_UNBNDP (port))
9de87eea 1366 port = scm_current_output_port ();
3eb7e6ee
JB
1367
1368 SCM_ASSERT (scm_valid_oport_value_p (port), port, SCM_ARG2, s_display);
bb35f315 1369
a51ea417 1370 scm_prin1 (obj, port, 0);
0f2d19dd
JB
1371 return SCM_UNSPECIFIED;
1372}
1373
70d63753
GB
1374
1375SCM_DEFINE (scm_simple_format, "simple-format", 2, 0, 1,
1376 (SCM destination, SCM message, SCM args),
eca65e90
MG
1377 "Write @var{message} to @var{destination}, defaulting to\n"
1378 "the current output port.\n"
1379 "@var{message} can contain @code{~A} (was @code{%s}) and\n"
1380 "@code{~S} (was @code{%S}) escapes. When printed,\n"
1381 "the escapes are replaced with corresponding members of\n"
b7e64f8b 1382 "@var{args}:\n"
eca65e90
MG
1383 "@code{~A} formats using @code{display} and @code{~S} formats\n"
1384 "using @code{write}.\n"
1385 "If @var{destination} is @code{#t}, then use the current output\n"
1386 "port, if @var{destination} is @code{#f}, then return a string\n"
1387 "containing the formatted text. Does not add a trailing newline.")
70d63753
GB
1388#define FUNC_NAME s_scm_simple_format
1389{
dfd03fb9 1390 SCM port, answer = SCM_UNSPECIFIED;
70d63753
GB
1391 int fReturnString = 0;
1392 int writingp;
889975e5 1393 size_t start, p, end;
70d63753 1394
bc36d050 1395 if (scm_is_eq (destination, SCM_BOOL_T))
daba1a71 1396 {
9de87eea 1397 destination = port = scm_current_output_port ();
daba1a71 1398 }
7888309b 1399 else if (scm_is_false (destination))
daba1a71
MD
1400 {
1401 fReturnString = 1;
0b2c2ba3 1402 port = scm_mkstrport (SCM_INUM0, SCM_BOOL_F,
dfd03fb9
MD
1403 SCM_OPN | SCM_WRTNG,
1404 FUNC_NAME);
1405 destination = port;
daba1a71
MD
1406 }
1407 else
1408 {
1409 SCM_VALIDATE_OPORT_VALUE (1, destination);
dfd03fb9 1410 port = SCM_COERCE_OUTPORT (destination);
daba1a71
MD
1411 }
1412 SCM_VALIDATE_STRING (2, message);
af45e3b0 1413 SCM_VALIDATE_REST_ARGUMENT (args);
70d63753 1414
889975e5
MG
1415 p = 0;
1416 start = 0;
1417 end = scm_i_string_length (message);
b24b5e13 1418 for (p = start; p != end; ++p)
889975e5 1419 if (scm_i_string_ref (message, p) == '~')
70d63753 1420 {
b24b5e13 1421 if (++p == end)
6662998f
MV
1422 break;
1423
889975e5 1424 switch (scm_i_string_ref (message, p))
6662998f
MV
1425 {
1426 case 'A': case 'a':
1427 writingp = 0;
1428 break;
1429 case 'S': case 's':
1430 writingp = 1;
1431 break;
1432 case '~':
889975e5 1433 scm_lfwrite_substr (message, start, p, port);
6662998f
MV
1434 start = p + 1;
1435 continue;
1436 case '%':
889975e5 1437 scm_lfwrite_substr (message, start, p - 1, port);
dfd03fb9 1438 scm_newline (port);
6662998f
MV
1439 start = p + 1;
1440 continue;
1441 default:
1afff620 1442 SCM_MISC_ERROR ("FORMAT: Unsupported format option ~~~A - use (ice-9 format) instead",
889975e5 1443 scm_list_1 (SCM_MAKE_CHAR (scm_i_string_ref (message, p))));
6662998f
MV
1444
1445 }
70d63753 1446
6662998f 1447
d2e53ed6 1448 if (!scm_is_pair (args))
1afff620 1449 SCM_MISC_ERROR ("FORMAT: Missing argument for ~~~A",
889975e5 1450 scm_list_1 (SCM_MAKE_CHAR (scm_i_string_ref (message, p))));
6662998f 1451
889975e5 1452 scm_lfwrite_substr (message, start, p - 1, port);
dfd03fb9 1453 /* we pass destination here */
70d63753
GB
1454 scm_prin1 (SCM_CAR (args), destination, writingp);
1455 args = SCM_CDR (args);
1456 start = p + 1;
1457 }
6662998f 1458
889975e5 1459 scm_lfwrite_substr (message, start, p, port);
bc36d050 1460 if (!scm_is_eq (args, SCM_EOL))
1afff620
KN
1461 SCM_MISC_ERROR ("FORMAT: ~A superfluous arguments",
1462 scm_list_1 (scm_length (args)));
70d63753
GB
1463
1464 if (fReturnString)
1465 answer = scm_strport_to_string (destination);
1466
daba1a71 1467 return scm_return_first (answer, message);
70d63753
GB
1468}
1469#undef FUNC_NAME
1470
1471
3b3b36dd 1472SCM_DEFINE (scm_newline, "newline", 0, 1, 0,
b450f070 1473 (SCM port),
8f85c0c6
NJ
1474 "Send a newline to @var{port}.\n"
1475 "If @var{port} is omitted, send to the current output port.")
1bbd0b84 1476#define FUNC_NAME s_scm_newline
0f2d19dd
JB
1477{
1478 if (SCM_UNBNDP (port))
9de87eea 1479 port = scm_current_output_port ();
3eb7e6ee 1480
34d19ef6 1481 SCM_VALIDATE_OPORT_VALUE (1, port);
bb35f315 1482
0ef4ae82 1483 scm_putc ('\n', SCM_COERCE_OUTPORT (port));
0f2d19dd
JB
1484 return SCM_UNSPECIFIED;
1485}
1bbd0b84 1486#undef FUNC_NAME
0f2d19dd 1487
3b3b36dd 1488SCM_DEFINE (scm_write_char, "write-char", 1, 1, 0,
b450f070 1489 (SCM chr, SCM port),
eca65e90 1490 "Send character @var{chr} to @var{port}.")
1bbd0b84 1491#define FUNC_NAME s_scm_write_char
0f2d19dd
JB
1492{
1493 if (SCM_UNBNDP (port))
9de87eea 1494 port = scm_current_output_port ();
3eb7e6ee 1495
34d19ef6
HWN
1496 SCM_VALIDATE_CHAR (1, chr);
1497 SCM_VALIDATE_OPORT_VALUE (2, port);
07f49ac7
LC
1498
1499 port = SCM_COERCE_OUTPORT (port);
1500 if (!display_character (SCM_CHAR (chr), port,
478848cb 1501 PORT_CONVERSION_HANDLER (port)))
07f49ac7
LC
1502 scm_encoding_error (__func__, errno,
1503 "cannot convert to output locale",
6851d3be 1504 port, chr);
07f49ac7 1505
0f2d19dd
JB
1506 return SCM_UNSPECIFIED;
1507}
1bbd0b84 1508#undef FUNC_NAME
0f2d19dd 1509
0f2d19dd
JB
1510\f
1511
bb35f315 1512/* Call back to Scheme code to do the printing of special objects
c19bc088
MD
1513 * (like structs). SCM_PRINTER_APPLY applies PROC to EXP and a smob
1514 * containing PORT and PSTATE. This object can be used as the port for
1515 * display/write etc to continue the current print chain. The REVEALED
1516 * field of PSTATE is set to true to indicate that the print state has
1517 * escaped to Scheme and thus has to be freed by the GC.
1518 */
1519
/* Smob type tag of the port-with-print-state objects; it receives its
   value from scm_make_smob_type in scm_init_print.  */
92c2555f 1520scm_t_bits scm_tc16_port_with_ps;
c19bc088
MD
1521
1522/* Print exactly as the port itself would */
1523
1524static int
e841c3e0 1525port_with_ps_print (SCM obj, SCM port, scm_print_state *pstate)
c19bc088
MD
1526{
1527 obj = SCM_PORT_WITH_PS_PORT (obj);
1528 return scm_ptobs[SCM_PTOBNUM (obj)].print (obj, port, pstate);
1529}
c4f37e80
MV
1530
1531SCM
1bbd0b84 1532scm_printer_apply (SCM proc, SCM exp, SCM port, scm_print_state *pstate)
c4f37e80 1533{
bb35f315 1534 pstate->revealed = 1;
dfd03fb9
MD
1535 return scm_call_2 (proc, exp,
1536 scm_i_port_with_print_state (port, pstate->handle));
c19bc088
MD
1537}
1538
dfd03fb9 1539SCM_DEFINE (scm_port_with_print_state, "port-with-print-state", 1, 1, 0,
1bbd0b84 1540 (SCM port, SCM pstate),
71331188 1541 "Create a new port which behaves like @var{port}, but with an\n"
dfd03fb9
MD
1542 "included print state @var{pstate}. @var{pstate} is optional.\n"
1543 "If @var{pstate} isn't supplied and @var{port} already has\n"
1544 "a print state, the old print state is reused.")
1bbd0b84 1545#define FUNC_NAME s_scm_port_with_print_state
c19bc088 1546{
34d19ef6 1547 SCM_VALIDATE_OPORT_VALUE (1, port);
dfd03fb9
MD
1548 if (!SCM_UNBNDP (pstate))
1549 SCM_VALIDATE_PRINTSTATE (2, pstate);
1550 return scm_i_port_with_print_state (port, pstate);
c19bc088 1551}
1bbd0b84 1552#undef FUNC_NAME
c19bc088 1553
a1ec6916 1554SCM_DEFINE (scm_get_print_state, "get-print-state", 1, 0, 0,
1bbd0b84 1555 (SCM port),
71331188
MG
1556 "Return the print state of the port @var{port}. If @var{port}\n"
1557 "has no associated print state, @code{#f} is returned.")
1bbd0b84 1558#define FUNC_NAME s_scm_get_print_state
c19bc088 1559{
368cf54d
GB
1560 if (SCM_PORT_WITH_PS_P (port))
1561 return SCM_PORT_WITH_PS_PS (port);
f5f2dcff 1562 if (SCM_OUTPUT_PORT_P (port))
368cf54d 1563 return SCM_BOOL_F;
276dd677 1564 SCM_WRONG_TYPE_ARG (1, port);
c4f37e80 1565}
1bbd0b84 1566#undef FUNC_NAME
bb35f315 1567
c4f37e80 1568\f
1cc91f1b 1569
0f2d19dd
JB
1570void
1571scm_init_print ()
0f2d19dd 1572{
66b1dbf6 1573 SCM type;
d5cf5324 1574
d5cf5324
DH
1575 scm_gc_register_root (&print_state_pool);
1576 scm_gc_register_root (&scm_print_state_vtable);
66b1dbf6
AW
1577 type = scm_make_vtable (scm_from_locale_string (SCM_PRINT_STATE_LAYOUT),
1578 SCM_BOOL_F);
4a655e50 1579 scm_set_struct_vtable_name_x (type, scm_from_latin1_symbol ("print-state"));
bb35f315 1580 scm_print_state_vtable = type;
c4f37e80 1581
c19bc088
MD
1582 /* Don't want to bind a wrapper class in GOOPS, so pass 0 as arg1. */
1583 scm_tc16_port_with_ps = scm_make_smob_type (0, 0);
e841c3e0 1584 scm_set_smob_print (scm_tc16_port_with_ps, port_with_ps_print);
81ae25da 1585
a0599745 1586#include "libguile/print.x"
475fa9a5 1587
8500b186
AW
1588 scm_init_opts (scm_print_options, scm_print_opts);
1589 scm_print_opts[SCM_PRINT_HIGHLIGHT_PREFIX_I].val =
1590 SCM_UNPACK (scm_from_locale_string ("{"));
1591 scm_print_opts[SCM_PRINT_HIGHLIGHT_SUFFIX_I].val =
1592 SCM_UNPACK (scm_from_locale_string ("}"));
475fa9a5 1593 scm_print_opts[SCM_PRINT_KEYWORD_STYLE_I].val = SCM_UNPACK (sym_reader);
0f2d19dd 1594}
89e00824
ML
1595
1596/*
1597 Local Variables:
1598 c-file-style: "gnu"
1599 End:
1600*/