Commit | Line | Data |
---|---|---|
f4bc4e59 | 1 | /* Copyright (C) 1995-1999, 2000, 2001, 2002, 2003, 2004, 2006, 2008, |
6e504a7b | 2 | * 2009, 2010, 2011, 2012, 2013, 2014 Free Software Foundation, Inc. |
f4bc4e59 | 3 | * |
73be1d9e | 4 | * This library is free software; you can redistribute it and/or |
53befeb7 NJ |
5 | * modify it under the terms of the GNU Lesser General Public License |
6 | * as published by the Free Software Foundation; either version 3 of | |
7 | * the License, or (at your option) any later version. | |
0f2d19dd | 8 | * |
53befeb7 NJ |
9 | * This library is distributed in the hope that it will be useful, but |
10 | * WITHOUT ANY WARRANTY; without even the implied warranty of | |
73be1d9e MV |
11 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
12 | * Lesser General Public License for more details. | |
0f2d19dd | 13 | * |
73be1d9e MV |
14 | * You should have received a copy of the GNU Lesser General Public |
15 | * License along with this library; if not, write to the Free Software | |
53befeb7 NJ |
16 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA |
17 | * 02110-1301 USA | |
73be1d9e | 18 | */ |
1bbd0b84 | 19 | |
1bbd0b84 | 20 | |
0f2d19dd | 21 | \f |
dbb605f5 LC |
22 | #ifdef HAVE_CONFIG_H |
23 | # include <config.h> | |
24 | #endif | |
0f2d19dd | 25 | |
e6e2e95a | 26 | #include <errno.h> |
f4bc4e59 LC |
27 | #include <iconv.h> |
28 | #include <stdio.h> | |
29 | #include <assert.h> | |
30 | ||
eca29b02 | 31 | #include <uniconv.h> |
904a78f1 | 32 | #include <unictype.h> |
e6e2e95a | 33 | |
a0599745 MD |
34 | #include "libguile/_scm.h" |
35 | #include "libguile/chars.h" | |
a002f1a2 | 36 | #include "libguile/continuations.h" |
a0599745 | 37 | #include "libguile/smob.h" |
bbb2ecd1 | 38 | #include "libguile/control.h" |
a0599745 MD |
39 | #include "libguile/eval.h" |
40 | #include "libguile/macros.h" | |
41 | #include "libguile/procprop.h" | |
42 | #include "libguile/read.h" | |
2fb924f6 | 43 | #include "libguile/programs.h" |
a0599745 MD |
44 | #include "libguile/alist.h" |
45 | #include "libguile/struct.h" | |
a0599745 | 46 | #include "libguile/ports.h" |
e4598559 | 47 | #include "libguile/ports-internal.h" |
a0599745 MD |
48 | #include "libguile/root.h" |
49 | #include "libguile/strings.h" | |
50 | #include "libguile/strports.h" | |
51 | #include "libguile/vectors.h" | |
327967ef | 52 | #include "libguile/numbers.h" |
6f3b0cc2 | 53 | #include "libguile/vm.h" |
a0599745 MD |
54 | |
55 | #include "libguile/validate.h" | |
56 | #include "libguile/print.h" | |
22fc179a HWN |
57 | |
58 | #include "libguile/private-options.h" | |
59 | ||
0f2d19dd JB |
60 | \f |
61 | ||
07f49ac7 LC |
62 | /* Character printers. */ |
63 | ||
478848cb LC |
64 | #define PORT_CONVERSION_HANDLER(port) \ |
65 | SCM_PTAB_ENTRY (port)->ilseq_handler | |
66 | ||
f4bc4e59 LC |
67 | static size_t display_string (const void *, int, size_t, SCM, |
68 | scm_t_string_failed_conversion_handler); | |
69 | ||
07f49ac7 LC |
70 | static int display_character (scm_t_wchar, SCM, |
71 | scm_t_string_failed_conversion_handler); | |
f4bc4e59 | 72 | |
07f49ac7 LC |
73 | static void write_character (scm_t_wchar, SCM, int); |
74 | ||
f4bc4e59 LC |
75 | static void write_character_escaped (scm_t_wchar, int, SCM); |
76 | ||
07f49ac7 LC |
77 | \f |
78 | ||
0f2d19dd JB |
79 | /* {Names of immediate symbols} |
80 | * | |
81 | * This table must agree with the declarations in scm.h: {Immediate Symbols}. | |
82 | */ | |
83 | ||
e17d318f DH |
/* Printed representations of the immediate flag values, indexed by
   SCM_IFLAGNUM.  This table must agree with the list of flags in
   tags.h.  Both the strings and the pointers to them are read-only.  */
static const char *const iflagnames[] =
{
  "#f",
  "#nil",  /* Elisp nil value. Should print from elisp as symbol `nil'. */
  "#<XXX UNUSED LISP FALSE -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
  "()",
  "#t",
  "#<XXX UNUSED BOOLEAN 0 -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
  "#<XXX UNUSED BOOLEAN 1 -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
  "#<XXX UNUSED BOOLEAN 2 -- DO NOT USE -- SHOULD NEVER BE SEEN XXX>",
  "#<unspecified>",
  "#<undefined>",
  "#<eof>",

  /* Unbound slot marker for GOOPS.  For internal use in GOOPS only.  */
  "#<unbound>",
};
102 | ||
475fa9a5 MV |
103 | SCM_SYMBOL (sym_reader, "reader"); |
104 | ||
92c2555f | 105 | scm_t_option scm_print_opts[] = { |
210c0325 | 106 | { SCM_OPTION_SCM, "highlight-prefix", (scm_t_bits)SCM_BOOL_F_BITS, |
81ae25da | 107 | "The string to print before highlighted values." }, |
210c0325 | 108 | { SCM_OPTION_SCM, "highlight-suffix", (scm_t_bits)SCM_BOOL_F_BITS, |
475fa9a5 | 109 | "The string to print after highlighted values." }, |
210c0325 | 110 | { SCM_OPTION_SCM, "quote-keywordish-symbols", (scm_t_bits)SCM_BOOL_F_BITS, |
475fa9a5 MV |
111 | "How to print symbols that have a colon as their first or last character. " |
112 | "The value '#f' does not quote the colons; '#t' quotes them; " | |
8500b186 AW |
113 | "'reader' quotes them when the reader option 'keywords' is not '#f'." }, |
114 | { SCM_OPTION_BOOLEAN, "escape-newlines", 1, | |
115 | "Render newlines as \\n when printing using `write'." }, | |
6e504a7b MW |
116 | { SCM_OPTION_BOOLEAN, "r7rs-symbols", 0, |
117 | "Escape symbols using R7RS |...| symbol notation." }, | |
62560650 | 118 | { 0 }, |
e6e4c9af MD |
119 | }; |
120 | ||
a1ec6916 | 121 | SCM_DEFINE (scm_print_options, "print-options-interface", 0, 1, 0, |
1bbd0b84 | 122 | (SCM setting), |
71331188 | 123 | "Option interface for the print options. Instead of using\n" |
1dd05fd8 MG |
124 | "this procedure directly, use the procedures\n" |
125 | "@code{print-enable}, @code{print-disable}, @code{print-set!}\n" | |
126 | "and @code{print-options}.") | |
1bbd0b84 | 127 | #define FUNC_NAME s_scm_print_options |
e6e4c9af | 128 | { |
a51ea417 | 129 | SCM ans = scm_options (setting, |
b7ff98dd | 130 | scm_print_opts, |
1bbd0b84 | 131 | FUNC_NAME); |
e6e4c9af MD |
132 | return ans; |
133 | } | |
1bbd0b84 | 134 | #undef FUNC_NAME |
e6e4c9af | 135 | |
0f2d19dd JB |
136 | \f |
137 | /* {Printing of Scheme Objects} | |
138 | */ | |
139 | ||
/* Detection of circular references.
 *
 * Due to other constraints in the implementation, this code has bad
 * time complexity (O (depth * N)).  The printer code can be
 * rewritten to be O (N).
 */
dbb5de29 NJ |
/* Push OBJ onto the reference stack of PSTATE (a pointer to a print
   state) and grow the stack once it becomes full.  PSTATE is evaluated
   several times, so it must be free of side effects; every use is
   parenthesized so that any pointer expression (e.g. `&state') can be
   passed.  */
#define PUSH_REF(pstate, obj)                                   \
  do                                                            \
    {                                                           \
      PSTATE_STACK_SET ((pstate), (pstate)->top, (obj));        \
      (pstate)->top++;                                          \
      if ((pstate)->top == (pstate)->ceiling)                   \
        grow_ref_stack (pstate);                                \
    } while (0)
a51ea417 | 154 | |
dbb5de29 NJ |
/* Enter the nested object OBJ while printing with PSTATE.

   - If OBJ is already on the reference stack, jump to LABEL (the
     caller's circular-reference handler).
   - Otherwise, if PSTATE is in fancy mode and the nesting depth
     (top - list_offset) has reached PSTATE's level limit, write `#' to
     the variable `port' of the enclosing function and return from that
     function.
   - Otherwise push OBJ onto the reference stack.

   The macro must be used inside a function returning void that has a
   variable named `port' in scope.  PSTATE and OBJ are evaluated more
   than once.  The loop index has a suffixed name so that it cannot
   capture an identifier appearing in the OBJ argument.  */
#define ENTER_NESTED_DATA(pstate, obj, label)                           \
  do                                                                    \
    {                                                                   \
      unsigned long enter_idx_;                                         \
      for (enter_idx_ = 0; enter_idx_ < (pstate)->top; ++enter_idx_)    \
        if (scm_is_eq (PSTATE_STACK_REF ((pstate), enter_idx_), (obj))) \
          goto label;                                                   \
      if ((pstate)->fancyp                                              \
          && ((pstate)->top - (pstate)->list_offset                     \
              >= (pstate)->level))                                      \
        {                                                               \
          scm_putc_unlocked ('#', port);                                \
          return;                                                       \
        }                                                               \
      PUSH_REF ((pstate), (obj));                                       \
    } while (0)
a51ea417 | 172 | |
dbb5de29 NJ |
/* Leave the innermost nested object: pop the top entry of PSTATE's
   reference stack and overwrite the vacated slot with SCM_UNDEFINED.
   PSTATE is evaluated several times; each use is parenthesized so any
   pointer expression can be passed.  */
#define EXIT_NESTED_DATA(pstate)                                        \
  do                                                                    \
    {                                                                   \
      --(pstate)->top;                                                  \
      PSTATE_STACK_SET ((pstate), (pstate)->top, SCM_UNDEFINED);        \
    }                                                                   \
  while (0)
c62fbfe1 | 180 | |
d5cf5324 DH |
/* Vtable handed to scm_make_struct when a print state is created;
   initially #f.  */
SCM scm_print_state_vtable = SCM_BOOL_F;
/* List of print states available for reuse; initially empty.  */
static SCM print_state_pool = SCM_EOL;
/* Held by the code in this file while it reads or updates
   print_state_pool.  */
scm_i_pthread_mutex_t print_state_mutex = SCM_I_PTHREAD_MUTEX_INITIALIZER;
c4f37e80 | 184 | |
#ifdef GUILE_DEBUG /* Used for debugging purposes */

SCM_DEFINE (scm_current_pstate, "current-pstate", 0, 0, 0,
            (),
            "Return the current-pstate -- the car of the\n"
            "@code{print_state_pool}. @code{current-pstate} is only\n"
            "included in @code{--enable-guile-debug} builds.")
#define FUNC_NAME s_scm_current_pstate
{
  /* An empty pool has no current print state.  */
  if (scm_is_null (print_state_pool))
    return SCM_BOOL_F;

  return SCM_CAR (print_state_pool);
}
#undef FUNC_NAME

#endif
202 | ||
203 | #define PSTATE_SIZE 50L | |
204 | ||
698c0295 | 205 | static SCM |
1bbd0b84 | 206 | make_print_state (void) |
698c0295 | 207 | { |
d5cf5324 DH |
208 | SCM print_state |
209 | = scm_make_struct (scm_print_state_vtable, SCM_INUM0, SCM_EOL); | |
bf685b6d | 210 | scm_print_state *pstate = SCM_PRINT_STATE (print_state); |
00ffa0e7 | 211 | pstate->ref_vect = scm_c_make_vector (PSTATE_SIZE, SCM_UNDEFINED); |
4057a3e0 | 212 | pstate->ceiling = SCM_SIMPLE_VECTOR_LENGTH (pstate->ref_vect); |
d232520a | 213 | pstate->highlight_objects = SCM_EOL; |
698c0295 MD |
214 | return print_state; |
215 | } | |
1cc91f1b | 216 | |
c62fbfe1 MD |
217 | SCM |
218 | scm_make_print_state () | |
c62fbfe1 | 219 | { |
230d095f | 220 | SCM answer = SCM_BOOL_F; |
698c0295 MD |
221 | |
222 | /* First try to allocate a print state from the pool */ | |
9de87eea | 223 | scm_i_pthread_mutex_lock (&print_state_mutex); |
d2e53ed6 | 224 | if (!scm_is_null (print_state_pool)) |
698c0295 | 225 | { |
d5cf5324 DH |
226 | answer = SCM_CAR (print_state_pool); |
227 | print_state_pool = SCM_CDR (print_state_pool); | |
698c0295 | 228 | } |
9de87eea | 229 | scm_i_pthread_mutex_unlock (&print_state_mutex); |
698c0295 | 230 | |
7888309b | 231 | return scm_is_false (answer) ? make_print_state () : answer; |
c62fbfe1 | 232 | } |
a51ea417 | 233 | |
698c0295 | 234 | void |
6e8d25a6 | 235 | scm_free_print_state (SCM print_state) |
698c0295 MD |
236 | { |
237 | SCM handle; | |
238 | scm_print_state *pstate = SCM_PRINT_STATE (print_state); | |
239 | /* Cleanup before returning print state to pool. | |
240 | * It is better to do it here. Doing it in scm_prin1 | |
241 | * would cost more since that function is called much more | |
242 | * often. | |
243 | */ | |
244 | pstate->fancyp = 0; | |
bb35f315 | 245 | pstate->revealed = 0; |
d232520a | 246 | pstate->highlight_objects = SCM_EOL; |
9de87eea | 247 | scm_i_pthread_mutex_lock (&print_state_mutex); |
16d4699b | 248 | handle = scm_cons (print_state, print_state_pool); |
d5cf5324 | 249 | print_state_pool = handle; |
9de87eea | 250 | scm_i_pthread_mutex_unlock (&print_state_mutex); |
dfd03fb9 MD |
251 | } |
252 | ||
253 | SCM | |
254 | scm_i_port_with_print_state (SCM port, SCM print_state) | |
255 | { | |
256 | if (SCM_UNBNDP (print_state)) | |
257 | { | |
258 | if (SCM_PORT_WITH_PS_P (port)) | |
259 | return port; | |
260 | else | |
261 | print_state = scm_make_print_state (); | |
262 | /* port does not need to be coerced since it doesn't have ps */ | |
263 | } | |
264 | else | |
265 | port = SCM_COERCE_OUTPORT (port); | |
266 | SCM_RETURN_NEWSMOB (scm_tc16_port_with_ps, | |
267 | SCM_UNPACK (scm_cons (port, print_state))); | |
698c0295 | 268 | } |
1cc91f1b | 269 | |
a51ea417 | 270 | static void |
1bbd0b84 | 271 | grow_ref_stack (scm_print_state *pstate) |
a51ea417 | 272 | { |
4057a3e0 MV |
273 | SCM old_vect = pstate->ref_vect; |
274 | size_t old_size = SCM_SIMPLE_VECTOR_LENGTH (old_vect); | |
275 | size_t new_size = 2 * pstate->ceiling; | |
00ffa0e7 | 276 | SCM new_vect = scm_c_make_vector (new_size, SCM_UNDEFINED); |
b17004b8 DH |
277 | unsigned long int i; |
278 | ||
279 | for (i = 0; i != old_size; ++i) | |
4057a3e0 | 280 | SCM_SIMPLE_VECTOR_SET (new_vect, i, SCM_SIMPLE_VECTOR_REF (old_vect, i)); |
b17004b8 DH |
281 | |
282 | pstate->ref_vect = new_vect; | |
bf685b6d | 283 | pstate->ceiling = new_size; |
a51ea417 MD |
284 | } |
285 | ||
509759dd MV |
/* Read, respectively write, slot I of the reference stack (the
   `ref_vect' vector) of the print state pointed to by P.  */
#define PSTATE_STACK_REF(p,i) SCM_SIMPLE_VECTOR_REF((p)->ref_vect, (i))
#define PSTATE_STACK_SET(p,i,v) SCM_SIMPLE_VECTOR_SET((p)->ref_vect, (i), (v))
1cc91f1b | 288 | |
a51ea417 | 289 | static void |
34d19ef6 | 290 | print_circref (SCM port, scm_print_state *pstate, SCM ref) |
a51ea417 | 291 | { |
c014a02e ML |
292 | register long i; |
293 | long self = pstate->top - 1; | |
c62fbfe1 | 294 | i = pstate->top - 1; |
509759dd | 295 | if (scm_is_pair (PSTATE_STACK_REF (pstate, i))) |
c62fbfe1 MD |
296 | { |
297 | while (i > 0) | |
298 | { | |
509759dd MV |
299 | if (!scm_is_pair (PSTATE_STACK_REF (pstate, i-1)) |
300 | || !scm_is_eq (SCM_CDR (PSTATE_STACK_REF (pstate, i-1)), | |
301 | SCM_CDR (PSTATE_STACK_REF (pstate, i)))) | |
c62fbfe1 MD |
302 | break; |
303 | --i; | |
304 | } | |
305 | self = i; | |
306 | } | |
307 | for (i = pstate->top - 1; 1; --i) | |
509759dd | 308 | if (scm_is_eq (PSTATE_STACK_REF(pstate, i), ref)) |
c62fbfe1 | 309 | break; |
0607ebbf | 310 | scm_putc_unlocked ('#', port); |
c62fbfe1 | 311 | scm_intprint (i - self, 10, port); |
0607ebbf | 312 | scm_putc_unlocked ('#', port); |
a51ea417 MD |
313 | } |
314 | ||
6662998f MV |
315 | /* Print the name of a symbol. */ |
316 | ||
475fa9a5 | 317 | static int |
15671c6e | 318 | quote_keywordish_symbols (void) |
475fa9a5 | 319 | { |
15671c6e | 320 | SCM option = SCM_PRINT_KEYWORD_STYLE; |
475fa9a5 | 321 | |
475fa9a5 MV |
322 | if (scm_is_false (option)) |
323 | return 0; | |
324 | if (scm_is_eq (option, sym_reader)) | |
325 | return scm_is_true (SCM_PACK (SCM_KEYWORD_STYLE)); | |
326 | return 1; | |
327 | } | |
328 | ||
2e9fc9fc AW |
/* Unicode general categories that symbol_has_extended_read_syntax
   accepts for the first character of a symbol printed bare.  */
#define INITIAL_IDENTIFIER_MASK                                      \
  (UC_CATEGORY_MASK_Lu | UC_CATEGORY_MASK_Ll | UC_CATEGORY_MASK_Lt   \
   | UC_CATEGORY_MASK_Lm | UC_CATEGORY_MASK_Lo | UC_CATEGORY_MASK_Mn \
   | UC_CATEGORY_MASK_Nl | UC_CATEGORY_MASK_No | UC_CATEGORY_MASK_Pd \
   | UC_CATEGORY_MASK_Pc | UC_CATEGORY_MASK_Po | UC_CATEGORY_MASK_Sc \
   | UC_CATEGORY_MASK_Sm | UC_CATEGORY_MASK_Sk | UC_CATEGORY_MASK_So \
   | UC_CATEGORY_MASK_Co)

/* Categories accepted for every character after the first: the
   initial set plus Nd, Mc and Me.  */
#define SUBSEQUENT_IDENTIFIER_MASK                                    \
  (INITIAL_IDENTIFIER_MASK                                            \
   | UC_CATEGORY_MASK_Nd | UC_CATEGORY_MASK_Mc | UC_CATEGORY_MASK_Me)
340 | ||
4164dd6d | 341 | /* FIXME: Cache this information on the symbol, somehow. */ |
15671c6e AW |
342 | static int |
343 | symbol_has_extended_read_syntax (SCM sym) | |
6662998f | 344 | { |
15671c6e AW |
345 | size_t pos, len = scm_i_symbol_length (sym); |
346 | scm_t_wchar c; | |
347 | ||
348 | /* The empty symbol. */ | |
349 | if (len == 0) | |
350 | return 1; | |
351 | ||
352 | c = scm_i_symbol_ref (sym, 0); | |
353 | ||
4164dd6d AW |
354 | switch (c) |
355 | { | |
356 | case '\'': | |
357 | case '`': | |
358 | case ',': | |
359 | case '"': | |
360 | case ';': | |
361 | case '#': | |
362 | /* Some initial-character constraints. */ | |
363 | return 1; | |
c92ee2b3 MW |
364 | |
365 | case '|': | |
366 | case '\\': | |
367 | /* R7RS allows neither '|' nor '\' in bare symbols. */ | |
368 | if (SCM_PRINT_R7RS_SYMBOLS_P) | |
369 | return 1; | |
370 | break; | |
15671c6e | 371 | |
4164dd6d AW |
372 | case ':': |
373 | /* Symbols that look like keywords. */ | |
374 | return quote_keywordish_symbols (); | |
15671c6e | 375 | |
4164dd6d AW |
376 | case '.': |
377 | /* Single dot conflicts with dotted-pair notation. */ | |
378 | if (len == 1) | |
379 | return 1; | |
380 | /* Fall through to check numbers. */ | |
381 | case '+': | |
382 | case '-': | |
383 | case '0': | |
384 | case '1': | |
385 | case '2': | |
386 | case '3': | |
387 | case '4': | |
388 | case '5': | |
389 | case '6': | |
390 | case '7': | |
391 | case '8': | |
392 | case '9': | |
393 | /* Number-ish symbols. Numbers with radixes already caught be # | |
394 | above. */ | |
395 | if (scm_is_true (scm_i_string_to_number (scm_symbol_to_string (sym), 10))) | |
396 | return 1; | |
397 | break; | |
398 | ||
399 | default: | |
400 | break; | |
401 | } | |
15671c6e | 402 | |
2e9fc9fc AW |
403 | /* Other disallowed first characters. */ |
404 | if (!uc_is_general_category_withtable (c, INITIAL_IDENTIFIER_MASK)) | |
405 | return 1; | |
406 | ||
4164dd6d AW |
407 | /* Keywords can be identified by trailing colons too. */ |
408 | if (scm_i_symbol_ref (sym, len - 1) == ':') | |
409 | return quote_keywordish_symbols (); | |
410 | ||
2e9fc9fc AW |
411 | /* Otherwise, any character that's in the identifier category mask is |
412 | fine to pass through as-is, provided it's not one of the ASCII | |
413 | delimiters like `;'. */ | |
414 | for (pos = 1; pos < len; pos++) | |
6662998f | 415 | { |
2e9fc9fc AW |
416 | c = scm_i_symbol_ref (sym, pos); |
417 | if (!uc_is_general_category_withtable (c, SUBSEQUENT_IDENTIFIER_MASK)) | |
418 | return 1; | |
419 | else if (c == '"' || c == ';' || c == '#') | |
420 | return 1; | |
6e504a7b MW |
421 | else if ((c == '|' || c == '\\') && SCM_PRINT_R7RS_SYMBOLS_P) |
422 | /* R7RS allows neither '|' nor '\' in bare symbols. */ | |
423 | return 1; | |
6662998f | 424 | } |
c6b49e89 | 425 | |
15671c6e AW |
426 | return 0; |
427 | } | |
428 | ||
429 | static void | |
430 | print_normal_symbol (SCM sym, SCM port) | |
431 | { | |
4164dd6d AW |
432 | size_t len; |
433 | scm_t_string_failed_conversion_handler strategy; | |
434 | ||
435 | len = scm_i_symbol_length (sym); | |
0dd7c540 | 436 | strategy = SCM_PTAB_ENTRY (port)->ilseq_handler; |
4164dd6d AW |
437 | |
438 | if (scm_i_is_narrow_symbol (sym)) | |
439 | display_string (scm_i_symbol_chars (sym), 1, len, port, strategy); | |
440 | else | |
441 | display_string (scm_i_symbol_wide_chars (sym), 0, len, port, strategy); | |
15671c6e AW |
442 | } |
443 | ||
15671c6e AW |
444 | static void |
445 | print_extended_symbol (SCM sym, SCM port) | |
446 | { | |
447 | size_t pos, len; | |
448 | scm_t_string_failed_conversion_handler strategy; | |
449 | ||
450 | len = scm_i_symbol_length (sym); | |
478848cb | 451 | strategy = PORT_CONVERSION_HANDLER (port); |
15671c6e | 452 | |
f209aeee | 453 | scm_lfwrite_unlocked ("#{", 2, port); |
15671c6e AW |
454 | |
455 | for (pos = 0; pos < len; pos++) | |
456 | { | |
457 | scm_t_wchar c = scm_i_symbol_ref (sym, pos); | |
458 | ||
2e9fc9fc AW |
459 | if (uc_is_general_category_withtable (c, |
460 | SUBSEQUENT_IDENTIFIER_MASK | |
461 | | UC_CATEGORY_MASK_Zs)) | |
15671c6e | 462 | { |
b4a09988 DK |
463 | if (!display_character (c, port, strategy) |
464 | || (c == '\\' && !display_character (c, port, strategy))) | |
15671c6e AW |
465 | scm_encoding_error ("print_extended_symbol", errno, |
466 | "cannot convert to output locale", | |
467 | port, SCM_MAKE_CHAR (c)); | |
2e9fc9fc AW |
468 | } |
469 | else | |
470 | { | |
c92ee2b3 | 471 | scm_lfwrite_unlocked ("\\x", 2, port); |
2e9fc9fc | 472 | scm_intprint (c, 16, port); |
c92ee2b3 | 473 | scm_putc_unlocked (';', port); |
15671c6e AW |
474 | } |
475 | } | |
476 | ||
f209aeee | 477 | scm_lfwrite_unlocked ("}#", 2, port); |
15671c6e AW |
478 | } |
479 | ||
6e504a7b MW |
480 | static void |
481 | print_r7rs_extended_symbol (SCM sym, SCM port) | |
482 | { | |
483 | size_t pos, len; | |
484 | scm_t_string_failed_conversion_handler strategy; | |
485 | ||
486 | len = scm_i_symbol_length (sym); | |
487 | strategy = PORT_CONVERSION_HANDLER (port); | |
488 | ||
c92ee2b3 | 489 | scm_putc_unlocked ('|', port); |
6e504a7b MW |
490 | |
491 | for (pos = 0; pos < len; pos++) | |
492 | { | |
493 | scm_t_wchar c = scm_i_symbol_ref (sym, pos); | |
494 | ||
495 | switch (c) | |
496 | { | |
c92ee2b3 MW |
497 | case '\a': scm_lfwrite_unlocked ("\\a", 2, port); break; |
498 | case '\b': scm_lfwrite_unlocked ("\\b", 2, port); break; | |
499 | case '\t': scm_lfwrite_unlocked ("\\t", 2, port); break; | |
500 | case '\n': scm_lfwrite_unlocked ("\\n", 2, port); break; | |
501 | case '\r': scm_lfwrite_unlocked ("\\r", 2, port); break; | |
502 | case '|': scm_lfwrite_unlocked ("\\|", 2, port); break; | |
503 | case '\\': scm_lfwrite_unlocked ("\\x5c;", 5, port); break; | |
6e504a7b MW |
504 | default: |
505 | if (uc_is_general_category_withtable (c, | |
1fc651e3 MW |
506 | UC_CATEGORY_MASK_L |
507 | | UC_CATEGORY_MASK_M | |
508 | | UC_CATEGORY_MASK_N | |
509 | | UC_CATEGORY_MASK_P | |
510 | | UC_CATEGORY_MASK_S) | |
511 | || (c == ' ')) | |
6e504a7b MW |
512 | { |
513 | if (!display_character (c, port, strategy)) | |
514 | scm_encoding_error ("print_r7rs_extended_symbol", errno, | |
515 | "cannot convert to output locale", | |
516 | port, SCM_MAKE_CHAR (c)); | |
517 | } | |
518 | else | |
519 | { | |
c92ee2b3 | 520 | scm_lfwrite_unlocked ("\\x", 2, port); |
6e504a7b | 521 | scm_intprint (c, 16, port); |
c92ee2b3 | 522 | scm_putc_unlocked (';', port); |
6e504a7b MW |
523 | } |
524 | break; | |
525 | } | |
526 | } | |
527 | ||
c92ee2b3 | 528 | scm_putc_unlocked ('|', port); |
6e504a7b MW |
529 | } |
530 | ||
531 | /* FIXME: allow R6RS hex escapes instead of #{...}# or |...|. */ | |
4164dd6d AW |
532 | static void |
533 | print_symbol (SCM sym, SCM port) | |
15671c6e | 534 | { |
6e504a7b | 535 | if (!symbol_has_extended_read_syntax (sym)) |
15671c6e | 536 | print_normal_symbol (sym, port); |
6e504a7b MW |
537 | else if (SCM_PRINT_R7RS_SYMBOLS_P) |
538 | print_r7rs_extended_symbol (sym, port); | |
539 | else | |
540 | print_extended_symbol (sym, port); | |
6662998f MV |
541 | } |
542 | ||
e23106d5 MG |
543 | void |
544 | scm_print_symbol_name (const char *str, size_t len, SCM port) | |
545 | { | |
25d50a05 | 546 | SCM symbol = scm_from_utf8_symboln (str, len); |
4164dd6d | 547 | print_symbol (symbol, port); |
e23106d5 MG |
548 | } |
549 | ||
/* Print generally.  Handles both write and display according to PSTATE.
 */
/* g_write and g_display are the objects iprin1 calls, when they are
   set, to print GOOPS instances in write and display mode.  */
SCM_GPROC(s_write, "write", 1, 1, 0, scm_write, g_write);
SCM_GPROC(s_display, "display", 1, 1, 0, scm_display, g_display);

/* The type dispatcher proper; scm_iprin1 wraps it to add highlighting.  */
static void iprin1 (SCM exp, SCM port, scm_print_state *pstate);
556 | ||
dea901d6 MG |
557 | |
/* Print a character as an octal or hex escape: `x' followed by the
   hexadecimal digits of I when R6RS escapes are enabled, otherwise the
   octal digits of I.  */
#define PRINT_CHAR_ESCAPE(i, port)              \
  do                                            \
    {                                           \
      if (SCM_R6RS_ESCAPES_P)                   \
        {                                       \
          scm_puts_unlocked ("x", port);        \
          scm_intprint (i, 16, port);           \
        }                                       \
      else                                      \
        scm_intprint (i, 8, port);              \
    }                                           \
  while (0)
571 | ||
572 | ||
0f2d19dd | 573 | void |
1bbd0b84 | 574 | scm_iprin1 (SCM exp, SCM port, scm_print_state *pstate) |
d232520a MV |
575 | { |
576 | if (pstate->fancyp | |
577 | && scm_is_true (scm_memq (exp, pstate->highlight_objects))) | |
578 | { | |
81ae25da | 579 | scm_display (SCM_PRINT_HIGHLIGHT_PREFIX, port); |
d232520a | 580 | iprin1 (exp, port, pstate); |
81ae25da | 581 | scm_display (SCM_PRINT_HIGHLIGHT_SUFFIX, port); |
d232520a MV |
582 | } |
583 | else | |
584 | iprin1 (exp, port, pstate); | |
585 | } | |
586 | ||
0e92ef40 MW |
587 | static void |
588 | print_vector_or_weak_vector (SCM v, size_t len, SCM (*ref) (SCM, size_t), | |
589 | SCM port, scm_print_state *pstate) | |
590 | { | |
591 | long i; | |
592 | long last = len - 1; | |
593 | int cutp = 0; | |
594 | if (pstate->fancyp && len > pstate->length) | |
595 | { | |
596 | last = pstate->length - 1; | |
597 | cutp = 1; | |
598 | } | |
599 | for (i = 0; i < last; ++i) | |
600 | { | |
601 | scm_iprin1 (ref (v, i), port, pstate); | |
602 | scm_putc_unlocked (' ', port); | |
603 | } | |
604 | if (i == last) | |
605 | { | |
606 | /* CHECK_INTS; */ | |
607 | scm_iprin1 (ref (v, i), port, pstate); | |
608 | } | |
609 | if (cutp) | |
610 | scm_puts_unlocked (" ...", port); | |
611 | scm_putc_unlocked (')', port); | |
612 | } | |
613 | ||
d232520a MV |
/* Print EXP on PORT, dispatching first on its 3-bit tag and, for
   non-immediates, on its 7-bit type code.  PSTATE selects write or
   display mode and carries the reference stack used to detect circular
   structure.

   Cases that can contain other objects are bracketed by
   ENTER_NESTED_DATA / EXIT_NESTED_DATA.  ENTER_NESTED_DATA may jump to
   the `circref' label below when EXP is already on the reference
   stack, or print `#' and return from this function when the nesting
   limit has been reached in fancy mode.  */
static void
iprin1 (SCM exp, SCM port, scm_print_state *pstate)
{
  switch (SCM_ITAG3 (exp))
    {
    case scm_tc3_tc7_1:
    case scm_tc3_tc7_2:
      /* These tc3 tags should never occur in an immediate value.  They are
       * only used in cell types of non-immediates, i. e. the value returned
       * by SCM_CELL_TYPE (exp) can use these tags.
       */
      scm_ipruk ("immediate", exp, port);
      break;
    case scm_tc3_int_1:
    case scm_tc3_int_2:
      /* Immediate integers are printed in decimal.  */
      scm_intprint (SCM_I_INUM (exp), 10, port);
      break;
    case scm_tc3_imm24:
      if (SCM_CHARP (exp))
        {
          if (SCM_WRITINGP (pstate))
            write_character (SCM_CHAR (exp), port, 0);
          else
            {
              /* Display mode: emit the character itself and report a
                 failed conversion as an encoding error.  */
              if (!display_character (SCM_CHAR (exp), port,
                                      PORT_CONVERSION_HANDLER (port)))
                scm_encoding_error (__func__, errno,
                                    "cannot convert to output locale",
                                    port, exp);
            }
        }
      else if (SCM_IFLAGP (exp)
               && ((size_t) SCM_IFLAGNUM (exp) < (sizeof iflagnames / sizeof (char *))))
        {
          /* A flag whose number falls inside the iflagnames table.  */
          scm_puts_unlocked (iflagnames [SCM_IFLAGNUM (exp)], port);
        }
      else
        {
          /* unknown immediate value */
          scm_ipruk ("immediate", exp, port);
        }
      break;
    case scm_tc3_cons:
      switch (SCM_TYP7 (exp))
        {
        case scm_tcs_struct:
          {
            ENTER_NESTED_DATA (pstate, exp, circref);
            if (SCM_OBJ_CLASS_FLAGS (exp) & SCM_CLASSF_GOOPS)
              {
                /* Pick the generic matching the current mode.  If it
                   unpacks to 0, fall back to the plain struct printer.  */
                SCM pwps, print = pstate->writingp ? g_write : g_display;
                if (SCM_UNPACK (print) == 0)
                  goto print_struct;
                /* Hand the print state to the callee wrapped with the
                   port, and mark the state as revealed.  */
                pwps = scm_i_port_with_print_state (port, pstate->handle);
                pstate->revealed = 1;
                scm_call_2 (print, exp, pwps);
              }
            else
              {
              print_struct:
                scm_print_struct (exp, port, pstate);
              }
            EXIT_NESTED_DATA (pstate);
          }
          break;
        case scm_tcs_cons_imcar:
        case scm_tcs_cons_nimcar:
          ENTER_NESTED_DATA (pstate, exp, circref);
          scm_iprlist ("(", exp, ')', port, pstate);
          EXIT_NESTED_DATA (pstate);
          break;
          /* Target of every ENTER_NESTED_DATA in this switch: EXP is
             already being printed further up the stack.  */
        circref:
          print_circref (port, pstate, exp);
          break;
        case scm_tc7_number:
          /* No default arm: a 16-bit type code other than the four
             below prints nothing.  */
          switch SCM_TYP16 (exp) {
          case scm_tc16_big:
            scm_bigprint (exp, port, pstate);
            break;
          case scm_tc16_real:
            scm_print_real (exp, port, pstate);
            break;
          case scm_tc16_complex:
            scm_print_complex (exp, port, pstate);
            break;
          case scm_tc16_fraction:
            scm_i_print_fraction (exp, port, pstate);
            break;
          }
          break;
        case scm_tc7_stringbuf:
          scm_i_print_stringbuf (exp, port, pstate);
          break;
        case scm_tc7_string:
          if (SCM_WRITINGP (pstate))
            {
              size_t len, i;

              /* Write mode: double quotes around the contents, each
                 character going through write_character.  */
              display_character ('"', port, iconveh_question_mark);
              len = scm_i_string_length (exp);
              for (i = 0; i < len; ++i)
                write_character (scm_i_string_ref (exp, i), port, 1);

              display_character ('"', port, iconveh_question_mark);
              scm_remember_upto_here_1 (exp);
            }
          else
            {
              size_t len, printed;

              /* Display mode: emit the raw contents.  A short count
                 means the character at index PRINTED could not be
                 converted.  */
              len = scm_i_string_length (exp);
              printed = display_string (scm_i_string_data (exp),
                                        scm_i_is_narrow_string (exp),
                                        len, port,
                                        PORT_CONVERSION_HANDLER (port));
              if (SCM_UNLIKELY (printed < len))
                scm_encoding_error (__func__, errno,
                                    "cannot convert to output locale",
                                    port, scm_c_string_ref (exp, printed));
            }

          scm_remember_upto_here_1 (exp);
          break;
        case scm_tc7_symbol:
          if (scm_i_symbol_is_interned (exp))
            {
              print_symbol (exp, port);
              scm_remember_upto_here_1 (exp);
            }
          else
            {
              /* Uninterned symbols are wrapped and tagged with the
                 hexadecimal value of the object's bits.  */
              scm_puts_unlocked ("#<uninterned-symbol ", port);
              print_symbol (exp, port);
              scm_putc_unlocked (' ', port);
              scm_uintprint (SCM_UNPACK (exp), 16, port);
              scm_putc_unlocked ('>', port);
            }
          break;
        case scm_tc7_variable:
          scm_i_variable_print (exp, port, pstate);
          break;
        case scm_tc7_program:
          scm_i_program_print (exp, port, pstate);
          break;
        case scm_tc7_pointer:
          scm_i_pointer_print (exp, port, pstate);
          break;
        case scm_tc7_hashtable:
          scm_i_hashtable_print (exp, port, pstate);
          break;
        case scm_tc7_weak_set:
          scm_i_weak_set_print (exp, port, pstate);
          break;
        case scm_tc7_weak_table:
          scm_i_weak_table_print (exp, port, pstate);
          break;
        case scm_tc7_fluid:
          scm_i_fluid_print (exp, port, pstate);
          break;
        case scm_tc7_dynamic_state:
          scm_i_dynamic_state_print (exp, port, pstate);
          break;
        case scm_tc7_frame:
          scm_i_frame_print (exp, port, pstate);
          break;
        case scm_tc7_vm_cont:
          scm_i_vm_cont_print (exp, port, pstate);
          break;
        case scm_tc7_array:
          ENTER_NESTED_DATA (pstate, exp, circref);
          scm_i_print_array (exp, port, pstate);
          EXIT_NESTED_DATA (pstate);
          break;
        case scm_tc7_bytevector:
          scm_i_print_bytevector (exp, port, pstate);
          break;
        case scm_tc7_bitvector:
          scm_i_print_bitvector (exp, port, pstate);
          break;
        case scm_tc7_wvect:
          ENTER_NESTED_DATA (pstate, exp, circref);
          scm_puts_unlocked ("#w(", port);
          print_vector_or_weak_vector (exp, scm_c_weak_vector_length (exp),
                                       scm_c_weak_vector_ref, port, pstate);
          EXIT_NESTED_DATA (pstate);
          break;
        case scm_tc7_vector:
          ENTER_NESTED_DATA (pstate, exp, circref);
          scm_puts_unlocked ("#(", port);
          print_vector_or_weak_vector (exp, SCM_SIMPLE_VECTOR_LENGTH (exp),
                                       scm_c_vector_ref, port, pstate);
          EXIT_NESTED_DATA (pstate);
          break;
        case scm_tc7_port:
          {
            /* Use the port type's own printer when it has one and it
               returns non-zero; otherwise print as an unknown type.  */
            scm_t_ptob_descriptor *ptob = SCM_PORT_DESCRIPTOR (exp);
            if (ptob->print && ptob->print (exp, port, pstate))
              break;
            goto punk;
          }
        case scm_tc7_smob:
          ENTER_NESTED_DATA (pstate, exp, circref);
          SCM_SMOB_DESCRIPTOR (exp).print (exp, port, pstate);
          EXIT_NESTED_DATA (pstate);
          break;
        default:
          /* case scm_tcs_closures: */
        punk:
          scm_ipruk ("type", exp, port);
        }
    }
}
826 | ||
c62fbfe1 MD |
827 | /* Print states are necessary for circular reference safe printing. |
828 | * They are also expensive to allocate. Therefore print states are | |
829 | * kept in a pool so that they can be reused. | |
830 | */ | |
1cc91f1b | 831 | |
bb35f315 MV |
832 | /* The PORT argument can also be a print-state/port pair, which will |
833 | * then be used instead of allocating a new print state. This is | |
834 | * useful for continuing a chain of print calls from Scheme. */ | |
835 | ||
a51ea417 | 836 | void |
1bbd0b84 | 837 | scm_prin1 (SCM exp, SCM port, int writingp) |
a51ea417 | 838 | { |
c4f37e80 MV |
839 | SCM handle = SCM_BOOL_F; /* Will GC protect the handle whilst unlinked */ |
840 | SCM pstate_scm; | |
c62fbfe1 | 841 | scm_print_state *pstate; |
15635be5 | 842 | int old_writingp; |
c62fbfe1 | 843 | |
bb35f315 MV |
844 | /* If PORT is a print-state/port pair, use that. Else create a new |
845 | print-state. */ | |
c4f37e80 | 846 | |
0c95b57d | 847 | if (SCM_PORT_WITH_PS_P (port)) |
bb35f315 | 848 | { |
52235e71 MD |
849 | pstate_scm = SCM_PORT_WITH_PS_PS (port); |
850 | port = SCM_PORT_WITH_PS_PORT (port); | |
bb35f315 MV |
851 | } |
852 | else | |
c62fbfe1 | 853 | { |
c4f37e80 | 854 | /* First try to allocate a print state from the pool */ |
9de87eea | 855 | scm_i_pthread_mutex_lock (&print_state_mutex); |
d2e53ed6 | 856 | if (!scm_is_null (print_state_pool)) |
c4f37e80 | 857 | { |
d5cf5324 DH |
858 | handle = print_state_pool; |
859 | print_state_pool = SCM_CDR (print_state_pool); | |
c4f37e80 | 860 | } |
9de87eea | 861 | scm_i_pthread_mutex_unlock (&print_state_mutex); |
7888309b | 862 | if (scm_is_false (handle)) |
d5cf5324 | 863 | handle = scm_list_1 (make_print_state ()); |
c4f37e80 | 864 | pstate_scm = SCM_CAR (handle); |
c62fbfe1 | 865 | } |
c62fbfe1 | 866 | |
c4f37e80 | 867 | pstate = SCM_PRINT_STATE (pstate_scm); |
15635be5 | 868 | old_writingp = pstate->writingp; |
c62fbfe1 MD |
869 | pstate->writingp = writingp; |
870 | scm_iprin1 (exp, port, pstate); | |
15635be5 | 871 | pstate->writingp = old_writingp; |
c62fbfe1 | 872 | |
bb35f315 MV |
873 | /* Return print state to pool if it has been created above and |
874 | hasn't escaped to Scheme. */ | |
875 | ||
7888309b | 876 | if (scm_is_true (handle) && !pstate->revealed) |
c4f37e80 | 877 | { |
9de87eea | 878 | scm_i_pthread_mutex_lock (&print_state_mutex); |
d5cf5324 DH |
879 | SCM_SETCDR (handle, print_state_pool); |
880 | print_state_pool = handle; | |
9de87eea | 881 | scm_i_pthread_mutex_unlock (&print_state_mutex); |
c4f37e80 | 882 | } |
a51ea417 MD |
883 | } |
884 | ||
f4bc4e59 LC |
885 | /* Convert codepoint CH to UTF-8 and store the result in UTF8. Return |
886 | the number of bytes of the UTF-8-encoded string. */ | |
887 | static size_t | |
888 | codepoint_to_utf8 (scm_t_wchar ch, scm_t_uint8 utf8[4]) | |
9c44cd45 | 889 | { |
f4bc4e59 LC |
890 | size_t len; |
891 | scm_t_uint32 codepoint; | |
892 | ||
893 | codepoint = (scm_t_uint32) ch; | |
07f49ac7 | 894 | |
f4bc4e59 | 895 | if (codepoint <= 0x7f) |
07f49ac7 | 896 | { |
f4bc4e59 LC |
897 | len = 1; |
898 | utf8[0] = (scm_t_uint8) codepoint; | |
899 | } | |
900 | else if (codepoint <= 0x7ffUL) | |
901 | { | |
902 | len = 2; | |
903 | utf8[0] = 0xc0 | (codepoint >> 6); | |
904 | utf8[1] = 0x80 | (codepoint & 0x3f); | |
905 | } | |
906 | else if (codepoint <= 0xffffUL) | |
907 | { | |
908 | len = 3; | |
909 | utf8[0] = 0xe0 | (codepoint >> 12); | |
910 | utf8[1] = 0x80 | ((codepoint >> 6) & 0x3f); | |
911 | utf8[2] = 0x80 | (codepoint & 0x3f); | |
07f49ac7 LC |
912 | } |
913 | else | |
914 | { | |
f4bc4e59 LC |
915 | len = 4; |
916 | utf8[0] = 0xf0 | (codepoint >> 18); | |
917 | utf8[1] = 0x80 | ((codepoint >> 12) & 0x3f); | |
918 | utf8[2] = 0x80 | ((codepoint >> 6) & 0x3f); | |
919 | utf8[3] = 0x80 | (codepoint & 0x3f); | |
920 | } | |
921 | ||
922 | return len; | |
923 | } | |
924 | ||
/* Fetch codepoint number X of string buffer S.  Relies on a variable
   named `narrow_p' being in scope at the point of use: when it is true
   S is read as an array of bytes, otherwise as an array of
   `scm_t_wchar'.  */
#define STR_REF(s, x)                                           \
  ((narrow_p)                                                   \
   ? (scm_t_wchar) ((const unsigned char *) (s))[(x)]           \
   : ((const scm_t_wchar *) (s))[(x)])
929 | ||
7b292a9d LC |
930 | /* Write STR to PORT as UTF-8. STR is a LEN-codepoint string; it is |
931 | narrow if NARROW_P is true, wide otherwise. Return LEN. */ | |
932 | static size_t | |
933 | display_string_as_utf8 (const void *str, int narrow_p, size_t len, | |
934 | SCM port) | |
935 | { | |
936 | size_t printed = 0; | |
937 | ||
938 | while (len > printed) | |
939 | { | |
940 | size_t utf8_len, i; | |
941 | char *input, utf8_buf[256]; | |
942 | ||
943 | /* Convert STR to UTF-8. */ | |
944 | for (i = printed, utf8_len = 0, input = utf8_buf; | |
945 | i < len && utf8_len + 4 < sizeof (utf8_buf); | |
946 | i++) | |
947 | { | |
948 | utf8_len += codepoint_to_utf8 (STR_REF (str, i), | |
949 | (scm_t_uint8 *) input); | |
950 | input = utf8_buf + utf8_len; | |
951 | } | |
952 | ||
953 | /* INPUT was successfully converted, entirely; print the | |
954 | result. */ | |
f209aeee | 955 | scm_lfwrite_unlocked (utf8_buf, utf8_len, port); |
7b292a9d LC |
956 | printed += i - printed; |
957 | } | |
958 | ||
959 | assert (printed == len); | |
960 | ||
961 | return len; | |
962 | } | |
963 | ||
79eb47ea AW |
964 | /* Write STR to PORT as ISO-8859-1. STR is a LEN-codepoint string; it |
965 | is narrow if NARROW_P is true, wide otherwise. Return LEN. */ | |
966 | static size_t | |
967 | display_string_as_latin1 (const void *str, int narrow_p, size_t len, | |
968 | SCM port, | |
969 | scm_t_string_failed_conversion_handler strategy) | |
970 | { | |
971 | size_t printed = 0; | |
972 | ||
973 | if (narrow_p) | |
974 | { | |
975 | scm_lfwrite_unlocked (str, len, port); | |
976 | return len; | |
977 | } | |
978 | ||
979 | while (printed < len) | |
980 | { | |
981 | char buf[256]; | |
982 | size_t i; | |
983 | ||
984 | for (i = 0; i < sizeof(buf) && printed < len; i++, printed++) | |
985 | { | |
986 | scm_t_wchar c = STR_REF (str, printed); | |
987 | ||
988 | if (c < 256) | |
989 | buf[i] = c; | |
990 | else | |
991 | break; | |
992 | } | |
993 | ||
994 | scm_lfwrite_unlocked (buf, i, port); | |
995 | ||
996 | if (i < sizeof(buf) && printed < len) | |
997 | { | |
998 | if (strategy == SCM_FAILED_CONVERSION_ERROR) | |
999 | break; | |
1000 | else if (strategy == SCM_FAILED_CONVERSION_ESCAPE_SEQUENCE) | |
1001 | write_character_escaped (STR_REF (str, printed), 1, port); | |
1002 | else | |
1003 | /* STRATEGY is `SCM_FAILED_CONVERSION_QUESTION_MARK'. */ | |
1004 | display_string ("?", 1, 1, port, strategy); | |
1005 | printed++; | |
1006 | } | |
1007 | } | |
1008 | ||
1009 | return printed; | |
1010 | } | |
1011 | ||
7b292a9d LC |
1012 | /* Convert STR through PORT's output conversion descriptor and write the |
1013 | output to PORT. Return the number of codepoints written. */ | |
1014 | static size_t | |
1015 | display_string_using_iconv (const void *str, int narrow_p, size_t len, | |
1016 | SCM port, | |
1017 | scm_t_string_failed_conversion_handler strategy) | |
1018 | { | |
f4bc4e59 | 1019 | size_t printed; |
6c98257f | 1020 | scm_t_iconv_descriptors *id; |
cdd3d6c9 | 1021 | scm_t_port_internal *pti = SCM_PORT_GET_INTERNAL (port); |
f4bc4e59 | 1022 | |
cdd3d6c9 MW |
1023 | id = scm_i_port_iconv_descriptors (port, SCM_PORT_WRITE); |
1024 | ||
1025 | if (SCM_UNLIKELY (pti->at_stream_start_for_bom_write && len > 0)) | |
1026 | { | |
1027 | scm_t_port *pt = SCM_PTAB_ENTRY (port); | |
1028 | ||
1029 | /* Record that we're no longer at stream start. */ | |
1030 | pti->at_stream_start_for_bom_write = 0; | |
1031 | if (pt->rw_random) | |
1032 | pti->at_stream_start_for_bom_read = 0; | |
1033 | ||
1034 | /* Write a BOM if appropriate. */ | |
f6f4feb0 MW |
1035 | if (SCM_UNLIKELY (strcmp(pt->encoding, "UTF-16") == 0 |
1036 | || strcmp(pt->encoding, "UTF-32") == 0)) | |
cdd3d6c9 MW |
1037 | display_character (SCM_UNICODE_BOM, port, iconveh_error); |
1038 | } | |
f4bc4e59 | 1039 | |
f4bc4e59 LC |
1040 | printed = 0; |
1041 | ||
1042 | while (len > printed) | |
1043 | { | |
1044 | size_t done, utf8_len, input_left, output_left, i; | |
1045 | size_t codepoints_read, output_len; | |
1046 | char *input, *output; | |
1047 | char utf8_buf[256], encoded_output[256]; | |
1048 | size_t offsets[256]; | |
1049 | ||
1050 | /* Convert STR to UTF-8. */ | |
1051 | for (i = printed, utf8_len = 0, input = utf8_buf; | |
1052 | i < len && utf8_len + 4 < sizeof (utf8_buf); | |
1053 | i++) | |
07f49ac7 | 1054 | { |
f4bc4e59 LC |
1055 | offsets[utf8_len] = i; |
1056 | utf8_len += codepoint_to_utf8 (STR_REF (str, i), | |
1057 | (scm_t_uint8 *) input); | |
1058 | input = utf8_buf + utf8_len; | |
1059 | } | |
1060 | ||
1061 | input = utf8_buf; | |
1062 | input_left = utf8_len; | |
1063 | ||
1064 | output = encoded_output; | |
1065 | output_left = sizeof (encoded_output); | |
1066 | ||
6c98257f | 1067 | done = iconv (id->output_cd, &input, &input_left, |
f4bc4e59 | 1068 | &output, &output_left); |
07f49ac7 | 1069 | |
f4bc4e59 LC |
1070 | output_len = sizeof (encoded_output) - output_left; |
1071 | ||
1072 | if (SCM_UNLIKELY (done == (size_t) -1)) | |
1073 | { | |
b2548e23 AW |
1074 | int errno_save = errno; |
1075 | ||
f4bc4e59 | 1076 | /* Reset the `iconv' state. */ |
6c98257f | 1077 | iconv (id->output_cd, NULL, NULL, NULL, NULL); |
f4bc4e59 | 1078 | |
7174bc08 | 1079 | /* Print the OUTPUT_LEN bytes successfully converted. */ |
f209aeee | 1080 | scm_lfwrite_unlocked (encoded_output, output_len, port); |
7174bc08 LC |
1081 | |
1082 | /* See how many input codepoints these OUTPUT_LEN bytes | |
1083 | corresponds to. */ | |
1084 | codepoints_read = offsets[input - utf8_buf] - printed; | |
1085 | printed += codepoints_read; | |
1086 | ||
b2548e23 | 1087 | if (errno_save == EILSEQ && |
f4bc4e59 | 1088 | strategy != SCM_FAILED_CONVERSION_ERROR) |
07f49ac7 | 1089 | { |
f4bc4e59 LC |
1090 | /* Conversion failed somewhere in INPUT and we want to |
1091 | escape or substitute the offending input character. */ | |
1092 | ||
f4bc4e59 | 1093 | if (strategy == SCM_FAILED_CONVERSION_ESCAPE_SEQUENCE) |
f1ee6d54 | 1094 | { |
f4bc4e59 LC |
1095 | scm_t_wchar ch; |
1096 | ||
1097 | /* Find CH, the offending codepoint, and escape it. */ | |
1098 | ch = STR_REF (str, offsets[input - utf8_buf]); | |
1099 | write_character_escaped (ch, 1, port); | |
f1ee6d54 | 1100 | } |
07f49ac7 | 1101 | else |
f4bc4e59 LC |
1102 | /* STRATEGY is `SCM_FAILED_CONVERSION_QUESTION_MARK'. */ |
1103 | display_string ("?", 1, 1, port, strategy); | |
9c44cd45 | 1104 | |
f4bc4e59 LC |
1105 | printed++; |
1106 | } | |
1107 | else | |
1108 | /* Something bad happened that we can't handle: bail out. */ | |
1109 | break; | |
07f49ac7 LC |
1110 | } |
1111 | else | |
f4bc4e59 LC |
1112 | { |
1113 | /* INPUT was successfully converted, entirely; print the | |
1114 | result. */ | |
f209aeee | 1115 | scm_lfwrite_unlocked (encoded_output, output_len, port); |
f4bc4e59 LC |
1116 | codepoints_read = i - printed; |
1117 | printed += codepoints_read; | |
1118 | } | |
07f49ac7 LC |
1119 | } |
1120 | ||
1121 | return printed; | |
7b292a9d LC |
1122 | } |
1123 | ||
f4bc4e59 | 1124 | #undef STR_REF |
7b292a9d LC |
1125 | |
1126 | /* Display the LEN codepoints in STR to PORT according to STRATEGY; | |
1127 | return the number of codepoints successfully displayed. If NARROW_P, | |
1128 | then STR is interpreted as a sequence of `char', denoting a Latin-1 | |
1129 | string; otherwise it's interpreted as a sequence of | |
1130 | `scm_t_wchar'. */ | |
1131 | static size_t | |
1132 | display_string (const void *str, int narrow_p, | |
1133 | size_t len, SCM port, | |
1134 | scm_t_string_failed_conversion_handler strategy) | |
7b292a9d | 1135 | { |
e4598559 | 1136 | scm_t_port_internal *pti; |
7b292a9d | 1137 | |
e4598559 | 1138 | pti = SCM_PORT_GET_INTERNAL (port); |
7b292a9d | 1139 | |
337edc59 | 1140 | if (pti->encoding_mode == SCM_PORT_ENCODING_MODE_UTF8) |
7b292a9d | 1141 | return display_string_as_utf8 (str, narrow_p, len, port); |
f6f4feb0 | 1142 | else if (pti->encoding_mode == SCM_PORT_ENCODING_MODE_LATIN1) |
79eb47ea | 1143 | return display_string_as_latin1 (str, narrow_p, len, port, strategy); |
7b292a9d | 1144 | else |
79eb47ea | 1145 | return display_string_using_iconv (str, narrow_p, len, port, strategy); |
f4bc4e59 LC |
1146 | } |
1147 | ||
1148 | /* Attempt to display CH to PORT according to STRATEGY. Return non-zero | |
1149 | if CH was successfully displayed, zero otherwise (e.g., if it was not | |
1150 | representable in PORT's encoding.) */ | |
1151 | static int | |
1152 | display_character (scm_t_wchar ch, SCM port, | |
1153 | scm_t_string_failed_conversion_handler strategy) | |
1154 | { | |
1155 | return display_string (&ch, 0, 1, port, strategy) == 1; | |
07f49ac7 LC |
1156 | } |
1157 | ||
33d92fe6 LC |
1158 | /* Attempt to pretty-print CH, a combining character, to PORT. Return |
1159 | zero upon failure, non-zero otherwise. The idea is to print CH above | |
1160 | a dotted circle to make it more visible. */ | |
1161 | static int | |
1162 | write_combining_character (scm_t_wchar ch, SCM port) | |
1163 | { | |
f4bc4e59 LC |
1164 | scm_t_wchar str[2]; |
1165 | ||
1166 | str[0] = SCM_CODEPOINT_DOTTED_CIRCLE; | |
1167 | str[1] = ch; | |
1168 | ||
1169 | return display_string (str, 0, 2, port, iconveh_error) == 2; | |
1170 | } | |
33d92fe6 | 1171 | |
f4bc4e59 LC |
1172 | /* Write CH to PORT in its escaped form, using the string escape syntax |
1173 | if STRING_ESCAPES_P is non-zero. */ | |
1174 | static void | |
1175 | write_character_escaped (scm_t_wchar ch, int string_escapes_p, SCM port) | |
1176 | { | |
1177 | if (string_escapes_p) | |
33d92fe6 | 1178 | { |
f4bc4e59 LC |
1179 | /* Represent CH using the in-string escape syntax. */ |
1180 | ||
1181 | static const char hex[] = "0123456789abcdef"; | |
1182 | static const char escapes[7] = "abtnvfr"; | |
1183 | char buf[9]; | |
1184 | ||
1185 | if (ch >= 0x07 && ch <= 0x0D && ch != 0x0A) | |
33d92fe6 | 1186 | { |
f4bc4e59 LC |
1187 | /* Use special escapes for some C0 controls. */ |
1188 | buf[0] = '\\'; | |
1189 | buf[1] = escapes[ch - 0x07]; | |
f209aeee | 1190 | scm_lfwrite_unlocked (buf, 2, port); |
f4bc4e59 LC |
1191 | } |
1192 | else if (!SCM_R6RS_ESCAPES_P) | |
1193 | { | |
1194 | if (ch <= 0xFF) | |
1195 | { | |
1196 | buf[0] = '\\'; | |
1197 | buf[1] = 'x'; | |
1198 | buf[2] = hex[ch / 16]; | |
1199 | buf[3] = hex[ch % 16]; | |
f209aeee | 1200 | scm_lfwrite_unlocked (buf, 4, port); |
f4bc4e59 LC |
1201 | } |
1202 | else if (ch <= 0xFFFF) | |
1203 | { | |
1204 | buf[0] = '\\'; | |
1205 | buf[1] = 'u'; | |
1206 | buf[2] = hex[(ch & 0xF000) >> 12]; | |
1207 | buf[3] = hex[(ch & 0xF00) >> 8]; | |
1208 | buf[4] = hex[(ch & 0xF0) >> 4]; | |
1209 | buf[5] = hex[(ch & 0xF)]; | |
f209aeee | 1210 | scm_lfwrite_unlocked (buf, 6, port); |
f4bc4e59 LC |
1211 | } |
1212 | else if (ch > 0xFFFF) | |
1213 | { | |
1214 | buf[0] = '\\'; | |
1215 | buf[1] = 'U'; | |
1216 | buf[2] = hex[(ch & 0xF00000) >> 20]; | |
1217 | buf[3] = hex[(ch & 0xF0000) >> 16]; | |
1218 | buf[4] = hex[(ch & 0xF000) >> 12]; | |
1219 | buf[5] = hex[(ch & 0xF00) >> 8]; | |
1220 | buf[6] = hex[(ch & 0xF0) >> 4]; | |
1221 | buf[7] = hex[(ch & 0xF)]; | |
f209aeee | 1222 | scm_lfwrite_unlocked (buf, 8, port); |
f4bc4e59 | 1223 | } |
33d92fe6 LC |
1224 | } |
1225 | else | |
f4bc4e59 LC |
1226 | { |
1227 | /* Print an R6RS variable-length hex escape: "\xNNNN;". */ | |
1228 | scm_t_wchar ch2 = ch; | |
1229 | ||
1230 | int i = 8; | |
1231 | buf[i] = ';'; | |
1232 | i --; | |
1233 | if (ch == 0) | |
1234 | buf[i--] = '0'; | |
1235 | else | |
1236 | while (ch2 > 0) | |
1237 | { | |
1238 | buf[i] = hex[ch2 & 0xF]; | |
1239 | ch2 >>= 4; | |
1240 | i --; | |
1241 | } | |
1242 | buf[i] = 'x'; | |
1243 | i --; | |
1244 | buf[i] = '\\'; | |
f209aeee | 1245 | scm_lfwrite_unlocked (buf + i, 9 - i, port); |
f4bc4e59 | 1246 | } |
33d92fe6 LC |
1247 | } |
1248 | else | |
f4bc4e59 LC |
1249 | { |
1250 | /* Represent CH using the character escape syntax. */ | |
1251 | const char *name; | |
33d92fe6 | 1252 | |
f4bc4e59 LC |
1253 | name = scm_i_charname (SCM_MAKE_CHAR (ch)); |
1254 | if (name != NULL) | |
0607ebbf | 1255 | scm_puts_unlocked (name, port); |
f4bc4e59 LC |
1256 | else |
1257 | PRINT_CHAR_ESCAPE (ch, port); | |
1258 | } | |
33d92fe6 LC |
1259 | } |
1260 | ||
07f49ac7 LC |
1261 | /* Write CH to PORT, escaping it if it's non-graphic or not |
1262 | representable in PORT's encoding. If STRING_ESCAPES_P is true and CH | |
1263 | needs to be escaped, it is escaped using the in-string escape syntax; | |
1264 | otherwise the character escape syntax is used. */ | |
1265 | static void | |
1266 | write_character (scm_t_wchar ch, SCM port, int string_escapes_p) | |
1267 | { | |
1268 | int printed = 0; | |
f4bc4e59 LC |
1269 | scm_t_string_failed_conversion_handler strategy; |
1270 | ||
478848cb | 1271 | strategy = PORT_CONVERSION_HANDLER (port); |
07f49ac7 LC |
1272 | |
1273 | if (string_escapes_p) | |
1274 | { | |
1275 | /* Check if CH deserves special treatment. */ | |
1276 | if (ch == '"' || ch == '\\') | |
1277 | { | |
f4bc4e59 LC |
1278 | display_character ('\\', port, iconveh_question_mark); |
1279 | display_character (ch, port, strategy); | |
07f49ac7 LC |
1280 | printed = 1; |
1281 | } | |
8500b186 AW |
1282 | else if (ch == '\n' && SCM_PRINT_ESCAPE_NEWLINES_P) |
1283 | { | |
1284 | display_character ('\\', port, iconveh_question_mark); | |
1285 | display_character ('n', port, strategy); | |
1286 | printed = 1; | |
1287 | } | |
07f49ac7 LC |
1288 | else if (ch == ' ' || ch == '\n') |
1289 | { | |
f4bc4e59 | 1290 | display_character (ch, port, strategy); |
07f49ac7 LC |
1291 | printed = 1; |
1292 | } | |
1293 | } | |
1294 | else | |
33d92fe6 | 1295 | { |
f4bc4e59 | 1296 | display_string ("#\\", 1, 2, port, iconveh_question_mark); |
33d92fe6 LC |
1297 | |
1298 | if (uc_combining_class (ch) != UC_CCC_NR) | |
1299 | /* Character is a combining character, so attempt to | |
1300 | pretty-print it. */ | |
1301 | printed = write_combining_character (ch, port); | |
1302 | } | |
07f49ac7 LC |
1303 | |
1304 | if (!printed | |
1305 | && uc_is_general_category_withtable (ch, | |
1306 | UC_CATEGORY_MASK_L | | |
1307 | UC_CATEGORY_MASK_M | | |
1308 | UC_CATEGORY_MASK_N | | |
1309 | UC_CATEGORY_MASK_P | | |
1310 | UC_CATEGORY_MASK_S)) | |
1311 | /* CH is graphic; attempt to display it. */ | |
1312 | printed = display_character (ch, port, iconveh_error); | |
1313 | ||
1314 | if (!printed) | |
f4bc4e59 LC |
1315 | /* CH isn't graphic or cannot be represented in PORT's encoding. */ |
1316 | write_character_escaped (ch, string_escapes_p, port); | |
9c44cd45 | 1317 | } |
0f2d19dd | 1318 | |
b908768a LC |
1319 | /* Display STR to PORT from START inclusive to END exclusive. */ |
1320 | void | |
1321 | scm_i_display_substring (SCM str, size_t start, size_t end, SCM port) | |
1322 | { | |
1323 | int narrow_p; | |
1324 | const char *buf; | |
1325 | size_t len, printed; | |
1326 | ||
1327 | buf = scm_i_string_data (str); | |
1328 | len = end - start; | |
1329 | narrow_p = scm_i_is_narrow_string (str); | |
1330 | buf += start * (narrow_p ? sizeof (char) : sizeof (scm_t_wchar)); | |
1331 | ||
1332 | printed = display_string (buf, narrow_p, end - start, port, | |
1333 | PORT_CONVERSION_HANDLER (port)); | |
1334 | ||
1335 | if (SCM_UNLIKELY (printed < len)) | |
1336 | scm_encoding_error (__func__, errno, | |
1337 | "cannot convert to output locale", | |
1338 | port, scm_c_string_ref (str, printed + start)); | |
1339 | } | |
1340 | ||
1341 | \f | |
0f2d19dd JB |
1342 | /* Print an integer. |
1343 | */ | |
1cc91f1b | 1344 | |
0f2d19dd | 1345 | void |
a406c9e9 | 1346 | scm_intprint (scm_t_intmax n, int radix, SCM port) |
0f2d19dd JB |
1347 | { |
1348 | char num_buf[SCM_INTBUFLEN]; | |
f209aeee | 1349 | scm_lfwrite_unlocked (num_buf, scm_iint2str (n, radix, num_buf), port); |
0f2d19dd JB |
1350 | } |
1351 | ||
a406c9e9 MV |
1352 | void |
1353 | scm_uintprint (scm_t_uintmax n, int radix, SCM port) | |
1354 | { | |
1355 | char num_buf[SCM_INTBUFLEN]; | |
f209aeee | 1356 | scm_lfwrite_unlocked (num_buf, scm_iuint2str (n, radix, num_buf), port); |
a406c9e9 MV |
1357 | } |
1358 | ||
0f2d19dd JB |
1359 | /* Print an object of unrecognized type. |
1360 | */ | |
1cc91f1b | 1361 | |
0f2d19dd | 1362 | void |
1bbd0b84 | 1363 | scm_ipruk (char *hdr, SCM ptr, SCM port) |
0f2d19dd | 1364 | { |
0607ebbf AW |
1365 | scm_puts_unlocked ("#<unknown-", port); |
1366 | scm_puts_unlocked (hdr, port); | |
26224b3f | 1367 | if (1) /* (scm_in_heap_p (ptr)) */ /* FIXME */ |
0f2d19dd | 1368 | { |
0607ebbf | 1369 | scm_puts_unlocked (" (0x", port); |
0345e278 | 1370 | scm_uintprint (SCM_CELL_WORD_0 (ptr), 16, port); |
0607ebbf | 1371 | scm_puts_unlocked (" . 0x", port); |
0345e278 | 1372 | scm_uintprint (SCM_CELL_WORD_1 (ptr), 16, port); |
0607ebbf | 1373 | scm_puts_unlocked (") @", port); |
0f2d19dd | 1374 | } |
0607ebbf | 1375 | scm_puts_unlocked (" 0x", port); |
0345e278 | 1376 | scm_uintprint (SCM_UNPACK (ptr), 16, port); |
0607ebbf | 1377 | scm_putc_unlocked ('>', port); |
0f2d19dd JB |
1378 | } |
1379 | ||
1cc91f1b | 1380 | |
/* Print the list EXP on PORT: first the string HDR, then the elements
   separated by spaces (with " . " before a non-nil tail), then the
   character TLR.

   Two strategies are used.  The plain one is taken when PSTATE->fancyp
   is false and the list has no cdr cycle of its own.  The "fancy" one
   is taken otherwise; it additionally maintains PSTATE->list_offset
   and, when PSTATE->fancyp is set, truncates the output with " ..."
   once the element budget taken from PSTATE->length is used up.  In
   both, meeting a pair that is already on PSTATE's reference stack ends
   the list with " . " followed by whatever print_circref emits.

   On return PSTATE->top is back to the value it had on entry.  */
void
scm_iprlist (char *hdr, SCM exp, int tlr, SCM port, scm_print_state *pstate)
{
  register SCM hare, tortoise;
  /* Entry value of the stack top, minus 2; used as the upper bound of
     the plain-mode scan and to restore `top' at `end'.
     NOTE(review): presumably the caller has already pushed EXP itself,
     which would be why the plain scan stops short of the topmost
     entries -- confirm against ENTER_NESTED_DATA.  */
  long floor = pstate->top - 2;
  scm_puts_unlocked (hdr, port);
  /* CHECK_INTS; */
  if (pstate->fancyp)
    goto fancy_printing;

  /* Run a hare and tortoise so that total time complexity will be
     O(depth * N) instead of O(N^2).  The hare advances two cdrs per
     step of the tortoise; if they ever meet, the cdr chain is cyclic
     and the fancy path takes over.  */
  hare = SCM_CDR (exp);
  tortoise = exp;
  while (scm_is_pair (hare))
    {
      if (scm_is_eq (hare, tortoise))
        goto fancy_printing;
      hare = SCM_CDR (hare);
      if (!scm_is_pair (hare))
        break;
      hare = SCM_CDR (hare);
      tortoise = SCM_CDR (tortoise);
    }

  /* No cdr cycles intrinsic to this list */
  scm_iprin1 (SCM_CAR (exp), port, pstate);
  for (exp = SCM_CDR (exp); scm_is_pair (exp); exp = SCM_CDR (exp))
    {
      register long i;

      /* Only the entries at or below FLOOR are compared against: a
         match means this tail is a structure already being printed.  */
      for (i = floor; i >= 0; --i)
        if (scm_is_eq (PSTATE_STACK_REF(pstate, i), exp))
          goto circref;
      PUSH_REF (pstate, exp);
      scm_putc_unlocked (' ', port);
      /* CHECK_INTS; */
      scm_iprin1 (SCM_CAR (exp), port, pstate);
    }
  /* Improper list: print the tail in dotted notation.  */
  if (!SCM_NULL_OR_NIL_P (exp))
    {
      scm_puts_unlocked (" . ", port);
      scm_iprin1 (exp, port, pstate);
    }

  /* Common exit: write the trailer and restore the stack top to its
     entry value.  */
end:
  scm_putc_unlocked (tlr, port);
  pstate->top = floor + 2;
  return;

fancy_printing:
  {
    /* Remaining element budget; only consulted when `fancyp' is set.  */
    long n = pstate->length;

    scm_iprin1 (SCM_CAR (exp), port, pstate);
    exp = SCM_CDR (exp); --n;
    for (; scm_is_pair (exp); exp = SCM_CDR (exp))
      {
        register unsigned long i;

        /* Here the whole reference stack is scanned, including the
           pairs of this very list pushed below, so a cdr cycle within
           the list is caught.  */
        for (i = 0; i < pstate->top; ++i)
          if (scm_is_eq (PSTATE_STACK_REF(pstate, i), exp))
            goto fancy_circref;
        if (pstate->fancyp)
          {
            if (n == 0)
              {
                /* Budget exhausted: elide the rest of the list.  */
                scm_puts_unlocked (" ...", port);
                goto skip_tail;
              }
            else
              --n;
          }
        PUSH_REF(pstate, exp);
        ++pstate->list_offset;
        scm_putc_unlocked (' ', port);
        /* CHECK_INTS; */
        scm_iprin1 (SCM_CAR (exp), port, pstate);
      }
  }
  if (!SCM_NULL_OR_NIL_P (exp))
    {
      scm_puts_unlocked (" . ", port);
      scm_iprin1 (exp, port, pstate);
    }
  /* Undo the `list_offset' increments made above: `top - floor - 2' is
     how far the stack top has moved since entry.  */
skip_tail:
  pstate->list_offset -= pstate->top - floor - 2;
  goto end;

fancy_circref:
  pstate->list_offset -= pstate->top - floor - 2;

  /* EXP is a pair already on the reference stack: print a reference to
     it in place of the tail.  */
circref:
  scm_puts_unlocked (" . ", port);
  print_circref (port, pstate, exp);
  goto end;
}
1480 | ||
1481 | \f | |
1482 | ||
bb35f315 MV |
1483 | int |
1484 | scm_valid_oport_value_p (SCM val) | |
1485 | { | |
368cf54d GB |
1486 | return (SCM_OPOUTPORTP (val) |
1487 | || (SCM_PORT_WITH_PS_P (val) | |
1488 | && SCM_OPOUTPORTP (SCM_PORT_WITH_PS_PORT (val)))); | |
bb35f315 MV |
1489 | } |
1490 | ||
8b840115 | 1491 | /* SCM_GPROC(s_write, "write", 1, 1, 0, scm_write, g_write); */ |
1cc91f1b | 1492 | |
0f2d19dd | 1493 | SCM |
1bbd0b84 | 1494 | scm_write (SCM obj, SCM port) |
0f2d19dd JB |
1495 | { |
1496 | if (SCM_UNBNDP (port)) | |
9de87eea | 1497 | port = scm_current_output_port (); |
3eb7e6ee JB |
1498 | |
1499 | SCM_ASSERT (scm_valid_oport_value_p (port), port, SCM_ARG2, s_write); | |
bb35f315 | 1500 | |
215fe3a8 | 1501 | scm_dynwind_begin (0); |
92c0ebac | 1502 | scm_dynwind_lock_port (SCM_COERCE_OUTPORT (port)); |
a51ea417 | 1503 | scm_prin1 (obj, port, 1); |
215fe3a8 AW |
1504 | scm_dynwind_end (); |
1505 | ||
0f2d19dd JB |
1506 | return SCM_UNSPECIFIED; |
1507 | } | |
1508 | ||
1509 | ||
8b840115 | 1510 | /* SCM_GPROC(s_display, "display", 1, 1, 0, scm_display, g_display); */ |
1cc91f1b | 1511 | |
0f2d19dd | 1512 | SCM |
1bbd0b84 | 1513 | scm_display (SCM obj, SCM port) |
0f2d19dd JB |
1514 | { |
1515 | if (SCM_UNBNDP (port)) | |
9de87eea | 1516 | port = scm_current_output_port (); |
3eb7e6ee JB |
1517 | |
1518 | SCM_ASSERT (scm_valid_oport_value_p (port), port, SCM_ARG2, s_display); | |
bb35f315 | 1519 | |
215fe3a8 | 1520 | scm_dynwind_begin (0); |
92c0ebac | 1521 | scm_dynwind_lock_port (SCM_COERCE_OUTPORT (port)); |
a51ea417 | 1522 | scm_prin1 (obj, port, 0); |
215fe3a8 AW |
1523 | scm_dynwind_end (); |
1524 | ||
0f2d19dd JB |
1525 | return SCM_UNSPECIFIED; |
1526 | } | |
1527 | ||
70d63753 GB |
1528 | |
1529 | SCM_DEFINE (scm_simple_format, "simple-format", 2, 0, 1, | |
1530 | (SCM destination, SCM message, SCM args), | |
eca65e90 MG |
1531 | "Write @var{message} to @var{destination}, defaulting to\n" |
1532 | "the current output port.\n" | |
1533 | "@var{message} can contain @code{~A} (was @code{%s}) and\n" | |
1534 | "@code{~S} (was @code{%S}) escapes. When printed,\n" | |
1535 | "the escapes are replaced with corresponding members of\n" | |
b7e64f8b | 1536 | "@var{args}:\n" |
eca65e90 MG |
1537 | "@code{~A} formats using @code{display} and @code{~S} formats\n" |
1538 | "using @code{write}.\n" | |
1539 | "If @var{destination} is @code{#t}, then use the current output\n" | |
1540 | "port, if @var{destination} is @code{#f}, then return a string\n" | |
1541 | "containing the formatted text. Does not add a trailing newline.") | |
70d63753 GB |
1542 | #define FUNC_NAME s_scm_simple_format |
1543 | { | |
dfd03fb9 | 1544 | SCM port, answer = SCM_UNSPECIFIED; |
70d63753 GB |
1545 | int fReturnString = 0; |
1546 | int writingp; | |
889975e5 | 1547 | size_t start, p, end; |
70d63753 | 1548 | |
bc36d050 | 1549 | if (scm_is_eq (destination, SCM_BOOL_T)) |
daba1a71 | 1550 | { |
9de87eea | 1551 | destination = port = scm_current_output_port (); |
daba1a71 | 1552 | } |
7888309b | 1553 | else if (scm_is_false (destination)) |
daba1a71 MD |
1554 | { |
1555 | fReturnString = 1; | |
0b2c2ba3 | 1556 | port = scm_mkstrport (SCM_INUM0, SCM_BOOL_F, |
dfd03fb9 MD |
1557 | SCM_OPN | SCM_WRTNG, |
1558 | FUNC_NAME); | |
1559 | destination = port; | |
daba1a71 MD |
1560 | } |
1561 | else | |
1562 | { | |
1563 | SCM_VALIDATE_OPORT_VALUE (1, destination); | |
dfd03fb9 | 1564 | port = SCM_COERCE_OUTPORT (destination); |
daba1a71 MD |
1565 | } |
1566 | SCM_VALIDATE_STRING (2, message); | |
af45e3b0 | 1567 | SCM_VALIDATE_REST_ARGUMENT (args); |
70d63753 | 1568 | |
889975e5 MG |
1569 | p = 0; |
1570 | start = 0; | |
1571 | end = scm_i_string_length (message); | |
b24b5e13 | 1572 | for (p = start; p != end; ++p) |
889975e5 | 1573 | if (scm_i_string_ref (message, p) == '~') |
70d63753 | 1574 | { |
b24b5e13 | 1575 | if (++p == end) |
6662998f MV |
1576 | break; |
1577 | ||
889975e5 | 1578 | switch (scm_i_string_ref (message, p)) |
6662998f MV |
1579 | { |
1580 | case 'A': case 'a': | |
1581 | writingp = 0; | |
1582 | break; | |
1583 | case 'S': case 's': | |
1584 | writingp = 1; | |
1585 | break; | |
1586 | case '~': | |
889975e5 | 1587 | scm_lfwrite_substr (message, start, p, port); |
6662998f MV |
1588 | start = p + 1; |
1589 | continue; | |
1590 | case '%': | |
889975e5 | 1591 | scm_lfwrite_substr (message, start, p - 1, port); |
dfd03fb9 | 1592 | scm_newline (port); |
6662998f MV |
1593 | start = p + 1; |
1594 | continue; | |
1595 | default: | |
1afff620 | 1596 | SCM_MISC_ERROR ("FORMAT: Unsupported format option ~~~A - use (ice-9 format) instead", |
889975e5 | 1597 | scm_list_1 (SCM_MAKE_CHAR (scm_i_string_ref (message, p)))); |
6662998f MV |
1598 | |
1599 | } | |
70d63753 | 1600 | |
6662998f | 1601 | |
d2e53ed6 | 1602 | if (!scm_is_pair (args)) |
1afff620 | 1603 | SCM_MISC_ERROR ("FORMAT: Missing argument for ~~~A", |
889975e5 | 1604 | scm_list_1 (SCM_MAKE_CHAR (scm_i_string_ref (message, p)))); |
6662998f | 1605 | |
889975e5 | 1606 | scm_lfwrite_substr (message, start, p - 1, port); |
dfd03fb9 | 1607 | /* we pass destination here */ |
70d63753 GB |
1608 | scm_prin1 (SCM_CAR (args), destination, writingp); |
1609 | args = SCM_CDR (args); | |
1610 | start = p + 1; | |
1611 | } | |
6662998f | 1612 | |
889975e5 | 1613 | scm_lfwrite_substr (message, start, p, port); |
bc36d050 | 1614 | if (!scm_is_eq (args, SCM_EOL)) |
1afff620 KN |
1615 | SCM_MISC_ERROR ("FORMAT: ~A superfluous arguments", |
1616 | scm_list_1 (scm_length (args))); | |
70d63753 GB |
1617 | |
1618 | if (fReturnString) | |
1619 | answer = scm_strport_to_string (destination); | |
1620 | ||
daba1a71 | 1621 | return scm_return_first (answer, message); |
70d63753 GB |
1622 | } |
1623 | #undef FUNC_NAME | |
1624 | ||
1625 | ||
3b3b36dd | 1626 | SCM_DEFINE (scm_newline, "newline", 0, 1, 0, |
b450f070 | 1627 | (SCM port), |
8f85c0c6 NJ |
1628 | "Send a newline to @var{port}.\n" |
1629 | "If @var{port} is omitted, send to the current output port.") | |
1bbd0b84 | 1630 | #define FUNC_NAME s_scm_newline |
0f2d19dd JB |
1631 | { |
1632 | if (SCM_UNBNDP (port)) | |
9de87eea | 1633 | port = scm_current_output_port (); |
3eb7e6ee | 1634 | |
34d19ef6 | 1635 | SCM_VALIDATE_OPORT_VALUE (1, port); |
bb35f315 | 1636 | |
0607ebbf | 1637 | scm_putc_unlocked ('\n', SCM_COERCE_OUTPORT (port)); |
0f2d19dd JB |
1638 | return SCM_UNSPECIFIED; |
1639 | } | |
1bbd0b84 | 1640 | #undef FUNC_NAME |
0f2d19dd | 1641 | |
3b3b36dd | 1642 | SCM_DEFINE (scm_write_char, "write-char", 1, 1, 0, |
b450f070 | 1643 | (SCM chr, SCM port), |
eca65e90 | 1644 | "Send character @var{chr} to @var{port}.") |
1bbd0b84 | 1645 | #define FUNC_NAME s_scm_write_char |
0f2d19dd JB |
1646 | { |
1647 | if (SCM_UNBNDP (port)) | |
9de87eea | 1648 | port = scm_current_output_port (); |
3eb7e6ee | 1649 | |
34d19ef6 HWN |
1650 | SCM_VALIDATE_CHAR (1, chr); |
1651 | SCM_VALIDATE_OPORT_VALUE (2, port); | |
07f49ac7 LC |
1652 | |
1653 | port = SCM_COERCE_OUTPORT (port); | |
1654 | if (!display_character (SCM_CHAR (chr), port, | |
478848cb | 1655 | PORT_CONVERSION_HANDLER (port))) |
07f49ac7 LC |
1656 | scm_encoding_error (__func__, errno, |
1657 | "cannot convert to output locale", | |
6851d3be | 1658 | port, chr); |
07f49ac7 | 1659 | |
0f2d19dd JB |
1660 | return SCM_UNSPECIFIED; |
1661 | } | |
1bbd0b84 | 1662 | #undef FUNC_NAME |
0f2d19dd | 1663 | |
0f2d19dd JB |
1664 | \f |
1665 | ||
bb35f315 | 1666 | /* Call back to Scheme code to do the printing of special objects |
c19bc088 MD |
1667 | * (like structs). SCM_PRINTER_APPLY applies PROC to EXP and a smob |
1668 | * containing PORT and PSTATE. This object can be used as the port for | |
1669 | * display/write etc to continue the current print chain. The REVEALED | |
1670 | * field of PSTATE is set to true to indicate that the print state has | |
1671 | * escaped to Scheme and thus has to be freed by the GC. | |
1672 | */ | |
1673 | ||
92c2555f | 1674 | scm_t_bits scm_tc16_port_with_ps; |
c19bc088 MD |
1675 | |
1676 | /* Print exactly as the port itself would */ | |
1677 | ||
1678 | static int | |
e841c3e0 | 1679 | port_with_ps_print (SCM obj, SCM port, scm_print_state *pstate) |
c19bc088 MD |
1680 | { |
1681 | obj = SCM_PORT_WITH_PS_PORT (obj); | |
62bd5d66 | 1682 | return SCM_PORT_DESCRIPTOR (obj)->print (obj, port, pstate); |
c19bc088 | 1683 | } |
c4f37e80 MV |
1684 | |
1685 | SCM | |
1bbd0b84 | 1686 | scm_printer_apply (SCM proc, SCM exp, SCM port, scm_print_state *pstate) |
c4f37e80 | 1687 | { |
bb35f315 | 1688 | pstate->revealed = 1; |
dfd03fb9 MD |
1689 | return scm_call_2 (proc, exp, |
1690 | scm_i_port_with_print_state (port, pstate->handle)); | |
c19bc088 MD |
1691 | } |
1692 | ||
dfd03fb9 | 1693 | SCM_DEFINE (scm_port_with_print_state, "port-with-print-state", 1, 1, 0, |
1bbd0b84 | 1694 | (SCM port, SCM pstate), |
71331188 | 1695 | "Create a new port which behaves like @var{port}, but with an\n" |
dfd03fb9 MD |
1696 | "included print state @var{pstate}. @var{pstate} is optional.\n" |
1697 | "If @var{pstate} isn't supplied and @var{port} already has\n" | |
1698 | "a print state, the old print state is reused.") | |
1bbd0b84 | 1699 | #define FUNC_NAME s_scm_port_with_print_state |
c19bc088 | 1700 | { |
34d19ef6 | 1701 | SCM_VALIDATE_OPORT_VALUE (1, port); |
dfd03fb9 MD |
1702 | if (!SCM_UNBNDP (pstate)) |
1703 | SCM_VALIDATE_PRINTSTATE (2, pstate); | |
1704 | return scm_i_port_with_print_state (port, pstate); | |
c19bc088 | 1705 | } |
1bbd0b84 | 1706 | #undef FUNC_NAME |
c19bc088 | 1707 | |
a1ec6916 | 1708 | SCM_DEFINE (scm_get_print_state, "get-print-state", 1, 0, 0, |
1bbd0b84 | 1709 | (SCM port), |
71331188 MG |
1710 | "Return the print state of the port @var{port}. If @var{port}\n" |
1711 | "has no associated print state, @code{#f} is returned.") | |
1bbd0b84 | 1712 | #define FUNC_NAME s_scm_get_print_state |
c19bc088 | 1713 | { |
368cf54d GB |
1714 | if (SCM_PORT_WITH_PS_P (port)) |
1715 | return SCM_PORT_WITH_PS_PS (port); | |
f5f2dcff | 1716 | if (SCM_OUTPUT_PORT_P (port)) |
368cf54d | 1717 | return SCM_BOOL_F; |
276dd677 | 1718 | SCM_WRONG_TYPE_ARG (1, port); |
c4f37e80 | 1719 | } |
1bbd0b84 | 1720 | #undef FUNC_NAME |
bb35f315 | 1721 | |
c4f37e80 | 1722 | \f |
1cc91f1b | 1723 | |
0f2d19dd JB |
1724 | void |
1725 | scm_init_print () | |
0f2d19dd | 1726 | { |
231dd356 | 1727 | SCM type; |
d5cf5324 | 1728 | |
231dd356 AW |
1729 | type = scm_make_vtable (scm_from_locale_string (SCM_PRINT_STATE_LAYOUT), |
1730 | SCM_BOOL_F); | |
4a655e50 | 1731 | scm_set_struct_vtable_name_x (type, scm_from_latin1_symbol ("print-state")); |
bb35f315 | 1732 | scm_print_state_vtable = type; |
c4f37e80 | 1733 | |
c19bc088 MD |
1734 | /* Don't want to bind a wrapper class in GOOPS, so pass 0 as arg1. */ |
1735 | scm_tc16_port_with_ps = scm_make_smob_type (0, 0); | |
e841c3e0 | 1736 | scm_set_smob_print (scm_tc16_port_with_ps, port_with_ps_print); |
81ae25da | 1737 | |
a0599745 | 1738 | #include "libguile/print.x" |
475fa9a5 | 1739 | |
8500b186 AW |
1740 | scm_init_opts (scm_print_options, scm_print_opts); |
1741 | scm_print_opts[SCM_PRINT_HIGHLIGHT_PREFIX_I].val = | |
1742 | SCM_UNPACK (scm_from_locale_string ("{")); | |
1743 | scm_print_opts[SCM_PRINT_HIGHLIGHT_SUFFIX_I].val = | |
1744 | SCM_UNPACK (scm_from_locale_string ("}")); | |
475fa9a5 | 1745 | scm_print_opts[SCM_PRINT_KEYWORD_STYLE_I].val = SCM_UNPACK (sym_reader); |
0f2d19dd | 1746 | } |
89e00824 ML |
1747 | |
1748 | /* | |
1749 | Local Variables: | |
1750 | c-file-style: "gnu" | |
1751 | End: | |
1752 | */ |