Commit | Line | Data |
---|---|---|
4a655e50 | 1 | /* Copyright (C) 2006, 2007, 2008, 2009, 2010, 2011 Free Software Foundation, Inc. |
9361f762 MV |
2 | * |
3 | * This library is free software; you can redistribute it and/or | |
53befeb7 NJ |
4 | * modify it under the terms of the GNU Lesser General Public License |
5 | * as published by the Free Software Foundation; either version 3 of | |
6 | * the License, or (at your option) any later version. | |
9361f762 | 7 | * |
53befeb7 NJ |
8 | * This library is distributed in the hope that it will be useful, but |
9 | * WITHOUT ANY WARRANTY; without even the implied warranty of | |
9361f762 MV |
10 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
11 | * Lesser General Public License for more details. | |
12 | * | |
13 | * You should have received a copy of the GNU Lesser General Public | |
14 | * License along with this library; if not, write to the Free Software | |
53befeb7 NJ |
15 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA |
16 | * 02110-1301 USA | |
9361f762 MV |
17 | */ |
18 | ||
dbb605f5 | 19 | #ifdef HAVE_CONFIG_H |
9361f762 MV |
20 | # include <config.h> |
21 | #endif | |
22 | ||
f7439099 | 23 | #include <alloca.h> |
b89c4943 | 24 | |
9361f762 | 25 | #include "libguile/_scm.h" |
756e8a3a | 26 | #include "libguile/extensions.h" |
9361f762 MV |
27 | #include "libguile/feature.h" |
28 | #include "libguile/i18n.h" | |
29 | #include "libguile/strings.h" | |
b89c4943 | 30 | #include "libguile/chars.h" |
9361f762 | 31 | #include "libguile/dynwind.h" |
b89c4943 LC |
32 | #include "libguile/validate.h" |
33 | #include "libguile/values.h" | |
a2f00b9b | 34 | #include "libguile/threads.h" |
9361f762 | 35 | |
9361f762 | 36 | #include <locale.h> |
b89c4943 LC |
37 | #include <string.h> /* `strcoll ()' */ |
38 | #include <ctype.h> /* `toupper ()' et al. */ | |
39 | #include <errno.h> | |
5b878445 MG |
40 | #include <unicase.h> |
41 | #include <unistr.h> | |
9361f762 | 42 | |
b89c4943 | 43 | #if (defined HAVE_NEWLOCALE) && (defined HAVE_STRCOLL_L) |
a2f00b9b LC |
44 | /* The GNU thread-aware locale API is documented in ``Thread-Aware Locale |
45 | Model, a Proposal'', by Ulrich Drepper: | |
46 | ||
47 | http://people.redhat.com/drepper/tllocale.ps.gz | |
48 | ||
49 | It is now also implemented by Darwin: | |
50 | ||
51 | http://developer.apple.com/documentation/Darwin/Reference/ManPages/man3/newlocale.3.html | |
52 | ||
83fda470 LC |
53 | The whole API was eventually standardized in the ``Open Group Base |
54 | Specifications Issue 7'' (aka. "POSIX 2008"): | |
55 | ||
56 | http://www.opengroup.org/onlinepubs/9699919799/basedefs/locale.h.html */ | |
b89c4943 | 57 | # define USE_GNU_LOCALE_API |
9361f762 | 58 | #endif |
b89c4943 | 59 | |
a2f00b9b LC |
60 | #include "libguile/posix.h" /* for `scm_i_locale_mutex' */ |
61 | ||
56d288b8 | 62 | #ifdef HAVE_LANGINFO_H |
a2f00b9b | 63 | # include <langinfo.h> |
56d288b8 LC |
64 | #endif |
65 | #ifdef HAVE_NL_TYPES_H | |
a2f00b9b | 66 | # include <nl_types.h> |
9361f762 | 67 | #endif |
56d288b8 LC |
68 | #ifndef HAVE_NL_ITEM |
69 | /* Cygwin has <langinfo.h> but lacks <nl_types.h> and `nl_item'. */ | |
70 | typedef int nl_item; | |
71 | #endif | |
b89c4943 LC |
72 | |
#ifndef HAVE_SETLOCALE
/* Stand-in used when the platform provides no `setlocale ()'.  CATEGORY
   and NAME are ignored: the call always fails, returning NULL with `errno'
   set to ENOSYS.  */
static inline char *
setlocale (int category, const char *name)
{
  (void) category;
  (void) name;

  return (errno = ENOSYS, (char *) NULL);
}
#endif
b89c4943 | 81 | |
a2f00b9b LC |
82 | /* Helper stringification macro. */ |
83 | #define SCM_I18N_STRINGIFY(_name) # _name | |
84 | ||
b89c4943 LC |
85 | |
86 | \f | |
/* Locale objects, string and character collation, and other locale-dependent
   string operations.

   A large part of the code here deals with emulating glibc's reentrant
   locale API on non-GNU systems.  The emulation is a bit "brute-force":
   whenever a `-locale<?' procedure is passed a locale object, then:

   1. The `scm_i_locale_mutex' is locked.
   2. A series of `setlocale ()' calls is performed to store the current
      locale for each category in an `scm_t_locale_settings' object.
   3. A series of `setlocale ()' calls is made to install each of the locale
      categories of each of the base locales of each locale object,
      recursively, starting from the last locale object of the chain.
   4. The locale-dependent operation itself is run.
   5. The settings captured in step (2) are restored.
   6. The `scm_i_locale_mutex' is released.

   Hopefully, the X/Open standard will eventually make this hack useless.

   Note: We don't wrap glibc's `uselocale ()' call because it sets the locale
   of the current _thread_ (unlike `setlocale ()') and doing so would require
   maintaining per-thread locale information on non-GNU systems and always
   re-installing this locale upon locale-dependent calls.  */
109 | ||
110 | ||
a2f00b9b LC |
111 | /* Return the category mask corresponding to CAT. */ |
112 | #define SCM_LOCALE_CATEGORY_MASK(_cat) LC_ ## _cat ## _MASK | |
113 | ||
114 | ||
b89c4943 LC |
115 | #ifndef USE_GNU_LOCALE_API |
116 | ||
a2f00b9b LC |
117 | /* Provide the locale category masks as found in glibc. This must be kept in |
118 | sync with `locale-categories.h'. */ | |
b89c4943 | 119 | |
a2f00b9b LC |
/* Categories that are always available: one bit each.  */
# define LC_CTYPE_MASK            (1 << 0)
# define LC_COLLATE_MASK          (1 << 1)
# define LC_MESSAGES_MASK         (1 << 2)
# define LC_MONETARY_MASK         (1 << 3)
# define LC_NUMERIC_MASK          (1 << 4)
# define LC_TIME_MASK             (1 << 5)

/* Optional categories: the bit is only handed out when the corresponding
   `LC_' constant exists; otherwise the mask is empty so that it has no
   effect when OR'ed or tested.  */
# if defined LC_PAPER
#  define LC_PAPER_MASK           (1 << 6)
# else
#  define LC_PAPER_MASK           0
# endif

# if defined LC_NAME
#  define LC_NAME_MASK            (1 << 7)
# else
#  define LC_NAME_MASK            0
# endif

# if defined LC_ADDRESS
#  define LC_ADDRESS_MASK         (1 << 8)
# else
#  define LC_ADDRESS_MASK         0
# endif

# if defined LC_TELEPHONE
#  define LC_TELEPHONE_MASK       (1 << 9)
# else
#  define LC_TELEPHONE_MASK       0
# endif

# if defined LC_MEASUREMENT
#  define LC_MEASUREMENT_MASK     (1 << 10)
# else
#  define LC_MEASUREMENT_MASK     0
# endif

# if defined LC_IDENTIFICATION
#  define LC_IDENTIFICATION_MASK  (1 << 11)
# else
#  define LC_IDENTIFICATION_MASK  0
# endif

/* Union of every category mask defined above.  */
# define LC_ALL_MASK                                            \
  (LC_CTYPE_MASK | LC_NUMERIC_MASK | LC_TIME_MASK               \
   | LC_COLLATE_MASK | LC_MONETARY_MASK | LC_MESSAGES_MASK      \
   | LC_PAPER_MASK | LC_NAME_MASK | LC_ADDRESS_MASK             \
   | LC_TELEPHONE_MASK | LC_MEASUREMENT_MASK                    \
   | LC_IDENTIFICATION_MASK)
171 | ||
172 | /* Locale objects as returned by `make-locale' on non-GNU systems. */ | |
173 | typedef struct scm_locale | |
174 | { | |
175 | SCM base_locale; /* a `locale' object */ | |
176 | char *locale_name; | |
177 | int category_mask; | |
178 | } *scm_t_locale; | |
179 | ||
a2f00b9b LC |
180 | |
181 | /* Free the resources used by LOCALE. */ | |
182 | static inline void | |
183 | scm_i_locale_free (scm_t_locale locale) | |
184 | { | |
185 | free (locale->locale_name); | |
186 | locale->locale_name = NULL; | |
187 | } | |
188 | ||
189 | #else /* USE_GNU_LOCALE_API */ | |
b89c4943 LC |
190 | |
191 | /* Alias for glibc's locale type. */ | |
192 | typedef locale_t scm_t_locale; | |
193 | ||
a2f00b9b LC |
194 | #define scm_i_locale_free freelocale |
195 | ||
196 | #endif /* USE_GNU_LOCALE_API */ | |
197 | ||
198 | ||
199 | /* A locale object denoting the global locale. */ | |
200 | SCM_GLOBAL_VARIABLE (scm_global_locale, "%global-locale"); | |
201 | ||
b89c4943 LC |
202 | |
/* Check that _ARG (argument number _POS) is a locale SMOB and store the C
   locale object it carries into _C_LOCALE.  */
#define SCM_VALIDATE_LOCALE_COPY(_pos, _arg, _c_locale)                 \
  do {                                                                  \
    SCM_VALIDATE_SMOB ((_pos), (_arg), locale_smob_type);               \
    (_c_locale) = (scm_t_locale) SCM_SMOB_DATA (_arg);                  \
  } while (0)
212 | ||
/* Validate optional parameter _ARG (argument number _POS) as either
   undefined or bound to a locale object.  Set _C_LOCALE to the
   corresponding C locale object, or to NULL when _ARG was not supplied.

   The "not supplied" test goes through `scm_is_eq ()' rather than a raw
   `!=' so that it remains valid whatever the C representation of `SCM'
   is.  */
#define SCM_VALIDATE_OPTIONAL_LOCALE_COPY(_pos, _arg, _c_locale)        \
  do                                                                    \
    {                                                                   \
      if (!scm_is_eq ((_arg), SCM_UNDEFINED))                           \
        SCM_VALIDATE_LOCALE_COPY (_pos, _arg, _c_locale);               \
      else                                                              \
        (_c_locale) = NULL;                                             \
    }                                                                   \
  while (0)
224 | ||
225 | ||
226 | SCM_SMOB (scm_tc16_locale_smob_type, "locale", 0); | |
227 | ||
228 | SCM_SMOB_FREE (scm_tc16_locale_smob_type, smob_locale_free, locale) | |
229 | { | |
230 | scm_t_locale c_locale; | |
231 | ||
a2f00b9b LC |
232 | c_locale = (scm_t_locale) SCM_SMOB_DATA (locale); |
233 | scm_i_locale_free (c_locale); | |
b89c4943 LC |
234 | |
235 | return 0; | |
236 | } | |
237 | ||
9361f762 | 238 | |
a2f00b9b | 239 | static void inline scm_locale_error (const char *, int) SCM_NORETURN; |
b89c4943 | 240 | |
a2f00b9b LC |
241 | /* Throw an exception corresponding to error ERR. */ |
242 | static void inline | |
243 | scm_locale_error (const char *func_name, int err) | |
244 | { | |
245 | scm_syserror_msg (func_name, | |
246 | "Failed to install locale", | |
247 | SCM_EOL, err); | |
b89c4943 | 248 | } |
b89c4943 LC |
249 | |
250 | ||
251 | \f | |
a2f00b9b LC |
252 | /* Emulating GNU's reentrant locale API. */ |
253 | #ifndef USE_GNU_LOCALE_API | |
b89c4943 LC |
254 | |
255 | ||
256 | /* Maximum number of chained locales (via `base_locale'). */ | |
257 | #define LOCALE_STACK_SIZE_MAX 256 | |
258 | ||
259 | typedef struct | |
260 | { | |
261 | #define SCM_DEFINE_LOCALE_CATEGORY(_name) char * _name; | |
262 | #include "locale-categories.h" | |
263 | #undef SCM_DEFINE_LOCALE_CATEGORY | |
264 | } scm_t_locale_settings; | |
265 | ||
266 | /* Fill out SETTINGS according to the current locale settings. On success | |
267 | zero is returned and SETTINGS is properly initialized. */ | |
268 | static int | |
269 | get_current_locale_settings (scm_t_locale_settings *settings) | |
270 | { | |
271 | const char *locale_name; | |
272 | ||
273 | #define SCM_DEFINE_LOCALE_CATEGORY(_name) \ | |
274 | { \ | |
275 | SCM_SYSCALL (locale_name = setlocale (LC_ ## _name, NULL)); \ | |
a2f00b9b | 276 | if (locale_name == NULL) \ |
b89c4943 LC |
277 | goto handle_error; \ |
278 | \ | |
279 | settings-> _name = strdup (locale_name); \ | |
280 | if (settings-> _name == NULL) \ | |
281 | goto handle_oom; \ | |
282 | } | |
283 | ||
284 | #include "locale-categories.h" | |
285 | #undef SCM_DEFINE_LOCALE_CATEGORY | |
286 | ||
287 | return 0; | |
288 | ||
289 | handle_error: | |
a2f00b9b | 290 | return EINVAL; |
9361f762 | 291 | |
b89c4943 LC |
292 | handle_oom: |
293 | return ENOMEM; | |
294 | } | |
295 | ||
296 | /* Restore locale settings SETTINGS. On success, return zero. */ | |
297 | static int | |
298 | restore_locale_settings (const scm_t_locale_settings *settings) | |
299 | { | |
300 | const char *result; | |
301 | ||
302 | #define SCM_DEFINE_LOCALE_CATEGORY(_name) \ | |
303 | SCM_SYSCALL (result = setlocale (LC_ ## _name, settings-> _name)); \ | |
304 | if (result == NULL) \ | |
305 | goto handle_error; | |
306 | ||
307 | #include "locale-categories.h" | |
308 | #undef SCM_DEFINE_LOCALE_CATEGORY | |
309 | ||
310 | return 0; | |
311 | ||
312 | handle_error: | |
a2f00b9b | 313 | return EINVAL; |
b89c4943 LC |
314 | } |
315 | ||
316 | /* Free memory associated with SETTINGS. */ | |
317 | static void | |
318 | free_locale_settings (scm_t_locale_settings *settings) | |
319 | { | |
320 | #define SCM_DEFINE_LOCALE_CATEGORY(_name) \ | |
321 | free (settings-> _name); \ | |
322 | settings->_name = NULL; | |
323 | #include "locale-categories.h" | |
324 | #undef SCM_DEFINE_LOCALE_CATEGORY | |
325 | } | |
9361f762 | 326 | |
b89c4943 LC |
327 | /* Install the locale named LOCALE_NAME for all the categories listed in |
328 | CATEGORY_MASK. */ | |
329 | static int | |
330 | install_locale_categories (const char *locale_name, int category_mask) | |
331 | { | |
332 | const char *result; | |
9361f762 | 333 | |
b89c4943 | 334 | if (category_mask == LC_ALL_MASK) |
9361f762 | 335 | { |
b89c4943 LC |
336 | SCM_SYSCALL (result = setlocale (LC_ALL, locale_name)); |
337 | if (result == NULL) | |
338 | goto handle_error; | |
9361f762 MV |
339 | } |
340 | else | |
341 | { | |
b89c4943 | 342 | #define SCM_DEFINE_LOCALE_CATEGORY(_name) \ |
a2f00b9b | 343 | if (category_mask & SCM_LOCALE_CATEGORY_MASK (_name)) \ |
b89c4943 LC |
344 | { \ |
345 | SCM_SYSCALL (result = setlocale (LC_ ## _name, locale_name)); \ | |
346 | if (result == NULL) \ | |
347 | goto handle_error; \ | |
348 | } | |
349 | #include "locale-categories.h" | |
350 | #undef SCM_DEFINE_LOCALE_CATEGORY | |
351 | } | |
9361f762 | 352 | |
b89c4943 | 353 | return 0; |
9361f762 | 354 | |
b89c4943 | 355 | handle_error: |
a2f00b9b | 356 | return EINVAL; |
b89c4943 LC |
357 | } |
358 | ||
359 | /* Install LOCALE, recursively installing its base locales first. On | |
360 | success, zero is returned. */ | |
361 | static int | |
362 | install_locale (scm_t_locale locale) | |
363 | { | |
364 | scm_t_locale stack[LOCALE_STACK_SIZE_MAX]; | |
a2f00b9b | 365 | int category_mask = 0; |
b89c4943 LC |
366 | size_t stack_size = 0; |
367 | int stack_offset = 0; | |
368 | const char *result = NULL; | |
369 | ||
370 | /* Build up a locale stack by traversing the `base_locale' link. */ | |
371 | do | |
372 | { | |
373 | if (stack_size >= LOCALE_STACK_SIZE_MAX) | |
374 | /* We cannot use `scm_error ()' here because otherwise the locale | |
375 | mutex may remain locked. */ | |
376 | return EINVAL; | |
377 | ||
378 | stack[stack_size++] = locale; | |
379 | ||
a2f00b9b LC |
380 | /* Keep track of which categories have already been taken into |
381 | account. */ | |
382 | category_mask |= locale->category_mask; | |
383 | ||
b89c4943 | 384 | if (locale->base_locale != SCM_UNDEFINED) |
a2f00b9b | 385 | locale = (scm_t_locale) SCM_SMOB_DATA (locale->base_locale); |
9361f762 | 386 | else |
b89c4943 LC |
387 | locale = NULL; |
388 | } | |
a2f00b9b | 389 | while ((locale != NULL) && (category_mask != LC_ALL_MASK)); |
9361f762 | 390 | |
b89c4943 LC |
391 | /* Install the C locale to start from a pristine state. */ |
392 | SCM_SYSCALL (result = setlocale (LC_ALL, "C")); | |
393 | if (result == NULL) | |
394 | goto handle_error; | |
395 | ||
396 | /* Install the locales in reverse order. */ | |
397 | for (stack_offset = stack_size - 1; | |
398 | stack_offset >= 0; | |
399 | stack_offset--) | |
400 | { | |
401 | int err; | |
402 | scm_t_locale locale; | |
403 | ||
404 | locale = stack[stack_offset]; | |
405 | err = install_locale_categories (locale->locale_name, | |
406 | locale->category_mask); | |
407 | if (err) | |
408 | goto handle_error; | |
9361f762 MV |
409 | } |
410 | ||
b89c4943 | 411 | return 0; |
9361f762 | 412 | |
b89c4943 | 413 | handle_error: |
a2f00b9b | 414 | return EINVAL; |
9361f762 | 415 | } |
9361f762 | 416 | |
b89c4943 LC |
417 | /* Leave the locked locale section. */ |
418 | static inline void | |
419 | leave_locale_section (const scm_t_locale_settings *settings) | |
420 | { | |
421 | /* Restore the previous locale settings. */ | |
422 | (void)restore_locale_settings (settings); | |
423 | ||
424 | scm_i_pthread_mutex_unlock (&scm_i_locale_mutex); | |
425 | } | |
9361f762 | 426 | |
b89c4943 LC |
427 | /* Enter a locked locale section. */ |
428 | static inline int | |
429 | enter_locale_section (scm_t_locale locale, | |
430 | scm_t_locale_settings *prev_locale) | |
9361f762 | 431 | { |
b89c4943 LC |
432 | int err; |
433 | ||
434 | scm_i_pthread_mutex_lock (&scm_i_locale_mutex); | |
435 | ||
436 | err = get_current_locale_settings (prev_locale); | |
437 | if (err) | |
438 | { | |
439 | scm_i_pthread_mutex_unlock (&scm_i_locale_mutex); | |
440 | return err; | |
441 | } | |
9361f762 | 442 | |
b89c4943 LC |
443 | err = install_locale (locale); |
444 | if (err) | |
445 | { | |
446 | leave_locale_section (prev_locale); | |
447 | free_locale_settings (prev_locale); | |
448 | } | |
449 | ||
450 | return err; | |
451 | } | |
452 | ||
b89c4943 LC |
/* Execute _STATEMENT with _C_LOCALE installed as the process locale, then
   restore the previous locale.  If the locale cannot be installed,
   `scm_locale_error ()' is called with FUNC_NAME and _STATEMENT is not
   run.  _STATEMENT runs while the locale mutex is held.  */
#define RUN_IN_LOCALE_SECTION(_c_locale, _statement)                      \
  do                                                                      \
    {                                                                     \
      scm_t_locale_settings lsec_prev_locale;                             \
      int lsec_err = enter_locale_section ((_c_locale),                   \
                                           &lsec_prev_locale);            \
                                                                          \
      if (lsec_err == 0)                                                  \
        {                                                                 \
          _statement ;                                                    \
                                                                          \
          leave_locale_section (&lsec_prev_locale);                       \
          free_locale_settings (&lsec_prev_locale);                       \
        }                                                                 \
      else                                                                \
        scm_locale_error (FUNC_NAME, lsec_err);                           \
    }                                                                     \
  while (0)
472 | ||
a2f00b9b LC |
473 | /* Convert the current locale settings into a locale SMOB. On success, zero |
474 | is returned and RESULT points to the new SMOB. Otherwise, an error is | |
475 | returned. */ | |
476 | static int | |
477 | get_current_locale (SCM *result) | |
478 | { | |
479 | int err = 0; | |
480 | scm_t_locale c_locale; | |
481 | const char *current_locale; | |
482 | ||
483 | c_locale = scm_gc_malloc (sizeof (* c_locale), "locale"); | |
484 | ||
485 | ||
486 | scm_i_pthread_mutex_lock (&scm_i_locale_mutex); | |
487 | ||
488 | c_locale->category_mask = LC_ALL_MASK; | |
489 | c_locale->base_locale = SCM_UNDEFINED; | |
490 | ||
491 | current_locale = setlocale (LC_ALL, NULL); | |
492 | if (current_locale != NULL) | |
493 | { | |
494 | c_locale->locale_name = strdup (current_locale); | |
495 | if (c_locale->locale_name == NULL) | |
496 | err = ENOMEM; | |
497 | } | |
498 | else | |
499 | err = EINVAL; | |
500 | ||
501 | scm_i_pthread_mutex_unlock (&scm_i_locale_mutex); | |
502 | ||
503 | if (err) | |
504 | scm_gc_free (c_locale, sizeof (* c_locale), "locale"); | |
505 | else | |
506 | SCM_NEWSMOB (*result, scm_tc16_locale_smob_type, c_locale); | |
507 | ||
508 | return err; | |
509 | } | |
510 | ||
5b878445 | 511 | #else /* USE_GNU_LOCALE_API */ |
a2f00b9b | 512 | |
/* Execute _STATEMENT with _C_LOCALE installed through `uselocale ()', then
   re-install whatever locale `uselocale ()' reported as previously in
   use.  */
#define RUN_IN_LOCALE_SECTION(_c_locale, _statement)                      \
  do                                                                      \
    {                                                                     \
      scm_t_locale old_loc = uselocale (_c_locale);                       \
                                                                          \
      _statement ;                                                        \
                                                                          \
      uselocale (old_loc);                                                \
    }                                                                     \
  while (0)
524 | ||
525 | ||
526 | #endif /* USE_GNU_LOCALE_API */ | |
9361f762 | 527 | |
a2f00b9b LC |
528 | |
529 | \f | |
530 | /* `make-locale' can take either category lists or single categories (the | |
531 | `LC_*' integer constants). */ | |
532 | #define SCM_LIST_OR_INTEGER_P(arg) \ | |
533 | (scm_is_integer (arg) || scm_is_true (scm_list_p (arg))) | |
534 | ||
535 | ||
536 | /* Return the category mask corresponding to CATEGORY (an `LC_' integer | |
537 | constant). */ | |
538 | static inline int | |
539 | category_to_category_mask (SCM category, | |
540 | const char *func_name, int pos) | |
541 | { | |
542 | int c_category; | |
543 | int c_category_mask; | |
544 | ||
545 | c_category = scm_to_int (category); | |
546 | ||
547 | #define SCM_DEFINE_LOCALE_CATEGORY(_name) \ | |
548 | case LC_ ## _name: \ | |
549 | c_category_mask = SCM_LOCALE_CATEGORY_MASK (_name); \ | |
550 | break; | |
551 | ||
552 | switch (c_category) | |
553 | { | |
554 | #include "locale-categories.h" | |
555 | ||
556 | case LC_ALL: | |
557 | c_category_mask = LC_ALL_MASK; | |
558 | break; | |
559 | ||
560 | default: | |
561 | scm_wrong_type_arg_msg (func_name, pos, category, | |
562 | "locale category"); | |
563 | } | |
564 | ||
565 | #undef SCM_DEFINE_LOCALE_CATEGORY | |
566 | ||
567 | return c_category_mask; | |
568 | } | |
569 | ||
570 | /* Convert CATEGORIES, a list of locale categories or a single category (an | |
571 | integer), into a category mask. */ | |
572 | static int | |
573 | category_list_to_category_mask (SCM categories, | |
574 | const char *func_name, int pos) | |
575 | { | |
576 | int c_category_mask = 0; | |
577 | ||
578 | if (scm_is_integer (categories)) | |
579 | c_category_mask = category_to_category_mask (categories, | |
580 | func_name, pos); | |
581 | else | |
582 | for (; !scm_is_null (categories); categories = SCM_CDR (categories)) | |
583 | { | |
584 | SCM category = SCM_CAR (categories); | |
585 | ||
586 | c_category_mask |= | |
587 | category_to_category_mask (category, func_name, pos); | |
588 | } | |
589 | ||
590 | return c_category_mask; | |
591 | } | |
592 | ||
593 | ||
594 | SCM_DEFINE (scm_make_locale, "make-locale", 2, 1, 0, | |
595 | (SCM category_list, SCM locale_name, SCM base_locale), | |
596 | "Return a reference to a data structure representing a set of " | |
597 | "locale datasets. @var{category_list} should be either a list " | |
598 | "of locale categories or a single category as used with " | |
599 | "@code{setlocale} (@pxref{Locales, @code{setlocale}}) and " | |
600 | "@var{locale_name} should be the name of the locale considered " | |
601 | "(e.g., @code{\"sl_SI\"}). Optionally, if @code{base_locale} is " | |
602 | "passed, it should be a locale object denoting settings for " | |
603 | "categories not listed in @var{category_list}.") | |
604 | #define FUNC_NAME s_scm_make_locale | |
605 | { | |
606 | SCM locale = SCM_BOOL_F; | |
607 | int err = 0; | |
608 | int c_category_mask; | |
609 | char *c_locale_name; | |
610 | scm_t_locale c_base_locale, c_locale; | |
611 | ||
612 | SCM_MAKE_VALIDATE (1, category_list, LIST_OR_INTEGER_P); | |
613 | SCM_VALIDATE_STRING (2, locale_name); | |
614 | SCM_VALIDATE_OPTIONAL_LOCALE_COPY (3, base_locale, c_base_locale); | |
615 | ||
616 | c_category_mask = category_list_to_category_mask (category_list, | |
617 | FUNC_NAME, 1); | |
618 | c_locale_name = scm_to_locale_string (locale_name); | |
619 | ||
620 | #ifdef USE_GNU_LOCALE_API | |
621 | ||
622 | if (scm_is_eq (base_locale, SCM_VARIABLE_REF (scm_global_locale))) | |
c3b16a5d | 623 | c_base_locale = LC_GLOBAL_LOCALE; |
a2f00b9b | 624 | |
c3b16a5d | 625 | if (c_base_locale != (locale_t) 0) |
a2f00b9b LC |
626 | { |
627 | /* C_BASE_LOCALE is to be consumed by `newlocale ()' so it needs to be | |
628 | duplicated before. */ | |
629 | c_base_locale = duplocale (c_base_locale); | |
c3b16a5d | 630 | |
a2f00b9b LC |
631 | if (c_base_locale == (locale_t) 0) |
632 | { | |
633 | err = errno; | |
634 | goto fail; | |
635 | } | |
636 | } | |
637 | ||
638 | c_locale = newlocale (c_category_mask, c_locale_name, c_base_locale); | |
639 | ||
640 | free (c_locale_name); | |
641 | ||
642 | if (c_locale == (locale_t) 0) | |
643 | { | |
c3b16a5d | 644 | if (c_base_locale != (locale_t) 0) |
a2f00b9b | 645 | freelocale (c_base_locale); |
a2f00b9b LC |
646 | scm_locale_error (FUNC_NAME, errno); |
647 | } | |
648 | else | |
649 | SCM_NEWSMOB (locale, scm_tc16_locale_smob_type, c_locale); | |
650 | ||
651 | #else | |
652 | ||
653 | c_locale = scm_gc_malloc (sizeof (* c_locale), "locale"); | |
654 | ||
655 | c_locale->category_mask = c_category_mask; | |
656 | c_locale->locale_name = c_locale_name; | |
657 | ||
658 | if (scm_is_eq (base_locale, SCM_VARIABLE_REF (scm_global_locale))) | |
659 | { | |
660 | /* Get the current locale settings and turn them into a locale | |
661 | object. */ | |
662 | err = get_current_locale (&base_locale); | |
663 | if (err) | |
664 | goto fail; | |
665 | } | |
666 | ||
667 | c_locale->base_locale = base_locale; | |
668 | ||
669 | { | |
670 | /* Try out the new locale and raise an exception if it doesn't work. */ | |
671 | int err; | |
672 | scm_t_locale_settings prev_locale; | |
673 | ||
674 | err = enter_locale_section (c_locale, &prev_locale); | |
a2f00b9b LC |
675 | |
676 | if (err) | |
677 | goto fail; | |
678 | else | |
1445e449 LC |
679 | { |
680 | leave_locale_section (&prev_locale); | |
681 | SCM_NEWSMOB (locale, scm_tc16_locale_smob_type, c_locale); | |
682 | } | |
a2f00b9b LC |
683 | } |
684 | ||
685 | #endif | |
686 | ||
687 | return locale; | |
688 | ||
689 | fail: | |
690 | #ifndef USE_GNU_LOCALE_API | |
691 | scm_gc_free (c_locale, sizeof (* c_locale), "locale"); | |
692 | #endif | |
693 | free (c_locale_name); | |
694 | scm_locale_error (FUNC_NAME, err); | |
695 | ||
696 | return SCM_BOOL_F; | |
697 | } | |
698 | #undef FUNC_NAME | |
699 | ||
700 | SCM_DEFINE (scm_locale_p, "locale?", 1, 0, 0, | |
701 | (SCM obj), | |
702 | "Return true if @var{obj} is a locale object.") | |
703 | #define FUNC_NAME s_scm_locale_p | |
704 | { | |
705 | return scm_from_bool (SCM_SMOB_PREDICATE (scm_tc16_locale_smob_type, obj)); | |
706 | } | |
707 | #undef FUNC_NAME | |
708 | ||
709 | ||
b89c4943 | 710 | \f |
a2f00b9b LC |
711 | /* Locale-dependent string comparison. |
712 | ||
713 | A similar API can be found in MzScheme starting from version 200: | |
714 | http://download.plt-scheme.org/chronology/mzmr200alpha14.html . */ | |
715 | ||
df047aa2 LC |
/* Make C_S1 point to the contents of Scheme string S1 as an array of
   `scm_t_wchar'.

   For a narrow string, a zero-terminated copy is built in an `alloca ()'
   buffer, widening each byte as an unsigned value; the buffer therefore
   lives until the calling function returns.  For a wide string, C_S1
   simply aliases the string's own character storage.

   The macro's temporaries carry a `u32buf_' prefix and the arguments are
   parenthesized so that callers may pass arbitrary lvalues, including
   variables named `i', `len' or `buf'.  */
#define SCM_STRING_TO_U32_BUF(s1, c_s1)                                   \
  do                                                                      \
    {                                                                     \
      if (scm_i_is_narrow_string (s1))                                    \
        {                                                                 \
          size_t u32buf_i, u32buf_len;                                    \
          const char *u32buf_src = scm_i_string_chars (s1);               \
                                                                          \
          u32buf_len = scm_i_string_length (s1);                          \
          (c_s1) = alloca (sizeof (scm_t_wchar) * (u32buf_len + 1));      \
                                                                          \
          for (u32buf_i = 0; u32buf_i < u32buf_len; u32buf_i ++)          \
            (c_s1)[u32buf_i] = (unsigned char) u32buf_src[u32buf_i];      \
          (c_s1)[u32buf_len] = 0;                                         \
        }                                                                 \
      else                                                                \
        (c_s1) = (scm_t_wchar *) scm_i_string_wide_chars (s1);            \
    }                                                                     \
  while (0)
734 | ||
735 | ||
736 | /* Compare UTF-32 strings according to LOCALE. Returns a negative value if | |
737 | S1 compares smaller than S2, a positive value if S1 compares larger than | |
738 | S2, or 0 if they compare equal. */ | |
b89c4943 | 739 | static inline int |
5b878445 | 740 | compare_u32_strings (SCM s1, SCM s2, SCM locale, const char *func_name) |
b89c4943 LC |
741 | #define FUNC_NAME func_name |
742 | { | |
743 | int result; | |
744 | scm_t_locale c_locale; | |
5b878445 MG |
745 | scm_t_wchar *c_s1, *c_s2; |
746 | SCM_VALIDATE_OPTIONAL_LOCALE_COPY (3, locale, c_locale); | |
747 | ||
748 | SCM_STRING_TO_U32_BUF (s1, c_s1); | |
749 | SCM_STRING_TO_U32_BUF (s2, c_s2); | |
750 | ||
751 | if (c_locale) | |
752 | RUN_IN_LOCALE_SECTION (c_locale, | |
753 | result = u32_strcoll ((const scm_t_uint32 *) c_s1, | |
754 | (const scm_t_uint32 *) c_s2)); | |
755 | else | |
cdf52ff0 LC |
756 | result = u32_strcoll ((const scm_t_uint32 *) c_s1, |
757 | (const scm_t_uint32 *) c_s2); | |
5b878445 | 758 | |
5b878445 MG |
759 | scm_remember_upto_here_2 (s1, s2); |
760 | scm_remember_upto_here (locale); | |
761 | return result; | |
762 | } | |
763 | #undef FUNC_NAME | |
764 | ||
aafb5062 MG |
/* Return the language of the current locale, as reported by
   libunistring's `uc_locale_language ()'.  */
static const char *
locale_language (void)
{
  /* FIXME: If the locale has been set with 'uselocale',
     libunistring's uc_locale_language will return the incorrect
     language: it will return the language appropriate for the global
     (non-thread-specific) locale.

     There appears to be no portable way to extract the language from
     the thread-specific locale_t.  There is no LANGUAGE capability in
     nl_langinfo or nl_langinfo_l.

     Thus, uc_locale_language needs to be fixed upstream.  */
  return uc_locale_language ();
}
781 | ||
5b878445 | 782 | static inline int |
aafb5062 | 783 | u32_locale_casecoll (const char *func_name, const scm_t_uint32 *c_s1, |
c543e41e LC |
784 | const scm_t_uint32 *c_s2, |
785 | int *result) | |
5b878445 | 786 | { |
c543e41e LC |
787 | /* Note: Since this is called from `RUN_IN_LOCALE_SECTION', it must note |
788 | make any non-local exit. */ | |
5b878445 | 789 | |
c543e41e | 790 | int ret; |
aafb5062 | 791 | const char *loc = locale_language (); |
5b878445 | 792 | |
aafb5062 | 793 | ret = u32_casecoll (c_s1, u32_strlen (c_s1), |
5b878445 | 794 | c_s2, u32_strlen (c_s2), |
c543e41e | 795 | loc, UNINORM_NFC, result); |
5b878445 | 796 | |
c543e41e | 797 | return ret == 0 ? ret : errno; |
5b878445 MG |
798 | } |
799 | ||
800 | static inline int | |
801 | compare_u32_strings_ci (SCM s1, SCM s2, SCM locale, const char *func_name) | |
802 | #define FUNC_NAME func_name | |
803 | { | |
c543e41e | 804 | int result, ret = 0; |
5b878445 MG |
805 | scm_t_locale c_locale; |
806 | scm_t_wchar *c_s1, *c_s2; | |
b89c4943 | 807 | SCM_VALIDATE_OPTIONAL_LOCALE_COPY (3, locale, c_locale); |
9361f762 | 808 | |
5b878445 MG |
809 | SCM_STRING_TO_U32_BUF (s1, c_s1); |
810 | SCM_STRING_TO_U32_BUF (s2, c_s2); | |
811 | ||
b89c4943 | 812 | if (c_locale) |
cdf52ff0 LC |
813 | RUN_IN_LOCALE_SECTION |
814 | (c_locale, | |
c543e41e | 815 | ret = u32_locale_casecoll (func_name, |
cdf52ff0 | 816 | (const scm_t_uint32 *) c_s1, |
c543e41e LC |
817 | (const scm_t_uint32 *) c_s2, |
818 | &result)); | |
819 | else | |
820 | ret = u32_locale_casecoll (func_name, | |
821 | (const scm_t_uint32 *) c_s1, | |
822 | (const scm_t_uint32 *) c_s2, | |
823 | &result); | |
824 | ||
825 | if (SCM_UNLIKELY (ret != 0)) | |
826 | { | |
827 | errno = ret; | |
828 | scm_syserror (FUNC_NAME); | |
829 | } | |
b89c4943 | 830 | |
5b878445 MG |
831 | scm_remember_upto_here_2 (s1, s2); |
832 | scm_remember_upto_here (locale); | |
b89c4943 LC |
833 | |
834 | return result; | |
835 | } | |
836 | #undef FUNC_NAME | |
837 | ||
/* Store into DST an upper-case version of the zero-terminated string SRC,
   converted byte by byte with `toupper ()'.  DST must have room for
   `strlen (SRC) + 1' bytes.

   Each byte is converted to `unsigned char' before being handed to
   `toupper ()': passing a negative `char' value (other than EOF) is
   undefined behavior.  */
static inline void
str_upcase (register char *dst, register const char *src)
{
  for (; *src != '\0'; src++, dst++)
    *dst = (char) toupper ((unsigned char) *src);
  *dst = '\0';
}
846 | ||
/* Store into DST a lower-case version of the zero-terminated string SRC,
   converted byte by byte with `tolower ()'.  DST must have room for
   `strlen (SRC) + 1' bytes.

   Each byte is converted to `unsigned char' before being handed to
   `tolower ()': passing a negative `char' value (other than EOF) is
   undefined behavior.  */
static inline void
str_downcase (register char *dst, register const char *src)
{
  for (; *src != '\0'; src++, dst++)
    *dst = (char) tolower ((unsigned char) *src);
  *dst = '\0';
}
854 | ||
#ifdef USE_GNU_LOCALE_API
/* Store into DST an upper-case version of the zero-terminated string SRC,
   converted byte by byte according to LOCALE.  DST must have room for
   `strlen (SRC) + 1' bytes.  Bytes go through `unsigned char' because the
   character-classification functions are undefined for negative `char'
   values.  */
static inline void
str_upcase_l (register char *dst, register const char *src,
              scm_t_locale locale)
{
  for (; *src != '\0'; src++, dst++)
    *dst = (char) toupper_l ((unsigned char) *src, locale);
  *dst = '\0';
}

/* Store into DST a lower-case version of the zero-terminated string SRC,
   converted byte by byte according to LOCALE.  DST must have room for
   `strlen (SRC) + 1' bytes.  Bytes go through `unsigned char' because the
   character-classification functions are undefined for negative `char'
   values.  */
static inline void
str_downcase_l (register char *dst, register const char *src,
                scm_t_locale locale)
{
  for (; *src != '\0'; src++, dst++)
    *dst = (char) tolower_l ((unsigned char) *src, locale);
  *dst = '\0';
}
#endif
874 | ||
875 | ||
b89c4943 LC |
876 | SCM_DEFINE (scm_string_locale_lt, "string-locale<?", 2, 1, 0, |
877 | (SCM s1, SCM s2, SCM locale), | |
878 | "Compare strings @var{s1} and @var{s2} in a locale-dependent way." | |
879 | "If @var{locale} is provided, it should be locale object (as " | |
880 | "returned by @code{make-locale}) and will be used to perform the " | |
881 | "comparison; otherwise, the current system locale is used.") | |
882 | #define FUNC_NAME s_scm_string_locale_lt | |
9361f762 | 883 | { |
b89c4943 | 884 | int result; |
9361f762 | 885 | |
b89c4943 LC |
886 | SCM_VALIDATE_STRING (1, s1); |
887 | SCM_VALIDATE_STRING (2, s2); | |
9361f762 | 888 | |
5b878445 | 889 | result = compare_u32_strings (s1, s2, locale, FUNC_NAME); |
b89c4943 LC |
890 | |
891 | return scm_from_bool (result < 0); | |
892 | } | |
893 | #undef FUNC_NAME | |
894 | ||
895 | SCM_DEFINE (scm_string_locale_gt, "string-locale>?", 2, 1, 0, | |
896 | (SCM s1, SCM s2, SCM locale), | |
897 | "Compare strings @var{s1} and @var{s2} in a locale-dependent way." | |
898 | "If @var{locale} is provided, it should be locale object (as " | |
899 | "returned by @code{make-locale}) and will be used to perform the " | |
900 | "comparison; otherwise, the current system locale is used.") | |
901 | #define FUNC_NAME s_scm_string_locale_gt | |
902 | { | |
903 | int result; | |
b89c4943 LC |
904 | |
905 | SCM_VALIDATE_STRING (1, s1); | |
906 | SCM_VALIDATE_STRING (2, s2); | |
907 | ||
5b878445 | 908 | result = compare_u32_strings (s1, s2, locale, FUNC_NAME); |
b89c4943 LC |
909 | |
910 | return scm_from_bool (result > 0); | |
911 | } | |
912 | #undef FUNC_NAME | |
913 | ||
914 | SCM_DEFINE (scm_string_locale_ci_lt, "string-locale-ci<?", 2, 1, 0, | |
915 | (SCM s1, SCM s2, SCM locale), | |
916 | "Compare strings @var{s1} and @var{s2} in a case-insensitive, " | |
917 | "and locale-dependent way. If @var{locale} is provided, it " | |
918 | "should be locale object (as returned by @code{make-locale}) " | |
919 | "and will be used to perform the comparison; otherwise, the " | |
920 | "current system locale is used.") | |
921 | #define FUNC_NAME s_scm_string_locale_ci_lt | |
922 | { | |
923 | int result; | |
b89c4943 LC |
924 | |
925 | SCM_VALIDATE_STRING (1, s1); | |
926 | SCM_VALIDATE_STRING (2, s2); | |
927 | ||
5b878445 | 928 | result = compare_u32_strings_ci (s1, s2, locale, FUNC_NAME); |
b89c4943 LC |
929 | |
930 | return scm_from_bool (result < 0); | |
931 | } | |
932 | #undef FUNC_NAME | |
933 | ||
934 | SCM_DEFINE (scm_string_locale_ci_gt, "string-locale-ci>?", 2, 1, 0, | |
935 | (SCM s1, SCM s2, SCM locale), | |
936 | "Compare strings @var{s1} and @var{s2} in a case-insensitive, " | |
937 | "and locale-dependent way. If @var{locale} is provided, it " | |
938 | "should be locale object (as returned by @code{make-locale}) " | |
939 | "and will be used to perform the comparison; otherwise, the " | |
940 | "current system locale is used.") | |
941 | #define FUNC_NAME s_scm_string_locale_ci_gt | |
942 | { | |
943 | int result; | |
b89c4943 LC |
944 | |
945 | SCM_VALIDATE_STRING (1, s1); | |
946 | SCM_VALIDATE_STRING (2, s2); | |
947 | ||
5b878445 | 948 | result = compare_u32_strings_ci (s1, s2, locale, FUNC_NAME); |
b89c4943 LC |
949 | |
950 | return scm_from_bool (result > 0); | |
951 | } | |
952 | #undef FUNC_NAME | |
953 | ||
954 | SCM_DEFINE (scm_string_locale_ci_eq, "string-locale-ci=?", 2, 1, 0, | |
955 | (SCM s1, SCM s2, SCM locale), | |
956 | "Compare strings @var{s1} and @var{s2} in a case-insensitive, " | |
957 | "and locale-dependent way. If @var{locale} is provided, it " | |
958 | "should be locale object (as returned by @code{make-locale}) " | |
959 | "and will be used to perform the comparison; otherwise, the " | |
960 | "current system locale is used.") | |
961 | #define FUNC_NAME s_scm_string_locale_ci_eq | |
962 | { | |
963 | int result; | |
b89c4943 LC |
964 | |
965 | SCM_VALIDATE_STRING (1, s1); | |
966 | SCM_VALIDATE_STRING (2, s2); | |
967 | ||
5b878445 | 968 | result = compare_u32_strings_ci (s1, s2, locale, FUNC_NAME); |
b89c4943 LC |
969 | |
970 | return scm_from_bool (result == 0); | |
971 | } | |
972 | #undef FUNC_NAME | |
973 | ||
974 | ||
975 | SCM_DEFINE (scm_char_locale_lt, "char-locale<?", 2, 1, 0, | |
976 | (SCM c1, SCM c2, SCM locale), | |
977 | "Return true if character @var{c1} is lower than @var{c2} " | |
978 | "according to @var{locale} or to the current locale.") | |
979 | #define FUNC_NAME s_scm_char_locale_lt | |
980 | { | |
5b878445 | 981 | int result; |
b89c4943 LC |
982 | |
983 | SCM_VALIDATE_CHAR (1, c1); | |
984 | SCM_VALIDATE_CHAR (2, c2); | |
985 | ||
5b878445 MG |
986 | result = compare_u32_strings (scm_string (scm_list_1 (c1)), |
987 | scm_string (scm_list_1 (c2)), | |
988 | locale, FUNC_NAME); | |
b89c4943 | 989 | |
5b878445 | 990 | return scm_from_bool (result < 0); |
b89c4943 LC |
991 | } |
992 | #undef FUNC_NAME | |
993 | ||
994 | SCM_DEFINE (scm_char_locale_gt, "char-locale>?", 2, 1, 0, | |
995 | (SCM c1, SCM c2, SCM locale), | |
996 | "Return true if character @var{c1} is greater than @var{c2} " | |
997 | "according to @var{locale} or to the current locale.") | |
998 | #define FUNC_NAME s_scm_char_locale_gt | |
999 | { | |
5b878445 | 1000 | int result; |
b89c4943 LC |
1001 | |
1002 | SCM_VALIDATE_CHAR (1, c1); | |
1003 | SCM_VALIDATE_CHAR (2, c2); | |
1004 | ||
5b878445 MG |
1005 | result = compare_u32_strings (scm_string (scm_list_1 (c1)), |
1006 | scm_string (scm_list_1 (c2)), | |
1007 | locale, FUNC_NAME); | |
b89c4943 | 1008 | |
5b878445 | 1009 | return scm_from_bool (result > 0); |
b89c4943 LC |
1010 | } |
1011 | #undef FUNC_NAME | |
1012 | ||
1013 | SCM_DEFINE (scm_char_locale_ci_lt, "char-locale-ci<?", 2, 1, 0, | |
1014 | (SCM c1, SCM c2, SCM locale), | |
1015 | "Return true if character @var{c1} is lower than @var{c2}, " | |
1016 | "in a case insensitive way according to @var{locale} or to " | |
1017 | "the current locale.") | |
1018 | #define FUNC_NAME s_scm_char_locale_ci_lt | |
1019 | { | |
1020 | int result; | |
b89c4943 LC |
1021 | |
1022 | SCM_VALIDATE_CHAR (1, c1); | |
1023 | SCM_VALIDATE_CHAR (2, c2); | |
1024 | ||
5b878445 MG |
1025 | result = compare_u32_strings_ci (scm_string (scm_list_1 (c1)), |
1026 | scm_string (scm_list_1 (c2)), | |
1027 | locale, FUNC_NAME); | |
b89c4943 LC |
1028 | |
1029 | return scm_from_bool (result < 0); | |
1030 | } | |
1031 | #undef FUNC_NAME | |
1032 | ||
1033 | SCM_DEFINE (scm_char_locale_ci_gt, "char-locale-ci>?", 2, 1, 0, | |
1034 | (SCM c1, SCM c2, SCM locale), | |
1035 | "Return true if character @var{c1} is greater than @var{c2}, " | |
1036 | "in a case insensitive way according to @var{locale} or to " | |
1037 | "the current locale.") | |
1038 | #define FUNC_NAME s_scm_char_locale_ci_gt | |
1039 | { | |
1040 | int result; | |
b89c4943 LC |
1041 | |
1042 | SCM_VALIDATE_CHAR (1, c1); | |
1043 | SCM_VALIDATE_CHAR (2, c2); | |
1044 | ||
5b878445 MG |
1045 | result = compare_u32_strings_ci (scm_string (scm_list_1 (c1)), |
1046 | scm_string (scm_list_1 (c2)), | |
1047 | locale, FUNC_NAME); | |
b89c4943 LC |
1048 | |
1049 | return scm_from_bool (result > 0); | |
1050 | } | |
1051 | #undef FUNC_NAME | |
1052 | ||
1053 | SCM_DEFINE (scm_char_locale_ci_eq, "char-locale-ci=?", 2, 1, 0, | |
1054 | (SCM c1, SCM c2, SCM locale), | |
1055 | "Return true if character @var{c1} is equal to @var{c2}, " | |
1056 | "in a case insensitive way according to @var{locale} or to " | |
1057 | "the current locale.") | |
1058 | #define FUNC_NAME s_scm_char_locale_ci_eq | |
1059 | { | |
1060 | int result; | |
b89c4943 LC |
1061 | |
1062 | SCM_VALIDATE_CHAR (1, c1); | |
1063 | SCM_VALIDATE_CHAR (2, c2); | |
1064 | ||
5b878445 MG |
1065 | result = compare_u32_strings_ci (scm_string (scm_list_1 (c1)), |
1066 | scm_string (scm_list_1 (c2)), | |
1067 | locale, FUNC_NAME); | |
b89c4943 LC |
1068 | |
1069 | return scm_from_bool (result == 0); | |
1070 | } | |
1071 | #undef FUNC_NAME | |
1072 | ||
1073 | ||
1074 | \f | |
1075 | /* Locale-dependent alphabetic character mapping. */ | |
1076 | ||
27f3413e MG |
1077 | static inline int |
1078 | u32_locale_tocase (const scm_t_uint32 *c_s1, size_t len, | |
1079 | scm_t_uint32 **p_c_s2, size_t * p_len2, | |
1080 | scm_t_uint32 *(*func) (const scm_t_uint32 *, size_t, | |
1081 | const char *, uninorm_t, | |
1082 | scm_t_uint32 *, size_t *)) | |
1083 | { | |
1084 | /* Note: Since this is called from `RUN_IN_LOCALE_SECTION', it must not | |
1085 | make any non-local exit. */ | |
1086 | ||
1087 | scm_t_uint32 *ret; | |
aafb5062 | 1088 | const char *loc = locale_language (); |
27f3413e MG |
1089 | |
1090 | /* The first NULL here indicates that no NFC or NFKC normalization | |
1091 | is done. The second NULL means the return buffer is | |
1092 | malloc'ed here. */ | |
1093 | ret = func (c_s1, len, loc, NULL, NULL, p_len2); | |
1094 | ||
1095 | if (ret == NULL) | |
1096 | { | |
2c48e4d5 | 1097 | *p_c_s2 = (scm_t_uint32 *) NULL; |
27f3413e MG |
1098 | *p_len2 = 0; |
1099 | return errno; | |
1100 | } | |
1101 | *p_c_s2 = ret; | |
aafb5062 | 1102 | |
27f3413e MG |
1103 | return 0; |
1104 | } | |
1105 | ||
1106 | ||
820f33aa JG |
1107 | static SCM |
1108 | chr_to_case (SCM chr, scm_t_locale c_locale, | |
1109 | scm_t_uint32 *(*func) (const scm_t_uint32 *, size_t, const char *, | |
1110 | uninorm_t, scm_t_uint32 *, size_t *), | |
44d3d111 | 1111 | const char *func_name, |
820f33aa | 1112 | int *err) |
44d3d111 | 1113 | #define FUNC_NAME func_name |
b89c4943 | 1114 | { |
27f3413e | 1115 | int ret; |
2c48e4d5 | 1116 | scm_t_wchar *buf; |
820f33aa JG |
1117 | scm_t_uint32 *convbuf; |
1118 | size_t convlen; | |
1119 | SCM str, convchar; | |
b89c4943 | 1120 | |
27f3413e MG |
1121 | str = scm_i_make_wide_string (1, &buf); |
1122 | buf[0] = SCM_CHAR (chr); | |
1123 | ||
b89c4943 | 1124 | if (c_locale != NULL) |
27f3413e MG |
1125 | RUN_IN_LOCALE_SECTION (c_locale, ret = |
1126 | u32_locale_tocase ((scm_t_uint32 *) buf, 1, | |
820f33aa JG |
1127 | &convbuf, |
1128 | &convlen, func)); | |
27f3413e MG |
1129 | else |
1130 | ret = | |
820f33aa JG |
1131 | u32_locale_tocase ((scm_t_uint32 *) buf, 1, &convbuf, |
1132 | &convlen, func); | |
27f3413e MG |
1133 | |
1134 | if (SCM_UNLIKELY (ret != 0)) | |
9361f762 | 1135 | { |
820f33aa JG |
1136 | *err = ret; |
1137 | return NULL; | |
9361f762 | 1138 | } |
27f3413e | 1139 | |
820f33aa JG |
1140 | if (convlen == 1) |
1141 | convchar = SCM_MAKE_CHAR ((scm_t_wchar) convbuf[0]); | |
b89c4943 | 1142 | else |
820f33aa JG |
1143 | convchar = chr; |
1144 | free (convbuf); | |
1145 | ||
1146 | return convchar; | |
1147 | } | |
44d3d111 | 1148 | #undef FUNC_NAME |
820f33aa JG |
1149 | |
1150 | SCM_DEFINE (scm_char_locale_downcase, "char-locale-downcase", 1, 1, 0, | |
1151 | (SCM chr, SCM locale), | |
1152 | "Return the lowercase character that corresponds to @var{chr} " | |
1153 | "according to either @var{locale} or the current locale.") | |
1154 | #define FUNC_NAME s_scm_char_locale_downcase | |
1155 | { | |
1156 | scm_t_locale c_locale; | |
1157 | SCM ret; | |
1158 | int err = 0; | |
1159 | ||
1160 | SCM_VALIDATE_CHAR (1, chr); | |
1161 | SCM_VALIDATE_OPTIONAL_LOCALE_COPY (2, locale, c_locale); | |
9361f762 | 1162 | |
44d3d111 | 1163 | ret = chr_to_case (chr, c_locale, u32_tolower, FUNC_NAME, &err); |
820f33aa JG |
1164 | |
1165 | if (err != 0) | |
1166 | { | |
1167 | errno = err; | |
1168 | scm_syserror (FUNC_NAME); | |
1169 | } | |
1170 | return ret; | |
9361f762 MV |
1171 | } |
1172 | #undef FUNC_NAME | |
1173 | ||
b89c4943 LC |
1174 | SCM_DEFINE (scm_char_locale_upcase, "char-locale-upcase", 1, 1, 0, |
1175 | (SCM chr, SCM locale), | |
1176 | "Return the uppercase character that corresponds to @var{chr} " | |
1177 | "according to either @var{locale} or the current locale.") | |
1178 | #define FUNC_NAME s_scm_char_locale_upcase | |
9361f762 | 1179 | { |
b89c4943 | 1180 | scm_t_locale c_locale; |
820f33aa JG |
1181 | SCM ret; |
1182 | int err = 0; | |
b89c4943 LC |
1183 | |
1184 | SCM_VALIDATE_CHAR (1, chr); | |
b89c4943 | 1185 | SCM_VALIDATE_OPTIONAL_LOCALE_COPY (2, locale, c_locale); |
9361f762 | 1186 | |
44d3d111 | 1187 | ret = chr_to_case (chr, c_locale, u32_toupper, FUNC_NAME, &err); |
27f3413e | 1188 | |
820f33aa JG |
1189 | if (err != 0) |
1190 | { | |
1191 | errno = err; | |
1192 | scm_syserror (FUNC_NAME); | |
1193 | } | |
1194 | return ret; | |
1195 | } | |
1196 | #undef FUNC_NAME | |
27f3413e | 1197 | |
820f33aa JG |
1198 | SCM_DEFINE (scm_char_locale_titlecase, "char-locale-titlecase", 1, 1, 0, |
1199 | (SCM chr, SCM locale), | |
1200 | "Return the titlecase character that corresponds to @var{chr} " | |
1201 | "according to either @var{locale} or the current locale.") | |
1202 | #define FUNC_NAME s_scm_char_locale_titlecase | |
1203 | { | |
1204 | scm_t_locale c_locale; | |
1205 | SCM ret; | |
1206 | int err = 0; | |
1207 | ||
1208 | SCM_VALIDATE_CHAR (1, chr); | |
1209 | SCM_VALIDATE_OPTIONAL_LOCALE_COPY (2, locale, c_locale); | |
1210 | ||
44d3d111 | 1211 | ret = chr_to_case (chr, c_locale, u32_totitle, FUNC_NAME, &err); |
820f33aa JG |
1212 | |
1213 | if (err != 0) | |
b89c4943 | 1214 | { |
820f33aa | 1215 | errno = err; |
27f3413e | 1216 | scm_syserror (FUNC_NAME); |
b89c4943 | 1217 | } |
820f33aa | 1218 | return ret; |
b89c4943 LC |
1219 | } |
1220 | #undef FUNC_NAME | |
1221 | ||
820f33aa JG |
1222 | static SCM |
1223 | str_to_case (SCM str, scm_t_locale c_locale, | |
1224 | scm_t_uint32 *(*func) (const scm_t_uint32 *, size_t, const char *, | |
1225 | uninorm_t, scm_t_uint32 *, size_t *), | |
44d3d111 | 1226 | const char *func_name, |
820f33aa | 1227 | int *err) |
44d3d111 | 1228 | #define FUNC_NAME func_name |
b89c4943 | 1229 | { |
2c48e4d5 | 1230 | scm_t_wchar *c_str, *c_buf; |
820f33aa JG |
1231 | scm_t_uint32 *c_convstr; |
1232 | size_t len, convlen; | |
27f3413e | 1233 | int ret; |
820f33aa | 1234 | SCM convstr; |
b89c4943 | 1235 | |
27f3413e MG |
1236 | len = scm_i_string_length (str); |
1237 | if (len == 0) | |
1238 | return scm_nullstr; | |
1239 | SCM_STRING_TO_U32_BUF (str, c_str); | |
b89c4943 LC |
1240 | |
1241 | if (c_locale) | |
27f3413e MG |
1242 | RUN_IN_LOCALE_SECTION (c_locale, ret = |
1243 | u32_locale_tocase ((scm_t_uint32 *) c_str, len, | |
820f33aa JG |
1244 | &c_convstr, |
1245 | &convlen, func)); | |
b89c4943 | 1246 | else |
27f3413e MG |
1247 | ret = |
1248 | u32_locale_tocase ((scm_t_uint32 *) c_str, len, | |
820f33aa | 1249 | &c_convstr, &convlen, func); |
b89c4943 LC |
1250 | |
1251 | scm_remember_upto_here (str); | |
1252 | ||
27f3413e MG |
1253 | if (SCM_UNLIKELY (ret != 0)) |
1254 | { | |
820f33aa JG |
1255 | *err = ret; |
1256 | return NULL; | |
27f3413e MG |
1257 | } |
1258 | ||
820f33aa JG |
1259 | convstr = scm_i_make_wide_string (convlen, &c_buf); |
1260 | memcpy (c_buf, c_convstr, convlen * sizeof (scm_t_wchar)); | |
1261 | free (c_convstr); | |
27f3413e | 1262 | |
820f33aa | 1263 | scm_i_try_narrow_string (convstr); |
27f3413e | 1264 | |
820f33aa JG |
1265 | return convstr; |
1266 | } | |
44d3d111 | 1267 | #undef FUNC_NAME |
820f33aa JG |
1268 | |
1269 | SCM_DEFINE (scm_string_locale_upcase, "string-locale-upcase", 1, 1, 0, | |
1270 | (SCM str, SCM locale), | |
1271 | "Return a new string that is the uppercase version of " | |
1272 | "@var{str} according to either @var{locale} or the current " | |
1273 | "locale.") | |
1274 | #define FUNC_NAME s_scm_string_locale_upcase | |
1275 | { | |
1276 | scm_t_locale c_locale; | |
1277 | SCM ret; | |
1278 | int err = 0; | |
1279 | ||
1280 | SCM_VALIDATE_STRING (1, str); | |
1281 | SCM_VALIDATE_OPTIONAL_LOCALE_COPY (2, locale, c_locale); | |
1282 | ||
44d3d111 | 1283 | ret = str_to_case (str, c_locale, u32_toupper, FUNC_NAME, &err); |
820f33aa JG |
1284 | |
1285 | if (err != 0) | |
1286 | { | |
1287 | errno = err; | |
1288 | scm_syserror (FUNC_NAME); | |
1289 | } | |
1290 | return ret; | |
b89c4943 LC |
1291 | } |
1292 | #undef FUNC_NAME | |
9361f762 | 1293 | |
b89c4943 LC |
1294 | SCM_DEFINE (scm_string_locale_downcase, "string-locale-downcase", 1, 1, 0, |
1295 | (SCM str, SCM locale), | |
1296 | "Return a new string that is the down-case version of " | |
1297 | "@var{str} according to either @var{locale} or the current " | |
1298 | "locale.") | |
1299 | #define FUNC_NAME s_scm_string_locale_downcase | |
1300 | { | |
b89c4943 | 1301 | scm_t_locale c_locale; |
820f33aa JG |
1302 | SCM ret; |
1303 | int err = 0; | |
b89c4943 LC |
1304 | |
1305 | SCM_VALIDATE_STRING (1, str); | |
1306 | SCM_VALIDATE_OPTIONAL_LOCALE_COPY (2, locale, c_locale); | |
9361f762 | 1307 | |
44d3d111 | 1308 | ret = str_to_case (str, c_locale, u32_tolower, FUNC_NAME, &err); |
9361f762 | 1309 | |
820f33aa | 1310 | if (err != 0) |
27f3413e | 1311 | { |
820f33aa | 1312 | errno = err; |
27f3413e MG |
1313 | scm_syserror (FUNC_NAME); |
1314 | } | |
820f33aa JG |
1315 | return ret; |
1316 | } | |
1317 | #undef FUNC_NAME | |
1318 | ||
1319 | SCM_DEFINE (scm_string_locale_titlecase, "string-locale-titlecase", 1, 1, 0, | |
1320 | (SCM str, SCM locale), | |
1321 | "Return a new string that is the title-case version of " | |
1322 | "@var{str} according to either @var{locale} or the current " | |
1323 | "locale.") | |
1324 | #define FUNC_NAME s_scm_string_locale_titlecase | |
1325 | { | |
1326 | scm_t_locale c_locale; | |
1327 | SCM ret; | |
1328 | int err = 0; | |
27f3413e | 1329 | |
820f33aa JG |
1330 | SCM_VALIDATE_STRING (1, str); |
1331 | SCM_VALIDATE_OPTIONAL_LOCALE_COPY (2, locale, c_locale); | |
27f3413e | 1332 | |
44d3d111 | 1333 | ret = str_to_case (str, c_locale, u32_totitle, FUNC_NAME, &err); |
27f3413e | 1334 | |
820f33aa JG |
1335 | if (err != 0) |
1336 | { | |
1337 | errno = err; | |
1338 | scm_syserror (FUNC_NAME); | |
1339 | } | |
1340 | return ret; | |
9361f762 MV |
1341 | } |
1342 | #undef FUNC_NAME | |
1343 | ||
b89c4943 LC |
1344 | /* Note: We don't provide mutative versions of `string-locale-(up|down)case' |
1345 | because, in some languages, a single downcase character maps to a couple | |
1346 | of uppercase characters. Read the SRFI-13 document for a detailed | |
1347 | discussion about this. */ | |
1348 | ||
1349 | ||
1350 | \f | |
1351 | /* Locale-dependent number parsing. */ | |
1352 | ||
1353 | SCM_DEFINE (scm_locale_string_to_integer, "locale-string->integer", | |
1354 | 1, 2, 0, (SCM str, SCM base, SCM locale), | |
1355 | "Convert string @var{str} into an integer according to either " | |
1356 | "@var{locale} (a locale object as returned by @code{make-locale}) " | |
1357 | "or the current process locale. Return two values: an integer " | |
1358 | "(on success) or @code{#f}, and the number of characters read " | |
1359 | "from @var{str} (@code{0} on failure).") | |
1360 | #define FUNC_NAME s_scm_locale_string_to_integer | |
9361f762 | 1361 | { |
9361f762 | 1362 | SCM result; |
b89c4943 LC |
1363 | long c_result; |
1364 | int c_base; | |
1365 | const char *c_str; | |
1366 | char *c_endptr; | |
1367 | scm_t_locale c_locale; | |
9361f762 | 1368 | |
b89c4943 LC |
1369 | SCM_VALIDATE_STRING (1, str); |
1370 | c_str = scm_i_string_chars (str); | |
9361f762 | 1371 | |
b89c4943 LC |
1372 | if (base != SCM_UNDEFINED) |
1373 | SCM_VALIDATE_INT_COPY (2, base, c_base); | |
9361f762 | 1374 | else |
b89c4943 LC |
1375 | c_base = 10; |
1376 | ||
1377 | SCM_VALIDATE_OPTIONAL_LOCALE_COPY (3, locale, c_locale); | |
1378 | ||
1379 | if (c_locale != NULL) | |
9361f762 | 1380 | { |
b89c4943 LC |
1381 | #ifdef USE_GNU_LOCALE_API |
1382 | c_result = strtol_l (c_str, &c_endptr, c_base, c_locale); | |
1383 | #else | |
1384 | RUN_IN_LOCALE_SECTION (c_locale, | |
1385 | c_result = strtol (c_str, &c_endptr, c_base)); | |
1386 | #endif | |
9361f762 | 1387 | } |
b89c4943 LC |
1388 | else |
1389 | c_result = strtol (c_str, &c_endptr, c_base); | |
1390 | ||
1391 | scm_remember_upto_here (str); | |
1392 | ||
1393 | if (c_endptr == c_str) | |
1394 | result = SCM_BOOL_F; | |
1395 | else | |
1396 | result = scm_from_long (c_result); | |
1397 | ||
1398 | return (scm_values (scm_list_2 (result, scm_from_long (c_endptr - c_str)))); | |
1399 | } | |
1400 | #undef FUNC_NAME | |
1401 | ||
1402 | SCM_DEFINE (scm_locale_string_to_inexact, "locale-string->inexact", | |
1403 | 1, 1, 0, (SCM str, SCM locale), | |
1404 | "Convert string @var{str} into an inexact number according to " | |
1405 | "either @var{locale} (a locale object as returned by " | |
1406 | "@code{make-locale}) or the current process locale. Return " | |
1407 | "two values: an inexact number (on success) or @code{#f}, and " | |
1408 | "the number of characters read from @var{str} (@code{0} on " | |
1409 | "failure).") | |
1410 | #define FUNC_NAME s_scm_locale_string_to_inexact | |
1411 | { | |
1412 | SCM result; | |
1413 | double c_result; | |
1414 | const char *c_str; | |
1415 | char *c_endptr; | |
1416 | scm_t_locale c_locale; | |
9361f762 | 1417 | |
b89c4943 LC |
1418 | SCM_VALIDATE_STRING (1, str); |
1419 | c_str = scm_i_string_chars (str); | |
9361f762 | 1420 | |
b89c4943 | 1421 | SCM_VALIDATE_OPTIONAL_LOCALE_COPY (2, locale, c_locale); |
9361f762 | 1422 | |
b89c4943 LC |
1423 | if (c_locale != NULL) |
1424 | { | |
1425 | #ifdef USE_GNU_LOCALE_API | |
1426 | c_result = strtod_l (c_str, &c_endptr, c_locale); | |
1427 | #else | |
1428 | RUN_IN_LOCALE_SECTION (c_locale, | |
1429 | c_result = strtod (c_str, &c_endptr)); | |
1430 | #endif | |
1431 | } | |
9361f762 | 1432 | else |
b89c4943 LC |
1433 | c_result = strtod (c_str, &c_endptr); |
1434 | ||
1435 | scm_remember_upto_here (str); | |
1436 | ||
1437 | if (c_endptr == c_str) | |
9361f762 | 1438 | result = SCM_BOOL_F; |
b89c4943 LC |
1439 | else |
1440 | result = scm_from_double (c_result); | |
9361f762 | 1441 | |
b89c4943 | 1442 | return (scm_values (scm_list_2 (result, scm_from_long (c_endptr - c_str)))); |
9361f762 MV |
1443 | } |
1444 | #undef FUNC_NAME | |
1445 | ||
b89c4943 | 1446 | \f |
a2f00b9b LC |
1447 | /* Language information, aka. `nl_langinfo ()'. */ |
1448 | ||
1449 | /* FIXME: Issues related to `nl-langinfo'. | |
1450 | ||
1451 | 1. The `CODESET' value is not normalized. This is a secondary issue, but | |
1452 | still a practical issue. See | |
1453 | http://www.cl.cam.ac.uk/~mgk25/ucs/norm_charmap.c for codeset | |
1454 | normalization. | |
1455 | ||
1456 | 2. `nl_langinfo ()' is not available on Windows. | |
1457 | ||
1458 | 3. `nl_langinfo ()' may return strings encoded in a locale different from | |
52642040 MG |
1459 | the current one. |
1460 | For example: | |
a2f00b9b LC |
1461 | |
1462 | (nl-langinfo DAY_1 (make-locale LC_ALL "eo_EO.UTF-8")) | |
1463 | ||
52642040 MG |
1464 | returns a result that is a UTF-8 string, regardless of the |
1465 | setting of the current locale. If nl_langinfo supports CODESET, | |
1466 | we can convert the string properly using scm_from_stringn. If | |
1467 | CODESET is not supported, we won't be able to make much sense of | |
56d288b8 LC |
1468 | the returned string. |
1469 | ||
1470 | Note: We don't use Gnulib's `nl_langinfo' module because it's currently not | |
1471 | as complete as the compatibility hacks in `i18n.scm'. */ | |
a2f00b9b LC |
1472 | |
1473 | ||
1474 | SCM_DEFINE (scm_nl_langinfo, "nl-langinfo", 1, 1, 0, | |
1475 | (SCM item, SCM locale), | |
1476 | "Return a string denoting locale information for @var{item} " | |
1477 | "in the current locale or that specified by @var{locale}. " | |
1478 | "The semantics and arguments are the same as those of the " | |
1479 | "X/Open @code{nl_langinfo} function (@pxref{The Elegant and " | |
1480 | "Fast Way, @code{nl_langinfo},, libc, The GNU C Library " | |
1481 | "Reference Manual}).") | |
1482 | #define FUNC_NAME s_scm_nl_langinfo | |
1483 | { | |
1484 | #ifdef HAVE_NL_LANGINFO | |
1485 | SCM result; | |
1486 | nl_item c_item; | |
1487 | char *c_result; | |
1488 | scm_t_locale c_locale; | |
52642040 MG |
1489 | #ifdef HAVE_LANGINFO_CODESET |
1490 | char *codeset; | |
1491 | #endif | |
a2f00b9b LC |
1492 | |
1493 | SCM_VALIDATE_INT_COPY (2, item, c_item); | |
1494 | SCM_VALIDATE_OPTIONAL_LOCALE_COPY (2, locale, c_locale); | |
1495 | ||
1496 | /* Sadly, `nl_langinfo ()' returns a pointer to a static string. According | |
1497 | to SuS v2, that static string may be modified by subsequent calls to | |
1498 | `nl_langinfo ()' as well as by calls to `setlocale ()'. Thus, we must | |
1499 | acquire the locale mutex before doing invoking `nl_langinfo ()'. See | |
1500 | http://opengroup.org/onlinepubs/007908799/xsh/nl_langinfo.html for | |
1501 | details. */ | |
1502 | ||
1503 | scm_i_pthread_mutex_lock (&scm_i_locale_mutex); | |
1504 | if (c_locale != NULL) | |
1505 | { | |
1506 | #ifdef USE_GNU_LOCALE_API | |
1507 | c_result = nl_langinfo_l (c_item, c_locale); | |
52642040 MG |
1508 | #ifdef HAVE_LANGINFO_CODESET |
1509 | codeset = nl_langinfo_l (CODESET, c_locale); | |
1510 | #endif /* HAVE_LANGINFO_CODESET */ | |
1511 | #else /* !USE_GNU_LOCALE_API */ | |
a2f00b9b LC |
1512 | /* We can't use `RUN_IN_LOCALE_SECTION ()' here because the locale |
1513 | mutex is already taken. */ | |
1514 | int lsec_err; | |
1515 | scm_t_locale_settings lsec_prev_locale; | |
1516 | ||
1517 | lsec_err = get_current_locale_settings (&lsec_prev_locale); | |
1518 | if (lsec_err) | |
1519 | scm_i_pthread_mutex_unlock (&scm_i_locale_mutex); | |
1520 | else | |
1521 | { | |
1522 | lsec_err = install_locale (c_locale); | |
1523 | if (lsec_err) | |
1524 | { | |
1525 | leave_locale_section (&lsec_prev_locale); | |
1526 | free_locale_settings (&lsec_prev_locale); | |
1527 | } | |
1528 | } | |
1529 | ||
1530 | if (lsec_err) | |
1531 | scm_locale_error (FUNC_NAME, lsec_err); | |
1532 | else | |
1533 | { | |
1534 | c_result = nl_langinfo (c_item); | |
52642040 MG |
1535 | #ifdef HAVE_LANGINFO_CODESET |
1536 | codeset = nl_langinfo (CODESET); | |
1537 | #endif /* HAVE_LANGINFO_CODESET */ | |
a2f00b9b | 1538 | |
1445e449 | 1539 | restore_locale_settings (&lsec_prev_locale); |
a2f00b9b LC |
1540 | free_locale_settings (&lsec_prev_locale); |
1541 | } | |
1542 | #endif | |
1543 | } | |
1544 | else | |
52642040 MG |
1545 | { |
1546 | c_result = nl_langinfo (c_item); | |
1547 | #ifdef HAVE_LANGINFO_CODESET | |
1548 | codeset = nl_langinfo (CODESET); | |
1549 | #endif /* HAVE_LANGINFO_CODESET */ | |
1550 | } | |
a2f00b9b LC |
1551 | |
1552 | c_result = strdup (c_result); | |
1553 | scm_i_pthread_mutex_unlock (&scm_i_locale_mutex); | |
1554 | ||
1555 | if (c_result == NULL) | |
1556 | result = SCM_BOOL_F; | |
1557 | else | |
1558 | { | |
a2f00b9b LC |
1559 | switch (c_item) |
1560 | { | |
afb49959 | 1561 | #if (defined GROUPING) && (defined MON_GROUPING) |
a2f00b9b LC |
1562 | case GROUPING: |
1563 | case MON_GROUPING: | |
a2f00b9b | 1564 | { |
afb49959 | 1565 | char *p; |
a2f00b9b | 1566 | |
914c4300 LC |
1567 | /* In this cases, the result is to be interpreted as a list |
1568 | of numbers. If the last item is `CHAR_MAX' or a negative | |
1569 | number, it has the special meaning "no more grouping" | |
1570 | (negative numbers aren't specified in POSIX but can be | |
1571 | used by glibc; see | |
1572 | <http://lists.gnu.org/archive/html/bug-guile/2011-02/msg00159.html>). */ | |
afb49959 | 1573 | result = SCM_EOL; |
914c4300 | 1574 | for (p = c_result; (*p > 0) && (*p != CHAR_MAX); p++) |
afb49959 | 1575 | result = scm_cons (SCM_I_MAKINUM ((int) *p), result); |
a2f00b9b | 1576 | |
afb49959 LC |
1577 | { |
1578 | SCM last_pair = result; | |
a2f00b9b | 1579 | |
afb49959 LC |
1580 | result = scm_reverse_x (result, SCM_EOL); |
1581 | ||
914c4300 | 1582 | if (*p == 0) |
afb49959 LC |
1583 | { |
1584 | /* Cyclic grouping information. */ | |
1585 | if (last_pair != SCM_EOL) | |
1586 | SCM_SETCDR (last_pair, result); | |
1587 | } | |
1588 | } | |
a2f00b9b | 1589 | |
afb49959 LC |
1590 | free (c_result); |
1591 | break; | |
1592 | } | |
1593 | #endif | |
1594 | ||
1595 | #if (defined FRAC_DIGITS) && (defined INT_FRAC_DIGITS) | |
a2f00b9b LC |
1596 | case FRAC_DIGITS: |
1597 | case INT_FRAC_DIGITS: | |
1598 | /* This is to be interpreted as a single integer. */ | |
1599 | if (*c_result == CHAR_MAX) | |
1600 | /* Unspecified. */ | |
1601 | result = SCM_BOOL_F; | |
1602 | else | |
1603 | result = SCM_I_MAKINUM (*c_result); | |
1604 | ||
1605 | free (c_result); | |
1606 | break; | |
afb49959 | 1607 | #endif |
a2f00b9b | 1608 | |
afb49959 | 1609 | #if (defined P_CS_PRECEDES) && (defined INT_N_CS_PRECEDES) |
a2f00b9b LC |
1610 | case P_CS_PRECEDES: |
1611 | case N_CS_PRECEDES: | |
1612 | case INT_P_CS_PRECEDES: | |
1613 | case INT_N_CS_PRECEDES: | |
afb49959 | 1614 | #if (defined P_SEP_BY_SPACE) && (defined N_SEP_BY_SPACE) |
a2f00b9b LC |
1615 | case P_SEP_BY_SPACE: |
1616 | case N_SEP_BY_SPACE: | |
afb49959 | 1617 | #endif |
a2f00b9b LC |
1618 | /* This is to be interpreted as a boolean. */ |
1619 | result = scm_from_bool (*c_result); | |
1620 | ||
1621 | free (c_result); | |
1622 | break; | |
afb49959 | 1623 | #endif |
a2f00b9b | 1624 | |
afb49959 | 1625 | #if (defined P_SIGN_POSN) && (defined INT_N_SIGN_POSN) |
a2f00b9b LC |
1626 | case P_SIGN_POSN: |
1627 | case N_SIGN_POSN: | |
1628 | case INT_P_SIGN_POSN: | |
1629 | case INT_N_SIGN_POSN: | |
1630 | /* See `(libc) Sign of Money Amount' for the interpretation of the | |
1631 | return value here. */ | |
1632 | switch (*c_result) | |
1633 | { | |
1634 | case 0: | |
4a655e50 | 1635 | result = scm_from_latin1_symbol ("parenthesize"); |
a2f00b9b LC |
1636 | break; |
1637 | ||
1638 | case 1: | |
4a655e50 | 1639 | result = scm_from_latin1_symbol ("sign-before"); |
a2f00b9b LC |
1640 | break; |
1641 | ||
1642 | case 2: | |
4a655e50 | 1643 | result = scm_from_latin1_symbol ("sign-after"); |
a2f00b9b LC |
1644 | break; |
1645 | ||
1646 | case 3: | |
4a655e50 | 1647 | result = scm_from_latin1_symbol ("sign-before-currency-symbol"); |
a2f00b9b LC |
1648 | break; |
1649 | ||
1650 | case 4: | |
4a655e50 | 1651 | result = scm_from_latin1_symbol ("sign-after-currency-symbol"); |
a2f00b9b LC |
1652 | break; |
1653 | ||
1654 | default: | |
4a655e50 | 1655 | result = scm_from_latin1_symbol ("unspecified"); |
a2f00b9b LC |
1656 | } |
1657 | break; | |
afb49959 | 1658 | #endif |
a2f00b9b LC |
1659 | |
1660 | default: | |
52642040 MG |
1661 | #ifdef HAVE_LANGINFO_CODESET |
1662 | result = scm_from_stringn (c_result, strlen (c_result), | |
1663 | codeset, | |
1664 | SCM_FAILED_CONVERSION_QUESTION_MARK); | |
1665 | #else /* !HAVE_LANGINFO_CODESET */ | |
1666 | /* This may be incorrectly encoded if the locale differs | |
1667 | from the c_locale. */ | |
1668 | result = scm_from_locale_string (c_result); | |
1669 | #endif /* !HAVE_LANGINFO_CODESET */ | |
b8fc11d2 | 1670 | free (c_result); |
a2f00b9b LC |
1671 | } |
1672 | } | |
1673 | ||
1674 | return result; | |
1675 | #else | |
1676 | scm_syserror_msg (FUNC_NAME, "`nl-langinfo' not supported on your system", | |
1677 | SCM_EOL, ENOSYS); | |
1678 | ||
1679 | return SCM_BOOL_F; | |
1680 | #endif | |
1681 | } | |
1682 | #undef FUNC_NAME | |
1683 | ||
/* Define one binding per `nl_item' constant, using `scm_c_define'.  Each
   binding is named after the C identifier and holds the constant's value
   converted with `scm_from_int'.  The whole body is compiled only when
   HAVE_LANGINFO_H is defined; otherwise this function does nothing.  */
static inline void
define_langinfo_items (void)
{
#if defined HAVE_LANGINFO_H

  /* NLITEM (FOO) defines the binding "FOO" with the integer value of FOO.
     The argument is stringified as spelled at the call site.  */
# define NLITEM(item)  scm_c_define (#item, scm_from_int (item))

  NLITEM (CODESET);

  /* Days of the week, abbreviated.  */
  NLITEM (ABDAY_1);
  NLITEM (ABDAY_2);
  NLITEM (ABDAY_3);
  NLITEM (ABDAY_4);
  NLITEM (ABDAY_5);
  NLITEM (ABDAY_6);
  NLITEM (ABDAY_7);

  /* Days of the week, full names.  */
  NLITEM (DAY_1);               /* Sunday */
  NLITEM (DAY_2);               /* Monday */
  NLITEM (DAY_3);               /* Tuesday */
  NLITEM (DAY_4);               /* Wednesday */
  NLITEM (DAY_5);               /* Thursday */
  NLITEM (DAY_6);               /* Friday */
  NLITEM (DAY_7);               /* Saturday */

  /* Months, abbreviated.  */
  NLITEM (ABMON_1);             /* Jan */
  NLITEM (ABMON_2);
  NLITEM (ABMON_3);
  NLITEM (ABMON_4);
  NLITEM (ABMON_5);
  NLITEM (ABMON_6);
  NLITEM (ABMON_7);
  NLITEM (ABMON_8);
  NLITEM (ABMON_9);
  NLITEM (ABMON_10);
  NLITEM (ABMON_11);
  NLITEM (ABMON_12);

  /* Months, full names.  */
  NLITEM (MON_1);               /* January */
  NLITEM (MON_2);
  NLITEM (MON_3);
  NLITEM (MON_4);
  NLITEM (MON_5);
  NLITEM (MON_6);
  NLITEM (MON_7);
  NLITEM (MON_8);
  NLITEM (MON_9);
  NLITEM (MON_10);
  NLITEM (MON_11);
  NLITEM (MON_12);

  NLITEM (AM_STR);              /* Ante meridiem string.  */
  NLITEM (PM_STR);              /* Post meridiem string.  */

  NLITEM (D_T_FMT);             /* Date and time format for strftime.  */
  NLITEM (D_FMT);               /* Date format for strftime.  */
  NLITEM (T_FMT);               /* Time format for strftime.  */
  NLITEM (T_FMT_AMPM);          /* 12-hour time format for strftime.  */

  NLITEM (ERA);                 /* Alternate era.  */
  NLITEM (ERA_D_FMT);           /* Date in alternate era format.  */
  NLITEM (ERA_D_T_FMT);         /* Date and time in alternate era format.  */
  NLITEM (ERA_T_FMT);           /* Time in alternate era format.  */

  NLITEM (ALT_DIGITS);          /* Alternate symbols for digits.  */
  NLITEM (RADIXCHAR);
  NLITEM (THOUSEP);

  /* The remaining items are defined only when the corresponding
     preprocessor macro exists.  */
# if defined YESEXPR
  NLITEM (YESEXPR);
# endif
# if defined NOEXPR
  NLITEM (NOEXPR);
# endif

# if defined CRNCYSTR           /* currency symbol */
  NLITEM (CRNCYSTR);
# endif

  /* GNU extensions.  */

# if defined ERA_YEAR
  NLITEM (ERA_YEAR);            /* Year in alternate era format.  */
# endif

  /* LC_MONETARY category: formatting of monetary quantities.
     These items each correspond to a member of `struct lconv',
     defined in <locale.h>.  */
# if defined INT_CURR_SYMBOL
  NLITEM (INT_CURR_SYMBOL);
# endif
# if defined MON_DECIMAL_POINT
  NLITEM (MON_DECIMAL_POINT);
# endif
# if defined MON_THOUSANDS_SEP
  NLITEM (MON_THOUSANDS_SEP);
# endif
# if defined MON_GROUPING
  NLITEM (MON_GROUPING);
# endif
# if defined POSITIVE_SIGN
  NLITEM (POSITIVE_SIGN);
# endif
# if defined NEGATIVE_SIGN
  NLITEM (NEGATIVE_SIGN);
# endif
# if defined GROUPING
  NLITEM (GROUPING);
# endif
# if defined INT_FRAC_DIGITS
  NLITEM (INT_FRAC_DIGITS);
# endif
# if defined FRAC_DIGITS
  NLITEM (FRAC_DIGITS);
# endif
# if defined P_CS_PRECEDES
  NLITEM (P_CS_PRECEDES);
# endif
# if defined P_SEP_BY_SPACE
  NLITEM (P_SEP_BY_SPACE);
# endif
# if defined N_CS_PRECEDES
  NLITEM (N_CS_PRECEDES);
# endif
# if defined N_SEP_BY_SPACE
  NLITEM (N_SEP_BY_SPACE);
# endif
# if defined P_SIGN_POSN
  NLITEM (P_SIGN_POSN);
# endif
# if defined N_SIGN_POSN
  NLITEM (N_SIGN_POSN);
# endif
# if defined INT_P_CS_PRECEDES
  NLITEM (INT_P_CS_PRECEDES);
# endif
# if defined INT_P_SEP_BY_SPACE
  NLITEM (INT_P_SEP_BY_SPACE);
# endif
# if defined INT_N_CS_PRECEDES
  NLITEM (INT_N_CS_PRECEDES);
# endif
# if defined INT_N_SEP_BY_SPACE
  NLITEM (INT_N_SEP_BY_SPACE);
# endif
# if defined INT_P_SIGN_POSN
  NLITEM (INT_P_SIGN_POSN);
# endif
# if defined INT_N_SIGN_POSN
  NLITEM (INT_N_SIGN_POSN);
# endif

# undef NLITEM

#endif /* HAVE_LANGINFO_H */
}
1847 | ||
1848 | \f | |
1849 | void | |
1850 | scm_init_i18n () | |
1851 | { | |
1852 | SCM global_locale_smob; | |
1853 | ||
1854 | #ifdef HAVE_NL_LANGINFO | |
1855 | scm_add_feature ("nl-langinfo"); | |
1856 | define_langinfo_items (); | |
1857 | #endif | |
b89c4943 | 1858 | |
9361f762 | 1859 | #include "libguile/i18n.x" |
b89c4943 | 1860 | |
a2f00b9b | 1861 | /* Initialize the global locale object with a special `locale' SMOB. */ |
c3b16a5d LC |
1862 | /* XXX: We don't define it as `LC_GLOBAL_LOCALE' because of bugs as of |
1863 | glibc <= 2.11 not (yet) worked around by Gnulib. See | |
1864 | http://sourceware.org/bugzilla/show_bug.cgi?id=11009 for details. */ | |
a2f00b9b LC |
1865 | SCM_NEWSMOB (global_locale_smob, scm_tc16_locale_smob_type, NULL); |
1866 | SCM_VARIABLE_SET (scm_global_locale, global_locale_smob); | |
9361f762 MV |
1867 | } |
1868 | ||
756e8a3a LC |
1869 | void |
1870 | scm_bootstrap_i18n () | |
1871 | { | |
44602b08 AW |
1872 | scm_c_register_extension ("libguile-" SCM_EFFECTIVE_VERSION, |
1873 | "scm_init_i18n", | |
756e8a3a LC |
1874 | (scm_t_extension_init_func) scm_init_i18n, |
1875 | NULL); | |
1876 | ||
1877 | } | |
1878 | ||
9361f762 MV |
1879 | |
1880 | /* | |
1881 | Local Variables: | |
1882 | c-file-style: "gnu" | |
1883 | End: | |
1884 | */ |