Commit | Line | Data |
---|---|---|
8cd39fb3 MH |
1 | ;;; rng-match.el --- matching of RELAX NG patterns against XML events |
2 | ||
5df4f04c | 3 | ;; Copyright (C) 2003, 2007, 2008, 2009, 2010, 2011 Free Software Foundation, Inc. |
8cd39fb3 MH |
4 | |
5 | ;; Author: James Clark | |
6 | ;; Keywords: XML, RelaxNG | |
7 | ||
09aa73e6 | 8 | ;; This file is part of GNU Emacs. |
8cd39fb3 | 9 | |
4936186e | 10 | ;; GNU Emacs is free software: you can redistribute it and/or modify |
09aa73e6 | 11 | ;; it under the terms of the GNU General Public License as published by |
4936186e GM |
12 | ;; the Free Software Foundation, either version 3 of the License, or |
13 | ;; (at your option) any later version. | |
8cd39fb3 | 14 | |
09aa73e6 GM |
15 | ;; GNU Emacs is distributed in the hope that it will be useful, |
16 | ;; but WITHOUT ANY WARRANTY; without even the implied warranty of | |
17 | ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
18 | ;; GNU General Public License for more details. | |
19 | ||
20 | ;; You should have received a copy of the GNU General Public License | |
4936186e | 21 | ;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>. |
8cd39fb3 MH |
22 | |
23 | ;;; Commentary: | |
24 | ||
25 | ;; This uses the algorithm described in | |
26 | ;; http://www.thaiopensource.com/relaxng/derivative.html | |
27 | ;; | |
28 | ;; The schema to be used is contained in the variable | |
29 | ;; rng-current-schema. It has the form described in the file | |
30 | ;; rng-pttrn.el. | |
31 | ;; | |
32 | ;;; Code: | |
33 | ||
34 | (require 'rng-pttrn) | |
35 | (require 'rng-util) | |
36 | (require 'rng-dt) | |
37 | ||
38 | (defvar rng-not-allowed-ipattern nil) | |
39 | (defvar rng-empty-ipattern nil) | |
40 | (defvar rng-text-ipattern nil) | |
41 | ||
42 | (defvar rng-compile-table nil) | |
43 | ||
44 | (defvar rng-being-compiled nil | |
45 | "Contains a list of ref patterns currently being compiled. | |
10545bd8 | 46 | Used to detect invalid recursive references.") |
8cd39fb3 MH |
47 | |
48 | (defvar rng-ipattern-table nil) | |
49 | ||
50 | (defvar rng-last-ipattern-index nil) | |
51 | ||
52 | (defvar rng-match-state nil | |
53 | "An ipattern representing the current state of validation.") | |
54 | ||
55 | ;;; Inline functions | |
56 | ||
57 | (defsubst rng-update-match-state (new-state) | |
58 | (if (and (eq new-state rng-not-allowed-ipattern) | |
59 | (not (eq rng-match-state rng-not-allowed-ipattern))) | |
60 | nil | |
61 | (setq rng-match-state new-state) | |
62 | t)) | |
63 | ||
64 | ;;; Interned patterns | |
65 | ||
66 | (eval-when-compile | |
67 | (defun rng-ipattern-slot-accessor-name (slot-name) | |
68 | (intern (concat "rng-ipattern-get-" | |
69 | (symbol-name slot-name)))) | |
10545bd8 | 70 | |
8cd39fb3 MH |
71 | (defun rng-ipattern-slot-setter-name (slot-name) |
72 | (intern (concat "rng-ipattern-set-" | |
73 | (symbol-name slot-name))))) | |
74 | ||
75 | (defmacro rng-ipattern-defslot (slot-name index) | |
76 | `(progn | |
77 | (defsubst ,(rng-ipattern-slot-accessor-name slot-name) (ipattern) | |
78 | (aref ipattern ,index)) | |
79 | (defsubst ,(rng-ipattern-slot-setter-name slot-name) (ipattern value) | |
80 | (aset ipattern ,index value)))) | |
81 | ||
82 | (rng-ipattern-defslot type 0) | |
83 | (rng-ipattern-defslot index 1) | |
84 | (rng-ipattern-defslot name-class 2) | |
85 | (rng-ipattern-defslot datatype 2) | |
86 | (rng-ipattern-defslot after 2) | |
87 | (rng-ipattern-defslot child 3) | |
88 | (rng-ipattern-defslot value-object 3) | |
89 | (rng-ipattern-defslot nullable 4) | |
90 | (rng-ipattern-defslot memo-text-typed 5) | |
91 | (rng-ipattern-defslot memo-map-start-tag-open-deriv 6) | |
92 | (rng-ipattern-defslot memo-map-start-attribute-deriv 7) | |
93 | (rng-ipattern-defslot memo-start-tag-close-deriv 8) | |
94 | (rng-ipattern-defslot memo-text-only-deriv 9) | |
95 | (rng-ipattern-defslot memo-mixed-text-deriv 10) | |
96 | (rng-ipattern-defslot memo-map-data-deriv 11) | |
97 | (rng-ipattern-defslot memo-end-tag-deriv 12) | |
98 | ||
99 | (defconst rng-memo-map-alist-max 10) | |
100 | ||
101 | (defsubst rng-memo-map-get (key mm) | |
102 | "Return the value associated with KEY in memo-map MM." | |
103 | (let ((found (assoc key mm))) | |
104 | (if found | |
105 | (cdr found) | |
106 | (and mm | |
107 | (let ((head (car mm))) | |
108 | (and (hash-table-p head) | |
109 | (gethash key head))))))) | |
110 | ||
111 | (defun rng-memo-map-add (key value mm &optional weakness) | |
112 | "Associate KEY with VALUE in memo-map MM and return the new memo-map. | |
113 | The new memo-map may or may not be a different object from MM. | |
114 | ||
10545bd8 | 115 | Alists are better for small maps. Hash tables are better for large |
8cd39fb3 | 116 | maps. A memo-map therefore starts off as an alist and switches to a |
10545bd8 JB |
117 | hash table for large memo-maps. A memo-map is always a list. An empty |
118 | memo-map is represented by nil. A large memo-map is represented by a | |
8cd39fb3 MH |
119 | list containing just a hash-table. A small memo map is represented by |
120 | a list whose cdr is an alist and whose car is the number of entries in | |
10545bd8 | 121 | the alist. The complete memo-map can be passed to `assoc' without |
8cd39fb3 MH |
122 | problems: assoc ignores any members that are not cons cells. There is |
123 | therefore minimal overhead in successful lookups on small lists | |
124 | \(which is the most common case)." | |
125 | (if (null mm) | |
126 | (list 1 (cons key value)) | |
127 | (let ((head (car mm))) | |
128 | (cond ((hash-table-p head) | |
129 | (puthash key value head) | |
130 | mm) | |
131 | ((>= head rng-memo-map-alist-max) | |
132 | (let ((ht (make-hash-table :test 'equal | |
133 | :weakness weakness | |
134 | :size (* 2 rng-memo-map-alist-max)))) | |
135 | (setq mm (cdr mm)) | |
136 | (while mm | |
137 | (setq head (car mm)) | |
138 | (puthash (car head) (cdr head) ht) | |
139 | (setq mm (cdr mm))) | |
140 | (cons ht nil))) | |
141 | (t (cons (1+ head) | |
142 | (cons (cons key value) | |
143 | (cdr mm)))))))) | |
10545bd8 | 144 | |
8cd39fb3 MH |
145 | (defsubst rng-make-ipattern (type index name-class child nullable) |
146 | (vector type index name-class child nullable | |
147 | ;; 5 memo-text-typed | |
148 | 'unknown | |
149 | ;; 6 memo-map-start-tag-open-deriv | |
150 | nil | |
151 | ;; 7 memo-map-start-attribute-deriv | |
152 | nil | |
153 | ;; 8 memo-start-tag-close-deriv | |
154 | nil | |
155 | ;; 9 memo-text-only-deriv | |
156 | nil | |
157 | ;; 10 memo-mixed-text-deriv | |
158 | nil | |
159 | ;; 11 memo-map-data-deriv | |
160 | nil | |
161 | ;; 12 memo-end-tag-deriv | |
162 | nil)) | |
163 | ||
164 | (defun rng-ipattern-maybe-init () | |
165 | (unless rng-ipattern-table | |
166 | (setq rng-ipattern-table (make-hash-table :test 'equal)) | |
167 | (setq rng-last-ipattern-index -1))) | |
168 | ||
169 | (defun rng-ipattern-clear () | |
170 | (when rng-ipattern-table | |
171 | (clrhash rng-ipattern-table)) | |
172 | (setq rng-last-ipattern-index -1)) | |
173 | ||
174 | (defsubst rng-gen-ipattern-index () | |
175 | (setq rng-last-ipattern-index (1+ rng-last-ipattern-index))) | |
176 | ||
177 | (defun rng-put-ipattern (key type name-class child nullable) | |
178 | (let ((ipattern | |
179 | (rng-make-ipattern type | |
180 | (rng-gen-ipattern-index) | |
181 | name-class | |
182 | child | |
183 | nullable))) | |
184 | (puthash key ipattern rng-ipattern-table) | |
185 | ipattern)) | |
186 | ||
187 | (defun rng-get-ipattern (key) | |
188 | (gethash key rng-ipattern-table)) | |
189 | ||
190 | (or rng-not-allowed-ipattern | |
191 | (setq rng-not-allowed-ipattern | |
192 | (rng-make-ipattern 'not-allowed -3 nil nil nil))) | |
193 | ||
194 | (or rng-empty-ipattern | |
195 | (setq rng-empty-ipattern | |
196 | (rng-make-ipattern 'empty -2 nil nil t))) | |
197 | ||
198 | (or rng-text-ipattern | |
199 | (setq rng-text-ipattern | |
200 | (rng-make-ipattern 'text -1 nil nil t))) | |
201 | ||
202 | (defconst rng-const-ipatterns | |
203 | (list rng-not-allowed-ipattern | |
204 | rng-empty-ipattern | |
205 | rng-text-ipattern)) | |
206 | ||
207 | (defun rng-intern-after (child after) | |
208 | (if (eq child rng-not-allowed-ipattern) | |
209 | rng-not-allowed-ipattern | |
210 | (let ((key (list 'after | |
211 | (rng-ipattern-get-index child) | |
212 | (rng-ipattern-get-index after)))) | |
213 | (or (rng-get-ipattern key) | |
214 | (rng-put-ipattern key | |
215 | 'after | |
216 | after | |
217 | child | |
218 | nil))))) | |
10545bd8 | 219 | |
8cd39fb3 MH |
220 | (defun rng-intern-attribute (name-class ipattern) |
221 | (if (eq ipattern rng-not-allowed-ipattern) | |
222 | rng-not-allowed-ipattern | |
223 | (let ((key (list 'attribute | |
224 | name-class | |
225 | (rng-ipattern-get-index ipattern)))) | |
226 | (or (rng-get-ipattern key) | |
227 | (rng-put-ipattern key | |
228 | 'attribute | |
229 | name-class | |
230 | ipattern | |
231 | nil))))) | |
232 | ||
233 | (defun rng-intern-data (dt matches-anything) | |
234 | (let ((key (list 'data dt))) | |
235 | (or (rng-get-ipattern key) | |
236 | (let ((ipattern (rng-put-ipattern key | |
237 | 'data | |
238 | dt | |
239 | nil | |
240 | matches-anything))) | |
241 | (rng-ipattern-set-memo-text-typed ipattern | |
242 | (not matches-anything)) | |
243 | ipattern)))) | |
244 | ||
245 | (defun rng-intern-data-except (dt ipattern) | |
246 | (let ((key (list 'data-except dt ipattern))) | |
247 | (or (rng-get-ipattern key) | |
248 | (rng-put-ipattern key | |
249 | 'data-except | |
250 | dt | |
251 | ipattern | |
252 | nil)))) | |
253 | ||
254 | (defun rng-intern-value (dt obj) | |
255 | (let ((key (list 'value dt obj))) | |
256 | (or (rng-get-ipattern key) | |
257 | (rng-put-ipattern key | |
258 | 'value | |
259 | dt | |
260 | obj | |
261 | nil)))) | |
262 | ||
263 | (defun rng-intern-one-or-more (ipattern) | |
264 | (or (rng-intern-one-or-more-shortcut ipattern) | |
265 | (let ((key (cons 'one-or-more | |
266 | (list (rng-ipattern-get-index ipattern))))) | |
267 | (or (rng-get-ipattern key) | |
268 | (rng-put-ipattern key | |
269 | 'one-or-more | |
270 | nil | |
271 | ipattern | |
272 | (rng-ipattern-get-nullable ipattern)))))) | |
273 | ||
274 | (defun rng-intern-one-or-more-shortcut (ipattern) | |
275 | (cond ((eq ipattern rng-not-allowed-ipattern) | |
276 | rng-not-allowed-ipattern) | |
277 | ((eq ipattern rng-empty-ipattern) | |
278 | rng-empty-ipattern) | |
279 | ((eq (rng-ipattern-get-type ipattern) 'one-or-more) | |
280 | ipattern) | |
281 | (t nil))) | |
282 | ||
283 | (defun rng-intern-list (ipattern) | |
284 | (if (eq ipattern rng-not-allowed-ipattern) | |
285 | rng-not-allowed-ipattern | |
286 | (let ((key (cons 'list | |
287 | (list (rng-ipattern-get-index ipattern))))) | |
288 | (or (rng-get-ipattern key) | |
289 | (rng-put-ipattern key | |
290 | 'list | |
291 | nil | |
292 | ipattern | |
293 | nil))))) | |
294 | ||
295 | (defun rng-intern-group (ipatterns) | |
10545bd8 | 296 | "Return an ipattern for the list of group members in IPATTERNS." |
8cd39fb3 MH |
297 | (or (rng-intern-group-shortcut ipatterns) |
298 | (let* ((tem (rng-normalize-group-list ipatterns)) | |
299 | (normalized (cdr tem))) | |
300 | (or (rng-intern-group-shortcut normalized) | |
301 | (let ((key (cons 'group | |
302 | (mapcar 'rng-ipattern-get-index normalized)))) | |
303 | (or (rng-get-ipattern key) | |
304 | (rng-put-ipattern key | |
305 | 'group | |
306 | nil | |
307 | normalized | |
308 | (car tem)))))))) | |
309 | ||
310 | (defun rng-intern-group-shortcut (ipatterns) | |
10545bd8 JB |
311 | "Try to shortcut interning a group list. |
312 | If successful, return the interned pattern. Otherwise return nil." | |
8cd39fb3 MH |
313 | (while (and ipatterns |
314 | (eq (car ipatterns) rng-empty-ipattern)) | |
315 | (setq ipatterns (cdr ipatterns))) | |
316 | (if ipatterns | |
317 | (let ((ret (car ipatterns))) | |
318 | (if (eq ret rng-not-allowed-ipattern) | |
319 | rng-not-allowed-ipattern | |
320 | (setq ipatterns (cdr ipatterns)) | |
321 | (while (and ipatterns ret) | |
322 | (let ((tem (car ipatterns))) | |
323 | (cond ((eq tem rng-not-allowed-ipattern) | |
324 | (setq ret tem) | |
325 | (setq ipatterns nil)) | |
326 | ((eq tem rng-empty-ipattern) | |
327 | (setq ipatterns (cdr ipatterns))) | |
328 | (t | |
329 | ;; Stop here rather than continuing | |
330 | ;; looking for not-allowed patterns. | |
331 | ;; We do a complete scan elsewhere. | |
332 | (setq ret nil))))) | |
333 | ret)) | |
334 | rng-empty-ipattern)) | |
335 | ||
336 | (defun rng-normalize-group-list (ipatterns) | |
337 | "Normalize a list containing members of a group. | |
338 | Expands nested groups, removes empty members, handles notAllowed. | |
339 | Returns a pair whose car says whether the list is nullable and whose | |
340 | cdr is the normalized list." | |
341 | (let ((nullable t) | |
342 | (result nil) | |
343 | member) | |
344 | (while ipatterns | |
345 | (setq member (car ipatterns)) | |
346 | (setq ipatterns (cdr ipatterns)) | |
347 | (when nullable | |
348 | (setq nullable (rng-ipattern-get-nullable member))) | |
349 | (cond ((eq (rng-ipattern-get-type member) 'group) | |
350 | (setq result | |
351 | (nconc (reverse (rng-ipattern-get-child member)) | |
352 | result))) | |
353 | ((eq member rng-not-allowed-ipattern) | |
354 | (setq result (list rng-not-allowed-ipattern)) | |
355 | (setq ipatterns nil)) | |
356 | ((not (eq member rng-empty-ipattern)) | |
357 | (setq result (cons member result))))) | |
358 | (cons nullable (nreverse result)))) | |
359 | ||
360 | (defun rng-intern-interleave (ipatterns) | |
361 | (or (rng-intern-group-shortcut ipatterns) | |
362 | (let* ((tem (rng-normalize-interleave-list ipatterns)) | |
363 | (normalized (cdr tem))) | |
364 | (or (rng-intern-group-shortcut normalized) | |
365 | (let ((key (cons 'interleave | |
366 | (mapcar 'rng-ipattern-get-index normalized)))) | |
367 | (or (rng-get-ipattern key) | |
368 | (rng-put-ipattern key | |
369 | 'interleave | |
370 | nil | |
371 | normalized | |
372 | (car tem)))))))) | |
373 | ||
374 | (defun rng-normalize-interleave-list (ipatterns) | |
375 | "Normalize a list containing members of an interleave. | |
376 | Expands nested groups, removes empty members, handles notAllowed. | |
377 | Returns a pair whose car says whether the list is nullable and whose | |
378 | cdr is the normalized list." | |
379 | (let ((nullable t) | |
380 | (result nil) | |
381 | member) | |
382 | (while ipatterns | |
383 | (setq member (car ipatterns)) | |
384 | (setq ipatterns (cdr ipatterns)) | |
385 | (when nullable | |
386 | (setq nullable (rng-ipattern-get-nullable member))) | |
387 | (cond ((eq (rng-ipattern-get-type member) 'interleave) | |
388 | (setq result | |
389 | (append (rng-ipattern-get-child member) | |
390 | result))) | |
391 | ((eq member rng-not-allowed-ipattern) | |
392 | (setq result (list rng-not-allowed-ipattern)) | |
393 | (setq ipatterns nil)) | |
394 | ((not (eq member rng-empty-ipattern)) | |
395 | (setq result (cons member result))))) | |
396 | (cons nullable (sort result 'rng-compare-ipattern)))) | |
397 | ||
398 | ;; Would be cleaner if this didn't modify IPATTERNS. | |
399 | ||
400 | (defun rng-intern-choice (ipatterns) | |
401 | "Return a choice ipattern for the list of choices in IPATTERNS. | |
402 | May alter IPATTERNS." | |
403 | (or (rng-intern-choice-shortcut ipatterns) | |
404 | (let* ((tem (rng-normalize-choice-list ipatterns)) | |
405 | (normalized (cdr tem))) | |
406 | (or (rng-intern-choice-shortcut normalized) | |
407 | (rng-intern-choice1 normalized (car tem)))))) | |
408 | ||
409 | (defun rng-intern-optional (ipattern) | |
410 | (cond ((rng-ipattern-get-nullable ipattern) ipattern) | |
411 | ((eq ipattern rng-not-allowed-ipattern) rng-empty-ipattern) | |
412 | (t (rng-intern-choice1 | |
413 | ;; This is sorted since the empty pattern | |
414 | ;; is before everything except not allowed. | |
415 | ;; It cannot have a duplicate empty pattern, | |
416 | ;; since it is not nullable. | |
417 | (cons rng-empty-ipattern | |
418 | (if (eq (rng-ipattern-get-type ipattern) 'choice) | |
419 | (rng-ipattern-get-child ipattern) | |
420 | (list ipattern))) | |
421 | t)))) | |
422 | ||
423 | ||
424 | (defun rng-intern-choice1 (normalized nullable) | |
425 | (let ((key (cons 'choice | |
426 | (mapcar 'rng-ipattern-get-index normalized)))) | |
427 | (or (rng-get-ipattern key) | |
428 | (rng-put-ipattern key | |
429 | 'choice | |
430 | nil | |
431 | normalized | |
432 | nullable)))) | |
10545bd8 | 433 | |
8cd39fb3 | 434 | (defun rng-intern-choice-shortcut (ipatterns) |
10545bd8 JB |
435 | "Try to shortcut interning a choice list. |
436 | If successful, return the interned pattern. Otherwise return nil." | |
8cd39fb3 MH |
437 | (while (and ipatterns |
438 | (eq (car ipatterns) | |
439 | rng-not-allowed-ipattern)) | |
440 | (setq ipatterns (cdr ipatterns))) | |
441 | (if ipatterns | |
442 | (let ((ret (car ipatterns))) | |
443 | (setq ipatterns (cdr ipatterns)) | |
444 | (while (and ipatterns ret) | |
445 | (or (eq (car ipatterns) rng-not-allowed-ipattern) | |
446 | (eq (car ipatterns) ret) | |
447 | (setq ret nil)) | |
448 | (setq ipatterns (cdr ipatterns))) | |
449 | ret) | |
450 | rng-not-allowed-ipattern)) | |
451 | ||
452 | (defun rng-normalize-choice-list (ipatterns) | |
10545bd8 JB |
453 | "Normalize a list of choices. |
454 | Expands nested choices, removes not-allowed members, sorts by index | |
455 | and removes duplicates. Return a pair whose car says whether the | |
456 | list is nullable and whose cdr is the normalized list." | |
8cd39fb3 MH |
457 | (let ((sorted t) |
458 | (nullable nil) | |
459 | (head (cons nil ipatterns))) | |
460 | (let ((tail head) | |
461 | (final-tail nil) | |
462 | (prev-index -100) | |
463 | (cur ipatterns) | |
464 | member) | |
465 | ;; the cdr of tail is always cur | |
466 | (while cur | |
467 | (setq member (car cur)) | |
468 | (or nullable | |
469 | (setq nullable (rng-ipattern-get-nullable member))) | |
470 | (cond ((eq (rng-ipattern-get-type member) 'choice) | |
471 | (setq final-tail | |
472 | (append (rng-ipattern-get-child member) | |
473 | final-tail)) | |
474 | (setq cur (cdr cur)) | |
475 | (setq sorted nil) | |
476 | (setcdr tail cur)) | |
477 | ((eq member rng-not-allowed-ipattern) | |
478 | (setq cur (cdr cur)) | |
479 | (setcdr tail cur)) | |
480 | (t | |
481 | (if (and sorted | |
482 | (let ((cur-index (rng-ipattern-get-index member))) | |
483 | (if (>= prev-index cur-index) | |
484 | (or (= prev-index cur-index) ; will remove it | |
485 | (setq sorted nil)) ; won't remove it | |
486 | (setq prev-index cur-index) | |
487 | ;; won't remove it | |
488 | nil))) | |
489 | (progn | |
490 | ;; remove it | |
491 | (setq cur (cdr cur)) | |
492 | (setcdr tail cur)) | |
493 | ;; don't remove it | |
494 | (setq tail cur) | |
495 | (setq cur (cdr cur)))))) | |
496 | (setcdr tail final-tail)) | |
497 | (setq head (cdr head)) | |
498 | (cons nullable | |
499 | (if sorted | |
500 | head | |
501 | (rng-uniquify-eq (sort head 'rng-compare-ipattern)))))) | |
502 | ||
503 | (defun rng-compare-ipattern (p1 p2) | |
504 | (< (rng-ipattern-get-index p1) | |
505 | (rng-ipattern-get-index p2))) | |
506 | ||
507 | ;;; Name classes | |
508 | ||
509 | (defsubst rng-name-class-contains (nc nm) | |
510 | (if (consp nc) | |
511 | (equal nm nc) | |
512 | (rng-name-class-contains1 nc nm))) | |
513 | ||
514 | (defun rng-name-class-contains1 (nc nm) | |
515 | (let ((type (aref nc 0))) | |
516 | (cond ((eq type 'any-name) t) | |
517 | ((eq type 'any-name-except) | |
518 | (not (rng-name-class-contains (aref nc 1) nm))) | |
519 | ((eq type 'ns-name) | |
520 | (eq (car nm) (aref nc 1))) | |
521 | ((eq type 'ns-name-except) | |
522 | (and (eq (car nm) (aref nc 1)) | |
523 | (not (rng-name-class-contains (aref nc 2) nm)))) | |
524 | ((eq type 'choice) | |
525 | (let ((choices (aref nc 1)) | |
526 | (ret nil)) | |
527 | (while choices | |
528 | (if (rng-name-class-contains (car choices) nm) | |
529 | (progn | |
530 | (setq choices nil) | |
531 | (setq ret t)) | |
532 | (setq choices (cdr choices)))) | |
533 | ret))))) | |
534 | ||
535 | (defun rng-name-class-possible-names (nc accum) | |
536 | "Return a list of possible names that nameclass NC can match. | |
537 | ||
538 | Each possible name should be returned as a (NAMESPACE . LOCAL-NAME) | |
539 | pair, where NAMESPACE is a symbol or nil and LOCAL-NAME is a string. | |
10545bd8 JB |
540 | NAMESPACE, if nil, matches the absent namespace. ACCUM is a list of |
541 | names which should be appended to the returned list. The returned | |
542 | list may contain duplicates." | |
8cd39fb3 MH |
543 | (if (consp nc) |
544 | (cons nc accum) | |
545 | (when (eq (aref nc 0) 'choice) | |
546 | (let ((members (aref nc 1)) member) | |
547 | (while members | |
548 | (setq member (car members)) | |
549 | (setq accum | |
550 | (if (consp member) | |
551 | (cons member accum) | |
552 | (rng-name-class-possible-names member | |
553 | accum))) | |
554 | (setq members (cdr members))))) | |
555 | accum)) | |
556 | ||
557 | ;;; Debugging utilities | |
558 | ||
559 | (defun rng-ipattern-to-string (ipattern) | |
560 | (let ((type (rng-ipattern-get-type ipattern))) | |
561 | (cond ((eq type 'after) | |
562 | (concat (rng-ipattern-to-string | |
563 | (rng-ipattern-get-child ipattern)) | |
564 | " </> " | |
565 | (rng-ipattern-to-string | |
566 | (rng-ipattern-get-after ipattern)))) | |
567 | ((eq type 'element) | |
568 | (concat "element " | |
569 | (rng-name-class-to-string | |
570 | (rng-ipattern-get-name-class ipattern)) | |
571 | ;; we can get cycles with elements so don't print it out | |
572 | " {...}")) | |
573 | ((eq type 'attribute) | |
574 | (concat "attribute " | |
575 | (rng-name-class-to-string | |
576 | (rng-ipattern-get-name-class ipattern)) | |
577 | " { " | |
578 | (rng-ipattern-to-string | |
579 | (rng-ipattern-get-child ipattern)) | |
580 | " } ")) | |
581 | ((eq type 'empty) "empty") | |
582 | ((eq type 'text) "text") | |
583 | ((eq type 'not-allowed) "notAllowed") | |
584 | ((eq type 'one-or-more) | |
585 | (concat (rng-ipattern-to-string | |
586 | (rng-ipattern-get-child ipattern)) | |
587 | "+")) | |
588 | ((eq type 'choice) | |
589 | (concat "(" | |
590 | (mapconcat 'rng-ipattern-to-string | |
591 | (rng-ipattern-get-child ipattern) | |
592 | " | ") | |
593 | ")")) | |
594 | ((eq type 'group) | |
595 | (concat "(" | |
596 | (mapconcat 'rng-ipattern-to-string | |
597 | (rng-ipattern-get-child ipattern) | |
598 | ", ") | |
599 | ")")) | |
600 | ((eq type 'interleave) | |
601 | (concat "(" | |
602 | (mapconcat 'rng-ipattern-to-string | |
603 | (rng-ipattern-get-child ipattern) | |
604 | " & ") | |
605 | ")")) | |
606 | (t (symbol-name type))))) | |
607 | ||
608 | (defun rng-name-class-to-string (nc) | |
609 | (if (consp nc) | |
610 | (cdr nc) | |
611 | (let ((type (aref nc 0))) | |
612 | (cond ((eq type 'choice) | |
613 | (mapconcat 'rng-name-class-to-string | |
614 | (aref nc 1) | |
615 | "|")) | |
616 | (t (concat (symbol-name type) "*")))))) | |
617 | ||
618 | ||
619 | ;;; Compiling | |
620 | ||
621 | (defun rng-compile-maybe-init () | |
622 | (unless rng-compile-table | |
623 | (setq rng-compile-table (make-hash-table :test 'eq)))) | |
624 | ||
625 | (defun rng-compile-clear () | |
626 | (when rng-compile-table | |
627 | (clrhash rng-compile-table))) | |
628 | ||
629 | (defun rng-compile (pattern) | |
630 | (or (gethash pattern rng-compile-table) | |
631 | (let ((ipattern (apply (get (car pattern) 'rng-compile) | |
632 | (cdr pattern)))) | |
633 | (puthash pattern ipattern rng-compile-table) | |
634 | ipattern))) | |
635 | ||
636 | (put 'empty 'rng-compile 'rng-compile-empty) | |
637 | (put 'text 'rng-compile 'rng-compile-text) | |
638 | (put 'not-allowed 'rng-compile 'rng-compile-not-allowed) | |
639 | (put 'element 'rng-compile 'rng-compile-element) | |
640 | (put 'attribute 'rng-compile 'rng-compile-attribute) | |
641 | (put 'choice 'rng-compile 'rng-compile-choice) | |
642 | (put 'optional 'rng-compile 'rng-compile-optional) | |
643 | (put 'group 'rng-compile 'rng-compile-group) | |
644 | (put 'interleave 'rng-compile 'rng-compile-interleave) | |
645 | (put 'ref 'rng-compile 'rng-compile-ref) | |
646 | (put 'one-or-more 'rng-compile 'rng-compile-one-or-more) | |
647 | (put 'zero-or-more 'rng-compile 'rng-compile-zero-or-more) | |
648 | (put 'mixed 'rng-compile 'rng-compile-mixed) | |
649 | (put 'data 'rng-compile 'rng-compile-data) | |
650 | (put 'data-except 'rng-compile 'rng-compile-data-except) | |
651 | (put 'value 'rng-compile 'rng-compile-value) | |
652 | (put 'list 'rng-compile 'rng-compile-list) | |
653 | ||
654 | (defun rng-compile-not-allowed () rng-not-allowed-ipattern) | |
655 | (defun rng-compile-empty () rng-empty-ipattern) | |
656 | (defun rng-compile-text () rng-text-ipattern) | |
657 | ||
658 | (defun rng-compile-element (name-class pattern) | |
659 | ;; don't intern | |
660 | (rng-make-ipattern 'element | |
661 | (rng-gen-ipattern-index) | |
662 | (rng-compile-name-class name-class) | |
663 | pattern ; compile lazily | |
664 | nil)) | |
665 | ||
666 | (defun rng-element-get-child (element) | |
667 | (let ((tem (rng-ipattern-get-child element))) | |
668 | (if (vectorp tem) | |
669 | tem | |
670 | (rng-ipattern-set-child element (rng-compile tem))))) | |
671 | ||
672 | (defun rng-compile-attribute (name-class pattern) | |
673 | (rng-intern-attribute (rng-compile-name-class name-class) | |
674 | (rng-compile pattern))) | |
675 | ||
676 | (defun rng-compile-ref (pattern name) | |
677 | (and (memq pattern rng-being-compiled) | |
678 | (rng-compile-error "Reference loop on symbol %s" name)) | |
679 | (setq rng-being-compiled | |
680 | (cons pattern rng-being-compiled)) | |
681 | (unwind-protect | |
682 | (rng-compile pattern) | |
683 | (setq rng-being-compiled | |
684 | (cdr rng-being-compiled)))) | |
10545bd8 | 685 | |
8cd39fb3 MH |
686 | (defun rng-compile-one-or-more (pattern) |
687 | (rng-intern-one-or-more (rng-compile pattern))) | |
688 | ||
689 | (defun rng-compile-zero-or-more (pattern) | |
690 | (rng-intern-optional | |
691 | (rng-intern-one-or-more (rng-compile pattern)))) | |
692 | ||
693 | (defun rng-compile-optional (pattern) | |
694 | (rng-intern-optional (rng-compile pattern))) | |
695 | ||
696 | (defun rng-compile-mixed (pattern) | |
697 | (rng-intern-interleave (cons rng-text-ipattern | |
698 | (list (rng-compile pattern))))) | |
699 | ||
700 | (defun rng-compile-list (pattern) | |
701 | (rng-intern-list (rng-compile pattern))) | |
702 | ||
703 | (defun rng-compile-choice (&rest patterns) | |
704 | (rng-intern-choice (mapcar 'rng-compile patterns))) | |
705 | ||
706 | (defun rng-compile-group (&rest patterns) | |
707 | (rng-intern-group (mapcar 'rng-compile patterns))) | |
708 | ||
709 | (defun rng-compile-interleave (&rest patterns) | |
710 | (rng-intern-interleave (mapcar 'rng-compile patterns))) | |
711 | ||
712 | (defun rng-compile-dt (name params) | |
713 | (let ((rng-dt-error-reporter 'rng-compile-error)) | |
714 | (funcall (let ((uri (car name))) | |
715 | (or (get uri 'rng-dt-compile) | |
716 | (rng-compile-error "Unknown datatype library %s" uri))) | |
717 | (cdr name) | |
718 | params))) | |
719 | ||
720 | (defun rng-compile-data (name params) | |
721 | (let ((dt (rng-compile-dt name params))) | |
722 | (rng-intern-data (cdr dt) (car dt)))) | |
723 | ||
724 | (defun rng-compile-data-except (name params pattern) | |
725 | (rng-intern-data-except (cdr (rng-compile-dt name params)) | |
726 | (rng-compile pattern))) | |
727 | ||
728 | (defun rng-compile-value (name str context) | |
729 | (let* ((dt (cdr (rng-compile-dt name '()))) | |
730 | (rng-dt-namespace-context-getter (list 'identity context)) | |
731 | (obj (rng-dt-make-value dt str))) | |
732 | (if obj | |
733 | (rng-intern-value dt obj) | |
734 | (rng-compile-error "Value %s is not a valid instance of the datatype %s" | |
735 | str | |
736 | name)))) | |
10545bd8 | 737 | |
8cd39fb3 MH |
738 | (defun rng-compile-name-class (nc) |
739 | (let ((type (car nc))) | |
740 | (cond ((eq type 'name) (nth 1 nc)) | |
741 | ((eq type 'any-name) [any-name]) | |
742 | ((eq type 'any-name-except) | |
743 | (vector 'any-name-except | |
744 | (rng-compile-name-class (nth 1 nc)))) | |
745 | ((eq type 'ns-name) | |
746 | (vector 'ns-name (nth 1 nc))) | |
747 | ((eq type 'ns-name-except) | |
748 | (vector 'ns-name-except | |
749 | (nth 1 nc) | |
750 | (rng-compile-name-class (nth 2 nc)))) | |
751 | ((eq type 'choice) | |
752 | (vector 'choice | |
753 | (mapcar 'rng-compile-name-class (cdr nc)))) | |
754 | (t (error "Bad name-class type %s" type))))) | |
755 | ||
756 | ;;; Searching patterns | |
757 | ||
758 | ;; We write this non-recursively to avoid hitting max-lisp-eval-depth | |
759 | ;; on large schemas. | |
760 | ||
761 | (defun rng-map-element-attribute (function pattern accum &rest args) | |
762 | (let ((searched (make-hash-table :test 'eq)) | |
763 | type todo patterns) | |
764 | (while (progn | |
765 | (setq type (car pattern)) | |
766 | (cond ((memq type '(element attribute)) | |
767 | (setq accum | |
768 | (apply function | |
769 | (cons pattern | |
770 | (cons accum args)))) | |
771 | (setq pattern (nth 2 pattern))) | |
772 | ((eq type 'ref) | |
773 | (setq pattern (nth 1 pattern)) | |
774 | (if (gethash pattern searched) | |
775 | (setq pattern nil) | |
776 | (puthash pattern t searched))) | |
777 | ((memq type '(choice group interleave)) | |
778 | (setq todo (cons (cdr pattern) todo)) | |
779 | (setq pattern nil)) | |
780 | ((memq type '(one-or-more | |
781 | zero-or-more | |
782 | optional | |
783 | mixed)) | |
784 | (setq pattern (nth 1 pattern))) | |
785 | (t (setq pattern nil))) | |
786 | (cond (pattern) | |
787 | (patterns | |
788 | (setq pattern (car patterns)) | |
789 | (setq patterns (cdr patterns)) | |
790 | t) | |
791 | (todo | |
792 | (setq patterns (car todo)) | |
793 | (setq todo (cdr todo)) | |
794 | (setq pattern (car patterns)) | |
795 | (setq patterns (cdr patterns)) | |
796 | t)))) | |
797 | accum)) | |
798 | ||
799 | (defun rng-find-element-content-pattern (pattern accum name) | |
800 | (if (and (eq (car pattern) 'element) | |
801 | (rng-search-name name (nth 1 pattern))) | |
802 | (cons (rng-compile (nth 2 pattern)) accum) | |
803 | accum)) | |
804 | ||
805 | (defun rng-search-name (name nc) | |
806 | (let ((type (car nc))) | |
807 | (cond ((eq type 'name) | |
808 | (equal (cadr nc) name)) | |
809 | ((eq type 'choice) | |
810 | (let ((choices (cdr nc)) | |
811 | (found nil)) | |
812 | (while (and choices (not found)) | |
813 | (if (rng-search-name name (car choices)) | |
814 | (setq found t) | |
815 | (setq choices (cdr choices)))) | |
816 | found)) | |
817 | (t nil)))) | |
818 | ||
819 | (defun rng-find-name-class-uris (nc accum) | |
820 | (let ((type (car nc))) | |
821 | (cond ((eq type 'name) | |
822 | (rng-accum-namespace-uri (car (nth 1 nc)) accum)) | |
823 | ((memq type '(ns-name ns-name-except)) | |
824 | (rng-accum-namespace-uri (nth 1 nc) accum)) | |
825 | ((eq type 'choice) | |
826 | (let ((choices (cdr nc))) | |
827 | (while choices | |
828 | (setq accum | |
829 | (rng-find-name-class-uris (car choices) accum)) | |
830 | (setq choices (cdr choices)))) | |
831 | accum) | |
832 | (t accum)))) | |
833 | ||
834 | (defun rng-accum-namespace-uri (ns accum) | |
835 | (if (and ns (not (memq ns accum))) | |
836 | (cons ns accum) | |
837 | accum)) | |
838 | ||
839 | ;;; Derivatives | |
840 | ||
841 | (defun rng-ipattern-text-typed-p (ipattern) | |
842 | (let ((memo (rng-ipattern-get-memo-text-typed ipattern))) | |
843 | (if (eq memo 'unknown) | |
844 | (rng-ipattern-set-memo-text-typed | |
845 | ipattern | |
846 | (rng-ipattern-compute-text-typed-p ipattern)) | |
847 | memo))) | |
848 | ||
849 | (defun rng-ipattern-compute-text-typed-p (ipattern) | |
850 | (let ((type (rng-ipattern-get-type ipattern))) | |
851 | (cond ((eq type 'choice) | |
852 | (let ((cur (rng-ipattern-get-child ipattern)) | |
853 | (ret nil)) | |
854 | (while (and cur (not ret)) | |
855 | (if (rng-ipattern-text-typed-p (car cur)) | |
856 | (setq ret t) | |
857 | (setq cur (cdr cur)))) | |
858 | ret)) | |
859 | ((eq type 'group) | |
860 | (let ((cur (rng-ipattern-get-child ipattern)) | |
861 | (ret nil) | |
862 | member) | |
863 | (while (and cur (not ret)) | |
864 | (setq member (car cur)) | |
865 | (if (rng-ipattern-text-typed-p member) | |
866 | (setq ret t)) | |
867 | (setq cur | |
868 | (and (rng-ipattern-get-nullable member) | |
869 | (cdr cur)))) | |
870 | ret)) | |
871 | ((eq type 'after) | |
872 | (rng-ipattern-text-typed-p (rng-ipattern-get-child ipattern))) | |
873 | (t (and (memq type '(value list data data-except)) t))))) | |
10545bd8 | 874 | |
8cd39fb3 MH |
875 | (defun rng-start-tag-open-deriv (ipattern nm) |
876 | (or (rng-memo-map-get | |
877 | nm | |
878 | (rng-ipattern-get-memo-map-start-tag-open-deriv ipattern)) | |
879 | (rng-ipattern-memo-start-tag-open-deriv | |
880 | ipattern | |
10545bd8 | 881 | nm |
8cd39fb3 | 882 | (rng-compute-start-tag-open-deriv ipattern nm)))) |
10545bd8 | 883 | |
8cd39fb3 MH |
884 | (defun rng-ipattern-memo-start-tag-open-deriv (ipattern nm deriv) |
885 | (or (memq ipattern rng-const-ipatterns) | |
886 | (rng-ipattern-set-memo-map-start-tag-open-deriv | |
887 | ipattern | |
888 | (rng-memo-map-add nm | |
889 | deriv | |
890 | (rng-ipattern-get-memo-map-start-tag-open-deriv | |
891 | ipattern)))) | |
892 | deriv) | |
893 | ||
894 | (defun rng-compute-start-tag-open-deriv (ipattern nm) | |
895 | (let ((type (rng-ipattern-get-type ipattern))) | |
896 | (cond ((eq type 'choice) | |
897 | (rng-transform-choice `(lambda (p) | |
898 | (rng-start-tag-open-deriv p ',nm)) | |
899 | ipattern)) | |
900 | ((eq type 'element) | |
901 | (if (rng-name-class-contains | |
902 | (rng-ipattern-get-name-class ipattern) | |
903 | nm) | |
904 | (rng-intern-after (rng-element-get-child ipattern) | |
905 | rng-empty-ipattern) | |
906 | rng-not-allowed-ipattern)) | |
907 | ((eq type 'group) | |
908 | (rng-transform-group-nullable | |
909 | `(lambda (p) (rng-start-tag-open-deriv p ',nm)) | |
10545bd8 | 910 | 'rng-cons-group-after |
8cd39fb3 MH |
911 | ipattern)) |
912 | ((eq type 'interleave) | |
913 | (rng-transform-interleave-single | |
914 | `(lambda (p) (rng-start-tag-open-deriv p ',nm)) | |
915 | 'rng-subst-interleave-after | |
916 | ipattern)) | |
917 | ((eq type 'one-or-more) | |
918 | (rng-apply-after | |
919 | `(lambda (p) | |
920 | (rng-intern-group (list p ,(rng-intern-optional ipattern)))) | |
921 | (rng-start-tag-open-deriv (rng-ipattern-get-child ipattern) | |
922 | nm))) | |
923 | ((eq type 'after) | |
924 | (rng-apply-after | |
925 | `(lambda (p) | |
926 | (rng-intern-after p | |
927 | ,(rng-ipattern-get-after ipattern))) | |
928 | (rng-start-tag-open-deriv (rng-ipattern-get-child ipattern) | |
929 | nm))) | |
930 | (t rng-not-allowed-ipattern)))) | |
931 | ||
932 | (defun rng-start-attribute-deriv (ipattern nm) | |
933 | (or (rng-memo-map-get | |
934 | nm | |
935 | (rng-ipattern-get-memo-map-start-attribute-deriv ipattern)) | |
936 | (rng-ipattern-memo-start-attribute-deriv | |
937 | ipattern | |
10545bd8 | 938 | nm |
8cd39fb3 | 939 | (rng-compute-start-attribute-deriv ipattern nm)))) |
10545bd8 | 940 | |
8cd39fb3 MH |
941 | (defun rng-ipattern-memo-start-attribute-deriv (ipattern nm deriv) |
942 | (or (memq ipattern rng-const-ipatterns) | |
943 | (rng-ipattern-set-memo-map-start-attribute-deriv | |
944 | ipattern | |
945 | (rng-memo-map-add | |
946 | nm | |
947 | deriv | |
948 | (rng-ipattern-get-memo-map-start-attribute-deriv ipattern)))) | |
949 | deriv) | |
950 | ||
951 | (defun rng-compute-start-attribute-deriv (ipattern nm) | |
952 | (let ((type (rng-ipattern-get-type ipattern))) | |
953 | (cond ((eq type 'choice) | |
954 | (rng-transform-choice `(lambda (p) | |
955 | (rng-start-attribute-deriv p ',nm)) | |
956 | ipattern)) | |
957 | ((eq type 'attribute) | |
958 | (if (rng-name-class-contains | |
959 | (rng-ipattern-get-name-class ipattern) | |
960 | nm) | |
961 | (rng-intern-after (rng-ipattern-get-child ipattern) | |
962 | rng-empty-ipattern) | |
963 | rng-not-allowed-ipattern)) | |
964 | ((eq type 'group) | |
965 | (rng-transform-interleave-single | |
966 | `(lambda (p) (rng-start-attribute-deriv p ',nm)) | |
10545bd8 | 967 | 'rng-subst-group-after |
8cd39fb3 MH |
968 | ipattern)) |
969 | ((eq type 'interleave) | |
970 | (rng-transform-interleave-single | |
971 | `(lambda (p) (rng-start-attribute-deriv p ',nm)) | |
972 | 'rng-subst-interleave-after | |
973 | ipattern)) | |
974 | ((eq type 'one-or-more) | |
975 | (rng-apply-after | |
976 | `(lambda (p) | |
977 | (rng-intern-group (list p ,(rng-intern-optional ipattern)))) | |
978 | (rng-start-attribute-deriv (rng-ipattern-get-child ipattern) | |
979 | nm))) | |
980 | ((eq type 'after) | |
981 | (rng-apply-after | |
982 | `(lambda (p) | |
983 | (rng-intern-after p ,(rng-ipattern-get-after ipattern))) | |
984 | (rng-start-attribute-deriv (rng-ipattern-get-child ipattern) | |
985 | nm))) | |
986 | (t rng-not-allowed-ipattern)))) | |
987 | ||
988 | (defun rng-cons-group-after (x y) | |
989 | (rng-apply-after `(lambda (p) (rng-intern-group (cons p ',y))) | |
990 | x)) | |
991 | ||
992 | (defun rng-subst-group-after (new old list) | |
993 | (rng-apply-after `(lambda (p) | |
994 | (rng-intern-group (rng-substq p ,old ',list))) | |
995 | new)) | |
996 | ||
997 | (defun rng-subst-interleave-after (new old list) | |
998 | (rng-apply-after `(lambda (p) | |
999 | (rng-intern-interleave (rng-substq p ,old ',list))) | |
1000 | new)) | |
1001 | ||
1002 | (defun rng-apply-after (f ipattern) | |
1003 | (let ((type (rng-ipattern-get-type ipattern))) | |
1004 | (cond ((eq type 'after) | |
1005 | (rng-intern-after | |
1006 | (rng-ipattern-get-child ipattern) | |
1007 | (funcall f | |
1008 | (rng-ipattern-get-after ipattern)))) | |
1009 | ((eq type 'choice) | |
1010 | (rng-transform-choice `(lambda (x) (rng-apply-after ,f x)) | |
1011 | ipattern)) | |
1012 | (t rng-not-allowed-ipattern)))) | |
1013 | ||
1014 | (defun rng-start-tag-close-deriv (ipattern) | |
1015 | (or (rng-ipattern-get-memo-start-tag-close-deriv ipattern) | |
1016 | (rng-ipattern-set-memo-start-tag-close-deriv | |
1017 | ipattern | |
1018 | (rng-compute-start-tag-close-deriv ipattern)))) | |
1019 | ||
1020 | (defconst rng-transform-map | |
1021 | '((choice . rng-transform-choice) | |
1022 | (group . rng-transform-group) | |
1023 | (interleave . rng-transform-interleave) | |
1024 | (one-or-more . rng-transform-one-or-more) | |
1025 | (after . rng-transform-after-child))) | |
1026 | ||
1027 | (defun rng-compute-start-tag-close-deriv (ipattern) | |
1028 | (let* ((type (rng-ipattern-get-type ipattern))) | |
1029 | (if (eq type 'attribute) | |
1030 | rng-not-allowed-ipattern | |
1031 | (let ((transform (assq type rng-transform-map))) | |
1032 | (if transform | |
1033 | (funcall (cdr transform) | |
1034 | 'rng-start-tag-close-deriv | |
1035 | ipattern) | |
1036 | ipattern))))) | |
1037 | ||
1038 | (defun rng-ignore-attributes-deriv (ipattern) | |
1039 | (let* ((type (rng-ipattern-get-type ipattern))) | |
1040 | (if (eq type 'attribute) | |
1041 | rng-empty-ipattern | |
1042 | (let ((transform (assq type rng-transform-map))) | |
1043 | (if transform | |
1044 | (funcall (cdr transform) | |
1045 | 'rng-ignore-attributes-deriv | |
1046 | ipattern) | |
1047 | ipattern))))) | |
10545bd8 | 1048 | |
8cd39fb3 MH |
1049 | (defun rng-text-only-deriv (ipattern) |
1050 | (or (rng-ipattern-get-memo-text-only-deriv ipattern) | |
1051 | (rng-ipattern-set-memo-text-only-deriv | |
1052 | ipattern | |
1053 | (rng-compute-text-only-deriv ipattern)))) | |
1054 | ||
1055 | (defun rng-compute-text-only-deriv (ipattern) | |
1056 | (let* ((type (rng-ipattern-get-type ipattern))) | |
1057 | (if (eq type 'element) | |
1058 | rng-not-allowed-ipattern | |
1059 | (let ((transform (assq type | |
1060 | '((choice . rng-transform-choice) | |
1061 | (group . rng-transform-group) | |
1062 | (interleave . rng-transform-interleave) | |
1063 | (one-or-more . rng-transform-one-or-more) | |
1064 | (after . rng-transform-after-child))))) | |
1065 | (if transform | |
1066 | (funcall (cdr transform) | |
1067 | 'rng-text-only-deriv | |
1068 | ipattern) | |
1069 | ipattern))))) | |
1070 | ||
1071 | (defun rng-mixed-text-deriv (ipattern) | |
1072 | (or (rng-ipattern-get-memo-mixed-text-deriv ipattern) | |
1073 | (rng-ipattern-set-memo-mixed-text-deriv | |
1074 | ipattern | |
1075 | (rng-compute-mixed-text-deriv ipattern)))) | |
1076 | ||
1077 | (defun rng-compute-mixed-text-deriv (ipattern) | |
1078 | (let ((type (rng-ipattern-get-type ipattern))) | |
1079 | (cond ((eq type 'text) ipattern) | |
1080 | ((eq type 'after) | |
1081 | (rng-transform-after-child 'rng-mixed-text-deriv | |
1082 | ipattern)) | |
1083 | ((eq type 'choice) | |
1084 | (rng-transform-choice 'rng-mixed-text-deriv | |
1085 | ipattern)) | |
1086 | ((eq type 'one-or-more) | |
1087 | (rng-intern-group | |
1088 | (list (rng-mixed-text-deriv | |
1089 | (rng-ipattern-get-child ipattern)) | |
1090 | (rng-intern-optional ipattern)))) | |
1091 | ((eq type 'group) | |
1092 | (rng-transform-group-nullable | |
1093 | 'rng-mixed-text-deriv | |
1094 | (lambda (x y) (rng-intern-group (cons x y))) | |
1095 | ipattern)) | |
1096 | ((eq type 'interleave) | |
1097 | (rng-transform-interleave-single | |
1098 | 'rng-mixed-text-deriv | |
1099 | (lambda (new old list) (rng-intern-interleave | |
1100 | (rng-substq new old list))) | |
1101 | ipattern)) | |
1102 | ((and (eq type 'data) | |
1103 | (not (rng-ipattern-get-memo-text-typed ipattern))) | |
1104 | ipattern) | |
1105 | (t rng-not-allowed-ipattern)))) | |
1106 | ||
1107 | (defun rng-end-tag-deriv (ipattern) | |
1108 | (or (rng-ipattern-get-memo-end-tag-deriv ipattern) | |
1109 | (rng-ipattern-set-memo-end-tag-deriv | |
1110 | ipattern | |
1111 | (rng-compute-end-tag-deriv ipattern)))) | |
1112 | ||
1113 | (defun rng-compute-end-tag-deriv (ipattern) | |
1114 | (let ((type (rng-ipattern-get-type ipattern))) | |
1115 | (cond ((eq type 'choice) | |
1116 | (rng-intern-choice | |
1117 | (mapcar 'rng-end-tag-deriv | |
1118 | (rng-ipattern-get-child ipattern)))) | |
1119 | ((eq type 'after) | |
1120 | (if (rng-ipattern-get-nullable | |
1121 | (rng-ipattern-get-child ipattern)) | |
1122 | (rng-ipattern-get-after ipattern) | |
1123 | rng-not-allowed-ipattern)) | |
1124 | (t rng-not-allowed-ipattern)))) | |
1125 | ||
1126 | (defun rng-data-deriv (ipattern value) | |
1127 | (or (rng-memo-map-get value | |
1128 | (rng-ipattern-get-memo-map-data-deriv ipattern)) | |
1129 | (and (rng-memo-map-get | |
1130 | (cons value (rng-namespace-context-get-no-trace)) | |
1131 | (rng-ipattern-get-memo-map-data-deriv ipattern)) | |
1132 | (rng-memo-map-get | |
1133 | (cons value (apply (car rng-dt-namespace-context-getter) | |
1134 | (cdr rng-dt-namespace-context-getter))) | |
1135 | (rng-ipattern-get-memo-map-data-deriv ipattern))) | |
1136 | (let* ((used-context (vector nil)) | |
1137 | (rng-dt-namespace-context-getter | |
1138 | (cons 'rng-namespace-context-tracer | |
1139 | (cons used-context | |
1140 | rng-dt-namespace-context-getter))) | |
1141 | (deriv (rng-compute-data-deriv ipattern value))) | |
1142 | (rng-ipattern-memo-data-deriv ipattern | |
1143 | value | |
1144 | (aref used-context 0) | |
1145 | deriv)))) | |
1146 | ||
1147 | (defun rng-namespace-context-tracer (used getter &rest args) | |
1148 | (let ((context (apply getter args))) | |
1149 | (aset used 0 context) | |
1150 | context)) | |
1151 | ||
1152 | (defun rng-namespace-context-get-no-trace () | |
1153 | (let ((tem rng-dt-namespace-context-getter)) | |
1154 | (while (and tem (eq (car tem) 'rng-namespace-context-tracer)) | |
1155 | (setq tem (cddr tem))) | |
1156 | (apply (car tem) (cdr tem)))) | |
1157 | ||
1158 | (defconst rng-memo-data-deriv-max-length 80 | |
1159 | "Don't memoize data-derivs for values longer than this.") | |
1160 | ||
1161 | (defun rng-ipattern-memo-data-deriv (ipattern value context deriv) | |
1162 | (or (memq ipattern rng-const-ipatterns) | |
1163 | (> (length value) rng-memo-data-deriv-max-length) | |
1164 | (rng-ipattern-set-memo-map-data-deriv | |
1165 | ipattern | |
1166 | (rng-memo-map-add (if context (cons value context) value) | |
1167 | deriv | |
1168 | (rng-ipattern-get-memo-map-data-deriv ipattern) | |
1169 | t))) | |
1170 | deriv) | |
1171 | ||
1172 | (defun rng-compute-data-deriv (ipattern value) | |
1173 | (let ((type (rng-ipattern-get-type ipattern))) | |
1174 | (cond ((eq type 'text) ipattern) | |
1175 | ((eq type 'choice) | |
1176 | (rng-transform-choice `(lambda (p) (rng-data-deriv p ,value)) | |
1177 | ipattern)) | |
1178 | ((eq type 'group) | |
1179 | (rng-transform-group-nullable | |
1180 | `(lambda (p) (rng-data-deriv p ,value)) | |
1181 | (lambda (x y) (rng-intern-group (cons x y))) | |
1182 | ipattern)) | |
1183 | ((eq type 'one-or-more) | |
1184 | (rng-intern-group (list (rng-data-deriv | |
1185 | (rng-ipattern-get-child ipattern) | |
1186 | value) | |
1187 | (rng-intern-optional ipattern)))) | |
1188 | ((eq type 'after) | |
1189 | (let ((child (rng-ipattern-get-child ipattern))) | |
1190 | (if (or (rng-ipattern-get-nullable | |
1191 | (rng-data-deriv child value)) | |
1192 | (and (rng-ipattern-get-nullable child) | |
1193 | (rng-blank-p value))) | |
1194 | (rng-ipattern-get-after ipattern) | |
1195 | rng-not-allowed-ipattern))) | |
1196 | ((eq type 'data) | |
1197 | (if (rng-dt-make-value (rng-ipattern-get-datatype ipattern) | |
1198 | value) | |
1199 | rng-empty-ipattern | |
1200 | rng-not-allowed-ipattern)) | |
1201 | ((eq type 'data-except) | |
1202 | (if (and (rng-dt-make-value (rng-ipattern-get-datatype ipattern) | |
1203 | value) | |
1204 | (not (rng-ipattern-get-nullable | |
1205 | (rng-data-deriv | |
1206 | (rng-ipattern-get-child ipattern) | |
1207 | value)))) | |
1208 | rng-empty-ipattern | |
1209 | rng-not-allowed-ipattern)) | |
1210 | ((eq type 'value) | |
1211 | (if (equal (rng-dt-make-value (rng-ipattern-get-datatype ipattern) | |
1212 | value) | |
1213 | (rng-ipattern-get-value-object ipattern)) | |
1214 | rng-empty-ipattern | |
1215 | rng-not-allowed-ipattern)) | |
1216 | ((eq type 'list) | |
1217 | (let ((tokens (split-string value)) | |
1218 | (state (rng-ipattern-get-child ipattern))) | |
1219 | (while (and tokens | |
1220 | (not (eq state rng-not-allowed-ipattern))) | |
1221 | (setq state (rng-data-deriv state (car tokens))) | |
1222 | (setq tokens (cdr tokens))) | |
1223 | (if (rng-ipattern-get-nullable state) | |
1224 | rng-empty-ipattern | |
1225 | rng-not-allowed-ipattern))) | |
1226 | ;; don't think interleave can occur | |
1227 | ;; since we do text-only-deriv first | |
1228 | (t rng-not-allowed-ipattern)))) | |
1229 | ||
1230 | (defun rng-transform-multi (f ipattern interner) | |
1231 | (let* ((members (rng-ipattern-get-child ipattern)) | |
1232 | (transformed (mapcar f members))) | |
1233 | (if (rng-members-eq members transformed) | |
1234 | ipattern | |
1235 | (funcall interner transformed)))) | |
1236 | ||
1237 | (defun rng-transform-choice (f ipattern) | |
1238 | (rng-transform-multi f ipattern 'rng-intern-choice)) | |
1239 | ||
1240 | (defun rng-transform-group (f ipattern) | |
1241 | (rng-transform-multi f ipattern 'rng-intern-group)) | |
1242 | ||
1243 | (defun rng-transform-interleave (f ipattern) | |
1244 | (rng-transform-multi f ipattern 'rng-intern-interleave)) | |
1245 | ||
1246 | (defun rng-transform-one-or-more (f ipattern) | |
1247 | (let* ((child (rng-ipattern-get-child ipattern)) | |
1248 | (transformed (funcall f child))) | |
1249 | (if (eq child transformed) | |
1250 | ipattern | |
1251 | (rng-intern-one-or-more transformed)))) | |
1252 | ||
1253 | (defun rng-transform-after-child (f ipattern) | |
1254 | (let* ((child (rng-ipattern-get-child ipattern)) | |
1255 | (transformed (funcall f child))) | |
1256 | (if (eq child transformed) | |
1257 | ipattern | |
1258 | (rng-intern-after transformed | |
1259 | (rng-ipattern-get-after ipattern))))) | |
1260 | ||
1261 | (defun rng-transform-interleave-single (f subster ipattern) | |
1262 | (let ((children (rng-ipattern-get-child ipattern)) | |
1263 | found) | |
1264 | (while (and children (not found)) | |
1265 | (let* ((child (car children)) | |
1266 | (transformed (funcall f child))) | |
1267 | (if (eq transformed rng-not-allowed-ipattern) | |
1268 | (setq children (cdr children)) | |
1269 | (setq found | |
1270 | (funcall subster | |
1271 | transformed | |
1272 | child | |
1273 | (rng-ipattern-get-child ipattern)))))) | |
1274 | (or found | |
1275 | rng-not-allowed-ipattern))) | |
1276 | ||
1277 | (defun rng-transform-group-nullable (f conser ipattern) | |
1278 | "Given a group x1,...,xn,y1,...,yn where the xs are all | |
1279 | nullable and y1 isn't, return a choice | |
1280 | (conser f(x1) x2,...,xm,y1,...,yn) | |
1281 | |(conser f(x2) x3,...,xm,y1,...,yn) | |
1282 | |... | |
1283 | |(conser f(xm) y1,...,yn) | |
1284 | |(conser f(y1) y2,...,yn)" | |
1285 | (rng-intern-choice | |
1286 | (rng-transform-group-nullable-gen-choices | |
1287 | f | |
1288 | conser | |
1289 | (rng-ipattern-get-child ipattern)))) | |
1290 | ||
1291 | (defun rng-transform-group-nullable-gen-choices (f conser members) | |
1292 | (let ((head (car members)) | |
1293 | (tail (cdr members))) | |
1294 | (if tail | |
1295 | (cons (funcall conser (funcall f head) tail) | |
1296 | (if (rng-ipattern-get-nullable head) | |
1297 | (rng-transform-group-nullable-gen-choices f conser tail) | |
1298 | nil)) | |
1299 | (list (funcall f head))))) | |
1300 | ||
1301 | (defun rng-members-eq (list1 list2) | |
1302 | (while (and list1 | |
1303 | list2 | |
1304 | (eq (car list1) (car list2))) | |
1305 | (setq list1 (cdr list1)) | |
1306 | (setq list2 (cdr list2))) | |
1307 | (and (null list1) (null list2))) | |
10545bd8 | 1308 | |
8cd39fb3 MH |
1309 | |
1310 | (defun rng-ipattern-after (ipattern) | |
1311 | (let ((type (rng-ipattern-get-type ipattern))) | |
1312 | (cond ((eq type 'choice) | |
1313 | (rng-transform-choice 'rng-ipattern-after ipattern)) | |
1314 | ((eq type 'after) | |
1315 | (rng-ipattern-get-after ipattern)) | |
1316 | ((eq type 'not-allowed) | |
1317 | ipattern) | |
1318 | (t (error "Internal error in rng-ipattern-after: unexpected type %s" type))))) | |
1319 | ||
1320 | (defun rng-unknown-start-tag-open-deriv (ipattern) | |
1321 | (rng-intern-after (rng-compile rng-any-content) ipattern)) | |
1322 | ||
1323 | (defun rng-ipattern-optionalize-elements (ipattern) | |
1324 | (let* ((type (rng-ipattern-get-type ipattern)) | |
1325 | (transform (assq type rng-transform-map))) | |
1326 | (cond (transform | |
1327 | (funcall (cdr transform) | |
1328 | 'rng-ipattern-optionalize-elements | |
1329 | ipattern)) | |
1330 | ((eq type 'element) | |
1331 | (rng-intern-optional ipattern)) | |
1332 | (t ipattern)))) | |
1333 | ||
1334 | (defun rng-ipattern-empty-before-p (ipattern) | |
1335 | (let ((type (rng-ipattern-get-type ipattern))) | |
1336 | (cond ((eq type 'after) | |
1337 | (eq (rng-ipattern-get-child ipattern) rng-empty-ipattern)) | |
1338 | ((eq type 'choice) | |
1339 | (let ((members (rng-ipattern-get-child ipattern)) | |
1340 | (ret t)) | |
1341 | (while (and members ret) | |
1342 | (or (rng-ipattern-empty-before-p (car members)) | |
1343 | (setq ret nil)) | |
1344 | (setq members (cdr members))) | |
1345 | ret)) | |
1346 | (t nil)))) | |
1347 | ||
1348 | (defun rng-ipattern-possible-start-tags (ipattern accum) | |
1349 | (let ((type (rng-ipattern-get-type ipattern))) | |
1350 | (cond ((eq type 'after) | |
1351 | (rng-ipattern-possible-start-tags | |
1352 | (rng-ipattern-get-child ipattern) | |
1353 | accum)) | |
1354 | ((memq type '(choice interleave)) | |
1355 | (let ((members (rng-ipattern-get-child ipattern))) | |
1356 | (while members | |
1357 | (setq accum | |
1358 | (rng-ipattern-possible-start-tags (car members) | |
1359 | accum)) | |
1360 | (setq members (cdr members)))) | |
1361 | accum) | |
1362 | ((eq type 'group) | |
1363 | (let ((members (rng-ipattern-get-child ipattern))) | |
1364 | (while members | |
1365 | (setq accum | |
1366 | (rng-ipattern-possible-start-tags (car members) | |
1367 | accum)) | |
1368 | (setq members | |
1369 | (and (rng-ipattern-get-nullable (car members)) | |
1370 | (cdr members))))) | |
1371 | accum) | |
1372 | ((eq type 'element) | |
1373 | (if (eq (rng-element-get-child ipattern) rng-not-allowed-ipattern) | |
1374 | accum | |
1375 | (rng-name-class-possible-names | |
1376 | (rng-ipattern-get-name-class ipattern) | |
1377 | accum))) | |
1378 | ((eq type 'one-or-more) | |
1379 | (rng-ipattern-possible-start-tags | |
1380 | (rng-ipattern-get-child ipattern) | |
1381 | accum)) | |
1382 | (t accum)))) | |
1383 | ||
1384 | (defun rng-ipattern-start-tag-possible-p (ipattern) | |
1385 | (let ((type (rng-ipattern-get-type ipattern))) | |
1386 | (cond ((memq type '(after one-or-more)) | |
1387 | (rng-ipattern-start-tag-possible-p | |
1388 | (rng-ipattern-get-child ipattern))) | |
1389 | ((memq type '(choice interleave)) | |
1390 | (let ((members (rng-ipattern-get-child ipattern)) | |
1391 | (possible nil)) | |
1392 | (while (and members (not possible)) | |
1393 | (setq possible | |
1394 | (rng-ipattern-start-tag-possible-p (car members))) | |
1395 | (setq members (cdr members))) | |
1396 | possible)) | |
1397 | ((eq type 'group) | |
1398 | (let ((members (rng-ipattern-get-child ipattern)) | |
1399 | (possible nil)) | |
1400 | (while (and members (not possible)) | |
1401 | (setq possible | |
1402 | (rng-ipattern-start-tag-possible-p (car members))) | |
1403 | (setq members | |
1404 | (and (rng-ipattern-get-nullable (car members)) | |
1405 | (cdr members)))) | |
1406 | possible)) | |
1407 | ((eq type 'element) | |
1408 | (not (eq (rng-element-get-child ipattern) | |
1409 | rng-not-allowed-ipattern))) | |
1410 | (t nil)))) | |
1411 | ||
1412 | (defun rng-ipattern-possible-attributes (ipattern accum) | |
1413 | (let ((type (rng-ipattern-get-type ipattern))) | |
1414 | (cond ((eq type 'after) | |
1415 | (rng-ipattern-possible-attributes (rng-ipattern-get-child ipattern) | |
1416 | accum)) | |
1417 | ((memq type '(choice interleave group)) | |
1418 | (let ((members (rng-ipattern-get-child ipattern))) | |
1419 | (while members | |
1420 | (setq accum | |
1421 | (rng-ipattern-possible-attributes (car members) | |
1422 | accum)) | |
1423 | (setq members (cdr members)))) | |
1424 | accum) | |
1425 | ((eq type 'attribute) | |
1426 | (rng-name-class-possible-names | |
1427 | (rng-ipattern-get-name-class ipattern) | |
1428 | accum)) | |
1429 | ((eq type 'one-or-more) | |
1430 | (rng-ipattern-possible-attributes | |
1431 | (rng-ipattern-get-child ipattern) | |
1432 | accum)) | |
1433 | (t accum)))) | |
1434 | ||
1435 | (defun rng-ipattern-possible-values (ipattern accum) | |
1436 | (let ((type (rng-ipattern-get-type ipattern))) | |
1437 | (cond ((eq type 'after) | |
1438 | (rng-ipattern-possible-values (rng-ipattern-get-child ipattern) | |
1439 | accum)) | |
1440 | ((eq type 'choice) | |
1441 | (let ((members (rng-ipattern-get-child ipattern))) | |
1442 | (while members | |
1443 | (setq accum | |
1444 | (rng-ipattern-possible-values (car members) | |
1445 | accum)) | |
1446 | (setq members (cdr members)))) | |
1447 | accum) | |
1448 | ((eq type 'value) | |
1449 | (let ((value-object (rng-ipattern-get-value-object ipattern))) | |
1450 | (if (stringp value-object) | |
1451 | (cons value-object accum) | |
1452 | accum))) | |
1453 | (t accum)))) | |
1454 | ||
1455 | (defun rng-ipattern-required-element (ipattern) | |
1456 | (let ((type (rng-ipattern-get-type ipattern))) | |
1457 | (cond ((memq type '(after one-or-more)) | |
1458 | (rng-ipattern-required-element (rng-ipattern-get-child ipattern))) | |
1459 | ((eq type 'choice) | |
1460 | (let* ((members (rng-ipattern-get-child ipattern)) | |
1461 | (required (rng-ipattern-required-element (car members)))) | |
1462 | (while (and required | |
1463 | (setq members (cdr members))) | |
1464 | (unless (equal required | |
1465 | (rng-ipattern-required-element (car members))) | |
1466 | (setq required nil))) | |
1467 | required)) | |
1468 | ((eq type 'group) | |
1469 | (let ((members (rng-ipattern-get-child ipattern)) | |
1470 | required) | |
1471 | (while (and (not (setq required | |
1472 | (rng-ipattern-required-element | |
1473 | (car members)))) | |
1474 | (rng-ipattern-get-nullable (car members)) | |
1475 | (setq members (cdr members)))) | |
1476 | required)) | |
1477 | ((eq type 'interleave) | |
1478 | (let ((members (rng-ipattern-get-child ipattern)) | |
1479 | required) | |
1480 | (while members | |
1481 | (let ((tem (rng-ipattern-required-element (car members)))) | |
1482 | (cond ((not tem) | |
1483 | (setq members (cdr members))) | |
1484 | ((not required) | |
1485 | (setq required tem) | |
1486 | (setq members (cdr members))) | |
1487 | ((equal required tem) | |
1488 | (setq members (cdr members))) | |
1489 | (t | |
1490 | (setq required nil) | |
1491 | (setq members nil))))) | |
1492 | required)) | |
1493 | ((eq type 'element) | |
1494 | (let ((nc (rng-ipattern-get-name-class ipattern))) | |
1495 | (and (consp nc) | |
1496 | (not (eq (rng-element-get-child ipattern) | |
1497 | rng-not-allowed-ipattern)) | |
1498 | nc)))))) | |
1499 | ||
1500 | (defun rng-ipattern-required-attributes (ipattern accum) | |
1501 | (let ((type (rng-ipattern-get-type ipattern))) | |
1502 | (cond ((eq type 'after) | |
1503 | (rng-ipattern-required-attributes (rng-ipattern-get-child ipattern) | |
1504 | accum)) | |
1505 | ((memq type '(interleave group)) | |
1506 | (let ((members (rng-ipattern-get-child ipattern))) | |
1507 | (while members | |
1508 | (setq accum | |
1509 | (rng-ipattern-required-attributes (car members) | |
1510 | accum)) | |
1511 | (setq members (cdr members)))) | |
1512 | accum) | |
1513 | ((eq type 'choice) | |
1514 | (let ((members (rng-ipattern-get-child ipattern)) | |
1515 | in-all in-this new-in-all) | |
1516 | (setq in-all | |
1517 | (rng-ipattern-required-attributes (car members) | |
1518 | nil)) | |
1519 | (while (and in-all (setq members (cdr members))) | |
1520 | (setq in-this | |
1521 | (rng-ipattern-required-attributes (car members) nil)) | |
1522 | (setq new-in-all nil) | |
1523 | (while in-this | |
1524 | (when (member (car in-this) in-all) | |
1525 | (setq new-in-all | |
1526 | (cons (car in-this) new-in-all))) | |
1527 | (setq in-this (cdr in-this))) | |
1528 | (setq in-all new-in-all)) | |
1529 | (append in-all accum))) | |
1530 | ((eq type 'attribute) | |
1531 | (let ((nc (rng-ipattern-get-name-class ipattern))) | |
1532 | (if (consp nc) | |
1533 | (cons nc accum) | |
1534 | accum))) | |
1535 | ((eq type 'one-or-more) | |
1536 | (rng-ipattern-required-attributes (rng-ipattern-get-child ipattern) | |
1537 | accum)) | |
1538 | (t accum)))) | |
1539 | ||
1540 | (defun rng-compile-error (&rest args) | |
1541 | (signal 'rng-compile-error | |
1542 | (list (apply 'format args)))) | |
1543 | ||
1544 | (put 'rng-compile-error | |
1545 | 'error-conditions | |
1546 | '(error rng-error rng-compile-error)) | |
1547 | ||
1548 | (put 'rng-compile-error | |
1549 | 'error-message | |
1550 | "Incorrect schema") | |
1551 | ||
1552 | ||
1553 | ;;; External API | |
1554 | ||
1555 | (defsubst rng-match-state () rng-match-state) | |
1556 | ||
1557 | (defsubst rng-set-match-state (state) | |
1558 | (setq rng-match-state state)) | |
10545bd8 | 1559 | |
8cd39fb3 MH |
1560 | (defsubst rng-match-state-equal (state) |
1561 | (eq state rng-match-state)) | |
1562 | ||
1563 | (defun rng-schema-changed () | |
1564 | (rng-ipattern-clear) | |
1565 | (rng-compile-clear)) | |
1566 | ||
1567 | (defun rng-match-init-buffer () | |
1568 | (make-local-variable 'rng-compile-table) | |
1569 | (make-local-variable 'rng-ipattern-table) | |
1570 | (make-local-variable 'rng-last-ipattern-index)) | |
1571 | ||
1572 | (defun rng-match-start-document () | |
1573 | (rng-ipattern-maybe-init) | |
1574 | (rng-compile-maybe-init) | |
1575 | (add-hook 'rng-schema-change-hook 'rng-schema-changed nil t) | |
1576 | (setq rng-match-state (rng-compile rng-current-schema))) | |
1577 | ||
1578 | (defun rng-match-start-tag-open (name) | |
1579 | (rng-update-match-state (rng-start-tag-open-deriv rng-match-state | |
1580 | name))) | |
1581 | ||
1582 | (defun rng-match-attribute-name (name) | |
1583 | (rng-update-match-state (rng-start-attribute-deriv rng-match-state | |
1584 | name))) | |
1585 | ||
1586 | (defun rng-match-attribute-value (value) | |
1587 | (rng-update-match-state (rng-data-deriv rng-match-state | |
1588 | value))) | |
1589 | ||
1590 | (defun rng-match-element-value (value) | |
1591 | (and (rng-update-match-state (rng-text-only-deriv rng-match-state)) | |
1592 | (rng-update-match-state (rng-data-deriv rng-match-state | |
1593 | value)))) | |
1594 | ||
1595 | (defun rng-match-start-tag-close () | |
1596 | (rng-update-match-state (rng-start-tag-close-deriv rng-match-state))) | |
1597 | ||
1598 | (defun rng-match-mixed-text () | |
1599 | (rng-update-match-state (rng-mixed-text-deriv rng-match-state))) | |
1600 | ||
1601 | (defun rng-match-end-tag () | |
1602 | (rng-update-match-state (rng-end-tag-deriv rng-match-state))) | |
1603 | ||
1604 | (defun rng-match-after () | |
1605 | (rng-update-match-state | |
1606 | (rng-ipattern-after rng-match-state))) | |
1607 | ||
1608 | (defun rng-match-out-of-context-start-tag-open (name) | |
1609 | (let* ((found (rng-map-element-attribute 'rng-find-element-content-pattern | |
1610 | rng-current-schema | |
1611 | nil | |
1612 | name)) | |
1613 | (content-pattern (if found | |
1614 | (rng-intern-choice found) | |
1615 | rng-not-allowed-ipattern))) | |
1616 | (rng-update-match-state | |
1617 | (rng-intern-after content-pattern rng-match-state)))) | |
1618 | ||
1619 | (defun rng-match-possible-namespace-uris () | |
1620 | "Return a list of all the namespace URIs used in the current schema. | |
10545bd8 | 1621 | The absent URI is not included, so the result is always a list of symbols." |
8cd39fb3 MH |
1622 | (rng-map-element-attribute (lambda (pattern accum) |
1623 | (rng-find-name-class-uris (nth 1 pattern) | |
1624 | accum)) | |
1625 | rng-current-schema | |
1626 | nil)) | |
1627 | ||
1628 | (defun rng-match-unknown-start-tag-open () | |
1629 | (rng-update-match-state | |
1630 | (rng-unknown-start-tag-open-deriv rng-match-state))) | |
1631 | ||
1632 | (defun rng-match-optionalize-elements () | |
1633 | (rng-update-match-state | |
1634 | (rng-ipattern-optionalize-elements rng-match-state))) | |
1635 | ||
1636 | (defun rng-match-ignore-attributes () | |
1637 | (rng-update-match-state | |
1638 | (rng-ignore-attributes-deriv rng-match-state))) | |
1639 | ||
1640 | (defun rng-match-text-typed-p () | |
1641 | (rng-ipattern-text-typed-p rng-match-state)) | |
1642 | ||
1643 | (defun rng-match-empty-content () | |
1644 | (if (rng-match-text-typed-p) | |
1645 | (rng-match-element-value "") | |
1646 | (rng-match-end-tag))) | |
1647 | ||
1648 | (defun rng-match-empty-before-p () | |
1649 | "Return non-nil if what can be matched before an end-tag is empty. | |
1650 | In other words, return non-nil if the pattern for what can be matched | |
1651 | for an end-tag is equivalent to empty." | |
1652 | (rng-ipattern-empty-before-p rng-match-state)) | |
1653 | ||
1654 | (defun rng-match-infer-start-tag-namespace (local-name) | |
1655 | (let ((ncs (rng-ipattern-possible-start-tags rng-match-state nil)) | |
1656 | (nc nil) | |
1657 | (ns nil)) | |
1658 | (while ncs | |
1659 | (setq nc (car ncs)) | |
1660 | (if (and (equal (cdr nc) local-name) | |
1661 | (symbolp (car nc))) | |
1662 | (cond ((not ns) | |
1663 | ;; first possible namespace | |
1664 | (setq ns (car nc)) | |
1665 | (setq ncs (cdr ncs))) | |
1666 | ((equal ns (car nc)) | |
1667 | ;; same as first namespace | |
1668 | (setq ncs (cdr ncs))) | |
1669 | (t | |
1670 | ;; more than one possible namespace | |
1671 | (setq ns nil) | |
1672 | (setq ncs nil))) | |
1673 | (setq ncs (cdr ncs)))) | |
1674 | ns)) | |
1675 | ||
1676 | (defun rng-match-nullable-p () | |
1677 | (rng-ipattern-get-nullable rng-match-state)) | |
1678 | ||
1679 | (defun rng-match-possible-start-tag-names () | |
1680 | "Return a list of possible names that would be valid for start-tags. | |
1681 | ||
1682 | Each possible name is returned as a (NAMESPACE . LOCAL-NAME) pair, | |
1683 | where NAMESPACE is a symbol or nil (meaning the absent namespace) and | |
10545bd8 | 1684 | LOCAL-NAME is a string. The returned list may contain duplicates." |
8cd39fb3 MH |
1685 | (rng-ipattern-possible-start-tags rng-match-state nil)) |
1686 | ||
1687 | ;; This is no longer used. It might be useful so leave it in for now. | |
1688 | (defun rng-match-start-tag-possible-p () | |
1689 | "Return non-nil if a start-tag is possible." | |
1690 | (rng-ipattern-start-tag-possible-p rng-match-state)) | |
1691 | ||
1692 | (defun rng-match-possible-attribute-names () | |
1693 | "Return a list of possible names that would be valid for attributes. | |
1694 | ||
1695 | See the function `rng-match-possible-start-tag-names' for | |
1696 | more information." | |
1697 | (rng-ipattern-possible-attributes rng-match-state nil)) | |
1698 | ||
1699 | (defun rng-match-possible-value-strings () | |
1700 | "Return a list of strings that would be valid as content. | |
10545bd8 | 1701 | The list may contain duplicates. Typically, the list will not |
8cd39fb3 MH |
1702 | be exhaustive." |
1703 | (rng-ipattern-possible-values rng-match-state nil)) | |
1704 | ||
1705 | (defun rng-match-required-element-name () | |
1706 | "Return the name of an element which must occur, or nil if none." | |
1707 | (rng-ipattern-required-element rng-match-state)) | |
1708 | ||
1709 | (defun rng-match-required-attribute-names () | |
1710 | "Return a list of names of attributes which must all occur." | |
1711 | (rng-ipattern-required-attributes rng-match-state nil)) | |
1712 | ||
1713 | (defmacro rng-match-save (&rest body) | |
1714 | (let ((state (make-symbol "state"))) | |
1715 | `(let ((,state rng-match-state)) | |
1716 | (unwind-protect | |
1717 | (progn ,@body) | |
1718 | (setq rng-match-state ,state))))) | |
1719 | ||
1720 | (put 'rng-match-save 'lisp-indent-function 0) | |
1721 | (def-edebug-spec rng-match-save t) | |
1722 | ||
1723 | (defmacro rng-match-with-schema (schema &rest body) | |
1724 | `(let ((rng-current-schema ,schema) | |
1725 | rng-match-state | |
1726 | rng-compile-table | |
1727 | rng-ipattern-table | |
1728 | rng-last-ipattern-index) | |
1729 | (rng-ipattern-maybe-init) | |
1730 | (rng-compile-maybe-init) | |
1731 | (setq rng-match-state (rng-compile rng-current-schema)) | |
1732 | ,@body)) | |
1733 | ||
1734 | (put 'rng-match-with-schema 'lisp-indent-function 1) | |
1735 | (def-edebug-spec rng-match-with-schema t) | |
1736 | ||
1737 | (provide 'rng-match) | |
10545bd8 | 1738 | |
ab4c34c6 | 1739 | ;; arch-tag: c8c50733-edcf-49fb-85e2-0aac8749b7f8 |
8cd39fb3 | 1740 | ;;; rng-match.el ends here |