* term/xterm.el (xterm--query): Stop after first matching handler. (Bug#14615)
[bpt/emacs.git] / lisp / progmodes / cc-langs.el
CommitLineData
c38e0c97 1;;; cc-langs.el --- language specific settings for CC Mode -*- coding: utf-8 -*-
785eecbb 2
ab422c4d 3;; Copyright (C) 1985, 1987, 1992-2013 Free Software Foundation, Inc.
785eecbb 4
e309f66c
AM
5;; Authors: 2002- Alan Mackenzie
6;; 1998- Martin Stjernholm
d9e94c22 7;; 1992-1999 Barry A. Warsaw
5858f68c
GM
8;; 1987 Dave Detlefs
9;; 1987 Stewart Clamen
785eecbb 10;; 1985 Richard M. Stallman
0ec8351b 11;; Maintainer: bug-cc-mode@gnu.org
785eecbb 12;; Created: 22-Apr-1997 (split from cc-mode.el)
bd78fa1d
CY
13;; Keywords: c languages
14;; Package: cc-mode
785eecbb
RS
15
16;; This file is part of GNU Emacs.
17
b1fc2b50 18;; GNU Emacs is free software: you can redistribute it and/or modify
785eecbb 19;; it under the terms of the GNU General Public License as published by
b1fc2b50
GM
20;; the Free Software Foundation, either version 3 of the License, or
21;; (at your option) any later version.
785eecbb
RS
22
23;; GNU Emacs is distributed in the hope that it will be useful,
24;; but WITHOUT ANY WARRANTY; without even the implied warranty of
25;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
26;; GNU General Public License for more details.
27
28;; You should have received a copy of the GNU General Public License
b1fc2b50 29;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>.
785eecbb 30
3afbc435
PJ
31;;; Commentary:
32
d9e94c22
MS
33;; HACKERS NOTE: There's heavy macro magic here. If you need to make
34;; changes in this or other files containing `c-lang-defconst' but
35;; don't want to read through the longer discussion below then read
36;; this:
37;;
38;; o A change in a `c-lang-defconst' or `c-lang-defvar' will not take
39;; effect if the file containing the mode init function (typically
40;; cc-mode.el) is byte compiled.
41;; o To make changes show in font locking you need to reevaluate the
42;; `*-font-lock-keywords-*' constants, which normally is easiest to
43;; do with M-x eval-buffer in cc-fonts.el.
44;; o In either case it's necessary to reinitialize the mode to make
45;; the changes show in an existing buffer.
46
47;;; Introduction to the language dependent variable system:
48;;
49;; This file contains all the language dependent variables, except
50;; those specific for font locking which reside in cc-fonts.el. As
51;; far as possible, all the differences between the languages that CC
52;; Mode supports are described with these variables only, so that the
53;; code can be shared.
54;;
55;; The language constant system (see cc-defs.el) is used to specify
56;; various language dependent info at a high level, such as lists of
57;; keywords, and then from them generate - at compile time - the
58;; various regexps and other low-level structures actually employed in
59;; the code at runtime.
60;;
61;; This system is also designed to make it easy for developers of
62;; derived modes to customize the source constants for new language
63;; variants, without having to keep up with the exact regexps etc that
64;; are used in each CC Mode version. It's possible from an external
65;; package to add a new language by inheriting an existing one, and
66;; then change specific constants as necessary for the new language.
67;; The old values for those constants (and the values of all the other
68;; high-level constants) may be used to build the new ones, and those
69;; new values will in turn be used by the low-level definitions here
70;; to build the runtime constants appropriately for the new language
71;; in the current version of CC Mode.
72;;
73;; Like elsewhere in CC Mode, the existence of a doc string signifies
74;; that a language constant is part of the external API, and that it
75;; therefore can be used with a high confidence that it will continue
76;; to work with future versions of CC Mode. Even so, it's not
77;; unlikely that such constants will change meaning slightly as this
78;; system is refined further; a certain degree of dependence on the CC
79;; Mode version is unavoidable when hooking in at this level. Also
80;; note that there's still work to be done to actually use these
81;; constants everywhere inside CC Mode; there are still hardcoded
82;; values in many places in the code.
83;;
84;; Separate packages will also benefit from the compile time
85;; evaluation; the byte compiled file(s) for them will contain the
86;; compiled runtime constants ready for use by (the byte compiled) CC
87;; Mode, and the source definitions in this file don't have to be
88;; loaded then. However, if a byte compiled package is loaded that
89;; has been compiled with a different version of CC Mode than the one
90;; currently loaded, then the compiled-in values will be discarded and
91;; new ones will be built when the mode is initialized. That will
92;; automatically trigger a load of the file(s) containing the source
93;; definitions (i.e. this file and/or cc-fonts.el) if necessary.
94;;
95;; A small example of a derived mode is available at
96;; <http://cc-mode.sourceforge.net/derived-mode-ex.el>. It also
97;; contains some useful hints for derived mode developers.
98
99;;; Using language variables:
100;;
101;; The `c-lang-defvar' forms in this file comprise the language
102;; variables that CC Mode uses. It does not work to use
103;; `c-lang-defvar' anywhere else (which isn't much of a limitation
104;; since these variables' sole purpose is to interface with the CC Mode
105;; core functions). The values in these `c-lang-defvar's are not
106;; evaluated right away but instead collected to a single large `setq'
107;; that can be inserted for a particular language with the
108;; `c-init-language-vars' macro.
109
110;; This file is only required at compile time, or when not running
111;; from byte compiled files, or when the source definitions for the
112;; language constants are requested.
113
3afbc435
PJ
114;;; Code:
115
66d279a7
GM
116;; For Emacs < 22.2.
117(eval-and-compile
118 (unless (fboundp 'declare-function) (defmacro declare-function (&rest r))))
119
51f606de
GM
120(eval-when-compile
121 (let ((load-path
130c507e
GM
122 (if (and (boundp 'byte-compile-dest-file)
123 (stringp byte-compile-dest-file))
124 (cons (file-name-directory byte-compile-dest-file) load-path)
51f606de 125 load-path)))
d9e94c22 126 (load "cc-bytecomp" nil t)))
51f606de 127
130c507e
GM
128(cc-require 'cc-defs)
129(cc-require 'cc-vars)
a6739a05 130
0386b551 131
9a737a1f
MS
132;; This file is not always loaded. See note above.
133(cc-external-require 'cl)
134
785eecbb 135\f
d9e94c22 136;;; Setup for the `c-lang-defvar' system.
a66cd3ee
MS
137
138(eval-and-compile
d9e94c22 139 ;; These are used to collect the init forms from the subsequent
26b8f810
AM
140 ;; `c-lang-defvar' and `c-lang-setvar'. They are used to build the
141 ;; lambda in `c-make-init-lang-vars-fun' below, and to build `defvar's
142 ;; and `make-variable-buffer-local's in cc-engine and
143 ;; `make-local-variable's in `c-init-language-vars-for'.
2eb455ab
MS
144 (defvar c-lang-variable-inits nil)
145 (defvar c-lang-variable-inits-tail nil)
146 (setq c-lang-variable-inits (list nil)
26b8f810
AM
147 c-lang-variable-inits-tail c-lang-variable-inits)
148 (defvar c-emacs-variable-inits nil)
149 (defvar c-emacs-variable-inits-tail nil)
150 (setq c-emacs-variable-inits (list nil)
151 c-emacs-variable-inits-tail c-emacs-variable-inits))
d9e94c22
MS
152
(defmacro c-lang-defvar (var val &optional doc)
  "Register the buffer local language variable VAR with the init form VAL.
Nothing is evaluated when this macro is expanded; VAR, VAL and DOC are
only recorded in `c-lang-variable-inits'.  VAL is evaluated and bound to
VAR at mode initialization, more precisely when the result from the
macro `c-init-language-vars' is evaluated.

`c-lang-const' is typically used in VAL to get the right value for the
language being initialized, and such calls will be macro expanded to
the evaluated constant value at compile time.

If DOC is omitted and VAL is a plain (c-lang-const VAR) form, the
documentation is taken from the language constant with the same name.
A DOC that isn't a string is discarded.

The expansion is the quoted symbol VAR."

  ;; Special case: with no docstring and a value of the simple form
  ;; (c-lang-const foo), where foo is the same name as VAR, borrow the
  ;; docstring from the language constant foo.
  (if (and (null doc)
           (eq (car-safe val) 'c-lang-const)
           (eq (nth 1 val) var)
           (null (nth 2 val)))
      (setq doc (get (intern (symbol-name var) c-lang-constants)
                     'variable-documentation)))
  ;; Anything that isn't a string (e.g. a marker symbol passed in the
  ;; DOC position) counts as "no documentation".
  (unless (stringp doc)
    (setq doc nil))

  (let ((known (assq var (cdr c-lang-variable-inits)))
        (payload (list val doc)))
    (if known
        ;; Redefinition: overwrite the recorded value and docstring in
        ;; place so the entry keeps its position in the list.
        (setcdr known payload)
      ;; First definition: append a new (VAR VAL DOC) entry and advance
      ;; the tail pointer to the cell that was just added.
      (let ((cell (list (cons var payload))))
        (setcdr c-lang-variable-inits-tail cell)
        (setq c-lang-variable-inits-tail cell))))

  ;; Return the symbol, like the other def* forms.
  `',var)
183
26b8f810
AM
(defmacro c-lang-setvar (var val)
  "Register VAR to be made buffer local and set to VAL at mode init.
Nothing is evaluated when this macro is expanded; VAR and VAL are only
recorded in `c-emacs-variable-inits'.  VAL is evaluated and bound to
VAR when the result from the macro `c-init-language-vars' is
evaluated.  VAR is typically a standard Emacs variable like
`comment-start'.

`c-lang-const' is typically used in VAL to get the right value for the
language being initialized, and such calls will be macro expanded to
the evaluated constant value at compile time.

The expansion is the quoted symbol VAR."
  (let ((known (assq var (cdr c-emacs-variable-inits)))
        ;; The value is kept wrapped in a one element list.  (Original
        ;; note: maybe remove "list", sometime.  2006-07-19)
        (payload (list val)))
    (if known
        ;; Redefinition: replace the recorded value in place.
        (setcdr known payload)
      ;; First definition: append a new (VAR VAL) entry and advance the
      ;; tail pointer to the cell that was just added.
      (let ((cell (list (cons var payload))))
        (setcdr c-emacs-variable-inits-tail cell)
        (setq c-emacs-variable-inits-tail cell))))

  ;; Return the symbol, like the other def* forms.
  `',var)
202
d9e94c22 203(put 'c-lang-defvar 'lisp-indent-function 'defun)
3c0ab532
AM
204; (eval-after-load "edebug" ; 2006-07-09: def-edebug-spec is now in subr.el.
205; '
206(def-edebug-spec c-lang-defvar
207 (&define name def-form &optional stringp)) ;)
c55676a1 208
66d279a7
GM
209;; Suppress "might not be defined at runtime" warning.
210;; This file is only used when compiling other cc files.
6a2e6868
GM
211;; These are defined in cl as aliases to the cl- versions.
212(declare-function delete-duplicates "cl-seq" (cl-seq &rest cl-keys) t)
213(declare-function mapcan "cl-extra" (cl-func cl-seq &rest cl-rest) t)
214(declare-function cl-macroexpand-all "cl" (form &optional env))
66d279a7 215
(eval-and-compile
  ;; Some helper functions used when building the language constants.

  (defun c-filter-ops (ops opgroup-filter op-filter &optional xlate)
    ;; Extract a subset of the operators in the list OPS in a DWIM:ey
    ;; way.  The return value is a plain list of operators.
    ;;
    ;; OPS either has the structure of `c-operators', is a single
    ;; group in `c-operators', or is a plain list of operators.
    ;;
    ;; OPGROUP-FILTER specifies how to select the operator groups.  It
    ;; can be t to choose all groups, a list of group type symbols
    ;; (such as 'prefix) to accept, or a function which will be called
    ;; with the group symbol for each group and should return non-nil
    ;; if that group is to be included.
    ;;
    ;; OP-FILTER selects the individual operators within the accepted
    ;; groups.  It can be t to choose all operators, a regexp string
    ;; that is matched against each operator with `string-match', or
    ;; a function which is called with each operator and should
    ;; return non-nil for those to include.
    ;;
    ;; If XLATE is given, it's a function which is called for each
    ;; matching operator and its return value is collected instead.
    ;; If it returns a list, the elements are spliced directly into
    ;; the final result, which is returned as a list with duplicates
    ;; removed using `equal'.
    ;;
    ;; `c-mode-syntax-table' for the current mode is in effect during
    ;; the whole procedure.

    ;; Normalize OPS to a list of groups.
    (or (listp (car-safe ops))
        (setq ops (list ops)))

    ;; Normalize both filters to predicates.  The lambdas are built
    ;; with backquote so that the filter data is embedded in them.
    (if (eq opgroup-filter t)
        (setq opgroup-filter (lambda (opgroup) t))
      (or (functionp opgroup-filter)
          (setq opgroup-filter `(lambda (opgroup)
                                  (memq opgroup ',opgroup-filter)))))
    (if (eq op-filter t)
        (setq op-filter (lambda (op) t))
      (if (stringp op-filter)
          (setq op-filter `(lambda (op)
                             (string-match ,op-filter op)))))
    (or xlate
        (setq xlate 'identity))

    (c-with-syntax-table (c-lang-const c-mode-syntax-table)
      (delete-duplicates
       (mapcan (lambda (opgroup)
                 ;; A group headed by a symbol is a typed group: it is
                 ;; subject to OPGROUP-FILTER and the type symbol is
                 ;; stripped off before the operators are visited.  A
                 ;; group without a leading symbol is always accepted.
                 (when (or (not (symbolp (car opgroup)))
                           (and (funcall opgroup-filter (car opgroup))
                                (progn (setq opgroup (cdr opgroup))
                                       t)))
                   (mapcan (lambda (op)
                             (when (funcall op-filter op)
                               (let ((res (funcall xlate op)))
                                 ;; Lists are spliced, atoms wrapped.
                                 (if (listp res) res (list res)))))
                           opgroup)))
               ops)
       :test 'equal))))
269
51f606de 270\f
d9e94c22
MS
271;;; Various mode specific values that aren't language related.
272
273(c-lang-defconst c-mode-menu
274 ;; The definition for the mode menu. The menu title is prepended to
275 ;; this before it's fed to `easy-menu-define'.
276 t `(["Comment Out Region" comment-region
277 (c-fn-region-is-active-p)]
278 ["Uncomment Region" (comment-region (region-beginning)
279 (region-end) '(4))
280 (c-fn-region-is-active-p)]
281 ["Indent Expression" c-indent-exp
282 (memq (char-after) '(?\( ?\[ ?\{))]
283 ["Indent Line or Region" c-indent-line-or-region t]
284 ["Fill Comment Paragraph" c-fill-paragraph t]
285 "----"
286 ["Backward Statement" c-beginning-of-statement t]
287 ["Forward Statement" c-end-of-statement t]
288 ,@(when (c-lang-const c-opt-cpp-prefix)
289 ;; Only applicable if there's a cpp preprocessor.
290 `(["Up Conditional" c-up-conditional t]
291 ["Backward Conditional" c-backward-conditional t]
292 ["Forward Conditional" c-forward-conditional t]
293 "----"
294 ["Macro Expand Region" c-macro-expand
295 (c-fn-region-is-active-p)]
296 ["Backslashify" c-backslash-region
297 (c-fn-region-is-active-p)]))
298 "----"
b14c0c55
AM
299 ("Style..."
300 ["Set Style..." c-set-style t]
301 ["Show Current Style Name" (message
302 "Style Name: %s"
303 c-indentation-style) t]
304 ["Guess Style from this Buffer" c-guess-buffer-no-install t]
305 ["Install the Last Guessed Style..." c-guess-install
306 (and c-guess-guessed-offsets-alist
307 c-guess-guessed-basic-offset) ]
308 ["View the Last Guessed Style" c-guess-view
309 (and c-guess-guessed-offsets-alist
310 c-guess-guessed-basic-offset) ])
311 "----"
d9e94c22 312 ("Toggle..."
d91362c9
NR
313 ["Syntactic indentation" c-toggle-syntactic-indentation
314 :style toggle :selected c-syntactic-indentation]
cb694ab7
AM
315 ["Electric mode" c-toggle-electric-state
316 :style toggle :selected c-electric-flag]
317 ["Auto newline" c-toggle-auto-newline
d91362c9 318 :style toggle :selected c-auto-newline]
cb694ab7
AM
319 ["Hungry delete" c-toggle-hungry-state
320 :style toggle :selected c-hungry-delete-key]
653d1554
TH
321 ["Subword mode" subword-mode
322 :style toggle :selected (and (boundp 'subword-mode)
323 subword-mode)])))
a66cd3ee 324
d9e94c22
MS
325\f
326;;; Syntax tables.
327
(defun c-populate-syntax-table (table)
  "Populate the syntax table TABLE as necessary for a C-like language.
Underscore becomes a symbol constituent, backslash an escape character
and the single quote a string delimiter.  The characters + - = % < > & |
and ?\\240 get punctuation syntax.  Comment syntax is set up for both
line style \"//\" and block style \"/*\" \"*/\" comments, with newline
and carriage return given the same comment ending syntax.

An error is signaled if `c-emacs-features' contains neither `8-bit'
nor `1-bit'."

  (modify-syntax-entry ?_  "_"  table)
  (modify-syntax-entry ?\\ "\\" table)
  (modify-syntax-entry ?\' "\"" table)
  ;; Plain punctuation characters.
  (mapc (lambda (ch)
          (modify-syntax-entry ch "." table))
        '(?+ ?- ?= ?% ?< ?> ?& ?| ?\240))

  ;; Set up block and line oriented comments.  The new C standard
  ;; mandates both comment styles even in C, so since all languages
  ;; now require dual comments, we make this the default.  Only the
  ;; flags on `/' differ between the two supported feature sets.
  (let ((slash-syntax
         (cond
          ;; XEmacs
          ((memq '8-bit c-emacs-features) ". 1456")
          ;; Emacs
          ((memq '1-bit c-emacs-features) ". 124b")
          ;; incompatible
          (t (error "CC Mode is incompatible with this version of Emacs")))))
    (modify-syntax-entry ?/ slash-syntax table)
    (modify-syntax-entry ?* ". 23" table))

  (modify-syntax-entry ?\n "> b" table)
  ;; Give CR the same syntax as newline, for selective-display
  (modify-syntax-entry ?\^m "> b" table))
366
367(c-lang-defconst c-make-mode-syntax-table
368 "Functions that generates the mode specific syntax tables.
369The syntax tables aren't stored directly since they're quite large."
370 t `(lambda ()
371 (let ((table (make-syntax-table)))
372 (c-populate-syntax-table table)
373 ;; Mode specific syntaxes.
452ea855 374 ,(cond ((or (c-major-mode-is 'objc-mode) (c-major-mode-is 'java-mode))
0386b551
AM
375 ;; Let '@' be part of symbols in ObjC to cope with
376 ;; its compiler directives as single keyword tokens.
377 ;; This is then necessary since it's assumed that
378 ;; every keyword is a single symbol.
d9e94c22
MS
379 `(modify-syntax-entry ?@ "_" table))
380 ((c-major-mode-is 'pike-mode)
381 `(modify-syntax-entry ?@ "." table)))
382 table)))
383
384(c-lang-defconst c-mode-syntax-table
385 ;; The syntax tables in evaluated form. Only used temporarily when
386 ;; the constants in this file are evaluated.
387 t (funcall (c-lang-const c-make-mode-syntax-table)))
388
f75ef66d 389(c-lang-defconst c++-make-template-syntax-table
d9e94c22
MS
390 ;; A variant of `c++-mode-syntax-table' that defines `<' and `>' as
391 ;; parenthesis characters. Used temporarily when template argument
392 ;; lists are parsed. Note that this encourages incorrect parsing of
393 ;; templates since they might contain normal operators that uses the
394 ;; '<' and '>' characters. Therefore this syntax table might go
395 ;; away when CC Mode handles templates correctly everywhere.
396 t nil
452ea855 397 (java c++) `(lambda ()
d9e94c22
MS
398 (let ((table (funcall ,(c-lang-const c-make-mode-syntax-table))))
399 (modify-syntax-entry ?< "(>" table)
400 (modify-syntax-entry ?> ")<" table)
401 table)))
402(c-lang-defvar c++-template-syntax-table
f75ef66d
MS
403 (and (c-lang-const c++-make-template-syntax-table)
404 (funcall (c-lang-const c++-make-template-syntax-table))))
d9e94c22 405
dd969a56
AM
(c-lang-defconst c-no-parens-syntax-table
  ;; A function that builds a variant of the standard syntax table which
  ;; is used to find matching "<"s and ">"s which have been marked as
  ;; parens using syntax table properties.  The other paren characters
  ;; (e.g. "{", ")", "]") are given a non-paren syntax here, so that the
  ;; list commands will work on "< ... >" even when there are unbalanced
  ;; other parens inside them.
  ;;
  ;; The function returns nil for languages which don't have template
  ;; stuff, i.e. where `c-recognize-<>-arglists' is nil.
  ;;
  ;; Both language constants below are unquoted with "," so that their
  ;; values are embedded in the lambda when this constant is built.
  ;; Leaving the `c-recognize-<>-arglists' test as a literal
  ;; `c-lang-const' form would defer the lookup to the time the lambda
  ;; is called, i.e. mode initialization.
  t `(lambda ()
       (if ,(c-lang-const c-recognize-<>-arglists)
           (let ((table (funcall ,(c-lang-const c-make-mode-syntax-table))))
             (modify-syntax-entry ?\( "." table)
             (modify-syntax-entry ?\) "." table)
             (modify-syntax-entry ?\[ "." table)
             (modify-syntax-entry ?\] "." table)
             (modify-syntax-entry ?\{ "." table)
             (modify-syntax-entry ?\} "." table)
             table))))
424(c-lang-defvar c-no-parens-syntax-table
425 (funcall (c-lang-const c-no-parens-syntax-table)))
426
d9e94c22
MS
427(c-lang-defconst c-identifier-syntax-modifications
428 "A list that describes the modifications that should be done to the
429mode syntax table to get a syntax table that matches all identifiers
430and keywords as words.
431
432The list is just like the one used in `font-lock-defaults': Each
433element is a cons where the car is the character to modify and the cdr
434the new syntax, as accepted by `modify-syntax-entry'."
435 ;; The $ character is not allowed in most languages (one exception
436 ;; is Java which allows it for legacy reasons) but we still classify
e4769531 437 ;; it as an identifier character since it's often used in various
d9e94c22
MS
438 ;; machine generated identifiers.
439 t '((?_ . "w") (?$ . "w"))
452ea855 440 (objc java) (append '((?@ . "w"))
d9e94c22
MS
441 (c-lang-const c-identifier-syntax-modifications))
442 awk '((?_ . "w")))
443(c-lang-defvar c-identifier-syntax-modifications
444 (c-lang-const c-identifier-syntax-modifications))
445
446(c-lang-defvar c-identifier-syntax-table
447 (let ((table (copy-syntax-table (c-mode-var "mode-syntax-table")))
448 (mods c-identifier-syntax-modifications)
449 mod)
450 (while mods
451 (setq mod (car mods)
452 mods (cdr mods))
453 (modify-syntax-entry (car mod) (cdr mod) table))
454 table)
455 "Syntax table built on the mode syntax table but additionally
456classifies symbol constituents like '_' and '$' as word constituents,
457so that all identifiers are recognized as words.")
458
dd969a56
AM
459(c-lang-defconst c-get-state-before-change-functions
460 ;; For documentation see the following c-lang-defvar of the same name.
461 ;; The value here may be a list of functions or a single function.
462 t nil
56d093a9
AM
463 c++ '(c-extend-region-for-CPP
464 c-before-change-check-<>-operators
465 c-invalidate-macro-cache)
466 (c objc) '(c-extend-region-for-CPP c-invalidate-macro-cache)
dd969a56
AM
467 ;; java 'c-before-change-check-<>-operators
468 awk 'c-awk-record-region-clear-NL)
469(c-lang-defvar c-get-state-before-change-functions
470 (let ((fs (c-lang-const c-get-state-before-change-functions)))
471 (if (listp fs)
472 fs
473 (list fs)))
474 "If non-nil, a list of functions called from c-before-change-hook.
475Typically these will record enough state to allow
5ee2e988
AM
476`c-before-font-lock-function' to extend the region to fontify,
477and may do such things as removing text-properties which must be
478recalculated.
479
dd969a56
AM
480These functions will be run in the order given. Each of them
481takes 2 parameters, the BEG and END supplied to every
5ee2e988
AM
482before-change function; on entry, the buffer will have been
483widened and match-data will have been saved; point is undefined
484on both entry and exit; the return value is ignored.
485
dd969a56
AM
486The functions are called even when font locking isn't enabled.
487
488When the mode is initialized, the functions are called with
489parameters \(point-min) and \(point-max).")
490
cb5e207c
AM
491(c-lang-defconst c-before-font-lock-functions
492 ;; For documentation see the following c-lang-defvar of the same name.
493 ;; The value here may be a list of functions or a single function.
be8b11bb
AM
494 t 'c-change-set-fl-decl-start
495 (c c++ objc) '(c-neutralize-syntax-in-and-mark-CPP
496 c-change-set-fl-decl-start)
cb5e207c
AM
497 awk 'c-awk-extend-and-syntax-tablify-region)
498(c-lang-defvar c-before-font-lock-functions
499 (let ((fs (c-lang-const c-before-font-lock-functions)))
500 (if (listp fs)
501 fs
502 (list fs)))
503 "If non-nil, a list of functions called just before font locking.
504Typically they will extend the region about to be fontified \(see
5ee2e988
AM
505below) and will set `syntax-table' text properties on the region.
506
cb5e207c
AM
507These functions will be run in the order given. Each of them
508takes 3 parameters, the BEG, END, and OLD-LEN supplied to every
509after-change function; point is undefined on both entry and exit;
510on entry, the buffer will have been widened and match-data will
511have been saved; the return value is ignored.
5ee2e988 512
cb5e207c 513The functions may extend the region to be fontified by setting the
8835a0f7 514buffer local variables c-new-BEG and c-new-END.
5ee2e988 515
cb5e207c 516The functions are called even when font locking is disabled.
5ee2e988 517
cb5e207c
AM
518When the mode is initialized, these functions are called with
519parameters \(point-min), \(point-max) and <buffer size>.")
5ee2e988 520
be8b11bb
AM
(c-lang-defconst c-before-context-fontification-functions
  ;; For documentation see the following c-lang-defvar of the same name.
  ;; The value here may be a list of functions or a single function.
  ;;
  ;; The catch-all `t' entry is listed first, as in the other
  ;; `c-lang-defconst' forms in this file, with the language specific
  ;; `awk' entry after it so that AWK ends up with no functions.
  ;; NOTE(review): this relies on later assignments taking precedence
  ;; over earlier ones in `c-lang-defconst' - confirm in cc-defs.el.
  t 'c-context-set-fl-decl-start
  awk nil)
526(c-lang-defvar c-before-context-fontification-functions
527 (let ((fs (c-lang-const c-before-context-fontification-functions)))
528 (if (listp fs)
529 fs
530 (list fs)))
531 "If non-nil, a list of functions called just before context (or
532other non-change) fontification is done. Typically they will
533extend the region.
534
535These functions will be run in the order given. Each of them
536takes 2 parameters, the BEG and END of the region to be
537fontified. Point is undefined on both entry and exit. On entry,
538the buffer will have been widened and match-data will have been
539saved; the return value is a cons of the adjusted
540region, (NEW-BEG . NEW-END).")
541
d9e94c22 542\f
536610a4
AM
543;;; Syntactic analysis ("virtual semicolons") for line-oriented languages (AWK).
544(c-lang-defconst c-at-vsemi-p-fn
545 "Contains a function \"Is there a virtual semicolon at POS or point?\".
546Such a function takes one optional parameter, a buffer position (defaults to
547point), and returns nil or t. This variable contains nil for languages which
548don't have EOL terminated statements. "
549 t nil
550 (c c++ objc) 'c-at-macro-vsemi-p
551 awk 'c-awk-at-vsemi-p)
552(c-lang-defvar c-at-vsemi-p-fn (c-lang-const c-at-vsemi-p-fn))
553
554(c-lang-defconst c-vsemi-status-unknown-p-fn
555 "Contains a function \"are we unsure whether there is a virtual semicolon on this line?\".
333f9019 556The (admittedly kludgy) purpose of such a function is to prevent an infinite
536610a4
AM
557recursion in c-beginning-of-statement-1 when point starts at a `while' token.
558The function MUST NOT UNDER ANY CIRCUMSTANCES call c-beginning-of-statement-1,
559even indirectly. This variable contains nil for languages which don't have
560EOL terminated statements."
561 t nil
562 (c c++ objc) 'c-macro-vsemi-status-unknown-p
563 awk 'c-awk-vsemi-status-unknown-p)
564(c-lang-defvar c-vsemi-status-unknown-p-fn
565 (c-lang-const c-vsemi-status-unknown-p-fn))
566
567\f
d9e94c22
MS
568;;; Lexer-level syntax (identifiers, tokens etc).
569
b248a85d
AM
570(c-lang-defconst c-has-bitfields
571 "Whether the language has bitfield declarations."
572 t nil
573 (c c++ objc) t)
574(c-lang-defvar c-has-bitfields (c-lang-const c-has-bitfields))
575
d9e94c22
MS
576(c-lang-defconst c-symbol-start
577 "Regexp that matches the start of a symbol, i.e. any identifier or
452ea855 578keyword. It's unspecified how far it matches. Does not contain a \\|
d9e94c22
MS
579operator at the top level."
580 t (concat "[" c-alpha "_]")
452ea855 581 java (concat "[" c-alpha "_@]")
542dfbde 582 objc (concat "[" c-alpha "_@]")
d9e94c22
MS
583 pike (concat "[" c-alpha "_`]"))
584(c-lang-defvar c-symbol-start (c-lang-const c-symbol-start))
585
586(c-lang-defconst c-symbol-chars
587 "Set of characters that can be part of a symbol.
bf2c1571 588This is of the form that fits inside [ ] in a regexp."
d9e94c22
MS
589 ;; Pike note: With the backquote identifiers this would include most
590 ;; operator chars too, but they are handled with other means instead.
591 t (concat c-alnum "_$")
592 objc (concat c-alnum "_$@"))
b248a85d 593(c-lang-defvar c-symbol-chars (c-lang-const c-symbol-chars))
a66cd3ee 594
a66cd3ee 595(c-lang-defconst c-symbol-key
0386b551
AM
596 "Regexp matching identifiers and keywords (with submatch 0). Assumed
597to match if `c-symbol-start' matches on the same position."
d9e94c22
MS
598 t (concat (c-lang-const c-symbol-start)
599 "[" (c-lang-const c-symbol-chars) "]*")
600 pike (concat
601 ;; Use the value from C here since the operator backquote is
602 ;; covered by the other alternative.
603 (c-lang-const c-symbol-key c)
604 "\\|"
605 (c-make-keywords-re nil
606 (c-lang-const c-overloadable-operators))))
607(c-lang-defvar c-symbol-key (c-lang-const c-symbol-key))
608
609(c-lang-defconst c-symbol-key-depth
610 ;; Number of regexp grouping parens in `c-symbol-key'.
0386b551 611 t (regexp-opt-depth (c-lang-const c-symbol-key)))
d9e94c22
MS
612
613(c-lang-defconst c-nonsymbol-chars
614 "This is the set of chars that can't be part of a symbol, i.e. the
615negation of `c-symbol-chars'."
616 t (concat "^" (c-lang-const c-symbol-chars)))
617(c-lang-defvar c-nonsymbol-chars (c-lang-const c-nonsymbol-chars))
618
619(c-lang-defconst c-nonsymbol-key
620 "Regexp that matches any character that can't be part of a symbol.
621It's usually appended to other regexps to avoid matching a prefix.
622It's assumed to not contain any submatchers."
623 ;; The same thing regarding Unicode identifiers applies here as to
624 ;; `c-symbol-key'.
625 t (concat "[" (c-lang-const c-nonsymbol-chars) "]"))
626
0386b551
AM
627(c-lang-defconst c-identifier-ops
628 "The operators that make up fully qualified identifiers. nil in
629languages that don't have such things. See `c-operators' for a
630description of the format. Binary operators can concatenate symbols,
631e.g. \"::\" in \"A::B::C\". Prefix operators can precede identifiers,
632e.g. \"~\" in \"~A::B\". Other types of operators aren't supported.
633
634This value is by default merged into `c-operators'."
d9e94c22 635 t nil
0386b551
AM
636 c++ '((prefix "~" "??-" "compl")
637 (right-assoc "::")
638 (prefix "::"))
2a15eb73
MS
639 ;; Java has "." to concatenate identifiers but it's also used for
640 ;; normal indexing. There's special code in the Java font lock
641 ;; rules to fontify qualified identifiers based on the standard
642 ;; naming conventions. We still define "." here to make
643 ;; `c-forward-name' move over as long names as possible which is
644 ;; necessary to e.g. handle throws clauses correctly.
0386b551
AM
645 java '((left-assoc "."))
646 idl '((left-assoc "::")
647 (prefix "::"))
648 pike '((left-assoc "::")
649 (prefix "::")
650 (left-assoc ".")))
651
652(c-lang-defconst c-opt-identifier-concat-key
653 ;; Appendable adorned regexp matching the operators that join
654 ;; symbols to fully qualified identifiers, or nil in languages that
655 ;; don't have such things.
656 ;;
657 ;; This was a docstring constant in 5.30. It still works but is now
658 ;; considered internal - change `c-identifier-ops' instead.
659 t (let ((ops (c-filter-ops (c-lang-const c-identifier-ops)
660 '(left-assoc right-assoc)
661 t)))
662 (when ops
663 (c-make-keywords-re 'appendable ops))))
d9e94c22
MS
664(c-lang-defvar c-opt-identifier-concat-key
665 (c-lang-const c-opt-identifier-concat-key)
666 'dont-doc)
667
0386b551
AM
668(c-lang-defconst c-opt-identifier-concat-key-depth
669 ;; Number of regexp grouping parens in `c-opt-identifier-concat-key'.
670 t (regexp-opt-depth (c-lang-const c-opt-identifier-concat-key)))
671
672(c-lang-defconst c-opt-identifier-prefix-key
673 ;; Appendable adorned regexp matching operators that might precede
674 ;; an identifier and that are part of the identifier in that case.
675 ;; nil in languages without such things.
676 t (let ((ops (c-filter-ops (c-lang-const c-identifier-ops)
677 '(prefix)
678 t)))
679 (when ops
680 (c-make-keywords-re 'appendable ops))))
681
682(c-lang-defconst c-after-id-concat-ops
683 "Operators that can occur after a binary operator on `c-identifier-ops'
684in identifiers. nil in languages that don't have such things.
685
686Operators here should also have appropriate entries in `c-operators' -
687it's not taken care of by default."
688 t nil
689 ;; '~' for destructors in C++, '*' for member pointers.
690 c++ '("~" "*")
691 ;; In Java we recognize '*' to deal with "foo.bar.*" that can occur
692 ;; in import declarations. (This will also match bogus things like
693 ;; "foo.*bar" but we don't bother.)
694 java '("*"))
695
(c-lang-defconst c-opt-after-id-concat-key
  ;; Regexp that has to match the token following
  ;; `c-opt-identifier-concat-key' before that key is treated as an
  ;; identifier concatenation operator (which, among other things,
  ;; makes the preceding identifier get fontified as a reference).
  ;; Assumed to be a string whenever `c-opt-identifier-concat-key' is.
  ;;
  ;; This was a docstring constant in 5.30.  It still works, but it is
  ;; now internal; customize `c-after-id-concat-ops' instead.
  t (let ((after-ops (c-lang-const c-after-id-concat-ops)))
      (concat (c-lang-const c-symbol-start)
              (if after-ops
                  (concat "\\|"
                          (c-make-keywords-re 'appendable after-ops))
                ""))))
d9e94c22
MS
710
(c-lang-defconst c-identifier-start
  "Regexp that matches the start of an (optionally qualified) identifier.
It should also match all keywords. It's unspecified how far it
matches."
  ;; A symbol start, or alternatively one of the identifier prefix
  ;; operators when the language has any.
  t (let ((prefix-key (c-lang-const c-opt-identifier-prefix-key)))
      (concat (c-lang-const c-symbol-start)
              (if prefix-key
                  (concat "\\|" prefix-key)
                ""))))
(c-lang-defvar c-identifier-start (c-lang-const c-identifier-start))
721
(c-lang-defconst c-identifier-key
  "Regexp matching a fully qualified identifier, like \"A::B::c\" in
C++. It does not recognize the full range of syntactic whitespace
between the tokens; `c-forward-name' has to be used for that. It
should also not match identifiers containing parenthesis groupings,
e.g. identifiers with template arguments such as \"A<X,Y>\" in C++."
  ;; The regexp is deliberately more elaborate than strictly needed so
  ;; that it can be matched with a minimum of backtracking.
  t (let* ((ws* (concat (c-lang-const c-simple-ws) "*"))
           (sym (concat "\\(" (c-lang-const c-symbol-key) "\\)"))
           (prefix-key (c-lang-const c-opt-identifier-prefix-key))
           (concat-key (c-lang-const c-opt-identifier-concat-key))
           (after-ops (c-lang-const c-after-id-concat-ops)))
      (concat
       ;; Optional leading prefix operator plus whitespace.
       (if prefix-key
           (concat "\\(" prefix-key ws* "\\)?")
         "")
       ;; The first symbol.
       sym
       ;; Any number of "<concat-op> <symbol>" continuations.
       (if concat-key
           (concat
            "\\(" ws* concat-key ws*
            (if after-ops
                (concat
                 "\\("
                 (c-make-keywords-re 'appendable after-ops)
                 ;; For flexibility the symbol is optional once a
                 ;; `c-after-id-concat-ops' operator has been seen.
                 ;; That is also what lets the "*" ending a Java
                 ;; import declaration identifier match.
                 "\\(" ws* sym "\\)?"
                 "\\|"
                 sym
                 "\\)")
              sym)
            "\\)*")
         ""))))
(c-lang-defvar c-identifier-key (c-lang-const c-identifier-key))
766
(c-lang-defconst c-identifier-last-sym-match
  ;; No longer used.  This was a docstring constant in 5.30 and is
  ;; retained only so that third party code referring to it keeps
  ;; working.
  ;;
  ;; It used to identify the submatch in `c-identifier-key' that
  ;; surrounds the last symbol of the qualified identifier: a list of
  ;; submatch numbers, the first one with a match being the one taken.
  ;; At least one was assumed to match whenever the regexp matched.
  t nil)
777
(c-lang-defconst c-string-escaped-newlines
  "Set if the language supports backslash escaped newlines inside string
literals."
  ;; Off by default; on for C, C++, Objective-C and Pike.
  t                 nil
  (c c++ objc pike) t)
(c-lang-defvar c-string-escaped-newlines
  (c-lang-const c-string-escaped-newlines))
785
(c-lang-defconst c-multiline-string-start-char
  "Set if the language supports multiline string literals without escaped
newlines. If t, all string literals are multiline. If a character,
only literals where the open quote is immediately preceded by that
character are multiline."
  ;; Only Pike has them, introduced by "#" before the open quote.
  t    nil
  pike ?#)
(c-lang-defvar c-multiline-string-start-char
  (c-lang-const c-multiline-string-start-char))
d9e94c22 795
536610a4
AM
(c-lang-defconst c-opt-cpp-symbol
  "The symbol which starts preprocessor constructs when in the margin."
  ;; "#" everywhere except Java and AWK, where the value is nil.
  t          "#"
  (java awk) nil)
(c-lang-defvar c-opt-cpp-symbol (c-lang-const c-opt-cpp-symbol))
801
d9e94c22
MS
(c-lang-defconst c-opt-cpp-prefix
  "Regexp matching the prefix of a cpp directive in the languages that
normally use that macro preprocessor. Tested at bol or at boi.
Assumed to not contain any submatches or \\| operators."
  ;; TODO (ACM, 2005-04-01): make this recognize escaped NLs, and then
  ;; adjust every use of c-opt-cpp-prefix that counts regexp-depth.
  t          "\\s *#\\s *"
  ;; Java and AWK: nil.
  (java awk) nil)
(c-lang-defvar c-opt-cpp-prefix (c-lang-const c-opt-cpp-prefix))
811
5ee2e988
AM
(c-lang-defconst c-anchored-cpp-prefix
  "Regexp matching the prefix of a cpp directive anchored to BOL,
in the languages that have a macro preprocessor."
  ;; Submatch 1 surrounds the "#" itself.
  t          "^\\s *\\(#\\)\\s *"
  ;; Java and AWK: nil.
  (java awk) nil)
(c-lang-defvar c-anchored-cpp-prefix (c-lang-const c-anchored-cpp-prefix))
818
d9e94c22
MS
(c-lang-defconst c-opt-cpp-start
  "Regexp matching the prefix of a cpp directive including the directive
name, or nil in languages without preprocessor support. The first
submatch surrounds the directive name."
  t    (let ((prefix (c-lang-const c-opt-cpp-prefix)))
         (and prefix
              (concat prefix "\\([" c-alnum "]+\\)")))
  ;; Pike is a scripting language, so a hash-bang ("#!") is accepted
  ;; as well.
  pike (concat (c-lang-const c-opt-cpp-prefix)
               "\\([" c-alnum "]+\\|!\\)"))
(c-lang-defvar c-opt-cpp-start (c-lang-const c-opt-cpp-start))
830
0386b551
AM
(c-lang-defconst c-cpp-message-directives
  "List of cpp directives (without the prefix) that are followed by a
string message."
  ;; Only meaningful when the language has a cpp prefix at all.
  t                 (and (c-lang-const c-opt-cpp-prefix)
                         '("error"))
  (c c++ objc pike) '("error" "warning"))
0386b551
AM
837
(c-lang-defconst c-cpp-include-directives
  "List of cpp directives (without the prefix) that are followed by a
file name in angle brackets or quotes."
  ;; Only meaningful when the language has a cpp prefix at all.
  t    (and (c-lang-const c-opt-cpp-prefix)
            '("include"))
  objc '("include" "import"))
844
(c-lang-defconst c-opt-cpp-macro-define
  "Cpp directive (without the prefix) that is followed by a macro
definition, or nil if the language doesn't have any."
  ;; "define" wherever there is a cpp prefix, otherwise nil.
  t (and (c-lang-const c-opt-cpp-prefix)
         "define"))
(c-lang-defvar c-opt-cpp-macro-define
  (c-lang-const c-opt-cpp-macro-define))
0386b551
AM
852
(c-lang-defconst c-opt-cpp-macro-define-start
  ;; Regexp matching everything up to the macro body of a cpp define,
  ;; or up to the end of the logical line when there is no body.
  ;; Submatch 1 is the name of the macro.  Set exactly when
  ;; `c-opt-cpp-macro-define' is.
  t (let ((define (c-lang-const c-opt-cpp-macro-define)))
      (and define
           (concat (c-lang-const c-opt-cpp-prefix)
                   define
                   ;; The #defined name (submatch 1), then an optional
                   ;; parenthesized parameter list.
                   "[ \t]+\\(\\(\\sw\\|_\\)+\\)\\(\([^\)]*\)\\)?"
                   ;; Trailing blanks and backslash-newline pairs.
                   "\\([ \t]\\|\\\\\n\\)*"))))
(c-lang-defvar c-opt-cpp-macro-define-start
  (c-lang-const c-opt-cpp-macro-define-start))
865
51c9af45
AM
(c-lang-defconst c-opt-cpp-macro-define-id
  ;; Regexp matching everything up to the end of the identifier that a
  ;; cpp define introduces.  nil when `c-opt-cpp-macro-define' is.
  t (let ((define (c-lang-const c-opt-cpp-macro-define)))
      (and define
           (concat (c-lang-const c-opt-cpp-prefix) ; #
                   define                          ; define
                   "[ \t]+\\(\\sw\\|_\\)+"))))
(c-lang-defvar c-opt-cpp-macro-define-id
  (c-lang-const c-opt-cpp-macro-define-id))
875
(c-lang-defconst c-cpp-expr-directives
  "List of cpp directives (without the prefix) that are followed by an
expression."
  ;; Only meaningful when the language has a cpp prefix at all.
  t (and (c-lang-const c-opt-cpp-prefix)
         '("if" "elif")))
881
b128268e
AM
(c-lang-defconst c-cpp-expr-intro-re
  "Regexp which matches the start of a CPP directive which contains an
expression, or nil if there aren't any in the language."
  ;; The cpp prefix followed by any of `c-cpp-expr-directives'.
  t (let ((directives (c-lang-const c-cpp-expr-directives)))
      (and directives
           (concat (c-lang-const c-opt-cpp-prefix)
                   (c-make-keywords-re t directives)))))
(c-lang-defvar c-cpp-expr-intro-re
  (c-lang-const c-cpp-expr-intro-re))
891
0386b551
AM
(c-lang-defconst c-cpp-expr-functions
  "List of functions in cpp expressions."
  ;; Only meaningful when the language has a cpp prefix at all.
  t    (and (c-lang-const c-opt-cpp-prefix)
            '("defined"))
  pike '("defined" "efun" "constant"))
897
846f5040
MS
(c-lang-defconst c-assignment-operators
  "List of all assignment operators."
  ;; Common base set.
  t    '("=" "*=" "/=" "%=" "+=" "-=" ">>=" "<<=" "&=" "^=" "|=")
  ;; Java adds the unsigned right shift assignment.
  java (append (c-lang-const c-assignment-operators)
               '(">>>="))
  ;; C++ adds the alternative tokens and two trigraph spellings.
  c++  (append (c-lang-const c-assignment-operators)
               '("and_eq" "or_eq" "xor_eq" "??!=" "??'="))
  ;; IDL has no assignment operators.
  idl  nil)
906
d9e94c22
MS
(c-lang-defconst c-operators
  "List describing all operators, along with their precedence and
associativity. The order in the list corresponds to the precedence of
the operators: The operators in each element are a group with the same
precedence, and the group has higher precedence than the groups in all
following elements. The car of each element describes the type of the
operator group, and the cdr is a list of the operator tokens in it.
The operator group types are:

'prefix         Unary prefix operators.
'postfix        Unary postfix operators.
'postfix-if-paren
                Unary postfix operators if and only if the chars have
                parenthesis syntax.
'left-assoc     Binary left associative operators (i.e. a+b+c means (a+b)+c).
'right-assoc    Binary right associative operators (i.e. a=b=c means a=(b=c)).
'right-assoc-sequence
                Right associative operator that consists of a
                sequence of tokens that separate expressions. All the
                tokens in the group are in this case taken as
                describing the sequence in one such operator, and the
                order between them is therefore significant.

Operators containing a character with paren syntax are taken to match
with a corresponding open/close paren somewhere else. A postfix
operator with close paren syntax is taken to end a postfix expression
started somewhere earlier, rather than start a new one at point. Vice
versa for prefix operators with open paren syntax.

Note that operators like \".\" and \"->\" which in language references
often are described as postfix operators are considered binary here,
since CC Mode treats every identifier as an expression."

  ;; There's currently no code in CC Mode that exploits all the info
  ;; in this variable; precedence, associativity etc are present as a
  ;; preparation for future work.

  t `(;; Preprocessor.
      ,@(when (c-lang-const c-opt-cpp-prefix)
          `((prefix "#"
                    ,@(when (c-major-mode-is '(c-mode c++-mode))
                        '("%:" "??=")))
            (left-assoc "##"
                        ,@(when (c-major-mode-is '(c-mode c++-mode))
                            '("%:%:" "??=??=")))))

      ;; Primary.
      ,@(c-lang-const c-identifier-ops)
      ;; Each language gets its own clause here.  Previously Java was
      ;; tested together with C++ in the first clause, which made the
      ;; separate Java clause unreachable, so "super" was never listed
      ;; for Java.  Java now gets both of its entries.
      ,@(cond ((c-major-mode-is 'c++-mode)
               `((postfix-if-paren "<" ">"))) ; Templates.
              ((c-major-mode-is 'pike-mode)
               `((prefix "global" "predef")))
              ((c-major-mode-is 'java-mode)
               `((postfix-if-paren "<" ">")   ; Generics.
                 (prefix "super"))))

      ;; Postfix.
      ,@(when (c-major-mode-is 'c++-mode)
          ;; The following need special treatment.
          `((prefix "dynamic_cast" "static_cast"
                    "reinterpret_cast" "const_cast" "typeid")))
      (left-assoc "."
                  ,@(unless (c-major-mode-is 'java-mode)
                      '("->")))
      (postfix "++" "--" "[" "]" "(" ")"
               ,@(when (c-major-mode-is '(c-mode c++-mode))
                   '("<:" ":>" "??(" "??)")))

      ;; Unary.
      (prefix "++" "--" "+" "-" "!" "~"
              ,@(when (c-major-mode-is 'c++-mode) '("not" "compl"))
              ,@(when (c-major-mode-is '(c-mode c++-mode))
                  '("*" "&" "sizeof" "??-"))
              ,@(when (c-major-mode-is 'objc-mode)
                  '("@selector" "@protocol" "@encode"))
              ;; The following need special treatment.
              ,@(cond ((c-major-mode-is 'c++-mode)
                       '("new" "delete"))
                      ((c-major-mode-is 'java-mode)
                       '("new"))
                      ((c-major-mode-is 'pike-mode)
                       '("class" "lambda" "catch" "throw" "gauge")))
              "(" ")"                   ; Cast.
              ,@(when (c-major-mode-is 'pike-mode)
                  '("[" "]")))          ; Type cast.

      ;; Member selection.
      ,@(when (c-major-mode-is 'c++-mode)
          `((left-assoc ".*" "->*")))

      ;; Multiplicative.
      (left-assoc "*" "/" "%")

      ;; Additive.
      (left-assoc "+" "-")

      ;; Shift.
      (left-assoc "<<" ">>"
                  ,@(when (c-major-mode-is 'java-mode)
                      '(">>>")))

      ;; Relational.
      (left-assoc "<" ">" "<=" ">="
                  ,@(when (c-major-mode-is 'java-mode)
                      '("instanceof")))

      ;; Equality.
      (left-assoc "==" "!="
                  ,@(when (c-major-mode-is 'c++-mode) '("not_eq")))

      ;; Bitwise and.
      (left-assoc "&"
                  ,@(when (c-major-mode-is 'c++-mode) '("bitand")))

      ;; Bitwise exclusive or.
      (left-assoc "^"
                  ,@(when (c-major-mode-is '(c-mode c++-mode))
                      '("??'"))
                  ,@(when (c-major-mode-is 'c++-mode) '("xor")))

      ;; Bitwise or.
      (left-assoc "|"
                  ,@(when (c-major-mode-is '(c-mode c++-mode))
                      '("??!"))
                  ,@(when (c-major-mode-is 'c++-mode) '("bitor")))

      ;; Logical and.
      (left-assoc "&&"
                  ,@(when (c-major-mode-is 'c++-mode) '("and")))

      ;; Logical or.
      (left-assoc "||"
                  ,@(when (c-major-mode-is '(c-mode c++-mode))
                      '("??!??!"))
                  ,@(when (c-major-mode-is 'c++-mode) '("or")))

      ;; Conditional.
      (right-assoc-sequence "?" ":")

      ;; Assignment.
      (right-assoc ,@(c-lang-const c-assignment-operators))

      ;; Exception.
      ,@(when (c-major-mode-is 'c++-mode)
          '((prefix "throw")))

      ;; Sequence.
      (left-assoc ","))

  ;; IDL got its own definition since it has a much smaller operator
  ;; set than the other languages.
  idl `(;; Preprocessor.
        (prefix "#")
        (left-assoc "##")
        ;; Primary.
        ,@(c-lang-const c-identifier-ops)
        ;; Unary.
        (prefix "+" "-" "~")
        ;; Multiplicative.
        (left-assoc "*" "/" "%")
        ;; Additive.
        (left-assoc "+" "-")
        ;; Shift.
        (left-assoc "<<" ">>")
        ;; And.
        (left-assoc "&")
        ;; Xor.
        (left-assoc "^")
        ;; Or.
        (left-assoc "|")))
1076
(c-lang-defconst c-operator-list
  ;; Every operator token from `c-operators', flattened into a single
  ;; list with duplicates removed.
  t (let ((all-groups (c-lang-const c-operators)))
      (c-filter-ops all-groups t t)))
d9e94c22
MS
1080
(c-lang-defconst c-overloadable-operators
  "List of the operators that are overloadable, in their \"identifier
form\". See also `c-opt-op-identifier-prefix'."
  t    nil
  ;; "new" and "delete" may be followed by "[]", which is ignored here.
  c++  '("new" "delete"
         "+" "-" "*" "/" "%"
         "^" "??'" "xor" "&" "bitand" "|" "??!" "bitor" "~" "??-" "compl"
         "!" "=" "<" ">" "+=" "-=" "*=" "/=" "%=" "^="
         "??'=" "xor_eq" "&=" "and_eq" "|=" "??!=" "or_eq"
         "<<" ">>" ">>=" "<<=" "==" "!=" "not_eq" "<=" ">="
         "&&" "and" "||" "??!??!" "or" "++" "--" "," "->*" "->"
         "()" "[]" "<::>" "??(??)")
  ;; In Pike these tokens behave like identifiers.
  pike '("`+" "`-" "`&" "`|" "`^" "`<<" "`>>" "`*" "`/" "`%" "`~"
         "`==" "`<" "`>" "`!" "`[]" "`[]=" "`->" "`->=" "`()" "``+"
         "``-" "``&" "``|" "``^" "``<<" "``>>" "``*" "``/" "``%"
         "`+="))
1098
(c-lang-defconst c-overloadable-operators-regexp
  ;; Regexp that is tried after an "operator" token in C++.  nil in
  ;; every other language.
  t   nil
  c++ (let ((ops (c-lang-const c-overloadable-operators)))
        (c-make-keywords-re nil ops)))
(c-lang-defvar c-overloadable-operators-regexp
  (c-lang-const c-overloadable-operators-regexp))
1105
(c-lang-defconst c-opt-op-identifier-prefix
  "Regexp matching the token before the ones in
`c-overloadable-operators' when operators are specified in their
\"identifier form\". This typically matches \"operator\" in C++ where
operator functions are specified as e.g. \"operator +\". It's nil in
languages without operator functions or where the complete operator
identifier is listed in `c-overloadable-operators'.

This regexp is assumed to not match any non-operator identifier."
  ;; Only C++ has such a prefix token.
  t   nil
  c++ (c-make-keywords-re t '("operator")))
(c-lang-defvar c-opt-op-identifier-prefix
  (c-lang-const c-opt-op-identifier-prefix))
1119
;; Backward compatibility: `c-opt-op-identitier-prefix' is the old,
;; mis-spelled name of the variable.  The spelling has been corrected
;; above and throughout cc-engine.el; the alias is declared obsolete
;; and is slated for removal in some release very shortly in the
;; future.  ACM, 2006-04-14.
(defvaralias 'c-opt-op-identitier-prefix 'c-opt-op-identifier-prefix)
(make-obsolete-variable 'c-opt-op-identitier-prefix
                        'c-opt-op-identifier-prefix
                        "CC Mode 5.31.4, 2006-04-14")
0386b551 1126
d9e94c22
MS
(c-lang-defconst c-other-op-syntax-tokens
  "List of the tokens made up of characters in the punctuation or
parenthesis syntax classes that have uses other than as expression
operators."
  ;; Base set.
  t            '("{" "}" "(" ")" "[" "]" ";" ":" "," "=" "/*" "*/" "//")
  ;; The language specific entries below each prepend their own tokens
  ;; to the value inherited through `c-lang-const'.
  (c c++ pike) (append '("#" "##"       ; Used by cpp.
                         "::" "...")
                       (c-lang-const c-other-op-syntax-tokens))
  (c c++)      (append '("*")
                       (c-lang-const c-other-op-syntax-tokens))
  c++          (append '("&" "<%" "%>" "<:" ":>" "%:" "%:%:")
                       (c-lang-const c-other-op-syntax-tokens))
  objc         (append '("#" "##"       ; Used by cpp.
                         "+" "-")
                       (c-lang-const c-other-op-syntax-tokens))
  idl          (append '("#" "##")      ; Used by cpp.
                       (c-lang-const c-other-op-syntax-tokens))
  ;; Pike additionally includes its overloadable operator identifiers.
  pike         (append '("..")
                       (c-lang-const c-other-op-syntax-tokens)
                       (c-lang-const c-overloadable-operators))
  ;; AWK has a separate, self-contained list.
  awk          '("{" "}" "(" ")" "[" "]" ";" "," "=" "/"))
1146
0386b551
AM
(c-lang-defconst c-all-op-syntax-tokens
  ;; All tokens in the punctuation and parenthesis syntax classes:
  ;; `c-other-op-syntax-tokens' followed by `c-operator-list', with
  ;; duplicate strings removed.
  t (let ((combined (append (c-lang-const c-other-op-syntax-tokens)
                            (c-lang-const c-operator-list))))
      (delete-duplicates combined :test 'string-equal)))
1153
(c-lang-defconst c-nonsymbol-token-char-list
  ;; List of every char that is not in the word, symbol or
  ;; syntactically irrelevant syntax classes, i.e. all punctuation,
  ;; parenthesis and string delimiter chars.
  t (c-with-syntax-table (c-lang-const c-mode-syntax-table)
      ;; Only the printable ASCII range (32..126) is scanned.  No
      ;; language so far has 8-bit or widestring operators.
      (let ((code 32)
            chars)
        (while (< code 127)
          (unless (memq (char-syntax code) '(?w ?_ ?< ?> ?\ ))
            (setq chars (cons (c-int-to-char code) chars)))
          (setq code (1+ code)))
        chars)))
1167
d9e94c22
MS
(c-lang-defconst c-nonsymbol-token-regexp
  ;; Regexp matching all tokens in the punctuation and parenthesis
  ;; syntax classes.  Beware that this also matches ".", which can
  ;; start a float.
  t (let ((tokens
           ;; Keep only tokens consisting entirely of punctuation and
           ;; paren syntax chars.
           (c-filter-ops (c-lang-const c-all-op-syntax-tokens)
                         t
                         "\\`\\(\\s.\\|\\s\(\\|\\s\)\\)+\\'")))
      (c-make-keywords-re nil tokens)))
(c-lang-defvar c-nonsymbol-token-regexp
  (c-lang-const c-nonsymbol-token-regexp))
1178
846f5040
MS
(c-lang-defconst c-assignment-op-regexp
  ;; Regexp matching all assignment operators and nothing else.  The
  ;; end of the token is detected from the beginning of the first
  ;; submatch together with the end of the whole match.
  t (let ((assign-ops (c-lang-const c-assignment-operators)))
      (if assign-ops
          (concat
           ;; "=" is a prefix of "==", so it is special-cased.
           "=\\([^=]\\|$\\)"
           "\\|"
           (c-make-keywords-re nil
             (set-difference assign-ops
                             '("=")
                             :test 'string-equal)))
        ;; No assignment operators: a regexp that never matches.
        "\\<\\>")))
(c-lang-defvar c-assignment-op-regexp
  (c-lang-const c-assignment-op-regexp))
1195
0386b551
AM
(c-lang-defconst c-<>-multichar-token-regexp
  ;; Regexp matching every token that contains "<" or ">" and is
  ;; longer than one char.
  t (let ((tokens (c-filter-ops (c-lang-const c-all-op-syntax-tokens)
                                t
                                ".[<>]\\|[<>].")))
      (c-make-keywords-re nil tokens)))
(c-lang-defvar c-<>-multichar-token-regexp
  (c-lang-const c-<>-multichar-token-regexp))
1205
d9e94c22
MS
(c-lang-defconst c-<-op-cont-regexp
  ;; Regexp matching the second and subsequent characters of all
  ;; multicharacter tokens that begin with "<".
  t (let ((tails
           ;; Select tokens starting with "<" plus at least one more
           ;; char, and strip the leading "<" from each.
           (c-filter-ops (c-lang-const c-all-op-syntax-tokens)
                         t
                         "\\`<."
                         (lambda (op) (substring op 1)))))
      (c-make-keywords-re nil tails)))

(c-lang-defvar c-<-op-cont-regexp (c-lang-const c-<-op-cont-regexp))
1216
(c-lang-defconst c->-op-cont-regexp
  ;; Regexp matching the second and subsequent characters of all
  ;; multicharacter tokens that begin with ">".
  t    (let ((tails
              (c-filter-ops (c-lang-const c-all-op-syntax-tokens)
                            t
                            "\\`>."
                            (lambda (op) (substring op 1)))))
         (c-make-keywords-re nil tails))
  ;; Java uses a narrower token filter: ">" or ">>" followed by a
  ;; char other than ">".
  java (let ((tails
              (c-filter-ops (c-lang-const c-all-op-syntax-tokens)
                            t
                            "\\`>[^>]\\|\\`>>[^>]"
                            (lambda (op) (substring op 1)))))
         (c-make-keywords-re nil tails)))

(c-lang-defvar c->-op-cont-regexp (c-lang-const c->-op-cont-regexp))
1232
(c-lang-defconst c-stmt-delim-chars
  ;; The characters regarded as bounding statements.  As a small
  ;; optimization for `c-crosses-statement-barrier-p' the string is
  ;; assumed to start with "^", negating the set.  It must end with
  ;; "?:" if ? : operators are to be detected.
  t "^;{}?:")
(c-lang-defvar c-stmt-delim-chars (c-lang-const c-stmt-delim-chars))

(c-lang-defconst c-stmt-delim-chars-with-comma
  ;; Same as `c-stmt-delim-chars', but with ',' included as well.
  t "^;,{}?:")
(c-lang-defvar c-stmt-delim-chars-with-comma
  (c-lang-const c-stmt-delim-chars-with-comma))
1246
1247\f
1248;;; Syntactic whitespace.
1249
0386b551
AM
(c-lang-defconst c-simple-ws
  "Regexp matching an ordinary whitespace character.
Does not contain a \\| operator at the top level."
  ;; Line breaks are listed explicitly because "\\s " alone does not
  ;; match them.
  t "\\(\\s \\|[\n\r]\\)")

(c-lang-defconst c-simple-ws-depth
  ;; How many regexp grouping parens `c-simple-ws' contains.
  t (let ((ws (c-lang-const c-simple-ws)))
      (regexp-opt-depth ws)))
1259
(c-lang-defconst c-line-comment-starter
  "String that starts line comments, or nil if such don't exist.
Line comments are always terminated by newlines. At least one of
`c-block-comment-starter' and this one is assumed to be set.

Note that it's currently not enough to set this to support a new
comment style. Other stuff like the syntax table must also be set up
properly."
  ;; "//" everywhere except AWK, which uses "#".
  t   "//"
  awk "#")
(c-lang-defvar c-line-comment-starter (c-lang-const c-line-comment-starter))
1271
(c-lang-defconst c-block-comment-starter
  "String that starts block comments, or nil if such don't exist.
Block comments are ended by `c-block-comment-ender', which is assumed
to be set if this is. At least one of `c-line-comment-starter' and
this one is assumed to be set.

Note that it's currently not enough to set this to support a new
comment style. Other stuff like the syntax table must also be set up
properly."
  ;; AWK has no block comments.
  t   "/*"
  awk nil)
1283
(c-lang-defconst c-block-comment-ender
  "String that ends block comments, or nil if such don't exist.

Note that it's currently not enough to set this to support a new
comment style. Other stuff like the syntax table must also be set up
properly."
  ;; AWK has no block comments.
  t   "*/"
  awk nil)
1292
d9e94c22
MS
(c-lang-defconst c-comment-start-regexp
  ;; Regexp matching the start of any type of comment.
  t (let ((starters (list (c-lang-const c-line-comment-starter)
                          (c-lang-const c-block-comment-starter))))
      (concat (c-make-keywords-re nil starters)
              ;; Add the "\\s!" syntax class alternative when the
              ;; `gen-comment-delim' feature is available.
              (if (memq 'gen-comment-delim c-emacs-features)
                  "\\|\\s!"
                ""))))
(c-lang-defvar c-comment-start-regexp (c-lang-const c-comment-start-regexp))
1302
0386b551
AM
(c-lang-defconst c-block-comment-start-regexp
  ;; Regexp matching the start of a block comment, when the language
  ;; has block comments; otherwise a regexp that never matches.
  t (let ((starter (c-lang-const c-block-comment-starter)))
      (if starter
          (regexp-quote starter)
        "\\<\\>")))
(c-lang-defvar c-block-comment-start-regexp
  (c-lang-const c-block-comment-start-regexp))
1311
536610a4
AM
(c-lang-defconst c-line-comment-start-regexp
  ;; Regexp matching the start of a line comment, when the language
  ;; has line comments (all 7 CC Mode languages do); otherwise a
  ;; regexp that never matches.
  t (let ((starter (c-lang-const c-line-comment-starter)))
      (if starter
          (regexp-quote starter)
        "\\<\\>")))
(c-lang-defvar c-line-comment-start-regexp
  (c-lang-const c-line-comment-start-regexp))
1320
d9e94c22
MS
(c-lang-defconst c-literal-start-regexp
  ;; Regexp to match the start of comments and string literals.
  t (concat (c-lang-const c-comment-start-regexp)
            "\\|"
            ;; A string literal starts with a double quote.  When the
            ;; `gen-string-delim' feature is present, a char in the
            ;; "\\s|" syntax class is accepted as an alternative.  The
            ;; alternation has to be written as "\\|": a bare "|" is
            ;; an ordinary char in Emacs regexps, so "\"|" would only
            ;; match a quote immediately followed by a literal "|".
            (if (memq 'gen-string-delim c-emacs-features)
                "\"\\|\\s|"
              "\"")))
(c-lang-defvar c-literal-start-regexp (c-lang-const c-literal-start-regexp))
1329
(c-lang-defconst c-doc-comment-start-regexp
  "Regexp to match the start of documentation comments."
  ;; Default: a regexp that never matches.
  t            "\\<\\>"
  ;; From font-lock.el: `doxygen' uses /*! while others use /**.
  (c c++ objc) "/\\*[*!]"
  java         "/\\*\\*"
  pike         "/[/*]!")
(c-lang-defvar c-doc-comment-start-regexp
  (c-lang-const c-doc-comment-start-regexp))
1339
(c-lang-defconst comment-start
  "String that starts comments inserted with M-; etc.
`comment-start' is initialized from this."
  ;; Default: the line comment starter if there is one, else the block
  ;; comment starter, padded with a trailing space.
  t (let ((starter (or (c-lang-const c-line-comment-starter)
                       (c-lang-const c-block-comment-starter))))
      (concat starter " "))
  ;; C still defaults to block comments, since line comments aren't
  ;; entirely portable there.
  c "/* ")
(c-lang-setvar comment-start (c-lang-const comment-start))
d9e94c22
MS
1351
(c-lang-defconst comment-end
  "String that ends comments inserted with M-; etc.
`comment-end' is initialized from this."
  ;; Default: when `comment-start' begins with the block comment
  ;; starter, use the block comment ender padded with a leading space;
  ;; otherwise the empty string.
  t (let ((block-start-at-bos
           (concat "\\`\\("
                   (c-lang-const c-block-comment-start-regexp)
                   "\\)")))
      (if (string-match block-start-at-bos (c-lang-const comment-start))
          (concat " " (c-lang-const c-block-comment-ender))
        "")))
(c-lang-setvar comment-end (c-lang-const comment-end))
d9e94c22
MS
1364
(c-lang-defconst comment-start-skip
  "Regexp to match the start of a comment plus everything up to its body.
`comment-start-skip' is initialized from this."
  ;; Default: each comment starter with its last char allowed to
  ;; repeat, followed by any amount of horizontal whitespace.
  t (let ((starter-res
           (mapcar (lambda (starter)
                     (and starter
                          (concat (regexp-quote starter) "+")))
                   (list (c-lang-const c-line-comment-starter)
                         (c-lang-const c-block-comment-starter)))))
      (concat "\\("
              (c-concat-separated starter-res "\\|")
              "\\)\\s *")))
(c-lang-setvar comment-start-skip (c-lang-const comment-start-skip))
d9e94c22 1380
(c-lang-defconst c-syntactic-ws-start
  ;; Regexp matching any sequence that can start syntactic whitespace.
  ;; The only uncertain case is '#' when there are cpp directives.
  t (let ((starters (list (c-lang-const c-line-comment-starter)
                          (c-lang-const c-block-comment-starter)
                          (and (c-lang-const c-opt-cpp-prefix)
                               "#")
                          "\n" "\r")))
      (concat "\\s \\|"
              (c-make-keywords-re nil starters)
              ;; A backslash followed by a line break.
              "\\|\\\\[\n\r]"
              (and (memq 'gen-comment-delim c-emacs-features)
                   "\\|\\s!"))))
(c-lang-defvar c-syntactic-ws-start (c-lang-const c-syntactic-ws-start))
d9e94c22 1395
(c-lang-defconst c-syntactic-ws-end
  ;; Regexp matching any single character that might end syntactic
  ;; whitespace.
  t (let* ((ender (c-lang-const c-block-comment-ender))
           ;; The last char of the block comment ender, as a
           ;; one-element list of strings, or nil without block
           ;; comments.
           (ender-tail (and ender
                            (list (substring ender -1)))))
      (concat "\\s \\|"
              (c-make-keywords-re nil
                (append ender-tail '("\n" "\r")))
              (and (memq 'gen-comment-delim c-emacs-features)
                   "\\|\\s!"))))
(c-lang-defvar c-syntactic-ws-end (c-lang-const c-syntactic-ws-end))
1410
(c-lang-defconst c-unterminated-block-comment-regexp
  ;; Regexp matching an unterminated block comment that doesn't
  ;; contain line breaks, or nil in languages without block comments.
  ;; Does not contain a \| operator at the top level.
  t (let ((starter (c-lang-const c-block-comment-starter))
          (end (c-lang-const c-block-comment-ender)))
      (when starter
        (concat
         (regexp-quote starter)
         ;; It's messy to cook together a regexp that matches anything
         ;; but c-block-comment-ender.
         (cond
          ((= (length end) 1)
           (concat "[^" end "\n\r]*"))
          ((= (length end) 2)
           (let* ((c1 (substring end 0 1))
                  (c2 (substring end 1 2))
                  ;; A run of chars that are neither C1 nor a line
                  ;; break.
                  (not-c1-run (concat "[^" c1 "\n\r]*")))
             (concat not-c1-run
                     "\\("
                     (regexp-quote c1) "+"
                     "[^"
                     ;; The order inside the char class is chosen to
                     ;; cope with the quoting rules there: a "]" has
                     ;; to come first.
                     (cond ((string= c1 c2)
                            (concat c1 "\n\r"))
                           ((string= c2 "]")
                            (concat c2 "\n\r" c1))
                           (t
                            (concat c1 "\n\r" c2)))
                     "]"
                     not-c1-run
                     "\\)*")))
          (t
           (error "Can't handle a block comment ender of length %s"
                  (length end))))))))
1443
(c-lang-defconst c-block-comment-regexp
  ;; Regexp matching a block comment that doesn't contain line breaks,
  ;; or nil in languages without block comments.  Line breaks are
  ;; excluded to avoid scanning very far and risking running out of
  ;; regexp stack; the regexp is only meant for short comments placed
  ;; in the middle of limited constructs like declarations.  Does not
  ;; contain a \| operator at the top level.
  t (let ((unterminated
           (c-lang-const c-unterminated-block-comment-regexp))
          (end (c-lang-const c-block-comment-ender)))
      (when unterminated
        (concat
         unterminated
         ;; Append a regexp for the comment ender itself.
         (cond
          ((= (length end) 1)
           (regexp-quote end))
          ((= (length end) 2)
           (concat (regexp-quote (substring end 0 1)) "+"
                   (regexp-quote (substring end 1 2))))
          (t
           (error "Can't handle a block comment ender of length %s"
                  (length end))))))))
d9e94c22
MS
1464
(c-lang-defconst c-nonwhite-syntactic-ws
  ;; Regexp matching a piece of syntactic whitespace that isn't a
  ;; sequence of simple whitespace characters.  Unlike
  ;; `c-(forward|backward)-syntactic-ws', cpp directives are not
  ;; regarded as syntactic whitespace here.
  t (let* ((line-starter (c-lang-const c-line-comment-starter))
           ;; A line comment up to and including its line break.
           (line-comment
            (and line-starter
                 (concat (regexp-quote line-starter)
                         "[^\n\r]*[\n\r]")))
           (generic-comment
            (and (memq 'gen-comment-delim c-emacs-features)
                 "\\s!\\S!*\\s!")))
      (c-concat-separated
       (list line-comment
             (c-lang-const c-block-comment-regexp)
             ;; A backslash followed by a line break.
             "\\\\[\n\r]"
             generic-comment)
       "\\|")))
d9e94c22
MS
1479
(c-lang-defconst c-syntactic-ws
  ;; Regexp matching syntactic whitespace, including possibly the
  ;; empty string.  Unlike `c-(forward|backward)-syntactic-ws', cpp
  ;; directives are not regarded as syntactic whitespace here.  Does
  ;; not contain a \| operator at the top level.
  t (let ((ws* (concat (c-lang-const c-simple-ws) "*")))
      (concat ws*
              "\\("
              "\\(" (c-lang-const c-nonwhite-syntactic-ws) "\\)"
              ws*
              "\\)*")))

(c-lang-defconst c-syntactic-ws-depth
  ;; How many regexp grouping parens `c-syntactic-ws' contains.
  t (let ((ws (c-lang-const c-syntactic-ws)))
      (regexp-opt-depth ws)))
d9e94c22
MS
1494
(c-lang-defconst c-nonempty-syntactic-ws
  ;; Regexp matching syntactic whitespace that is at least one
  ;; character long.  Unlike `c-(forward|backward)-syntactic-ws', cpp
  ;; directives are not regarded as syntactic whitespace here.  Does
  ;; not contain a \| operator at the top level.
  t (let ((simple (c-lang-const c-simple-ws))
          (nonwhite (c-lang-const c-nonwhite-syntactic-ws)))
      (concat "\\(" simple "\\|" nonwhite "\\)+")))

(c-lang-defconst c-nonempty-syntactic-ws-depth
  ;; How many regexp grouping parens `c-nonempty-syntactic-ws'
  ;; contains.
  t (let ((ws (c-lang-const c-nonempty-syntactic-ws)))
      (regexp-opt-depth ws)))
d9e94c22
MS
1509
1510(c-lang-defconst c-single-line-syntactic-ws
1511 ;; Regexp matching syntactic whitespace without any line breaks. As
1512 ;; opposed to `c-(forward|backward)-syntactic-ws', this doesn't
1513 ;; regard cpp directives as syntactic whitespace. Does not contain
1514 ;; a \| operator at the top level.
0386b551
AM
1515 t (if (c-lang-const c-block-comment-regexp)
1516 (concat "\\s *\\("
1517 (c-lang-const c-block-comment-regexp)
1518 "\\s *\\)*")
1519 "\\s *"))
d9e94c22
MS
1520
1521(c-lang-defconst c-single-line-syntactic-ws-depth
1522 ;; Number of regexp grouping parens in `c-single-line-syntactic-ws'.
0386b551 1523 t (regexp-opt-depth (c-lang-const c-single-line-syntactic-ws)))
d9e94c22 1524
0386b551 1525(c-lang-defconst c-syntactic-eol
d9e94c22
MS
1526 ;; Regexp that matches when there is no syntactically significant
1527 ;; text before eol. Macros are regarded as syntactically
1528 ;; significant text here.
0386b551
AM
1529 t (concat (c-lang-const c-single-line-syntactic-ws)
1530 ;; Match eol (possibly inside a block comment or preceded
1531 ;; by a line continuation backslash), or the beginning of a
1532 ;; line comment. Note: This has to be modified for awk
1533 ;; where line comments start with '#'.
1534 "\\("
1535 (c-concat-separated
1536 (list (when (c-lang-const c-line-comment-starter)
1537 (regexp-quote (c-lang-const c-line-comment-starter)))
1538 (when (c-lang-const c-unterminated-block-comment-regexp)
1539 (concat (c-lang-const c-unterminated-block-comment-regexp)
1540 "$"))
1541 "\\\\$"
d9e94c22 1542 "$")
0386b551
AM
1543 "\\|")
1544 "\\)"))
1545(c-lang-defvar c-syntactic-eol (c-lang-const c-syntactic-eol))
1546
1547\f
28abe5e2
AM
1548;;; Defun functions
1549
1550;; The Emacs variables beginning-of-defun-function and
1551;; end-of-defun-function will be set so that commands like
1552;; `mark-defun' and `narrow-to-defun' work right. The key sequences
1553;; C-M-a and C-M-e are, however, bound directly to the CC Mode
e1dbe924 1554;; functions, allowing optimization for large n.
28abe5e2
AM
1555(c-lang-defconst beginning-of-defun-function
1556 "Function to which beginning-of-defun-function will be set."
1557 t 'c-beginning-of-defun
1558 awk 'c-awk-beginning-of-defun)
1559(c-lang-setvar beginning-of-defun-function
1560 (c-lang-const beginning-of-defun-function))
1561
1562(c-lang-defconst end-of-defun-function
1563 "Function to which end-of-defun-function will be set."
1564 t 'c-end-of-defun
1565 awk 'c-awk-end-of-defun)
1566(c-lang-setvar end-of-defun-function (c-lang-const end-of-defun-function))
1567\f
d9e94c22
MS
1568;;; In-comment text handling.
1569
1570(c-lang-defconst c-paragraph-start
1571 "Regexp to append to `paragraph-start'."
1572 t "$"
1573 java "\\(@[a-zA-Z]+\\>\\|$\\)" ; For Javadoc.
1574 pike "\\(@[a-zA-Z_-]+\\>\\([^{]\\|$\\)\\|$\\)") ; For Pike refdoc.
1575(c-lang-defvar c-paragraph-start (c-lang-const c-paragraph-start))
1576
1577(c-lang-defconst c-paragraph-separate
1578 "Regexp to append to `paragraph-separate'."
1579 t "$"
1580 pike (c-lang-const c-paragraph-start))
1581(c-lang-defvar c-paragraph-separate (c-lang-const c-paragraph-separate))
1582
1583\f
1584;;; Keyword lists.
1585
1586;; Note: All language constants containing keyword lists, and only
1587;; those, should end with "-kwds"; they're automatically collected into
1588;; the `c-kwds-lang-consts' list below and used to build `c-keywords' etc.
1589
a66cd3ee 1590(c-lang-defconst c-primitive-type-kwds
d9e94c22
MS
1591 "Primitive type keywords. As opposed to the other keyword lists, the
1592keywords listed here are fontified with the type face instead of the
1593keyword face.
1594
1595If any of these also are on `c-type-list-kwds', `c-ref-list-kwds',
1596`c-colon-type-list-kwds', `c-paren-nontype-kwds', `c-paren-type-kwds',
1597`c-<>-type-kwds', or `c-<>-arglist-kwds' then the associated clauses
1598will be handled.
1599
1600Do not try to modify this list for end user customizations; the
1601`*-font-lock-extra-types' variable, where `*' is the mode prefix, is
1602the appropriate place for that."
1603 t '("char" "double" "float" "int" "long" "short" "signed"
1604 "unsigned" "void")
1605 c (append
1606 '("_Bool" "_Complex" "_Imaginary") ; Conditionally defined in C99.
1607 (c-lang-const c-primitive-type-kwds))
1608 c++ (append
1609 '("bool" "wchar_t")
1610 (c-lang-const c-primitive-type-kwds))
1611 ;; Objective-C extends C, but probably not the new stuff in C99.
1612 objc (append
1613 '("id" "Class" "SEL" "IMP" "BOOL")
1614 (c-lang-const c-primitive-type-kwds))
a66cd3ee 1615 java '("boolean" "byte" "char" "double" "float" "int" "long" "short" "void")
d9e94c22
MS
1616 idl '("Object" "ValueBase" "any" "boolean" "char" "double" "fixed" "float"
1617 "long" "octet" "sequence" "short" "string" "void" "wchar" "wstring"
1618 ;; In CORBA PSDL:
1619 "ref"
1620 ;; The following can't really end a type, but we have to specify them
1621 ;; here due to the assumption in `c-primitive-type-prefix-kwds'. It
1622 ;; doesn't matter that much.
1623 "unsigned" "strong")
1624 pike '(;; this_program isn't really a keyword, but it's practically
1625 ;; used as a builtin type.
1626 "array" "float" "function" "int" "mapping" "mixed" "multiset"
1627 "object" "program" "string" "this_program" "void"))
1628
1629(c-lang-defconst c-primitive-type-key
1630 ;; An adorned regexp that matches `c-primitive-type-kwds'.
1631 t (c-make-keywords-re t (c-lang-const c-primitive-type-kwds)))
1632(c-lang-defvar c-primitive-type-key (c-lang-const c-primitive-type-key))
1633
1634(c-lang-defconst c-primitive-type-prefix-kwds
1635 "Keywords that might act as prefixes for primitive types. Assumed to
1636be a subset of `c-primitive-type-kwds'."
1637 t nil
1638 (c c++) '("long" "short" "signed" "unsigned")
1639 idl '("long" "unsigned"
1640 ;; In CORBA PSDL:
1641 "strong"))
1642
e15f8aaa
AM
1643(c-lang-defconst c-typedef-kwds
1644 "Prefix keyword\(s\) like \"typedef\" which make a type declaration out
1645of a variable declaration."
1646 t '("typedef")
1647 (awk idl java) nil)
1648
1649(c-lang-defconst c-typedef-key
1650 ;; Adorned regexp matching `c-typedef-kwds'.
1651 t (c-make-keywords-re t (c-lang-const c-typedef-kwds)))
1652(c-lang-defvar c-typedef-key (c-lang-const c-typedef-key))
1653
d9e94c22
MS
1654(c-lang-defconst c-type-prefix-kwds
1655 "Keywords where the following name - if any - is a type name, and
1656where the keyword together with the symbol works as a type in
1657declarations.
1658
1659Note that an alternative if the second part doesn't hold is
1660`c-type-list-kwds'. Keywords on this list are typically also present
1661on one of the `*-decl-kwds' lists."
1662 t nil
1663 c '("struct" "union" "enum")
1664 c++ (append '("class" "typename")
1665 (c-lang-const c-type-prefix-kwds c)))
1666
1667(c-lang-defconst c-type-prefix-key
1668 ;; Adorned regexp matching `c-type-prefix-kwds'.
1669 t (c-make-keywords-re t (c-lang-const c-type-prefix-kwds)))
1670(c-lang-defvar c-type-prefix-key (c-lang-const c-type-prefix-key))
1671
1672(c-lang-defconst c-type-modifier-kwds
1673 "Type modifier keywords. These can occur almost anywhere in types
1674but they don't build a type by themselves. Unlike the keywords on
1675`c-primitive-type-kwds', they are fontified with the keyword face and
1676not the type face."
1677 t nil
1678 c '("const" "restrict" "volatile")
1679 c++ '("const" "volatile" "throw")
1680 objc '("const" "volatile"))
1681
1682(c-lang-defconst c-opt-type-modifier-key
1683 ;; Adorned regexp matching `c-type-modifier-kwds', or nil in
1684 ;; languages without such keywords.
1685 t (and (c-lang-const c-type-modifier-kwds)
1686 (c-make-keywords-re t (c-lang-const c-type-modifier-kwds))))
1687(c-lang-defvar c-opt-type-modifier-key (c-lang-const c-opt-type-modifier-key))
1688
1689(c-lang-defconst c-opt-type-component-key
1690 ;; An adorned regexp that matches `c-primitive-type-prefix-kwds' and
1691 ;; `c-type-modifier-kwds', or nil in languages without any of them.
1692 t (and (or (c-lang-const c-primitive-type-prefix-kwds)
1693 (c-lang-const c-type-modifier-kwds))
1694 (c-make-keywords-re t
1695 (append (c-lang-const c-primitive-type-prefix-kwds)
1696 (c-lang-const c-type-modifier-kwds)))))
1697(c-lang-defvar c-opt-type-component-key
1698 (c-lang-const c-opt-type-component-key))
1699
0386b551
AM
1700(c-lang-defconst c-type-start-kwds
1701 ;; All keywords that can start a type (i.e. are either a type prefix
1702 ;; or a complete type).
1703 t (delete-duplicates (append (c-lang-const c-primitive-type-kwds)
1704 (c-lang-const c-type-prefix-kwds)
1705 (c-lang-const c-type-modifier-kwds))
1706 :test 'string-equal))
1707
d9e94c22
MS
1708(c-lang-defconst c-class-decl-kwds
1709 "Keywords introducing declarations where the following block (if any)
1710contains another declaration level that should be considered a class.
1711
1712If any of these also are on `c-type-list-kwds', `c-ref-list-kwds',
1713`c-colon-type-list-kwds', `c-paren-nontype-kwds', `c-paren-type-kwds',
1714`c-<>-type-kwds', or `c-<>-arglist-kwds' then the associated clauses
1715will be handled.
1716
1717Note that presence on this list does not automatically treat the
1718following identifier as a type; the keyword must also be present on
1719`c-type-prefix-kwds' or `c-type-list-kwds' to accomplish that."
1720 t nil
1721 c '("struct" "union")
1722 c++ '("class" "struct" "union")
1723 objc '("struct" "union"
1724 "@interface" "@implementation" "@protocol")
452ea855 1725 java '("class" "@interface" "interface")
d9e94c22
MS
1726 idl '("component" "eventtype" "exception" "home" "interface" "struct"
1727 "union" "valuetype"
1728 ;; In CORBA PSDL:
1729 "storagehome" "storagetype"
1730 ;; In CORBA CIDL:
1731 "catalog" "executor" "manages" "segment")
a66cd3ee
MS
1732 pike '("class"))
1733
a66cd3ee 1734(c-lang-defconst c-class-key
d9e94c22
MS
1735 ;; Regexp matching the start of a class.
1736 t (c-make-keywords-re t (c-lang-const c-class-decl-kwds)))
1737(c-lang-defvar c-class-key (c-lang-const c-class-key))
1738
1739(c-lang-defconst c-brace-list-decl-kwds
1740 "Keywords introducing declarations where the following block (if
1741any) is a brace list.
1742
1743If any of these also are on `c-type-list-kwds', `c-ref-list-kwds',
1744`c-colon-type-list-kwds', `c-paren-nontype-kwds', `c-paren-type-kwds',
1745`c-<>-type-kwds', or `c-<>-arglist-kwds' then the associated clauses
1746will be handled."
1747 t '("enum")
452ea855 1748 (awk) nil)
d9e94c22
MS
1749
1750(c-lang-defconst c-brace-list-key
1751 ;; Regexp matching the start of declarations where the following
1752 ;; block is a brace list.
1753 t (c-make-keywords-re t (c-lang-const c-brace-list-decl-kwds)))
1754(c-lang-defvar c-brace-list-key (c-lang-const c-brace-list-key))
1755
1756(c-lang-defconst c-other-block-decl-kwds
3efc2cd7 1757 "Keywords where the following block (if any) contains another
0386b551
AM
1758declaration level that should not be considered a class. For every
1759keyword here, CC Mode will add a set of special syntactic symbols for
1760those blocks. E.g. if the keyword is \"foo\" then there will be
1761`foo-open', `foo-close', and `infoo' symbols.
1762
1763The intention is that this category should be used for block
1764constructs that aren't related to object orientation concepts like
1765classes (which thus also include e.g. interfaces, templates,
1766contracts, structs, etc). The more pragmatic distinction is that
1767while most want some indentation inside classes, it's fairly common
1768that they don't want it in some of these constructs, so it should be
1769simple to configure that differently from classes. See also
1770`c-class-decl-kwds'.
d9e94c22
MS
1771
1772If any of these also are on `c-type-list-kwds', `c-ref-list-kwds',
1773`c-colon-type-list-kwds', `c-paren-nontype-kwds', `c-paren-type-kwds',
1774`c-<>-type-kwds', or `c-<>-arglist-kwds' then the associated clauses
1775will be handled."
1776 t nil
0386b551 1777 (c objc) '("extern")
a66cd3ee 1778 c++ '("namespace" "extern")
d9e94c22
MS
1779 idl '("module"
1780 ;; In CORBA CIDL:
1781 "composition"))
a66cd3ee 1782
a66cd3ee 1783(c-lang-defconst c-other-decl-block-key
d9e94c22
MS
1784 ;; Regexp matching the start of blocks besides classes that contain
1785 ;; another declaration level.
1786 t (c-make-keywords-re t (c-lang-const c-other-block-decl-kwds)))
1787(c-lang-defvar c-other-decl-block-key (c-lang-const c-other-decl-block-key))
1788
c382ec40
AM
1789(c-lang-defvar c-other-decl-block-key-in-symbols-alist
1790 (mapcar
1791 (lambda (elt)
1792 (cons elt
1793 (if (string= elt "extern")
1794 'inextern-lang
1795 (intern (concat "in" elt)))))
1796 (c-lang-const c-other-block-decl-kwds))
1797 "Alist associating keywords in `c-other-block-decl-kwds' with
1798their matching \"in\" syntactic symbols.")
1799
d9e94c22 1800(c-lang-defconst c-typedef-decl-kwds
0386b551
AM
1801 "Keywords introducing declarations where the identifier(s) being
1802declared are types.
d9e94c22
MS
1803
1804If any of these also are on `c-type-list-kwds', `c-ref-list-kwds',
1805`c-colon-type-list-kwds', `c-paren-nontype-kwds', `c-paren-type-kwds',
1806`c-<>-type-kwds', or `c-<>-arglist-kwds' then the associated clauses
1807will be handled."
0386b551
AM
1808 ;; Default to `c-class-decl-kwds' and `c-brace-list-decl-kwds'
1809 ;; (since e.g. "Foo" is a type that's being defined in "class Foo
1810 ;; {...}").
1811 t (append (c-lang-const c-class-decl-kwds)
1812 (c-lang-const c-brace-list-decl-kwds))
1813 ;; Languages that have a "typedef" construct.
1814 (c c++ objc idl pike) (append (c-lang-const c-typedef-decl-kwds)
1815 '("typedef"))
1816 ;; Unlike most other languages, exception names are not handled as
1817 ;; types in IDL since they only can occur in "raises" specs.
1818 idl (delete "exception" (append (c-lang-const c-typedef-decl-kwds) nil)))
d9e94c22 1819
e15f8aaa
AM
1820(c-lang-defconst c-typedef-decl-key
1821 t (c-make-keywords-re t (c-lang-const c-typedef-decl-kwds)))
1822(c-lang-defvar c-typedef-decl-key (c-lang-const c-typedef-decl-key))
1823
d9e94c22 1824(c-lang-defconst c-typeless-decl-kwds
0386b551
AM
1825 "Keywords introducing declarations where the \(first) identifier
1826\(declarator) follows directly after the keyword, without any type.
d9e94c22
MS
1827
1828If any of these also are on `c-type-list-kwds', `c-ref-list-kwds',
1829`c-colon-type-list-kwds', `c-paren-nontype-kwds', `c-paren-type-kwds',
1830`c-<>-type-kwds', or `c-<>-arglist-kwds' then the associated clauses
1831will be handled."
0386b551
AM
1832 ;; Default to `c-class-decl-kwds' and `c-brace-list-decl-kwds'
1833 ;; (since e.g. "Foo" is the identifier being defined in "class Foo
1834 ;; {...}").
1835 t (append (c-lang-const c-class-decl-kwds)
1836 (c-lang-const c-brace-list-decl-kwds))
1837 ;; Note: "manages" for CORBA CIDL clashes with its presence on
1838 ;; `c-type-list-kwds' for IDL.
1839 idl (append (c-lang-const c-typeless-decl-kwds)
1840 '("factory" "finder" "native"
1841 ;; In CORBA PSDL:
1842 "key" "stores"
1843 ;; In CORBA CIDL:
1844 "facet"))
1845 pike (append (c-lang-const c-class-decl-kwds)
1846 '("constant")))
d9e94c22
MS
1847
1848(c-lang-defconst c-modifier-kwds
1849 "Keywords that can prefix normal declarations of identifiers
0386b551 1850\(and typically act as flags). Things like argument declarations
d9e94c22
MS
1851inside function headers are also considered declarations in this
1852sense.
1853
1854If any of these also are on `c-type-list-kwds', `c-ref-list-kwds',
1855`c-colon-type-list-kwds', `c-paren-nontype-kwds', `c-paren-type-kwds',
1856`c-<>-type-kwds', or `c-<>-arglist-kwds' then the associated clauses
1857will be handled."
1858 t nil
1859 (c c++) '("auto" "extern" "inline" "register" "static")
1860 c++ (append '("explicit" "friend" "mutable" "template" "using" "virtual")
1861 (c-lang-const c-modifier-kwds))
1862 objc '("auto" "bycopy" "byref" "extern" "in" "inout" "oneway" "out" "static")
1863 ;; FIXME: Some of those below ought to be on `c-other-decl-kwds' instead.
1864 idl '("abstract" "attribute" "const" "consumes" "custom" "emits" "import"
1865 "in" "inout" "local" "multiple" "oneway" "out" "private" "provides"
1866 "public" "publishes" "readonly" "typeid" "typeprefix" "uses"
1867 ;; In CORBA PSDL:
1868 "primary" "state"
1869 ;; In CORBA CIDL:
1870 "bindsTo" "delegatesTo" "implements" "proxy" "storedOn")
1871 ;; Note: "const" is not used in Java, but it's still a reserved keyword.
1872 java '("abstract" "const" "final" "native" "private" "protected" "public"
e3715033 1873 "static" "strictfp" "synchronized" "transient" "volatile")
d9e94c22
MS
1874 pike '("final" "inline" "local" "nomask" "optional" "private" "protected"
1875 "public" "static" "variant"))
a66cd3ee 1876
d9e94c22
MS
1877(c-lang-defconst c-other-decl-kwds
1878 "Keywords that can start or prefix any declaration level construct,
1879besides those on `c-class-decl-kwds', `c-brace-list-decl-kwds',
1880`c-other-block-decl-kwds', `c-typedef-decl-kwds',
0386b551 1881`c-typeless-decl-kwds' and `c-modifier-kwds'.
d9e94c22
MS
1882
1883If any of these also are on `c-type-list-kwds', `c-ref-list-kwds',
1884`c-colon-type-list-kwds', `c-paren-nontype-kwds', `c-paren-type-kwds',
1885`c-<>-type-kwds', or `c-<>-arglist-kwds' then the associated clauses
1886will be handled."
1887 t nil
d9e94c22
MS
1888 objc '("@class" "@end" "@defs")
1889 java '("import" "package")
1890 pike '("import" "inherit"))
1891
0386b551
AM
1892(c-lang-defconst c-decl-start-kwds
1893 "Keywords that always start declarations, wherever they occur.
1894This can be used for declarations that aren't recognized by the normal
1895combination of `c-decl-prefix-re' and `c-decl-start-re'."
1896 t nil
1897 ;; Classes can be declared anywhere in a Pike expression.
1898 pike '("class"))
1899
1900(c-lang-defconst c-decl-hangon-kwds
1901 "Keywords that can occur anywhere in a declaration level construct.
1902This is used for self-contained things that can be tacked on anywhere
1903on a declaration and that should be ignored to be able to recognize it
1904correctly. Typical cases are compiler extensions like
1905\"__attribute__\" or \"__declspec\":
1906
1907 __declspec(noreturn) void foo();
1908 class __declspec(dllexport) classname {...};
1909 void foo() __attribute__((noreturn));
1910
1911Note that unrecognized plain symbols are skipped anyway if they occur
1912before the type, so such things are not necessary to mention here.
1913Mentioning them here is necessary only if they can occur in other
1914places, or if they are followed by a construct that must be skipped
1915over \(like the parens in the \"__attribute__\" and \"__declspec\"
1916examples above). In the last case, they also need to be present on
1917one of `c-type-list-kwds', `c-ref-list-kwds',
1918`c-colon-type-list-kwds', `c-paren-nontype-kwds', `c-paren-type-kwds',
1919`c-<>-type-kwds', or `c-<>-arglist-kwds'."
1920 ;; NB: These are currently not recognized in all parts of a
1921 ;; declaration. Specifically, they aren't recognized in the middle
1922 ;; of multi-token types, inside declarators, and between the
1923 ;; identifier and the arglist paren of a function declaration.
1924 ;;
1925 ;; FIXME: This ought to be user customizable since compiler stuff
1926 ;; like this usually is wrapped in project specific macros. (It'd
1927 ;; of course be even better if we could cope without knowing this.)
1928 t nil
1929 (c c++) '(;; GCC extension.
1930 "__attribute__"
1931 ;; MSVC extension.
1932 "__declspec"))
1933
1934(c-lang-defconst c-decl-hangon-key
1935 ;; Adorned regexp matching `c-decl-hangon-kwds'.
1936 t (c-make-keywords-re t (c-lang-const c-decl-hangon-kwds)))
1937(c-lang-defvar c-decl-hangon-key (c-lang-const c-decl-hangon-key))
1938
1939(c-lang-defconst c-prefix-spec-kwds
1940 ;; All keywords that can occur in the preamble of a declaration.
1941 ;; They typically occur before the type, but they are also matched
1942 ;; after presumptive types since we often can't be sure that
1943 ;; something is a type or just some sort of macro in front of the
1944 ;; declaration. They might be ambiguous with types or type
1945 ;; prefixes.
1946 t (delete-duplicates (append (c-lang-const c-class-decl-kwds)
1947 (c-lang-const c-brace-list-decl-kwds)
1948 (c-lang-const c-other-block-decl-kwds)
1949 (c-lang-const c-typedef-decl-kwds)
1950 (c-lang-const c-typeless-decl-kwds)
1951 (c-lang-const c-modifier-kwds)
1952 (c-lang-const c-other-decl-kwds)
1953 (c-lang-const c-decl-start-kwds)
1954 (c-lang-const c-decl-hangon-kwds))
1955 :test 'string-equal))
1956
1957(c-lang-defconst c-prefix-spec-kwds-re
1958 ;; Adorned regexp of `c-prefix-spec-kwds'.
e3715033 1959 t (c-make-keywords-re t (c-lang-const c-prefix-spec-kwds)))
452ea855 1960
0386b551
AM
1961(c-lang-defvar c-prefix-spec-kwds-re (c-lang-const c-prefix-spec-kwds-re))
1962
d9e94c22 1963(c-lang-defconst c-specifier-key
cc1cce14
AM
1964 ;; Adorned regexp of the keywords in `c-prefix-spec-kwds' that aren't
1965 ;; ambiguous with types or type prefixes. These are the keywords (like
1966 ;; extern, namespace, but NOT template) that can modify a declaration.
d9e94c22 1967 t (c-make-keywords-re t
0386b551 1968 (set-difference (c-lang-const c-prefix-spec-kwds)
cc1cce14
AM
1969 (append (c-lang-const c-type-start-kwds)
1970 (c-lang-const c-<>-arglist-kwds))
d9e94c22
MS
1971 :test 'string-equal)))
1972(c-lang-defvar c-specifier-key (c-lang-const c-specifier-key))
a66cd3ee 1973
0386b551
AM
1974(c-lang-defconst c-postfix-spec-kwds
1975 ;; Keywords that can occur after argument list of a function header
1976 ;; declaration, i.e. in the "K&R region".
1977 t (append (c-lang-const c-postfix-decl-spec-kwds)
1978 (c-lang-const c-decl-hangon-kwds)))
1979
1980(c-lang-defconst c-not-decl-init-keywords
1981 ;; Adorned regexp matching all keywords that can't appear at the
1982 ;; start of a declaration.
1983 t (c-make-keywords-re t
1984 (set-difference (c-lang-const c-keywords)
1985 (append (c-lang-const c-type-start-kwds)
1986 (c-lang-const c-prefix-spec-kwds))
1987 :test 'string-equal)))
1988(c-lang-defvar c-not-decl-init-keywords
1989 (c-lang-const c-not-decl-init-keywords))
1990
b248a85d
AM
1991(c-lang-defconst c-not-primitive-type-keywords
1992 "List of all keywords apart from primitive types (like \"int\")."
1993 t (set-difference (c-lang-const c-keywords)
1994 (c-lang-const c-primitive-type-kwds)
1995 :test 'string-equal)
1996 ;; The "more" for C++ is the QT keyword (as in "more slots:").
1997 ;; This variable is intended for use in c-beginning-of-statement-1.
1998 c++ (append (c-lang-const c-not-primitive-type-keywords) '("more")))
1999
2000(c-lang-defconst c-not-primitive-type-keywords-regexp
2001 t (c-make-keywords-re t
2002 (c-lang-const c-not-primitive-type-keywords)))
2003(c-lang-defvar c-not-primitive-type-keywords-regexp
2004 (c-lang-const c-not-primitive-type-keywords-regexp))
2005
d9e94c22 2006(c-lang-defconst c-protection-kwds
0386b551 2007 "Access protection label keywords in classes."
d9e94c22
MS
2008 t nil
2009 c++ '("private" "protected" "public")
2010 objc '("@private" "@protected" "@public"))
a66cd3ee 2011
d9e94c22
MS
2012(c-lang-defconst c-block-decls-with-vars
2013 "Keywords introducing declarations that can contain a block which
2014might be followed by variable declarations, e.g. like \"foo\" in
2015\"class Foo { ... } foo;\". So if there is a block in a declaration
2016like that, it ends with the following ';' and not right away.
130c507e 2017
d9e94c22
MS
2018The keywords on this list are assumed to also be present on one of the
2019`*-decl-kwds' lists."
2020 t nil
2021 (c objc) '("struct" "union" "enum" "typedef")
2022 c++ '("class" "struct" "union" "enum" "typedef"))
2023
2024(c-lang-defconst c-opt-block-decls-with-vars-key
2025 ;; Regexp matching the `c-block-decls-with-vars' keywords, or nil in
2026 ;; languages without such constructs.
2027 t (and (c-lang-const c-block-decls-with-vars)
2028 (c-make-keywords-re t (c-lang-const c-block-decls-with-vars))))
2029(c-lang-defvar c-opt-block-decls-with-vars-key
2030 (c-lang-const c-opt-block-decls-with-vars-key))
2031
2032(c-lang-defconst c-postfix-decl-spec-kwds
2033 "Keywords introducing extra declaration specifiers in the region
2034between the header and the body \(i.e. the \"K&R-region\") in
2035declarations."
2036 t nil
d9e94c22
MS
2037 java '("extends" "implements" "throws")
2038 idl '("context" "getraises" "manages" "primarykey" "raises" "setraises"
2039 "supports"
2040 ;; In CORBA PSDL:
2041 "as" "const" "implements" "of" "ref"))
2042
2043(c-lang-defconst c-nonsymbol-sexp-kwds
2044 "Keywords that may be followed by a nonsymbol sexp before whatever
2045construct it's part of continues."
2046 t nil
2047 (c c++ objc) '("extern"))
2048
2049(c-lang-defconst c-type-list-kwds
2050 "Keywords that may be followed by a comma separated list of type
2051identifiers, where each optionally can be prefixed by keywords. (Can
2052also be used for the special case when the list can contain only one
2053element.)
2054
2055Assumed to be mutually exclusive with `c-ref-list-kwds'. There's no
2056reason to put keywords on this list if they are on `c-type-prefix-kwds'.
2057There's also no reason to add keywords that prefix a normal
2058declaration consisting of a type followed by a declarator (list), so
2059the keywords on `c-modifier-kwds' should normally not be listed here
0386b551 2060either.
d9e94c22
MS
2061
2062Note: Use `c-typeless-decl-kwds' for keywords followed by a function
2063or variable identifier (that's being defined)."
0386b551 2064 t nil
fa14078b 2065 c++ '("operator")
0386b551 2066 objc '("@class")
452ea855 2067 java '("import" "new" "extends" "super" "implements" "throws")
0386b551
AM
2068 idl '("manages" "native" "primarykey" "supports"
2069 ;; In CORBA PSDL:
2070 "as" "implements" "of" "scope")
2071 pike '("inherit"))
d9e94c22
MS
2072
2073(c-lang-defconst c-ref-list-kwds
2074 "Keywords that may be followed by a comma separated list of
2075reference (i.e. namespace/scope/module) identifiers, where each
2076optionally can be prefixed by keywords. (Can also be used for the
2077special case when the list can contain only one element.) Assumed to
2078be mutually exclusive with `c-type-list-kwds'.
2079
2080Note: Use `c-typeless-decl-kwds' for keywords followed by a function
2081or variable identifier (that's being defined)."
2082 t nil
2083 c++ '("namespace")
2084 java '("package")
2085 idl '("import" "module"
2086 ;; In CORBA CIDL:
2087 "composition")
2088 pike '("import"))
2089
2090(c-lang-defconst c-colon-type-list-kwds
2091 "Keywords that may be followed (not necessarily directly) by a colon
2092and then a comma separated list of type identifiers, where each
2093optionally can be prefixed by keywords. (Can also be used for the
2094special case when the list can contain only one element.)"
2095 t nil
2096 c++ '("class" "struct")
2097 idl '("component" "eventtype" "home" "interface" "valuetype"
2098 ;; In CORBA PSDL:
2099 "storagehome" "storagetype"))
2100
2101(c-lang-defconst c-colon-type-list-re
2102 "Regexp matched after the keywords in `c-colon-type-list-kwds' to skip
2103forward to the colon. The end of the match is assumed to be directly
0386b551
AM
2104after the colon, so the regexp should end with \":\". Must be a
2105regexp if `c-colon-type-list-kwds' isn't nil."
d9e94c22
MS
2106 t (if (c-lang-const c-colon-type-list-kwds)
2107 ;; Disallow various common punctuation chars that can't come
2108 ;; before the ":" that starts the inherit list after "class"
2109 ;; or "struct" in C++. (Also used as default for other
2110 ;; languages.)
2111 "[^\]\[{}();,/#=:]*:"))
2112(c-lang-defvar c-colon-type-list-re (c-lang-const c-colon-type-list-re))
2113
2114(c-lang-defconst c-paren-nontype-kwds
2115 "Keywords that may be followed by a parenthesis expression that doesn't
2116contain type identifiers."
2117 t nil
0386b551
AM
2118 (c c++) '(;; GCC extension.
2119 "__attribute__"
2120 ;; MSVC extension.
2121 "__declspec"))
d9e94c22
MS
2122
2123(c-lang-defconst c-paren-type-kwds
2124 "Keywords that may be followed by a parenthesis expression containing
2125type identifiers separated by arbitrary tokens."
2126 t nil
2127 c++ '("throw")
2128 objc '("@defs")
2129 idl '("switch")
2130 pike '("array" "function" "int" "mapping" "multiset" "object" "program"))
2131
2132(c-lang-defconst c-paren-any-kwds
2133 t (delete-duplicates (append (c-lang-const c-paren-nontype-kwds)
2134 (c-lang-const c-paren-type-kwds))
2135 :test 'string-equal))
2136
2137(c-lang-defconst c-<>-type-kwds
2138 "Keywords that may be followed by an angle bracket expression
2139containing type identifiers separated by \",\". The difference from
2140`c-<>-arglist-kwds' is that unknown names are taken to be types and
2141not other identifiers. `c-recognize-<>-arglists' is assumed to be set
2142if this isn't nil."
2143 t nil
2144 objc '("id")
2145 idl '("sequence"
2146 ;; In CORBA PSDL:
2147 "ref"))
2148
2149(c-lang-defconst c-<>-arglist-kwds
2150 "Keywords that can be followed by a C++ style template arglist; see
2151`c-recognize-<>-arglists' for details. That language constant is
2152assumed to be set if this isn't nil."
2153 t nil
2154 c++ '("template")
2155 idl '("fixed" "string" "wstring"))
2156
2157(c-lang-defconst c-<>-sexp-kwds
2158 ;; All keywords that can be followed by an angle bracket sexp.
2159 t (delete-duplicates (append (c-lang-const c-<>-type-kwds)
2160 (c-lang-const c-<>-arglist-kwds))
2161 :test 'string-equal))
2162
2163(c-lang-defconst c-opt-<>-sexp-key
2164 ;; Adorned regexp matching keywords that can be followed by an angle
846f5040 2165 ;; bracket sexp. Always set when `c-recognize-<>-arglists' is.
d9e94c22
MS
2166 t (if (c-lang-const c-recognize-<>-arglists)
2167 (c-make-keywords-re t (c-lang-const c-<>-sexp-kwds))))
2168(c-lang-defvar c-opt-<>-sexp-key (c-lang-const c-opt-<>-sexp-key))
2169
2170(c-lang-defconst c-brace-id-list-kwds
2171 "Keywords that may be followed by a brace block containing a comma
2172separated list of identifier definitions, i.e. like the list of
2173identifiers that follows the type in a normal declaration."
2174 t (c-lang-const c-brace-list-decl-kwds))
a66cd3ee 2175
a66cd3ee 2176(c-lang-defconst c-block-stmt-1-kwds
d9e94c22
MS
2177 "Statement keywords followed directly by a substatement."
2178 t '("do" "else")
2179 c++ '("do" "else" "try")
9555a4cf 2180 objc '("do" "else" "@finally" "@try")
d9e94c22
MS
2181 java '("do" "else" "finally" "try")
2182 idl nil)
a66cd3ee 2183
a66cd3ee 2184(c-lang-defconst c-block-stmt-1-key
d9e94c22
MS
2185 ;; Regexp matching the start of any statement followed directly by a
2186 ;; substatement (doesn't match a bare block, however).
2187 t (c-make-keywords-re t (c-lang-const c-block-stmt-1-kwds)))
2188(c-lang-defvar c-block-stmt-1-key (c-lang-const c-block-stmt-1-key))
a66cd3ee 2189
a66cd3ee 2190(c-lang-defconst c-block-stmt-2-kwds
d9e94c22
MS
2191 "Statement keywords followed by a paren sexp and then by a substatement."
2192 t '("for" "if" "switch" "while")
2193 c++ '("for" "if" "switch" "while" "catch")
9555a4cf 2194 objc '("for" "if" "switch" "while" "@catch" "@synchronized")
a66cd3ee 2195 java '("for" "if" "switch" "while" "catch" "synchronized")
d9e94c22
MS
2196 idl nil
2197 pike '("for" "if" "switch" "while" "foreach")
2198 awk '("for" "if" "while"))
a66cd3ee 2199
a66cd3ee 2200(c-lang-defconst c-block-stmt-2-key
d9e94c22
MS
2201 ;; Regexp matching the start of any statement followed by a paren sexp
2202 ;; and then by a substatement.
2203 t (c-make-keywords-re t (c-lang-const c-block-stmt-2-kwds)))
2204(c-lang-defvar c-block-stmt-2-key (c-lang-const c-block-stmt-2-key))
a66cd3ee 2205
0386b551
AM
(c-lang-defconst c-block-stmt-kwds
  ;; Union of `c-block-stmt-1-kwds' and `c-block-stmt-2-kwds'.
  ;;
  ;; `delete-duplicates' modifies its argument in place, and `append'
  ;; does not copy its last argument.  The trailing nil forces every
  ;; keyword list to be copied, so the destructive pruning can never
  ;; reach into the list stored for `c-block-stmt-2-kwds'.  (The same
  ;; precaution is taken where `c-keywords' is built.)
  t (delete-duplicates (append (c-lang-const c-block-stmt-1-kwds)
                               (c-lang-const c-block-stmt-2-kwds)
                               nil)
                       :test 'string-equal))
2211
(c-lang-defconst c-opt-block-stmt-key
  ;; Regexp matching the start of any statement that has a
  ;; substatement (except a bare block).  Nil in languages that
  ;; don't have such constructs, i.e. where both
  ;; `c-block-stmt-1-kwds' and `c-block-stmt-2-kwds' are empty.
  t (let ((stmt-kwds (append (c-lang-const c-block-stmt-1-kwds)
                             (c-lang-const c-block-stmt-2-kwds))))
      ;; The combined list is empty exactly when both source lists are.
      (and stmt-kwds
           (c-make-keywords-re t stmt-kwds))))
(c-lang-defvar c-opt-block-stmt-key (c-lang-const c-opt-block-stmt-key))
2222
a66cd3ee 2223(c-lang-defconst c-simple-stmt-kwds
d9e94c22
MS
2224 "Statement keywords followed by an expression or nothing."
2225 t '("break" "continue" "goto" "return")
9555a4cf 2226 objc '("break" "continue" "goto" "return" "@throw")
a66cd3ee
MS
2227 ;; Note: `goto' is not valid in Java, but the keyword is still reserved.
2228 java '("break" "continue" "goto" "return" "throw")
d9e94c22
MS
2229 idl nil
2230 pike '("break" "continue" "return")
2231 awk '(;; Not sure about "delete", "exit", "getline", etc. ; ACM 2002/5/30
2232 "break" "continue" "return" "delete" "exit" "getline" "next"
2233 "nextfile" "print" "printf"))
2234
2235(c-lang-defconst c-simple-stmt-key
2236 ;; Adorned regexp matching `c-simple-stmt-kwds'.
2237 t (c-make-keywords-re t (c-lang-const c-simple-stmt-kwds)))
2238(c-lang-defvar c-simple-stmt-key (c-lang-const c-simple-stmt-key))
2239
2240(c-lang-defconst c-paren-stmt-kwds
2241 "Statement keywords followed by a parenthesis expression that
2242nevertheless contains a list separated with ';' and not ','."
2243 t '("for")
2244 idl nil)
2245
2246(c-lang-defconst c-paren-stmt-key
2247 ;; Adorned regexp matching `c-paren-stmt-kwds'.
2248 t (c-make-keywords-re t (c-lang-const c-paren-stmt-kwds)))
2249(c-lang-defvar c-paren-stmt-key (c-lang-const c-paren-stmt-key))
a66cd3ee 2250
a66cd3ee 2251(c-lang-defconst c-asm-stmt-kwds
d9e94c22
MS
2252 "Statement keywords followed by an assembler expression."
2253 t nil
2254 (c c++) '("asm" "__asm__")) ;; Not standard, but common.
a66cd3ee 2255
(c-lang-defconst c-opt-asm-stmt-key
  ;; Regexp matching the start of an assembler statement, built from
  ;; `c-asm-stmt-kwds'.  Nil in languages that don't support that.
  t (let ((asm-kwds (c-lang-const c-asm-stmt-kwds)))
      (and asm-kwds
           (c-make-keywords-re t asm-kwds))))
(c-lang-defvar c-opt-asm-stmt-key (c-lang-const c-opt-asm-stmt-key))
2262
d28e7f28
AM
2263(c-lang-defconst c-case-kwds
2264 "The keyword\(s) which introduce a \"case\" like construct.
2265This construct is \"<keyword> <expression> :\"."
2266 t '("case")
2267 awk nil)
2268
2269(c-lang-defconst c-case-kwds-regexp
2270 ;; Adorned regexp matching any "case"-like keyword.
2271 t (c-make-keywords-re t (c-lang-const c-case-kwds)))
2272(c-lang-defvar c-case-kwds-regexp (c-lang-const c-case-kwds-regexp))
2273
d9e94c22 2274(c-lang-defconst c-label-kwds
0386b551 2275 "Keywords introducing colon terminated labels in blocks."
898169a2 2276 t '("case" "default"))
d9e94c22 2277
0386b551
AM
2278(c-lang-defconst c-label-kwds-regexp
2279 ;; Adorned regexp matching any keyword that introduces a label.
2280 t (c-make-keywords-re t (c-lang-const c-label-kwds)))
2281(c-lang-defvar c-label-kwds-regexp (c-lang-const c-label-kwds-regexp))
2282
d9e94c22
MS
2283(c-lang-defconst c-before-label-kwds
2284 "Keywords that might be followed by a label identifier."
2285 t '("goto")
2286 (java pike) (append '("break" "continue")
2287 (c-lang-const c-before-label-kwds))
2288 idl nil
2289 awk nil)
130c507e 2290
d9e94c22
MS
2291(c-lang-defconst c-constant-kwds
2292 "Keywords for constants."
2293 t nil
2294 (c c++) '("NULL" ;; Not a keyword, but practically works as one.
2295 "false" "true") ; Defined in C99.
f0e4b2f2 2296 objc '("nil" "Nil" "YES" "NO" "NS_DURING" "NS_HANDLER" "NS_ENDHANDLER")
d9e94c22 2297 idl '("TRUE" "FALSE")
fbd4de65 2298 java '("true" "false" "null") ; technically "literals", not keywords
d9e94c22
MS
2299 pike '("UNDEFINED")) ;; Not a keyword, but practically works as one.
2300
2301(c-lang-defconst c-primary-expr-kwds
2302 "Keywords besides constants and operators that start primary expressions."
2303 t nil
2304 c++ '("operator" "this")
2305 objc '("super" "self")
2306 java '("this")
2307 pike '("this")) ;; Not really a keyword, but practically works as one.
130c507e 2308
a66cd3ee 2309(c-lang-defconst c-expr-kwds
d9e94c22
MS
2310 ;; Keywords that can occur anywhere in expressions. Built from
2311 ;; `c-primary-expr-kwds' and all keyword operators in `c-operators'.
2312 t (delete-duplicates
2313 (append (c-lang-const c-primary-expr-kwds)
0386b551
AM
2314 (c-filter-ops (c-lang-const c-operator-list)
2315 t
2316 "\\`\\(\\w\\|\\s_\\)+\\'"))
d9e94c22
MS
2317 :test 'string-equal))
2318
2319(c-lang-defconst c-lambda-kwds
2320 "Keywords that start lambda constructs, i.e. function definitions in
2321expressions."
2322 t nil
2323 pike '("lambda"))
a66cd3ee 2324
d9e94c22
MS
2325(c-lang-defconst c-inexpr-block-kwds
2326 "Keywords that start constructs followed by statement blocks which can
2327be used in expressions \(the gcc extension for this in C and C++ is
0386b551 2328handled separately by `c-recognize-paren-inexpr-blocks')."
d9e94c22
MS
2329 t nil
2330 pike '("catch" "gauge"))
a66cd3ee 2331
a66cd3ee 2332(c-lang-defconst c-inexpr-class-kwds
d9e94c22
MS
2333 "Keywords that can start classes inside expressions."
2334 t nil
a66cd3ee
MS
2335 java '("new")
2336 pike '("class"))
2337
d9e94c22
MS
2338(c-lang-defconst c-inexpr-brace-list-kwds
2339 "Keywords that can start brace list blocks inside expressions.
2340Note that Java specific rules are currently applied to tell this from
2341`c-inexpr-class-kwds'."
2342 t nil
2343 java '("new"))
2344
(c-lang-defconst c-opt-inexpr-brace-list-key
  ;; Regexp matching the start of a brace list in an expression, or
  ;; nil in languages that don't have such things.  This should not
  ;; match brace lists recognized through `c-special-brace-lists'.
  ;; It is built from `c-inexpr-brace-list-kwds'.
  t (let ((brace-list-kwds (c-lang-const c-inexpr-brace-list-kwds)))
      (if brace-list-kwds
          (c-make-keywords-re t brace-list-kwds))))
(c-lang-defvar c-opt-inexpr-brace-list-key
  (c-lang-const c-opt-inexpr-brace-list-key))
a66cd3ee 2353
(c-lang-defconst c-decl-block-key
  ;; Regexp matching keywords in any construct that contain another
  ;; declaration level, i.e. that isn't followed by a function block
  ;; or brace list.  When the first submatch matches, it's an
  ;; unambiguous construct, otherwise it's an ambiguous match that
  ;; might also be the return type of a function declaration.
  ;;
  ;; A keyword counts as ambiguous when it is also found on
  ;; `c-type-start-kwds'.
  t (let* ((block-kwds (append (c-lang-const c-class-decl-kwds)
                               (c-lang-const c-other-block-decl-kwds)
                               (c-lang-const c-inexpr-class-kwds)))
           (type-start-kwds (c-lang-const c-type-start-kwds))
           ;; The unambiguous alternative always comes first, so it
           ;; is the one that owns the first submatch.
           (certain-re (c-make-keywords-re t
                         (set-difference block-kwds type-start-kwds
                                         :test 'string-equal)))
           (uncertain-kwds (intersection block-kwds type-start-kwds
                                         :test 'string-equal)))
      (if uncertain-kwds
          (concat certain-re
                  "\\|"
                  (c-make-keywords-re t uncertain-kwds))
        certain-re)))
(c-lang-defvar c-decl-block-key (c-lang-const c-decl-block-key))
2375
a66cd3ee 2376(c-lang-defconst c-bitfield-kwds
d9e94c22
MS
2377 "Keywords that can introduce bitfields."
2378 t nil
2379 (c c++ objc) '("char" "int" "long" "signed" "unsigned"))
a66cd3ee 2380
a66cd3ee 2381(c-lang-defconst c-opt-bitfield-key
d9e94c22
MS
2382 ;; Regexp matching the start of a bitfield (not uniquely), or nil in
2383 ;; languages without bitfield support.
2384 t nil
2385 (c c++) (c-make-keywords-re t (c-lang-const c-bitfield-kwds)))
2386(c-lang-defvar c-opt-bitfield-key (c-lang-const c-opt-bitfield-key))
2387
2388(c-lang-defconst c-other-kwds
2389 "Keywords not accounted for by any other `*-kwds' language constant."
2390 t nil
2391 idl '("truncatable"
2392 ;; In CORBA CIDL: (These are declaration keywords that never
2393 ;; can start a declaration.)
2394 "entity" "process" "service" "session" "storage"))
2395
2396\f
2397;;; Constants built from keywords.
2398
2399;; Note: No `*-kwds' language constants may be defined below this point.
2400
2401(eval-and-compile
2402 (defconst c-kwds-lang-consts
2403 ;; List of all the language constants that contain keyword lists.
2404 (let (list)
2405 (mapatoms (lambda (sym)
2406 (when (and (boundp sym)
2407 (string-match "-kwds\\'" (symbol-name sym)))
2408 ;; Make the list of globally interned symbols
2409 ;; instead of ones interned in `c-lang-constants'.
2410 (setq list (cons (intern (symbol-name sym)) list))))
2411 c-lang-constants)
2412 list)))
a66cd3ee 2413
a66cd3ee 2414(c-lang-defconst c-keywords
d9e94c22
MS
2415 ;; All keywords as a list.
2416 t (delete-duplicates
2417 (c-lang-defconst-eval-immediately
2418 `(append ,@(mapcar (lambda (kwds-lang-const)
2419 `(c-lang-const ,kwds-lang-const))
2420 c-kwds-lang-consts)
2421 nil))
2422 :test 'string-equal))
2423
a66cd3ee 2424(c-lang-defconst c-keywords-regexp
d9e94c22
MS
2425 ;; All keywords as an adorned regexp.
2426 t (c-make-keywords-re t (c-lang-const c-keywords)))
2427(c-lang-defvar c-keywords-regexp (c-lang-const c-keywords-regexp))
2428
(c-lang-defconst c-keyword-member-alist
  ;; An alist with all the keywords in the cars.  The cdr for each
  ;; keyword is a list of the symbols for the `*-kwds' lists that
  ;; contain it.
  t (let ((kwds-by-const
           ;; One (SYMBOL . KEYWORD-LIST) pair for every constant
           ;; named in `c-kwds-lang-consts'.
           (c-lang-defconst-eval-immediately
            `(list ,@(mapcar (lambda (kwds-lang-const)
                               `(cons ',kwds-lang-const
                                      (c-lang-const ,kwds-lang-const)))
                             c-kwds-lang-consts))))
          members)
      (dolist (group kwds-by-const)
        (let ((const-sym (car group)))
          (dolist (kwd-string (cdr group))
            (let ((entry (assoc kwd-string members)))
              ;; First sighting of this keyword: start a new entry
              ;; at the front of the result.
              (unless entry
                (setq entry (list kwd-string)
                      members (cons entry members)))
              ;; Record the constant once per keyword.
              (unless (memq const-sym (cdr entry))
                (setcdr entry (cons const-sym (cdr entry))))))))
      members))
2453
(c-lang-defvar c-keywords-obarray
  ;; An obarray containing all keywords as symbols.  The property list
  ;; of each symbol has a non-nil entry for the specific `*-kwds'
  ;; lists it's a member of.
  ;;
  ;; E.g. to see whether the string str contains a keyword on
  ;; `c-class-decl-kwds', one can do like this:
  ;;     (get (intern-soft str c-keywords-obarray) 'c-class-decl-kwds)
  ;; Which preferably is written using the associated functions in
  ;; cc-engine:
  ;;     (c-keyword-member (c-keyword-sym str) 'c-class-decl-kwds)

  ;; The obarray is not stored directly as a language constant since
  ;; the printed representation for obarrays used in .elc files isn't
  ;; complete.

  (let* ((alist (c-lang-const c-keyword-member-alist))
         kwd lang-const-list
         ;; The local is deliberately not called `obarray': that name
         ;; is a special variable, and binding it here would redirect
         ;; every default `intern'/`read' for the duration of the form.
         ;;
         ;; The size is clamped to at least one slot since a
         ;; zero-length vector is not a usable obarray, which would
         ;; break lookups for a language that defines no keywords.
         (kwd-obarray (make-vector (max 1 (* (length alist) 2)) 0)))
    (while alist
      (setq kwd (caar alist)
            lang-const-list (cdar alist)
            alist (cdr alist))
      ;; The plist becomes (LANG-CONST t LANG-CONST t ...).
      (setplist (intern kwd kwd-obarray)
                ;; Emacs has an odd bug that causes `mapcan' to fail
                ;; with unintelligible errors.  (XEmacs works.)
                ;;(mapcan (lambda (lang-const)
                ;;              (list lang-const t))
                ;;        lang-const-list)
                (apply 'nconc (mapcar (lambda (lang-const)
                                        (list lang-const t))
                                      lang-const-list))))
    kwd-obarray))
(c-lang-defconst c-regular-keywords-regexp
  ;; Adorned regexp matching all keywords that should be fontified
  ;; with the keywords face.  I.e. that aren't types or constants.
  t (let ((non-regular-kwds (append (c-lang-const c-primitive-type-kwds)
                                    (c-lang-const c-constant-kwds))))
      ;; Everything on `c-keywords' except the primitive types and the
      ;; constants collected above.
      (c-make-keywords-re t
        (set-difference (c-lang-const c-keywords)
                        non-regular-kwds
                        :test 'string-equal))))
(c-lang-defvar c-regular-keywords-regexp
  (c-lang-const c-regular-keywords-regexp))
2498
d9e94c22
MS
(c-lang-defconst c-primary-expr-regexp
  ;; Regexp matching the start of any primary expression, i.e. any
  ;; literal, symbol, prefix operator, and '('.  It doesn't need to
  ;; exclude keywords; they are excluded afterwards unless the second
  ;; submatch matches.  If the first but not the second submatch
  ;; matches then it is an ambiguous primary expression; it could also
  ;; be a match of e.g. an infix operator.  (The case with ambiguous
  ;; keyword operators isn't handled.)

  t (let* ((prefix-ops
            (c-filter-ops (c-lang-const c-operators)
                          '(prefix)
                          (lambda (op)
                            ;; Filter out the special case prefix
                            ;; operators that are close parens.
                            (not (string-match "\\s)" op)))))

           ;; The prefix operators made up solely of punctuation and
           ;; paren syntax characters.
           (nonkeyword-prefix-ops
            (c-filter-ops prefix-ops
                          t
                          "\\`\\(\\s.\\|\\s(\\|\\s)\\)+\\'"))

           (in-or-postfix-ops
            (c-filter-ops (c-lang-const c-operators)
                          '(postfix
                            postfix-if-paren
                            left-assoc
                            right-assoc
                            right-assoc-sequence)
                          t))

           ;; Non-keyword prefix operators that can only be prefix
           ;; operators ...
           (unambiguous-prefix-ops (set-difference nonkeyword-prefix-ops
                                                   in-or-postfix-ops
                                                   :test 'string-equal))
           ;; ... and those that also occur as infix or postfix
           ;; operators.
           (ambiguous-prefix-ops (intersection nonkeyword-prefix-ops
                                               in-or-postfix-ops
                                               :test 'string-equal)))

      (concat
       "\\("
       ;; Take out all symbol class operators from `prefix-ops' and make the
       ;; first submatch from them together with `c-primary-expr-kwds'.
       (c-make-keywords-re t
         (append (c-lang-const c-primary-expr-kwds)
                 (set-difference prefix-ops nonkeyword-prefix-ops
                                 :test 'string-equal)))

       "\\|"
       ;; Match all ambiguous operators.
       (c-make-keywords-re nil ambiguous-prefix-ops)
       "\\)"

       "\\|"
       ;; Now match all other symbols.
       (c-lang-const c-symbol-start)

       "\\|"
       ;; The chars that can start integer and floating point
       ;; constants.
       "\\.?[0-9]"

       "\\|"
       ;; The unambiguous operators from `prefix-ops'.
       (c-make-keywords-re nil unambiguous-prefix-ops)

       "\\|"
       ;; Match string and character literals.
       "\\s\""
       (if (memq 'gen-string-delim c-emacs-features)
           "\\|\\s|"
         ""))))
(c-lang-defvar c-primary-expr-regexp (c-lang-const c-primary-expr-regexp))
a66cd3ee 2575
d9e94c22
MS
2576\f
2577;;; Additional constants for parser-level constructs.
2578
2579(c-lang-defconst c-decl-prefix-re
0386b551
AM
2580 "Regexp matching something that might precede a declaration, cast or
2581label, such as the last token of a preceding statement or declaration.
2582This is used in the common situation where a declaration or cast
2583doesn't start with any specific token that can be searched for.
2584
2585The regexp should not match bob; that is done implicitly. It can't
2586require a match longer than one token. The end of the token is taken
2587to be at the end of the first submatch, which is assumed to always
2588match. It's undefined whether identifier syntax (see
2589`c-identifier-syntax-table') is in effect or not. This regexp is
2590assumed to be a superset of `c-label-prefix-re' if
2591`c-recognize-colon-labels' is set.
2592
2593Besides this, `c-decl-start-kwds' is used to find declarations.
2594
2595Note: This variable together with `c-decl-start-re' and
2596`c-decl-start-kwds' is only used to detect \"likely\"
2597declaration/cast/label starts. I.e. they might produce more matches
2598but should not miss anything (or else it's necessary to use text
2599properties - see the next note). Wherever they match, the following
2600construct is analyzed to see if it indeed is a declaration, cast or
2601label. That analysis is not cheap, so it's important that not too
2602many false matches are triggered.
2603
2604Note: If a declaration/cast/label start can't be detected with this
2605variable, it's necessary to use the `c-type' text property with the
2606value `c-decl-end' on the last char of the last token preceding the
2607declaration. See the comment blurb at the start of cc-engine.el for
2608more info."
2609
d9e94c22
MS
2610 ;; We match a sequence of characters to skip over things like \"};\"
2611 ;; more quickly. We match ")" in C for K&R region declarations, and
2612 ;; in all languages except Java for when a cpp macro definition
2613 ;; begins with a declaration.
2614 t "\\([\{\}\(\);,]+\\)"
452ea855 2615 java "\\([\{\}\(;,<]+\\)"
d9e94c22
MS
2616 ;; Match "<" in C++ to get the first argument in a template arglist.
2617 ;; In that case there's an additional check in `c-find-decl-spots'
2618 ;; that it got open paren syntax.
0386b551 2619 c++ "\\([\{\}\(\);,<]+\\)"
d9e94c22
MS
2620 ;; Additionally match the protection directives in Objective-C.
2621 ;; Note that this doesn't cope with the longer directives, which we
2622 ;; would have to match from start to end since they don't end with
2623 ;; any easily recognized characters.
2624 objc (concat "\\([\{\}\(\);,]+\\|"
2625 (c-make-keywords-re nil (c-lang-const c-protection-kwds))
2626 "\\)")
d9e94c22
MS
2627 ;; Pike is like C but we also match "[" for multiple value
2628 ;; assignments and type casts.
2629 pike "\\([\{\}\(\)\[;,]+\\)")
2630(c-lang-defvar c-decl-prefix-re (c-lang-const c-decl-prefix-re)
2631 'dont-doc)
2632
0386b551
AM
2633(c-lang-defconst c-decl-start-re
2634 "Regexp matching the start of any declaration, cast or label.
2635It's used on the token after the one `c-decl-prefix-re' matched. This
2636regexp should not try to match those constructs accurately as it's
2637only used as a sieve to avoid spending more time checking other
2638constructs."
2639 t (c-lang-const c-identifier-start))
2640(c-lang-defvar c-decl-start-re (c-lang-const c-decl-start-re))
2641
(c-lang-defconst c-decl-prefix-or-start-re
  ;; Regexp matching something that might precede or start a
  ;; declaration, cast or label.
  ;;
  ;; If the first submatch matches, it's taken to match the end of a
  ;; token that might precede such a construct, e.g. ';', '}' or '{'.
  ;; It's built from `c-decl-prefix-re'.
  ;;
  ;; If the first submatch did not match, the match of the whole
  ;; regexp is taken to be at the first token in the declaration.
  ;; `c-decl-start-re' is not checked in this case.
  ;;
  ;; Design note: The reason the same regexp is used to match both
  ;; tokens that precede declarations and start them is to avoid an
  ;; extra regexp search from the previous declaration spot in
  ;; `c-find-decl-spots'.  Users of `c-find-decl-spots' also count on
  ;; that it finds all declaration/cast/label starts in approximately
  ;; linear order, so we can't do the searches in two separate passes.
  t (let ((prefix-re (c-lang-const c-decl-prefix-re))
          (start-kwds (c-lang-const c-decl-start-kwds)))
      ;; Without any declaration start keywords the prefix regexp is
      ;; used unchanged.
      (if start-kwds
          (concat prefix-re
                  "\\|"
                  (c-make-keywords-re t start-kwds))
        prefix-re)))
(c-lang-defvar c-decl-prefix-or-start-re
  (c-lang-const c-decl-prefix-or-start-re)
  'dont-doc)
2668
d9e94c22
MS
2669(c-lang-defconst c-cast-parens
2670 ;; List containing the paren characters that can open a cast, or nil in
2671 ;; languages without casts.
0386b551
AM
2672 t (c-filter-ops (c-lang-const c-operators)
2673 '(prefix)
2674 "\\`\\s\(\\'"
2675 (lambda (op) (elt op 0))))
d9e94c22
MS
2676(c-lang-defvar c-cast-parens (c-lang-const c-cast-parens))
2677
0386b551
AM
2678(c-lang-defconst c-block-prefix-disallowed-chars
2679 "List of syntactically relevant characters that never can occur before
2680the open brace in any construct that contains a brace block, e.g. in
2681the \"class Foo: public Bar\" part of:
2682
2683 class Foo: public Bar {int x();} a, *b;
2684
2685If parens can occur, the chars inside those aren't filtered with this
2686list.
2687
2688'<' and '>' should be disallowed even if angle bracket arglists can
2689occur. That since the search function needs to stop at them anyway to
2690ensure they are given paren syntax.
2691
2692This is used to skip backward from the open brace to find the region
2693in which to look for a construct like \"class\", \"enum\",
2694\"namespace\" or whatever. That skipping should be as tight as
2695possible for good performance."
2696
2697 ;; Default to all chars that only occurs in nonsymbol tokens outside
2698 ;; identifiers.
2699 t (set-difference
2700 (c-lang-const c-nonsymbol-token-char-list)
2701 (c-filter-ops (append (c-lang-const c-identifier-ops)
2702 (list (cons nil
2703 (c-lang-const c-after-id-concat-ops))))
2704 t
2705 t
2706 (lambda (op)
2707 (let ((pos 0) res)
2708 (while (string-match "\\(\\s.\\|\\s(\\|\\s)\\)"
2709 op pos)
2710 (setq res (cons (aref op (match-beginning 1)) res)
2711 pos (match-end 0)))
2712 res))))
2713
e1dbe924 2714 ;; Allow cpp operations (where applicable).
0386b551
AM
2715 t (if (c-lang-const c-opt-cpp-prefix)
2716 (set-difference (c-lang-const c-block-prefix-disallowed-chars)
2717 '(?#))
2718 (c-lang-const c-block-prefix-disallowed-chars))
2719
2720 ;; Allow ':' for inherit list starters.
2721 (c++ objc idl) (set-difference (c-lang-const c-block-prefix-disallowed-chars)
2722 '(?:))
2723
2724 ;; Allow ',' for multiple inherits.
2725 (c++ java) (set-difference (c-lang-const c-block-prefix-disallowed-chars)
2726 '(?,))
2727
2728 ;; Allow parentheses for anonymous inner classes in Java and class
2729 ;; initializer lists in Pike.
2730 (java pike) (set-difference (c-lang-const c-block-prefix-disallowed-chars)
2731 '(?\( ?\)))
2732
2733 ;; Allow '"' for extern clauses (e.g. extern "C" {...}).
2734 (c c++ objc) (set-difference (c-lang-const c-block-prefix-disallowed-chars)
2735 '(?\" ?')))
2736
2737(c-lang-defconst c-block-prefix-charset
2738 ;; `c-block-prefix-disallowed-chars' as an inverted charset suitable
2739 ;; for `c-syntactic-skip-backward'.
2740 t (c-make-bare-char-alt (c-lang-const c-block-prefix-disallowed-chars) t))
2741(c-lang-defvar c-block-prefix-charset (c-lang-const c-block-prefix-charset))
2742
d9e94c22 2743(c-lang-defconst c-type-decl-prefix-key
0386b551
AM
2744 "Regexp matching the declarator operators that might precede the
2745identifier in a declaration, e.g. the \"*\" in \"char *argv\". This
2746regexp should match \"(\" if parentheses are valid in declarators.
2747The end of the first submatch is taken as the end of the operator.
2748Identifier syntax is in effect when this is matched \(see
2749`c-identifier-syntax-table')."
d9e94c22 2750 t (if (c-lang-const c-type-modifier-kwds)
0386b551 2751 (concat (regexp-opt (c-lang-const c-type-modifier-kwds) t) "\\>")
d9e94c22
MS
2752 ;; Default to a regexp that never matches.
2753 "\\<\\>")
0386b551
AM
2754 ;; Check that there's no "=" afterwards to avoid matching tokens
2755 ;; like "*=".
d9e94c22
MS
2756 (c objc) (concat "\\("
2757 "[*\(]"
2758 "\\|"
2759 (c-lang-const c-type-decl-prefix-key)
2760 "\\)"
2761 "\\([^=]\\|$\\)")
2762 c++ (concat "\\("
2763 "[*\(&]"
2764 "\\|"
7f0789c9
AM
2765 (c-lang-const c-type-decl-prefix-key)
2766 "\\|"
2767 (concat "\\(" ; 3
d9e94c22
MS
2768 ;; If this matches there's special treatment in
2769 ;; `c-font-lock-declarators' and
2770 ;; `c-font-lock-declarations' that check for a
2771 ;; complete name followed by ":: *".
2772 (c-lang-const c-identifier-start)
2773 "\\)")
d9e94c22
MS
2774 "\\)"
2775 "\\([^=]\\|$\\)")
0386b551 2776 pike "\\(\\*\\)\\([^=]\\|$\\)")
d9e94c22
MS
2777(c-lang-defvar c-type-decl-prefix-key (c-lang-const c-type-decl-prefix-key)
2778 'dont-doc)
2779
2780(c-lang-defconst c-type-decl-suffix-key
0386b551
AM
2781 "Regexp matching the declarator operators that might follow after the
2782identifier in a declaration, e.g. the \"[\" in \"char argv[]\". This
2783regexp should match \")\" if parentheses are valid in declarators. If
d9e94c22
MS
2784it matches an open paren of some kind, the type declaration check
2785continues at the corresponding close paren, otherwise the end of the
2786first submatch is taken as the end of the operator. Identifier syntax
2787is in effect when this is matched (see `c-identifier-syntax-table')."
2788 ;; Default to a regexp that matches `c-type-modifier-kwds' and a
2789 ;; function argument list parenthesis.
2790 t (if (c-lang-const c-type-modifier-kwds)
2791 (concat "\\(\(\\|"
0386b551 2792 (regexp-opt (c-lang-const c-type-modifier-kwds) t) "\\>"
d9e94c22
MS
2793 "\\)")
2794 "\\(\(\\)")
2795 (c c++ objc) (concat
2796 "\\("
2797 "[\)\[\(]"
0386b551
AM
2798 (if (c-lang-const c-type-modifier-kwds)
2799 (concat
2800 "\\|"
2801 ;; "throw" in `c-type-modifier-kwds' is followed
2802 ;; by a parenthesis list, but no extra measures
2803 ;; are necessary to handle that.
2804 (regexp-opt (c-lang-const c-type-modifier-kwds) t)
2805 "\\>")
2806 "")
d9e94c22
MS
2807 "\\)")
2808 (java idl) "\\([\[\(]\\)")
2809(c-lang-defvar c-type-decl-suffix-key (c-lang-const c-type-decl-suffix-key)
2810 'dont-doc)
2811
2812(c-lang-defconst c-after-suffixed-type-decl-key
0386b551 2813 "This regexp is matched after a declarator expression where
d9e94c22
MS
2814`c-type-decl-suffix-key' has matched. If it matches then the
2815construct is taken as a declaration. It's typically used to match the
2816beginning of a function body or whatever might occur after the
2817function header in a function declaration or definition. It's
2818undefined whether identifier syntax (see `c-identifier-syntax-table')
2819is in effect or not.
2820
2821Note that it's used in cases like after \"foo (bar)\" so it should
65e7ca35 2822only match when it's certain that it's a declaration, e.g., \"{\" but
d9e94c22
MS
2823not \",\" or \";\"."
2824 t "{"
2825 ;; If K&R style declarations should be recognized then one could
2826 ;; consider to match the start of any symbol since we want to match
2827 ;; the start of the first declaration in the "K&R region". That
2828 ;; could however produce false matches on code like "FOO(bar) x"
2829 ;; where FOO is a cpp macro, so it's better to leave it out and rely
2830 ;; on the other heuristics in that case.
0386b551
AM
2831 t (if (c-lang-const c-postfix-spec-kwds)
2832 ;; Add on the keywords in `c-postfix-spec-kwds'.
d9e94c22
MS
2833 (concat (c-lang-const c-after-suffixed-type-decl-key)
2834 "\\|"
0386b551 2835 (c-make-keywords-re t (c-lang-const c-postfix-spec-kwds)))
d9e94c22
MS
2836 (c-lang-const c-after-suffixed-type-decl-key))
2837 ;; Also match the colon that starts a base class initializer list in
2838 ;; C++. That can be confused with a function call before the colon
2839 ;; in a ? : operator, but we count on that `c-decl-prefix-re' won't
2840 ;; match before such a thing (as a declaration-level construct;
2841 ;; matches inside arglist contexts are already excluded).
2842 c++ "[{:]")
2843(c-lang-defvar c-after-suffixed-type-decl-key
2844 (c-lang-const c-after-suffixed-type-decl-key)
2845 'dont-doc)
2846
2847(c-lang-defconst c-after-suffixed-type-maybe-decl-key
2848 ;; Regexp that in addition to `c-after-suffixed-type-decl-key'
2849 ;; matches ";" and ",".
2850 t (concat "\\(" (c-lang-const c-after-suffixed-type-decl-key) "\\)"
2851 "\\|[;,]"))
2852(c-lang-defvar c-after-suffixed-type-maybe-decl-key
2853 (c-lang-const c-after-suffixed-type-maybe-decl-key))
2854
2855(c-lang-defconst c-opt-type-concat-key
2856 "Regexp matching operators that concatenate types, e.g. the \"|\" in
2857\"int|string\" in Pike. The end of the first submatch is taken as the
2858end of the operator. nil in languages without such operators. It's
2859undefined whether identifier syntax (see `c-identifier-syntax-table')
2860is in effect or not."
2861 t nil
2862 pike "\\([|.&]\\)\\($\\|[^|.&]\\)")
2863(c-lang-defvar c-opt-type-concat-key (c-lang-const c-opt-type-concat-key)
2864 'dont-doc)
2865
2866(c-lang-defconst c-opt-type-suffix-key
2867 "Regexp matching operators that might follow after a type, or nil in
2868languages that don't have such operators. The end of the first
2869submatch is taken as the end of the operator. This should not match
2870things like C++ template arglists if `c-recognize-<>-arglists' is set.
2871It's undefined whether identifier syntax (see `c-identifier-syntax-table')
2872is in effect or not."
2873 t nil
2874 (c c++ objc pike) "\\(\\.\\.\\.\\)"
452ea855 2875 java (concat "\\(\\[" (c-lang-const c-simple-ws) "*\\]\\|\\.\\.\\.\\)"))
d9e94c22
MS
2876(c-lang-defvar c-opt-type-suffix-key (c-lang-const c-opt-type-suffix-key))
2877
(c-lang-defvar c-known-type-key
  ;; Regexp matching the known type identifiers.  This is initialized
  ;; from the type keywords and `*-font-lock-extra-types'.  The first
  ;; submatch is the one that matches the type.  Note that this regexp
  ;; assumes that symbol constituents like '_' and '$' have word
  ;; syntax.
  (let ((extra-types
         (and (boundp (c-mode-symbol "font-lock-extra-types"))
              (c-mode-var "font-lock-extra-types")))
        regexp-strings plain-strings)
    ;; Split the extra types in one pass: entries that contain regexp
    ;; special characters are kept as regexps, the rest are treated as
    ;; literal names and merged with the primitive type keywords.
    (dolist (type-re extra-types)
      (if (string-match "[][.*+?^$\\]" type-re)
          (setq regexp-strings (cons type-re regexp-strings))
        (setq plain-strings (cons type-re plain-strings))))
    ;; Restore the order in which the entries were given.
    (setq regexp-strings (nreverse regexp-strings)
          plain-strings (nreverse plain-strings))
    (concat "\\<\\("
            (c-concat-separated
             (append (list (c-make-keywords-re nil
                             (append (c-lang-const c-primitive-type-kwds)
                                     plain-strings)))
                     regexp-strings)
             "\\|")
            "\\)\\>")))
2907
2908(c-lang-defconst c-special-brace-lists
2909"List of open- and close-chars that makes up a pike-style brace list,
c38e0c97 2910i.e. for a ([ ]) list there should be a cons (?\\[ . ?\\]) in this
d9e94c22
MS
2911list."
2912 t nil
2913 pike '((?{ . ?}) (?\[ . ?\]) (?< . ?>)))
2914(c-lang-defvar c-special-brace-lists (c-lang-const c-special-brace-lists))
2915
2916(c-lang-defconst c-recognize-knr-p
2917 "Non-nil means K&R style argument declarations are valid."
2918 t nil
2919 c t)
2920(c-lang-defvar c-recognize-knr-p (c-lang-const c-recognize-knr-p))
2921
2922(c-lang-defconst c-recognize-typeless-decls
2923 "Non-nil means function declarations without return type should be
2924recognized. That can introduce an ambiguity with parenthesized macro
2925calls before a brace block. This setting does not affect declarations
2926that are preceded by a declaration starting keyword, so
2927e.g. `c-typeless-decl-kwds' may still be used when it's set to nil."
2928 t nil
2929 (c c++ objc) t)
2930(c-lang-defvar c-recognize-typeless-decls
2931 (c-lang-const c-recognize-typeless-decls))
2932
2933(c-lang-defconst c-recognize-<>-arglists
2934 "Non-nil means C++ style template arglists should be handled. More
2935specifically, this means a comma separated list of types or
2936expressions surrounded by \"<\" and \">\". It's always preceded by an
2937identifier or one of the keywords on `c-<>-type-kwds' or
2938`c-<>-arglist-kwds'. If there's an identifier before then the whole
2939expression is considered to be a type."
2940 t (or (consp (c-lang-const c-<>-type-kwds))
2941 (consp (c-lang-const c-<>-arglist-kwds))))
2942(c-lang-defvar c-recognize-<>-arglists (c-lang-const c-recognize-<>-arglists))
2943
9d5a8f0b
AM
2944(c-lang-defconst c-enums-contain-decls
2945 "Non-nil means that an enum structure can contain declarations."
2946 t nil
2947 java t)
2948(c-lang-defvar c-enums-contain-decls (c-lang-const c-enums-contain-decls))
2949
d9e94c22
MS
;; Language flag: nil by default, t for C++ only.
2950(c-lang-defconst c-recognize-paren-inits
2951 "Non-nil means that parenthesis style initializers exist,
2952i.e. constructs like
2953
2954Foo bar (gnu);
2955
2956in addition to the more classic
2957
2958Foo bar = gnu;"
2959 t nil
2960 c++ t)
2961(c-lang-defvar c-recognize-paren-inits (c-lang-const c-recognize-paren-inits))
2962
0386b551
AM
;; Language flag: nil by default, t for C and C++.
2963(c-lang-defconst c-recognize-paren-inexpr-blocks
2964 "Non-nil to recognize gcc style in-expression blocks,
2965i.e. compound statements surrounded by parentheses inside expressions."
2966 t nil
2967 (c c++) t)
2968(c-lang-defvar c-recognize-paren-inexpr-blocks
2969 (c-lang-const c-recognize-paren-inexpr-blocks))
2970
d9e94c22
MS
2971(c-lang-defconst c-opt-<>-arglist-start
2972 ;; Regexp matching the start of angle bracket arglists in languages
2973 ;; where `c-recognize-<>-arglists' is set. Does not exclude
2974 ;; keywords outside `c-<>-arglist-kwds'. The first submatch is
2975 ;; assumed to surround the preceding symbol. The whole match is
2976 ;; assumed to end directly after the opening "<".
 ;;
 ;; The `if' below has no else branch, so the value is nil in
 ;; languages where `c-recognize-<>-arglists' is nil. Otherwise the
 ;; regexp is: "\\(" symbol "\\)" syntactic-whitespace "<".
2977 t (if (c-lang-const c-recognize-<>-arglists)
2978 (concat "\\("
2979 (c-lang-const c-symbol-key)
2980 "\\)"
2981 (c-lang-const c-syntactic-ws)
2982 "<")))
2983(c-lang-defvar c-opt-<>-arglist-start (c-lang-const c-opt-<>-arglist-start))
2984
2985(c-lang-defconst c-opt-<>-arglist-start-in-paren
2986 ;; Regexp that in addition to `c-opt-<>-arglist-start' matches close
2987 ;; parens. The first submatch is assumed to surround
2988 ;; `c-opt-<>-arglist-start'.
 ;;
 ;; nil whenever `c-opt-<>-arglist-start' is nil (no else branch).
 ;; The second alternative, "\\s\)", matches any single character
 ;; that has close-parenthesis syntax.
2989 t (if (c-lang-const c-opt-<>-arglist-start)
2990 (concat "\\("
2991 (c-lang-const c-opt-<>-arglist-start)
2992 "\\)\\|\\s\)")))
2993(c-lang-defvar c-opt-<>-arglist-start-in-paren
2994 (c-lang-const c-opt-<>-arglist-start-in-paren))
a66cd3ee 2995
d9e94c22
MS
2996(c-lang-defconst c-opt-postfix-decl-spec-key
2997 ;; Regexp matching the beginning of a declaration specifier in the
2998 ;; region between the header and the body of a declaration.
2999 ;;
3000 ;; TODO: This is currently not used uniformly; c++-mode and
3001 ;; java-mode each have their own ways of using it.
0386b551
AM
3002 t nil
 ;; C++: an optional ":" and whitespace, an optional "virtual"
 ;; followed by whitespace, one of `c-protection-kwds', whitespace,
 ;; and finally a symbol (`c-symbol-key').
3003 c++ (concat ":?"
3004 (c-lang-const c-simple-ws) "*"
3005 "\\(virtual" (c-lang-const c-simple-ws) "+\\)?\\("
3006 (c-make-keywords-re nil (c-lang-const c-protection-kwds))
3007 "\\)" (c-lang-const c-simple-ws) "+"
3008 "\\(" (c-lang-const c-symbol-key) "\\)")
 ;; Java: a keyword regexp built from `c-postfix-spec-kwds'.
3009 java (c-make-keywords-re t (c-lang-const c-postfix-spec-kwds)))
d9e94c22
MS
3010(c-lang-defvar c-opt-postfix-decl-spec-key
3011 (c-lang-const c-opt-postfix-decl-spec-key))
a66cd3ee 3012
0386b551
AM
;; Language flag: nil by default, t for C, C++, Objective-C, Java and
;; Pike.
3013(c-lang-defconst c-recognize-colon-labels
3014 "Non-nil if generic labels ending with \":\" should be recognized.
3015That includes labels in code and access keys in classes. This does
3016not apply to labels recognized by `c-label-kwds' and
3017`c-opt-extra-label-key'."
3018 t nil
3019 (c c++ objc java pike) t)
3020(c-lang-defvar c-recognize-colon-labels
3021 (c-lang-const c-recognize-colon-labels))
3022
3023(c-lang-defconst c-label-prefix-re
3024 "Regexp like `c-decl-prefix-re' that matches any token that can precede
3025a generic colon label. Not used if `c-recognize-colon-labels' is
3026nil."
 ;; Same value for every language: one or more of the characters
 ;; `{', `}' and `;', captured as the first submatch.
3027 t "\\([{};]+\\)")
3028(c-lang-defvar c-label-prefix-re
3029 (c-lang-const c-label-prefix-re))
3030
3031(c-lang-defconst c-nonlabel-token-key
3032 "Regexp matching things that can't occur in generic colon labels,
3033neither in a statement nor in a declaration context. The regexp is
3034tested at the beginning of every sexp in a suspected label,
3035i.e. before \":\". Only used if `c-recognize-colon-labels' is set."
3036 t (concat
0386b551
AM
3037 ;; All keywords except `c-label-kwds' and `c-protection-kwds'.
3038 (c-make-keywords-re t
3039 (set-difference (c-lang-const c-keywords)
3040 (append (c-lang-const c-label-kwds)
3041 (c-lang-const c-protection-kwds))
3042 :test 'string-equal)))
898169a2
AM
3043 ;; Don't allow string literals, except in AWK. Character constants are OK.
 ;; NOTE(review): the self-reference to `c-nonlabel-token-key' in the
 ;; two entries below presumably resolves to the `t' fallback value
 ;; above, so each entry only prepends alternatives to it -- confirm
 ;; against the `c-lang-defconst' documentation.
3044 (c objc java pike idl) (concat "\"\\|"
3045 (c-lang-const c-nonlabel-token-key))
0386b551
AM
3046 ;; Also check for open parens in C++, to catch member init lists in
3047 ;; constructors. We normally allow it so that macros with arguments
3048 ;; work in labels.
898169a2 3049 c++ (concat "\\s\(\\|\"\\|" (c-lang-const c-nonlabel-token-key)))
0386b551
AM
3050(c-lang-defvar c-nonlabel-token-key (c-lang-const c-nonlabel-token-key))
3051
a6ba2ab9
AM
;; The default is a regexp that can never match; only C++ replaces it,
;; with a regexp built by `c-make-keywords-re' from the single keyword
;; "class".
3052(c-lang-defconst c-nonlabel-token-2-key
3053 "Regexp matching things that can't occur two symbols before a colon in
3054a label construct. This catches C++'s inheritance construct \"class foo
3055: bar\". Only used if `c-recognize-colon-labels' is set."
3056 t "\\<\\>" ; matches nothing
3057 c++ (c-make-keywords-re t '("class")))
3058(c-lang-defvar c-nonlabel-token-2-key (c-lang-const c-nonlabel-token-2-key))
3059
0386b551
AM
;; nil by default; Objective-C supplies a keyword regexp built from
;; `c-protection-kwds'.
3060(c-lang-defconst c-opt-extra-label-key
3061 "Optional regexp matching labels.
3062Normally, labels are detected according to `c-nonlabel-token-key',
3063`c-decl-prefix-re' and `c-nonlabel-decl-prefix-re'. This regexp can
3064be used if there are additional labels that aren't recognized that
3065way."
3066 t nil
3067 objc (c-make-keywords-re t (c-lang-const c-protection-kwds)))
3068(c-lang-defvar c-opt-extra-label-key (c-lang-const c-opt-extra-label-key))
3069
a66cd3ee 3070(c-lang-defconst c-opt-friend-key
d9e94c22
MS
3071 ;; Regexp matching the start of a friend declaration, or nil in
3072 ;; languages that don't have such things.
3073 ;;
0386b551
AM
3074 ;; TODO: Ought to use `c-prefix-spec-kwds-re' or similar, and the
3075 ;; template skipping isn't done properly. This will disappear soon.
3076 t nil
 ;; C++ only. Two alternatives: "friend" followed by whitespace, or
 ;; "template" "<...>" "friend" followed by whitespace. The "<.+>"
 ;; part is greedy and `.' does not match a newline, so it runs to
 ;; the last ">" on the same line.
3077 c++ (concat "friend" (c-lang-const c-simple-ws) "+"
3078 "\\|"
3079 (concat "template"
3080 (c-lang-const c-simple-ws) "*"
3081 "<.+>"
3082 (c-lang-const c-simple-ws) "*"
3083 "friend"
3084 (c-lang-const c-simple-ws) "+")))
d9e94c22 3085(c-lang-defvar c-opt-friend-key (c-lang-const c-opt-friend-key))
a66cd3ee 3086
a66cd3ee 3087(c-lang-defconst c-opt-method-key
d9e94c22
MS
3088 ;; Special regexp to match the start of Objective-C methods. The
3089 ;; first submatch is assumed to end after the + or - key.
 ;;
 ;; nil for every language except Objective-C. The pieces are, in
 ;; order: beginning of line plus any whitespace-syntax characters,
 ;; the "+" or "-" key, optional whitespace, an optional
 ;; parenthesized return type with trailing whitespace, and the
 ;; method's first symbol.
0386b551 3090 t nil
a66cd3ee 3091 objc (concat
d9e94c22 3092 ;; TODO: Ought to use a better method than anchoring on bol.
0386b551
AM
3093 "^\\s *"
3094 "\\([+-]\\)"
3095 (c-lang-const c-simple-ws) "*"
3096 (concat "\\(" ; Return type.
3097 "([^\)]*)"
3098 (c-lang-const c-simple-ws) "*"
3099 "\\)?")
d9e94c22
MS
3100 "\\(" (c-lang-const c-symbol-key) "\\)"))
3101(c-lang-defvar c-opt-method-key (c-lang-const c-opt-method-key))
0ec8351b 3102
0386b551
AM
3103(c-lang-defconst c-type-decl-end-used
3104 ;; Must be set in buffers where the `c-type' text property might be
3105 ;; used with the value `c-decl-end'.
3106 ;;
3107 ;; `c-decl-end' is used to mark the ends of labels and access keys
3108 ;; to make interactive refontification work better.
 ;;
 ;; Default: non-nil if colon labels are recognized or the language
 ;; has any label keywords. `(and ... t)' reduces the keyword list
 ;; to a plain t/nil flag.
3109 t (or (c-lang-const c-recognize-colon-labels)
3110 (and (c-lang-const c-label-kwds) t))
3111 ;; `c-decl-end' is used to mark the end of the @-style directives in
3112 ;; Objective-C.
3113 objc t)
3114(c-lang-defvar c-type-decl-end-used (c-lang-const c-type-decl-end-used))
3115
785eecbb 3116\f
d9e94c22
MS
3117;;; Wrap up the `c-lang-defvar' system.
3118
3119;; Compile in the lists of language variables that have been collected
26b8f810
AM
3120;; with the `c-lang-defvar' and `c-lang-setvar' macros. Note that the
3121;; first element of each is nil.
;; Each constant is redefined from its own value as seen inside
;; `cc-eval-when-compile'.
;; NOTE(review): presumably this evaluates at compile time, like
;; `eval-when-compile', so the collected lists end up as literals in
;; the compiled file -- confirm in cc-bytecomp.el.
d9e94c22 3122(defconst c-lang-variable-inits (cc-eval-when-compile c-lang-variable-inits))
26b8f810 3123(defconst c-emacs-variable-inits (cc-eval-when-compile c-emacs-variable-inits))
d9e94c22 3124
473944f3
AM
3125;; Make the `c-lang-setvar' variables buffer local in the current buffer.
3126;; These are typically standard emacs variables such as `comment-start'.
;; Takes no arguments. Expands to a `progn' holding one
;; `(make-local-variable 'VAR)' form per entry of
;; `c-emacs-variable-inits'. The list is walked at macro expansion
;; time, and `cdr' drops its first entry.
3127(defmacro c-make-emacs-variables-local ()
3128 `(progn
3129 ,@(mapcar (lambda (init)
3130 `(make-local-variable ',(car init)))
3131 (cdr c-emacs-variable-inits))))
3132
d9e94c22
MS
3133(defun c-make-init-lang-vars-fun (mode)
3134 "Create a function that initializes all the language dependent variables
3135for the given mode.
3136
3137This function should be evaluated at compile time, so that the
3138function it returns is byte compiled with all the evaluated results
3139from the language constants. Use the `c-init-language-vars' macro to
0386b551 3140accomplish that conveniently."
d9e94c22
MS
3141
 ;; MODE is the mode symbol; it is quoted into the returned lambda
 ;; form as the binding of `c-buffer-is-cc-mode'.
 ;;
 ;; Two lambda forms can be returned. The first branch is taken when
 ;; no load is in progress and `byte-compile-dest-file' is bound to a
 ;; string; it expands every init form now and emits one big `setq'.
 ;; The second branch evaluates the init forms each time the lambda
 ;; is called.
3142 (if (and (not load-in-progress)
3143 (boundp 'byte-compile-dest-file)
3144 (stringp byte-compile-dest-file))
3145
3146 ;; No need to byte compile this lambda since the byte compiler is
3147 ;; smart enough to detect the `funcall' construct in the
3148 ;; `c-init-language-vars' macro below and compile it all straight
3149 ;; into the function that contains `c-init-language-vars'.
3150 `(lambda ()
3151
3152 ;; This let sets up the context for `c-mode-var' and similar
3153 ;; that could be in the result from `cl-macroexpand-all'.
3154 (let ((c-buffer-is-cc-mode ',mode)
cb694ab7 3155 current-var source-eval)
473944f3 3156 (c-make-emacs-variables-local)
d9e94c22
MS
3157 (condition-case err
3158
 ;; Use the precomputed values only if the CC Mode version at
 ;; run time equals the one this form was built with;
 ;; otherwise fall back to evaluating the init forms.
3159 (if (eq c-version-sym ',c-version-sym)
3160 (setq ,@(let ((c-buffer-is-cc-mode mode)
3161 (c-lang-const-expansion 'immediate))
3162 ;; `c-lang-const' will expand to the evaluated
3163 ;; constant immediately in `cl-macroexpand-all'
3164 ;; below.
26b8f810
AM
3165 (mapcan
3166 (lambda (init)
3167 `(current-var ',(car init)
3168 ,(car init) ,(cl-macroexpand-all
3169 (elt init 1))))
3170 ;; Note: The following `append' copies the
3171 ;; first argument. That list is small, so
3172 ;; this doesn't matter too much.
3173 (append (cdr c-emacs-variable-inits)
3174 (cdr c-lang-variable-inits)))))
d9e94c22 3175
0386b551
AM
3176 ;; This diagnostic message isn't useful for end
3177 ;; users, so it's disabled.
3178 ;;(unless (get ',mode 'c-has-warned-lang-consts)
3179 ;; (message ,(concat "%s compiled with CC Mode %s "
3180 ;; "but loaded with %s - evaluating "
3181 ;; "language constants from source")
3182 ;; ',mode ,c-version c-version)
3183 ;; (put ',mode 'c-has-warned-lang-consts t))
d9e94c22 3184
cb694ab7 3185 (setq source-eval t)
a9901f61
AM
3186 (let ((init ',(append (cdr c-emacs-variable-inits)
3187 (cdr c-lang-variable-inits))))
d9e94c22
MS
3188 (while init
3189 (setq current-var (caar init))
3190 (set (caar init) (eval (cadar init)))
3191 (setq init (cdr init)))))
3192
 ;; If a variable was being initialized when the error
 ;; occurred, report it with `message' and continue; otherwise
 ;; re-signal the original error.
3193 (error
3194 (if current-var
26b8f810 3195 (message "Eval error in the `c-lang-defvar' or `c-lang-setvar' for `%s'%s: %S"
cb694ab7
AM
3196 current-var
3197 (if source-eval
3198 (format "\
3199 (fallback source eval - %s compiled with CC Mode %s but loaded with %s)"
3200 ',mode ,c-version c-version)
3201 "")
3202 err)
d9e94c22
MS
3203 (signal (car err) (cdr err)))))))
3204
3205 ;; Being evaluated from source. Always use the dynamic method to
3206 ;; work well when `c-lang-defvar's in this file are reevaluated
3207 ;; interactively.
3208 `(lambda ()
3209 (require 'cc-langs)
3210 (let ((c-buffer-is-cc-mode ',mode)
26b8f810
AM
3211 (init (append (cdr c-emacs-variable-inits)
3212 (cdr c-lang-variable-inits)))
d9e94c22 3213 current-var)
473944f3 3214 (c-make-emacs-variables-local)
d9e94c22
MS
3215 (condition-case err
3216
3217 (while init
3218 (setq current-var (caar init))
3219 (set (caar init) (eval (cadar init)))
3220 (setq init (cdr init)))
3221
 ;; Same policy as in the compiled branch: report with
 ;; `message' when a variable is known, else re-signal.
3222 (error
3223 (if current-var
cb694ab7 3224 (message
26b8f810 3225 "Eval error in the `c-lang-defvar' or `c-lang-setvar' for `%s' (source eval): %S"
cb694ab7 3226 current-var err)
d9e94c22
MS
3227 (signal (car err) (cdr err)))))))
3228 ))
3229
3230(defmacro c-init-language-vars (mode)
3231 "Initialize all the language dependent variables for the given mode.
3232This macro is expanded at compile time to a form tailored for the mode
3233in question, so MODE must be a constant. Therefore MODE is not
0386b551 3234evaluated and should not be quoted."
 ;; `c-make-init-lang-vars-fun' runs at macro expansion time; the
 ;; lambda form it returns is spliced in as the function argument of
 ;; `funcall'.
d9e94c22 3235 `(funcall ,(c-make-init-lang-vars-fun mode)))
130c507e 3236
fb032a95 3237\f
130c507e 3238(cc-provide 'cc-langs)
3afbc435 3239
785eecbb 3240;;; cc-langs.el ends here