Merge from emacs-24; up to 2014-04-02T16:17:08Z!dmantipov@yandex.ru
[bpt/emacs.git] / lisp / progmodes / cc-langs.el
CommitLineData
c38e0c97 1;;; cc-langs.el --- language specific settings for CC Mode -*- coding: utf-8 -*-
785eecbb 2
ba318903 3;; Copyright (C) 1985, 1987, 1992-2014 Free Software Foundation, Inc.
785eecbb 4
e309f66c
AM
5;; Authors: 2002- Alan Mackenzie
6;; 1998- Martin Stjernholm
d9e94c22 7;; 1992-1999 Barry A. Warsaw
5858f68c
GM
8;; 1987 Dave Detlefs
9;; 1987 Stewart Clamen
785eecbb 10;; 1985 Richard M. Stallman
0ec8351b 11;; Maintainer: bug-cc-mode@gnu.org
785eecbb 12;; Created: 22-Apr-1997 (split from cc-mode.el)
bd78fa1d
CY
13;; Keywords: c languages
14;; Package: cc-mode
785eecbb
RS
15
16;; This file is part of GNU Emacs.
17
b1fc2b50 18;; GNU Emacs is free software: you can redistribute it and/or modify
785eecbb 19;; it under the terms of the GNU General Public License as published by
b1fc2b50
GM
20;; the Free Software Foundation, either version 3 of the License, or
21;; (at your option) any later version.
785eecbb
RS
22
23;; GNU Emacs is distributed in the hope that it will be useful,
24;; but WITHOUT ANY WARRANTY; without even the implied warranty of
25;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
26;; GNU General Public License for more details.
27
28;; You should have received a copy of the GNU General Public License
b1fc2b50 29;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>.
785eecbb 30
3afbc435
PJ
31;;; Commentary:
32
d9e94c22
MS
33;; HACKERS NOTE: There's heavy macro magic here. If you need to make
34;; changes in this or other files containing `c-lang-defconst' but
35;; don't want to read through the longer discussion below then read
36;; this:
37;;
38;; o A change in a `c-lang-defconst' or `c-lang-defvar' will not take
39;; effect if the file containing the mode init function (typically
40;; cc-mode.el) is byte compiled.
41;; o To make changes show in font locking you need to reevaluate the
42;; `*-font-lock-keywords-*' constants, which normally is easiest to
43;; do with M-x eval-buffer in cc-fonts.el.
44;; o In either case it's necessary to reinitialize the mode to make
45;; the changes show in an existing buffer.
46
47;;; Introduction to the language dependent variable system:
48;;
49;; This file contains all the language dependent variables, except
50;; those specific for font locking which reside in cc-fonts.el. As
51;; far as possible, all the differences between the languages that CC
52;; Mode supports are described with these variables only, so that the
53;; code can be shared.
54;;
55;; The language constant system (see cc-defs.el) is used to specify
56;; various language dependent info at a high level, such as lists of
57;; keywords, and then from them generate - at compile time - the
58;; various regexps and other low-level structures actually employed in
59;; the code at runtime.
60;;
61;; This system is also designed to make it easy for developers of
62;; derived modes to customize the source constants for new language
63;; variants, without having to keep up with the exact regexps etc that
64;; are used in each CC Mode version. It's possible from an external
65;; package to add a new language by inheriting an existing one, and
66;; then change specific constants as necessary for the new language.
67;; The old values for those constants (and the values of all the other
68;; high-level constants) may be used to build the new ones, and those
69;; new values will in turn be used by the low-level definitions here
70;; to build the runtime constants appropriately for the new language
71;; in the current version of CC Mode.
72;;
73;; Like elsewhere in CC Mode, the existence of a doc string signifies
74;; that a language constant is part of the external API, and that it
75;; therefore can be used with a high confidence that it will continue
76;; to work with future versions of CC Mode. Even so, it's not
77;; unlikely that such constants will change meaning slightly as this
78;; system is refined further; a certain degree of dependence on the CC
79;; Mode version is unavoidable when hooking in at this level. Also
80;; note that there's still work to be done to actually use these
81;; constants everywhere inside CC Mode; there are still hardcoded
82;; values in many places in the code.
83;;
84;; Separate packages will also benefit from the compile time
85;; evaluation; the byte compiled file(s) for them will contain the
86;; compiled runtime constants ready for use by (the byte compiled) CC
87;; Mode, and the source definitions in this file don't have to be
88;; loaded then. However, if a byte compiled package is loaded that
89;; has been compiled with a different version of CC Mode than the one
90;; currently loaded, then the compiled-in values will be discarded and
91;; new ones will be built when the mode is initialized. That will
92;; automatically trigger a load of the file(s) containing the source
93;; definitions (i.e. this file and/or cc-fonts.el) if necessary.
94;;
95;; A small example of a derived mode is available at
96;; <http://cc-mode.sourceforge.net/derived-mode-ex.el>. It also
97;; contains some useful hints for derived mode developers.
98
99;;; Using language variables:
100;;
101;; The `c-lang-defvar' forms in this file comprise the language
102;; variables that CC Mode uses. It does not work to use
103;; `c-lang-defvar' anywhere else (which isn't much of a limitation
104;; since these variables' sole purpose is to interface with the CC Mode
105;; core functions). The values in these `c-lang-defvar's are not
106;; evaluated right away but instead collected to a single large `setq'
107;; that can be inserted for a particular language with the
108;; `c-init-language-vars' macro.
109
110;; This file is only required at compile time, or when not running
111;; from byte compiled files, or when the source definitions for the
112;; language constants are requested.
113
3afbc435
PJ
114;;; Code:
115
66d279a7
GM
116;; For Emacs < 22.2.
117(eval-and-compile
118 (unless (fboundp 'declare-function) (defmacro declare-function (&rest r))))
119
51f606de
GM
120(eval-when-compile
121 (let ((load-path
130c507e
GM
122 (if (and (boundp 'byte-compile-dest-file)
123 (stringp byte-compile-dest-file))
124 (cons (file-name-directory byte-compile-dest-file) load-path)
51f606de 125 load-path)))
d9e94c22 126 (load "cc-bytecomp" nil t)))
51f606de 127
130c507e
GM
128(cc-require 'cc-defs)
129(cc-require 'cc-vars)
a6739a05 130
0386b551 131
9a737a1f
MS
132;; This file is not always loaded. See note above.
133(cc-external-require 'cl)
134
785eecbb 135\f
d9e94c22 136;;; Setup for the `c-lang-defvar' system.
a66cd3ee
MS
137
(eval-and-compile
  ;; Accumulators for the init forms registered by the subsequent
  ;; `c-lang-defvar' and `c-lang-setvar' calls.  They are used to build
  ;; the lambda in `c-make-init-lang-vars-fun' below, and to build
  ;; `defvar's and `make-variable-buffer-local's in cc-engine and
  ;; `make-local-variable's in `c-init-language-vars-for'.
  ;;
  ;; Each list starts with a dummy nil header cell, so the matching
  ;; *-tail variable always points at a cons that can be extended with
  ;; `setcdr'.  The real entries therefore live in the cdr of the list.
  (defvar c-lang-variable-inits nil)
  (defvar c-lang-variable-inits-tail nil)
  (defvar c-emacs-variable-inits nil)
  (defvar c-emacs-variable-inits-tail nil)
  ;; Unlike the `defvar's, these assignments run every time this form
  ;; is evaluated, so both lists start out empty again.
  (setq c-lang-variable-inits (list nil))
  (setq c-lang-variable-inits-tail c-lang-variable-inits)
  (setq c-emacs-variable-inits (list nil))
  (setq c-emacs-variable-inits-tail c-emacs-variable-inits))
d9e94c22
MS
152
(defmacro c-lang-defvar (var val &optional doc)
  "Declare the buffer local variable VAR to get the value VAL.
VAL is evaluated and assigned at mode initialization.  More precisely,
VAL is evaluated and bound to VAR when the result from the macro
`c-init-language-vars' is evaluated.

`c-lang-const' is typically used in VAL to get the right value for the
language being initialized, and such calls will be macro expanded to
the evaluated constant value at compile time.

If DOC is omitted and VAL is a plain (c-lang-const VAR) form, the doc
string is taken from the language constant VAR.  A DOC that isn't a
string is ignored."

  ;; Special case: If there's no docstring and the value is a simple
  ;; (c-lang-const foo) where foo is the same name as VAR then take
  ;; the docstring from the language constant foo.
  (if (and (null doc)
           (eq (car-safe val) 'c-lang-const)
           (eq (nth 1 val) var)
           (null (nth 2 val)))
      (setq doc (get (intern (symbol-name (nth 1 val)) c-lang-constants)
                     'variable-documentation)))
  ;; Anything that isn't a string (e.g. the symbol `dont-doc') means
  ;; that the variable gets no docstring.
  (unless (stringp doc)
    (setq doc nil))

  (let ((existing (assq var (cdr c-lang-variable-inits)))
        (payload (list val doc)))
    (cond (existing
           ;; VAR has been declared before: overwrite its entry in place
           ;; so that it keeps its position in the init list.
           (setcdr existing payload))
          (t
           ;; New variable: append an entry (VAR VAL DOC) and advance the
           ;; tail pointer to the freshly added cons.
           (setcdr c-lang-variable-inits-tail (list (cons var payload)))
           (setq c-lang-variable-inits-tail
                 (cdr c-lang-variable-inits-tail)))))

  ;; Return the symbol, like the other def* forms.
  `',var)
183
26b8f810
AM
(defmacro c-lang-setvar (var val)
  "Cause VAR to be made buffer local and set to VAL at mode initialization.
More precisely, VAL is evaluated and bound to VAR when the result from
the macro `c-init-language-vars' is evaluated.  VAR is typically a
standard Emacs variable like `comment-start'.

`c-lang-const' is typically used in VAL to get the right value for the
language being initialized, and such calls will be macro expanded to
the evaluated constant value at compile time."
  (let ((existing (assq var (cdr c-emacs-variable-inits))))
    (cond (existing
           ;; VAR is already registered: replace its value form in place.
           (setcdr existing (list val))) ; Maybe remove "list", sometime. 2006-07-19
          (t
           ;; New variable: append an entry (VAR VAL) and advance the
           ;; tail pointer to the freshly added cons.
           (setcdr c-emacs-variable-inits-tail (list (list var val)))
           (setq c-emacs-variable-inits-tail
                 (cdr c-emacs-variable-inits-tail)))))

  ;; Return the symbol, like the other def* forms.
  `',var)
202
d9e94c22 203(put 'c-lang-defvar 'lisp-indent-function 'defun)
3c0ab532
AM
204; (eval-after-load "edebug" ; 2006-07-09: def-edebug-spec is now in subr.el.
205; '
206(def-edebug-spec c-lang-defvar
207 (&define name def-form &optional stringp)) ;)
c55676a1 208
66d279a7
GM
209;; Suppress "might not be defined at runtime" warning.
210;; This file is only used when compiling other cc files.
6a2e6868
GM
211;; These are defined in cl as aliases to the cl- versions.
212(declare-function delete-duplicates "cl-seq" (cl-seq &rest cl-keys) t)
213(declare-function mapcan "cl-extra" (cl-func cl-seq &rest cl-rest) t)
214(declare-function cl-macroexpand-all "cl" (form &optional env))
66d279a7 215
(eval-and-compile
  ;; Some helper functions used when building the language constants.

  (defun c-filter-ops (ops opgroup-filter op-filter &optional xlate)
    ;; Extract a subset of the operators in the list OPS in a DWIM:ey
    ;; way.  The return value is a plain list of operators.
    ;;
    ;; OPS either has the structure of `c-operators', is a single
    ;; group in `c-operators', or is a plain list of operators.
    ;;
    ;; OPGROUP-FILTER specifies how to select the operator groups.  It
    ;; can be t to choose all groups, a list of group type symbols
    ;; (such as 'prefix) to accept, or a function which will be called
    ;; with the group symbol for each group and should return non-nil
    ;; if that group is to be included.
    ;;
    ;; OP-FILTER selects the individual operators within the chosen
    ;; groups.  It can be t to choose all operators, a string which is
    ;; matched against each operator with `string-match', or a
    ;; function which will be called with each operator and should
    ;; return non-nil if that operator is to be included.
    ;;
    ;; If XLATE is given, it's a function which is called for each
    ;; matching operator and its return value is collected instead.
    ;; If it returns a list, the elements are spliced directly into
    ;; the final result, which is returned as a list with duplicates
    ;; removed using `equal'.
    ;;
    ;; `c-mode-syntax-table' for the current mode is in effect during
    ;; the whole procedure.

    ;; Normalize OPS to a list of groups: a single group or a plain
    ;; operator list doesn't have a list as its first element.
    (or (listp (car-safe ops))
        (setq ops (list ops)))
    ;; Turn both filters into functions.  The file uses dynamic
    ;; binding, so the filter values are spliced into backquoted
    ;; lambdas instead of being captured.
    (setq opgroup-filter
          (cond ((eq opgroup-filter t)
                 (lambda (opgroup) t))
                ((functionp opgroup-filter)
                 opgroup-filter)
                (t
                 `(lambda (opgroup)
                    (memq opgroup ',opgroup-filter)))))
    (setq op-filter
          (cond ((eq op-filter t)
                 (lambda (op) t))
                ((stringp op-filter)
                 `(lambda (op)
                    (string-match ,op-filter op)))
                (t
                 op-filter)))
    (or xlate
        (setq xlate 'identity))
    (c-with-syntax-table (c-lang-const c-mode-syntax-table)
      (delete-duplicates
       (mapcan
        (lambda (opgroup)
          ;; A group headed by a symbol is typed: it's kept only if
          ;; OPGROUP-FILTER accepts the symbol, and the symbol is then
          ;; stripped off.  A group without a leading symbol is always
          ;; kept as it is.
          (when (or (not (symbolp (car opgroup)))
                    (and (funcall opgroup-filter (car opgroup))
                         (progn (setq opgroup (cdr opgroup))
                                t)))
            (mapcan (lambda (op)
                      (and (funcall op-filter op)
                           (let ((res (funcall xlate op)))
                             ;; `mapcan' splices lists, so wrap atoms.
                             (if (listp res) res (list res)))))
                    opgroup)))
        ops)
       :test 'equal))))
269
51f606de 270\f
d9e94c22
MS
271;;; Various mode specific values that aren't language related.
272
273(c-lang-defconst c-mode-menu
274 ;; The definition for the mode menu. The menu title is prepended to
275 ;; this before it's fed to `easy-menu-define'.
276 t `(["Comment Out Region" comment-region
277 (c-fn-region-is-active-p)]
278 ["Uncomment Region" (comment-region (region-beginning)
279 (region-end) '(4))
280 (c-fn-region-is-active-p)]
281 ["Indent Expression" c-indent-exp
282 (memq (char-after) '(?\( ?\[ ?\{))]
283 ["Indent Line or Region" c-indent-line-or-region t]
284 ["Fill Comment Paragraph" c-fill-paragraph t]
285 "----"
286 ["Backward Statement" c-beginning-of-statement t]
287 ["Forward Statement" c-end-of-statement t]
288 ,@(when (c-lang-const c-opt-cpp-prefix)
289 ;; Only applicable if there's a cpp preprocessor.
290 `(["Up Conditional" c-up-conditional t]
291 ["Backward Conditional" c-backward-conditional t]
292 ["Forward Conditional" c-forward-conditional t]
293 "----"
294 ["Macro Expand Region" c-macro-expand
295 (c-fn-region-is-active-p)]
296 ["Backslashify" c-backslash-region
297 (c-fn-region-is-active-p)]))
298 "----"
b14c0c55
AM
299 ("Style..."
300 ["Set Style..." c-set-style t]
301 ["Show Current Style Name" (message
302 "Style Name: %s"
303 c-indentation-style) t]
304 ["Guess Style from this Buffer" c-guess-buffer-no-install t]
305 ["Install the Last Guessed Style..." c-guess-install
306 (and c-guess-guessed-offsets-alist
307 c-guess-guessed-basic-offset) ]
308 ["View the Last Guessed Style" c-guess-view
309 (and c-guess-guessed-offsets-alist
310 c-guess-guessed-basic-offset) ])
311 "----"
d9e94c22 312 ("Toggle..."
d91362c9
NR
313 ["Syntactic indentation" c-toggle-syntactic-indentation
314 :style toggle :selected c-syntactic-indentation]
cb694ab7
AM
315 ["Electric mode" c-toggle-electric-state
316 :style toggle :selected c-electric-flag]
317 ["Auto newline" c-toggle-auto-newline
d91362c9 318 :style toggle :selected c-auto-newline]
cb694ab7
AM
319 ["Hungry delete" c-toggle-hungry-state
320 :style toggle :selected c-hungry-delete-key]
653d1554
TH
321 ["Subword mode" subword-mode
322 :style toggle :selected (and (boundp 'subword-mode)
323 subword-mode)])))
a66cd3ee 324
d9e94c22
MS
325\f
326;;; Syntax tables.
327
(defun c-populate-syntax-table (table)
  "Populate the given syntax table as necessary for a C-like language.
This includes setting ' and \" as string delimiters, and setting up
the comment syntax to handle both line style \"//\" and block style
\"/*\" \"*/\" comments."

  ;; Underscore is a symbol constituent and backslash the escape char.
  (modify-syntax-entry ?_ "_" table)
  (modify-syntax-entry ?\\ "\\" table)
  ;; The operator characters are plain punctuation.
  (mapc (lambda (ch)
          (modify-syntax-entry ch "." table))
        '(?+ ?- ?= ?% ?< ?> ?& ?|))
  ;; The single quote delimits strings (character literals).
  (modify-syntax-entry ?\' "\"" table)
  (modify-syntax-entry ?\240 "." table)

  ;; Set up block and line oriented comments.  The new C
  ;; standard mandates both comment styles even in C, so since
  ;; all languages now require dual comments, we make this the
  ;; default.  Only the flags on `/' differ between the two
  ;; comment syntax flavors recorded in `c-emacs-features'.
  (let ((slash-syntax
         (cond
          ;; XEmacs
          ((memq '8-bit c-emacs-features) ". 1456")
          ;; Emacs
          ((memq '1-bit c-emacs-features) ". 124b")
          ;; incompatible
          (t (error "CC Mode is incompatible with this version of Emacs")))))
    (modify-syntax-entry ?/ slash-syntax table)
    (modify-syntax-entry ?* ". 23" table))

  (modify-syntax-entry ?\n "> b" table)
  ;; Give CR the same syntax as newline, for selective-display
  (modify-syntax-entry ?\^m "> b" table))
366
(c-lang-defconst c-make-mode-syntax-table
  "Functions that generate the mode specific syntax tables.
The syntax tables aren't stored directly since they're quite large."
  t `(lambda ()
       (let ((table (make-syntax-table)))
         (c-populate-syntax-table table)
         ;; Mode specific syntaxes.  The syntax class for '@' is
         ;; chosen when the constant is evaluated; for languages not
         ;; listed here nil is spliced in, which is a no-op form.
         ,(let ((at-syntax
                 (cond ((or (c-major-mode-is 'objc-mode)
                            (c-major-mode-is 'java-mode))
                        ;; Let '@' be part of symbols in ObjC and Java.
                        ;; In ObjC this copes with its compiler
                        ;; directives as single keyword tokens, which is
                        ;; necessary since it's assumed that every
                        ;; keyword is a single symbol.  NOTE(review):
                        ;; the Java case is presumably for annotations
                        ;; like "@Override" (`c-symbol-start' accepts
                        ;; '@' for Java too) - confirm.
                        "_")
                       ((c-major-mode-is 'pike-mode)
                        "."))))
            (when at-syntax
              `(modify-syntax-entry ?@ ,at-syntax table)))
         table)))
383
384(c-lang-defconst c-mode-syntax-table
385 ;; The syntax tables in evaluated form. Only used temporarily when
386 ;; the constants in this file are evaluated.
387 t (funcall (c-lang-const c-make-mode-syntax-table)))
388
(c-lang-defconst c++-make-template-syntax-table
  ;; A function that builds a variant of the mode syntax table which
  ;; defines `<' and `>' as parenthesis characters, or nil in
  ;; languages where it isn't used.  Despite the name it's provided
  ;; for Java as well as C++.  The table is used temporarily when
  ;; template argument lists are parsed.  Note that this encourages
  ;; incorrect parsing of templates since they might contain normal
  ;; operators that use the '<' and '>' characters.  Therefore this
  ;; syntax table might go away when CC Mode handles templates
  ;; correctly everywhere.
  t nil
  (java c++) `(lambda ()
                (let ((table (funcall ,(c-lang-const c-make-mode-syntax-table))))
                  ;; Make the angle brackets a matching paren pair.
                  (modify-syntax-entry ?< "(>" table)
                  (modify-syntax-entry ?> ")<" table)
                  table)))
(c-lang-defvar c++-template-syntax-table
  ;; nil when the language has no template syntax table maker.
  (when (c-lang-const c++-make-template-syntax-table)
    (funcall (c-lang-const c++-make-template-syntax-table))))
d9e94c22 405
dd969a56
AM
(c-lang-defconst c-no-parens-syntax-table
  ;; A function that builds a variant of the standard syntax table
  ;; which is used to find matching "<"s and ">"s which have been
  ;; marked as parens using syntax table properties.  The other paren
  ;; characters (e.g. "{", ")" "]") are given a non-paren syntax here,
  ;; so that the list commands will work on "< ... >" even when
  ;; there are unbalanced other parens inside them.
  ;;
  ;; The function returns nil for languages which don't have template
  ;; stuff, i.e. where `c-recognize-<>-arglists' is nil.
  t `(lambda ()
       (when (c-lang-const c-recognize-<>-arglists)
         (let ((table (funcall ,(c-lang-const c-make-mode-syntax-table))))
           ;; Demote every ordinary paren character to punctuation.
           (mapc (lambda (paren)
                   (modify-syntax-entry paren "." table))
                 '(?\( ?\) ?\[ ?\] ?\{ ?\}))
           table))))
(c-lang-defvar c-no-parens-syntax-table
  (funcall (c-lang-const c-no-parens-syntax-table)))
426
d9e94c22
MS
427(c-lang-defconst c-identifier-syntax-modifications
428 "A list that describes the modifications that should be done to the
429mode syntax table to get a syntax table that matches all identifiers
430and keywords as words.
431
432The list is just like the one used in `font-lock-defaults': Each
433element is a cons where the car is the character to modify and the cdr
434the new syntax, as accepted by `modify-syntax-entry'."
435 ;; The $ character is not allowed in most languages (one exception
436 ;; is Java which allows it for legacy reasons) but we still classify
e4769531 437 ;; it as an identifier character since it's often used in various
d9e94c22
MS
438 ;; machine generated identifiers.
439 t '((?_ . "w") (?$ . "w"))
452ea855 440 (objc java) (append '((?@ . "w"))
d9e94c22
MS
441 (c-lang-const c-identifier-syntax-modifications))
442 awk '((?_ . "w")))
443(c-lang-defvar c-identifier-syntax-modifications
444 (c-lang-const c-identifier-syntax-modifications))
445
(c-lang-defvar c-identifier-syntax-table
  ;; Start from a copy of the mode syntax table and apply each
  ;; (CHAR . SYNTAX) pair in `c-identifier-syntax-modifications' to it.
  (let ((table (copy-syntax-table (c-mode-var "mode-syntax-table"))))
    (mapc (lambda (mod)
            (modify-syntax-entry (car mod) (cdr mod) table))
          c-identifier-syntax-modifications)
    table)
  "Syntax table built on the mode syntax table but additionally
classifies symbol constituents like '_' and '$' as word constituents,
so that all identifiers are recognized as words.")
458
dd969a56
AM
(c-lang-defconst c-get-state-before-change-functions
  ;; For documentation see the following c-lang-defvar of the same name.
  ;; The value here may be a list of functions or a single function.
  t nil
  c++ '(c-extend-region-for-CPP
        c-before-change-check-<>-operators
        c-invalidate-macro-cache)
  (c objc) '(c-extend-region-for-CPP c-invalidate-macro-cache)
  ;; java 'c-before-change-check-<>-operators
  awk 'c-awk-record-region-clear-NL)
(c-lang-defvar c-get-state-before-change-functions
  ;; Normalize the constant to a list: a list (including nil) is used
  ;; as it is, while a single function symbol gets wrapped in one.
  (let ((fs (c-lang-const c-get-state-before-change-functions)))
    (cond ((listp fs) fs)
          (t (list fs))))
  "If non-nil, a list of functions called from c-before-change-hook.
Typically these will record enough state to allow
`c-before-font-lock-function' to extend the region to fontify,
and may do such things as removing text-properties which must be
recalculated.

These functions will be run in the order given. Each of them
takes 2 parameters, the BEG and END supplied to every
before-change function; on entry, the buffer will have been
widened and match-data will have been saved; point is undefined
on both entry and exit; the return value is ignored.

The functions are called even when font locking isn't enabled.

When the mode is initialized, the functions are called with
parameters \(point-min) and \(point-max).")
490
cb5e207c
AM
(c-lang-defconst c-before-font-lock-functions
  ;; For documentation see the following c-lang-defvar of the same name.
  ;; The value here may be a list of functions or a single function.
  t 'c-change-set-fl-decl-start
  (c c++ objc) '(c-neutralize-syntax-in-and-mark-CPP
                 c-change-set-fl-decl-start)
  awk 'c-awk-extend-and-syntax-tablify-region)
(c-lang-defvar c-before-font-lock-functions
  ;; Normalize the constant to a list: a list (including nil) is used
  ;; as it is, while a single function symbol gets wrapped in one.
  (let ((fs (c-lang-const c-before-font-lock-functions)))
    (cond ((listp fs) fs)
          (t (list fs))))
  "If non-nil, a list of functions called just before font locking.
Typically they will extend the region about to be fontified \(see
below) and will set `syntax-table' text properties on the region.

These functions will be run in the order given. Each of them
takes 3 parameters, the BEG, END, and OLD-LEN supplied to every
after-change function; point is undefined on both entry and exit;
on entry, the buffer will have been widened and match-data will
have been saved; the return value is ignored.

The functions may extend the region to be fontified by setting the
buffer local variables c-new-BEG and c-new-END.

The functions are called even when font locking is disabled.

When the mode is initialized, these functions are called with
parameters \(point-min), \(point-max) and <buffer size>.")
5ee2e988 520
be8b11bb
AM
(c-lang-defconst c-before-context-fontification-functions
  ;; For documentation see the following c-lang-defvar of the same name.
  ;; The value here may be a list of functions or a single function.
  awk nil
  t 'c-context-set-fl-decl-start)
(c-lang-defvar c-before-context-fontification-functions
  ;; Normalize the constant to a list: a list (including nil) is used
  ;; as it is, while a single function symbol gets wrapped in one.
  (let ((fs (c-lang-const c-before-context-fontification-functions)))
    (cond ((listp fs) fs)
          (t (list fs))))
  "If non-nil, a list of functions called just before context (or
other non-change) fontification is done. Typically they will
extend the region.

These functions will be run in the order given. Each of them
takes 2 parameters, the BEG and END of the region to be
fontified. Point is undefined on both entry and exit. On entry,
the buffer will have been widened and match-data will have been
saved; the return value is a cons of the adjusted
region, (NEW-BEG . NEW-END).")
541
d9e94c22 542\f
536610a4
AM
543;;; Syntactic analysis ("virtual semicolons") for line-oriented languages (AWK).
544(c-lang-defconst c-at-vsemi-p-fn
545 "Contains a function \"Is there a virtual semicolon at POS or point?\".
546Such a function takes one optional parameter, a buffer position (defaults to
547point), and returns nil or t. This variable contains nil for languages which
548don't have EOL terminated statements. "
549 t nil
550 (c c++ objc) 'c-at-macro-vsemi-p
551 awk 'c-awk-at-vsemi-p)
552(c-lang-defvar c-at-vsemi-p-fn (c-lang-const c-at-vsemi-p-fn))
553
554(c-lang-defconst c-vsemi-status-unknown-p-fn
555 "Contains a function \"are we unsure whether there is a virtual semicolon on this line?\".
333f9019 556The (admittedly kludgy) purpose of such a function is to prevent an infinite
536610a4
AM
557recursion in c-beginning-of-statement-1 when point starts at a `while' token.
558The function MUST NOT UNDER ANY CIRCUMSTANCES call c-beginning-of-statement-1,
559even indirectly. This variable contains nil for languages which don't have
560EOL terminated statements."
561 t nil
562 (c c++ objc) 'c-macro-vsemi-status-unknown-p
563 awk 'c-awk-vsemi-status-unknown-p)
564(c-lang-defvar c-vsemi-status-unknown-p-fn
565 (c-lang-const c-vsemi-status-unknown-p-fn))
566
567\f
d9e94c22
MS
568;;; Lexer-level syntax (identifiers, tokens etc).
569
b248a85d
AM
570(c-lang-defconst c-has-bitfields
571 "Whether the language has bitfield declarations."
572 t nil
573 (c c++ objc) t)
574(c-lang-defvar c-has-bitfields (c-lang-const c-has-bitfields))
575
d9e94c22
MS
576(c-lang-defconst c-symbol-start
577 "Regexp that matches the start of a symbol, i.e. any identifier or
452ea855 578keyword. It's unspecified how far it matches. Does not contain a \\|
d9e94c22
MS
579operator at the top level."
580 t (concat "[" c-alpha "_]")
452ea855 581 java (concat "[" c-alpha "_@]")
542dfbde 582 objc (concat "[" c-alpha "_@]")
d9e94c22
MS
583 pike (concat "[" c-alpha "_`]"))
584(c-lang-defvar c-symbol-start (c-lang-const c-symbol-start))
585
586(c-lang-defconst c-symbol-chars
587 "Set of characters that can be part of a symbol.
bf2c1571 588This is of the form that fits inside [ ] in a regexp."
d9e94c22
MS
589 ;; Pike note: With the backquote identifiers this would include most
590 ;; operator chars too, but they are handled with other means instead.
591 t (concat c-alnum "_$")
592 objc (concat c-alnum "_$@"))
b248a85d 593(c-lang-defvar c-symbol-chars (c-lang-const c-symbol-chars))
a66cd3ee 594
a66cd3ee 595(c-lang-defconst c-symbol-key
0386b551
AM
596 "Regexp matching identifiers and keywords (with submatch 0). Assumed
597to match if `c-symbol-start' matches on the same position."
d9e94c22
MS
598 t (concat (c-lang-const c-symbol-start)
599 "[" (c-lang-const c-symbol-chars) "]*")
600 pike (concat
601 ;; Use the value from C here since the operator backquote is
602 ;; covered by the other alternative.
603 (c-lang-const c-symbol-key c)
604 "\\|"
605 (c-make-keywords-re nil
606 (c-lang-const c-overloadable-operators))))
607(c-lang-defvar c-symbol-key (c-lang-const c-symbol-key))
608
609(c-lang-defconst c-symbol-key-depth
610 ;; Number of regexp grouping parens in `c-symbol-key'.
0386b551 611 t (regexp-opt-depth (c-lang-const c-symbol-key)))
d9e94c22
MS
612
613(c-lang-defconst c-nonsymbol-chars
614 "This is the set of chars that can't be part of a symbol, i.e. the
615negation of `c-symbol-chars'."
616 t (concat "^" (c-lang-const c-symbol-chars)))
617(c-lang-defvar c-nonsymbol-chars (c-lang-const c-nonsymbol-chars))
618
619(c-lang-defconst c-nonsymbol-key
620 "Regexp that matches any character that can't be part of a symbol.
621It's usually appended to other regexps to avoid matching a prefix.
622It's assumed to not contain any submatchers."
623 ;; The same thing regarding Unicode identifiers applies here as to
624 ;; `c-symbol-key'.
625 t (concat "[" (c-lang-const c-nonsymbol-chars) "]"))
626
0386b551
AM
627(c-lang-defconst c-identifier-ops
628 "The operators that make up fully qualified identifiers. nil in
629languages that don't have such things. See `c-operators' for a
630description of the format. Binary operators can concatenate symbols,
631e.g. \"::\" in \"A::B::C\". Prefix operators can precede identifiers,
632e.g. \"~\" in \"~A::B\". Other types of operators aren't supported.
633
634This value is by default merged into `c-operators'."
d9e94c22 635 t nil
0386b551
AM
636 c++ '((prefix "~" "??-" "compl")
637 (right-assoc "::")
638 (prefix "::"))
2a15eb73
MS
639 ;; Java has "." to concatenate identifiers but it's also used for
640 ;; normal indexing. There's special code in the Java font lock
641 ;; rules to fontify qualified identifiers based on the standard
642 ;; naming conventions. We still define "." here to make
643 ;; `c-forward-name' move over as long names as possible which is
644 ;; necessary to e.g. handle throws clauses correctly.
0386b551
AM
645 java '((left-assoc "."))
646 idl '((left-assoc "::")
647 (prefix "::"))
648 pike '((left-assoc "::")
649 (prefix "::")
650 (left-assoc ".")))
651
(c-lang-defconst c-opt-identifier-concat-key
  ;; Appendable adorned regexp matching the operators that join
  ;; symbols to fully qualified identifiers, or nil in languages that
  ;; don't have such things.
  ;;
  ;; This was a docstring constant in 5.30.  It still works but is now
  ;; considered internal - change `c-identifier-ops' instead.
  t (let ((ops (c-filter-ops (c-lang-const c-identifier-ops)
                             '(left-assoc right-assoc)
                             t)))
      ;; Without any binary operators in `c-identifier-ops' there is
      ;; nothing to build a regexp from, so the value is nil.
      (and ops
           (c-make-keywords-re 'appendable ops))))
(c-lang-defvar c-opt-identifier-concat-key
  (c-lang-const c-opt-identifier-concat-key)
  'dont-doc)
667
0386b551
AM
668(c-lang-defconst c-opt-identifier-concat-key-depth
669 ;; Number of regexp grouping parens in `c-opt-identifier-concat-key'.
670 t (regexp-opt-depth (c-lang-const c-opt-identifier-concat-key)))
671
(c-lang-defconst c-opt-identifier-prefix-key
  ;; Appendable adorned regexp matching operators that might precede
  ;; an identifier and that are part of the identifier in that case.
  ;; nil in languages without such things.
  t (let ((ops (c-filter-ops (c-lang-const c-identifier-ops)
                             '(prefix)
                             t)))
      ;; Without any prefix operators in `c-identifier-ops' there is
      ;; nothing to build a regexp from, so the value is nil.
      (and ops
           (c-make-keywords-re 'appendable ops))))
681
682(c-lang-defconst c-after-id-concat-ops
683 "Operators that can occur after a binary operator on `c-identifier-ops'
684in identifiers. nil in languages that don't have such things.
685
686Operators here should also have appropriate entries in `c-operators' -
687it's not taken care of by default."
688 t nil
689 ;; '~' for destructors in C++, '*' for member pointers.
690 c++ '("~" "*")
691 ;; In Java we recognize '*' to deal with "foo.bar.*" that can occur
692 ;; in import declarations. (This will also match bogus things like
693 ;; "foo.*bar" but we don't bother.)
694 java '("*"))
695
(c-lang-defconst c-opt-after-id-concat-key
  ;; Regexp that must match the token after
  ;; `c-opt-identifier-concat-key' for it to be considered an
  ;; identifier concatenation operator (which e.g. causes the
  ;; preceding identifier to be fontified as a reference).  Assumed to
  ;; be a string if `c-opt-identifier-concat-key' is.
  ;;
  ;; This was a docstring constant in 5.30.  It still works but is now
  ;; considered internal - change `c-after-id-concat-ops' instead.
  t (let ((after-ops (c-lang-const c-after-id-concat-ops)))
      ;; The symbol start regexp, plus an alternative for the
      ;; `c-after-id-concat-ops' operators when the language has any.
      ;; `concat' treats the nil arguments as empty.
      (concat (c-lang-const c-symbol-start)
              (and after-ops "\\|")
              (and after-ops
                   (c-make-keywords-re 'appendable after-ops)))))
d9e94c22
MS
710
(c-lang-defconst c-identifier-start
  "Regexp that matches the start of an (optionally qualified) identifier.
It should also match all keywords.  It's unspecified how far it
matches."
  ;; `c-symbol-start', plus `c-opt-identifier-prefix-key' as an
  ;; alternative in the languages where that is non-nil.
  t (let ((prefix-key (c-lang-const c-opt-identifier-prefix-key)))
      (if prefix-key
          (concat (c-lang-const c-symbol-start) "\\|" prefix-key)
        (concat (c-lang-const c-symbol-start)))))
(c-lang-defvar c-identifier-start (c-lang-const c-identifier-start))
721
(c-lang-defconst c-identifier-key
  "Regexp matching a fully qualified identifier, like \"A::B::c\" in
C++.  It does not recognize the full range of syntactic whitespace
between the tokens; `c-forward-name' has to be used for that.  It
should also not match identifiers containing parenthesis groupings,
e.g. identifiers with template arguments such as \"A<X,Y>\" in C++."
  ;; This regexp is more complex than strictly necessary to ensure
  ;; that it can be matched with a minimum of backtracking.
  ;;
  ;; Layout of the generated regexp:
  ;;   [ PREFIX-OP ws* ]?  SYMBOL  ( ws* CONCAT-OP ws* TAIL )*
  ;; where TAIL is either an operator from `c-after-id-concat-ops'
  ;; optionally followed by a symbol, or just a symbol.
  t (concat
     ;; Optional leading prefix operator, only in languages that
     ;; define `c-opt-identifier-prefix-key'.
     (if (c-lang-const c-opt-identifier-prefix-key)
         (concat
          "\\("
          (c-lang-const c-opt-identifier-prefix-key)
          (c-lang-const c-simple-ws) "*"
          "\\)?")
       "")
     ;; The first symbol.
     "\\(" (c-lang-const c-symbol-key) "\\)"
     ;; Any number of "CONCAT-OP TAIL" continuations, only in
     ;; languages that define `c-opt-identifier-concat-key'.
     (if (c-lang-const c-opt-identifier-concat-key)
         (concat
          "\\("
          (c-lang-const c-simple-ws) "*"
          (c-lang-const c-opt-identifier-concat-key)
          (c-lang-const c-simple-ws) "*"
          (if (c-lang-const c-after-id-concat-ops)
              (concat
               "\\("
               (c-make-keywords-re 'appendable
                 (c-lang-const c-after-id-concat-ops))
               (concat
                ;; For flexibility, consider the symbol match
                ;; optional if we've hit a
                ;; `c-after-id-concat-ops' operator.  This is
                ;; also necessary to handle the "*" that can
                ;; end import declaration identifiers in Java.
                "\\("
                (c-lang-const c-simple-ws) "*"
                "\\(" (c-lang-const c-symbol-key) "\\)"
                "\\)?")
               "\\|"
               "\\(" (c-lang-const c-symbol-key) "\\)"
               "\\)")
            (concat "\\(" (c-lang-const c-symbol-key) "\\)"))
          "\\)*")
       "")))
(c-lang-defvar c-identifier-key (c-lang-const c-identifier-key))
766
(c-lang-defconst c-identifier-last-sym-match
  ;; This was a docstring constant in 5.30 but it's no longer used.
  ;; It's only kept to avoid breaking third party code.
  ;;
  ;; It was used to identify the submatch in `c-identifier-key' that
  ;; surrounds the last symbol in the qualified identifier.  It's a
  ;; list of submatch numbers, of which the first that has a match is
  ;; taken.  It's assumed that at least one does when the regexp has
  ;; matched.
  t nil)
777
(c-lang-defconst c-string-escaped-newlines
  "Set if the language supports backslash escaped newlines inside string
literals."
  t nil
  (c c++ objc pike) t)
(c-lang-defvar c-string-escaped-newlines
  (c-lang-const c-string-escaped-newlines))
785
(c-lang-defconst c-multiline-string-start-char
  "Set if the language supports multiline string literals without escaped
newlines.  If t, all string literals are multiline.  If a character,
only literals where the open quote is immediately preceded by that
character are multiline."
  t    nil
  ;; In Pike the character is `#'.
  pike ?#)
(c-lang-defvar c-multiline-string-start-char
  (c-lang-const c-multiline-string-start-char))
d9e94c22 795
536610a4
AM
(c-lang-defconst c-opt-cpp-symbol
  "The symbol which starts preprocessor constructs when in the margin.
nil in Java and AWK."
  t "#"
  (java awk) nil)
(c-lang-defvar c-opt-cpp-symbol (c-lang-const c-opt-cpp-symbol))
801
d9e94c22
MS
(c-lang-defconst c-opt-cpp-prefix
  "Regexp matching the prefix of a cpp directive in the languages that
normally use that macro preprocessor.  Tested at bol or at boi.
Assumed to not contain any submatches or \\| operators.
nil in Java and AWK."
  ;; TODO (ACM, 2005-04-01).  Amend the following to recognize escaped NLs;
  ;; amend all uses of c-opt-cpp-prefix which count regexp-depth.
  ;;
  ;; The default matches optional whitespace, "#", optional whitespace.
  t "\\s *#\\s *"
  (java awk) nil)
(c-lang-defvar c-opt-cpp-prefix (c-lang-const c-opt-cpp-prefix))
811
5ee2e988
AM
(c-lang-defconst c-anchored-cpp-prefix
  "Regexp matching the prefix of a cpp directive anchored to BOL,
in the languages that have a macro preprocessor.  The first submatch
surrounds the \"#\".  nil in Java and AWK."
  t "^\\s *\\(#\\)\\s *"
  (java awk) nil)
(c-lang-defvar c-anchored-cpp-prefix (c-lang-const c-anchored-cpp-prefix))
818
d9e94c22
MS
(c-lang-defconst c-opt-cpp-start
  "Regexp matching the prefix of a cpp directive including the directive
name, or nil in languages without preprocessor support.  The first
submatch surrounds the directive name."
  ;; Default: the cpp prefix followed by a run of `c-alnum' characters.
  t (let ((cpp-prefix (c-lang-const c-opt-cpp-prefix)))
      (when cpp-prefix
        (concat cpp-prefix
                "\\([" c-alnum "]+\\)")))
  ;; Pike, being a scripting language, recognizes hash-bangs too, so
  ;; a lone "!" is accepted as the directive name as well.
  pike (concat (c-lang-const c-opt-cpp-prefix)
               "\\([" c-alnum "]+\\|!\\)"))
(c-lang-defvar c-opt-cpp-start (c-lang-const c-opt-cpp-start))
830
0386b551
AM
(c-lang-defconst c-cpp-message-directives
  "List of cpp directives (without the prefix) that are followed by a
string message."
  ;; Default: only "error", and only when the language has a cpp prefix.
  t (if (c-lang-const c-opt-cpp-prefix)
        '("error"))
  (c c++ objc pike) '("error" "warning"))
0386b551
AM
837
(c-lang-defconst c-cpp-include-directives
  "List of cpp directives (without the prefix) that are followed by a
file name in angle brackets or quotes."
  ;; Default: only "include", and only when the language has a cpp prefix.
  t (if (c-lang-const c-opt-cpp-prefix)
        '("include"))
  ;; Objective-C additionally has "import".
  objc '("include" "import"))
844
(c-lang-defconst c-opt-cpp-macro-define
  "Cpp directive (without the prefix) that is followed by a macro
definition, or nil if the language doesn't have any."
  ;; "define" in every language that has a cpp prefix, otherwise nil.
  t (if (c-lang-const c-opt-cpp-prefix)
        "define"))
(c-lang-defvar c-opt-cpp-macro-define
  (c-lang-const c-opt-cpp-macro-define))
0386b551
AM
852
(c-lang-defconst c-opt-cpp-macro-define-start
  ;; Regexp matching everything up to the macro body of a cpp define, or the
  ;; end of the logical line if there is none.  Submatch 1 is the name of the
  ;; macro.  Set if c-opt-cpp-macro-define is.
  t (if (c-lang-const c-opt-cpp-macro-define)
        (concat (c-lang-const c-opt-cpp-prefix)
                (c-lang-const c-opt-cpp-macro-define)
                ;; Whitespace, then the #defined name (the outermost
                ;; group, submatch 1), then an optional parenthesized
                ;; parameter list.
                "[ \t]+\\(\\(\\sw\\|_\\)+\\)\\(\([^\)]*\)\\)?"
                ;; Trailing blanks and backslash-escaped newlines.
                "\\([ \t]\\|\\\\\n\\)*")))
(c-lang-defvar c-opt-cpp-macro-define-start
  (c-lang-const c-opt-cpp-macro-define-start))
865
51c9af45
AM
(c-lang-defconst c-opt-cpp-macro-define-id
  ;; Regexp matching everything up to the end of the identifier defined
  ;; by a cpp define.  nil when `c-opt-cpp-macro-define' is nil.
  t (if (c-lang-const c-opt-cpp-macro-define)
        (concat (c-lang-const c-opt-cpp-prefix)       ; #
                (c-lang-const c-opt-cpp-macro-define) ; define
                "[ \t]+\\(\\sw\\|_\\)+")))            ; the identifier
(c-lang-defvar c-opt-cpp-macro-define-id
  (c-lang-const c-opt-cpp-macro-define-id))
875
(c-lang-defconst c-cpp-expr-directives
  "List of cpp directives (without the prefix) that are followed by an
expression."
  ;; nil in languages without a cpp prefix.
  t (if (c-lang-const c-opt-cpp-prefix)
        '("if" "elif")))
881
b128268e
AM
(c-lang-defconst c-cpp-expr-intro-re
  "Regexp which matches the start of a CPP directive which contains an
expression, or nil if there aren't any in the language."
  ;; The cpp prefix followed by an adorned keyword regexp for the
  ;; directives in `c-cpp-expr-directives'.
  t (let ((expr-directives (c-lang-const c-cpp-expr-directives)))
      (when expr-directives
        (concat (c-lang-const c-opt-cpp-prefix)
                (c-make-keywords-re t expr-directives)))))
(c-lang-defvar c-cpp-expr-intro-re
  (c-lang-const c-cpp-expr-intro-re))
891
0386b551
AM
(c-lang-defconst c-cpp-expr-functions
  "List of functions in cpp expressions."
  ;; Default: only "defined", and only when the language has a cpp prefix.
  t    (if (c-lang-const c-opt-cpp-prefix)
           '("defined"))
  pike '("defined" "efun" "constant"))
897
846f5040
MS
(c-lang-defconst c-assignment-operators
  "List of all assignment operators."
  t    '("=" "*=" "/=" "%=" "+=" "-=" ">>=" "<<=" "&=" "^=" "|=")
  ;; Java adds the unsigned right shift assignment.
  java (append (c-lang-const c-assignment-operators)
               '(">>>="))
  ;; C++ adds the alternative tokens and the trigraph spellings.
  c++  (append (c-lang-const c-assignment-operators)
               '("and_eq" "or_eq" "xor_eq" "??!=" "??'="))
  ;; IDL has no assignment operators.
  idl  nil)
906
d9e94c22
MS
(c-lang-defconst c-operators
  "List describing all operators, along with their precedence and
associativity.  The order in the list corresponds to the precedence of
the operators: The operators in each element are a group with the same
precedence, and the group has higher precedence than the groups in all
following elements.  The car of each element describes the type of the
operator group, and the cdr is a list of the operator tokens in it.
The operator group types are:

'prefix         Unary prefix operators.
'postfix        Unary postfix operators.
'postfix-if-paren
                Unary postfix operators if and only if the chars have
                parenthesis syntax.
'left-assoc     Binary left associative operators (i.e. a+b+c means (a+b)+c).
'right-assoc    Binary right associative operators (i.e. a=b=c means a=(b=c)).
'right-assoc-sequence
                Right associative operator that consists of a
                sequence of tokens that separate expressions.  All the
                tokens in the group are in this case taken as
                describing the sequence in one such operator, and the
                order between them is therefore significant.

Operators containing a character with paren syntax are taken to match
with a corresponding open/close paren somewhere else.  A postfix
operator with close paren syntax is taken to end a postfix expression
started somewhere earlier, rather than start a new one at point.  Vice
versa for prefix operators with open paren syntax.

Note that operators like \".\" and \"->\" which in language references
often are described as postfix operators are considered binary here,
since CC Mode treats every identifier as an expression."

  ;; There's currently no code in CC Mode that exploits all the info
  ;; in this variable; precedence, associativity etc are present as a
  ;; preparation for future work.

  t `(;; Preprocessor.
      ,@(when (c-lang-const c-opt-cpp-prefix)
          `((prefix "#"
                    ,@(when (c-major-mode-is '(c-mode c++-mode))
                        '("%:" "??=")))
            (left-assoc "##"
                        ,@(when (c-major-mode-is '(c-mode c++-mode))
                            '("%:%:" "??=??=")))))

      ;; Primary.
      ,@(c-lang-const c-identifier-ops)
      ;; Templates (C++) and generics (Java).  This is tested
      ;; separately from the keyword-like prefix operators below:
      ;; when both tests lived in a single `cond', the `java-mode'
      ;; match here shadowed the later `java-mode' clause and "super"
      ;; was never added.
      ,@(when (c-major-mode-is '(c++-mode java-mode))
          `((postfix-if-paren "<" ">")))
      ,@(cond ((c-major-mode-is 'pike-mode)
               `((prefix "global" "predef")))
              ((c-major-mode-is 'java-mode)
               `((prefix "super"))))

      ;; Postfix.
      ,@(when (c-major-mode-is 'c++-mode)
          ;; The following need special treatment.
          `((prefix "dynamic_cast" "static_cast"
                    "reinterpret_cast" "const_cast" "typeid")))
      (left-assoc "."
                  ,@(unless (c-major-mode-is 'java-mode)
                      '("->")))
      (postfix "++" "--" "[" "]" "(" ")"
               ,@(when (c-major-mode-is '(c-mode c++-mode))
                   '("<:" ":>" "??(" "??)")))

      ;; Unary.
      (prefix "++" "--" "+" "-" "!" "~"
              ,@(when (c-major-mode-is 'c++-mode) '("not" "compl"))
              ,@(when (c-major-mode-is '(c-mode c++-mode))
                  '("*" "&" "sizeof" "??-"))
              ,@(when (c-major-mode-is 'objc-mode)
                  '("@selector" "@protocol" "@encode"))
              ;; The following need special treatment.
              ,@(cond ((c-major-mode-is 'c++-mode)
                       '("new" "delete"))
                      ((c-major-mode-is 'java-mode)
                       '("new"))
                      ((c-major-mode-is 'pike-mode)
                       '("class" "lambda" "catch" "throw" "gauge")))
              "(" ")"                   ; Cast.
              ,@(when (c-major-mode-is 'pike-mode)
                  '("[" "]")))          ; Type cast.

      ;; Member selection.
      ,@(when (c-major-mode-is 'c++-mode)
          `((left-assoc ".*" "->*")))

      ;; Multiplicative.
      (left-assoc "*" "/" "%")

      ;; Additive.
      (left-assoc "+" "-")

      ;; Shift.
      (left-assoc "<<" ">>"
                  ,@(when (c-major-mode-is 'java-mode)
                      '(">>>")))

      ;; Relational.
      (left-assoc "<" ">" "<=" ">="
                  ,@(when (c-major-mode-is 'java-mode)
                      '("instanceof")))

      ;; Equality.
      (left-assoc "==" "!="
                  ,@(when (c-major-mode-is 'c++-mode) '("not_eq")))

      ;; Bitwise and.
      (left-assoc "&"
                  ,@(when (c-major-mode-is 'c++-mode) '("bitand")))

      ;; Bitwise exclusive or.
      (left-assoc "^"
                  ,@(when (c-major-mode-is '(c-mode c++-mode))
                      '("??'"))
                  ,@(when (c-major-mode-is 'c++-mode) '("xor")))

      ;; Bitwise or.
      (left-assoc "|"
                  ,@(when (c-major-mode-is '(c-mode c++-mode))
                      '("??!"))
                  ,@(when (c-major-mode-is 'c++-mode) '("bitor")))

      ;; Logical and.
      (left-assoc "&&"
                  ,@(when (c-major-mode-is 'c++-mode) '("and")))

      ;; Logical or.
      (left-assoc "||"
                  ,@(when (c-major-mode-is '(c-mode c++-mode))
                      '("??!??!"))
                  ,@(when (c-major-mode-is 'c++-mode) '("or")))

      ;; Conditional.
      (right-assoc-sequence "?" ":")

      ;; Assignment.
      (right-assoc ,@(c-lang-const c-assignment-operators))

      ;; Exception.
      ,@(when (c-major-mode-is 'c++-mode)
          '((prefix "throw")))

      ;; Sequence.
      (left-assoc ","))

  ;; IDL got its own definition since it has a much smaller operator
  ;; set than the other languages.
  idl `(;; Preprocessor.
        (prefix "#")
        (left-assoc "##")
        ;; Primary.
        ,@(c-lang-const c-identifier-ops)
        ;; Unary.
        (prefix "+" "-" "~")
        ;; Multiplicative.
        (left-assoc "*" "/" "%")
        ;; Additive.
        (left-assoc "+" "-")
        ;; Shift.
        (left-assoc "<<" ">>")
        ;; And.
        (left-assoc "&")
        ;; Xor.
        (left-assoc "^")
        ;; Or.
        (left-assoc "|")))
1076
(c-lang-defconst c-operator-list
  ;; The operators as a flat list (without duplicates), obtained by
  ;; running every group of `c-operators' through `c-filter-ops'.
  t (c-filter-ops (c-lang-const c-operators) t t))
d9e94c22
MS
1080
(c-lang-defconst c-overloadable-operators
  "List of the operators that are overloadable, in their \"identifier
form\".  See also `c-opt-op-identifier-prefix'."
  t    nil
  c++  '("new" "delete" ;; Can be followed by "[]" but we ignore that.
         "+" "-" "*" "/" "%"
         "^" "??'" "xor" "&" "bitand" "|" "??!" "bitor" "~" "??-" "compl"
         "!" "=" "<" ">" "+=" "-=" "*=" "/=" "%=" "^="
         "??'=" "xor_eq" "&=" "and_eq" "|=" "??!=" "or_eq"
         "<<" ">>" ">>=" "<<=" "==" "!=" "not_eq" "<=" ">="
         "&&" "and" "||" "??!??!" "or" "++" "--" "," "->*" "->"
         "()" "[]" "<::>" "??(??)")
  ;; These work like identifiers in Pike.
  pike '("`+" "`-" "`&" "`|" "`^" "`<<" "`>>" "`*" "`/" "`%" "`~"
         "`==" "`<" "`>" "`!" "`[]" "`[]=" "`->" "`->=" "`()" "``+"
         "``-" "``&" "``|" "``^" "``<<" "``>>" "``*" "``/" "``%"
         "`+="))
1098
(c-lang-defconst c-overloadable-operators-regexp
  ;; Regexp tested after an "operator" token in C++.  Built from
  ;; `c-overloadable-operators'; nil in all other languages.
  t   nil
  c++ (c-make-keywords-re nil (c-lang-const c-overloadable-operators)))
(c-lang-defvar c-overloadable-operators-regexp
  (c-lang-const c-overloadable-operators-regexp))
1105
(c-lang-defconst c-opt-op-identifier-prefix
  "Regexp matching the token before the ones in
`c-overloadable-operators' when operators are specified in their
\"identifier form\".  This typically matches \"operator\" in C++ where
operator functions are specified as e.g. \"operator +\".  It's nil in
languages without operator functions or where the complete operator
identifier is listed in `c-overloadable-operators'.

This regexp is assumed to not match any non-operator identifier."
  t   nil
  ;; An adorned keyword regexp for the single keyword "operator".
  c++ (c-make-keywords-re t '("operator")))
(c-lang-defvar c-opt-op-identifier-prefix
  (c-lang-const c-opt-op-identifier-prefix))
1119
;; Note: the following alias is an old name which was a misspelling
;; ("identitier" instead of "identifier").  It has been corrected
;; above and throughout cc-engine.el.  It will be removed at some
;; release very shortly in the future.  ACM, 2006-04-14.
(defvaralias 'c-opt-op-identitier-prefix 'c-opt-op-identifier-prefix)
(make-obsolete-variable 'c-opt-op-identitier-prefix 'c-opt-op-identifier-prefix
                        "CC Mode 5.31.4, 2006-04-14")
0386b551 1126
d9e94c22
MS
(c-lang-defconst c-other-op-syntax-tokens
  "List of the tokens made up of characters in the punctuation or
parenthesis syntax classes that have uses other than as expression
operators."
  ;; The language-specific entries below each prepend their tokens to
  ;; what `c-other-op-syntax-tokens' already evaluates to.
  t '("{" "}" "(" ")" "[" "]" ";" ":" "," "=" "/*" "*/" "//")
  (c c++ pike) (append '("#" "##"       ; Used by cpp.
                         "::" "...")
                       (c-lang-const c-other-op-syntax-tokens))
  (c c++) (append '("*") (c-lang-const c-other-op-syntax-tokens))
  c++  (append '("&" "<%" "%>" "<:" ":>" "%:" "%:%:")
               (c-lang-const c-other-op-syntax-tokens))
  objc (append '("#" "##"               ; Used by cpp.
                 "+" "-") (c-lang-const c-other-op-syntax-tokens))
  idl  (append '("#" "##")              ; Used by cpp.
               (c-lang-const c-other-op-syntax-tokens))
  ;; Pike also gets its overloadable operator identifiers.
  pike (append '("..")
               (c-lang-const c-other-op-syntax-tokens)
               (c-lang-const c-overloadable-operators))
  ;; AWK has its own complete list.
  awk '("{" "}" "(" ")" "[" "]" ";" "," "=" "/"))
1146
0386b551
AM
(c-lang-defconst c-all-op-syntax-tokens
  ;; List of all tokens in the punctuation and parenthesis syntax
  ;; classes: `c-other-op-syntax-tokens' followed by
  ;; `c-operator-list', with duplicates (by `string-equal') removed.
  t (delete-duplicates (append (c-lang-const c-other-op-syntax-tokens)
                               (c-lang-const c-operator-list))
                       :test 'string-equal))
1153
(c-lang-defconst c-nonsymbol-token-char-list
  ;; List containing all chars not in the word, symbol or
  ;; syntactically irrelevant syntax classes, i.e. all punctuation,
  ;; parenthesis and string delimiter chars.
  t (c-with-syntax-table (c-lang-const c-mode-syntax-table)
      ;; Only the printable ASCII range (32 up to and including 126)
      ;; is scanned.  No language so far has 8-bit or widestring
      ;; operators.  Chars are consed onto the front, so the result
      ;; is in descending char order.
      (let ((code 32)
            token-chars)
        (while (< code 127)
          (unless (memq (char-syntax code) '(?w ?_ ?< ?> ?\ ))
            (setq token-chars (cons (c-int-to-char code) token-chars)))
          (setq code (1+ code)))
        token-chars)))
1167
d9e94c22
MS
(c-lang-defconst c-nonsymbol-token-regexp
  ;; Regexp matching all tokens in the punctuation and parenthesis
  ;; syntax classes.  Note that this also matches ".", which can start
  ;; a float.
  t (c-make-keywords-re nil
      (c-filter-ops (c-lang-const c-all-op-syntax-tokens)
                    t
                    ;; Keep only the tokens made up entirely of
                    ;; punctuation and paren syntax chars.
                    "\\`\\(\\s.\\|\\s\(\\|\\s\)\\)+\\'")))
(c-lang-defvar c-nonsymbol-token-regexp
  (c-lang-const c-nonsymbol-token-regexp))
1178
846f5040
MS
(c-lang-defconst c-assignment-op-regexp
  ;; Regexp matching all assignment operators and only them.  The
  ;; beginning of the first submatch is used to detect the end of the
  ;; token, along with the end of the whole match.
  ;;
  ;; In languages without assignment operators the value is "\\<\\>",
  ;; the same placeholder regexp used elsewhere in this file.
  t (let ((assign-ops (c-lang-const c-assignment-operators)))
      (if assign-ops
          (concat
           ;; "=" is handled on its own since it's a prefix of "==".
           "=\\([^=]\\|$\\)"
           "\\|"
           ;; Every other assignment operator.
           (c-make-keywords-re nil
             (set-difference assign-ops
                             '("=")
                             :test 'string-equal)))
        "\\<\\>")))
(c-lang-defvar c-assignment-op-regexp
  (c-lang-const c-assignment-op-regexp))
1195
0386b551
AM
(c-lang-defconst c-<>-multichar-token-regexp
  ;; Regexp matching all tokens containing "<" or ">" which are longer
  ;; than one char.
  t (c-make-keywords-re nil
      (c-filter-ops (c-lang-const c-all-op-syntax-tokens)
                    t
                    ;; Select tokens where a "<" or ">" has another
                    ;; char before or after it.
                    ".[<>]\\|[<>].")))
(c-lang-defvar c-<>-multichar-token-regexp
  (c-lang-const c-<>-multichar-token-regexp))
1205
d9e94c22
MS
(c-lang-defconst c-<-op-cont-regexp
  ;; Regexp matching the second and subsequent characters of all
  ;; multicharacter tokens that begin with "<".
  t (c-make-keywords-re nil
      (c-filter-ops (c-lang-const c-all-op-syntax-tokens)
                    t
                    ;; Tokens starting with "<" plus at least one more char ...
                    "\\`<."
                    ;; ... with that leading "<" stripped off.
                    (lambda (op) (substring op 1)))))

(c-lang-defvar c-<-op-cont-regexp (c-lang-const c-<-op-cont-regexp))
1216
(c-lang-defconst c->-op-cont-regexp
  ;; Regexp matching the second and subsequent characters of all
  ;; multicharacter tokens that begin with ">".
  t (c-make-keywords-re nil
      (c-filter-ops (c-lang-const c-all-op-syntax-tokens)
                    t
                    ;; Tokens starting with ">" plus at least one more char ...
                    "\\`>."
                    ;; ... with that leading ">" stripped off.
                    (lambda (op) (substring op 1))))
  ;; Java uses a narrower filter: only tokens where the leading ">"
  ;; or ">>" is followed by something other than ">".
  java (c-make-keywords-re nil
         (c-filter-ops (c-lang-const c-all-op-syntax-tokens)
                       t
                       "\\`>[^>]\\|\\`>>[^>]"
                       (lambda (op) (substring op 1)))))

(c-lang-defvar c->-op-cont-regexp (c-lang-const c->-op-cont-regexp))
1232
(c-lang-defconst c-stmt-delim-chars
  ;; The characters that should be considered to bound statements.  To
  ;; optimize `c-crosses-statement-barrier-p' somewhat, it's assumed to
  ;; begin with "^" to negate the set.  If ? : operators should be
  ;; detected then the string must end with "?:".
  t "^;{}?:")
(c-lang-defvar c-stmt-delim-chars (c-lang-const c-stmt-delim-chars))
1240
(c-lang-defconst c-stmt-delim-chars-with-comma
  ;; Variant of `c-stmt-delim-chars' that additionally contains ','.
  ;; Like that constant it begins with "^" and ends with "?:".
  t "^;,{}?:")
(c-lang-defvar c-stmt-delim-chars-with-comma
  (c-lang-const c-stmt-delim-chars-with-comma))
1246
1247\f
1248;;; Syntactic whitespace.
1249
0386b551
AM
(c-lang-defconst c-simple-ws
  "Regexp matching an ordinary whitespace character.
Does not contain a \\| operator at the top level."
  ;; "\\s " is not enough since it doesn't match line breaks, so
  ;; newline and carriage return are listed explicitly.  The whole
  ;; alternation is wrapped in a group to keep \| off the top level.
  t "\\(\\s \\|[\n\r]\\)")
1255
(c-lang-defconst c-simple-ws-depth
  ;; Number of regexp grouping parens in `c-simple-ws', as reported
  ;; by `regexp-opt-depth'.
  t (regexp-opt-depth (c-lang-const c-simple-ws)))
1259
(c-lang-defconst c-line-comment-starter
  "String that starts line comments, or nil if such don't exist.
Line comments are always terminated by newlines.  At least one of
`c-block-comment-starter' and this one is assumed to be set.

Note that it's currently not enough to set this to support a new
comment style.  Other stuff like the syntax table must also be set up
properly."
  t   "//"
  awk "#")
(c-lang-defvar c-line-comment-starter (c-lang-const c-line-comment-starter))
1271
(c-lang-defconst c-block-comment-starter
  "String that starts block comments, or nil if such don't exist.
Block comments are ended by `c-block-comment-ender', which is assumed
to be set if this is.  At least one of `c-line-comment-starter' and
this one is assumed to be set.

Note that it's currently not enough to set this to support a new
comment style.  Other stuff like the syntax table must also be set up
properly."
  t   "/*"
  ;; AWK has no block comments.
  awk nil)
1283
(c-lang-defconst c-block-comment-ender
  "String that ends block comments, or nil if such don't exist.

Note that it's currently not enough to set this to support a new
comment style.  Other stuff like the syntax table must also be set up
properly."
  t   "*/"
  ;; AWK has no block comments.
  awk nil)
1292
d9e94c22
MS
(c-lang-defconst c-comment-start-regexp
  ;; Regexp to match the start of any type of comment: the line and
  ;; block comment starters, plus generic comment delimiter syntax
  ;; when `c-emacs-features' contains `gen-comment-delim'.
  t (let* ((starters (list (c-lang-const c-line-comment-starter)
                           (c-lang-const c-block-comment-starter)))
           (starter-re (c-make-keywords-re nil starters)))
      (if (memq 'gen-comment-delim c-emacs-features)
          (concat starter-re "\\|\\s!")
        starter-re)))
(c-lang-defvar c-comment-start-regexp (c-lang-const c-comment-start-regexp))
1302
0386b551
AM
(c-lang-defconst c-block-comment-start-regexp
  ;; Regexp which matches the start of a block comment (if such exists in the
  ;; language).  Without a block comment starter the value is "\\<\\>".
  t (let ((block-starter (c-lang-const c-block-comment-starter)))
      (if block-starter
          (regexp-quote block-starter)
        "\\<\\>")))
(c-lang-defvar c-block-comment-start-regexp
  (c-lang-const c-block-comment-start-regexp))
1311
536610a4
AM
(c-lang-defconst c-line-comment-start-regexp
  ;; Regexp which matches the start of a line comment (if such exists in the
  ;; language; it does in all 7 CC Mode languages).  Without a line
  ;; comment starter the value is "\\<\\>".
  t (let ((line-starter (c-lang-const c-line-comment-starter)))
      (if line-starter
          (regexp-quote line-starter)
        "\\<\\>")))
(c-lang-defvar c-line-comment-start-regexp
  (c-lang-const c-line-comment-start-regexp))
d9e94c22
MS
(c-lang-defconst c-literal-start-regexp
  ;; Regexp to match the start of comments and string literals.
  t (concat (c-lang-const c-comment-start-regexp)
            "\\|"
            (if (memq 'gen-string-delim c-emacs-features)
                ;; A double quote, or any char with generic string
                ;; delimiter syntax.  The alternation must be spelled
                ;; "\\|": a bare "|" is an ordinary char in Emacs
                ;; regexps, so "\"|" would only match a quote
                ;; followed by a literal "|".
                "\"\\|\\s|"
              "\"")))
(c-lang-defvar c-literal-start-regexp (c-lang-const c-literal-start-regexp))
1329
(c-lang-defconst c-doc-comment-start-regexp
  "Regexp to match the start of documentation comments."
  ;; Default: the "\\<\\>" placeholder regexp.
  t    "\\<\\>"
  ;; From font-lock.el: `doxygen' uses /*! while others use /**.
  (c c++ objc) "/\\*[*!]"
  java "/\\*\\*"
  pike "/[/*]!")
(c-lang-defvar c-doc-comment-start-regexp
  (c-lang-const c-doc-comment-start-regexp))
1339
(c-lang-defconst comment-start
  "String that starts comments inserted with M-; etc.
`comment-start' is initialized from this."
  ;; Default: Prefer line comments to block comments, and pad with a space.
  t (concat (or (c-lang-const c-line-comment-starter)
                (c-lang-const c-block-comment-starter))
            " ")
  ;; In C we still default to the block comment style since line
  ;; comments aren't entirely portable.
  c "/* ")
(c-lang-setvar comment-start (c-lang-const comment-start))
d9e94c22
MS
1351
(c-lang-defconst comment-end
  "String that ends comments inserted with M-; etc.
`comment-end' is initialized from this."
  ;; Default: Use block comment style if comment-start uses block
  ;; comments, and pad with a space in that case.  Otherwise the
  ;; value is the empty string.
  t (if (string-match (concat "\\`\\("
                              (c-lang-const c-block-comment-start-regexp)
                              "\\)")
                      (c-lang-const comment-start))
        (concat " " (c-lang-const c-block-comment-ender))
      ""))
(c-lang-setvar comment-end (c-lang-const comment-end))
d9e94c22
MS
1364
(c-lang-defconst comment-start-skip
  "Regexp to match the start of a comment plus everything up to its body.
`comment-start-skip' is initialized from this."
  ;; Default: Allow the last char of the comment starter(s) to be
  ;; repeated, then allow any amount of horizontal whitespace.
  t (concat "\\("
            (c-concat-separated
             ;; One alternative per comment starter; a nil starter
             ;; yields a nil entry here.
             (mapcar (lambda (cs)
                       (when cs
                         (concat (regexp-quote cs) "+")))
                     (list (c-lang-const c-line-comment-starter)
                           (c-lang-const c-block-comment-starter)))
             "\\|")
            "\\)\\s *"))
(c-lang-setvar comment-start-skip (c-lang-const comment-start-skip))
d9e94c22 1380
(c-lang-defconst c-syntactic-ws-start
  ;; Regexp matching any sequence that can start syntactic whitespace.
  ;; The only uncertain case is '#' when there are cpp directives.
  t (concat "\\s \\|"
            ;; The comment starters, "#" in languages with a cpp
            ;; prefix, and line breaks.
            (c-make-keywords-re nil
              (append (list (c-lang-const c-line-comment-starter)
                            (c-lang-const c-block-comment-starter)
                            (when (c-lang-const c-opt-cpp-prefix)
                              "#"))
                      '("\n" "\r")))
            ;; A backslash-escaped line break.
            "\\|\\\\[\n\r]"
            ;; Generic comment delimiter syntax, where supported.
            (when (memq 'gen-comment-delim c-emacs-features)
              "\\|\\s!")))
(c-lang-defvar c-syntactic-ws-start (c-lang-const c-syntactic-ws-start))
d9e94c22 1395
(c-lang-defconst c-syntactic-ws-end
  ;; Regexp matching any single character that might end syntactic whitespace.
  t (concat "\\s \\|"
            (c-make-keywords-re nil
              ;; The last char of the block comment ender (if the
              ;; language has one), and line breaks.
              (append (when (c-lang-const c-block-comment-ender)
                        (list
                         (string
                          (elt (c-lang-const c-block-comment-ender)
                               (1- (length
                                    (c-lang-const c-block-comment-ender)))))))
                      '("\n" "\r")))
            ;; Generic comment delimiter syntax, where supported.
            (when (memq 'gen-comment-delim c-emacs-features)
              "\\|\\s!")))
(c-lang-defvar c-syntactic-ws-end (c-lang-const c-syntactic-ws-end))
1410
(c-lang-defconst c-unterminated-block-comment-regexp
  ;; Regexp matching an unterminated block comment that doesn't
  ;; contain line breaks, or nil in languages without block comments.
  ;; Does not contain a \| operator at the top level.
  ;;
  ;; Only block comment enders of length 1 or 2 are supported; any
  ;; other length signals an error.
  t (when (c-lang-const c-block-comment-starter)
      (concat
       (regexp-quote (c-lang-const c-block-comment-starter))
       ;; It's messy to cook together a regexp that matches anything
       ;; but c-block-comment-ender.
       (let ((end (c-lang-const c-block-comment-ender)))
         (cond ((= (length end) 1)
                ;; Anything but the ender char or a line break.
                (concat "[^" end "\n\r]*"))
               ((= (length end) 2)
                ;; Text free of the ender's first char, followed by
                ;; any number of: a run of that first char, one char
                ;; that neither completes the ender nor is a line
                ;; break, and more text free of the first char.
                (concat "[^" (substring end 0 1) "\n\r]*"
                        "\\("
                        (regexp-quote (substring end 0 1)) "+"
                        "[^"
                        ;; The quoting rules inside char classes are silly. :P
                        ;; A "]" as the ender's second char has to come
                        ;; first in the class.
                        (cond ((= (elt end 0) (elt end 1))
                               (concat (substring end 0 1) "\n\r"))
                              ((= (elt end 1) ?\])
                               (concat (substring end 1 2) "\n\r"
                                       (substring end 0 1)))
                              (t
                               (concat (substring end 0 1) "\n\r"
                                       (substring end 1 2))))
                        "]"
                        "[^" (substring end 0 1) "\n\r]*"
                        "\\)*"))
               (t
                (error "Can't handle a block comment ender of length %s"
                       (length end))))))))
1443
(c-lang-defconst c-block-comment-regexp
  ;; Regexp matching a block comment that doesn't contain line breaks,
  ;; or nil in languages without block comments.  The reason we don't
  ;; allow line breaks is to avoid going very far and risk running out
  ;; of regexp stack; this regexp is intended to handle only short
  ;; comments that might be put in the middle of limited constructs
  ;; like declarations.  Does not contain a \| operator at the top
  ;; level.
  ;;
  ;; This is `c-unterminated-block-comment-regexp' followed by a
  ;; regexp for the ender itself.
  t (when (c-lang-const c-unterminated-block-comment-regexp)
      (concat
       (c-lang-const c-unterminated-block-comment-regexp)
       (let ((end (c-lang-const c-block-comment-ender)))
         (cond ((= (length end) 1)
                (regexp-quote end))
               ((= (length end) 2)
                ;; The ender's first char may be repeated before its
                ;; second char.
                (concat (regexp-quote (substring end 0 1)) "+"
                        (regexp-quote (substring end 1 2))))
               (t
                (error "Can't handle a block comment ender of length %s"
                       (length end))))))))
d9e94c22
MS
1464
(c-lang-defconst c-nonwhite-syntactic-ws
  ;; Regexp matching a piece of syntactic whitespace that isn't a
  ;; sequence of simple whitespace characters.  As opposed to
  ;; `c-(forward|backward)-syntactic-ws', this doesn't regard cpp
  ;; directives as syntactic whitespace.
  ;;
  ;; The alternatives are joined with \| at the top level.
  t (c-concat-separated
     (list
      ;; A line comment up to and including its line break.
      (when (c-lang-const c-line-comment-starter)
        (concat (regexp-quote (c-lang-const c-line-comment-starter))
                "[^\n\r]*[\n\r]"))
      ;; A block comment without line breaks.
      (c-lang-const c-block-comment-regexp)
      ;; A backslash-escaped line break.
      "\\\\[\n\r]"
      ;; A comment bounded by generic comment delimiters.
      (when (memq 'gen-comment-delim c-emacs-features)
        "\\s!\\S!*\\s!"))
     "\\|"))
d9e94c22
MS
1479
(c-lang-defconst c-syntactic-ws
  ;; Regexp matching syntactic whitespace, including possibly the
  ;; empty string.  As opposed to `c-(forward|backward)-syntactic-ws',
  ;; this doesn't regard cpp directives as syntactic whitespace.  Does
  ;; not contain a \| operator at the top level.
  ;;
  ;; Shape: simple-ws* ( nonwhite-syntactic-ws simple-ws* )*
  t (concat (c-lang-const c-simple-ws) "*"
            "\\("
            (concat "\\(" (c-lang-const c-nonwhite-syntactic-ws) "\\)"
                    (c-lang-const c-simple-ws) "*")
            "\\)*"))
d9e94c22
MS
1490
(c-lang-defconst c-syntactic-ws-depth
  ;; Number of regexp grouping parens in `c-syntactic-ws', as
  ;; reported by `regexp-opt-depth'.
  t (regexp-opt-depth (c-lang-const c-syntactic-ws)))
d9e94c22
MS
1494
(c-lang-defconst c-nonempty-syntactic-ws
  ;; Regexp matching syntactic whitespace, which is at least one
  ;; character long.  As opposed to `c-(forward|backward)-syntactic-ws',
  ;; this doesn't regard cpp directives as syntactic whitespace.  Does
  ;; not contain a \| operator at the top level.
  ;;
  ;; Shape: ( simple-ws | nonwhite-syntactic-ws )+
  t (concat "\\("
            (c-lang-const c-simple-ws)
            "\\|"
            (c-lang-const c-nonwhite-syntactic-ws)
            "\\)+"))
1505
1506(c-lang-defconst c-nonempty-syntactic-ws-depth
1507 ;; Number of regexp grouping parens in `c-nonempty-syntactic-ws'.
0386b551 1508 t (regexp-opt-depth (c-lang-const c-nonempty-syntactic-ws)))
d9e94c22
MS
1509
1510(c-lang-defconst c-single-line-syntactic-ws
1511 ;; Regexp matching syntactic whitespace without any line breaks. As
1512 ;; opposed to `c-(forward|backward)-syntactic-ws', this doesn't
1513 ;; regard cpp directives as syntactic whitespace. Does not contain
1514 ;; a \| operator at the top level.
0386b551
AM
1515 t (if (c-lang-const c-block-comment-regexp)
1516 (concat "\\s *\\("
1517 (c-lang-const c-block-comment-regexp)
1518 "\\s *\\)*")
1519 "\\s *"))
d9e94c22
MS
1520
1521(c-lang-defconst c-single-line-syntactic-ws-depth
1522 ;; Number of regexp grouping parens in `c-single-line-syntactic-ws'.
0386b551 1523 t (regexp-opt-depth (c-lang-const c-single-line-syntactic-ws)))
d9e94c22 1524
0386b551 1525(c-lang-defconst c-syntactic-eol
d9e94c22
MS
1526 ;; Regexp that matches when there is no syntactically significant
1527 ;; text before eol. Macros are regarded as syntactically
1528 ;; significant text here.
0386b551
AM
1529 t (concat (c-lang-const c-single-line-syntactic-ws)
1530 ;; Match eol (possibly inside a block comment or preceded
1531 ;; by a line continuation backslash), or the beginning of a
1532 ;; line comment. Note: This has to be modified for awk
1533 ;; where line comments start with '#'.
1534 "\\("
1535 (c-concat-separated
1536 (list (when (c-lang-const c-line-comment-starter)
1537 (regexp-quote (c-lang-const c-line-comment-starter)))
1538 (when (c-lang-const c-unterminated-block-comment-regexp)
1539 (concat (c-lang-const c-unterminated-block-comment-regexp)
1540 "$"))
1541 "\\\\$"
d9e94c22 1542 "$")
0386b551
AM
1543 "\\|")
1544 "\\)"))
1545(c-lang-defvar c-syntactic-eol (c-lang-const c-syntactic-eol))
1546
1547\f
28abe5e2
AM
1548;;; Defun functions
1549
1550;; The Emacs variables beginning-of-defun-function and
1551;; end-of-defun-function will be set so that commands like
1552;; `mark-defun' and `narrow-to-defun' work right. The key sequences
1553;; C-M-a and C-M-e are, however, bound directly to the CC Mode
e1dbe924 1554;; functions, allowing optimization for large n.
28abe5e2
AM
1555(c-lang-defconst beginning-of-defun-function
1556 "Function to which beginning-of-defun-function will be set."
1557 t 'c-beginning-of-defun
1558 awk 'c-awk-beginning-of-defun)
1559(c-lang-setvar beginning-of-defun-function
1560 (c-lang-const beginning-of-defun-function))
1561
1562(c-lang-defconst end-of-defun-function
1563 "Function to which end-of-defun-function will be set."
1564 t 'c-end-of-defun
1565 awk 'c-awk-end-of-defun)
1566(c-lang-setvar end-of-defun-function (c-lang-const end-of-defun-function))
1567\f
d9e94c22
MS
1568;;; In-comment text handling.
1569
1570(c-lang-defconst c-paragraph-start
1571 "Regexp to append to `paragraph-start'."
1572 t "$"
1573 java "\\(@[a-zA-Z]+\\>\\|$\\)" ; For Javadoc.
1574 pike "\\(@[a-zA-Z_-]+\\>\\([^{]\\|$\\)\\|$\\)") ; For Pike refdoc.
1575(c-lang-defvar c-paragraph-start (c-lang-const c-paragraph-start))
1576
1577(c-lang-defconst c-paragraph-separate
1578 "Regexp to append to `paragraph-separate'."
1579 t "$"
1580 pike (c-lang-const c-paragraph-start))
1581(c-lang-defvar c-paragraph-separate (c-lang-const c-paragraph-separate))
1582
1583\f
1584;;; Keyword lists.
1585
1586;; Note: All language constants containing keyword lists, and only
1587;; those, should end with "-kwds"; they're automatically collected into the
1588;; `c-kwds-lang-consts' list below and used to build `c-keywords' etc.
1589
a66cd3ee 1590(c-lang-defconst c-primitive-type-kwds
d9e94c22
MS
1591 "Primitive type keywords. As opposed to the other keyword lists, the
1592keywords listed here are fontified with the type face instead of the
1593keyword face.
1594
1595If any of these also are on `c-type-list-kwds', `c-ref-list-kwds',
1596`c-colon-type-list-kwds', `c-paren-nontype-kwds', `c-paren-type-kwds',
1597`c-<>-type-kwds', or `c-<>-arglist-kwds' then the associated clauses
1598will be handled.
1599
1600Do not try to modify this list for end user customizations; the
1601`*-font-lock-extra-types' variable, where `*' is the mode prefix, is
1602the appropriate place for that."
1603 t '("char" "double" "float" "int" "long" "short" "signed"
1604 "unsigned" "void")
1605 c (append
1606 '("_Bool" "_Complex" "_Imaginary") ; Conditionally defined in C99.
1607 (c-lang-const c-primitive-type-kwds))
1608 c++ (append
1609 '("bool" "wchar_t")
1610 (c-lang-const c-primitive-type-kwds))
1611 ;; Objective-C extends C, but probably not the new stuff in C99.
1612 objc (append
1613 '("id" "Class" "SEL" "IMP" "BOOL")
1614 (c-lang-const c-primitive-type-kwds))
a66cd3ee 1615 java '("boolean" "byte" "char" "double" "float" "int" "long" "short" "void")
d9e94c22
MS
1616 idl '("Object" "ValueBase" "any" "boolean" "char" "double" "fixed" "float"
1617 "long" "octet" "sequence" "short" "string" "void" "wchar" "wstring"
1618 ;; In CORBA PSDL:
1619 "ref"
1620 ;; The following can't really end a type, but we have to specify them
1621 ;; here due to the assumption in `c-primitive-type-prefix-kwds'. It
1622 ;; doesn't matter that much.
1623 "unsigned" "strong")
1624 pike '(;; this_program isn't really a keyword, but it's practically
1625 ;; used as a builtin type.
1626 "array" "float" "function" "int" "mapping" "mixed" "multiset"
1627 "object" "program" "string" "this_program" "void"))
1628
1629(c-lang-defconst c-primitive-type-key
1630 ;; An adorned regexp that matches `c-primitive-type-kwds'.
1631 t (c-make-keywords-re t (c-lang-const c-primitive-type-kwds)))
1632(c-lang-defvar c-primitive-type-key (c-lang-const c-primitive-type-key))
1633
1634(c-lang-defconst c-primitive-type-prefix-kwds
1635 "Keywords that might act as prefixes for primitive types. Assumed to
1636be a subset of `c-primitive-type-kwds'."
1637 t nil
1638 (c c++) '("long" "short" "signed" "unsigned")
1639 idl '("long" "unsigned"
1640 ;; In CORBA PSDL:
1641 "strong"))
1642
e15f8aaa
AM
1643(c-lang-defconst c-typedef-kwds
1644 "Prefix keyword\(s\) like \"typedef\" which make a type declaration out
1645of a variable declaration."
1646 t '("typedef")
1647 (awk idl java) nil)
1648
1649(c-lang-defconst c-typedef-key
1650 ;; Adorned regexp matching `c-typedef-kwds'.
1651 t (c-make-keywords-re t (c-lang-const c-typedef-kwds)))
1652(c-lang-defvar c-typedef-key (c-lang-const c-typedef-key))
1653
d9e94c22
MS
1654(c-lang-defconst c-type-prefix-kwds
1655 "Keywords where the following name - if any - is a type name, and
1656where the keyword together with the symbol works as a type in
1657declarations.
1658
1659Note that an alternative if the second part doesn't hold is
1660`c-type-list-kwds'. Keywords on this list are typically also present
1661on one of the `*-decl-kwds' lists."
1662 t nil
1663 c '("struct" "union" "enum")
1664 c++ (append '("class" "typename")
1665 (c-lang-const c-type-prefix-kwds c)))
1666
1667(c-lang-defconst c-type-prefix-key
1668 ;; Adorned regexp matching `c-type-prefix-kwds'.
1669 t (c-make-keywords-re t (c-lang-const c-type-prefix-kwds)))
1670(c-lang-defvar c-type-prefix-key (c-lang-const c-type-prefix-key))
1671
1672(c-lang-defconst c-type-modifier-kwds
1673 "Type modifier keywords. These can occur almost anywhere in types
1674but they don't build a type of themselves. Unlike the keywords on
1675`c-primitive-type-kwds', they are fontified with the keyword face and
1676not the type face."
1677 t nil
1678 c '("const" "restrict" "volatile")
1679 c++ '("const" "volatile" "throw")
1680 objc '("const" "volatile"))
1681
1682(c-lang-defconst c-opt-type-modifier-key
1683 ;; Adorned regexp matching `c-type-modifier-kwds', or nil in
1684 ;; languages without such keywords.
1685 t (and (c-lang-const c-type-modifier-kwds)
1686 (c-make-keywords-re t (c-lang-const c-type-modifier-kwds))))
1687(c-lang-defvar c-opt-type-modifier-key (c-lang-const c-opt-type-modifier-key))
1688
1689(c-lang-defconst c-opt-type-component-key
1690 ;; An adorned regexp that matches `c-primitive-type-prefix-kwds' and
1691 ;; `c-type-modifier-kwds', or nil in languages without any of them.
1692 t (and (or (c-lang-const c-primitive-type-prefix-kwds)
1693 (c-lang-const c-type-modifier-kwds))
1694 (c-make-keywords-re t
1695 (append (c-lang-const c-primitive-type-prefix-kwds)
1696 (c-lang-const c-type-modifier-kwds)))))
1697(c-lang-defvar c-opt-type-component-key
1698 (c-lang-const c-opt-type-component-key))
1699
0386b551
AM
1700(c-lang-defconst c-type-start-kwds
1701 ;; All keywords that can start a type (i.e. are either a type prefix
1702 ;; or a complete type).
1703 t (delete-duplicates (append (c-lang-const c-primitive-type-kwds)
1704 (c-lang-const c-type-prefix-kwds)
1705 (c-lang-const c-type-modifier-kwds))
1706 :test 'string-equal))
1707
d9e94c22
MS
1708(c-lang-defconst c-class-decl-kwds
1709 "Keywords introducing declarations where the following block (if any)
1710contains another declaration level that should be considered a class.
1711
1712If any of these also are on `c-type-list-kwds', `c-ref-list-kwds',
1713`c-colon-type-list-kwds', `c-paren-nontype-kwds', `c-paren-type-kwds',
1714`c-<>-type-kwds', or `c-<>-arglist-kwds' then the associated clauses
1715will be handled.
1716
1717Note that presence on this list does not automatically treat the
1718following identifier as a type; the keyword must also be present on
1719`c-type-prefix-kwds' or `c-type-list-kwds' to accomplish that."
1720 t nil
1721 c '("struct" "union")
1722 c++ '("class" "struct" "union")
1723 objc '("struct" "union"
1724 "@interface" "@implementation" "@protocol")
452ea855 1725 java '("class" "@interface" "interface")
d9e94c22
MS
1726 idl '("component" "eventtype" "exception" "home" "interface" "struct"
1727 "union" "valuetype"
1728 ;; In CORBA PSDL:
1729 "storagehome" "storagetype"
1730 ;; In CORBA CIDL:
1731 "catalog" "executor" "manages" "segment")
a66cd3ee
MS
1732 pike '("class"))
1733
a66cd3ee 1734(c-lang-defconst c-class-key
d9e94c22
MS
1735 ;; Regexp matching the start of a class.
1736 t (c-make-keywords-re t (c-lang-const c-class-decl-kwds)))
1737(c-lang-defvar c-class-key (c-lang-const c-class-key))
1738
1739(c-lang-defconst c-brace-list-decl-kwds
1740 "Keywords introducing declarations where the following block (if
1741any) is a brace list.
1742
1743If any of these also are on `c-type-list-kwds', `c-ref-list-kwds',
1744`c-colon-type-list-kwds', `c-paren-nontype-kwds', `c-paren-type-kwds',
1745`c-<>-type-kwds', or `c-<>-arglist-kwds' then the associated clauses
1746will be handled."
1747 t '("enum")
452ea855 1748 (awk) nil)
d9e94c22
MS
1749
1750(c-lang-defconst c-brace-list-key
1751 ;; Regexp matching the start of declarations where the following
1752 ;; block is a brace list.
1753 t (c-make-keywords-re t (c-lang-const c-brace-list-decl-kwds)))
1754(c-lang-defvar c-brace-list-key (c-lang-const c-brace-list-key))
1755
1756(c-lang-defconst c-other-block-decl-kwds
3efc2cd7 1757 "Keywords where the following block (if any) contains another
0386b551
AM
1758declaration level that should not be considered a class. For every
1759keyword here, CC Mode will add a set of special syntactic symbols for
1760those blocks. E.g. if the keyword is \"foo\" then there will be
1761`foo-open', `foo-close', and `infoo' symbols.
1762
1763The intention is that this category should be used for block
1764constructs that aren't related to object orientation concepts like
1765classes (which thus also include e.g. interfaces, templates,
1766contracts, structs, etc). The more pragmatic distinction is that
1767while most want some indentation inside classes, it's fairly common
1768that they don't want it in some of these constructs, so it should be
1769simple to configure that differently from classes. See also
1770`c-class-decl-kwds'.
d9e94c22
MS
1771
1772If any of these also are on `c-type-list-kwds', `c-ref-list-kwds',
1773`c-colon-type-list-kwds', `c-paren-nontype-kwds', `c-paren-type-kwds',
1774`c-<>-type-kwds', or `c-<>-arglist-kwds' then the associated clauses
1775will be handled."
1776 t nil
0386b551 1777 (c objc) '("extern")
a66cd3ee 1778 c++ '("namespace" "extern")
d9e94c22
MS
1779 idl '("module"
1780 ;; In CORBA CIDL:
1781 "composition"))
a66cd3ee 1782
a66cd3ee 1783(c-lang-defconst c-other-decl-block-key
d9e94c22
MS
1784 ;; Regexp matching the start of blocks besides classes that contain
1785 ;; another declaration level.
1786 t (c-make-keywords-re t (c-lang-const c-other-block-decl-kwds)))
1787(c-lang-defvar c-other-decl-block-key (c-lang-const c-other-decl-block-key))
1788
c382ec40
AM
1789(c-lang-defvar c-other-decl-block-key-in-symbols-alist
1790 (mapcar
1791 (lambda (elt)
1792 (cons elt
1793 (if (string= elt "extern")
1794 'inextern-lang
1795 (intern (concat "in" elt)))))
1796 (c-lang-const c-other-block-decl-kwds))
1797 "Alist associating keywords in `c-other-block-decl-kwds' with
1798their matching \"in\" syntactic symbols.")
1799
d9e94c22 1800(c-lang-defconst c-typedef-decl-kwds
0386b551
AM
1801 "Keywords introducing declarations where the identifier(s) being
1802declared are types.
d9e94c22
MS
1803
1804If any of these also are on `c-type-list-kwds', `c-ref-list-kwds',
1805`c-colon-type-list-kwds', `c-paren-nontype-kwds', `c-paren-type-kwds',
1806`c-<>-type-kwds', or `c-<>-arglist-kwds' then the associated clauses
1807will be handled."
0386b551
AM
1808 ;; Default to `c-class-decl-kwds' and `c-brace-list-decl-kwds'
1809 ;; (since e.g. "Foo" is a type that's being defined in "class Foo
1810 ;; {...}").
1811 t (append (c-lang-const c-class-decl-kwds)
1812 (c-lang-const c-brace-list-decl-kwds))
1813 ;; Languages that have a "typedef" construct.
1814 (c c++ objc idl pike) (append (c-lang-const c-typedef-decl-kwds)
1815 '("typedef"))
1816 ;; Unlike most other languages, exception names are not handled as
1817 ;; types in IDL since they only can occur in "raises" specs.
1818 idl (delete "exception" (append (c-lang-const c-typedef-decl-kwds) nil)))
d9e94c22 1819
e15f8aaa
AM
1820(c-lang-defconst c-typedef-decl-key
  ;; Adorned regexp matching `c-typedef-decl-kwds'.
1821 t (c-make-keywords-re t (c-lang-const c-typedef-decl-kwds)))
1822(c-lang-defvar c-typedef-decl-key (c-lang-const c-typedef-decl-key))
1823
d9e94c22 1824(c-lang-defconst c-typeless-decl-kwds
0386b551
AM
1825 "Keywords introducing declarations where the \(first) identifier
1826\(declarator) follows directly after the keyword, without any type.
d9e94c22
MS
1827
1828If any of these also are on `c-type-list-kwds', `c-ref-list-kwds',
1829`c-colon-type-list-kwds', `c-paren-nontype-kwds', `c-paren-type-kwds',
1830`c-<>-type-kwds', or `c-<>-arglist-kwds' then the associated clauses
1831will be handled."
0386b551
AM
1832 ;; Default to `c-class-decl-kwds' and `c-brace-list-decl-kwds'
1833 ;; (since e.g. "Foo" is the identifier being defined in "class Foo
1834 ;; {...}").
1835 t (append (c-lang-const c-class-decl-kwds)
1836 (c-lang-const c-brace-list-decl-kwds))
1837 ;; Note: "manages" for CORBA CIDL clashes with its presence on
1838 ;; `c-type-list-kwds' for IDL.
1839 idl (append (c-lang-const c-typeless-decl-kwds)
1840 '("factory" "finder" "native"
1841 ;; In CORBA PSDL:
1842 "key" "stores"
1843 ;; In CORBA CIDL:
1844 "facet"))
1845 pike (append (c-lang-const c-class-decl-kwds)
1846 '("constant")))
d9e94c22
MS
1847
1848(c-lang-defconst c-modifier-kwds
1849 "Keywords that can prefix normal declarations of identifiers
0386b551 1850\(and typically act as flags). Things like argument declarations
d9e94c22
MS
1851inside function headers are also considered declarations in this
1852sense.
1853
1854If any of these also are on `c-type-list-kwds', `c-ref-list-kwds',
1855`c-colon-type-list-kwds', `c-paren-nontype-kwds', `c-paren-type-kwds',
1856`c-<>-type-kwds', or `c-<>-arglist-kwds' then the associated clauses
1857will be handled."
1858 t nil
1859 (c c++) '("auto" "extern" "inline" "register" "static")
1860 c++ (append '("explicit" "friend" "mutable" "template" "using" "virtual")
1861 (c-lang-const c-modifier-kwds))
1862 objc '("auto" "bycopy" "byref" "extern" "in" "inout" "oneway" "out" "static")
1863 ;; FIXME: Some of those below ought to be on `c-other-decl-kwds' instead.
1864 idl '("abstract" "attribute" "const" "consumes" "custom" "emits" "import"
1865 "in" "inout" "local" "multiple" "oneway" "out" "private" "provides"
1866 "public" "publishes" "readonly" "typeid" "typeprefix" "uses"
1867 ;; In CORBA PSDL:
1868 "primary" "state"
1869 ;; In CORBA CIDL:
1870 "bindsTo" "delegatesTo" "implements" "proxy" "storedOn")
1871 ;; Note: "const" is not used in Java, but it's still a reserved keyword.
1872 java '("abstract" "const" "final" "native" "private" "protected" "public"
e3715033 1873 "static" "strictfp" "synchronized" "transient" "volatile")
d9e94c22
MS
1874 pike '("final" "inline" "local" "nomask" "optional" "private" "protected"
1875 "public" "static" "variant"))
a66cd3ee 1876
d9e94c22
MS
1877(c-lang-defconst c-other-decl-kwds
1878 "Keywords that can start or prefix any declaration level construct,
1879besides those on `c-class-decl-kwds', `c-brace-list-decl-kwds',
1880`c-other-block-decl-kwds', `c-typedef-decl-kwds',
0386b551 1881`c-typeless-decl-kwds' and `c-modifier-kwds'.
d9e94c22
MS
1882
1883If any of these also are on `c-type-list-kwds', `c-ref-list-kwds',
1884`c-colon-type-list-kwds', `c-paren-nontype-kwds', `c-paren-type-kwds',
1885`c-<>-type-kwds', or `c-<>-arglist-kwds' then the associated clauses
1886will be handled."
1887 t nil
d9e94c22
MS
1888 objc '("@class" "@end" "@defs")
1889 java '("import" "package")
1890 pike '("import" "inherit"))
1891
0386b551
AM
1892(c-lang-defconst c-decl-start-kwds
1893 "Keywords that always start declarations, wherever they occur.
1894This can be used for declarations that aren't recognized by the normal
1895combination of `c-decl-prefix-re' and `c-decl-start-re'."
1896 t nil
1897 ;; Classes can be declared anywhere in a Pike expression.
1898 pike '("class"))
1899
1900(c-lang-defconst c-decl-hangon-kwds
1901 "Keywords that can occur anywhere in a declaration level construct.
1902This is used for self-contained things that can be tacked on anywhere
1903on a declaration and that should be ignored to be able to recognize it
1904correctly. Typical cases are compiler extensions like
1905\"__attribute__\" or \"__declspec\":
1906
1907 __declspec(noreturn) void foo();
1908 class __declspec(dllexport) classname {...};
1909 void foo() __attribute__((noreturn));
1910
1911Note that unrecognized plain symbols are skipped anyway if they occur
1912before the type, so such things are not necessary to mention here.
1913Mentioning them here is necessary only if they can occur in other
1914places, or if they are followed by a construct that must be skipped
1915over \(like the parens in the \"__attribute__\" and \"__declspec\"
1916examples above). In the last case, they also need to be present on
1917one of `c-type-list-kwds', `c-ref-list-kwds',
1918`c-colon-type-list-kwds', `c-paren-nontype-kwds', `c-paren-type-kwds',
1919`c-<>-type-kwds', or `c-<>-arglist-kwds'."
1920 ;; NB: These are currently not recognized in all parts of a
1921 ;; declaration. Specifically, they aren't recognized in the middle
1922 ;; of multi-token types, inside declarators, and between the
1923 ;; identifier and the arglist paren of a function declaration.
1924 ;;
1925 ;; FIXME: This ought to be user customizable since compiler stuff
1926 ;; like this usually is wrapped in project specific macros. (It'd
1927 ;; of course be even better if we could cope without knowing this.)
1928 t nil
1929 (c c++) '(;; GCC extension.
1930 "__attribute__"
1931 ;; MSVC extension.
1932 "__declspec"))
1933
1934(c-lang-defconst c-decl-hangon-key
1935 ;; Adorned regexp matching `c-decl-hangon-kwds'.
1936 t (c-make-keywords-re t (c-lang-const c-decl-hangon-kwds)))
1937(c-lang-defvar c-decl-hangon-key (c-lang-const c-decl-hangon-key))
1938
1939(c-lang-defconst c-prefix-spec-kwds
1940 ;; All keywords that can occur in the preamble of a declaration.
1941 ;; They typically occur before the type, but they are also matched
1942 ;; after presumptive types since we often can't be sure that
1943 ;; something is a type or just some sort of macro in front of the
1944 ;; declaration. They might be ambiguous with types or type
1945 ;; prefixes.
1946 t (delete-duplicates (append (c-lang-const c-class-decl-kwds)
1947 (c-lang-const c-brace-list-decl-kwds)
1948 (c-lang-const c-other-block-decl-kwds)
1949 (c-lang-const c-typedef-decl-kwds)
1950 (c-lang-const c-typeless-decl-kwds)
1951 (c-lang-const c-modifier-kwds)
1952 (c-lang-const c-other-decl-kwds)
1953 (c-lang-const c-decl-start-kwds)
1954 (c-lang-const c-decl-hangon-kwds))
1955 :test 'string-equal))
1956
1957(c-lang-defconst c-prefix-spec-kwds-re
1958 ;; Adorned regexp of `c-prefix-spec-kwds'.
e3715033 1959 t (c-make-keywords-re t (c-lang-const c-prefix-spec-kwds)))
452ea855 1960
0386b551
AM
1961(c-lang-defvar c-prefix-spec-kwds-re (c-lang-const c-prefix-spec-kwds-re))
1962
d9e94c22 1963(c-lang-defconst c-specifier-key
cc1cce14
AM
1964 ;; Adorned regexp of the keywords in `c-prefix-spec-kwds' that aren't
1965 ;; ambiguous with types or type prefixes. These are the keywords (like
1966 ;; extern, namespace, but NOT template) that can modify a declaration.
d9e94c22 1967 t (c-make-keywords-re t
0386b551 1968 (set-difference (c-lang-const c-prefix-spec-kwds)
cc1cce14
AM
1969 (append (c-lang-const c-type-start-kwds)
1970 (c-lang-const c-<>-arglist-kwds))
d9e94c22
MS
1971 :test 'string-equal)))
1972(c-lang-defvar c-specifier-key (c-lang-const c-specifier-key))
a66cd3ee 1973
0386b551
AM
1974(c-lang-defconst c-postfix-spec-kwds
1975 ;; Keywords that can occur after argument list of a function header
1976 ;; declaration, i.e. in the "K&R region".
1977 t (append (c-lang-const c-postfix-decl-spec-kwds)
1978 (c-lang-const c-decl-hangon-kwds)))
1979
1980(c-lang-defconst c-not-decl-init-keywords
1981 ;; Adorned regexp matching all keywords that can't appear at the
1982 ;; start of a declaration.
1983 t (c-make-keywords-re t
1984 (set-difference (c-lang-const c-keywords)
1985 (append (c-lang-const c-type-start-kwds)
1986 (c-lang-const c-prefix-spec-kwds))
1987 :test 'string-equal)))
1988(c-lang-defvar c-not-decl-init-keywords
1989 (c-lang-const c-not-decl-init-keywords))
1990
b248a85d
AM
1991(c-lang-defconst c-not-primitive-type-keywords
1992 "List of all keywords apart from primitive types (like \"int\")."
1993 t (set-difference (c-lang-const c-keywords)
1994 (c-lang-const c-primitive-type-kwds)
1995 :test 'string-equal)
1996 ;; The "more" for C++ is the QT keyword (as in "more slots:").
1997 ;; This variable is intended for use in c-beginning-of-statement-1.
1998 c++ (append (c-lang-const c-not-primitive-type-keywords) '("more")))
1999
2000(c-lang-defconst c-not-primitive-type-keywords-regexp
  ;; Adorned regexp matching `c-not-primitive-type-keywords'.
2001 t (c-make-keywords-re t
2002 (c-lang-const c-not-primitive-type-keywords)))
2003(c-lang-defvar c-not-primitive-type-keywords-regexp
2004 (c-lang-const c-not-primitive-type-keywords-regexp))
2005
d9e94c22 2006(c-lang-defconst c-protection-kwds
0386b551 2007 "Access protection label keywords in classes."
d9e94c22
MS
2008 t nil
2009 c++ '("private" "protected" "public")
2010 objc '("@private" "@protected" "@public"))
a66cd3ee 2011
d9e94c22
MS
2012(c-lang-defconst c-block-decls-with-vars
2013 "Keywords introducing declarations that can contain a block which
2014might be followed by variable declarations, e.g. like \"foo\" in
2015\"class Foo { ... } foo;\". So if there is a block in a declaration
2016like that, it ends with the following ';' and not right away.
130c507e 2017
d9e94c22
MS
2018The keywords on this list are assumed to also be present on one of the
2019`*-decl-kwds' lists."
2020 t nil
2021 (c objc) '("struct" "union" "enum" "typedef")
2022 c++ '("class" "struct" "union" "enum" "typedef"))
2023
2024(c-lang-defconst c-opt-block-decls-with-vars-key
2025 ;; Regexp matching the `c-block-decls-with-vars' keywords, or nil in
2026 ;; languages without such constructs.
2027 t (and (c-lang-const c-block-decls-with-vars)
2028 (c-make-keywords-re t (c-lang-const c-block-decls-with-vars))))
2029(c-lang-defvar c-opt-block-decls-with-vars-key
2030 (c-lang-const c-opt-block-decls-with-vars-key))
2031
2032(c-lang-defconst c-postfix-decl-spec-kwds
2033 "Keywords introducing extra declaration specifiers in the region
2034between the header and the body \(i.e. the \"K&R-region\") in
2035declarations."
2036 t nil
d9e94c22
MS
2037 java '("extends" "implements" "throws")
2038 idl '("context" "getraises" "manages" "primarykey" "raises" "setraises"
2039 "supports"
2040 ;; In CORBA PSDL:
2041 "as" "const" "implements" "of" "ref"))
2042
38de11bd
AM
2043(c-lang-defconst c-postfix-decl-spec-key
2044 ;; Regexp matching the keywords in `c-postfix-decl-spec-kwds'.
2045 t (c-make-keywords-re t (c-lang-const c-postfix-decl-spec-kwds)))
2046(c-lang-defvar c-postfix-decl-spec-key
2047 (c-lang-const c-postfix-decl-spec-key))
2048
d9e94c22
MS
2049(c-lang-defconst c-nonsymbol-sexp-kwds
2050 "Keywords that may be followed by a nonsymbol sexp before whatever
2051construct it's part of continues."
2052 t nil
2053 (c c++ objc) '("extern"))
2054
2055(c-lang-defconst c-type-list-kwds
2056 "Keywords that may be followed by a comma separated list of type
2057identifiers, where each optionally can be prefixed by keywords. (Can
2058also be used for the special case when the list can contain only one
2059element.)
2060
2061Assumed to be mutually exclusive with `c-ref-list-kwds'. There's no
2062reason to put keywords on this list if they are on `c-type-prefix-kwds'.
2063There's also no reason to add keywords that prefix a normal
2064declaration consisting of a type followed by a declarator (list), so
2065the keywords on `c-modifier-kwds' should normally not be listed here
0386b551 2066either.
d9e94c22
MS
2067
2068Note: Use `c-typeless-decl-kwds' for keywords followed by a function
2069or variable identifier (that's being defined)."
0386b551 2070 t nil
fa14078b 2071 c++ '("operator")
0386b551 2072 objc '("@class")
452ea855 2073 java '("import" "new" "extends" "super" "implements" "throws")
0386b551
AM
2074 idl '("manages" "native" "primarykey" "supports"
2075 ;; In CORBA PSDL:
2076 "as" "implements" "of" "scope")
2077 pike '("inherit"))
d9e94c22
MS
2078
2079(c-lang-defconst c-ref-list-kwds
2080 "Keywords that may be followed by a comma separated list of
2081reference (i.e. namespace/scope/module) identifiers, where each
2082optionally can be prefixed by keywords. (Can also be used for the
2083special case when the list can contain only one element.) Assumed to
2084be mutually exclusive with `c-type-list-kwds'.
2085
2086Note: Use `c-typeless-decl-kwds' for keywords followed by a function
2087or variable identifier (that's being defined)."
2088 t nil
2089 c++ '("namespace")
2090 java '("package")
2091 idl '("import" "module"
2092 ;; In CORBA CIDL:
2093 "composition")
2094 pike '("import"))
2095
2096(c-lang-defconst c-colon-type-list-kwds
2097 "Keywords that may be followed (not necessarily directly) by a colon
2098and then a comma separated list of type identifiers, where each
2099optionally can be prefixed by keywords. (Can also be used for the
2100special case when the list can contain only one element.)"
2101 t nil
2102 c++ '("class" "struct")
2103 idl '("component" "eventtype" "home" "interface" "valuetype"
2104 ;; In CORBA PSDL:
2105 "storagehome" "storagetype"))
2106
2107(c-lang-defconst c-colon-type-list-re
2108 "Regexp matched after the keywords in `c-colon-type-list-kwds' to skip
2109forward to the colon. The end of the match is assumed to be directly
0386b551
AM
2110after the colon, so the regexp should end with \":\". Must be a
2111regexp if `c-colon-type-list-kwds' isn't nil."
d9e94c22
MS
2112 t (if (c-lang-const c-colon-type-list-kwds)
2113 ;; Disallow various common punctuation chars that can't come
2114 ;; before the ":" that starts the inherit list after "class"
2115 ;; or "struct" in C++. (Also used as default for other
2116 ;; languages.)
2117 "[^\]\[{}();,/#=:]*:"))
2118(c-lang-defvar c-colon-type-list-re (c-lang-const c-colon-type-list-re))
2119
2120(c-lang-defconst c-paren-nontype-kwds
2121 "Keywords that may be followed by a parenthesis expression that doesn't
2122contain type identifiers."
2123 t nil
0386b551
AM
2124 (c c++) '(;; GCC extension.
2125 "__attribute__"
2126 ;; MSVC extension.
2127 "__declspec"))
d9e94c22
MS
2128
2129(c-lang-defconst c-paren-type-kwds
2130 "Keywords that may be followed by a parenthesis expression containing
2131type identifiers separated by arbitrary tokens."
2132 t nil
2133 c++ '("throw")
2134 objc '("@defs")
2135 idl '("switch")
2136 pike '("array" "function" "int" "mapping" "multiset" "object" "program"))
2137
2138(c-lang-defconst c-paren-any-kwds
  ;; All keywords that may be followed by a parenthesis expression,
  ;; i.e. the union of `c-paren-nontype-kwds' and `c-paren-type-kwds'
  ;; with duplicates removed.
2139 t (delete-duplicates (append (c-lang-const c-paren-nontype-kwds)
2140 (c-lang-const c-paren-type-kwds))
2141 :test 'string-equal))
2142
2143(c-lang-defconst c-<>-type-kwds
2144 "Keywords that may be followed by an angle bracket expression
2145containing type identifiers separated by \",\". The difference from
2146`c-<>-arglist-kwds' is that unknown names are taken to be types and
2147not other identifiers. `c-recognize-<>-arglists' is assumed to be set
2148if this isn't nil."
2149 t nil
2150 objc '("id")
2151 idl '("sequence"
2152 ;; In CORBA PSDL:
2153 "ref"))
2154
2155(c-lang-defconst c-<>-arglist-kwds
2156 "Keywords that can be followed by a C++ style template arglist; see
2157`c-recognize-<>-arglists' for details. That language constant is
2158assumed to be set if this isn't nil."
2159 t nil
2160 c++ '("template")
2161 idl '("fixed" "string" "wstring"))
2162
2163(c-lang-defconst c-<>-sexp-kwds
2164 ;; All keywords that can be followed by an angle bracket sexp.
2165 t (delete-duplicates (append (c-lang-const c-<>-type-kwds)
2166 (c-lang-const c-<>-arglist-kwds))
2167 :test 'string-equal))
2168
2169(c-lang-defconst c-opt-<>-sexp-key
2170 ;; Adorned regexp matching keywords that can be followed by an angle
846f5040 2171 ;; bracket sexp. Always set when `c-recognize-<>-arglists' is.
869455d4 2172 t (c-make-keywords-re t (c-lang-const c-<>-sexp-kwds)))
d9e94c22
MS
2173(c-lang-defvar c-opt-<>-sexp-key (c-lang-const c-opt-<>-sexp-key))
2174
2175(c-lang-defconst c-brace-id-list-kwds
2176 "Keywords that may be followed by a brace block containing a comma
2177separated list of identifier definitions, i.e. like the list of
2178identifiers that follows the type in a normal declaration."
2179 t (c-lang-const c-brace-list-decl-kwds))
a66cd3ee 2180
a66cd3ee 2181(c-lang-defconst c-block-stmt-1-kwds
d9e94c22
MS
2182 "Statement keywords followed directly by a substatement."
2183 t '("do" "else")
2184 c++ '("do" "else" "try")
9555a4cf 2185 objc '("do" "else" "@finally" "@try")
d9e94c22
MS
2186 java '("do" "else" "finally" "try")
2187 idl nil)
a66cd3ee 2188
a66cd3ee 2189(c-lang-defconst c-block-stmt-1-key
d9e94c22
MS
2190 ;; Regexp matching the start of any statement followed directly by a
2191 ;; substatement (doesn't match a bare block, however).
2192 t (c-make-keywords-re t (c-lang-const c-block-stmt-1-kwds)))
2193(c-lang-defvar c-block-stmt-1-key (c-lang-const c-block-stmt-1-key))
a66cd3ee 2194
5ab78d3d
AM
2195(c-lang-defconst c-block-stmt-1-2-kwds
2196 "Statement keywords optionally followed by a paren sexp.
2197Keywords here should also be in `c-block-stmt-1-kwds'."
2198 t nil
2199 java '("try"))
2200
2201(c-lang-defconst c-block-stmt-1-2-key
2202 ;; Regexp matching the start of a statement which may be followed by a
2203 ;; paren sexp and will then be followed by a substatement.
2204 t (c-make-keywords-re t (c-lang-const c-block-stmt-1-2-kwds)))
2205(c-lang-defvar c-block-stmt-1-2-key (c-lang-const c-block-stmt-1-2-key))
2206
a66cd3ee 2207(c-lang-defconst c-block-stmt-2-kwds
d9e94c22
MS
2208 "Statement keywords followed by a paren sexp and then by a substatement."
2209 t '("for" "if" "switch" "while")
2210 c++ '("for" "if" "switch" "while" "catch")
9555a4cf 2211 objc '("for" "if" "switch" "while" "@catch" "@synchronized")
a66cd3ee 2212 java '("for" "if" "switch" "while" "catch" "synchronized")
d9e94c22
MS
2213 idl nil
2214 pike '("for" "if" "switch" "while" "foreach")
2215 awk '("for" "if" "while"))
a66cd3ee 2216
a66cd3ee 2217(c-lang-defconst c-block-stmt-2-key
d9e94c22
MS
2218 ;; Regexp matching the start of any statement followed by a paren sexp
2219 ;; and then by a substatement.
2220 t (c-make-keywords-re t (c-lang-const c-block-stmt-2-kwds)))
2221(c-lang-defvar c-block-stmt-2-key (c-lang-const c-block-stmt-2-key))
a66cd3ee 2222
0386b551
AM
2223(c-lang-defconst c-block-stmt-kwds
2224 ;; Union of `c-block-stmt-1-kwds' and `c-block-stmt-2-kwds'.
2225 t (delete-duplicates (append (c-lang-const c-block-stmt-1-kwds)
2226 (c-lang-const c-block-stmt-2-kwds))
2227 :test 'string-equal))
2228
(c-lang-defconst c-opt-block-stmt-key
  ;; Regexp matching the start of any statement that takes a
  ;; substatement (a bare block excepted).  Nil in languages where
  ;; both `c-block-stmt-1-kwds' and `c-block-stmt-2-kwds' are empty.
  t (let ((block-stmt-kwds (append (c-lang-const c-block-stmt-1-kwds)
                                   (c-lang-const c-block-stmt-2-kwds))))
      ;; The appended list is empty exactly when both inputs are.
      (when block-stmt-kwds
        (c-make-keywords-re t block-stmt-kwds))))
(c-lang-defvar c-opt-block-stmt-key (c-lang-const c-opt-block-stmt-key))
2239
a66cd3ee 2240(c-lang-defconst c-simple-stmt-kwds
d9e94c22
MS
2241 "Statement keywords followed by an expression or nothing."
2242 t '("break" "continue" "goto" "return")
9555a4cf 2243 objc '("break" "continue" "goto" "return" "@throw")
a66cd3ee
MS
2244 ;; Note: `goto' is not valid in Java, but the keyword is still reserved.
2245 java '("break" "continue" "goto" "return" "throw")
d9e94c22
MS
2246 idl nil
2247 pike '("break" "continue" "return")
2248 awk '(;; Not sure about "delete", "exit", "getline", etc. ; ACM 2002/5/30
2249 "break" "continue" "return" "delete" "exit" "getline" "next"
2250 "nextfile" "print" "printf"))
2251
2252(c-lang-defconst c-simple-stmt-key
2253 ;; Adorned regexp matching `c-simple-stmt-kwds'.
2254 t (c-make-keywords-re t (c-lang-const c-simple-stmt-kwds)))
2255(c-lang-defvar c-simple-stmt-key (c-lang-const c-simple-stmt-key))
2256
2257(c-lang-defconst c-paren-stmt-kwds
2258 "Statement keywords followed by a parenthesis expression that
2259nevertheless contains a list separated with ';' and not ','."
2260 t '("for")
2261 idl nil)
2262
2263(c-lang-defconst c-paren-stmt-key
2264 ;; Adorned regexp matching `c-paren-stmt-kwds'.
2265 t (c-make-keywords-re t (c-lang-const c-paren-stmt-kwds)))
2266(c-lang-defvar c-paren-stmt-key (c-lang-const c-paren-stmt-key))
a66cd3ee 2267
a66cd3ee 2268(c-lang-defconst c-asm-stmt-kwds
d9e94c22
MS
2269 "Statement keywords followed by an assembler expression."
2270 t nil
2271 (c c++) '("asm" "__asm__")) ;; Not standard, but common.
a66cd3ee 2272
a66cd3ee 2273(c-lang-defconst c-opt-asm-stmt-key
d9e94c22
MS
2274 ;; Regexp matching the start of an assembler statement. Nil in
2275 ;; languages that don't support that.
2276 t (if (c-lang-const c-asm-stmt-kwds)
2277 (c-make-keywords-re t (c-lang-const c-asm-stmt-kwds))))
2278(c-lang-defvar c-opt-asm-stmt-key (c-lang-const c-opt-asm-stmt-key))
2279
d28e7f28
AM
2280(c-lang-defconst c-case-kwds
2281 "The keyword\(s) which introduce a \"case\" like construct.
2282This construct is \"<keyword> <expression> :\"."
2283 t '("case")
2284 awk nil)
2285
2286(c-lang-defconst c-case-kwds-regexp
2287 ;; Adorned regexp matching any "case"-like keyword.
2288 t (c-make-keywords-re t (c-lang-const c-case-kwds)))
2289(c-lang-defvar c-case-kwds-regexp (c-lang-const c-case-kwds-regexp))
2290
d9e94c22 2291(c-lang-defconst c-label-kwds
0386b551 2292 "Keywords introducing colon terminated labels in blocks."
898169a2 2293 t '("case" "default"))
d9e94c22 2294
0386b551
AM
2295(c-lang-defconst c-label-kwds-regexp
2296 ;; Adorned regexp matching any keyword that introduces a label.
2297 t (c-make-keywords-re t (c-lang-const c-label-kwds)))
2298(c-lang-defvar c-label-kwds-regexp (c-lang-const c-label-kwds-regexp))
2299
d9e94c22
MS
2300(c-lang-defconst c-before-label-kwds
2301 "Keywords that might be followed by a label identifier."
2302 t '("goto")
2303 (java pike) (append '("break" "continue")
2304 (c-lang-const c-before-label-kwds))
2305 idl nil
2306 awk nil)
130c507e 2307
d9e94c22
MS
2308(c-lang-defconst c-constant-kwds
2309 "Keywords for constants."
2310 t nil
2311 (c c++) '("NULL" ;; Not a keyword, but practically works as one.
2312 "false" "true") ; Defined in C99.
f0e4b2f2 2313 objc '("nil" "Nil" "YES" "NO" "NS_DURING" "NS_HANDLER" "NS_ENDHANDLER")
d9e94c22 2314 idl '("TRUE" "FALSE")
fbd4de65 2315 java '("true" "false" "null") ; technically "literals", not keywords
d9e94c22
MS
2316 pike '("UNDEFINED")) ;; Not a keyword, but practically works as one.
2317
2318(c-lang-defconst c-primary-expr-kwds
2319 "Keywords besides constants and operators that start primary expressions."
2320 t nil
2321 c++ '("operator" "this")
2322 objc '("super" "self")
2323 java '("this")
2324 pike '("this")) ;; Not really a keyword, but practically works as one.
130c507e 2325
(c-lang-defconst c-expr-kwds
  ;; Keywords that can occur anywhere in expressions: the entries of
  ;; `c-primary-expr-kwds' plus every operator in `c-operator-list'
  ;; that consists solely of word and symbol constituent characters.
  t (let ((keyword-ops (c-filter-ops (c-lang-const c-operator-list)
                                     t
                                     "\\`\\(\\w\\|\\s_\\)+\\'")))
      (delete-duplicates (append (c-lang-const c-primary-expr-kwds)
                                 keyword-ops)
                         :test 'string-equal)))
2335
2336(c-lang-defconst c-lambda-kwds
2337 "Keywords that start lambda constructs, i.e. function definitions in
2338expressions."
2339 t nil
2340 pike '("lambda"))
a66cd3ee 2341
d9e94c22
MS
2342(c-lang-defconst c-inexpr-block-kwds
2343 "Keywords that start constructs followed by statement blocks which can
2344be used in expressions \(the gcc extension for this in C and C++ is
0386b551 2345handled separately by `c-recognize-paren-inexpr-blocks')."
d9e94c22
MS
2346 t nil
2347 pike '("catch" "gauge"))
a66cd3ee 2348
a66cd3ee 2349(c-lang-defconst c-inexpr-class-kwds
d9e94c22
MS
2350 "Keywords that can start classes inside expressions."
2351 t nil
a66cd3ee
MS
2352 java '("new")
2353 pike '("class"))
2354
d9e94c22
MS
2355(c-lang-defconst c-inexpr-brace-list-kwds
2356 "Keywords that can start brace list blocks inside expressions.
2357Note that Java specific rules are currently applied to tell this from
2358`c-inexpr-class-kwds'."
2359 t nil
2360 java '("new"))
2361
2362(c-lang-defconst c-opt-inexpr-brace-list-key
2363 ;; Regexp matching the start of a brace list in an expression, or
2364 ;; nil in languages that don't have such things. This should not
2365 ;; match brace lists recognized through `c-special-brace-lists'.
2366 t (and (c-lang-const c-inexpr-brace-list-kwds)
2367 (c-make-keywords-re t (c-lang-const c-inexpr-brace-list-kwds))))
2368(c-lang-defvar c-opt-inexpr-brace-list-key
2369 (c-lang-const c-opt-inexpr-brace-list-key))
a66cd3ee 2370
(c-lang-defconst c-decl-block-key
  ;; Regexp matching the keywords of constructs that open another
  ;; declaration level, i.e. whose brace block is neither a function
  ;; body nor a brace list.  If the first submatch matches, the
  ;; construct is unambiguous; otherwise the keyword is also present
  ;; in `c-type-start-kwds' and the match might equally well be the
  ;; return type of a function declaration.
  t (let* ((type-start-kwds (c-lang-const c-type-start-kwds))
           (decl-kwds (append (c-lang-const c-class-decl-kwds)
                              (c-lang-const c-other-block-decl-kwds)
                              (c-lang-const c-inexpr-class-kwds)))
           (unambiguous-re
            (c-make-keywords-re t
              (set-difference decl-kwds type-start-kwds
                              :test 'string-equal)))
           (ambiguous (intersection decl-kwds type-start-kwds
                                    :test 'string-equal)))
      (if (null ambiguous)
          unambiguous-re
        ;; The unambiguous alternative comes first so that its
        ;; adornment group is submatch 1.
        (concat unambiguous-re
                "\\|"
                (c-make-keywords-re t ambiguous)))))
(c-lang-defvar c-decl-block-key (c-lang-const c-decl-block-key))
2392
a66cd3ee 2393(c-lang-defconst c-bitfield-kwds
d9e94c22
MS
2394 "Keywords that can introduce bitfields."
2395 t nil
2396 (c c++ objc) '("char" "int" "long" "signed" "unsigned"))
a66cd3ee 2397
a66cd3ee 2398(c-lang-defconst c-opt-bitfield-key
d9e94c22
MS
2399 ;; Regexp matching the start of a bitfield (not uniquely), or nil in
2400 ;; languages without bitfield support.
2401 t nil
2402 (c c++) (c-make-keywords-re t (c-lang-const c-bitfield-kwds)))
2403(c-lang-defvar c-opt-bitfield-key (c-lang-const c-opt-bitfield-key))
2404
2405(c-lang-defconst c-other-kwds
2406 "Keywords not accounted for by any other `*-kwds' language constant."
2407 t nil
2408 idl '("truncatable"
2409 ;; In CORBA CIDL: (These are declaration keywords that never
2410 ;; can start a declaration.)
2411 "entity" "process" "service" "session" "storage"))
2412
2413\f
2414;;; Constants built from keywords.
2415
2416;; Note: No `*-kwds' language constants may be defined below this point.
2417
(eval-and-compile
  (defconst c-kwds-lang-consts
    ;; The names of all language constants holding keyword lists,
    ;; i.e. every bound symbol in `c-lang-constants' whose name ends
    ;; in "-kwds".
    (let (kwds-consts)
      (mapatoms (lambda (sym)
                  (if (and (boundp sym)
                           (string-match "-kwds\\'" (symbol-name sym)))
                      ;; Collect the globally interned symbol of the
                      ;; same name rather than the one interned in
                      ;; `c-lang-constants'.
                      (setq kwds-consts
                            (cons (intern (symbol-name sym)) kwds-consts))))
                c-lang-constants)
      kwds-consts)))
a66cd3ee 2430
a66cd3ee 2431(c-lang-defconst c-keywords
d9e94c22
MS
2432 ;; All keywords as a list.
2433 t (delete-duplicates
2434 (c-lang-defconst-eval-immediately
2435 `(append ,@(mapcar (lambda (kwds-lang-const)
2436 `(c-lang-const ,kwds-lang-const))
2437 c-kwds-lang-consts)
2438 nil))
2439 :test 'string-equal))
2440
a66cd3ee 2441(c-lang-defconst c-keywords-regexp
d9e94c22
MS
2442 ;; All keywords as an adorned regexp.
2443 t (c-make-keywords-re t (c-lang-const c-keywords)))
2444(c-lang-defvar c-keywords-regexp (c-lang-const c-keywords-regexp))
2445
(c-lang-defconst c-keyword-member-alist
  ;; An alist keyed on keyword strings.  The cdr of each element lists
  ;; the symbols of the `*-kwds' language constants whose value
  ;; contains that keyword.
  t (let ((kwd-list-alist
           (c-lang-defconst-eval-immediately
            `(list ,@(mapcar (lambda (kwds-lang-const)
                               `(cons ',kwds-lang-const
                                      (c-lang-const ,kwds-lang-const)))
                             c-kwds-lang-consts))))
          result-alist)
      (dolist (kwd-list-entry kwd-list-alist)
        (let ((lang-const (car kwd-list-entry)))
          (dolist (kwd (cdr kwd-list-entry))
            (let ((elem (assoc kwd result-alist)))
              ;; First sighting of this keyword: start a fresh entry.
              (unless elem
                (setq elem (list kwd)
                      result-alist (cons elem result-alist)))
              ;; Record the constant once per keyword.
              (unless (memq lang-const (cdr elem))
                (setcdr elem (cons lang-const (cdr elem))))))))
      result-alist))
2470
(c-lang-defvar c-keywords-obarray
  ;; An obarray containing all keywords as symbols.  The property list
  ;; of each symbol has a non-nil entry for the specific `*-kwds'
  ;; lists it's a member of.
  ;;
  ;; E.g. to see whether the string str contains a keyword on
  ;; `c-class-decl-kwds', one can do like this:
  ;;     (get (intern-soft str c-keywords-obarray) 'c-class-decl-kwds)
  ;; Which preferably is written using the associated functions in
  ;; cc-engine:
  ;;     (c-keyword-member (c-keyword-sym str) 'c-class-decl-kwds)

  ;; The obarray is not stored directly as a language constant since
  ;; the printed representation for obarrays used in .elc files isn't
  ;; complete.

  (let* ((alist (c-lang-const c-keyword-member-alist))
         kwd lang-const-list
         ;; The local is deliberately not called `obarray', so the
         ;; global special variable of that name isn't rebound while
         ;; the body runs.  The size is kept at least 1 since a
         ;; zero-length vector isn't accepted as an obarray.
         (kwds-obarray (make-vector (max 1 (* (length alist) 2)) 0)))
    (while alist
      (setq kwd (caar alist)
            lang-const-list (cdar alist)
            alist (cdr alist))
      ;; Build the plist (CONST1 t CONST2 t ...) for the keyword.
      (setplist (intern kwd kwds-obarray)
                ;; Emacs has an odd bug that causes `mapcan' to fail
                ;; with unintelligible errors.  (XEmacs works.)
                ;;(mapcan (lambda (lang-const)
                ;;            (list lang-const t))
                ;;          lang-const-list)
                (apply 'nconc (mapcar (lambda (lang-const)
                                        (list lang-const t))
                                      lang-const-list))))
    kwds-obarray))
2504
2505(c-lang-defconst c-regular-keywords-regexp
0386b551
AM
2506 ;; Adorned regexp matching all keywords that should be fontified
2507 ;; with the keywords face. I.e. that aren't types or constants.
d9e94c22
MS
2508 t (c-make-keywords-re t
2509 (set-difference (c-lang-const c-keywords)
2510 (append (c-lang-const c-primitive-type-kwds)
2511 (c-lang-const c-constant-kwds))
2512 :test 'string-equal)))
2513(c-lang-defvar c-regular-keywords-regexp
2514 (c-lang-const c-regular-keywords-regexp))
2515
d9e94c22
MS
(c-lang-defconst c-primary-expr-regexp
  ;; Regexp matching the start of any primary expression, i.e. any
  ;; literal, symbol, prefix operator, and '('.  It doesn't need to
  ;; exclude keywords; they are excluded afterwards unless the second
  ;; submatch matches.  If the first but not the second submatch
  ;; matches then it is an ambiguous primary expression; it could also
  ;; be a match of e.g. an infix operator.  (The case with ambiguous
  ;; keyword operators isn't handled.)

  t (let* ((prefix-ops
            (c-filter-ops (c-lang-const c-operators)
                          '(prefix)
                          (lambda (op)
                            ;; Filter out the special case prefix
                            ;; operators that are close parens.
                            (not (string-match "\\s)" op)))))

           ;; The prefix operators made up solely of punctuation and
           ;; paren syntax characters.
           (nonkeyword-prefix-ops
            (c-filter-ops prefix-ops
                          t
                          "\\`\\(\\s.\\|\\s(\\|\\s)\\)+\\'"))

           (in-or-postfix-ops
            (c-filter-ops (c-lang-const c-operators)
                          '(postfix
                            postfix-if-paren
                            left-assoc
                            right-assoc
                            right-assoc-sequence)
                          t))

           ;; Split the nonkeyword prefix operators on whether they
           ;; also occur as infix or postfix operators.
           (unambiguous-prefix-ops (set-difference nonkeyword-prefix-ops
                                                   in-or-postfix-ops
                                                   :test 'string-equal))
           (ambiguous-prefix-ops (intersection nonkeyword-prefix-ops
                                               in-or-postfix-ops
                                               :test 'string-equal)))

      (concat
       "\\("
       ;; Take out all symbol class operators from `prefix-ops' and make the
       ;; first submatch from them together with `c-primary-expr-kwds'.
       (c-make-keywords-re t
         (append (c-lang-const c-primary-expr-kwds)
                 (set-difference prefix-ops nonkeyword-prefix-ops
                                 :test 'string-equal)))

       "\\|"
       ;; Match all ambiguous operators.
       (c-make-keywords-re nil ambiguous-prefix-ops)
       "\\)"

       "\\|"
       ;; Now match all other symbols.
       (c-lang-const c-symbol-start)

       "\\|"
       ;; The chars that can start integer and floating point
       ;; constants.
       "\\.?[0-9]"

       "\\|"
       ;; The unambiguous operators from `prefix-ops'.
       (c-make-keywords-re nil unambiguous-prefix-ops)

       "\\|"
       ;; Match string and character literals.
       "\\s\""
       (if (memq 'gen-string-delim c-emacs-features)
           "\\|\\s|"
         ""))))
(c-lang-defvar c-primary-expr-regexp (c-lang-const c-primary-expr-regexp))
a66cd3ee 2592
d9e94c22
MS
2593\f
2594;;; Additional constants for parser-level constructs.
2595
ece15004
AM
2596(c-lang-defconst c-decl-start-colon-kwd-re
2597 "Regexp matching a keyword that is followed by a colon, where
2598 the whole construct can precede a declaration.
2599 E.g. \"public:\" in C++."
2600 t "\\<\\>"
2601 c++ (c-make-keywords-re t (c-lang-const c-protection-kwds)))
2602(c-lang-defvar c-decl-start-colon-kwd-re
2603 (c-lang-const c-decl-start-colon-kwd-re))
2604
d9e94c22 2605(c-lang-defconst c-decl-prefix-re
0386b551
AM
2606 "Regexp matching something that might precede a declaration, cast or
2607label, such as the last token of a preceding statement or declaration.
2608This is used in the common situation where a declaration or cast
2609doesn't start with any specific token that can be searched for.
2610
2611The regexp should not match bob; that is done implicitly. It can't
2612require a match longer than one token. The end of the token is taken
2613to be at the end of the first submatch, which is assumed to always
2614match. It's undefined whether identifier syntax (see
2615`c-identifier-syntax-table') is in effect or not. This regexp is
2616assumed to be a superset of `c-label-prefix-re' if
2617`c-recognize-colon-labels' is set.
2618
2619Besides this, `c-decl-start-kwds' is used to find declarations.
2620
2621Note: This variable together with `c-decl-start-re' and
2622`c-decl-start-kwds' is only used to detect \"likely\"
2623declaration/cast/label starts. I.e. they might produce more matches
2624but should not miss anything (or else it's necessary to use text
2625properties - see the next note). Wherever they match, the following
2626construct is analyzed to see if it indeed is a declaration, cast or
2627label. That analysis is not cheap, so it's important that not too
2628many false matches are triggered.
2629
2630Note: If a declaration/cast/label start can't be detected with this
2631variable, it's necessary to use the `c-type' text property with the
2632value `c-decl-end' on the last char of the last token preceding the
2633declaration. See the comment blurb at the start of cc-engine.el for
2634more info."
2635
d9e94c22
MS
2636 ;; We match a sequence of characters to skip over things like \"};\"
2637 ;; more quickly. We match ")" in C for K&R region declarations, and
2638 ;; in all languages except Java for when a cpp macro definition
2639 ;; begins with a declaration.
2640 t "\\([\{\}\(\);,]+\\)"
452ea855 2641 java "\\([\{\}\(;,<]+\\)"
d9e94c22
MS
2642 ;; Match "<" in C++ to get the first argument in a template arglist.
2643 ;; In that case there's an additional check in `c-find-decl-spots'
ece15004
AM
2644 ;; that it got open paren syntax. Match ":" to aid in picking up
2645 ;; "public:", etc. This involves additional checks in
2646 ;; `c-find-decl-prefix-search' to prevent a match of identifiers
2647 ;; or labels.
2648 c++ "\\([\{\}\(\);:,<]+\\)"
d9e94c22
MS
2649 ;; Additionally match the protection directives in Objective-C.
2650 ;; Note that this doesn't cope with the longer directives, which we
2651 ;; would have to match from start to end since they don't end with
2652 ;; any easily recognized characters.
2653 objc (concat "\\([\{\}\(\);,]+\\|"
2654 (c-make-keywords-re nil (c-lang-const c-protection-kwds))
2655 "\\)")
d9e94c22
MS
2656 ;; Pike is like C but we also match "[" for multiple value
2657 ;; assignments and type casts.
2658 pike "\\([\{\}\(\)\[;,]+\\)")
2659(c-lang-defvar c-decl-prefix-re (c-lang-const c-decl-prefix-re)
2660 'dont-doc)
2661
0386b551
AM
2662(c-lang-defconst c-decl-start-re
2663 "Regexp matching the start of any declaration, cast or label.
2664It's used on the token after the one `c-decl-prefix-re' matched. This
2665regexp should not try to match those constructs accurately as it's
2666only used as a sieve to avoid spending more time checking other
2667constructs."
2668 t (c-lang-const c-identifier-start))
2669(c-lang-defvar c-decl-start-re (c-lang-const c-decl-start-re))
2670
(c-lang-defconst c-decl-prefix-or-start-re
  ;; Regexp matching something that might precede or start a
  ;; declaration, cast or label.
  ;;
  ;; A match of the first submatch is taken as the end of a token that
  ;; might precede such a construct, e.g. ';', '}' or '{'.  That part
  ;; comes from `c-decl-prefix-re'.
  ;;
  ;; When the first submatch did not match, the match of the whole
  ;; regexp is taken to be at the first token in the declaration.
  ;; `c-decl-start-re' is not checked in this case.
  ;;
  ;; Design note: One regexp covers both the tokens preceding
  ;; declarations and the ones starting them, to avoid an extra regexp
  ;; search from the previous declaration spot in
  ;; `c-find-decl-spots'.  Users of `c-find-decl-spots' also count on
  ;; that it finds all declaration/cast/label starts in approximately
  ;; linear order, so the searches can't be done in two separate
  ;; passes.
  t (let ((prefix-re (c-lang-const c-decl-prefix-re))
          (start-kwds (c-lang-const c-decl-start-kwds)))
      (if (null start-kwds)
          prefix-re
        (concat prefix-re
                "\\|"
                (c-make-keywords-re t start-kwds)))))
(c-lang-defvar c-decl-prefix-or-start-re
  (c-lang-const c-decl-prefix-or-start-re)
  'dont-doc)
2697
d9e94c22
MS
2698(c-lang-defconst c-cast-parens
2699 ;; List containing the paren characters that can open a cast, or nil in
2700 ;; languages without casts.
0386b551
AM
2701 t (c-filter-ops (c-lang-const c-operators)
2702 '(prefix)
2703 "\\`\\s\(\\'"
2704 (lambda (op) (elt op 0))))
d9e94c22
MS
2705(c-lang-defvar c-cast-parens (c-lang-const c-cast-parens))
2706
0386b551
AM
2707(c-lang-defconst c-block-prefix-disallowed-chars
2708 "List of syntactically relevant characters that never can occur before
2709the open brace in any construct that contains a brace block, e.g. in
2710the \"class Foo: public Bar\" part of:
2711
2712 class Foo: public Bar {int x();} a, *b;
2713
2714If parens can occur, the chars inside those aren't filtered with this
2715list.
2716
2717'<' and '>' should be disallowed even if angle bracket arglists can
2718occur. That since the search function needs to stop at them anyway to
2719ensure they are given paren syntax.
2720
2721This is used to skip backward from the open brace to find the region
2722in which to look for a construct like \"class\", \"enum\",
2723\"namespace\" or whatever. That skipping should be as tight as
2724possible for good performance."
2725
2726 ;; Default to all chars that only occurs in nonsymbol tokens outside
2727 ;; identifiers.
2728 t (set-difference
2729 (c-lang-const c-nonsymbol-token-char-list)
2730 (c-filter-ops (append (c-lang-const c-identifier-ops)
2731 (list (cons nil
2732 (c-lang-const c-after-id-concat-ops))))
2733 t
2734 t
2735 (lambda (op)
2736 (let ((pos 0) res)
2737 (while (string-match "\\(\\s.\\|\\s(\\|\\s)\\)"
2738 op pos)
2739 (setq res (cons (aref op (match-beginning 1)) res)
2740 pos (match-end 0)))
2741 res))))
2742
e1dbe924 2743 ;; Allow cpp operations (where applicable).
0386b551
AM
2744 t (if (c-lang-const c-opt-cpp-prefix)
2745 (set-difference (c-lang-const c-block-prefix-disallowed-chars)
2746 '(?#))
2747 (c-lang-const c-block-prefix-disallowed-chars))
2748
2749 ;; Allow ':' for inherit list starters.
2750 (c++ objc idl) (set-difference (c-lang-const c-block-prefix-disallowed-chars)
2751 '(?:))
2752
2753 ;; Allow ',' for multiple inherits.
2754 (c++ java) (set-difference (c-lang-const c-block-prefix-disallowed-chars)
2755 '(?,))
2756
2757 ;; Allow parentheses for anonymous inner classes in Java and class
2758 ;; initializer lists in Pike.
2759 (java pike) (set-difference (c-lang-const c-block-prefix-disallowed-chars)
2760 '(?\( ?\)))
2761
2762 ;; Allow '"' for extern clauses (e.g. extern "C" {...}).
2763 (c c++ objc) (set-difference (c-lang-const c-block-prefix-disallowed-chars)
2764 '(?\" ?')))
2765
2766(c-lang-defconst c-block-prefix-charset
2767 ;; `c-block-prefix-disallowed-chars' as an inverted charset suitable
2768 ;; for `c-syntactic-skip-backward'.
2769 t (c-make-bare-char-alt (c-lang-const c-block-prefix-disallowed-chars) t))
2770(c-lang-defvar c-block-prefix-charset (c-lang-const c-block-prefix-charset))
2771
d9e94c22 2772(c-lang-defconst c-type-decl-prefix-key
0386b551
AM
2773 "Regexp matching the declarator operators that might precede the
2774identifier in a declaration, e.g. the \"*\" in \"char *argv\". This
2775regexp should match \"(\" if parentheses are valid in declarators.
2776The end of the first submatch is taken as the end of the operator.
2777Identifier syntax is in effect when this is matched \(see
2778`c-identifier-syntax-table')."
d9e94c22 2779 t (if (c-lang-const c-type-modifier-kwds)
0386b551 2780 (concat (regexp-opt (c-lang-const c-type-modifier-kwds) t) "\\>")
d9e94c22
MS
2781 ;; Default to a regexp that never matches.
2782 "\\<\\>")
0386b551
AM
2783 ;; Check that there's no "=" afterwards to avoid matching tokens
2784 ;; like "*=".
d9e94c22
MS
2785 (c objc) (concat "\\("
2786 "[*\(]"
2787 "\\|"
2788 (c-lang-const c-type-decl-prefix-key)
2789 "\\)"
2790 "\\([^=]\\|$\\)")
2791 c++ (concat "\\("
2792 "[*\(&]"
2793 "\\|"
7f0789c9
AM
2794 (c-lang-const c-type-decl-prefix-key)
2795 "\\|"
2796 (concat "\\(" ; 3
d9e94c22
MS
2797 ;; If this matches there's special treatment in
2798 ;; `c-font-lock-declarators' and
2799 ;; `c-font-lock-declarations' that check for a
2800 ;; complete name followed by ":: *".
2801 (c-lang-const c-identifier-start)
2802 "\\)")
d9e94c22
MS
2803 "\\)"
2804 "\\([^=]\\|$\\)")
0386b551 2805 pike "\\(\\*\\)\\([^=]\\|$\\)")
d9e94c22
MS
2806(c-lang-defvar c-type-decl-prefix-key (c-lang-const c-type-decl-prefix-key)
2807 'dont-doc)
2808
2809(c-lang-defconst c-type-decl-suffix-key
0386b551
AM
2810 "Regexp matching the declarator operators that might follow after the
2811identifier in a declaration, e.g. the \"[\" in \"char argv[]\". This
2812regexp should match \")\" if parentheses are valid in declarators. If
d9e94c22
MS
2813it matches an open paren of some kind, the type declaration check
2814continues at the corresponding close paren, otherwise the end of the
2815first submatch is taken as the end of the operator. Identifier syntax
2816is in effect when this is matched (see `c-identifier-syntax-table')."
2817 ;; Default to a regexp that matches `c-type-modifier-kwds' and a
2818 ;; function argument list parenthesis.
2819 t (if (c-lang-const c-type-modifier-kwds)
2820 (concat "\\(\(\\|"
0386b551 2821 (regexp-opt (c-lang-const c-type-modifier-kwds) t) "\\>"
d9e94c22
MS
2822 "\\)")
2823 "\\(\(\\)")
2824 (c c++ objc) (concat
2825 "\\("
2826 "[\)\[\(]"
0386b551
AM
2827 (if (c-lang-const c-type-modifier-kwds)
2828 (concat
2829 "\\|"
2830 ;; "throw" in `c-type-modifier-kwds' is followed
2831 ;; by a parenthesis list, but no extra measures
2832 ;; are necessary to handle that.
2833 (regexp-opt (c-lang-const c-type-modifier-kwds) t)
2834 "\\>")
2835 "")
d9e94c22 2836 "\\)")
e8dd0787
AM
2837 java "\\([\[\(\)]\\)"
2838 idl "\\([\[\(]\\)")
d9e94c22
MS
2839(c-lang-defvar c-type-decl-suffix-key (c-lang-const c-type-decl-suffix-key)
2840 'dont-doc)
2841
2842(c-lang-defconst c-after-suffixed-type-decl-key
0386b551 2843 "This regexp is matched after a declarator expression where
d9e94c22
MS
2844`c-type-decl-suffix-key' has matched. If it matches then the
2845construct is taken as a declaration. It's typically used to match the
2846beginning of a function body or whatever might occur after the
2847function header in a function declaration or definition. It's
2848undefined whether identifier syntax (see `c-identifier-syntax-table')
2849is in effect or not.
2850
2851Note that it's used in cases like after \"foo (bar)\" so it should
65e7ca35 2852only match when it's certain that it's a declaration, e.g., \"{\" but
d9e94c22
MS
2853not \",\" or \";\"."
2854 t "{"
2855 ;; If K&R style declarations should be recognized then one could
2856 ;; consider to match the start of any symbol since we want to match
2857 ;; the start of the first declaration in the "K&R region". That
2858 ;; could however produce false matches on code like "FOO(bar) x"
2859 ;; where FOO is a cpp macro, so it's better to leave it out and rely
2860 ;; on the other heuristics in that case.
0386b551
AM
2861 t (if (c-lang-const c-postfix-spec-kwds)
2862 ;; Add on the keywords in `c-postfix-spec-kwds'.
d9e94c22
MS
2863 (concat (c-lang-const c-after-suffixed-type-decl-key)
2864 "\\|"
0386b551 2865 (c-make-keywords-re t (c-lang-const c-postfix-spec-kwds)))
d9e94c22
MS
2866 (c-lang-const c-after-suffixed-type-decl-key))
2867 ;; Also match the colon that starts a base class initializer list in
2868 ;; C++. That can be confused with a function call before the colon
2869 ;; in a ? : operator, but we count on that `c-decl-prefix-re' won't
2870 ;; match before such a thing (as a declaration-level construct;
2871 ;; matches inside arglist contexts are already excluded).
2872 c++ "[{:]")
2873(c-lang-defvar c-after-suffixed-type-decl-key
2874 (c-lang-const c-after-suffixed-type-decl-key)
2875 'dont-doc)
2876
2877(c-lang-defconst c-after-suffixed-type-maybe-decl-key
2878 ;; Regexp that in addition to `c-after-suffixed-type-decl-key'
2879 ;; matches ";" and ",".
2880 t (concat "\\(" (c-lang-const c-after-suffixed-type-decl-key) "\\)"
2881 "\\|[;,]"))
2882(c-lang-defvar c-after-suffixed-type-maybe-decl-key
2883 (c-lang-const c-after-suffixed-type-maybe-decl-key))
2884
2885(c-lang-defconst c-opt-type-concat-key
2886 "Regexp matching operators that concatenate types, e.g. the \"|\" in
2887\"int|string\" in Pike. The end of the first submatch is taken as the
2888end of the operator. nil in languages without such operators. It's
2889undefined whether identifier syntax (see `c-identifier-syntax-table')
2890is in effect or not."
2891 t nil
2892 pike "\\([|.&]\\)\\($\\|[^|.&]\\)")
2893(c-lang-defvar c-opt-type-concat-key (c-lang-const c-opt-type-concat-key)
2894 'dont-doc)
2895
2896(c-lang-defconst c-opt-type-suffix-key
2897 "Regexp matching operators that might follow after a type, or nil in
2898languages that don't have such operators. The end of the first
2899submatch is taken as the end of the operator. This should not match
2900things like C++ template arglists if `c-recognize-<>-arglists' is set.
2901It's undefined whether identifier syntax (see `c-identifier-syntax-table')
2902is in effect or not."
2903 t nil
2904 (c c++ objc pike) "\\(\\.\\.\\.\\)"
452ea855 2905 java (concat "\\(\\[" (c-lang-const c-simple-ws) "*\\]\\|\\.\\.\\.\\)"))
d9e94c22
MS
2906(c-lang-defvar c-opt-type-suffix-key (c-lang-const c-opt-type-suffix-key))
2907
(c-lang-defvar c-known-type-key
  ;; Regexp matching the known type identifiers.  It is built from
  ;; `c-primitive-type-kwds' and the mode's `*-font-lock-extra-types'
  ;; variable (when that is bound).  The first submatch is the one
  ;; that matches the type.  Note that this regexp assumes that
  ;; symbol constituents like '_' and '$' have word syntax.
  (let ((extra-types
         (and (boundp (c-mode-symbol "font-lock-extra-types"))
              (c-mode-var "font-lock-extra-types")))
        regexp-strings plain-strings)
    ;; Entries containing regexp special characters are used as
    ;; regexps verbatim; the rest are merged with the primitive type
    ;; keywords into one optimized alternation.
    (dolist (extra-type extra-types)
      (if (string-match "[][.*+?^$\\]" extra-type)
          (setq regexp-strings (cons extra-type regexp-strings))
        (setq plain-strings (cons extra-type plain-strings))))
    ;; Restore the order the entries had in the extra types list.
    (setq regexp-strings (nreverse regexp-strings)
          plain-strings (nreverse plain-strings))
    (concat "\\<\\("
            (c-concat-separated
             (cons (c-make-keywords-re nil
                     (append (c-lang-const c-primitive-type-kwds)
                             plain-strings))
                   regexp-strings)
             "\\|")
            "\\)\\>")))
2937
2938(c-lang-defconst c-special-brace-lists
2939"List of open- and close-chars that makes up a pike-style brace list,
c38e0c97 2940i.e. for a ([ ]) list there should be a cons (?\\[ . ?\\]) in this
d9e94c22
MS
2941list."
2942 t nil
2943 pike '((?{ . ?}) (?\[ . ?\]) (?< . ?>)))
2944(c-lang-defvar c-special-brace-lists (c-lang-const c-special-brace-lists))
2945
2946(c-lang-defconst c-recognize-knr-p
2947 "Non-nil means K&R style argument declarations are valid."
2948 t nil
2949 c t)
2950(c-lang-defvar c-recognize-knr-p (c-lang-const c-recognize-knr-p))
2951
(c-lang-defconst c-recognize-typeless-decls
  "Non-nil means function declarations without return type should be
recognized.  That can introduce an ambiguity with parenthesized macro
calls before a brace block.  This setting does not affect declarations
that are preceded by a declaration starting keyword, so
e.g. `c-typeless-decl-kwds' may still be used when it's set to nil."
  t                 nil
  (c c++ objc java) t)
(c-lang-defvar c-recognize-typeless-decls
  (c-lang-const c-recognize-typeless-decls))
2962
(c-lang-defconst c-recognize-<>-arglists
  "Non-nil means C++ style template arglists should be handled.  More
specifically, this means a comma separated list of types or
expressions surrounded by \"<\" and \">\".  It's always preceded by an
identifier or one of the keywords on `c-<>-type-kwds' or
`c-<>-arglist-kwds'.  If there's an identifier before then the whole
expression is considered to be a type."
  ;; The value is derived from the keyword lists: it is non-nil when
  ;; either `c-<>-type-kwds' or `c-<>-arglist-kwds' is a non-empty list.
  t    (or (consp (c-lang-const c-<>-type-kwds))
           (consp (c-lang-const c-<>-arglist-kwds)))
  java t)
(c-lang-defvar c-recognize-<>-arglists
  (c-lang-const c-recognize-<>-arglists))
2974
9d5a8f0b
AM
(c-lang-defconst c-enums-contain-decls
  "Non-nil means that an enum structure can contain declarations."
  t    nil
  java t)
(c-lang-defvar c-enums-contain-decls
  (c-lang-const c-enums-contain-decls))
2980
d9e94c22
MS
(c-lang-defconst c-recognize-paren-inits
  "Non-nil means that parenthesis style initializers exist,
i.e. constructs like

    Foo bar (gnu);

in addition to the more classic

    Foo bar = gnu;"
  t   nil
  c++ t)
(c-lang-defvar c-recognize-paren-inits
  (c-lang-const c-recognize-paren-inits))
2993
0386b551
AM
(c-lang-defconst c-recognize-paren-inexpr-blocks
  "Non-nil to recognize gcc style in-expression blocks,
i.e. compound statements surrounded by parentheses inside expressions."
  t       nil
  (c c++) t)
(c-lang-defvar c-recognize-paren-inexpr-blocks
  (c-lang-const c-recognize-paren-inexpr-blocks))
3001
d9e94c22
MS
(c-lang-defconst c-opt-<>-arglist-start
  ;; Regexp matching the start of angle bracket arglists in languages
  ;; where `c-recognize-<>-arglists' is set; nil in the others.  Does
  ;; not exclude keywords outside `c-<>-arglist-kwds'.  The first
  ;; submatch is assumed to surround the preceding symbol.  The whole
  ;; match is assumed to end directly after the opening "<".
  t (and (c-lang-const c-recognize-<>-arglists)
         (concat "\\("
                 (c-lang-const c-symbol-key)
                 "\\)"
                 (c-lang-const c-syntactic-ws)
                 "<")))
(c-lang-defvar c-opt-<>-arglist-start
  (c-lang-const c-opt-<>-arglist-start))
3015
(c-lang-defconst c-opt-<>-arglist-start-in-paren
  ;; Regexp that in addition to `c-opt-<>-arglist-start' matches close
  ;; parens.  The first submatch is assumed to surround
  ;; `c-opt-<>-arglist-start'.  The value is nil whenever
  ;; `c-opt-<>-arglist-start' is nil.
  t (and (c-lang-const c-opt-<>-arglist-start)
         (concat "\\("
                 (c-lang-const c-opt-<>-arglist-start)
                 "\\)\\|\\s\)")))
(c-lang-defvar c-opt-<>-arglist-start-in-paren
  (c-lang-const c-opt-<>-arglist-start-in-paren))
a66cd3ee 3026
d9e94c22
MS
(c-lang-defconst c-opt-postfix-decl-spec-key
  ;; Regexp matching the beginning of a declaration specifier in the
  ;; region between the header and the body of a declaration.
  ;;
  ;; TODO: This is currently not used uniformly; c++-mode and
  ;; java-mode each have their own ways of using it.
  t    nil
  c++  (concat
        ;; An optional colon followed by optional whitespace.
        ":?"
        (c-lang-const c-simple-ws) "*"
        ;; An optional "virtual", then one of `c-protection-kwds'.
        "\\(virtual" (c-lang-const c-simple-ws) "+\\)?\\("
        (c-make-keywords-re nil (c-lang-const c-protection-kwds))
        "\\)" (c-lang-const c-simple-ws) "+"
        ;; The symbol that follows, in its own submatch.
        "\\(" (c-lang-const c-symbol-key) "\\)")
  java (c-make-keywords-re t (c-lang-const c-postfix-spec-kwds)))
(c-lang-defvar c-opt-postfix-decl-spec-key
  (c-lang-const c-opt-postfix-decl-spec-key))
a66cd3ee 3043
0386b551
AM
(c-lang-defconst c-recognize-colon-labels
  "Non-nil if generic labels ending with \":\" should be recognized.
That includes labels in code and access keys in classes.  This does
not apply to labels recognized by `c-label-kwds' and
`c-opt-extra-label-key'."
  t                      nil
  (c c++ objc java pike) t)
(c-lang-defvar c-recognize-colon-labels
  (c-lang-const c-recognize-colon-labels))
3053
(c-lang-defconst c-label-prefix-re
  "Regexp like `c-decl-prefix-re' that matches any token that can precede
a generic colon label.  Not used if `c-recognize-colon-labels' is
nil."
  ;; One or more of "{", "}" and ";", captured in the first submatch.
  t "\\([{};]+\\)")
(c-lang-defvar c-label-prefix-re
  (c-lang-const c-label-prefix-re))
3061
(c-lang-defconst c-nonlabel-token-key
  "Regexp matching things that can't occur in generic colon labels,
neither in a statement nor in a declaration context.  The regexp is
tested at the beginning of every sexp in a suspected label,
i.e. before \":\".  Only used if `c-recognize-colon-labels' is set."
  t
  (concat
   ;; All keywords except `c-label-kwds' and `c-protection-kwds'.
   (c-make-keywords-re t
     (set-difference (c-lang-const c-keywords)
                     (append (c-lang-const c-label-kwds)
                             (c-lang-const c-protection-kwds))
                     :test 'string-equal)))

  ;; Don't allow string literals, except in AWK.  Character constants
  ;; are OK.
  (c objc java pike idl)
  (concat "\"\\|"
          (c-lang-const c-nonlabel-token-key))

  ;; Also check for open parens in C++, to catch member init lists in
  ;; constructors.  We normally allow it so that macros with arguments
  ;; work in labels.
  c++
  (concat "\\s\(\\|\"\\|" (c-lang-const c-nonlabel-token-key)))
(c-lang-defvar c-nonlabel-token-key
  (c-lang-const c-nonlabel-token-key))
3082
a6ba2ab9
AM
(c-lang-defconst c-nonlabel-token-2-key
  "Regexp matching things that can't occur two symbols before a colon in
a label construct.  This catches C++'s inheritance construct \"class foo
: bar\".  Only used if `c-recognize-colon-labels' is set."
  t   "\\<\\>"                          ; matches nothing
  c++ (c-make-keywords-re t '("class")))
(c-lang-defvar c-nonlabel-token-2-key
  (c-lang-const c-nonlabel-token-2-key))
3090
0386b551
AM
(c-lang-defconst c-opt-extra-label-key
  "Optional regexp matching labels.
Normally, labels are detected according to `c-nonlabel-token-key',
`c-decl-prefix-re' and `c-nonlabel-decl-prefix-re'.  This regexp can
be used if there are additional labels that aren't recognized that
way."
  t    nil
  ;; Built from the keywords in `c-protection-kwds'.
  objc (c-make-keywords-re t (c-lang-const c-protection-kwds)))
(c-lang-defvar c-opt-extra-label-key
  (c-lang-const c-opt-extra-label-key))
3100
(c-lang-defconst c-opt-friend-key
  ;; Regexp describing friend declarations in classes, or nil in
  ;; languages that don't have such things.
  ;;
  ;; TODO: Ought to use `c-prefix-spec-kwds-re' or similar, and the
  ;; template skipping isn't done properly.  This will disappear soon.
  t   nil
  c++ (concat
       ;; First alternative: a plain "friend" followed by whitespace.
       "friend" (c-lang-const c-simple-ws) "+"
       "\\|"
       ;; Second alternative: "template <...>" in front of "friend".
       "template"
       (c-lang-const c-simple-ws) "*"
       "<.+>"
       (c-lang-const c-simple-ws) "*"
       "friend"
       (c-lang-const c-simple-ws) "+"))
(c-lang-defvar c-opt-friend-key
  (c-lang-const c-opt-friend-key))
a66cd3ee 3117
(c-lang-defconst c-opt-method-key
  ;; Special regexp to match the start of Objective-C methods.  The
  ;; first submatch is assumed to end after the + or - key.
  t    nil
  objc (concat
        ;; TODO: Ought to use a better method than anchoring on bol.
        "^\\s *"
        "\\([+-]\\)"
        (c-lang-const c-simple-ws) "*"
        ;; Optional parenthesized return type.
        "\\("
        "([^\)]*)"
        (c-lang-const c-simple-ws) "*"
        "\\)?"
        ;; The symbol that follows, in its own submatch.
        "\\(" (c-lang-const c-symbol-key) "\\)"))
(c-lang-defvar c-opt-method-key
  (c-lang-const c-opt-method-key))
0ec8351b 3133
0386b551
AM
(c-lang-defconst c-type-decl-end-used
  ;; Must be set in buffers where the `c-type' text property might be
  ;; used with the value `c-decl-end'.
  ;;
  ;; `c-decl-end' is used to mark the ends of labels and access keys
  ;; to make interactive refontification work better.
  t    (or (c-lang-const c-recognize-colon-labels)
           (if (c-lang-const c-label-kwds) t))
  ;; `c-decl-end' is used to mark the end of the @-style directives in
  ;; Objective-C.
  objc t)
(c-lang-defvar c-type-decl-end-used
  (c-lang-const c-type-decl-end-used))
3146
785eecbb 3147\f
d9e94c22
MS
3148;;; Wrap up the `c-lang-defvar' system.
3149
;; Compile in the lists of language variables that have been collected
;; with the `c-lang-defvar' and `c-lang-setvar' macros.  Note that the
;; first element of each list is nil.
(defconst c-lang-variable-inits
  (cc-eval-when-compile c-lang-variable-inits))
(defconst c-emacs-variable-inits
  (cc-eval-when-compile c-emacs-variable-inits))
d9e94c22 3155
473944f3
AM
;; Make the `c-lang-setvar' variables buffer local in the current buffer.
;; These are typically standard emacs variables such as `comment-start'.
(defmacro c-make-emacs-variables-local ()
  ;; Expands to a `progn' holding one `make-local-variable' call per
  ;; entry of `c-emacs-variable-inits'; the leading element of that
  ;; list is skipped.
  (cons 'progn
        (mapcar (lambda (entry)
                  (list 'make-local-variable
                        (list 'quote (car entry))))
                (cdr c-emacs-variable-inits))))
3163
d9e94c22
MS
(defun c-make-init-lang-vars-fun (mode)
  "Create a function that initializes all the language dependent variables
for the given mode.

MODE is the mode symbol that `c-buffer-is-cc-mode' is bound to while
the variables are being set.  The return value is a `lambda' form
taking no arguments.

This function should be evaluated at compile time, so that the
function it returns is byte compiled with all the evaluated results
from the language constants.  Use the `c-init-language-vars' macro to
accomplish that conveniently.

If evaluating the value for some variable signals an error, the
returned function reports it with `message', naming the variable that
was being set; an error that occurs before any variable has been
selected is signaled again."

  (if (and (not load-in-progress)
           (boundp 'byte-compile-dest-file)
           (stringp byte-compile-dest-file))

      ;; No need to byte compile this lambda since the byte compiler is
      ;; smart enough to detect the `funcall' construct in the
      ;; `c-init-language-vars' macro below and compile it all straight
      ;; into the function that contains `c-init-language-vars'.
      `(lambda ()

         ;; This let sets up the context for `c-mode-var' and similar
         ;; that could be in the result from `cl-macroexpand-all'.
         (let ((c-buffer-is-cc-mode ',mode)
               current-var source-eval)
           (c-make-emacs-variables-local)
           (condition-case err

               (if (eq c-version-sym ',c-version-sym)
                   (setq ,@(let ((c-buffer-is-cc-mode mode)
                                 (c-lang-const-expansion 'immediate))
                             ;; `c-lang-const' will expand to the evaluated
                             ;; constant immediately in `cl-macroexpand-all'
                             ;; below.
                             (mapcan
                              (lambda (init)
                                `(current-var ',(car init)
                                  ,(car init) ,(cl-macroexpand-all
                                                (elt init 1))))
                              ;; Note: The following `append' copies the
                              ;; first argument.  That list is small, so
                              ;; this doesn't matter too much.
                              (append (cdr c-emacs-variable-inits)
                                      (cdr c-lang-variable-inits)))))

                 ;; This diagnostic message isn't useful for end
                 ;; users, so it's disabled.
                 ;;(unless (get ',mode 'c-has-warned-lang-consts)
                 ;;  (message ,(concat "%s compiled with CC Mode %s "
                 ;;                    "but loaded with %s - evaluating "
                 ;;                    "language constants from source")
                 ;;           ',mode ,c-version c-version)
                 ;;  (put ',mode 'c-has-warned-lang-consts t))

                 ;; The version symbol compiled into this function
                 ;; differs from the one currently loaded, so fall back
                 ;; to evaluating the stored value forms at run time.
                 (setq source-eval t)
                 (let ((init ',(append (cdr c-emacs-variable-inits)
                                       (cdr c-lang-variable-inits))))
                   (while init
                     (setq current-var (caar init))
                     (set (caar init) (eval (cadar init)))
                     (setq init (cdr init)))))

             (error
              (if current-var
                  (message "Eval error in the `c-lang-defvar' or `c-lang-setvar' for `%s'%s: %S"
                           current-var
                           (if source-eval
                               (format "\
 (fallback source eval - %s compiled with CC Mode %s but loaded with %s)"
                                       ',mode ,c-version c-version)
                             "")
                           err)
                (signal (car err) (cdr err)))))))

    ;; Being evaluated from source.  Always use the dynamic method to
    ;; work well when `c-lang-defvar's in this file are reevaluated
    ;; interactively.
    `(lambda ()
       (require 'cc-langs)
       (let ((c-buffer-is-cc-mode ',mode)
             (init (append (cdr c-emacs-variable-inits)
                           (cdr c-lang-variable-inits)))
             current-var)
         (c-make-emacs-variables-local)
         (condition-case err

             (while init
               (setq current-var (caar init))
               (set (caar init) (eval (cadar init)))
               (setq init (cdr init)))

           (error
            (if current-var
                ;; The macro is named `c-lang-setvar'; keep this message
                ;; consistent with the one in the compiled branch above.
                (message
                 "Eval error in the `c-lang-defvar' or `c-lang-setvar' for `%s' (source eval): %S"
                 current-var err)
              (signal (car err) (cdr err)))))))
    ))
3260
(defmacro c-init-language-vars (mode)
  "Initialize all the language dependent variables for the given mode.
This macro is expanded at compile time to a form tailored for the mode
in question, so MODE must be a constant.  Therefore MODE is not
evaluated and should not be quoted."
  ;; The expansion is a `funcall' of the lambda form produced by
  ;; `c-make-init-lang-vars-fun' for MODE.
  (list 'funcall (c-make-init-lang-vars-fun mode)))
130c507e 3267
fb032a95 3268\f
130c507e 3269(cc-provide 'cc-langs)
3afbc435 3270
785eecbb 3271;;; cc-langs.el ends here