New syntax-propertize functionality.
[bpt/emacs.git] / lisp / progmodes / perl-mode.el
1 ;;; perl-mode.el --- Perl code editing commands for GNU Emacs
2
3 ;; Copyright (C) 1990, 1994, 2001, 2002, 2003, 2004, 2005, 2006, 2007,
4 ;; 2008, 2009, 2010 Free Software Foundation, Inc.
5
6 ;; Author: William F. Mann
7 ;; Maintainer: FSF
8 ;; Adapted-By: ESR
9 ;; Keywords: languages
10
11 ;; Adapted from C code editing commands 'c-mode.el', Copyright 1987 by the
12 ;; Free Software Foundation, under terms of its General Public License.
13
14 ;; This file is part of GNU Emacs.
15
16 ;; GNU Emacs is free software: you can redistribute it and/or modify
17 ;; it under the terms of the GNU General Public License as published by
18 ;; the Free Software Foundation, either version 3 of the License, or
19 ;; (at your option) any later version.
20
21 ;; GNU Emacs is distributed in the hope that it will be useful,
22 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
23 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
24 ;; GNU General Public License for more details.
25
26 ;; You should have received a copy of the GNU General Public License
27 ;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>.
28
29 ;;; Commentary:
30
31 ;; To enter perl-mode automatically, add (autoload 'perl-mode "perl-mode")
32 ;; to your .emacs file and change the first line of your perl script to:
33 ;; #!/usr/bin/perl -- # -*-Perl-*-
34 ;; With arguments to perl:
35 ;; #!/usr/bin/perl -P- # -*-Perl-*-
36 ;; To handle files included with do 'filename.pl';, add something like
37 ;; (setq auto-mode-alist (append (list (cons "\\.pl\\'" 'perl-mode))
38 ;; auto-mode-alist))
39 ;; to your .emacs file; otherwise the .pl suffix defaults to prolog-mode.
40
41 ;; This code is based on the 18.53 version c-mode.el, with extensive
42 ;; rewriting. Most of the features of c-mode survived intact.
43
44 ;; I added a new feature which adds functionality to TAB; it is controlled
45 ;; by the variable perl-tab-to-comment. With it enabled, TAB does the
46 ;; first thing it can from the following list: change the indentation;
47 ;; move past leading white space; delete an empty comment; reindent a
48 ;; comment; move to end of line; create an empty comment; tell you that
49 ;; the line ends in a quoted string, or has a # which should be a \#.
50
51 ;; If your machine is slow, you may want to remove some of the bindings
52 ;; to perl-electric-terminator. I changed the indenting defaults to be
53 ;; what Larry Wall uses in perl/lib, but left in all the options.
54
55 ;; I also tuned a few things: comments and labels starting in column
56 ;; zero are left there by perl-indent-exp; perl-beginning-of-function
57 ;; goes back to the first open brace/paren in column zero, the open brace
58 ;; in 'sub ... {', or the equal sign in 'format ... ='; perl-indent-exp
59 ;; (meta-^q) indents from the current line through the close of the next
60 ;; brace/paren, so you don't need to start exactly at a brace or paren.
61
62 ;; It may be good style to put a set of redundant braces around your
63 ;; main program. This will let you reindent it with meta-^q.
64
65 ;; Known problems (these are all caused by limitations in the Emacs Lisp
66 ;; parsing routine (parse-partial-sexp), which was not designed for such
67 ;; a rich language; writing a more suitable parser would be a big job):
68 ;; 2) The globbing syntax <pattern> is not recognized, so special
69 ;; characters in the pattern string must be backslashed.
70 ;; 3) The << quoting operators are not recognized; see below.
71 ;; 5) To make '$' work correctly, $' is not recognized as a variable.
72 ;; Use "$'" or $POSTMATCH instead.
73 ;;
74 ;; If you don't use font-lock, additional problems will appear:
75 ;; 1) Regular expression delimiters do not act as quotes, so special
76 ;; characters such as `'"#:;[](){} may need to be backslashed
77 ;; in regular expressions and in both parts of s/// and tr///.
78 ;; 4) The q and qq quoting operators are not recognized; see below.
79 ;; 5) To make variables such as $' and $#array work, perl-mode treats
80 ;; $ just like backslash, so '$' is not treated correctly.
81 ;; 6) Unfortunately, treating $ like \ makes ${var} be treated as an
82 ;; unmatched }. See below.
83 ;; 7) When ' (quote) is used as a package name separator, perl-mode
84 ;; doesn't understand, and thinks it is seeing a quoted string.
85
86 ;; Here are some ugly tricks to bypass some of these problems: the perl
87 ;; expression /`/ (that's a back-tick) usually evaluates harmlessly,
88 ;; but will trick perl-mode into starting a quoted string, which
89 ;; can be ended with another /`/. Assuming you have no embedded
90 ;; back-ticks, this can be used to help solve problem 3:
91 ;;
92 ;; /`/; $ugly = q?"'$?; /`/;
93 ;;
94 ;; The same trick can be used for problem 6 as in:
95 ;; /{/; while (<${glob_me}>)
96 ;; but a simpler solution is to add a space between the $ and the {:
97 ;; while (<$ {glob_me}>)
98 ;;
99 ;; Problem 7 is even worse, but this 'fix' does work :-(
100 ;; $DB'stop#'
101 ;; [$DB'line#'
102 ;; ] =~ s/;9$//;
103
104 ;;; Code:
105
106 (eval-when-compile (require 'cl))
107
108 (defvar font-lock-comment-face)
109 (defvar font-lock-doc-face)
110 (defvar font-lock-string-face)
111
112 (defgroup perl nil
113 "Major mode for editing Perl code."
114 :link '(custom-group-link :tag "Font Lock Faces group" font-lock-faces)
115 :prefix "perl-"
116 :group 'languages)
117
118 (defvar perl-mode-abbrev-table nil
119 "Abbrev table in use in perl-mode buffers.")
120 (define-abbrev-table 'perl-mode-abbrev-table ())
121
(defvar perl-mode-map
  (let ((keymap (make-sparse-keymap)))
    ;; Each entry is (KEY . COMMAND); entries are installed in list order.
    (dolist (binding '(("{" . perl-electric-terminator)
                       ("}" . perl-electric-terminator)
                       (";" . perl-electric-terminator)
                       (":" . perl-electric-terminator)
                       ("\e\C-a" . perl-beginning-of-function)
                       ("\e\C-e" . perl-end-of-function)
                       ("\e\C-h" . perl-mark-function)
                       ("\e\C-q" . perl-indent-exp)
                       ("\177" . backward-delete-char-untabify)
                       ("\t" . perl-indent-command)))
      (define-key keymap (car binding) (cdr binding)))
    keymap)
  "Keymap used in Perl mode.")
136
137 (autoload 'c-macro-expand "cmacexp"
138 "Display the result of expanding all C macros occurring in the region.
139 The expansion is entirely correct because it uses the C preprocessor."
140 t)
141
(defvar perl-mode-syntax-table
  (let ((table (make-syntax-table (standard-syntax-table))))
    ;; Each entry is (CHAR . SYNTAX-DESCRIPTOR); applied in list order.
    (dolist (entry '((?\n . ">")
                     (?# . "<")
                     ;; `$' is also a prefix char so I was tempted to say "/ p",
                     ;; but the `p' thingy basically overrides the `/' :-( --stef
                     (?$ . "/")
                     (?% . ". p")
                     (?@ . ". p")
                     (?& . ".")
                     (?\' . "\"")
                     (?* . ".")
                     (?+ . ".")
                     (?- . ".")
                     (?/ . ".")
                     (?< . ".")
                     (?= . ".")
                     (?> . ".")
                     (?\\ . "\\")
                     (?` . "\"")
                     (?| . ".")))
      (modify-syntax-entry (car entry) (cdr entry) table))
    table)
  "Syntax table in use in `perl-mode' buffers.")
165
166 (defvar perl-imenu-generic-expression
167 '(;; Functions
168 (nil "^sub\\s-+\\([-A-Za-z0-9+_:]+\\)" 1)
169 ;;Variables
170 ("Variables" "^\\([$@%][-A-Za-z0-9+_:]+\\)\\s-*=" 1)
171 ("Packages" "^package\\s-+\\([-A-Za-z0-9+_:]+\\);" 1)
172 ("Doc sections" "^=head[0-9][ \t]+\\(.*\\)" 1))
173 "Imenu generic expression for Perl mode. See `imenu-generic-expression'.")
174
175 ;; Regexps updated with help from Tom Tromey <tromey@cambric.colorado.edu> and
176 ;; Jim Campbell <jec@murzim.ca.boeing.com>.
177
178 (defconst perl-font-lock-keywords-1
179 '(;; What is this for?
180 ;;("\\(--- .* ---\\|=== .* ===\\)" . font-lock-string-face)
181 ;;
182 ;; Fontify preprocessor statements as we do in `c-font-lock-keywords'.
183 ;; Ilya Zakharevich <ilya@math.ohio-state.edu> thinks this is a bad idea.
184 ;; ("^#[ \t]*include[ \t]+\\(<[^>\"\n]+>\\)" 1 font-lock-string-face)
185 ;; ("^#[ \t]*define[ \t]+\\(\\sw+\\)(" 1 font-lock-function-name-face)
186 ;; ("^#[ \t]*if\\>"
187 ;; ("\\<\\(defined\\)\\>[ \t]*(?\\(\\sw+\\)?" nil nil
188 ;; (1 font-lock-constant-face) (2 font-lock-variable-name-face nil t)))
189 ;; ("^#[ \t]*\\(\\sw+\\)\\>[ \t]*\\(\\sw+\\)?"
190 ;; (1 font-lock-constant-face) (2 font-lock-variable-name-face nil t))
191 ;;
192 ;; Fontify function and package names in declarations.
193 ("\\<\\(package\\|sub\\)\\>[ \t]*\\(\\sw+\\)?"
194 (1 font-lock-keyword-face) (2 font-lock-function-name-face nil t))
195 ("\\<\\(import\\|no\\|require\\|use\\)\\>[ \t]*\\(\\sw+\\)?"
196 (1 font-lock-keyword-face) (2 font-lock-constant-face nil t)))
197 "Subdued level highlighting for Perl mode.")
198
199 (defconst perl-font-lock-keywords-2
200 (append perl-font-lock-keywords-1
201 (list
202 ;;
203 ;; Fontify keywords, except those fontified otherwise.
204 (concat "\\<"
205 (regexp-opt '("if" "until" "while" "elsif" "else" "unless"
206 "do" "dump" "for" "foreach" "exit" "die"
207 "BEGIN" "END" "return" "exec" "eval") t)
208 "\\>")
209 ;;
210 ;; Fontify local and my keywords as types.
211 '("\\<\\(local\\|my\\)\\>" . font-lock-type-face)
212 ;;
213 ;; Fontify function, variable and file name references.
214 '("&\\(\\sw+\\(::\\sw+\\)*\\)" 1 font-lock-function-name-face)
215 ;; Additionally underline non-scalar variables. Maybe this is a bad idea.
216 ;;'("[$@%*][#{]?\\(\\sw+\\)" 1 font-lock-variable-name-face)
217 '("[$*]{?\\(\\sw+\\(::\\sw+\\)*\\)" 1 font-lock-variable-name-face)
218 '("\\([@%]\\|\\$#\\)\\(\\sw+\\(::\\sw+\\)*\\)"
219 (2 (cons font-lock-variable-name-face '(underline))))
220 '("<\\(\\sw+\\)>" 1 font-lock-constant-face)
221 ;;
222 ;; Fontify keywords with/and labels as we do in `c++-font-lock-keywords'.
223 '("\\<\\(continue\\|goto\\|last\\|next\\|redo\\)\\>[ \t]*\\(\\sw+\\)?"
224 (1 font-lock-keyword-face) (2 font-lock-constant-face nil t))
225 '("^[ \t]*\\(\\sw+\\)[ \t]*:[^:]" 1 font-lock-constant-face)))
226 "Gaudy level highlighting for Perl mode.")
227
228 (defvar perl-font-lock-keywords perl-font-lock-keywords-1
229 "Default expressions to highlight in Perl mode.")
230
(defvar perl-quote-like-pairs
  '((?\( . ?\))
    (?\[ . ?\])
    (?\{ . ?\})
    (?\< . ?\>))
  "Alist of bracketing delimiters for quote-like operators.
Each element is (OPEN . CLOSE), pairing an opening delimiter
character with the character that closes it.")
233
234 ;; FIXME: handle here-docs and regexps.
235 ;; <<EOF <<"EOF" <<'EOF' (no space)
236 ;; see `man perlop'
237 ;; ?...?
238 ;; /.../
239 ;; m [...]
240 ;; m /.../
241 ;; q /.../ = '...'
242 ;; qq /.../ = "..."
243 ;; qx /.../ = `...`
244 ;; qr /.../ = precompiled regexp =~=~ m/.../
245 ;; qw /.../
246 ;; s /.../.../
247 ;; s <...> /.../
248 ;; s '...'...'
249 ;; tr /.../.../
250 ;; y /.../.../
251 ;;
252 ;; <file*glob>
(defun perl-syntax-propertize-function (start end)
  "Apply `syntax-table' text properties to Perl code between START and END.
First finish any special construct that is still open at START, via
`perl-syntax-propertize-special-constructs', then run the rules below
over the rest of the region.  Matching is case-sensitive."
  (let ((case-fold-search nil))
    (goto-char start)
    (perl-syntax-propertize-special-constructs end)
    ;; TODO: here-documents ("<<\\(\\sw\\|['\"]\\)")
    (funcall
     (syntax-propertize-rules
      ;; Turn POD into b-style comments.  Place the cut rule first since it's
      ;; more specific.
      ("^=cut\\>.*\\(\n\\)" (1 "> b"))
      ("^\\(=\\)\\sw" (1 "< b"))
      ;; Catch ${ so that ${var} doesn't screw up indentation.
      ;; This also catches $' to handle 'foo$', although it should really
      ;; check that it occurs inside a '..' string.
      ("\\(\\$\\)[{']" (1 ". p"))
      ;; Handle funny names like $DB'stop.
      ("\\$ ?{?^?[_a-zA-Z][_a-zA-Z0-9]*\\('\\)[_a-zA-Z]" (1 "_"))
      ;; format statements
      ("^[ \t]*format.*=[ \t]*\\(\n\\)"
       (1 (prog1 "\"" (perl-syntax-propertize-special-constructs end))))
      ;; Funny things in `sub' arg-specs like `sub myfun ($)' or `sub ($)'.
      ;; Be careful not to match "sub { (...) ... }".
      ("\\<sub\\(?:[[:space:]]+[^{}[:punct:][:space:]]+\\)?[[:space:]]*(\\([^)]+\\))"
       (1 "."))
      ;; Regexp and funny quotes.  Distinguishing a / that starts a regexp
      ;; match from the division operator is ...interesting.
      ;; Basically, / is a regexp match if it's preceded by an infix operator
      ;; (or some similar separator), or by one of the special keywords
      ;; corresponding to builtin functions that can take their first arg
      ;; without parentheses.  Of course, that presumes we're looking at the
      ;; *opening* slash.  We can afford to mis-match the closing ones
      ;; here, because they will be re-treated separately later in
      ;; perl-syntax-propertize-special-constructs.
      ((concat "\\(?:\\(?:^\\|[^$@&%[:word:]]\\)"
               ;; Each keyword is listed once.
               (regexp-opt '("split" "if" "unless" "until" "while"
                             "grep" "map" "not" "or" "and"))
               "\\|[?:.,;=!~({[]\\|\\(^\\)\\)[ \t\n]*\\(/\\)")
       (2 (ignore
           (if (and (match-end 1)       ; / at BOL.
                    (save-excursion
                      (goto-char (match-end 1))
                      (forward-comment (- (point-max)))
                      ;; Mark the span from the previous non-comment text
                      ;; up to the slash as one multiline unit.
                      (put-text-property (point) (match-end 2)
                                         'syntax-multiline t)
                      (not (memq (char-before)
                                 '(?? ?: ?. ?, ?\; ?= ?! ?~ ?\( ?\[)))))
               nil ;; A division sign instead of a regexp-match.
             (put-text-property (match-beginning 2) (match-end 2)
                                'syntax-table (string-to-syntax "\""))
             (perl-syntax-propertize-special-constructs end)))))
      ("\\(^\\|[?:.,;=!~({[ \t]\\)\\([msy]\\|q[qxrw]?\\|tr\\)\\>\\s-*\\([^])}> \n\t]\\)"
       ;; Nasty cases:
       ;; /foo/m  $a->m  $#m $m @m %m
       ;; \s (appears often in regexps).
       ;; -s file
       ;; sub tr {...}
       (3 (ignore
           (if (save-excursion (goto-char (match-beginning 0))
                               (forward-word -1)
                               (looking-at-p "sub[ \t\n]"))
               ;; This is defining a function.
               nil
             ;; Bracketing delimiters get generic-string syntax ("|");
             ;; any other delimiter is treated as a plain string quote.
             (put-text-property (match-beginning 3) (match-end 3)
                                'syntax-table
                                (if (assoc (char-after (match-beginning 3))
                                           perl-quote-like-pairs)
                                    (string-to-syntax "|")
                                  (string-to-syntax "\"")))
             (perl-syntax-propertize-special-constructs end))))))
     (point) end)))
323
(defvar perl-empty-syntax-table
  (let ((table (copy-syntax-table))
        (code 0))
    ;; Give the first 256 character codes punctuation syntax ...
    (while (< code 256)
      (aset table code '(1))
      (setq code (1+ code)))
    ;; ... except backslash, which keeps its escape syntax.
    (modify-syntax-entry ?\\ "\\" table)
    table)
  "Syntax table used internally for processing quote-like operators.")
331
(defun perl-quote-syntax-table (char)
  "Return a fresh syntax table for a quote-like construct opened by CHAR.
The table is a copy of `perl-empty-syntax-table'.  If CHAR has a
closing partner in `perl-quote-like-pairs', CHAR and that partner get
open and close parenthesis syntax; otherwise CHAR gets string-quote
syntax."
  (let ((table (copy-syntax-table perl-empty-syntax-table))
        (closer (cdr (assq char perl-quote-like-pairs))))
    (cond
     (closer
      (modify-syntax-entry char "(" table)
      (modify-syntax-entry closer ")" table))
     (t
      (modify-syntax-entry char "\"" table)))
    table))
340
(defun perl-syntax-propertize-special-constructs (limit)
  "Propertize special constructs like regexps and formats.
Look at the parser state at point and, if point is inside a `format'
body or a quote-like construct, search no further than LIMIT for its
end and put the matching `syntax-table' property on the terminator."
  (let* ((state (syntax-ppss))
         (in-string (nth 3 state)))
    (cond
     ((or (null in-string)
          (and (characterp in-string) (eq (char-syntax in-string) ?\")))
      ;; Normal text, or comment, or docstring, or normal string.
      nil)
     ((eq in-string ?\n)
      ;; A `format' command: the body ends at a line holding only a dot.
      (when (re-search-forward "^\\s *\\.\\s *\n" limit 'move)
        (put-text-property (1- (point)) (point)
                           'syntax-table (string-to-syntax "\""))))
     (t
      ;; This is regexp like quote thingy.
      (let* ((opener (char-after (nth 8 state)))
             ;; Non-nil when the word before the opener is tr, s or y,
             ;; i.e. the operator takes two delimited parts.
             (two-part (save-excursion
                         (goto-char (nth 8 state))
                         (skip-syntax-backward " ")
                         (skip-syntax-backward "w")
                         (member (buffer-substring
                                  (point) (progn (forward-word 1) (point)))
                                 '("tr" "s" "y"))))
             (closer (cdr (assq opener perl-quote-like-pairs)))
             (quote-table (perl-quote-syntax-table opener)))
        (when (with-syntax-table quote-table
                (if closer
                    ;; For paired delimiters, Perl allows nesting them, but
                    ;; since we treat them as strings, Emacs does not count
                    ;; those delimiters in `state', so we don't know how deep
                    ;; we are: we have to go back to the beginning of this
                    ;; "string" and count from there.
                    (condition-case nil
                        (progn
                          ;; Start after the first char since it doesn't have
                          ;; paren-syntax (an alternative would be to let-bind
                          ;; parse-sexp-lookup-properties).
                          (goto-char (1+ (nth 8 state)))
                          (up-list 1)
                          t)
                      (scan-error nil))
                  (not (or (nth 8 (parse-partial-sexp
                                   (point) limit nil nil state 'syntax-table))
                           ;; If we have a self-paired opener and a two-part
                           ;; command, the form is s/../../ so we have to skip
                           ;; a second time.
                           ;; In the case of s{...}{...}, we only handle the
                           ;; first part here and the next below.
                           (when (and two-part (not closer))
                             (nth 8 (parse-partial-sexp
                                     (point) limit
                                     nil nil state 'syntax-table)))))))
          ;; Point is now right after the arg(s).
          ;; A `$' just before the terminator gets punctuation syntax.
          (when (eq (char-before (1- (point))) ?$)
            (put-text-property (- (point) 2) (1- (point))
                               'syntax-table '(1)))
          (put-text-property (1- (point)) (point)
                             'syntax-table
                             (string-to-syntax (if closer "|" "\"")))
          ;; If we have two args with a non-self-paired starter (e.g.
          ;; s{...}{...}) we're right after the first arg, so we still have
          ;; to handle the second part.
          (when (and two-part closer)
            ;; Skip whitespace and make sure that font-lock will
            ;; refontify the second part in the proper context.
            (put-text-property
             (point) (progn (forward-comment (point-max)) (point))
             'syntax-multiline t)
            (when (< (point) limit)
              (put-text-property (point) (1+ (point))
                                 'syntax-table
                                 ;; Put an `e' in the cdr to mark this
                                 ;; char as "second arg starter".
                                 (string-to-syntax
                                  (if (assoc (char-after)
                                             perl-quote-like-pairs)
                                      "|e"
                                    "\"e")))
              (forward-char 1)
              ;; Re-use this function to handle the second part (the
              ;; first delimiter of the second part can't be preceded
              ;; by "s" or "tr" or "y", so it will not be considered
              ;; as two-part).
              (perl-syntax-propertize-special-constructs limit)))))))))
428
(defun perl-font-lock-syntactic-face-function (state)
  "Return the face for the string or comment described by parser STATE.
Return nil when STATE is inside a string whose opening delimiter is
marked as a \"second arg starter\" (an `e' in the cdr of its
`syntax-table' property) and the text after that argument's end matches
optional blanks followed by word characters ending in `e'.  In every
other case defer to the default `font-lock-syntactic-face-function'."
  (unless (and (nth 3 state)
               (eq ?e (cdr-safe (get-text-property (nth 8 state)
                                                   'syntax-table)))
               ;; This is a second-arg of s{..}{...} form; let's check if
               ;; this second arg is executable code rather than a string.
               ;; For that, we need to look for an "e" after this second
               ;; arg, so we have to hunt for the end of the arg.  Depending
               ;; on whether the whole arg has already been
               ;; syntax-propertized or not, the end-char will have
               ;; different syntaxes, so let's ignore syntax-properties
               ;; temporarily so we can pretend it has not been
               ;; syntax-propertized yet.
               (let* ((parse-sexp-lookup-properties nil)
                      (opener (char-after (nth 8 state)))
                      (bracketed (assq opener perl-quote-like-pairs)))
                 (with-syntax-table (perl-quote-syntax-table opener)
                   (save-excursion
                     (if bracketed
                         (condition-case nil
                             (progn
                               (goto-char (1+ (nth 8 state)))
                               (up-list 1))
                           (scan-error (goto-char (point-max))))
                       (parse-partial-sexp (point) (point-max)
                                           nil nil state 'syntax-table))
                     (put-text-property (nth 8 state) (point)
                                        'jit-lock-defer-multiline t)
                     (looking-at "[ \t]*\\sw*e")))))
    (funcall (default-value 'font-lock-syntactic-face-function) state)))
458
459 (defcustom perl-indent-level 4
460 "*Indentation of Perl statements with respect to containing block."
461 :type 'integer
462 :group 'perl)
463
464 ;; It is not unusual to put both things like perl-indent-level and
465 ;; cperl-indent-level in the local variable section of a file. If only
466 ;; one of perl-mode and cperl-mode is in use, a warning will be issued
467 ;; about the variable. Autoload these here, so that no warning is
468 ;; issued when using either perl-mode or cperl-mode.
469 ;;;###autoload(put 'perl-indent-level 'safe-local-variable 'integerp)
470 ;;;###autoload(put 'perl-continued-statement-offset 'safe-local-variable 'integerp)
471 ;;;###autoload(put 'perl-continued-brace-offset 'safe-local-variable 'integerp)
472 ;;;###autoload(put 'perl-brace-offset 'safe-local-variable 'integerp)
473 ;;;###autoload(put 'perl-brace-imaginary-offset 'safe-local-variable 'integerp)
474 ;;;###autoload(put 'perl-label-offset 'safe-local-variable 'integerp)
475
476 (defcustom perl-continued-statement-offset 4
477 "*Extra indent for lines not starting new statements."
478 :type 'integer
479 :group 'perl)
480 (defcustom perl-continued-brace-offset -4
481 "*Extra indent for substatements that start with open-braces.
482 This is in addition to `perl-continued-statement-offset'."
483 :type 'integer
484 :group 'perl)
485 (defcustom perl-brace-offset 0
486 "*Extra indentation for braces, compared with other text in same context."
487 :type 'integer
488 :group 'perl)
489 (defcustom perl-brace-imaginary-offset 0
490 "*Imagined indentation of an open brace that actually follows a statement."
491 :type 'integer
492 :group 'perl)
493 (defcustom perl-label-offset -2
494 "*Offset of Perl label lines relative to usual indentation."
495 :type 'integer
496 :group 'perl)
497 (defcustom perl-indent-continued-arguments nil
498 "*If non-nil offset of argument lines relative to usual indentation.
499 If nil, continued arguments are aligned with the first argument."
500 :type '(choice integer (const nil))
501 :group 'perl)
502
503 (defcustom perl-tab-always-indent tab-always-indent
504 "Non-nil means TAB in Perl mode always indents the current line.
505 Otherwise it inserts a tab character if you type it past the first
506 nonwhite character on the line."
507 :type 'boolean
508 :group 'perl)
509
510 ;; I changed the default to nil for consistency with general Emacs
511 ;; conventions -- rms.
512 (defcustom perl-tab-to-comment nil
513 "*Non-nil means TAB moves to eol or makes a comment in some cases.
514 For lines which don't need indenting, TAB either indents an
515 existing comment, moves to end-of-line, or if at end-of-line already,
516 create a new comment."
517 :type 'boolean
518 :group 'perl)
519
520 (defcustom perl-nochange ";?#\\|\f\\|\\s(\\|\\(\\w\\|\\s_\\)+:[^:]"
521 "*Lines starting with this regular expression are not auto-indented."
522 :type 'regexp
523 :group 'perl)
524
525 ;; Outline support
526
(defvar perl-outline-regexp
  ;; One alternative per imenu pattern, plus the POD terminator.
  (let ((imenu-patterns (mapconcat 'cadr perl-imenu-generic-expression "\\|")))
    (concat imenu-patterns "\\|^=cut\\>")))
530
(defun perl-outline-level ()
  "Return the outline level of the heading at point.
A `package' line is level 0; `sub' and `=cut' lines are level 1;
a `=headN' line is level N; anything else is level 3."
  (if (looking-at "=head[0-9]")
      ;; The digit is the last character matched.
      (- (char-before (match-end 0)) ?0)
    (cond
     ((looking-at "package\\s-") 0)
     ((or (looking-at "sub\\s-") (looking-at "=cut")) 1)
     (t 3))))
538 \f
539 (defvar perl-mode-hook nil
540 "Normal hook to run when entering Perl mode.")
541
542 ;;;###autoload
(defun perl-mode ()
  "Major mode for editing Perl code.
Expression and list commands understand all Perl brackets.
Tab indents for Perl code.
Comments are delimited with # ... \\n.
Paragraphs are separated by blank lines only.
Delete converts tabs to spaces as it moves back.
\\{perl-mode-map}
Variables controlling indentation style:
 `perl-tab-always-indent'
    Non-nil means TAB in Perl mode should always indent the current line,
    regardless of where in the line point is when the TAB command is used.
 `perl-tab-to-comment'
    Non-nil means that for lines which don't need indenting, TAB will
    either delete an empty comment, indent an existing comment, move
    to end-of-line, or if at end-of-line already, create a new comment.
 `perl-nochange'
    Lines starting with this regular expression are not auto-indented.
 `perl-indent-level'
    Indentation of Perl statements within surrounding block.
    The surrounding block's indentation is the indentation
    of the line on which the open-brace appears.
 `perl-continued-statement-offset'
    Extra indentation given to a substatement, such as the
    then-clause of an if or body of a while.
 `perl-continued-brace-offset'
    Extra indentation given to a brace that starts a substatement.
    This is in addition to `perl-continued-statement-offset'.
 `perl-brace-offset'
    Extra indentation for line if it starts with an open brace.
 `perl-brace-imaginary-offset'
    An open brace following other text is treated as if it were
    this far to the right of the start of its line.
 `perl-label-offset'
    Extra indentation for line that is a label.
 `perl-indent-continued-arguments'
    Offset of argument lines relative to usual indentation.

Various indentation styles:       K&R  BSD  BLK  GNU  LW
  perl-indent-level                5    8    0    2    4
  perl-continued-statement-offset  5    8    4    2    4
  perl-continued-brace-offset      0    0    0    0   -4
  perl-brace-offset               -5   -8    0    0    0
  perl-brace-imaginary-offset      0    0    4    0    0
  perl-label-offset               -5   -8   -2   -2   -2

Turning on Perl mode runs the normal hook `perl-mode-hook'."
  (interactive)
  (kill-all-local-variables)
  (use-local-map perl-mode-map)
  (setq major-mode 'perl-mode
        mode-name "Perl"
        local-abbrev-table perl-mode-abbrev-table)
  (set-syntax-table perl-mode-syntax-table)
  ;; Paragraphs: separated by empty lines or page delimiters.
  (set (make-local-variable 'paragraph-start)
       (concat "$\\|" page-delimiter))
  (set (make-local-variable 'paragraph-separate) paragraph-start)
  (set (make-local-variable 'paragraph-ignore-fill-prefix) t)
  ;; Indentation and file conventions.
  (set (make-local-variable 'indent-line-function) 'perl-indent-line)
  (set (make-local-variable 'require-final-newline)
       mode-require-final-newline)
  ;; Comments.
  (set (make-local-variable 'comment-start) "# ")
  (set (make-local-variable 'comment-end) "")
  (set (make-local-variable 'comment-start-skip) "\\(^\\|\\s-\\);?#+ *")
  (set (make-local-variable 'comment-indent-function) 'perl-comment-indent)
  (set (make-local-variable 'parse-sexp-ignore-comments) t)
  ;; Tell font-lock.el how to handle Perl.
  (setq font-lock-defaults '((perl-font-lock-keywords
                              perl-font-lock-keywords-1
                              perl-font-lock-keywords-2)
                             nil nil ((?\_ . "w")) nil
                             (font-lock-syntactic-face-function
                              . perl-font-lock-syntactic-face-function)))
  (set (make-local-variable 'syntax-propertize-function)
       #'perl-syntax-propertize-function)
  (add-hook 'syntax-propertize-extend-region-functions
            #'syntax-propertize-multiline 'append 'local)
  ;; Tell imenu how to handle Perl.
  (set (make-local-variable 'imenu-generic-expression)
       perl-imenu-generic-expression)
  (setq imenu-case-fold-search nil)
  ;; Setup outline-minor-mode.
  (set (make-local-variable 'outline-regexp) perl-outline-regexp)
  (set (make-local-variable 'outline-level) 'perl-outline-level)
  (run-mode-hooks 'perl-mode-hook))
636 \f
637 ;; This is used by indent-for-comment
638 ;; to decide how much to indent a comment in Perl code
639 ;; based on its context.
(defun perl-comment-indent ()
  "Return the column at which a comment on this line should start.
Return 0 when point is at the beginning of a non-empty line, so a
comment already sitting at the left margin stays there; otherwise
return `comment-column'."
  (if (or (not (bolp)) (eolp))
      comment-column
    0))
644
(defalias 'electric-perl-terminator 'perl-electric-terminator)
(defun perl-electric-terminator (arg)
  "Insert character and adjust indentation.
If at end-of-line, and not in a comment or a quote, correct the line's
indentation.  A prefix ARG suppresses the re-indentation and is used as
the repeat count for the insertion."
  (interactive "P")
  (let ((typed-at (point)))
    (when (and (not arg)                ; decide whether to indent
               (eolp)
               (save-excursion
                 (beginning-of-line)
                 (and
                  ;; Eliminate comments quickly.
                  (not (and comment-start-skip
                            (re-search-forward comment-start-skip
                                               typed-at t)))
                  ;; Colon is special only after a label ....
                  (or (/= last-command-event ?:)
                      (looking-at "\\s-*\\(\\w\\|\\s_\\)+$"))
                  ;; Not inside a string, a comment, or right after a
                  ;; quote character.
                  (let ((pps (parse-partial-sexp
                              (perl-beginning-of-function) typed-at)))
                    (not (or (nth 3 pps) (nth 4 pps) (nth 5 pps)))))))
      ;; Insert the character temporarily so the line is indented as
      ;; if it were already present, then remove it again.
      (insert-char last-command-event 1)
      (perl-indent-line)
      (delete-char -1)))
  (self-insert-command (prefix-numeric-value arg)))
669
670 ;; not used anymore, but may be useful someday:
671 ;;(defun perl-inside-parens-p ()
672 ;; (condition-case ()
673 ;; (save-excursion
674 ;; (save-restriction
675 ;; (narrow-to-region (point)
676 ;; (perl-beginning-of-function))
677 ;; (goto-char (point-max))
678 ;; (= (char-after (or (scan-lists (point) -1 1) (point-min))) ?\()))
679 ;; (error nil)))
680 \f
(defun perl-indent-command (&optional arg)
  "Indent Perl code in the active region or current line.
In Transient Mark mode, when the region is active, reindent the region.
Otherwise, with a prefix argument ARG, reindent the current line
unconditionally.

Otherwise, if `perl-tab-always-indent' is nil and point is not in
the indentation area at the beginning of the line, insert a tab.

Otherwise, indent the current line.  If point was within the
indentation area, it is moved to the end of the indentation area.
If the line was already indented properly and point was not
within the indentation area, and if `perl-tab-to-comment' is
non-nil, then do the first possible action from the following
list:

  1) delete an empty comment
  2) move forward to start of comment, indenting if necessary
  3) move forward to end of line
  4) create an empty comment
  5) move backward to start of comment, indenting if necessary."
  (interactive "P")
  (cond ((use-region-p)                 ; indent the active region
         (indent-region (region-beginning) (region-end)))
        (arg
         (perl-indent-line "\f"))       ; just indent this line
        ((and (not perl-tab-always-indent)
              (> (current-column) (current-indentation)))
         (insert-tab))
        (t
         (let* ((oldpnt (point))
                (lsexp (progn (beginning-of-line) (point)))
                (bof (perl-beginning-of-function))
                (delta (progn
                         (goto-char oldpnt)
                         (perl-indent-line "\f\\|;?#" bof))))
           (and perl-tab-to-comment
                (= oldpnt (point))      ; done if point moved
                (if (listp delta)       ; if line starts in a quoted string
                    (setq lsexp (or (nth 2 delta) bof))
                  (= delta 0))          ; done if indenting occurred
                (let ((eol (progn (end-of-line) (point)))
                      state)
                  (cond ((= (char-after bof) ?=)
                         (if (= oldpnt eol)
                             (message "In a format statement")))
                        ((progn (setq state (parse-partial-sexp lsexp eol))
                                (nth 3 state))
                         (when (= oldpnt eol) ; already at eol in a string
                           ;; The terminator is t rather than a character
                           ;; when the string was opened by a generic
                           ;; string delimiter; `%c' would signal an
                           ;; error on that value.
                           (if (characterp (nth 3 state))
                               (message "In a string which starts with a %c."
                                        (nth 3 state))
                             (message "In a quote-like construct."))))
                        ((not (nth 4 state))
                         (if (= oldpnt eol) ; no comment, create one?
                             (indent-for-comment)))
                        ((progn (beginning-of-line)
                                (and comment-start-skip
                                     (re-search-forward
                                      comment-start-skip eol 'move)))
                         (if (eolp)
                             (progn     ; delete existing comment
                               (goto-char (match-beginning 0))
                               (skip-chars-backward " \t")
                               (delete-region (point) eol))
                           (if (or (< oldpnt (point)) (= oldpnt eol))
                               (indent-for-comment) ; indent existing comment
                             (end-of-line))))
                        ((/= oldpnt eol)
                         (end-of-line))
                        (t
                         (message "Use backslash to quote # characters.")
                         (ding t)))))))))
752
(defun perl-indent-line (&optional nochange parse-start)
  "Indent current line as Perl code.
NOCHANGE, if non-nil, is a regexp used instead of `perl-nochange' to
recognize lines that must not be re-indented.  PARSE-START, if non-nil,
is used as the parse starting position instead of calling
`perl-beginning-of-function'.
Return the amount the indentation changed by, or (parse-state) if
line starts in a quoted string."
  (let ((case-fold-search nil)
        ;; Distance of point from the end of the buffer; this stays
        ;; valid while the indentation in front of point changes.
        (from-end (- (point-max) (point)))
        (bof (or parse-start (save-excursion (perl-beginning-of-function))))
        bol indent shift-amt)
    (beginning-of-line)
    (setq bol (point)
          shift-amt
          (cond
           ;; Parse start is an `=' character: leave the line alone.
           ((eq (char-after bof) ?=) 0)
           ((listp (setq indent (perl-calculate-indent bof))) indent)
           ((looking-at (or nochange perl-nochange)) 0)
           (t
            (skip-chars-forward " \t\f")
            (setq indent (perl-indent-new-calculate nil indent bof))
            (- indent (current-column)))))
    (skip-chars-forward " \t\f")
    (when (and (numberp shift-amt) (/= 0 shift-amt))
      (delete-region bol (point))
      (indent-to indent))
    ;; If initial point was within line's indentation,
    ;; position after the indentation.  Else stay at same point in text.
    (let ((restore (- (point-max) from-end)))
      (when (> restore (point))
        (goto-char restore)))
    shift-amt))
780
(defun perl-continuation-line-p (limit)
  "Move to end of previous line and return non-nil if continued.
Point is first moved backward over whitespace and comments, then over
any label lines and lines ending in a comma.  LIMIT is handed to
`perl-backward-to-start-of-continued-exp' when backing up over a line
that ends in a comma.
The value is nil when the character then before point is `;', `}'
or `{', and t otherwise."
  ;; Statement level.  Is it a continuation or a new statement?
  ;; Find previous non-comment character.
  (perl-backward-to-noncomment)
  ;; Back up over label lines, since they don't
  ;; affect whether our line is a continuation.
  (while (or (eq (preceding-char) ?\,)
             (and (eq (preceding-char) ?:)
                  ;; The character before the colon does not exist when
                  ;; the colon is the first accessible character;
                  ;; `char-before' then yields nil, which `char-syntax'
                  ;; would reject, so treat that case as "not a label".
                  (let ((before-colon (char-before (1- (point)))))
                    (and before-colon
                         (memq (char-syntax before-colon) '(?w ?_))))))
    (if (eq (preceding-char) ?\,)
        (perl-backward-to-start-of-continued-exp limit)
      (beginning-of-line))
    (perl-backward-to-noncomment))
  ;; Now we get the answer.
  (not (memq (preceding-char) '(?\; ?\} ?\{))))
798
(defun perl-hanging-paren-p ()
  "Return non-nil if point is right after a hanging open-paren-like char.
That is the case when only blanks separate point from the end of the
line, and skipping backward over whitespace and open-paren characters
does not reach the beginning of the line."
  (when (looking-at "[ \t]*$")
    (save-excursion
      (skip-syntax-backward " (")
      (not (bolp)))))
804
(defun perl-indent-new-calculate (&optional virtual default parse-start)
  "Return the indentation for the construct starting at point.
If VIRTUAL is non-nil and only blanks precede point on its line, the
current column is returned unchanged.
DEFAULT, if non-nil, is used as the base indentation; otherwise the
base is computed by calling `perl-calculate-indent' with PARSE-START.
A label gets the base plus `perl-label-offset' (but at least 1), a
closing paren-like character is indented like its matching opener,
and a hanging `{' gets the base plus `perl-brace-offset'.  Anything
else gets the base indentation."
  (cond
   ;; Already the first thing on its line: keep the column as is.
   ((and virtual
         (save-excursion (skip-chars-backward " \t") (bolp)))
    (current-column))
   ;; A label.
   ((looking-at "\\(\\w\\|\\s_\\)+:[^:]")
    (max 1 (+ (or default (perl-calculate-indent parse-start))
              perl-label-offset)))
   ;; A closer: use the indentation of the matching opener.  This
   ;; clause has no body, so a nil result falls through to the next
   ;; clauses.
   ((and (= (char-syntax (following-char)) ?\))
         (save-excursion
           (forward-char 1)
           (forward-sexp -1)
           (perl-indent-new-calculate
            ;; Recalculate the parsing-start, since we may have jumped
            ;; dangerously close (typically in the case of nested
            ;; functions).
            'virtual nil (save-excursion (perl-beginning-of-function))))))
   ;; An open brace with nothing after it on the line.
   ((and (= (following-char) ?{)
         (save-excursion (forward-char) (perl-hanging-paren-p)))
    (+ (or default (perl-calculate-indent parse-start))
       perl-brace-offset))
   (t
    (or default (perl-calculate-indent parse-start)))))
825
(defun perl-calculate-indent (&optional parse-start)
  "Return appropriate indentation for current line as Perl code.
In usual case returns an integer: the column to indent to.
Returns (parse-state) if line starts inside a string.
Optional argument PARSE-START should be the position of `beginning-of-defun'.
When PARSE-START is nil, the starting position is found with
`perl-beginning-of-function'.  Point is preserved."
  (save-excursion
    (let ((indent-point (point))
          (case-fold-search nil)
          (colon-line-end 0)
          state containing-sexp)
      (if parse-start                   ;used to avoid searching
          (goto-char parse-start)
        (perl-beginning-of-function))
      ;; We might be now looking at a local function that has nothing to
      ;; do with us because `indent-point' is past it.  In this case
      ;; look further back up for another `perl-beginning-of-function'.
      (while (and (looking-at "{")
                  (save-excursion
                    (beginning-of-line)
                    (looking-at "\\s-+sub\\>"))
                  ;; If the body of that sub is not closed yet,
                  ;; `forward-sexp' signals `scan-error'.  The sub is
                  ;; then still open at `indent-point', so it is the
                  ;; right place to start parsing from.
                  (let ((sub-end (condition-case nil
                                     (save-excursion (forward-sexp 1) (point))
                                   (scan-error nil))))
                    (and sub-end (> indent-point sub-end))))
        (perl-beginning-of-function))
      (while (< (point) indent-point)   ;repeat until right sexp
        (setq state (parse-partial-sexp (point) indent-point 0))
        ;; state = (depth_in_parens innermost_containing_list
        ;;          last_complete_sexp string_terminator_or_nil inside_commentp
        ;;          following_quotep minimum_paren-depth_this_scan)
        ;; Parsing stops if depth in parentheses becomes equal to third arg.
        (setq containing-sexp (nth 1 state)))
      (cond ((nth 3 state) state)       ; In a quoted string?
            ((null containing-sexp)     ; Line is at top level.
             (skip-chars-forward " \t\f")
             (if (= (following-char) ?{)
                 0  ; move to beginning of line if it starts a function body
               ;; indent a little if this is a continuation line
               (perl-backward-to-noncomment)
               (if (or (bobp)
                       (memq (preceding-char) '(?\; ?\})))
                   0 perl-continued-statement-offset)))
            ((/= (char-after containing-sexp) ?{)
             ;; line is expression, not statement:
             ;; indent to just after the surrounding open.
             (goto-char (1+ containing-sexp))
             (if (perl-hanging-paren-p)
                 ;; We're indenting an arg of a call like:
                 ;;    $a = foobarlongnamefun (
                 ;;             arg1
                 ;;             arg2
                 ;;         );
                 (progn
                   (skip-syntax-backward "(")
                   ;; Walk back sexp by sexp towards the start of the
                   ;; line; stop quietly if there is nothing to skip.
                   (condition-case nil
                       (while (save-excursion
                                (skip-syntax-backward " ") (not (bolp)))
                         (forward-sexp -1))
                     (scan-error nil))
                   (+ (current-column) perl-indent-level))
               (if perl-indent-continued-arguments
                   (+ perl-indent-continued-arguments (current-indentation))
                 (skip-chars-forward " \t")
                 (current-column))))
            (t
             ;; Statement level.  Is it a continuation or a new statement?
             (if (perl-continuation-line-p containing-sexp)
                 ;; This line is continuation of preceding line's statement;
                 ;; indent  perl-continued-statement-offset  more than the
                 ;; previous line of the statement.
                 (progn
                   (perl-backward-to-start-of-continued-exp containing-sexp)
                   (+ (if (save-excursion
                            (perl-continuation-line-p containing-sexp))
                          ;; If the continued line is itself a continuation
                          ;; line, then align, otherwise add an offset.
                          0 perl-continued-statement-offset)
                      (current-column)
                      (if (save-excursion (goto-char indent-point)
                                          (looking-at "[ \t]*{"))
                          perl-continued-brace-offset 0)))
               ;; This line starts a new statement.
               ;; Position at last unclosed open.
               (goto-char containing-sexp)
               (or
                ;; Is line first statement after an open-brace?
                ;; If no, find that first statement and indent like it.
                (save-excursion
                  (forward-char 1)
                  ;; Skip over comments and labels following openbrace.
                  (while (progn
                           (skip-chars-forward " \t\f\n")
                           (cond ((looking-at ";?#")
                                  (forward-line 1) t)
                                 ((looking-at "\\(\\w\\|\\s_\\)+:[^:]")
                                  (save-excursion
                                    (end-of-line)
                                    (setq colon-line-end (point)))
                                  (search-forward ":")))))
                  ;; The first following code counts
                  ;; if it is before the line we want to indent.
                  (and (< (point) indent-point)
                       (if (> colon-line-end (point))
                           (- (current-indentation) perl-label-offset)
                         (current-column))))
                ;; If no previous statement,
                ;; indent it relative to line brace is on.
                ;; For open paren in column zero, don't let statement
                ;; start there too.  If perl-indent-level is zero,
                ;; use perl-brace-offset + perl-continued-statement-offset
                ;; For open-braces not the first thing in a line,
                ;; add in perl-brace-imaginary-offset.
                ;; NOTE: the three summands below move point and must be
                ;; evaluated in this order.
                (+ (if (and (bolp) (zerop perl-indent-level))
                       (+ perl-brace-offset perl-continued-statement-offset)
                     perl-indent-level)
                   ;; Move back over whitespace before the openbrace.
                   ;; If openbrace is not first nonwhite thing on the line,
                   ;; add the perl-brace-imaginary-offset.
                   (progn (skip-chars-backward " \t")
                          (if (bolp) 0 perl-brace-imaginary-offset))
                   ;; If the openbrace is preceded by a parenthesized exp,
                   ;; move to the beginning of that;
                   ;; possibly a different line
                   (progn
                     (if (eq (preceding-char) ?\))
                         (forward-sexp -1))
                     ;; Get initial indentation of the line we are on.
                     (current-indentation))))))))))
951
(defun perl-backward-to-noncomment ()
  "Move point backward over whitespace and comments.
Point is left just after the nearest preceding character that is
neither whitespace nor part of a comment."
  (interactive)
  ;; A count as large as the end position of the buffer cannot run out
  ;; before the text does.
  (let ((max-count (point-max)))
    (forward-comment (- max-count))))
956
(defun perl-backward-to-start-of-continued-exp (lim)
  "Move point to the first nonblank of the expression's first line.
If point is right after a `)', first move back over the parenthesized
group.  Then go to the beginning of that line, but never further back
than just after position LIM, and finally skip forward over blanks
and form feeds."
  (when (= (preceding-char) ?\))
    (backward-sexp 1))
  (beginning-of-line)
  (unless (> (point) lim)
    (goto-char (1+ lim)))
  (skip-chars-forward " \t\f"))
964 \f
965 ;; note: this may be slower than the c-mode version, but I can understand it.
(defalias 'indent-perl-exp 'perl-indent-exp)
(defun perl-indent-exp ()
  "Indent each line of the Perl grouping following point.
Every line from the current one up to the end of that grouping is
reindented with `perl-indent-line', and comments at the end of those
lines are realigned with `indent-for-comment' where appropriate.
Nothing is changed when point is inside a format statement.
Point is restored afterwards."
  (interactive)
  (let* ((case-fold-search nil)
         (oldpnt (point-marker))
         (bof-mark (save-excursion
                     (end-of-line 2)
                     (perl-beginning-of-function)
                     (point-marker)))
         ;; Start of the last line that did not begin inside a string.
         ;; It starts out at the function start; a single marker is
         ;; reused rather than making a fresh one for every line.
         (lsexp-mark (copy-marker bof-mark))
         eol last-mark delta)
    (unwind-protect
        ;; `eq' rather than `=': `char-after' is nil at the end of the
        ;; buffer (e.g. in an empty buffer), and `=' would signal.
        (if (eq (char-after (marker-position bof-mark)) ?=)
            (message "Can't indent a format statement")
          (message "Indenting Perl expression...")
          (save-excursion (end-of-line) (setq eol (point)))
          (save-excursion               ; locate matching close paren
            (while (and (not (eobp)) (<= (point) eol))
              (parse-partial-sexp (point) (point-max) 0))
            (setq last-mark (point-marker)))
          (beginning-of-line)
          (while (< (point) (marker-position last-mark))
            (setq delta (perl-indent-line nil (marker-position bof-mark)))
            (if (numberp delta)         ; unquoted start-of-line?
                (progn
                  (if (eolp)
                      (delete-horizontal-space))
                  (set-marker lsexp-mark (point))))
            (end-of-line)
            (setq eol (point))
            (if (nth 4 (parse-partial-sexp (marker-position lsexp-mark) eol))
                (progn                  ; line ends in a comment
                  (beginning-of-line)
                  ;; Leave a comment-only line alone unless its old
                  ;; indentation was exactly `comment-column'.
                  (if (or (not (looking-at "\\s-*;?#"))
                          (listp delta)
                          (and (/= 0 delta)
                               (= (- (current-indentation) delta)
                                  comment-column)))
                      (if (and comment-start-skip
                               (re-search-forward comment-start-skip eol t))
                          (indent-for-comment))))) ; indent existing comment
            (forward-line 1))
          (goto-char (marker-position oldpnt))
          (message "Indenting Perl expression...done"))
      ;; Detach the markers so they no longer have to be relocated on
      ;; every later change to the buffer.
      (set-marker oldpnt nil)
      (set-marker bof-mark nil)
      (set-marker lsexp-mark nil)
      (if last-mark (set-marker last-mark nil)))))
1009 \f
(defun perl-beginning-of-function (&optional arg)
  "Move backward to next beginning-of-function, or as far as possible.
With argument, repeat that many times; negative args move forward.
Returns new value of point in all cases.
A function beginning is a line starting with an open-paren-like
character, a `sub' definition (point is left on its `{'), a `format'
statement (point is left on its `='), or a line starting with a `.'.
ARG defaults to 1; when it is 0, point does not move."
  (interactive "p")
  (or arg (setq arg 1))
  ;; When moving forward, step one character ahead first -- unless we
  ;; are already at the end of the buffer, where `forward-char' would
  ;; signal instead of letting us return point.
  (if (and (< arg 0) (not (eobp))) (forward-char 1))
  (and (/= arg 0)
       (re-search-backward
        "^\\s(\\|^\\s-*sub\\b[ \t\n]*\\_<[^{]+{\\|^\\s-*format\\b[^=]*=\\|^\\."
        nil 'move arg)
       ;; Leave point on the last character of the match.
       (goto-char (1- (match-end 0))))
  (point))
1023
1024 ;; note: this routine is adapted directly from emacs lisp.el, end-of-defun;
1025 ;; no bugs have been removed :-)
(defun perl-end-of-function (&optional arg)
  "Move point forward to the end of the next function.
A function's end is located by finding its beginning and then moving
forward over its body.
ARG is a repeat count and defaults to 1; a negative ARG moves
backward instead."
  (interactive "p")
  (unless arg (setq arg 1))
  (let ((initial t))
    ;; Forward motion: one function end per outer iteration.
    (while (and (> arg 0) (not (eobp)))
      (let ((start (point)))
        (while (progn
                 ;; On the very first attempt, try the function point
                 ;; is in; if that leads to the beginning of the buffer,
                 ;; or on any later attempt, look for the next function
                 ;; start ahead instead.
                 (unless (and initial
                              (progn
                                (forward-char 1)
                                (perl-beginning-of-function 1)
                                (not (bobp))))
                   (or (bobp) (forward-char -1))
                   (perl-beginning-of-function -1))
                 (setq initial nil)
                 (forward-list 1)
                 (skip-chars-forward " \t")
                 (when (looking-at "[#\n]")
                   (forward-line 1))
                 ;; Try again as long as we have not got past START.
                 (<= (point) start))))
      (setq arg (1- arg)))
    ;; Backward motion.
    (while (< arg 0)
      (let ((start (point)))
        (perl-beginning-of-function 1)
        (forward-sexp 1)
        (forward-line 1)
        ;; That end is not before START, so use the function before it.
        (when (>= (point) start)
          (perl-beginning-of-function 2)
          (if (bobp)
              (goto-char (point-min))
            (forward-list 1)
            (skip-chars-forward " \t")
            (when (looking-at "[#\n]")
              (forward-line 1)))))
      (setq arg (1+ arg)))))
1065
(defalias 'mark-perl-function 'perl-mark-function)
(defun perl-mark-function ()
  "Mark the Perl function around point.
The mark is put at the end of the function and point at its
beginning; the original position is pushed on the mark ring first."
  (interactive)
  ;; `push-mark' without an argument uses the position of point.
  (push-mark)
  (perl-end-of-function)
  (push-mark)
  (perl-beginning-of-function)
  (backward-paragraph))
1075
1076 (provide 'perl-mode)
1077
1078 ;; arch-tag: 8c7ff68d-15f3-46a2-ade2-b7c41f176826
1079 ;;; perl-mode.el ends here