1 ;;; align.el --- align text to a specific column, by regexp -*- lexical-binding:t -*-
3 ;; Copyright (C) 1999-2015 Free Software Foundation, Inc.
5 ;; Author: John Wiegley <johnw@gnu.org>
6 ;; Maintainer: emacs-devel@gnu.org
7 ;; Keywords: convenience languages lisp
9 ;; This file is part of GNU Emacs.
11 ;; GNU Emacs is free software: you can redistribute it and/or modify
12 ;; it under the terms of the GNU General Public License as published by
13 ;; the Free Software Foundation, either version 3 of the License, or
14 ;; (at your option) any later version.
16 ;; GNU Emacs is distributed in the hope that it will be useful,
17 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
18 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
19 ;; GNU General Public License for more details.
21 ;; You should have received a copy of the GNU General Public License
22 ;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>.
26 ;; This mode allows you to align regions in a context-sensitive fashion.
27 ;; The classic use is to align assignments:
41 ;; There are several variables which define how certain "categories"
42 ;; of syntax are to be treated. These variables go by the name
43 ;; `align-CATEGORY-modes'. For example, "c++" is such a category.
44 ;; There are several rules which apply to c++, but since several other
45 ;; languages have a syntax similar to c++ (e.g., c, java, etc), these
46 ;; modes are treated as belonging to the same category.
48 ;; If you want to add a new mode under a certain category, just
49 ;; customize that list, or add the new mode manually. For example, to
50 ;; make jde-mode a c++ category mode, use this code in your .emacs
53 ;; (setq align-c++-modes (cons 'jde-mode align-c++-modes))
55 ;; In some programming modes, it's useful to have the aligner run only
56 ;; after indentation is performed. To achieve this, customize or set
57 ;; the variable `align-indent-before-aligning' to t.
61 ;; In order to incorporate align's functionality into your own
62 ;; modules, there are only a few steps you have to follow.
64 ;; 1. Require or load in the align.el library.
66 ;; 2. Define your alignment and exclusion rules lists, either
67 ;; customizable or not.
69 ;; 3. In your mode function, set the variables
70 ;; `align-mode-rules-list' and `align-mode-exclude-rules-list'
71 ;; to your own rules lists.
73 ;; If there is any need to add your mode name to one of the
74 ;; align-?-modes variables (for example, `align-dq-string-modes'), use
75 ;; `add-to-list', or some similar function which checks first to see
76 ;; if the value is already there. Since the user may customize that
77 ;; mode list, and then write your mode name into their init file,
78 ;; causing the symbol already to be present the next time they load
85 ;; (defcustom my-align-rules-list
87 ;; (regexp . "Sample")))
88 ;; :type align-rules-list-type
89 ;; :group 'my-package)
91 ;; (put 'my-align-rules-list 'risky-local-variable t)
93 ;; (add-to-list 'align-dq-string-modes 'my-package-mode)
94 ;; (add-to-list 'align-open-comment-modes 'my-package-mode)
98 ;; (setq align-mode-rules-list my-align-rules-list))
100 ;; Note that if you need to install your own exclusion rules, then you
101 ;; will also need to reproduce any double-quoted string, or open
102 ;; comment exclusion rules that are defined in the standard
103 ;; `align-exclude-rules-list'. At the moment there is no convenient
104 ;; way to mix both mode-local and global rules lists.
108 ;; Version 1.0 was created in the earlier part of 1996, using a very
109 ;; simple algorithm that understand only basic regular expressions.
110 ;; Parts of the code were broken up and included in vhdl-mode.el
111 ;; around this time. After several comments from users, and a need to
112 ;; find a more robust, higher performing algorithm, 2.0 was born in late
113 ;; 1998. Many different approaches were taken (mostly due to the
114 ;; complexity of TeX tables), but finally a scheme was discovered
115 ;; which worked fairly well for most common usage cases. Development
116 ;; beyond version 2.8 is not planned, except for problems that users
122 "Align text to a specific column, by regexp."
128 (defcustom align-load-hook nil
129 "Hook that gets run after the aligner has been loaded."
133 (defcustom align-indent-before-aligning nil
134 "If non-nil, indent the marked region before aligning it."
138 (defcustom align-default-spacing
1
139 "An integer that represents the default amount of padding to use.
140 If `align-to-tab-stop' is non-nil, this will represent the number of
141 tab stops to use for alignment, rather than the number of spaces.
142 Each alignment rule can optionally override both this variable and
143 `align-to-tab-stop'. See `align-rules-list'."
147 (defcustom align-to-tab-stop
'indent-tabs-mode
148 "If non-nil, alignments will always fall on a tab boundary.
149 It may also be a symbol, whose value will be taken."
150 :type
'(choice (const nil
) symbol
)
153 (defcustom align-region-heuristic
500
154 "If non-nil, used as a heuristic by `align-current'.
155 Since each alignment rule can possibly have its own set of alignment
156 sections (whenever `align-region-separate' is non-nil, and not a
157 string), this heuristic is used to determine how far before and after
158 point we should search in looking for a region separator. Larger
159 values can mean slower performance in large files, although smaller
160 values may cause unexpected behavior at times."
164 (defcustom align-highlight-change-face
'highlight
165 "The face to highlight with if changes are necessary."
169 (defcustom align-highlight-nochange-face
'secondary-selection
170 "The face to highlight with if no changes are necessary."
174 (defcustom align-large-region
10000
175 "If an integer, defines what constitutes a \"large\" region.
176 If nil, then no messages will ever be printed to the minibuffer."
180 (defcustom align-c
++-modes
'(c++-mode c-mode java-mode
)
181 "A list of modes whose syntax resembles C/C++."
182 :type
'(repeat symbol
)
185 (defcustom align-perl-modes
'(perl-mode cperl-mode
)
186 "A list of modes where Perl syntax is to be seen."
187 :type
'(repeat symbol
)
190 (defcustom align-lisp-modes
191 '(emacs-lisp-mode lisp-interaction-mode lisp-mode scheme-mode
)
192 "A list of modes whose syntax resembles Lisp."
193 :type
'(repeat symbol
)
196 (defcustom align-tex-modes
197 '(tex-mode plain-tex-mode latex-mode slitex-mode
)
198 "A list of modes whose syntax resembles TeX (and family)."
199 :type
'(repeat symbol
)
202 (defcustom align-text-modes
'(text-mode outline-mode
)
203 "A list of modes whose content is plain text."
204 :type
'(repeat symbol
)
207 (defcustom align-dq-string-modes
208 (append align-lisp-modes align-c
++-modes align-perl-modes
210 "A list of modes where double quoted strings should be excluded."
211 :type
'(repeat symbol
)
214 (defcustom align-sq-string-modes
215 (append align-perl-modes
'(python-mode))
216 "A list of modes where single quoted strings should be excluded."
217 :type
'(repeat symbol
)
220 (defcustom align-open-comment-modes
221 (append align-lisp-modes align-c
++-modes align-perl-modes
222 '(python-mode makefile-mode
))
223 "A list of modes with a single-line comment syntax.
224 These are comments as in Lisp, which have a beginning, but end with
225 the line (i.e., `comment-end' is an empty string)."
226 :type
'(repeat symbol
)
229 (defcustom align-region-separate
"^\\s-*[{}]?\\s-*$"
230 "Select the method by which alignment sections will be separated.
231 If this is a symbol, that symbol's value will be used.
233 For the sake of clarification, consider the following example, which
234 will be referred to in the descriptions below.
236 int alpha = 1; /* one */
238 long gamma; /* ten */
240 unsigned int delta = 1; /* one */
241 long double epsilon = 3.0;
242 long long omega; /* ten */
244 The possible settings for `align-region-separate' are:
246 `entire' The entire region being aligned will be considered as a
247 single alignment section. Assuming that comments were not
248 being aligned to a particular column, the example would
251 int alpha = 1; /* one */
253 long gamma; /* ten */
255 unsigned int delta = 1; /* one */
257 long long chi = 10; /* ten */
259 `group' Each contiguous set of lines where a specific alignment
260 occurs is considered a section for that alignment rule.
261 Note that each rule may have any entirely different set
262 of section divisions than another.
264 int alpha = 1; /* one */
266 long gamma; /* ten */
268 unsigned int delta = 1; /* one */
270 long long chi = 10; /* ten */
272 `largest' When contiguous rule sets overlap, the largest section
273 described will be taken as the alignment section for each
274 rule touched by that section.
276 int alpha = 1; /* one */
278 long gamma; /* ten */
280 unsigned int delta = 1; /* one */
282 long long chi = 10; /* ten */
284 NOTE: This option is not supported yet, due to algorithmic
285 issues which haven't been satisfactorily resolved. There
286 are ways to do it, but they're both ugly and resource
289 regexp A regular expression string which defines the section
290 divider. If the mode you're in has a consistent divider
291 between sections, the behavior will be very similar to
292 `largest', and faster. But if the mode does not use clear
293 separators (for example, if you collapse your braces onto
294 the preceding statement in C or Perl), `largest' is
295 probably the better alternative.
297 function A function that will be passed the beginning and ending
298 locations of the region in which to look for the section
299 separator. At the very beginning of the attempt to align,
300 both of these parameters will be nil, in which case the
301 function should return non-nil if it wants each rule to
302 define its own section, or nil if it wants the largest
303 section found to be used as the common section for all
304 rules that occur there.
306 list A list of markers within the buffer that represent where
307 the section dividers lie. Be certain to use markers! For
308 when the aligning begins, the ensuing contract/expanding of
309 whitespace will throw off any non-marker positions.
311 This method is intended for use in Lisp programs, and not
314 (const :tag
"Entire region is one section" entire
)
315 (const :tag
"Align by contiguous groups" group
)
317 (regexp :tag
"Regexp defines section boundaries")
318 (function :tag
"Function defines section boundaries"))
321 (put 'align-region-separate
'risky-local-variable t
)
323 (defvar align-rules-list-type
326 :tag
"Alignment rule"
327 (symbol :tag
"Title")
328 (cons :tag
"Required attributes"
330 (const :tag
"(Regular expression to match)" regexp
)
331 (choice :value
"\\(\\s-+\\)" regexp function
))
333 :tag
"Optional attributes"
336 (const :tag
"(Repeat this rule throughout line)"
339 (cons :tag
"Paren group"
340 (const :tag
"(Parenthesis group to use)" group
)
342 integer
(repeat integer
)))
344 (const :tag
"(Modes where this rule applies)" modes
)
345 (sexp :value
(text-mode)))
346 (cons :tag
"Case-fold"
347 (const :tag
"(Should case be ignored for this rule)"
350 (cons :tag
"To Tab Stop"
351 (const :tag
"(Should rule align to tab stops)"
353 (boolean :value nil
))
355 (const :tag
"(Return non-nil if rule is valid)"
359 (const :tag
"(Return non-nil if rule should run)"
363 (const :tag
"(Column to fix alignment at)" column
)
364 (choice :value comment-column
367 (const :tag
"(Amount of spacing to use)" spacing
)
370 (const :tag
"(Should text be right justified)"
373 ;; make sure this stays up-to-date with any changes
374 ;; in `align-region-separate'
375 (cons :tag
"Separate"
376 (const :tag
"(Separation to use for this rule)"
378 (choice :value
"^\\s-*$"
382 regexp function
)))))))
383 "The `type' form for any `align-rules-list' variable.")
385 (defcustom align-rules-list
387 (regexp .
"\\(^\\s-+[^( \t\n]\\|(\\(\\S-+\\)\\s-+\\)\\S-+\\(\\s-+\\)")
389 (modes . align-lisp-modes
)
390 (run-if .
,(function (lambda () current-prefix-arg
))))
393 (regexp .
"\\(\\s-*\\)\\.\\(\\s-*\\)")
395 (modes . align-lisp-modes
))
399 (lambda (end reverse
)
400 (funcall (if reverse
're-search-backward
402 (concat "[^ \t\n\\\\]"
403 (regexp-quote comment-start
)
404 "\\(.+\\)$") end t
))))
405 (modes . align-open-comment-modes
))
408 (regexp .
"^\\s-*#\\s-*define\\s-+\\S-+\\(\\s-+\\)")
409 (modes . align-c
++-modes
))
411 (c-variable-declaration
412 (regexp .
,(concat "[*&0-9A-Za-z_]>?[&*]*\\(\\s-+[*&]*\\)"
413 "[A-Za-z_][0-9A-Za-z:_]*\\s-*\\(\\()\\|"
414 "=[^=\n].*\\|(.*)\\|\\(\\[.*\\]\\)*\\)?"
415 "\\s-*[;,]\\|)\\s-*$\\)"))
417 (modes . align-c
++-modes
)
422 (not (or (save-excursion
423 (goto-char (match-beginning 1))
426 "\\(goto\\|return\\|new\\|delete\\|throw\\)"))
427 (if (and (boundp 'font-lock-mode
) font-lock-mode
)
428 (eq (get-text-property (point) 'face
)
429 'font-lock-comment-face
)
430 (eq (caar (c-guess-basic-syntax)) 'c
))))))))
433 (regexp .
,(concat "[^-=!^&*+<>/| \t\n]\\(\\s-*[-=!^&*+<>/|]*\\)"
434 "=\\(\\s-*\\)\\([^= \t\n]\\|$\\)"))
436 (modes . align-c
++-modes
)
441 (regexp .
,(concat "[^=!^&*-+<>/| \t\n]\\(\\s-*\\)=[~>]?"
442 "\\(\\s-*\\)\\([^>= \t\n]\\|$\\)"))
444 (modes . align-perl-modes
)
448 (regexp .
,(concat "[^=!<> \t\n]\\(\\s-*\\)="
449 "\\(\\s-*\\)\\([^>= \t\n]\\|$\\)"))
451 (modes .
'(python-mode))
455 (regexp .
"^\\s-*\\w+\\(\\s-*\\):?=\\(\\s-*\\)\\([^\t\n \\\\]\\|$\\)")
457 (modes .
'(makefile-mode))
461 (regexp .
",\\(\\s-*\\)[^/ \t\n]")
463 (modes . align-c
++-modes
)
464 (run-if .
,(function (lambda () current-prefix-arg
))))
468 ; (memq (caar (c-guess-basic-syntax))
471 ; brace-entry-open))))))
473 ;; With a prefix argument, comma delimiter will be aligned. Since
474 ;; perl-mode doesn't give us enough syntactic information (and we
475 ;; don't do our own parsing yet), this rule is too destructive to
477 (basic-comma-delimiter
478 (regexp .
",\\(\\s-*\\)[^# \t\n]")
480 (modes .
(append align-perl-modes
'(python-mode)))
481 (run-if .
,(function (lambda () current-prefix-arg
))))
484 (regexp .
"\\(\\s-*\\)\\(//.*\\|/\\*.*\\*/\\s-*\\)$")
485 (modes . align-c
++-modes
)
486 (column . comment-column
)
490 (goto-char (match-beginning 1))
494 (regexp .
"\\(\\s-*\\)\\(&&\\|||\\|\\<and\\>\\|\\<or\\>\\)")
495 (modes . align-c
++-modes
)
499 (goto-char (match-end 2))
500 (looking-at "\\s-*\\(/[*/]\\|$\\)"))))))
503 (regexp .
"\\(\\s-*\\)\\(&&\\|||\\|\\<and\\>\\|\\<or\\>\\)")
504 (modes . align-perl-modes
)
508 (goto-char (match-end 2))
509 (looking-at "\\s-*\\(#\\|$\\)"))))))
512 (regexp .
"\\(\\s-*\\)\\(\\<and\\>\\|\\<or\\>\\)")
513 (modes .
'(python-mode))
517 (goto-char (match-end 2))
518 (looking-at "\\s-*\\(#\\|$\\|\\\\\\)"))))))
520 (c-macro-line-continuation
521 (regexp .
"\\(\\s-*\\)\\\\$")
522 (modes . align-c
++-modes
)
523 (column . c-backslash-column
))
527 ; (memq (caar (c-guess-basic-syntax))
528 ; '(cpp-macro cpp-macro-cont))))))
530 (basic-line-continuation
531 (regexp .
"\\(\\s-*\\)\\\\$")
532 (modes .
'(python-mode makefile-mode
)))
534 (tex-record-separator
536 (lambda (end reverse
)
537 (align-match-tex-pattern "&" end reverse
))))
539 (modes . align-tex-modes
)
542 (tex-tabbing-separator
544 (lambda (end reverse
)
545 (align-match-tex-pattern "\\\\[=>]" end reverse
))))
547 (modes . align-tex-modes
)
551 (eq major-mode
'latex-mode
)))))
554 (regexp .
"\\(\\s-*\\)\\\\\\\\")
555 (modes . align-tex-modes
))
557 ;; With a numeric prefix argument, or C-u, space delimited text
558 ;; tables will be aligned.
560 (regexp .
"\\(^\\|\\S-\\)\\([ \t]+\\)\\(\\S-\\|$\\)")
562 (modes . align-text-modes
)
566 (and current-prefix-arg
567 (not (eq '- current-prefix-arg
)))))))
569 ;; With a negative prefix argument, lists of dollar figures will
572 (regexp .
"\\$?\\(\\s-+[0-9]+\\)\\.")
573 (modes . align-text-modes
)
577 (eq '- current-prefix-arg
)))))
580 (regexp .
"^\\s-*\\w+:\\(\\s-*\\).*;")
582 (modes .
'(css-mode html-mode
))))
583 "A list describing all of the available alignment rules.
587 (ATTRIBUTE . VALUE) ...)
590 The following attributes are meaningful:
592 `regexp' This required attribute must be either a string describing
593 a regular expression, or a function (described below).
594 For every line within the section that this regular
595 expression matches, the given rule will be applied to that
596 line. The exclusion rules denote which part(s) of the
597 line should not be modified; the alignment rules cause the
598 identified whitespace group to be contracted/expanded such
599 that the \"alignment character\" (the character
600 immediately following the identified parenthesis group),
601 occurs in the same column for every line within the
602 alignment section (see `align-region-separate' for a
603 description of how the region is broken up into alignment
606 The `regexp' attribute describes how the text should be
607 treated. Within this regexp, there must be at least one
608 group of characters (typically whitespace) identified by
609 the special opening and closing parens used in regexp
610 expressions (`\\\\(' and `\\\\)') (see the Emacs manual on
611 the syntax of regular expressions for more info).
613 If `regexp' is a function, it will be called as a
614 replacement for `re-search-forward'. This means that it
615 should return nil if nothing is found to match the rule,
616 or it should set the match data appropriately, move point
617 to the end of the match, and return the value of point.
619 `group' For exclusion rules, the group identifies the range of
620 characters that should be ignored. For alignment rules,
621 these are the characters that will be deleted/expanded for
622 the purposes of alignment. The \"alignment character\" is
623 always the first character immediately following this
624 parenthesis group. This attribute may also be a list of
625 integers, in which case multiple alignment characters will
626 be aligned, with the list of integers identifying the
627 whitespace groups which precede them. The default for
630 `modes' The `modes' attribute, if set, should name a list of
631 major modes -- or evaluate to such a value -- in which the
632 rule is valid. If not set, the rule will apply to all
635 `case-fold' If `regexp' is an ordinary regular expression string
636 containing alphabetic character, sometimes you may want
637 the search to proceed case-insensitively (for languages
638 that ignore case, such as Pascal for example). In that
639 case, set `case-fold' to a non-nil value, and the regular
640 expression search will ignore case. If `regexp' is set to
641 a function, that function must handle the job of ignoring
644 `tab-stop' If the `tab-stop' attribute is set, and non-nil, the
645 alignment character will always fall on a tab stop
646 (whether it uses tabs to get there or not depends on the
647 value of `indent-tabs-mode'). If the `tab-stop' attribute
648 is set to nil, tab stops will never be used. Otherwise,
649 the value of `align-to-tab-stop' determines whether or not
650 to align to a tab stop. The `tab-stop' attribute may also
651 be a list of t or nil values, corresponding to the number
652 of parenthesis groups specified by the `group' attribute.
654 `repeat' If the `repeat' attribute is present, and non-nil, the
655 rule will be applied to the line continuously until no
656 further matches are found.
658 `valid' If the `valid' attribute is set, it will be used to
659 determine whether the rule should be invoked. This form
660 is evaluated after the regular expression match has been
661 performed, so that it is possible to use the results of
662 that match to determine whether the alignment should be
663 performed. The buffer should not be modified during the
664 evaluation of this form.
666 `run-if' Like `valid', the `run-if' attribute tests whether the
667 rule should be run at all -- even before any searches are
668 done to determine if the rule applies to the alignment
669 region. This can save time, since `run-if' will only be
670 run once for each rule. If it returns nil, the rule will
673 `column' For alignment rules, if the `column' attribute is set --
674 which must be an integer, or a symbol whose value is an
675 integer -- it will be used as the column in which to align
676 the alignment character. If the text on a particular line
677 happens to overrun that column, a single space character,
678 or tab stop (see `align-to-tab-stop') will be added
679 between the last text character and the alignment
682 `spacing' Alignment rules may also override the amount of spacing
683 that would normally be used by providing a `spacing'
684 attribute. This must be an integer, or a list of integers
685 corresponding to the number of parenthesis groups matched
686 by the `group' attribute. If a list of value is used, and
687 any of those values is nil, `align-default-spacing' will
688 be used for that subgroup. See `align-default-spacing'
689 for more details on spacing, tab stops, and how to
690 indicate how much spacing should be used. If TAB-STOP is
691 present, it will override the value of `align-to-tab-stop'
694 `justify' It is possible with `regexp' and `group' to identify a
695 character group that contains more than just whitespace
696 characters. By default, any non-whitespace characters in
697 that group will also be deleted while aligning the
698 alignment character. However, if the `justify' attribute
699 is set to a non-nil value, only the initial whitespace
700 characters within that group will be deleted. This has
701 the effect of right-justifying the characters that remain,
702 and can be used for outdenting or just plain old right-
705 `separate' Each rule can define its own section separator, which
706 describes how to identify the separation of \"sections\"
707 within the region to be aligned. Setting the `separate'
708 attribute overrides the value of `align-region-separate'
709 (see the documentation of that variable for possible
710 values), and any separation argument passed to `align'."
711 :type align-rules-list-type
714 (put 'align-rules-list
'risky-local-variable t
)
716 (defvar align-exclude-rules-list-type
719 :tag
"Exclusion rule"
720 (symbol :tag
"Title")
721 (cons :tag
"Required attributes"
723 (const :tag
"(Regular expression to match)" regexp
)
724 (choice :value
"\\(\\s-+\\)" regexp function
))
726 :tag
"Optional attributes"
729 (const :tag
"(Repeat this rule throughout line)"
732 (cons :tag
"Paren group"
733 (const :tag
"(Parenthesis group to use)" group
)
735 integer
(repeat integer
)))
737 (const :tag
"(Modes where this rule applies)" modes
)
738 (sexp :value
(text-mode)))
739 (cons :tag
"Case-fold"
740 (const :tag
"(Should case be ignored for this rule)"
742 (boolean :value t
)))))))
743 "The `type' form for any `align-exclude-rules-list' variable.")
745 (defcustom align-exclude-rules-list
747 (regexp .
"\"\\([^\"\n]+\\)\"")
749 (modes . align-dq-string-modes
))
752 (regexp .
"'\\([^'\n]+\\)'")
754 (modes . align-sq-string-modes
))
759 (lambda (end reverse
)
760 (funcall (if reverse
're-search-backward
762 (concat "[^ \t\n\\\\]"
763 (regexp-quote comment-start
)
764 "\\(.+\\)$") end t
))))
765 (modes . align-open-comment-modes
))
768 (regexp .
"/\\*\\(.+\\)\\*/")
770 (modes . align-c
++-modes
))
773 (regexp .
"(\\([^)\n]+\\))")
775 (modes . align-c
++-modes
))
778 (regexp .
"^\\s-*#\\s-*\\(if\\w*\\|endif\\)\\(.*\\)$")
780 (modes . align-c
++-modes
)))
781 "A list describing text that should be excluded from alignment.
782 See the documentation for `align-rules-list' for more info."
783 :type align-exclude-rules-list-type
786 (put 'align-exclude-rules-list
'risky-local-variable t
)
788 ;;; Internal Variables:
790 (defvar align-mode-rules-list nil
791 "Alignment rules specific to the current major mode.
792 See the variable `align-rules-list' for more details.")
794 (make-variable-buffer-local 'align-mode-rules-list
)
796 (defvar align-mode-exclude-rules-list nil
797 "Alignment exclusion rules specific to the current major mode.
798 See the variable `align-exclude-rules-list' for more details.")
800 (make-variable-buffer-local 'align-mode-exclude-rules-list
)
802 (defvar align-highlight-overlays nil
803 "The current overlays highlighting the text matched by a rule.")
805 ;; Sample extension rule set, for vhdl-mode. This should properly be
806 ;; in vhdl-mode.el itself.
808 (defcustom align-vhdl-rules-list
810 (regexp .
"\\(signal\\|variable\\|constant\\)\\(\\s-+\\)\\S-")
814 (regexp .
"\\(others\\|[^ \t\n=<]\\)\\(\\s-*\\)=>\\(\\s-*\\)\\S-")
819 (not (string= (downcase (match-string 1))
823 (regexp .
"[^ \t\n:]\\(\\s-*\\):\\(\\s-*\\)[^=\n]")
827 (regexp .
":\\s-*\\(in\\|out\\|inout\\|buffer\\)\\(\\s-*\\)")
831 (regexp .
"[^ \t\n=<]\\(\\s-*\\)<=\\(\\s-*\\)\\S-")
835 (regexp .
"[^ \t\n:]\\(\\s-*\\):="))
838 (regexp .
"\\(\\s-+\\)use\\s-+entity")))
839 "Alignment rules for `vhdl-mode'. See `align-rules-list' for more info."
840 :type align-rules-list-type
843 (put 'align-vhdl-rules-list
'risky-local-variable t
)
845 (defun align-set-vhdl-rules ()
846 "Setup the `align-mode-rules-list' variable for `vhdl-mode'."
847 (setq align-mode-rules-list align-vhdl-rules-list
))
849 (add-hook 'vhdl-mode-hook
'align-set-vhdl-rules
)
851 (add-to-list 'align-dq-string-modes
'vhdl-mode
)
852 (add-to-list 'align-open-comment-modes
'vhdl-mode
)
857 (defun align (beg end
&optional separate rules exclude-rules
)
858 "Attempt to align a region based on a set of alignment rules.
859 BEG and END mark the region. If BEG and END are specifically set to
860 nil (this can only be done programmatically), the beginning and end of
861 the current alignment section will be calculated based on the location
862 of point, and the value of `align-region-separate' (or possibly each
863 rule's `separate' attribute).
865 If SEPARATE is non-nil, it overrides the value of
866 `align-region-separate' for all rules, except those that have their
867 `separate' attribute set.
869 RULES and EXCLUDE-RULES, if either is non-nil, will replace the
870 default rule lists defined in `align-rules-list' and
871 `align-exclude-rules-list'. See `align-rules-list' for more details
872 on the format of these lists."
876 (if (and (symbolp align-region-separate
)
877 (boundp align-region-separate
))
878 (symbol-value align-region-separate
)
879 align-region-separate
)
881 (if (not (or ;(eq separator 'largest)
882 (and (functionp separator
)
883 (not (funcall separator nil nil
)))))
884 (align-region beg end separator
885 (or rules align-mode-rules-list align-rules-list
)
886 (or exclude-rules align-mode-exclude-rules-list
887 align-exclude-rules-list
))
888 (let ((sec-first end
)
890 (align-region beg end
892 align-mode-exclude-rules-list
893 align-exclude-rules-list
) nil
897 (when (and mode
(listp mode
))
898 (setq sec-first
(min sec-first b
)
899 sec-last
(max sec-last e
))))))
900 (if (< sec-first sec-last
)
901 (align-region sec-first sec-last
'entire
902 (or rules align-mode-rules-list align-rules-list
)
903 (or exclude-rules align-mode-exclude-rules-list
904 align-exclude-rules-list
)))))))
907 (defun align-regexp (beg end regexp
&optional group spacing repeat
)
908 "Align the current region using an ad-hoc rule read from the minibuffer.
909 BEG and END mark the limits of the region. Interactively, this function
910 prompts for the regular expression REGEXP to align with.
912 For example, let's say you had a list of phone numbers, and wanted to
913 align them so that the opening parentheses would line up:
917 Mary-Anne (123) 456-7890
920 There is no predefined rule to handle this, but you could easily do it
921 using a REGEXP like \"(\". Interactively, all you would have to do is
922 to mark the region, call `align-regexp' and enter that regular expression.
924 REGEXP must contain at least one parenthesized subexpression, typically
925 whitespace of the form \"\\\\(\\\\s-*\\\\)\". In normal interactive use,
926 this is automatically added to the start of your regular expression after
927 you enter it. You only need to supply the characters to be lined up, and
928 any preceding whitespace is replaced.
930 If you specify a prefix argument (or use this function non-interactively),
931 you must enter the full regular expression, including the subexpression.
932 The function also then prompts for which subexpression parenthesis GROUP
933 \(default 1) within REGEXP to modify, the amount of SPACING (default
934 `align-default-spacing') to use, and whether or not to REPEAT the rule
937 See `align-rules-list' for more information about these options.
939 The non-interactive form of the previous example would look something like:
940 (align-regexp (point-min) (point-max) \"\\\\(\\\\s-*\\\\)(\")
942 This function is a nothing more than a small wrapper that helps you
943 construct a rule to pass to `align-region', which does the real work."
946 (list (region-beginning) (region-end))
947 (if current-prefix-arg
948 (list (read-string "Complex align using regexp: "
952 "Parenthesis group to modify (justify if negative): " "1"))
954 (read-string "Amount of spacing (or column if negative): "
955 (number-to-string align-default-spacing
)))
956 (y-or-n-p "Repeat throughout line? "))
957 (list (concat "\\(\\s-*\\)"
958 (read-string "Align regexp: "))
959 1 align-default-spacing nil
))))
960 (or group
(setq group
1))
961 (or spacing
(setq spacing align-default-spacing
))
963 (list (list nil
(cons 'regexp regexp
)
964 (cons 'group
(abs group
))
969 (cons 'spacing spacing
)
970 (cons 'column
(abs spacing
)))
971 (cons 'repeat repeat
)))))
972 (align-region beg end
'entire rule nil nil
)))
975 (defun align-entire (beg end
&optional rules exclude-rules
)
976 "Align the selected region as if it were one alignment section.
977 BEG and END mark the extent of the region. If RULES or EXCLUDE-RULES
978 is set to a list of rules (see `align-rules-list'), it can be used to
979 override the default alignment rules that would have been used to
982 (align beg end
'entire rules exclude-rules
))
985 (defun align-current (&optional rules exclude-rules
)
986 "Call `align' on the current alignment section.
987 This function assumes you want to align only the current section, and
988 so saves you from having to specify the region. If RULES or
989 EXCLUDE-RULES is set to a list of rules (see `align-rules-list'), it
990 can be used to override the default alignment rules that would have
991 been used to align that section."
993 (align nil nil nil rules exclude-rules
))
996 (defun align-highlight-rule (beg end title
&optional rules exclude-rules
)
997 "Highlight the whitespace which a given rule would have modified.
998 BEG and END mark the extent of the region. TITLE identifies the rule
999 that should be highlighted. If RULES or EXCLUDE-RULES is set to a
1000 list of rules (see `align-rules-list'), it can be used to override the
1001 default alignment rules that would have been used to identify the text
1004 (list (region-beginning) (region-end)
1006 "Title of rule to highlight: "
1010 (list (symbol-name (car rule
)))))
1011 (append (or align-mode-rules-list align-rules-list
)
1012 (or align-mode-exclude-rules-list
1013 align-exclude-rules-list
))) nil t
)))
1014 (let ((ex-rule (assq (intern title
)
1015 (or align-mode-exclude-rules-list
1016 align-exclude-rules-list
)))
1018 (align-unhighlight-rule)
1021 (or rules
(if ex-rule
1022 (or exclude-rules align-mode-exclude-rules-list
1023 align-exclude-rules-list
)
1024 (or align-mode-rules-list align-rules-list
)))
1025 (unless ex-rule
(or exclude-rules align-mode-exclude-rules-list
1026 align-exclude-rules-list
))
1029 (if (and mode
(listp mode
))
1030 (if (equal (symbol-name (car mode
)) title
)
1031 (setq face
(cons align-highlight-change-face
1032 align-highlight-nochange-face
))
1035 (let ((overlay (make-overlay b e
)))
1036 (setq align-highlight-overlays
1037 (cons overlay align-highlight-overlays
))
1038 (overlay-put overlay
'face
1041 (cdr face
)))))))))))
1044 (defun align-unhighlight-rule ()
1045 "Remove any highlighting that was added by `align-highlight-rule'."
1047 (while align-highlight-overlays
1048 (delete-overlay (car align-highlight-overlays
))
1049 (setq align-highlight-overlays
1050 (cdr align-highlight-overlays
))))
1053 (defun align-newline-and-indent ()
1054 "A replacement function for `newline-and-indent', aligning as it goes."
1056 (let ((separate (or (if (and (symbolp align-region-separate
)
1057 (boundp align-region-separate
))
1058 (symbol-value align-region-separate
)
1059 align-region-separate
)
1062 (call-interactively 'newline-and-indent
)
1065 (while (not (or (bobp)
1066 (align-new-section-p (point) end separate
)))
1068 (align (point) end
))))
1070 ;;; Internal Functions:
1072 (defun align-match-tex-pattern (regexp end
&optional reverse
)
1073 "Match REGEXP in TeX mode, counting backslashes appropriately.
1074 END denotes the end of the region to be searched, while REVERSE, if
1075 non-nil, indicates that the search should proceed backward from the
1081 (if reverse
're-search-backward
1083 (concat "\\(\\s-*\\)" regexp
1084 "\\(\\s-*\\)") end t
))
1085 (let ((pos (match-end 1))
1087 (while (and (> pos
(point-min))
1088 (eq (char-before pos
) ?
\\))
1089 (setq count
(1+ count
) pos
(1- pos
)))
1090 (eq (mod count
2) 1))
1091 (goto-char (match-beginning (if reverse
1 2)))))
1094 (defun align-new-section-p (beg end separator
)
1095 "Is there a section divider between BEG and END?
1096 SEPARATOR specifies how to look for the section divider. See the
1097 documentation for `align-region-separate' for more details."
1098 (cond ((or (not separator
)
1099 (eq separator
'entire
))
1101 ((eq separator
'group
)
1107 (> (count-lines beg end
) amount
)))
1108 ((stringp separator
)
1111 (re-search-forward separator end t
)))
1112 ((functionp separator
)
1113 (funcall separator beg end
))
1115 (let ((seps separator
) yes
)
1117 (if (and (>= (car seps
) beg
)
1118 (<= (car seps
) end
))
1119 (setq yes t seps nil
)
1120 (setq seps
(cdr seps
))))
1123 (defun align-adjust-col-for-rule (column _rule spacing tab-stop
)
1124 "Adjust COLUMN according to the given RULE.
1125 SPACING specifies how much spacing to use.
1126 TAB-STOP specifies whether SPACING refers to tab-stop boundaries."
1128 (setq spacing align-default-spacing
))
1133 (dotimes (_ spacing
)
1134 (setq column
(indent-next-tab-stop column
)))
1137 (defsubst align-column
(pos)
1138 "Given a position in the buffer, state what column it's in.
1139 POS is the position whose column will be taken. Note that this
1140 function will change the location of point."
1144 (defsubst align-regions
(regions props rule func
)
1145 "Align the regions specified in REGIONS, a list of cons cells.
1146 PROPS describes formatting features specific to the given regions.
1147 RULE specifies exactly how to perform the alignments.
1148 If FUNC is specified, it will be called with each region that would
1149 have been aligned, rather than modifying the text."
1152 (align-areas (car regions
) (car props
) rule func
))
1153 (setq regions
(cdr regions
)
1154 props
(cdr props
))))
1156 (defun align-areas (areas props rule func
)
1157 "Given a list of AREAS and formatting PROPS, align according to RULE.
1158 AREAS should be a list of cons cells containing beginning and ending
1159 markers. This function sweeps through all of the beginning markers,
1160 finds out which one starts in the furthermost column, and then deletes
1161 and inserts text such that all of the ending markers occur in the same
1164 If FUNC is non-nil, it will be called for each text region that would
1165 have been aligned. No changes will be made to the buffer."
1166 (let* ((column (cdr (assq 'column rule
)))
1167 (fixed (if (symbolp column
)
1168 (symbol-value column
)
1170 (justify (cdr (assq 'justify rule
)))
1175 ;; Determine the alignment column.
1179 (setq col
(max col
(align-column (caar a
)))))
1181 (goto-char (cdar a
))
1183 (if (/= ecol
(current-column))
1185 (setq ecol
(current-column))))
1187 (goto-char (caar a
))
1188 (if (and (re-search-forward "\\s-*" (cdar a
) t
)
1189 (/= (point) (cdar a
)))
1190 (let ((bcol (current-column)))
1191 (setcdr (car a
) (cons (point-marker) (cdar a
)))
1192 (goto-char (cdr (cdar a
)))
1193 (setq width
(max width
(- (current-column) bcol
))))))
1197 (setq col
(+ (align-adjust-col-for-rule
1198 col rule
(car props
) (cdr props
)) width
)))
1200 ;; Make all ending positions to occur in the goal column. Since
1201 ;; the whitespace to be modified was already deleted by
1202 ;; `align-region', all we have to do here is indent.
1205 (setq change
(and ecol
(/= col ecol
))))
1207 (when (or func change
)
1209 (let ((area (car areas
))
1214 (marker-position (car area
))
1215 (marker-position (cdr area
))
1217 (if (not (and justify
1218 (consp (cdr area
))))
1219 (goto-char (cdr area
))
1220 (goto-char (cddr area
))
1221 (let ((ecol (current-column)))
1222 (goto-char (cadr area
))
1223 (setq gocol
(- col
(- ecol
(current-column))))))
1224 (setq cur
(current-column))
1225 (cond ((< gocol
0) t
) ; don't do anything
1226 ((= cur gocol
) t
) ; don't need to
1227 ((< cur gocol
) ; just add space
1228 ;; FIXME: It is stated above that "...the
1229 ;; whitespace to be modified was already
1230 ;; deleted by `align-region', all we have
1231 ;; to do here is indent." However, this
1232 ;; doesn't seem to be true, so we first
1233 ;; delete the whitespace to avoid tabs
1235 (delete-horizontal-space t
)
1238 ;; This code works around an oddity in the
1239 ;; FORCE argument of `move-to-column', which
1240 ;; tends to screw up markers if there is any
1242 (let ((endcol (align-column
1248 (align-column (car area
)))))
1250 (goto-char (car area
))
1251 (move-to-column gocol t
))
1252 (let ((here (point)))
1253 (move-to-column endcol t
)
1254 (delete-region here
(point))
1256 (indent-to (align-adjust-col-for-rule
1257 (current-column) rule
1258 (car props
) (cdr props
)))))))))))
1259 (setq areas
(cdr areas
))))))
1261 (defmacro align--set-marker
(marker-var pos
&optional type
)
1262 "If MARKER-VAR is a marker, move it to position POS.
1263 Otherwise, create a new marker at position POS, with type TYPE."
1264 `(if (markerp ,marker-var
)
1265 (move-marker ,marker-var
,pos
)
1266 (setq ,marker-var
(copy-marker ,pos
,type
))))
1268 (defun align-region (beg end separate rules exclude-rules
1270 "Align a region based on a given set of alignment rules.
1271 BEG and END specify the region to be aligned. Either may be nil, in
1272 which case the range will stop at the nearest section division (see
1273 `align-region-separate', and `align-region-heuristic' for more
1276 The region will be divided into separate alignment sections based on
1277 the value of SEPARATE.
1279 RULES and EXCLUDE-RULES are a pair of lists describing how to align
1280 the region, and which text areas within it should be excluded from
1281 alignment. See the `align-rules-list' for more information on the
1282 required format of these two lists.
1284 If FUNC is specified, no text will be modified. What `align-region'
1285 will do with the rules is to search for the alignment areas, as it
1286 regularly would, taking account for exclusions, and then call FUNC,
1287 first with the beginning and ending of the region to be aligned
1288 according to that rule (this can be different for each rule, if BEG
1289 and END were nil), and then with the beginning and ending of each
1290 text region that the rule would have applied to.
1292 The signature of FUNC should thus be:
1294 (defun my-align-function (beg end mode)
1295 \"If MODE is a rule (a list), return t if BEG to END are to be searched.
1296 Otherwise BEG to END will be a region of text that matches the rule's
1297 definition, and MODE will be non-nil if any changes are necessary.\"
1298 (unless (and mode (listp mode))
1299 (message \"Would have aligned from %d to %d...\" beg end)))
1301 This feature (of passing a FUNC) is used internally to locate the
1302 position of exclusion areas, but could also be used for any other
1303 purpose where you might want to know where the regions that the
1304 aligner would have dealt with are."
1305 (let ((end-mark (and end
(copy-marker end t
)))
1307 (report (and (not func
) align-large-region beg end
1308 (>= (- end beg
) align-large-region
)))
1310 (rule-count (length rules
))
1312 (if (and align-indent-before-aligning real-beg end-mark
)
1313 (indent-region real-beg end-mark nil
))
1315 (let* ((rule (car rules
))
1316 (run-if (assq 'run-if rule
))
1317 (modes (assq 'modes rule
)))
1318 ;; unless the `run-if' form tells us not to, look for the
1320 (unless (or (and modes
(not (memq major-mode
1321 (eval (cdr modes
)))))
1322 (and run-if
(not (funcall (cdr run-if
)))))
1323 (let* ((case-fold-search case-fold-search
)
1324 (case-fold (assq 'case-fold rule
))
1325 (regexp (cdr (assq 'regexp rule
)))
1326 (regfunc (and (functionp regexp
) regexp
))
1327 (rulesep (assq 'separate rule
))
1328 (thissep (if rulesep
(cdr rulesep
) separate
))
1343 ;; if beg and end were not given, figure out what the
1344 ;; current alignment region should be. Depending on the
1345 ;; value of `align-region-separate' it's possible for
1346 ;; each rule to have its own definition of what that
1347 ;; current alignment section is.
1350 (if (or (not thissep
) (eq thissep
'entire
))
1351 (error "Cannot determine alignment region for '%s'"
1352 (symbol-name (cdr (assq 'title rule
)))))
1354 (while (and (not (eobp))
1355 (looking-at "^\\s-*$"))
1357 (let* ((here (point))
1361 (and align-region-heuristic
1363 align-region-heuristic
))))
1365 (funcall regfunc terminus t
)
1366 (re-search-backward regexp
1368 (if (align-new-section-p (point) here thissep
)
1371 (setq here
(point))))
1380 (and align-region-heuristic
1382 align-region-heuristic
))))
1384 (funcall regfunc terminus nil
)
1385 (re-search-forward regexp terminus t
))))
1386 (if (align-new-section-p here
(point) thissep
)
1389 (setq here
(point))))
1394 (align--set-marker end-mark end t
)
1397 ;; If we have a region to align, and `func' is set and
1398 ;; reports back that the region is ok, then align it.
1399 (when (or (not func
)
1400 (funcall func beg end rule
))
1401 (let (rule-beg exclude-areas
)
1402 ;; determine first of all where the exclusions
1403 ;; lie in this region
1409 (or (and mode
(listp mode
))
1415 (sort exclude-areas
#'car-less-than-car
))))
1417 ;; set `case-fold-search' according to the
1418 ;; (optional) `case-fold' property
1420 (setq case-fold-search
(cdr case-fold
)))
1422 ;; while we can find the rule in the alignment
1424 (while (and (< (point) end-mark
)
1425 (setq search-start
(point))
1427 (funcall regfunc end-mark nil
)
1428 (re-search-forward regexp
1431 ;; give the user some indication of where we
1432 ;; are, if it's a very large region being
1435 (let ((symbol (car rule
)))
1436 (if (and symbol
(symbolp symbol
))
1438 "Aligning `%s' (rule %d of %d) %d%%..."
1439 (symbol-name symbol
) rule-index rule-count
1440 (floor (* (- (point) real-beg
) 100.0)
1441 (- end-mark real-beg
)))
1444 (floor (* (- (point) real-beg
) 100.0)
1445 (- end-mark real-beg
))))))
1447 ;; if the search ended us on the beginning of
1448 ;; the next line, move back to the end of the
1450 (if (and (bolp) (> (point) search-start
))
1453 ;; lookup the `group' attribute the first time
1456 (setq groups
(or (cdr (assq 'group rule
)) 1))
1457 (unless (listp groups
)
1458 (setq groups
(list groups
)))
1459 (setq first
(car groups
)))
1462 (setq spacing
(cdr (assq 'spacing rule
))
1467 (let ((rule-ts (assq 'tab-stop rule
)))
1470 ((symbolp align-to-tab-stop
)
1471 (symbol-value align-to-tab-stop
))
1473 align-to-tab-stop
)))
1476 ;; test whether we have found a match on the same
1477 ;; line as a previous match
1478 (when (> (point) eol
)
1480 (align--set-marker eol
(line-end-position)))
1482 ;; lookup the `repeat' attribute the first time
1484 (setq repeat
(cdr (assq 'repeat rule
))
1487 ;; lookup the `valid' attribute the first time
1489 (setq valid
(assq 'valid rule
)
1492 ;; remember the beginning position of this rule
1493 ;; match, and save the match-data, since either
1494 ;; the `valid' form, or the code that searches for
1495 ;; section separation, might alter it
1496 (setq rule-beg
(match-beginning first
)
1497 save-match-data
(match-data))
1500 (error "No match for subexpression %s" first
))
1502 ;; unless the `valid' attribute is set, and tells
1503 ;; us that the rule is not valid at this point in
1505 (unless (and valid
(not (funcall (cdr valid
))))
1507 ;; look to see if this match begins a new
1508 ;; section. If so, we should align what we've
1509 ;; collected so far, and then begin collecting
1510 ;; anew for the next alignment section
1511 (when (and last-point
1512 (align-new-section-p last-point rule-beg
1514 (align-regions regions align-props rule func
)
1516 (setq align-props nil
))
1517 (align--set-marker last-point rule-beg t
)
1519 ;; restore the match data
1520 (set-match-data save-match-data
)
1522 ;; check whether the region to be aligned
1523 ;; straddles an exclusion area
1524 (let ((excls exclude-areas
))
1525 (setq exclude-p nil
)
1527 (if (and (< (match-beginning (car groups
))
1529 (> (match-end (car (last groups
)))
1533 (setq excls
(cdr excls
)))))
1535 ;; go through the parenthesis groups
1536 ;; matching whitespace to be contracted or
1537 ;; expanded (or possibly justified, if the
1538 ;; `justify' attribute was set)
1541 ;; We must use markers, since
1542 ;; `align-areas' may modify the buffer.
1543 ;; Avoid polluting the markers.
1544 (let* ((group-beg (copy-marker
1545 (match-beginning g
) t
))
1546 (group-end (copy-marker
1548 (region (cons group-beg group-end
))
1549 (props (cons (if (listp spacing
)
1552 (if (listp tab-stop
)
1555 (push group-beg markers
)
1556 (push group-end markers
)
1557 (setq index
(if same
(1+ index
) 0))
1559 ((nth index regions
)
1560 (setcar (nthcdr index regions
)
1562 (nth index regions
))))
1565 (list (list region
)))
1566 (nconc align-props
(list props
)))
1569 (list (list region
)))
1570 (setq align-props
(list props
)))))
1571 ;; If any further rule matches are found
1572 ;; before `eol', they are on the same
1573 ;; line as this one; this can only
1574 ;; happen if the `repeat' attribute is
1577 (setq spacing
(cdr spacing
)))
1578 (if (listp tab-stop
)
1579 (setq tab-stop
(cdr tab-stop
)))
1582 ;; if `repeat' has not been set, move to
1583 ;; the next line; don't bother searching
1584 ;; anymore on this one
1585 (if (and (not repeat
) (not (bolp)))
1588 ;; if the search did not change point,
1589 ;; move forward to avoid an infinite loop
1590 (if (= (point) search-start
)
1593 ;; when they are no more matches for this rule,
1594 ;; align whatever was left over
1596 (align-regions regions align-props rule func
))))))))
1597 (setq rules
(cdr rules
)
1598 rule-index
(1+ rule-index
)))
1599 ;; This function can use a lot of temporary markers, so instead of
1600 ;; waiting for the next GC we delete them immediately (Bug#10047).
1601 (when end-mark
(set-marker end-mark nil
))
1606 (message "Aligning...done"))))
1612 (run-hooks 'align-load-hook
)
1614 ;;; align.el ends here