1 ;;; align.el --- align text to a specific column, by regexp -*- lexical-binding:t -*-
3 ;; Copyright (C) 1999-2018 Free Software Foundation, Inc.
5 ;; Author: John Wiegley <johnw@gnu.org>
6 ;; Maintainer: emacs-devel@gnu.org
7 ;; Keywords: convenience languages lisp
9 ;; This file is part of GNU Emacs.
11 ;; GNU Emacs is free software: you can redistribute it and/or modify
12 ;; it under the terms of the GNU General Public License as published by
13 ;; the Free Software Foundation, either version 3 of the License, or
14 ;; (at your option) any later version.
16 ;; GNU Emacs is distributed in the hope that it will be useful,
17 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
18 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
19 ;; GNU General Public License for more details.
21 ;; You should have received a copy of the GNU General Public License
22 ;; along with GNU Emacs. If not, see <https://www.gnu.org/licenses/>.
26 ;; This mode allows you to align regions in a context-sensitive fashion.
27 ;; The classic use is to align assignments:
41 ;; There are several variables which define how certain "categories"
42 ;; of syntax are to be treated. These variables go by the name
43 ;; `align-CATEGORY-modes'. For example, "c++" is such a category.
44 ;; There are several rules which apply to c++, but since several other
45 ;; languages have a syntax similar to c++ (e.g., c, java, etc), these
46 ;; modes are treated as belonging to the same category.
48 ;; If you want to add a new mode under a certain category, just
49 ;; customize that list, or add the new mode manually. For example, to
50 ;; make jde-mode a c++ category mode, use this code in your .emacs
53 ;; (setq align-c++-modes (cons 'jde-mode align-c++-modes))
55 ;; In some programming modes, it's useful to have the aligner run only
56 ;; after indentation is performed. To achieve this, customize or set
57 ;; the variable `align-indent-before-aligning' to t.
61 ;; In order to incorporate align's functionality into your own
62 ;; modules, there are only a few steps you have to follow.
64 ;; 1. Require or load in the align.el library.
66 ;; 2. Define your alignment and exclusion rules lists, either
67 ;; customizable or not.
69 ;; 3. In your mode function, set the variables
70 ;; `align-mode-rules-list' and `align-mode-exclude-rules-list'
71 ;; to your own rules lists.
73 ;; If there is any need to add your mode name to one of the
74 ;; align-?-modes variables (for example, `align-dq-string-modes'), use
75 ;; `add-to-list', or some similar function which checks first to see
76 ;; if the value is already there. Since the user may customize that
77 ;; mode list, and then write your mode name into their init file,
78 ;; causing the symbol already to be present the next time they load
85 ;; (defcustom my-align-rules-list
87 ;; (regexp . "Sample")))
88 ;; :type align-rules-list-type
89 ;; :group 'my-package)
91 ;; (put 'my-align-rules-list 'risky-local-variable t)
93 ;; (add-to-list 'align-dq-string-modes 'my-package-mode)
94 ;; (add-to-list 'align-open-comment-modes 'my-package-mode)
98 ;; (setq align-mode-rules-list my-align-rules-list))
100 ;; Note that if you need to install your own exclusion rules, then you
101 ;; will also need to reproduce any double-quoted string, or open
102 ;; comment exclusion rules that are defined in the standard
103 ;; `align-exclude-rules-list'. At the moment there is no convenient
104 ;; way to mix both mode-local and global rules lists.
108 ;; Version 1.0 was created in the earlier part of 1996, using a very
109 ;; simple algorithm that understand only basic regular expressions.
110 ;; Parts of the code were broken up and included in vhdl-mode.el
111 ;; around this time. After several comments from users, and a need to
112 ;; find a more robust, higher performing algorithm, 2.0 was born in late
113 ;; 1998. Many different approaches were taken (mostly due to the
114 ;; complexity of TeX tables), but finally a scheme was discovered
115 ;; which worked fairly well for most common usage cases. Development
116 ;; beyond version 2.8 is not planned, except for problems that users
122 "Align text to a specific column, by regexp."
128 (defcustom align-load-hook nil
129 "Hook that gets run after the aligner has been loaded."
133 (defcustom align-indent-before-aligning nil
134 "If non-nil, indent the marked region before aligning it."
138 (defcustom align-default-spacing
1
139 "An integer that represents the default amount of padding to use.
140 If `align-to-tab-stop' is non-nil, this will represent the number of
141 tab stops to use for alignment, rather than the number of spaces.
142 Each alignment rule can optionally override both this variable and
143 `align-to-tab-stop'. See `align-rules-list'."
147 (defcustom align-to-tab-stop
'indent-tabs-mode
148 "If non-nil, alignments will always fall on a tab boundary.
149 It may also be a symbol, whose value will be taken."
150 :type
'(choice (const nil
) symbol
)
153 (defcustom align-region-heuristic
500
154 "If non-nil, used as a heuristic by `align-current'.
155 Since each alignment rule can possibly have its own set of alignment
156 sections (whenever `align-region-separate' is non-nil, and not a
157 string), this heuristic is used to determine how far before and after
158 point we should search in looking for a region separator. Larger
159 values can mean slower performance in large files, although smaller
160 values may cause unexpected behavior at times."
164 (defcustom align-highlight-change-face
'highlight
165 "The face to highlight with if changes are necessary."
169 (defcustom align-highlight-nochange-face
'secondary-selection
170 "The face to highlight with if no changes are necessary."
174 (defcustom align-large-region
10000
175 "If an integer, defines what constitutes a \"large\" region.
176 If nil, then no messages will ever be printed to the minibuffer."
180 (defcustom align-c
++-modes
'(c++-mode c-mode java-mode
)
181 "A list of modes whose syntax resembles C/C++."
182 :type
'(repeat symbol
)
185 (defcustom align-perl-modes
'(perl-mode cperl-mode
)
186 "A list of modes where Perl syntax is to be seen."
187 :type
'(repeat symbol
)
190 (defcustom align-lisp-modes
191 '(emacs-lisp-mode lisp-interaction-mode lisp-mode scheme-mode
)
192 "A list of modes whose syntax resembles Lisp."
193 :type
'(repeat symbol
)
196 (defcustom align-tex-modes
197 '(tex-mode plain-tex-mode latex-mode slitex-mode
)
198 "A list of modes whose syntax resembles TeX (and family)."
199 :type
'(repeat symbol
)
202 (defcustom align-text-modes
'(text-mode outline-mode
)
203 "A list of modes whose content is plain text."
204 :type
'(repeat symbol
)
207 (defcustom align-dq-string-modes
208 (append align-lisp-modes align-c
++-modes align-perl-modes
210 "A list of modes where double quoted strings should be excluded."
211 :type
'(repeat symbol
)
214 (defcustom align-sq-string-modes
215 (append align-perl-modes
'(python-mode))
216 "A list of modes where single quoted strings should be excluded."
217 :type
'(repeat symbol
)
220 (defcustom align-open-comment-modes
221 (append align-lisp-modes align-c
++-modes align-perl-modes
222 '(python-mode makefile-mode
))
223 "A list of modes with a single-line comment syntax.
224 These are comments as in Lisp, which have a beginning, but end with
225 the line (i.e., `comment-end' is an empty string)."
226 :type
'(repeat symbol
)
229 (defcustom align-region-separate
"^\\s-*[{}]?\\s-*$"
230 "Select the method by which alignment sections will be separated.
231 If this is a symbol, that symbol's value will be used.
233 For the sake of clarification, consider the following example, which
234 will be referred to in the descriptions below.
236 int alpha = 1; /* one */
238 long gamma; /* ten */
240 unsigned int delta = 1; /* one */
241 long double epsilon = 3.0;
242 long long omega; /* ten */
244 The possible settings for `align-region-separate' are:
246 `entire' The entire region being aligned will be considered as a
247 single alignment section. Assuming that comments were not
248 being aligned to a particular column, the example would
251 int alpha = 1; /* one */
253 long gamma; /* ten */
255 unsigned int delta = 1; /* one */
257 long long chi = 10; /* ten */
259 `group' Each contiguous set of lines where a specific alignment
260 occurs is considered a section for that alignment rule.
261 Note that each rule may have any entirely different set
262 of section divisions than another.
264 int alpha = 1; /* one */
266 long gamma; /* ten */
268 unsigned int delta = 1; /* one */
270 long long chi = 10; /* ten */
272 `largest' When contiguous rule sets overlap, the largest section
273 described will be taken as the alignment section for each
274 rule touched by that section.
276 int alpha = 1; /* one */
278 long gamma; /* ten */
280 unsigned int delta = 1; /* one */
282 long long chi = 10; /* ten */
284 NOTE: This option is not supported yet, due to algorithmic
285 issues which haven't been satisfactorily resolved. There
286 are ways to do it, but they're both ugly and resource
289 regexp A regular expression string which defines the section
290 divider. If the mode you're in has a consistent divider
291 between sections, the behavior will be very similar to
292 `largest', and faster. But if the mode does not use clear
293 separators (for example, if you collapse your braces onto
294 the preceding statement in C or Perl), `largest' is
295 probably the better alternative.
297 function A function that will be passed the beginning and ending
298 locations of the region in which to look for the section
299 separator. At the very beginning of the attempt to align,
300 both of these parameters will be nil, in which case the
301 function should return non-nil if it wants each rule to
302 define its own section, or nil if it wants the largest
303 section found to be used as the common section for all
304 rules that occur there.
306 list A list of markers within the buffer that represent where
307 the section dividers lie. Be certain to use markers! For
308 when the aligning begins, the ensuing contract/expanding of
309 whitespace will throw off any non-marker positions.
311 This method is intended for use in Lisp programs, and not
314 (const :tag
"Entire region is one section" entire
)
315 (const :tag
"Align by contiguous groups" group
)
317 (regexp :tag
"Regexp defines section boundaries")
318 (function :tag
"Function defines section boundaries"))
321 (put 'align-region-separate
'risky-local-variable t
)
323 (defvar align-rules-list-type
326 :tag
"Alignment rule"
327 (symbol :tag
"Title")
328 (cons :tag
"Required attributes"
330 (const :tag
"(Regular expression to match)" regexp
)
331 (choice :value
"\\(\\s-+\\)" regexp function
))
333 :tag
"Optional attributes"
336 (const :tag
"(Repeat this rule throughout line)"
339 (cons :tag
"Paren group"
340 (const :tag
"(Parenthesis group to use)" group
)
342 integer
(repeat integer
)))
344 (const :tag
"(Modes where this rule applies)" modes
)
345 (sexp :value
(text-mode)))
346 (cons :tag
"Case-fold"
347 (const :tag
"(Should case be ignored for this rule)"
350 (cons :tag
"To Tab Stop"
351 (const :tag
"(Should rule align to tab stops)"
353 (boolean :value nil
))
355 (const :tag
"(Return non-nil if rule is valid)"
359 (const :tag
"(Return non-nil if rule should run)"
363 (const :tag
"(Column to fix alignment at)" column
)
364 (choice :value comment-column
367 (const :tag
"(Amount of spacing to use)" spacing
)
370 (const :tag
"(Should text be right justified)"
373 ;; make sure this stays up-to-date with any changes
374 ;; in `align-region-separate'
375 (cons :tag
"Separate"
376 (const :tag
"(Separation to use for this rule)"
378 (choice :value
"^\\s-*$"
382 regexp function
)))))))
383 "The `type' form for any `align-rules-list' variable.")
385 (defcustom align-rules-list
387 (regexp .
"\\(^\\s-+[^( \t\n]\\|(\\(\\S-+\\)\\s-+\\)\\S-+\\(\\s-+\\)")
389 (modes . align-lisp-modes
)
390 (run-if .
,(function (lambda () current-prefix-arg
))))
393 (regexp .
"\\(\\s-*\\)\\.\\(\\s-*\\)")
395 (modes . align-lisp-modes
))
399 (lambda (end reverse
)
400 (funcall (if reverse
're-search-backward
402 (concat "[^ \t\n\\\\]"
403 (regexp-quote comment-start
)
404 "\\(.+\\)$") end t
))))
405 (modes . align-open-comment-modes
))
408 (regexp .
"^\\s-*#\\s-*define\\s-+\\S-+\\(\\s-+\\)")
409 (modes . align-c
++-modes
))
411 (c-variable-declaration
412 (regexp .
,(concat "[*&0-9A-Za-z_]>?[&*]*\\(\\s-+[*&]*\\)"
413 "[A-Za-z_][0-9A-Za-z:_]*\\s-*\\(\\()\\|"
414 "=[^=\n].*\\|(.*)\\|\\(\\[.*\\]\\)*\\)?"
415 "\\s-*[;,]\\|)\\s-*$\\)"))
417 (modes . align-c
++-modes
)
422 (not (or (save-excursion
423 (goto-char (match-beginning 1))
426 "\\(goto\\|return\\|new\\|delete\\|throw\\)"))
427 (if (and (boundp 'font-lock-mode
) font-lock-mode
)
428 (eq (get-text-property (point) 'face
)
429 'font-lock-comment-face
)
430 (eq (caar (c-guess-basic-syntax)) 'c
))))))))
433 (regexp .
,(concat "[^-=!^&*+<>/| \t\n]\\(\\s-*[-=!^&*+<>/|]*\\)"
434 "=\\(\\s-*\\)\\([^= \t\n]\\|$\\)"))
436 (modes . align-c
++-modes
)
441 (regexp .
,(concat "[^=!^&*-+<>/| \t\n]\\(\\s-*\\)=[~>]?"
442 "\\(\\s-*\\)\\([^>= \t\n]\\|$\\)"))
444 (modes . align-perl-modes
)
448 (regexp .
,(concat "[^=!<> \t\n]\\(\\s-*\\)="
449 "\\(\\s-*\\)\\([^>= \t\n]\\|$\\)"))
451 (modes .
'(python-mode))
455 (regexp .
"^\\s-*\\w+\\(\\s-*\\):?=\\(\\s-*\\)\\([^\t\n \\\\]\\|$\\)")
457 (modes .
'(makefile-mode))
461 (regexp .
",\\(\\s-*\\)[^/ \t\n]")
463 (modes . align-c
++-modes
)
464 (run-if .
,(function (lambda () current-prefix-arg
))))
468 ; (memq (caar (c-guess-basic-syntax))
471 ; brace-entry-open))))))
473 ;; With a prefix argument, comma delimiter will be aligned. Since
474 ;; perl-mode doesn't give us enough syntactic information (and we
475 ;; don't do our own parsing yet), this rule is too destructive to
477 (basic-comma-delimiter
478 (regexp .
",\\(\\s-*\\)[^# \t\n]")
480 (modes .
(append align-perl-modes
'(python-mode)))
481 (run-if .
,(function (lambda () current-prefix-arg
))))
484 (regexp .
"\\(\\s-*\\)\\(//.*\\|/\\*.*\\*/\\s-*\\)$")
485 (modes . align-c
++-modes
)
486 (column . comment-column
)
490 (goto-char (match-beginning 1))
494 (regexp .
"\\(\\s-*\\)\\(&&\\|||\\|\\<and\\>\\|\\<or\\>\\)")
495 (modes . align-c
++-modes
)
499 (goto-char (match-end 2))
500 (looking-at "\\s-*\\(/[*/]\\|$\\)"))))))
503 (regexp .
"\\(\\s-*\\)\\(&&\\|||\\|\\<and\\>\\|\\<or\\>\\)")
504 (modes . align-perl-modes
)
508 (goto-char (match-end 2))
509 (looking-at "\\s-*\\(#\\|$\\)"))))))
512 (regexp .
"\\(\\s-*\\)\\(\\<and\\>\\|\\<or\\>\\)")
513 (modes .
'(python-mode))
517 (goto-char (match-end 2))
518 (looking-at "\\s-*\\(#\\|$\\|\\\\\\)"))))))
520 (c-macro-line-continuation
521 (regexp .
"\\(\\s-*\\)\\\\$")
522 (modes . align-c
++-modes
)
523 (column . c-backslash-column
))
527 ; (memq (caar (c-guess-basic-syntax))
528 ; '(cpp-macro cpp-macro-cont))))))
530 (basic-line-continuation
531 (regexp .
"\\(\\s-*\\)\\\\$")
532 (modes .
'(python-mode makefile-mode
)))
534 (tex-record-separator
536 (lambda (end reverse
)
537 (align-match-tex-pattern "&" end reverse
))))
539 (modes . align-tex-modes
)
542 (tex-tabbing-separator
544 (lambda (end reverse
)
545 (align-match-tex-pattern "\\\\[=>]" end reverse
))))
547 (modes . align-tex-modes
)
551 (eq major-mode
'latex-mode
)))))
554 (regexp .
"\\(\\s-*\\)\\\\\\\\")
555 (modes . align-tex-modes
))
557 ;; With a numeric prefix argument, or C-u, space delimited text
558 ;; tables will be aligned.
560 (regexp .
"\\(^\\|\\S-\\)\\([ \t]+\\)\\(\\S-\\|$\\)")
562 (modes . align-text-modes
)
566 (and current-prefix-arg
567 (not (eq '- current-prefix-arg
)))))))
569 ;; With a negative prefix argument, lists of dollar figures will
572 (regexp .
"\\$?\\(\\s-+[0-9]+\\)\\.")
573 (modes . align-text-modes
)
577 (eq '- current-prefix-arg
)))))
580 (regexp .
"^\\s-*\\(?:\\w-?\\)+:\\(\\s-*\\).*;")
582 (modes .
'(css-mode html-mode
))))
583 "A list describing all of the available alignment rules.
587 (ATTRIBUTE . VALUE) ...)
590 The following attributes are meaningful:
592 `regexp' This required attribute must be either a string describing
593 a regular expression, or a function (described below).
594 For every line within the section that this regular
595 expression matches, the given rule will be applied to that
596 line. The exclusion rules denote which part(s) of the
597 line should not be modified; the alignment rules cause the
598 identified whitespace group to be contracted/expanded such
599 that the \"alignment character\" (the character
600 immediately following the identified parenthesis group),
601 occurs in the same column for every line within the
602 alignment section (see `align-region-separate' for a
603 description of how the region is broken up into alignment
606 The `regexp' attribute describes how the text should be
607 treated. Within this regexp, there must be at least one
608 group of characters (typically whitespace) identified by
609 the special opening and closing parens used in regexp
610 expressions (`\\\\(' and `\\\\)') (see the Emacs manual on
611 the syntax of regular expressions for more info).
613 If `regexp' is a function, it will be called as a
614 replacement for `re-search-forward'. This means that it
615 should return nil if nothing is found to match the rule,
616 or it should set the match data appropriately, move point
617 to the end of the match, and return the value of point.
619 `group' For exclusion rules, the group identifies the range of
620 characters that should be ignored. For alignment rules,
621 these are the characters that will be deleted/expanded for
622 the purposes of alignment. The \"alignment character\" is
623 always the first character immediately following this
624 parenthesis group. This attribute may also be a list of
625 integers, in which case multiple alignment characters will
626 be aligned, with the list of integers identifying the
627 whitespace groups which precede them. The default for
630 `modes' The `modes' attribute, if set, should name a list of
631 major modes -- or evaluate to such a value -- in which the
632 rule is valid. If not set, the rule will apply to all
635 `case-fold' If `regexp' is an ordinary regular expression string
636 containing alphabetic character, sometimes you may want
637 the search to proceed case-insensitively (for languages
638 that ignore case, such as Pascal for example). In that
639 case, set `case-fold' to a non-nil value, and the regular
640 expression search will ignore case. If `regexp' is set to
641 a function, that function must handle the job of ignoring
644 `tab-stop' If the `tab-stop' attribute is set, and non-nil, the
645 alignment character will always fall on a tab stop
646 (whether it uses tabs to get there or not depends on the
647 value of `indent-tabs-mode'). If the `tab-stop' attribute
648 is set to nil, tab stops will never be used. Otherwise,
649 the value of `align-to-tab-stop' determines whether or not
650 to align to a tab stop. The `tab-stop' attribute may also
651 be a list of t or nil values, corresponding to the number
652 of parenthesis groups specified by the `group' attribute.
654 `repeat' If the `repeat' attribute is present, and non-nil, the
655 rule will be applied to the line continuously until no
656 further matches are found.
658 `valid' If the `valid' attribute is set, it will be used to
659 determine whether the rule should be invoked. This form
660 is evaluated after the regular expression match has been
661 performed, so that it is possible to use the results of
662 that match to determine whether the alignment should be
663 performed. The buffer should not be modified during the
664 evaluation of this form.
666 `run-if' Like `valid', the `run-if' attribute tests whether the
667 rule should be run at all -- even before any searches are
668 done to determine if the rule applies to the alignment
669 region. This can save time, since `run-if' will only be
670 run once for each rule. If it returns nil, the rule will
673 `column' For alignment rules, if the `column' attribute is set --
674 which must be an integer, or a symbol whose value is an
675 integer -- it will be used as the column in which to align
676 the alignment character. If the text on a particular line
677 happens to overrun that column, a single space character,
678 or tab stop (see `align-to-tab-stop') will be added
679 between the last text character and the alignment
682 `spacing' Alignment rules may also override the amount of spacing
683 that would normally be used by providing a `spacing'
684 attribute. This must be an integer, or a list of integers
685 corresponding to the number of parenthesis groups matched
686 by the `group' attribute. If a list of value is used, and
687 any of those values is nil, `align-default-spacing' will
688 be used for that subgroup. See `align-default-spacing'
689 for more details on spacing, tab stops, and how to
690 indicate how much spacing should be used. If TAB-STOP is
691 present, it will override the value of `align-to-tab-stop'
694 `justify' It is possible with `regexp' and `group' to identify a
695 character group that contains more than just whitespace
696 characters. By default, any non-whitespace characters in
697 that group will also be deleted while aligning the
698 alignment character. However, if the `justify' attribute
699 is set to a non-nil value, only the initial whitespace
700 characters within that group will be deleted. This has
701 the effect of right-justifying the characters that remain,
702 and can be used for outdenting or just plain old right-
705 `separate' Each rule can define its own section separator, which
706 describes how to identify the separation of \"sections\"
707 within the region to be aligned. Setting the `separate'
708 attribute overrides the value of `align-region-separate'
709 (see the documentation of that variable for possible
710 values), and any separation argument passed to `align'."
711 :type align-rules-list-type
714 (put 'align-rules-list
'risky-local-variable t
)
716 (defvar align-exclude-rules-list-type
719 :tag
"Exclusion rule"
720 (symbol :tag
"Title")
721 (cons :tag
"Required attributes"
723 (const :tag
"(Regular expression to match)" regexp
)
724 (choice :value
"\\(\\s-+\\)" regexp function
))
726 :tag
"Optional attributes"
729 (const :tag
"(Repeat this rule throughout line)"
732 (cons :tag
"Paren group"
733 (const :tag
"(Parenthesis group to use)" group
)
735 integer
(repeat integer
)))
737 (const :tag
"(Modes where this rule applies)" modes
)
738 (sexp :value
(text-mode)))
739 (cons :tag
"Case-fold"
740 (const :tag
"(Should case be ignored for this rule)"
742 (boolean :value t
)))))))
743 "The `type' form for any `align-exclude-rules-list' variable.")
745 (defcustom align-exclude-rules-list
747 (regexp .
"\"\\([^\"\n]+\\)\"")
749 (modes . align-dq-string-modes
))
752 (regexp .
"'\\([^'\n]+\\)'")
754 (modes . align-sq-string-modes
))
759 (lambda (end reverse
)
760 (funcall (if reverse
're-search-backward
762 (concat "[^ \t\n\\\\]"
763 (regexp-quote comment-start
)
764 "\\(.+\\)$") end t
))))
765 (modes . align-open-comment-modes
))
768 (regexp .
"/\\*\\(.+\\)\\*/")
770 (modes . align-c
++-modes
))
773 (regexp .
"(\\([^)\n]+\\))")
775 (modes . align-c
++-modes
))
778 (regexp .
"^\\s-*#\\s-*\\(if\\w*\\|endif\\)\\(.*\\)$")
780 (modes . align-c
++-modes
)))
781 "A list describing text that should be excluded from alignment.
782 See the documentation for `align-rules-list' for more info."
783 :type align-exclude-rules-list-type
786 (put 'align-exclude-rules-list
'risky-local-variable t
)
788 ;;; Internal Variables:
790 (defvar align-mode-rules-list nil
791 "Alignment rules specific to the current major mode.
792 See the variable `align-rules-list' for more details.")
794 (make-variable-buffer-local 'align-mode-rules-list
)
796 (defvar align-mode-exclude-rules-list nil
797 "Alignment exclusion rules specific to the current major mode.
798 See the variable `align-exclude-rules-list' for more details.")
800 (make-variable-buffer-local 'align-mode-exclude-rules-list
)
802 (defvar align-highlight-overlays nil
803 "The current overlays highlighting the text matched by a rule.")
805 (defvar align-regexp-history nil
806 "Input history for the full user-entered regex in `align-regexp'")
808 ;; Sample extension rule set, for vhdl-mode. This should properly be
809 ;; in vhdl-mode.el itself.
811 (defcustom align-vhdl-rules-list
813 (regexp .
"\\(signal\\|variable\\|constant\\)\\(\\s-+\\)\\S-")
817 (regexp .
"\\(others\\|[^ \t\n=<]\\)\\(\\s-*\\)=>\\(\\s-*\\)\\S-")
822 (not (string= (downcase (match-string 1))
826 (regexp .
"[^ \t\n:]\\(\\s-*\\):\\(\\s-*\\)[^=\n]")
830 (regexp .
":\\s-*\\(in\\|out\\|inout\\|buffer\\)\\(\\s-*\\)")
834 (regexp .
"[^ \t\n=<]\\(\\s-*\\)<=\\(\\s-*\\)\\S-")
838 (regexp .
"[^ \t\n:]\\(\\s-*\\):="))
841 (regexp .
"\\(\\s-+\\)use\\s-+entity")))
842 "Alignment rules for `vhdl-mode'. See `align-rules-list' for more info."
843 :type align-rules-list-type
846 (put 'align-vhdl-rules-list
'risky-local-variable t
)
848 (defun align-set-vhdl-rules ()
849 "Setup the `align-mode-rules-list' variable for `vhdl-mode'."
850 (setq align-mode-rules-list align-vhdl-rules-list
))
852 (add-hook 'vhdl-mode-hook
'align-set-vhdl-rules
)
854 (add-to-list 'align-dq-string-modes
'vhdl-mode
)
855 (add-to-list 'align-open-comment-modes
'vhdl-mode
)
860 (defun align (beg end
&optional separate rules exclude-rules
)
861 "Attempt to align a region based on a set of alignment rules.
862 BEG and END mark the region. If BEG and END are specifically set to
863 nil (this can only be done programmatically), the beginning and end of
864 the current alignment section will be calculated based on the location
865 of point, and the value of `align-region-separate' (or possibly each
866 rule's `separate' attribute).
868 If SEPARATE is non-nil, it overrides the value of
869 `align-region-separate' for all rules, except those that have their
870 `separate' attribute set.
872 RULES and EXCLUDE-RULES, if either is non-nil, will replace the
873 default rule lists defined in `align-rules-list' and
874 `align-exclude-rules-list'. See `align-rules-list' for more details
875 on the format of these lists."
879 (if (and (symbolp align-region-separate
)
880 (boundp align-region-separate
))
881 (symbol-value align-region-separate
)
882 align-region-separate
)
884 (if (not (or ;(eq separator 'largest)
885 (and (functionp separator
)
886 (not (funcall separator nil nil
)))))
887 (align-region beg end separator
888 (or rules align-mode-rules-list align-rules-list
)
889 (or exclude-rules align-mode-exclude-rules-list
890 align-exclude-rules-list
))
891 (let ((sec-first end
)
893 (align-region beg end
897 align-mode-exclude-rules-list
898 align-exclude-rules-list
)
901 (setq sec-first
(min sec-first b
)
902 sec-last
(max sec-last e
)))))
903 (if (< sec-first sec-last
)
904 (align-region sec-first sec-last
'entire
905 (or rules align-mode-rules-list align-rules-list
)
906 (or exclude-rules align-mode-exclude-rules-list
907 align-exclude-rules-list
)))))))
910 (defun align-regexp (beg end regexp
&optional group spacing repeat
)
911 "Align the current region using an ad-hoc rule read from the minibuffer.
912 BEG and END mark the limits of the region. Interactively, this function
913 prompts for the regular expression REGEXP to align with.
915 For example, let's say you had a list of phone numbers, and wanted to
916 align them so that the opening parentheses would line up:
920 Mary-Anne (123) 456-7890
923 There is no predefined rule to handle this, but you could easily do it
924 using a REGEXP like \"(\". Interactively, all you would have to do is
925 to mark the region, call `align-regexp' and enter that regular expression.
927 REGEXP must contain at least one parenthesized subexpression, typically
928 whitespace of the form \"\\\\(\\\\s-*\\\\)\". In normal interactive use,
929 this is automatically added to the start of your regular expression after
930 you enter it. You only need to supply the characters to be lined up, and
931 any preceding whitespace is replaced.
933 If you specify a prefix argument (or use this function non-interactively),
934 you must enter the full regular expression, including the subexpression.
935 The function also then prompts for which subexpression parenthesis GROUP
936 \(default 1) within REGEXP to modify, the amount of SPACING (default
937 `align-default-spacing') to use, and whether or not to REPEAT the rule
940 See `align-rules-list' for more information about these options.
942 The non-interactive form of the previous example would look something like:
943 (align-regexp (point-min) (point-max) \"\\\\(\\\\s-*\\\\)(\")
945 This function is a nothing more than a small wrapper that helps you
946 construct a rule to pass to `align-region', which does the real work."
949 (list (region-beginning) (region-end))
950 (if current-prefix-arg
951 (list (read-string "Complex align using regexp: "
952 "\\(\\s-*\\)" 'align-regexp-history
)
955 "Parenthesis group to modify (justify if negative): " "1"))
957 (read-string "Amount of spacing (or column if negative): "
958 (number-to-string align-default-spacing
)))
959 (y-or-n-p "Repeat throughout line? "))
960 (list (concat "\\(\\s-*\\)"
961 (read-string "Align regexp: "))
962 1 align-default-spacing nil
))))
963 (or group
(setq group
1))
964 (or spacing
(setq spacing align-default-spacing
))
966 (list (list nil
(cons 'regexp regexp
)
967 (cons 'group
(abs group
))
972 (cons 'spacing spacing
)
973 (cons 'column
(abs spacing
)))
974 (cons 'repeat repeat
)))))
975 (align-region beg end
'entire rule nil nil
)))
978 (defun align-entire (beg end
&optional rules exclude-rules
)
979 "Align the selected region as if it were one alignment section.
980 BEG and END mark the extent of the region. If RULES or EXCLUDE-RULES
981 is set to a list of rules (see `align-rules-list'), it can be used to
982 override the default alignment rules that would have been used to
985 (align beg end
'entire rules exclude-rules
))
988 (defun align-current (&optional rules exclude-rules
)
989 "Call `align' on the current alignment section.
990 This function assumes you want to align only the current section, and
991 so saves you from having to specify the region. If RULES or
992 EXCLUDE-RULES is set to a list of rules (see `align-rules-list'), it
993 can be used to override the default alignment rules that would have
994 been used to align that section."
996 (align nil nil nil rules exclude-rules
))
999 (defun align-highlight-rule (beg end title
&optional rules exclude-rules
)
1000 "Highlight the whitespace which a given rule would have modified.
1001 BEG and END mark the extent of the region. TITLE identifies the rule
1002 that should be highlighted. If RULES or EXCLUDE-RULES is set to a
1003 list of rules (see `align-rules-list'), it can be used to override the
1004 default alignment rules that would have been used to identify the text
1007 (list (region-beginning) (region-end)
1009 "Title of rule to highlight: "
1013 (list (symbol-name (car rule
)))))
1014 (append (or align-mode-rules-list align-rules-list
)
1015 (or align-mode-exclude-rules-list
1016 align-exclude-rules-list
))) nil t
)))
1017 (let ((ex-rule (assq (intern title
)
1018 (or align-mode-exclude-rules-list
1019 align-exclude-rules-list
)))
1021 (align-unhighlight-rule)
1024 (or rules
(if ex-rule
1025 (or exclude-rules align-mode-exclude-rules-list
1026 align-exclude-rules-list
)
1027 (or align-mode-rules-list align-rules-list
)))
1028 (unless ex-rule
(or exclude-rules align-mode-exclude-rules-list
1029 align-exclude-rules-list
))
1032 (if (and mode
(listp mode
))
1033 (if (equal (symbol-name (car mode
)) title
)
1034 (setq face
(cons align-highlight-change-face
1035 align-highlight-nochange-face
))
1038 (let ((overlay (make-overlay b e
)))
1039 (setq align-highlight-overlays
1040 (cons overlay align-highlight-overlays
))
1041 (overlay-put overlay
'face
1044 (cdr face
)))))))))))
1047 (defun align-unhighlight-rule ()
1048 "Remove any highlighting that was added by `align-highlight-rule'."
1050 (while align-highlight-overlays
1051 (delete-overlay (car align-highlight-overlays
))
1052 (setq align-highlight-overlays
1053 (cdr align-highlight-overlays
))))
1056 (defun align-newline-and-indent ()
1057 "A replacement function for `newline-and-indent', aligning as it goes.
1058 The alignment is done by calling `align' on the region that was
1061 (let ((separate (or (if (and (symbolp align-region-separate
)
1062 (boundp align-region-separate
))
1063 (symbol-value align-region-separate
)
1064 align-region-separate
)
1067 (call-interactively 'newline-and-indent
)
1070 (while (not (or (bobp)
1071 (align-new-section-p (point) end separate
)))
1073 (align (point) end
))))
1075 ;;; Internal Functions:
1077 (defun align-match-tex-pattern (regexp end
&optional reverse
)
1078 "Match REGEXP in TeX mode, counting backslashes appropriately.
1079 END denotes the end of the region to be searched, while REVERSE, if
1080 non-nil, indicates that the search should proceed backward from the
1086 (if reverse
're-search-backward
1088 (concat "\\(\\s-*\\)" regexp
1089 "\\(\\s-*\\)") end t
))
1090 (let ((pos (match-end 1))
1092 (while (and (> pos
(point-min))
1093 (eq (char-before pos
) ?
\\))
1094 (setq count
(1+ count
) pos
(1- pos
)))
1095 (eq (mod count
2) 1))
1096 (goto-char (match-beginning (if reverse
1 2)))))
1099 (defun align-new-section-p (beg end separator
)
1100 "Is there a section divider between BEG and END?
1101 SEPARATOR specifies how to look for the section divider. See the
1102 documentation for `align-region-separate' for more details."
1103 (cond ((or (not separator
)
1104 (eq separator
'entire
))
1106 ((eq separator
'group
)
1112 (> (count-lines beg end
) amount
)))
1113 ((stringp separator
)
1116 (re-search-forward separator end t
)))
1117 ((functionp separator
)
1118 (funcall separator beg end
))
1120 (let ((seps separator
) yes
)
1122 (if (and (>= (car seps
) beg
)
1123 (<= (car seps
) end
))
1124 (setq yes t seps nil
)
1125 (setq seps
(cdr seps
))))
1128 (defun align-adjust-col-for-rule (column _rule spacing tab-stop
)
1129 "Adjust COLUMN according to the given RULE.
1130 SPACING specifies how much spacing to use.
1131 TAB-STOP specifies whether SPACING refers to tab-stop boundaries."
1133 (setq spacing align-default-spacing
))
1138 (dotimes (_ spacing
)
1139 (setq column
(indent-next-tab-stop column
)))
1142 (defsubst align-column
(pos)
1143 "Given a position in the buffer, state what column it's in.
1144 POS is the position whose column will be taken. Note that this
1145 function will change the location of point."
1149 (defsubst align-regions
(regions props rule func
)
1150 "Align the regions specified in REGIONS, a list of cons cells.
1151 PROPS describes formatting features specific to the given regions.
1152 RULE specifies exactly how to perform the alignments.
1153 If FUNC is specified, it will be called with each region that would
1154 have been aligned, rather than modifying the text."
1157 (align-areas (car regions
) (car props
) rule func
))
1158 (setq regions
(cdr regions
)
1159 props
(cdr props
))))
1161 (defun align-areas (areas props rule func
)
1162 "Given a list of AREAS and formatting PROPS, align according to RULE.
1163 AREAS should be a list of cons cells containing beginning and ending
1164 markers. This function sweeps through all of the beginning markers,
1165 finds out which one starts in the furthermost column, and then deletes
1166 and inserts text such that all of the ending markers occur in the same
1169 If FUNC is non-nil, it will be called for each text region that would
1170 have been aligned. No changes will be made to the buffer."
1171 (let* ((column (cdr (assq 'column rule
)))
1172 (fixed (if (symbolp column
)
1173 (symbol-value column
)
1175 (justify (cdr (assq 'justify rule
)))
1180 ;; Determine the alignment column.
1184 (setq col
(max col
(align-column (caar a
)))))
1186 (goto-char (cdar a
))
1188 (if (/= ecol
(current-column))
1190 (setq ecol
(current-column))))
1192 (goto-char (caar a
))
1193 (if (and (re-search-forward "\\s-*" (cdar a
) t
)
1194 (/= (point) (cdar a
)))
1195 (let ((bcol (current-column)))
1196 (setcdr (car a
) (cons (point-marker) (cdar a
)))
1197 (goto-char (cdr (cdar a
)))
1198 (setq width
(max width
(- (current-column) bcol
))))))
1202 (setq col
(+ (align-adjust-col-for-rule
1203 col rule
(car props
) (cdr props
)) width
)))
1205 ;; Make all ending positions to occur in the goal column. Since
1206 ;; the whitespace to be modified was already deleted by
1207 ;; `align-region', all we have to do here is indent.
1210 (setq change
(and ecol
(/= col ecol
))))
1212 (when (or func change
)
1214 (let ((area (car areas
))
1219 (marker-position (car area
))
1220 (marker-position (cdr area
))
1222 (if (not (and justify
1223 (consp (cdr area
))))
1224 (goto-char (cdr area
))
1225 (goto-char (cddr area
))
1226 (let ((ecol (current-column)))
1227 (goto-char (cadr area
))
1228 (setq gocol
(- col
(- ecol
(current-column))))))
1229 (setq cur
(current-column))
1230 (cond ((< gocol
0) t
) ; don't do anything
1231 ((= cur gocol
) t
) ; don't need to
1232 ((< cur gocol
) ; just add space
1233 ;; FIXME: It is stated above that "...the
1234 ;; whitespace to be modified was already
1235 ;; deleted by `align-region', all we have
1236 ;; to do here is indent." However, this
1237 ;; doesn't seem to be true, so we first
1238 ;; delete the whitespace to avoid tabs
1240 (delete-horizontal-space t
)
1243 ;; This code works around an oddity in the
1244 ;; FORCE argument of `move-to-column', which
1245 ;; tends to screw up markers if there is any
1247 (let ((endcol (align-column
1253 (align-column (car area
)))))
1255 (goto-char (car area
))
1256 (move-to-column gocol t
))
1257 (let ((here (point)))
1258 (move-to-column endcol t
)
1259 (delete-region here
(point))
1261 (indent-to (align-adjust-col-for-rule
1262 (current-column) rule
1263 (car props
) (cdr props
)))))))))))
1264 (setq areas
(cdr areas
))))))
1266 (defmacro align--set-marker
(marker-var pos
&optional type
)
1267 "If MARKER-VAR is a marker, move it to position POS.
1268 Otherwise, create a new marker at position POS, with type TYPE."
1269 `(if (markerp ,marker-var
)
1270 (move-marker ,marker-var
,pos
)
1271 (setq ,marker-var
(copy-marker ,pos
,type
))))
1273 (defun align-region (beg end separate rules exclude-rules
1275 "Align a region based on a given set of alignment rules.
1276 BEG and END specify the region to be aligned. Either may be nil, in
1277 which case the range will stop at the nearest section division (see
1278 `align-region-separate', and `align-region-heuristic' for more
1281 The region will be divided into separate alignment sections based on
1282 the value of SEPARATE.
1284 RULES and EXCLUDE-RULES are a pair of lists describing how to align
1285 the region, and which text areas within it should be excluded from
1286 alignment. See the `align-rules-list' for more information on the
1287 required format of these two lists.
1289 If FUNC is specified, no text will be modified. What `align-region'
1290 will do with the rules is to search for the alignment areas, as it
1291 regularly would, taking account for exclusions, and then call FUNC,
1292 first with the beginning and ending of the region to be aligned
1293 according to that rule (this can be different for each rule, if BEG
1294 and END were nil), and then with the beginning and ending of each
1295 text region that the rule would have applied to.
1297 The signature of FUNC should thus be:
1299 (defun my-align-function (beg end mode)
1300 \"If MODE is a rule (a list), return t if BEG to END are to be searched.
1301 Otherwise BEG to END will be a region of text that matches the rule's
1302 definition, and MODE will be non-nil if any changes are necessary.\"
1303 (unless (and mode (listp mode))
1304 (message \"Would have aligned from %d to %d...\" beg end)))
1306 This feature (of passing a FUNC) is used internally to locate the
1307 position of exclusion areas, but could also be used for any other
1308 purpose where you might want to know where the regions that the
1309 aligner would have dealt with are."
1310 (let ((end-mark (and end
(copy-marker end t
)))
1312 (report (and (not func
) align-large-region beg end
1313 (>= (- end beg
) align-large-region
)))
1315 (rule-count (length rules
))
1317 (if (and align-indent-before-aligning real-beg end-mark
)
1318 (indent-region real-beg end-mark nil
))
1320 (let* ((rule (car rules
))
1321 (run-if (assq 'run-if rule
))
1322 (modes (assq 'modes rule
)))
1323 ;; unless the `run-if' form tells us not to, look for the
1325 (unless (or (and modes
(not (apply #'derived-mode-p
(eval (cdr modes
)))))
1326 (and run-if
(not (funcall (cdr run-if
)))))
1327 (let* ((case-fold-search case-fold-search
)
1328 (case-fold (assq 'case-fold rule
))
1329 (regexp (cdr (assq 'regexp rule
)))
1330 (regfunc (and (functionp regexp
) regexp
))
1331 (rulesep (assq 'separate rule
))
1332 (thissep (if rulesep
(cdr rulesep
) separate
))
1347 ;; if beg and end were not given, figure out what the
1348 ;; current alignment region should be. Depending on the
1349 ;; value of `align-region-separate' it's possible for
1350 ;; each rule to have its own definition of what that
1351 ;; current alignment section is.
1354 (if (or (not thissep
) (eq thissep
'entire
))
1355 (error "Cannot determine alignment region for `%s'"
1356 (symbol-name (cdr (assq 'title rule
)))))
1358 (while (and (not (eobp))
1359 (looking-at "^\\s-*$"))
1361 (let* ((here (point))
1365 (and align-region-heuristic
1367 align-region-heuristic
))))
1369 (funcall regfunc terminus t
)
1370 (re-search-backward regexp
1372 (if (align-new-section-p (point) here thissep
)
1375 (setq here
(point))))
1384 (and align-region-heuristic
1386 align-region-heuristic
))))
1388 (funcall regfunc terminus nil
)
1389 (re-search-forward regexp terminus t
))))
1390 (if (align-new-section-p here
(point) thissep
)
1393 (setq here
(point))))
1398 (align--set-marker end-mark end t
)
1401 ;; If we have a region to align, and `func' is set and
1402 ;; reports back that the region is ok, then align it.
1403 (when (or (not func
)
1404 (funcall func beg end rule
))
1405 (let (rule-beg exclude-areas
)
1406 ;; determine first of all where the exclusions
1407 ;; lie in this region
1413 (or (and mode
(listp mode
))
1419 (sort exclude-areas
#'car-less-than-car
))))
1421 ;; set `case-fold-search' according to the
1422 ;; (optional) `case-fold' property
1424 (setq case-fold-search
(cdr case-fold
)))
1426 ;; while we can find the rule in the alignment
1428 (while (and (< (point) end-mark
)
1429 (setq search-start
(point))
1431 (funcall regfunc end-mark nil
)
1432 (re-search-forward regexp
1435 ;; give the user some indication of where we
1436 ;; are, if it's a very large region being
1439 (let ((symbol (car rule
)))
1440 (if (and symbol
(symbolp symbol
))
1442 "Aligning `%s' (rule %d of %d) %d%%..."
1443 (symbol-name symbol
) rule-index rule-count
1444 (floor (* (- (point) real-beg
) 100.0)
1445 (- end-mark real-beg
)))
1448 (floor (* (- (point) real-beg
) 100.0)
1449 (- end-mark real-beg
))))))
1451 ;; if the search ended us on the beginning of
1452 ;; the next line, move back to the end of the
1454 (if (and (bolp) (> (point) search-start
))
1457 ;; lookup the `group' attribute the first time
1460 (setq groups
(or (cdr (assq 'group rule
)) 1))
1461 (unless (listp groups
)
1462 (setq groups
(list groups
)))
1463 (setq first
(car groups
)))
1466 (setq spacing
(cdr (assq 'spacing rule
))
1471 (let ((rule-ts (assq 'tab-stop rule
)))
1474 ((symbolp align-to-tab-stop
)
1475 (symbol-value align-to-tab-stop
))
1477 align-to-tab-stop
)))
1480 ;; test whether we have found a match on the same
1481 ;; line as a previous match
1482 (when (> (point) eol
)
1484 (align--set-marker eol
(line-end-position)))
1486 ;; lookup the `repeat' attribute the first time
1488 (setq repeat
(cdr (assq 'repeat rule
))
1491 ;; lookup the `valid' attribute the first time
1493 (setq valid
(assq 'valid rule
)
1496 ;; remember the beginning position of this rule
1497 ;; match, and save the match-data, since either
1498 ;; the `valid' form, or the code that searches for
1499 ;; section separation, might alter it
1500 (setq rule-beg
(match-beginning first
)
1501 save-match-data
(match-data))
1504 (error "No match for subexpression %s" first
))
1506 ;; unless the `valid' attribute is set, and tells
1507 ;; us that the rule is not valid at this point in
1509 (unless (and valid
(not (funcall (cdr valid
))))
1511 ;; look to see if this match begins a new
1512 ;; section. If so, we should align what we've
1513 ;; collected so far, and then begin collecting
1514 ;; anew for the next alignment section
1515 (when (and last-point
1516 (align-new-section-p last-point rule-beg
1518 (align-regions regions align-props rule func
)
1520 (setq align-props nil
))
1521 (align--set-marker last-point rule-beg t
)
1523 ;; restore the match data
1524 (set-match-data save-match-data
)
1526 ;; check whether the region to be aligned
1527 ;; straddles an exclusion area
1528 (let ((excls exclude-areas
))
1529 (setq exclude-p nil
)
1531 (if (and (< (match-beginning (car groups
))
1533 (> (match-end (car (last groups
)))
1537 (setq excls
(cdr excls
)))))
1539 ;; go through the parenthesis groups
1540 ;; matching whitespace to be contracted or
1541 ;; expanded (or possibly justified, if the
1542 ;; `justify' attribute was set)
1545 ;; We must use markers, since
1546 ;; `align-areas' may modify the buffer.
1547 ;; Avoid polluting the markers.
1548 (let* ((group-beg (copy-marker
1549 (match-beginning g
) t
))
1550 (group-end (copy-marker
1552 (region (cons group-beg group-end
))
1553 (props (cons (if (listp spacing
)
1556 (if (listp tab-stop
)
1559 (push group-beg markers
)
1560 (push group-end markers
)
1561 (setq index
(if same
(1+ index
) 0))
1563 ((nth index regions
)
1564 (setcar (nthcdr index regions
)
1566 (nth index regions
))))
1569 (list (list region
)))
1570 (nconc align-props
(list props
)))
1573 (list (list region
)))
1574 (setq align-props
(list props
)))))
1575 ;; If any further rule matches are found
1576 ;; before `eol', they are on the same
1577 ;; line as this one; this can only
1578 ;; happen if the `repeat' attribute is
1581 (setq spacing
(cdr spacing
)))
1582 (if (listp tab-stop
)
1583 (setq tab-stop
(cdr tab-stop
)))
1586 ;; if `repeat' has not been set, move to
1587 ;; the next line; don't bother searching
1588 ;; anymore on this one
1589 (if (and (not repeat
) (not (bolp)))
1592 ;; if the search did not change point,
1593 ;; move forward to avoid an infinite loop
1594 (if (= (point) search-start
)
1597 ;; when they are no more matches for this rule,
1598 ;; align whatever was left over
1600 (align-regions regions align-props rule func
))))))))
1601 (setq rules
(cdr rules
)
1602 rule-index
(1+ rule-index
)))
1603 ;; This function can use a lot of temporary markers, so instead of
1604 ;; waiting for the next GC we delete them immediately (Bug#10047).
1605 (when end-mark
(set-marker end-mark nil
))
1610 (message "Aligning...done"))))
1616 (run-hooks 'align-load-hook
)
1618 ;;; align.el ends here