Files
emacs/lisp/sql-indent/sql-indent.el
2023-11-04 19:26:41 +01:00

2584 lines
100 KiB
EmacsLisp
Raw Permalink Blame History

This file contains invisible Unicode characters
This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.
;;; sql-indent.el --- Support for indenting code in SQL files. -*- lexical-binding: t -*-
;; Copyright (C) 2015, 2017-2018 Free Software Foundation, Inc
;; Author: Alex Harsanyi <AlexHarsanyi@gmail.com>
;; Created: 27 Sep 2006
;; Version: 1.7
;; Keywords: languages sql
;; Homepage: https://github.com/alex-hhh/emacs-sql-indent
;; Package-Requires: ((cl-lib "0.5"))
;;
;; This program is free software; you can redistribute it and/or modify
;; it under the terms of the GNU General Public License as published by
;; the Free Software Foundation; either version 3 of the License, or
;; (at your option) any later version.
;;
;; This program is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
;; GNU General Public License for more details.
;;
;; You should have received a copy of the GNU General Public License
;; along with GNU Emacs. If not, see <https://www.gnu.org/licenses/>.
;;; Commentary:
;;
;; `sqlind-minor-mode' is a minor mode that enables syntax-based indentation
;; for `sql-mode' buffers: the TAB key indents the current line based on the
;; SQL code on previous lines. To setup syntax-based indentation for every
;; SQL buffer, add `sqlind-minor-mode' to `sql-mode-hook'. Indentation rules
;; are flexible and can be customized to match your personal coding style.
;; For more information, see the "sql-indent.org" file.
;;
;; The package also defines align rules so that the `align' function works for
;; SQL statements, see `sqlind-align-rules'.
;;; Code:
(require 'sql)
(require 'cl-lib)
;;;; General setup
(defvar sqlind-syntax-table
(let ((table (make-syntax-table)))
;; C-style comments /**/ (see elisp manual "Syntax Flags"))
(modify-syntax-entry ?/ ". 14" table)
(modify-syntax-entry ?* ". 23" table)
;; double-dash starts comment
(modify-syntax-entry ?- ". 12b" table)
;; newline and formfeed end coments
(modify-syntax-entry ?\n "> b" table)
(modify-syntax-entry ?\f "> b" table)
;; single quotes (') quotes delimit strings
(modify-syntax-entry ?' "\"" table)
;; backslash is no escape character
(modify-syntax-entry ?\\ "." table)
;; the following are symbol constituents. Note that the dot '.' is more
;; usefull as a symbol constituent than as a punctuation char.
(modify-syntax-entry ?_ "_" table)
(modify-syntax-entry ?. "_" table)
(modify-syntax-entry ?$ "_" table)
(modify-syntax-entry ?# "_" table)
(modify-syntax-entry ?% "_" table)
table)
"Syntax table used in `sql-mode' for indenting SQL code.
This is slightly different than the syntax table used for
navigation: some punctuation characters are made symbol
constituents so that syntactic navigation works over them.")
;;;; Utilities
;; The following routines perform rudimentary syntactical analysis of SQL
;; code. The indentation engine decides how to indent based on what this code
;; returns. The main function is `sqlind-syntax-of-line'.
;;
;; To examine the syntax of the current line, you can use the
;; `sqlind-show-syntax-of-line'. This is only useful if you want to debug this
;; package or are just curious.
(defconst sqlind-comment-start-skip "\\(--+\\|/\\*+\\)\\s *"
"Regexp to match the start of a SQL comment.")
(defconst sqlind-comment-end "\\*+/"
"Regexp to match the end of a multiline SQL comment.")
(defvar sqlind-comment-prefix "\\*+\\s "
"Regexp to match the line prefix inside comments.
This is used to indent multi-line comments.")
(defsubst sqlind-in-comment-or-string (pos)
"Return non nil if POS is inside a comment or a string.
We actually return \\='string if POS is inside a string,
\\='comment if POS is inside a comment, nil otherwise."
(syntax-ppss-context (syntax-ppss pos)))
(defun sqlind-backward-syntactic-ws ()
"Move point backwards over whitespace and comments.
Leave point on the first character which is not syntactic
whitespace, or at the beginning of the buffer."
(let ((done nil))
(while (not done)
(skip-chars-backward " \t\n\r\f\v")
(unless (eq (point) (point-min))
(forward-char -1))
(let ((pps (syntax-ppss (point))))
(if (nth 4 pps) ; inside a comment?
(goto-char (nth 8 pps)) ; move to comment start than repeat
(setq done t)))))
(point))
(defun sqlind-forward-syntactic-ws ()
"Move point forward over whitespace and comments.
Leave point at the first character which is not syntactic
whitespace, or at the end of the buffer."
;; if we are inside a comment, move to the comment start and scan
;; from there.
(let ((pps (syntax-ppss (point))))
(when (nth 4 pps)
(goto-char (nth 8 pps))))
(let ((done nil))
(while (not done)
(skip-chars-forward " \t\n\r\f\v")
(cond ((looking-at sqlind-comment-start-skip) (forward-comment 1))
;; a slash ("/") by itself is a SQL*plus directive and
;; counts as whitespace
((looking-at "/\\s *$") (goto-char (match-end 0)))
(t (setq done t)))))
(point))
(defun sqlind-search-backward (start regexp limit)
"Search for REGEXP from START backward until LIMIT.
Finds a match that is not inside a comment or string, moves point
to the match and returns it. If no match is found, point is moved
to LIMIT and nil is returned."
(goto-char start)
(let ((done nil))
(while (and (not done)
(re-search-backward regexp limit 'noerror))
(when (sqlind-same-level-statement (point) start)
(setq done (point))))
done))
(defsubst sqlind-match-string (pos)
"Return the match data at POS in the current buffer.
This is similar to `match-data', but the text is fetched without
text properties and it is conveted to lower case."
(let ((start (match-beginning pos))
(end (match-end pos)))
(when (and start end)
(downcase (buffer-substring-no-properties start end)))))
(defsubst sqlind-labels-match (lb1 lb2)
"Return t when LB1 equals LB2 or LB1 is an empty string.
This is used to compare start/end block labels where the end
block label might be empty."
(or (string= lb1 lb2)
(string= lb1 "")))
(defun sqlind-same-level-statement (point start)
"Return t if POINT is at the same syntactic level as START.
This means that POINT is at the same nesting level and not inside
a string or comment."
(save-excursion
(let ((ppss-point (syntax-ppss point))
(ppss-start (syntax-ppss start)))
(and (equal (nth 3 ppss-point) (nth 3 ppss-start)) ; string
(equal (nth 4 ppss-point) (nth 4 ppss-start)) ; comment
(= (nth 0 ppss-point) (nth 0 ppss-start)))))) ; same nesting
(defun sqlind-column-definition-start (pos limit)
"Find the beginning of a column definition in a select statement.
POS is the current position of the line to be indented, assumed
to be in a \\='select-column-continuation syntax.
LIMIT is the limit of the search, the beginning of the select
statement."
(save-excursion
(goto-char pos)
(catch 'found
(while (re-search-backward "," limit 'noerror)
(when (sqlind-same-level-statement (point) limit)
(forward-char 1)
(sqlind-forward-syntactic-ws)
(throw 'found (point))))
;; nothing was found in (while ...) so try to find the first column definition.
(goto-char limit)
(forward-sexp)
(sqlind-forward-syntactic-ws)
(point))))
(defun sqlind-syntax (context)
"Return the most specific syntax of CONTEXT.
See `sqlind-syntax-of-line' for the definition of CONTEXT."
(when context
(caar context)))
(defun sqlind-syntax-symbol (context)
"Return the syntax symbol for the most specific syntax of CONTEXT.
See `sqlind-syntax-of-line' for the definition of CONTEXT."
(when context
(let ((syntax-part (caar context)))
(if (symbolp syntax-part)
syntax-part
(car syntax-part)))))
(defun sqlind-syntax-keyword (context)
"Return the syntax keyword for the most specific syntax of CONTEXT.
This is used for complex syntax symbols like \\='(in-block case
\"\"), in that case, it will return the \\='case symbol. See
`sqlind-syntax-of-line' for the definition of CONTEXT."
(when context
(let ((syntax-part (caar context)))
(if (symbolp syntax-part)
nil ; no KEYWORD
(nth 1 syntax-part)))))
(defun sqlind-anchor-point (context)
"Return the anchor point for the most specifc syntax of CONTEXT.
See `sqlind-syntax-of-line' for the definition of CONTEXT."
(when context
(cdar context)))
(defun sqlind-outer-context (context)
"Return the outer context from CONTEXT.
See `sqlind-syntax-of-line' for the definition of CONTEXT."
(when context
(cdr context)))
(defun sqlind-find-context (syntax-symbol context)
"Find SYNTAX-SYMBOL in the CONTEXT chain.
CONTEXT chain is a list of (SYNTAX-SYMBOL . ANCHOR), as returned
by `sqlind-syntax-of-line'. The function finds the fist element
which matches the specified syntax symbol and returns the list
from that point.
See `sqlind-indentation-syntax-symbols' for the possible syntax
symbols and their meaning."
(cond ((null context)
nil)
((eq syntax-symbol (sqlind-syntax-symbol context))
context)
(t
(sqlind-find-context syntax-symbol (sqlind-outer-context context)))))
(defun sqlind-looking-at-begin-transaction ()
"Return t if the point is on a \"begin transaction\" statement."
(and (looking-at "begin")
(save-excursion
(forward-word 1)
(sqlind-forward-syntactic-ws)
(looking-at "transaction\\>\\|work\\>\\|;"))))
;;;; Syntactic analysis of SQL code
;;;;; Find the beginning of the current statement
(defconst sqlind-sqlplus-directive
(concat ;; SET is handled in a special way, to avoid conflicts with the SET
;; keyworkd in updated clauses
"\\(^set\\s-+\\w+\\(\\s-+[^=].*\\)?$\\)\\|\\(^"
(regexp-opt '("column" "rem" "define" "spool" "prompt"
"clear" "compute" "whenever" "@" "@@" "start")
t)
"\\)\\b")
"Match an SQL*Plus directive at the beginning of a line.
A directive always stands on a line by itself -- we use that to
determine the statement start in SQL*Plus scripts.")
(defconst sqlind-sqlite-directive
"^[.].*?\\>"
"Match an SQLite directive at the beginning of a line.
A directive always stands on a line by itself -- we use that to
determine the statement start in SQLite scripts.")
(defconst sqlind-ms-directive
(concat
"\\(^set\\s-+\\(\\w\\|\\s_\\)+\\s-+\\(on\\|off\\)\\)\\|\\(^"
(regexp-opt '("use" "go" "declare") t)
"\\)\\b")
"Match an MS SQL Sever directive at the beginning of a line.")
(defun sqlind-beginning-of-directive ()
"Return the position of an SQL directive, or nil.
We will never move past one of these in our scan. We also assume
they are one-line only directives."
(let ((rx (cl-case (and (boundp 'sql-product) sql-product)
(ms sqlind-ms-directive)
(sqlite sqlind-sqlite-directive)
(oracle sqlind-sqlplus-directive)
(t nil))))
(when rx
(save-excursion
(when (re-search-backward rx nil 'noerror)
(forward-line 1)
(point))))))
(defvar sqlind-search-limit nil
"Limit of search when looking for syntactic elements.
This variable is dynamically bound.")
(defun sqlind-beginning-of-statement-1 (limit)
"Return the position of a block start, or nil.
But don't go before LIMIT."
(save-excursion
(catch 'done
(while (> (point) (or limit (point-min)))
(when (re-search-backward ";\\|:=\\|\\_<\\(declare\\|\\(begin\\(\\(\\s-+not\\)?\\s-+atomic\\)?\\)\\|cursor\\|for\\|while\\|loop\\|if\\|then\\|else\\|elsif\\|elseif\\)\\_>\\|)\\|\\$\\$"
limit 'noerror)
(unless (sqlind-in-comment-or-string (point))
(let ((candidate-pos (match-end 0)))
(cond ((looking-at ")")
;; Skip parenthesis expressions, we don't want to find one
;; of the keywords inside one of them and think this is a
;; statement start.
(progn (forward-char 1) (forward-sexp -1)))
((looking-at "cursor\\|for")
(unless (eq sql-product 'postgres)
(throw 'done (point))))
((looking-at "while")
(throw 'done (point)))
((looking-at "declare")
(when (eq sql-product 'postgres)
(throw 'done (point))))
((looking-at "else?if")
;; statement begins at the start of the keyword
(throw 'done (point)))
((looking-at "then\\|else")
;; then and else start statements when they are inside
;; blocks, not expressions.
(sqlind-backward-syntactic-ws)
(when (looking-at ";")
;; Statement begins after the keyword
(throw 'done candidate-pos)))
((looking-at "if")
(when (sqlind-good-if-candidate)
;; statement begins at the start of the keyword
(throw 'done (point))))
((looking-at ":=")
;; assignment statements start at the assigned variable
(sqlind-backward-syntactic-ws)
(forward-sexp -1)
(throw 'done (point)))
((looking-at "\\$\\$")
(when (eq sql-product 'postgres)
(sqlind-forward-syntactic-ws)
(throw 'done (point))))
((sqlind-looking-at-begin-transaction)
;; This is a "begin transaction" call, statement begins
;; at "begin", see #66
(throw 'done (point)))
((not (sqlind-in-comment-or-string (point)))
(throw 'done candidate-pos))))))))))
(defun sqlind-beginning-of-statement ()
"Move point to the beginning of the current statement."
(interactive)
(goto-char
(or
;; If we are inside a paranthesis expression, the start is the start of
;; that expression.
(let ((ppss (syntax-ppss (point))))
(when (> (nth 0 ppss) 0)
(nth 1 ppss)))
;; Look for an ordinary statement start
(or (sqlind-beginning-of-statement-1 sqlind-search-limit)
;; Fall back on the search limit
sqlind-search-limit)
;; ... or point-min
(point-min)))
;; a loop keyword might be part of an "end loop" statement, in that case,
;; the statement starts with the "end" keyword. we use skip-syntax-backward
;; so we won't skip over a semicolon (;)
(let ((pos (point)))
(skip-syntax-backward "w")
(if (looking-at "loop")
(progn
(forward-word -1)
(if (looking-at "\\bend\\b")
(goto-char (match-beginning 0))
(goto-char pos)))
(goto-char pos)))
;; now skip over any whitespace and comments until we find the first
;; character that is program code.
(sqlind-forward-syntactic-ws))
;;;;; Find the syntax and beginning of the current block
(defconst sqlind-end-statement-regexp
"\\_<end\\_>\\(?:[ \t\n\r\f]*\\)\\(if\\_>\\|loop\\_>\\|case\\_>\\)?\\(?:[ \t\n\r\f]*\\)\\([a-z0-9_]+\\)?"
"Match an end of statement.
Matches a string like \"end if|loop|case MAYBE-LABEL\".")
(defvar sqlind-end-stmt-stack nil
"Stack of end-of-statement positions.
This is used by the sqlind-maybe-* functions to skip over SQL
programming blocks. This variable is dynamically bound.")
(defun sqlind-maybe-end-statement ()
"Look for SQL end statements return t if found one.
If (point) is at an end statement, add it to the
`sqlind-end-stmt-stack' and return t, otherwise return nil.
See also `sqlind-beginning-of-block'"
(when (looking-at sqlind-end-statement-regexp)
(prog1 t ; make sure we return t
(let ((kind (or (sqlind-match-string 1) ""))
(label (or (sqlind-match-string 2) "")))
(push (list (point) (if (equal kind "") nil (intern kind)) label)
sqlind-end-stmt-stack)))))
(defun sqlind-maybe-then-statement ()
"Find the corresponding start block for a \"then\" statement.
When (point) is on a \"then\" statement, find the corresponding
start of the block and report its syntax. This code will skip
over nested statements to determine the actual start.
Only keywords in program code are matched, not the ones inside
expressions.
See also `sqlind-beginning-of-block'"
(when (looking-at "then")
(prog1 t ; make sure we return t
(let ((start-pos (point)))
;; a then keyword at the begining of a line is a block start
(when (null sqlind-end-stmt-stack)
(save-excursion
(back-to-indentation)
(when (eq (point) start-pos)
(throw 'finished (list 'in-block 'then "")))))
;; if it is not at the beginning of a line, the beginning of
;; the statement is the block start
(ignore-errors (forward-char -1))
(sqlind-beginning-of-statement)
;; a then keyword only starts a block when it is part of an
;; if, case/when or exception statement
(cond
((looking-at "\\(<<[a-z0-9_]+>>\\)?\\(?:[ \t\n\r\f]*\\)\\(\\(?:els\\)?if\\)\\_>")
(let ((if-label (sqlind-match-string 1))
(if-kind (intern (sqlind-match-string 2)))) ; can be if or elsif
(setq if-label (if if-label (substring if-label 2 -2) ""))
(if (null sqlind-end-stmt-stack)
(throw 'finished (list 'in-block if-kind if-label))
;; "if" blocks (but not "elsif" blocks) need to be
;; ended with "end if"
(when (eq if-kind 'if)
(cl-destructuring-bind (pos kind label)
(pop sqlind-end-stmt-stack)
(unless (and (eq kind 'if)
(sqlind-labels-match label if-label))
(throw 'finished
(list 'syntax-error
"bad closing for if block" (point) pos))))))))
((looking-at "\\(<<[a-z0-9_]+>>\\)?\\(?:[ \t\n\r\f]*\\)case\\_>")
;; find the nearest when block, but only if there are no
;; end statements in the stack
(let ((case-label (sqlind-match-string 1)))
(setq case-label
(if case-label (substring case-label 2 -2) ""))
(if (null sqlind-end-stmt-stack)
(save-excursion
(when (sqlind-search-backward start-pos "\\_<when\\_>" (point))
(throw 'finished (list 'in-block 'case case-label))))
;; else
(cl-destructuring-bind (pos kind label)
(pop sqlind-end-stmt-stack)
(unless (and (eq kind 'case)
(sqlind-labels-match label case-label))
(throw 'finished
(list 'syntax-error
"bad closing for case block" (point) pos)))))))
((looking-at "exception\\_>")
;; an exception statement is a block start only if we have
;; no end statements in the stack
(when (null sqlind-end-stmt-stack)
(throw 'finished (list 'in-block 'exception ""))))
(t ; restore position if we didn't do anything
(goto-char start-pos)
nil))))))
(defun sqlind-good-if-candidate ()
"Return non-nil if point is on an actual if statement.
We try to avoid false positives, like \"end if\" or the various
\"drop STUFF if exists\" variants."
(and (looking-at "if")
(save-excursion
(sqlind-backward-syntactic-ws)
(forward-word -1)
;; we don't want to match an "end if", and things like "drop index if
;; exists..." and "create index if not exist..."
(not (looking-at "end\\|schema\\|table\\|view\\|index\\|constraint\\|type\\|trigger\\|procedure\\|function\\|routine\\|package\\|body\\|extension")))))
(defun sqlind-maybe-if-statement ()
"If (point) is on an IF statement, report its syntax."
(when (sqlind-good-if-candidate)
(cond ((null sqlind-end-stmt-stack)
(throw 'finished (list 'in-block 'if "")))
(t
(cl-destructuring-bind (pos kind _label)
(pop sqlind-end-stmt-stack)
(unless (eq kind 'if)
(throw 'finshed
(list 'syntax-error
"bad closing for if block" (point) pos))))))))
(defun sqlind-maybe-case-statement ()
"If (point) is on a case statement."
(when (looking-at "case")
(save-excursion
(sqlind-backward-syntactic-ws)
(forward-word -1)
(unless (looking-at "end") ; we don't want to match an "end case" here
(if (null sqlind-end-stmt-stack)
(throw 'finished (list 'in-block 'case ""))
(cl-destructuring-bind (pos kind _label)
(pop sqlind-end-stmt-stack)
(unless (or (not kind) (eq kind 'case))
(throw 'finished
(list 'syntax-error
"bad closing for case block" (point) pos)))))))))
(defun sqlind-maybe-else-statement ()
"If (point) is on an ELSE statement, report its syntax.
Only keywords in program code are matched, not the ones inside
expressions.
See also `sqlind-beginning-of-block'"
;; an else statement is only a block start if the `sqlind-end-stmt-stack' is
;; empty, otherwise, we don't do anything.
(when (and (looking-at "els\\(e\\|if\\)")
(null sqlind-end-stmt-stack))
(throw 'finished (list 'in-block (intern (sqlind-match-string 0)) ""))))
(defun sqlind-maybe-loop-statement ()
"If (point) is on a LOOP statement, report its syntax.
Only keywords in program code are matched, not the ones inside
expressions.
See also `sqlind-beginning-of-block'"
(when (looking-at "loop")
(prog1 t ; make sure we return t
(sqlind-beginning-of-statement)
;; note that we might have found a loop in an "end loop;" statement.
(or (sqlind-maybe-end-statement)
(progn
(let ((posn (point)))
(unless (looking-at "<<") ;; whe're inside an label.
(forward-word -1)
(back-to-indentation))
(let ((loop-label (if (looking-at "<<\\([a-z0-9_]+\\)>>")
(sqlind-match-string 1) "")))
(goto-char posn)
;; start of loop. this always starts a block, we only check if
;; the labels match
(if (null sqlind-end-stmt-stack)
(throw 'finished (list 'in-block 'loop loop-label))
(cl-destructuring-bind (pos kind label)
(pop sqlind-end-stmt-stack)
(unless (and (eq kind 'loop)
(sqlind-labels-match label loop-label))
(throw 'finished
(list 'syntax-error
"bad closing for loop block" (point) pos))))))))))))
(defun sqlind-maybe-begin-statement ()
"Return the syntax of a \"begin\" statement.
If (point) is on a \"begin\" statement, report its syntax. Only
keywords in program code are matched, not the ones inside
expressions.
See also `sqlind-beginning-of-block'"
(when (and (looking-at "begin") (not (sqlind-looking-at-begin-transaction)))
;; a begin statement starts a block unless it is the first begin in a
;; procedure over which we need to skip it.
(prog1 t ; make sure we return t
(let* ((saved-pos (point))
(begin-label (save-excursion
(sqlind-beginning-of-statement)
(if (looking-at "<<\\([a-z0-9_]+\\)>>\\_>")
(sqlind-match-string 1) "")))
(previous-block (save-excursion
(ignore-errors (forward-char -1))
(cons (sqlind-beginning-of-block) (point))))
(previous-block-kind (nth 0 previous-block)))
(goto-char saved-pos)
(when (null sqlind-end-stmt-stack)
(throw 'finished
(cond ((memq previous-block-kind '(toplevel declare-statement))
(list 'in-begin-block 'toplevel-block begin-label))
((and (listp previous-block-kind)
(eq (nth 0 previous-block-kind) 'defun-start))
(list 'in-begin-block 'defun (nth 1 previous-block-kind)))
((and (listp previous-block-kind)
(memq (nth 0 previous-block-kind) '(package package-body)))
(list 'in-begin-block 'package (nth 1 previous-block-kind)))
(t
(list 'in-begin-block nil begin-label)))))
(cl-destructuring-bind (pos kind label) (pop sqlind-end-stmt-stack)
(cond
(kind
(throw 'finished
(list 'syntax-error "bad closing for begin block" (point) pos)))
((not (equal begin-label ""))
;; we have a begin label. In this case it must match the end
;; label
(unless (equal begin-label label)
(throw 'finished
(list 'syntax-error "mismatched block labels" (point) pos))))
(t
;; we don't have a begin label. In this case, the begin
;; statement might not start a block if it is the begining of a
;; procedure or declare block over which we need to skip.
(cond ((memq previous-block-kind '(toplevel declare-statement))
(goto-char (cdr previous-block)))
((and (listp previous-block-kind)
(memq (nth 0 previous-block-kind)
'(defun-start package package-body)))
(unless (sqlind-labels-match
label (nth 1 previous-block-kind))
(throw 'finished
(list 'syntax-error
"bad end label for defun" (point) pos)))
(goto-char (cdr previous-block)))))))))))
(defun sqlind-maybe-declare-statement ()
"If (point) is on a DECLARE statement, report its syntax.
Only keywords in program code are matched, not the ones inside
expressions, also we don't match DECLARE directives here.
See also `sqlind-beginning-of-block'"
(when (looking-at "declare")
;; In Postgres, a DECLARE statement can be a block, or define a cursor
;; (see pr67.sql, pr92.sql for examples). It is somewhat tricky to
;; determine which is which, so we use the heuristic that a declare
;; statement immediately following a $$ is a block, otherwise it is not.
(when (or (not (eq sql-product 'postgres))
(save-excursion
(sqlind-backward-syntactic-ws)
(skip-syntax-backward "_w") ; note that the $$ is symbol constituent!
(looking-at "\\(\\$\\$\\)\\|begin\\|then\\|else\\|\\(<<[a-z0-9_]+>>\\)")))
(throw 'finished
(if (null sqlind-end-stmt-stack)
'declare-statement
(list 'syntax-error "nested declare block" (point) (point)))))))
(defun sqlind-maybe-skip-create-options ()
"Move point past any MySQL option declarations.
Statements like \"CREATE VIEW\" or \"CREATE TABLE\" can have
various options betwen the CREATE keyword and the thing being
created. If such options exist at (point) the cursor is moved
past them.
Currently we move over the following options, for different
products:
MySQL:
TEMPORARY
ALGORITHM = {UNDEFINED | MERGE | TEMPTABLE}
DEFINER = { user | CURENT_USER }
SQL SECURITY { DEFINER | INVOKER }
PostgresSQL
TEMP
TEMPORARY
GLOBAL
LOCAL
UNLOGGED
MATERIALIZED
Oracle
PRIVATE
TEMP
TEMPORARY
MATERIALIZED
We don't consider if the options are valid or not for the thing
being created. We just skip any and all of them that are
present."
(cond
((eq sql-product 'mysql)
(catch 'finished
(while t
(cond
((looking-at "temporary\\_>")
(goto-char (match-end 0))
(sqlind-forward-syntactic-ws))
((looking-at "\\(definer\\|algorithm\\)\\(\\s-\\|[\n]\\)*=\\(\\s-\\|[\n]\\)*\\S-+")
(goto-char (match-end 0))
(sqlind-forward-syntactic-ws))
((looking-at "sql\\(\\s-\\|[\n]\\)+security\\(\\s-\\|[\n]\\)+\\S-+")
(goto-char (match-end 0))
(sqlind-forward-syntactic-ws))
(t (throw 'finished nil))))))
((eq sql-product 'postgres)
(catch 'finished
(while t
(cond
((looking-at "temp\\(orary\\)?\\_>")
(goto-char (match-end 0))
(sqlind-forward-syntactic-ws))
((looking-at "\\(global\\|local\\|unlogged\\)\\_>")
(goto-char (match-end 0))
(sqlind-forward-syntactic-ws))
((looking-at "materialized\\_>")
(goto-char (match-end 0))
(sqlind-forward-syntactic-ws))
(t (throw 'finished nil))))))
((eq sql-product 'oracle)
(catch 'finished
(while t
(cond
((looking-at "temp\\(orary\\)\\_>")
(goto-char (match-end 0))
(sqlind-forward-syntactic-ws))
((looking-at "materialized\\_>")
(goto-char (match-end 0))
(sqlind-forward-syntactic-ws))
((looking-at "private\\_>")
(goto-char (match-end 0))
(sqlind-forward-syntactic-ws))
(t (throw 'finished nil))))))))
(defun sqlind-maybe-create-statement (&optional all-statements)
"If (point) is on a CREATE statement, report its syntax.
See also `sqlind-beginning-of-block'
Normally, only block start create statements are considered (such
as creation of procedures). In particular, create
table/view/index statements are ignored unless the ALL-STATEMENTS
argument is t"
(when (or (looking-at "create\\_>\\(?:[ \t\n\r\f]+\\)\\(or\\(?:[ \t\n\r\f]+\\)replace\\_>\\)?")
(looking-at "alter\\_>"))
(prog1 t ; make sure we return t
(save-excursion
;; let's see what are we creating
(goto-char (match-end 0))
(sqlind-forward-syntactic-ws)
(sqlind-maybe-skip-create-options)
(let ((what (intern (downcase (buffer-substring-no-properties
(point)
(progn (forward-word) (point))))))
(name (downcase (buffer-substring-no-properties
(progn (sqlind-forward-syntactic-ws)
;; Skip over a possible "if (not)
;; exists", to get the actual name
(when (looking-at "if\\(\\s-\\|[\n]\\)+\\(not\\)?\\(\\s-\\|[\n]\\)exists")
(goto-char (match-end 0))
(sqlind-forward-syntactic-ws))
(point))
(progn (skip-syntax-forward "w_()") (point))))))
(when (and (eq what 'package) (equal name "body"))
(setq what 'package-body)
(setq name (downcase
(buffer-substring-no-properties
(progn (sqlind-forward-syntactic-ws) (point))
(progn (skip-syntax-forward "w_()") (point))))))
;; Keep just the name, not the argument list
(when (string-match "\\(.*?\\)(" name)
(setq name (match-string 1 name)))
(cond
((memq what '(procedure function package package-body))
;; check is name is in the form user.name, if so then suppress user part.
(when (string-match "\\(?:.*\\.\\)?\\(.*\\)" name)
(setq name (match-string 1 name)))
(if (null sqlind-end-stmt-stack)
(throw 'finished
(list (if (memq what '(procedure function)) 'defun-start what)
name))
(cl-destructuring-bind (pos kind label) (pop sqlind-end-stmt-stack)
(when (not (eq kind nil))
(throw 'finished
(list 'syntax-error
"bad closing for create block" (point) pos)))
(unless (sqlind-labels-match label name)
(throw 'finished
(list 'syntax-error
"label mismatch in create block" (point) pos))))))
((memq what '(table view index))
;; Table, view and index creations do not begin blocks and they
;; are ignored unless the ALL-STATEMENTS parameter is t
(when all-statements
(throw 'finished (list 'create-statement what name))))
(t
(unless (null sqlind-end-stmt-stack)
(throw 'finished
(list 'syntax-error "nested create statement" (point) (point))))
(throw 'finished (list 'create-statement what name)))))))))
(defun sqlind-maybe-defun-statement ()
"If (point) is on a procedure definition statement, report its syntax.
See also `sqlind-beginning-of-block'"
(catch 'exit
(when (looking-at "\\(procedure\\|function\\)\\(?:[ \t\n\r\f]+\\)\\(?:[a-z0-9_]+\\.\\)?\\([a-z0-9_]+\\)")
(prog1 t ; make sure we return t
(let ((proc-name (sqlind-match-string 2)))
;; need to find out if this is a procedure/function
;; declaration or a definition
(save-excursion
(goto-char (match-end 0))
(sqlind-forward-syntactic-ws)
;; skip param list, if any.
(when (looking-at "(")
(ignore-errors (forward-sexp 1))
(sqlind-forward-syntactic-ws))
(when (looking-at "return\\(?:[ \t\n\r\f]+\\)\\([a-z0-9_.]+\\(?:%\\(?:row\\)?type\\)?\\)")
(goto-char (match-end 0))
(sqlind-forward-syntactic-ws))
(when (looking-at ";")
;; not a procedure after all.
(throw 'exit nil)))
(save-excursion
(sqlind-backward-syntactic-ws)
;; Find out if it is a drop procedure or function statement
(forward-word -1)
(when (looking-at "drop")
;; not a procedure after all
(throw 'exit nil))
;; Find out if it is a "comment on" statement (postgres only)
(when (and (eq sql-product 'postgres)
(looking-at "on"))
(sqlind-backward-syntactic-ws)
(forward-word -1)
(when (looking-at "comment")
;; not a procedure after all.
(throw 'exit nil))))
;; so it is a definition
;; if the procedure starts with "create or replace", move
;; point to the real start
(let ((real-start (point)))
(save-excursion
(forward-word -1)
(when (looking-at "replace")
(forward-word -2))
(when (and (or (looking-at "create\\([ \t\r\n\f]+or[ \t\r\n\f]+replace\\)?")
(looking-at "alter"))
(not (sqlind-in-comment-or-string (point))))
(setq real-start (point))))
(goto-char real-start))
(when (null sqlind-end-stmt-stack)
(throw 'finished (list 'defun-start proc-name)))
(cl-destructuring-bind (pos kind label) (pop sqlind-end-stmt-stack)
(unless (and (eq kind nil)
(sqlind-labels-match label proc-name))
(throw 'finished
(list 'syntax-error "bad end label for defun" (point) pos)))))))))
(defun sqlind-maybe-exception-statement ()
"If (point) is on an exception keyword, report its syntax.
See also `sqlind-beginning-of-block'"
(when (and (looking-at "exception")
(null sqlind-end-stmt-stack))
;; Exception is both a keyword and a type. We need to only stop on the
;; keyword. We detect that if the previous token is either ";" or
;; "BEGIN".
(save-excursion
(forward-char -1)
(sqlind-backward-syntactic-ws)
(when (or (looking-at ";")
(progn (forward-word -1) (looking-at "\\<_begin\\_>")))
(throw 'finished (list 'in-block 'exception))))))
(defun sqlind-maybe-$$-statement ()
"If (point) is on a PostgreSQL $$ quote, report its syntax.
PostgreSQL uses $$ to delimit SQL blocks in create statements,
this function tries to determine if the $$ block is a begin or an
end block and creates the appropiate syntactic context.
See also `sqlind-beginning-of-block'"
(when (looking-at "\\$\\$")
(prog1 t
(let* ((saved-pos (point)))
(ignore-errors (forward-char -1))
(sqlind-backward-syntactic-ws)
(cond ((looking-at ";")
;; Assume the $$ is ending a statement (previous line is a ';'
;; which ends another statement)
(push (list saved-pos '$$ "") sqlind-end-stmt-stack)
(goto-char saved-pos))
((progn (forward-word -1)
(looking-at "end"))
;; Assume the $$ is ending a statement (previous line contains
;; an "end" keyword)
(push (list saved-pos '$$ "") sqlind-end-stmt-stack)
(goto-char saved-pos))
((null sqlind-end-stmt-stack)
(sqlind-beginning-of-statement)
(let ((syntax (catch 'finished
(sqlind-maybe-create-statement)
(sqlind-maybe-defun-statement)
'toplevel)))
(if (and (listp syntax) (eq (nth 0 syntax) 'defun-start))
(throw 'finished (list 'in-begin-block 'defun (nth 1 syntax)))
(throw 'finished (list 'in-begin-block syntax nil)))))
(t
(sqlind-beginning-of-statement)
(cl-destructuring-bind (pos kind _label) (pop sqlind-end-stmt-stack)
(unless (eq kind '$$)
(throw 'finished
(list 'syntax-error "bad closing for $$ begin block" (point) pos))))))))))
(defconst sqlind-start-block-regexp
(concat "\\(\\_<"
(regexp-opt '("if" "then" "else" "elsif" "elseif" "loop"
"begin" "declare" "create" "alter" "exception"
"procedure" "function" "end" "case") t)
"\\_>\\)\\|)\\|\\$\\$")
"Regexp to match the start of a block.")
(defun sqlind-beginning-of-block (&optional end-statement-stack)
"Find the start of the current block and return its syntax.
END-STATEMENT-STACK contains a list of \"end\" syntaxes in
reverse order (a stack) and is used to skip over nested blocks."
(interactive)
;; This function works as follows: `sqlind-start-block-regexp` defines the
;; keywords where it stops to inspect the code. Each time it stops at one
;; of these keywords, it checks to see if the keyword is inside a comment or
;; string. If the keyworkd is not inside a comment or string, the
;; `sqlind-maybe-*` functions are called to check if the keyword is valid.
;; Each of these functions will do one of the following:
;;
;; * throw a syntax object with a 'finished tag, if they decide that the
;; keyword is valid
;;
;; * return t to indicate that they decided that the keyword is not valid
;; and `sqlind-beginning-of-block` should search for the next keyword
;;
;; * return nil to indicate that they don't recognize the keyword and
;; another `sqlind-maybe-*` function should be called
;;
;; Some of these `sqlind-maybe-*` functions are specific to the
;; `sql-product` and are only invoked for the speficied SQL dialect.
(catch 'finished
(let ((sqlind-end-stmt-stack end-statement-stack))
(while (re-search-backward sqlind-start-block-regexp sqlind-search-limit 'noerror)
(or (sqlind-in-comment-or-string (point))
(when (looking-at ")") (forward-char 1) (forward-sexp -1) t)
(sqlind-maybe-end-statement)
(sqlind-maybe-if-statement)
(sqlind-maybe-case-statement)
(sqlind-maybe-then-statement)
(sqlind-maybe-exception-statement)
(sqlind-maybe-else-statement)
(sqlind-maybe-loop-statement)
(sqlind-maybe-begin-statement)
(when (memq sql-product '(oracle postgres))
;; declare statements only start blocks in PL/SQL and PostgresSQL
(sqlind-maybe-declare-statement))
(when (eq sql-product 'postgres)
(sqlind-maybe-$$-statement))
(sqlind-maybe-create-statement)
(sqlind-maybe-defun-statement))))
'toplevel))
;;;;; Determine the syntax inside a case expression
(defconst sqlind-case-clauses-regexp
"\\_<\\(when\\|then\\|else\\|end\\)\\_>")
(defun sqlind-syntax-in-case (pos start)
"Return the syntax at POS which is part a \"case\" expression at START."
(save-excursion
(goto-char pos)
(cond ((looking-at "when\\|else")
;; A WHEN, or ELSE clause is indented relative to the start of the
;; case expression
(cons 'case-clause start))
((looking-at "end")
(cons (list 'block-end 'case "") start))
((looking-at "then")
;; THEN and ELSE clauses are indented relative to the start of the
;; when clause, which we must find
(while (not (and (re-search-backward "\\_<when\\_>")
(sqlind-same-level-statement (point) start)))
nil)
(cons 'case-clause-item (point)))
(t
;; It is a statement continuation from the closest CASE element
(while (and (not (= (point) start))
(not (and (re-search-backward sqlind-case-clauses-regexp start 'noerror)
(sqlind-same-level-statement (point) start))))
nil)
(cons 'case-clause-item-cont (point))))))
;;;;; Determine the syntax inside a with statement
(defconst sqlind-with-clauses-regexp
"\\_<\\(with\\|recursive\\)\\_>")
(defun sqlind-syntax-in-with (pos start)
"Return the syntax at POS which is part of a \"with\" statement at START."
(save-excursion
(catch 'finished
(goto-char pos)
(cond
((looking-at sqlind-with-clauses-regexp)
(throw 'finished (cons 'with-clause start)))
((and (looking-at "\\_<select\\_>")
(sqlind-same-level-statement (point) start))
(throw 'finished (cons 'with-clause start))))
(while (re-search-backward "\\_<select\\_>" start 'noerror)
(when (sqlind-same-level-statement (point) start)
(throw 'finished (sqlind-syntax-in-select pos (point)))))
(goto-char pos)
(when (looking-at "\\_<as\\_>")
(throw 'finished (cons 'with-clause-cte-cont start)))
(sqlind-backward-syntactic-ws)
(when (looking-at ",")
(throw 'finished (cons 'with-clause-cte start)))
(forward-word -1)
(when (looking-at sqlind-with-clauses-regexp)
;; We're right after the with (recursive keyword)
(throw 'finished (cons 'with-clause-cte start)))
(throw 'finished (cons 'with-clause-cte-cont start)))))
;;;;; Determine the syntax inside a select statement
(defconst sqlind-select-clauses-regexp
(concat
"\\_<\\("
"\\(\\(union\\(\\s-+all\\)?\\)\\|intersect\\|minus\\|except\\)?[ \t\r\n\f]*select\\|"
"\\(bulk[ \t\r\n\f]+collect[ \t\r\n\f]+\\)?into\\|"
"perform\\|"
"from\\|"
"where\\|"
"order[ \t\r\n\f]+by\\|"
"having\\|"
"group[ \t\r\n\f]+by\\|"
"connect[ \t\r\n\f]+by\\|"
"start[ \t\r\n\f]+with\\|"
"limit"
"\\)\\_>"))
(defconst sqlind-select-join-regexp
(regexp-opt '("inner" "left" "right" "natural" "cross" "full") 'symbols))
(defconst sqlind-join-condition-regexp
(regexp-opt '("on" "using" "and" "or") 'symbols))
(defun sqlind-find-join-start (start limit)
"Look backwards for the start of a JOIN statement,
begin looking for it at the START position in the buffer, and
look backwards until LIMIT is reached. Returns the buffer
position where the JOIN condition starts, or nil if no JOIN
statement is found."
(save-excursion
(when (sqlind-search-backward start "\\bjoin\\b" limit)
(let ((candidate (point)))
(forward-char -1)
(sqlind-backward-syntactic-ws)
(backward-word)
(if (looking-at sqlind-select-join-regexp)
(point)
;; The "outer" keyword is composed with a "left" or "right" keyword
;; so we need to move backwards one more word.
(if (looking-at "\\bouter\\b")
(progn
(forward-char -1)
(sqlind-backward-syntactic-ws)
(backward-word)
(if (looking-at "\\b\\(left\\|right\\)\\b")
(point)
candidate))
candidate))))))
(defun sqlind-syntax-in-select (pos start)
"Return the syntax ar POS which is inside a \"select\" statement at START."
(save-excursion
(catch 'finished
(goto-char pos)
;; all select query components are indented relative to the
;; start of the select statement)
(when (looking-at sqlind-select-clauses-regexp)
(throw 'finished (cons 'select-clause start)))
;; when we are not looking at a select component, find the
;; nearest one from us.
(while (sqlind-search-backward (point) sqlind-select-clauses-regexp start)
(let* ((match-pos (match-beginning 0))
(clause (sqlind-match-string 0)))
(setq clause (replace-regexp-in-string "[ \t\r\n\f]" " " clause))
(when (sqlind-same-level-statement (point) start)
(cond
((or (looking-at "select\\(\\s *\\_<\\(top\\s +[0-9]+\\|distinct\\|unique\\)\\_>\\)?")
(and (eq sql-product 'postgres) (looking-at "perform\\_>")))
;; we are in the column selection section.
(goto-char pos)
(if (looking-at ",")
(throw 'finished (cons 'select-column match-pos))
(progn
(sqlind-backward-syntactic-ws)
(throw 'finished
(cons (if (or (eq (match-end 0) (1+ (point)))
(looking-at ","))
'select-column
'select-column-continuation)
match-pos)))))
((looking-at "from")
;; FROM is only keyword if the previous char is NOT a
;; comma ','
(forward-char -1)
(sqlind-backward-syntactic-ws)
(unless (looking-at ",")
;; We are in the from section. If this line starts with 'on'
;; or the previous line ends with 'on' we have a join
;; condition
(goto-char pos)
(when (or (looking-at sqlind-join-condition-regexp)
(progn (forward-word -1)
(and (sqlind-same-level-statement (point) pos)
(looking-at sqlind-select-join-regexp))))
;; look for the join start, that will be the anchor
(let ((jstart (sqlind-find-join-start (point) start)))
(when jstart
(throw 'finished (cons 'select-join-condition jstart))))))
;; if this line starts with a ',' or the previous line starts
;; with a ',', we have a new table
(goto-char pos)
;; NOTE: the combination of tests and movement operations in
;; the when clause is not ideal...
(when (or (looking-at ",")
(looking-at sqlind-select-join-regexp)
(looking-at "join\\b")
(progn
(sqlind-backward-syntactic-ws)
(or (looking-at ",")
(progn
(forward-word -1)
(or (looking-at sqlind-select-join-regexp)
(looking-at "join\\b")
(looking-at "from\\b"))))))
(throw 'finished (cons 'select-table match-pos)))
(goto-char pos)
(let ((limit match-pos))
(if (sqlind-search-backward (point) (regexp-opt (list "," "join") 'symbols) limit)
(progn
(goto-char (match-end 0))
(sqlind-forward-syntactic-ws)
(when (looking-at "lateral")
(forward-word 1)
(sqlind-forward-syntactic-ws))
;; otherwise, we continue the table definition from the
;; previous line.
(throw 'finished
;; If, after following all these joins, we got back
;; to our line, we are in a select-table after all,
;; otherwise it is a table continuation.
(if (eq (point) pos)
(cons 'select-table match-pos)
(cons 'select-table-continuation (point)))))
(progn ; this must be the first table in the FROM section
(when (looking-at "from\\b")
(forward-word)
(sqlind-forward-syntactic-ws))
(throw 'finished (cons 'select-table-continuation (point)))))))
(t
(throw 'finished
(cons (list 'in-select-clause clause) match-pos))))))))))
;;;;; Determine the syntax inside an insert statement
(defconst sqlind-insert-clauses-regexp
"\\_<\\(insert\\([ \t\r\n\f]+into\\)?\\|values\\|select\\)\\_>")
(defun sqlind-syntax-in-insert (pos start)
"Return the syntax at POS which is inside an \"insert\" statement at START."
;; The insert clause is really easy since it has the form insert into TABLE
;; (COLUMN_LIST) values (VALUE_LIST) or insert into TABLE select
;; SELECT_CLAUSE
;;
;; note that we will never be called when point is in COLUMN_LIST or
;; VALUE_LIST, as that is a nested-statement-continuation which starts with
;; the open paranthesis.
;;
;; if we are inside the SELECT_CLAUSE, we delegate the syntax to
;; `sqlind-syntax-in-select'
(save-excursion
(catch 'finished
(goto-char pos)
;; all select query components are indented relative to the
;; start of the select statement)
(when (looking-at sqlind-insert-clauses-regexp)
(throw 'finished (cons 'insert-clause start)))
(while (re-search-backward sqlind-insert-clauses-regexp start t)
(let* ((match-pos (match-beginning 0))
(clause (sqlind-match-string 0)))
(setq clause (replace-regexp-in-string "[ \t\r\n\f]" " " clause))
(when (sqlind-same-level-statement (point) start)
(throw 'finished
(if (looking-at "select")
(sqlind-syntax-in-select pos match-pos)
(cons (list 'in-insert-clause clause) match-pos)))))))))
;;;;; Determine the syntax inside a delete statement
(defconst sqlind-delete-clauses-regexp
"\\_<\\(delete\\([ \t\r\n\f]+from\\)?\\|where\\|returning\\|\\(bulk[ \t\r\n\f]collect[ \t\r\n\f]\\)?into\\)\\_>")
(defun sqlind-syntax-in-delete (pos start)
"Return the syntax at POS which is inside a \"delete\" statement at START."
(save-excursion
(catch 'finished
(goto-char pos)
;; all select query components are indented relative to the
;; start of the select statement)
(when (looking-at sqlind-delete-clauses-regexp)
(throw 'finished (cons 'delete-clause start)))
(while (re-search-backward sqlind-delete-clauses-regexp start t)
(let* ((match-pos (match-beginning 0))
(clause (sqlind-match-string 0)))
(setq clause (replace-regexp-in-string "[ \t\r\n\f]" " " clause))
(when (sqlind-same-level-statement (point) start)
(throw 'finished
(cons (list 'in-delete-clause clause) match-pos))))))))
;;;;; Determine the syntax inside an update statement
(defconst sqlind-update-clauses-regexp
"\\_<\\(update\\|set\\|where\\)\\_>")
(defun sqlind-syntax-in-update (pos start)
"Return the syntax at POS which is inside an \"update\" statement at START."
(save-excursion
(catch 'finished
(goto-char pos)
;; all select query components are indented relative to the start of the
;; select statement)
(when (looking-at sqlind-update-clauses-regexp)
(throw 'finished (cons 'update-clause start)))
(while (re-search-backward sqlind-update-clauses-regexp start t)
(let* ((match-pos (match-beginning 0))
(clause (sqlind-match-string 0)))
(setq clause (replace-regexp-in-string "[ \t\r\n\f]" " " clause))
(when (sqlind-same-level-statement (point) start)
(throw 'finished
(cons (list 'in-update-clause clause) match-pos))))))))
;;;;; Refine the syntax of an end statement.
(defun sqlind-refine-end-syntax (end-kind end-label end-pos context)
"Return a \\='block-end syntax when line contains an \"end\" keyword.
END-KIND contains the symbol after the end statement (\\='if if
the statement is an \"end if\", \\='loop if the statement is an
\"end loop\", etc). This can be nil if there is a plain \"end\"
keyword.
END-LABEL contains the label of the end statement, when there is
one.
END-POS is the position where the \"end\" keyword is.
CONTEXT represents the syntactic context up to the current line.
The function will perform some validations, for example, an \"end
if\" must close an if statement, an \"end loop\" must close a
loop, etc. It will return a \\='syntax-error syntax if the
validation fails.
If all checks pass, it will return a (block-end KIND LABEL) where
KIND is the symbol determining the type of the block (\\='if,
\\='loop, \\='procedure, etc) and LABEL is the block label, if
there is any."
(catch 'done
(when (null context) ; can happen
(throw 'done
(cons (list 'syntax-error "end statement closes nothing"
end-pos end-pos)
end-pos)))
(let ((syntax (sqlind-syntax context))
(anchor (sqlind-anchor-point context))
(syntax-symbol (sqlind-syntax-symbol context)))
(cond
((memq syntax-symbol '(package package-body))
;; we are closing a package declaration or body, `end-kind' must be
;; empty, `end-label' can be empty or it must match the package name
(throw 'done
(cons
(cond (end-kind ; no end-kind is allowed for a package
(list 'syntax-error
"bad closing for package" anchor end-pos))
((sqlind-labels-match end-label (nth 1 syntax))
(list 'block-end syntax-symbol (nth 1 syntax)))
(t
(list 'syntax-error "mismatched end label for package"
anchor end-pos)))
anchor)))
((eq syntax-symbol 'in-begin-block)
;; we are closing a begin block (either toplevel, procedure/function
;; or a simple begin block. `end-kind' must be empty, `end-label'
;; can be empty or it must match the pakage-name
(let ((block-label (nth 2 syntax)))
(throw 'done
(cons
(cond (end-kind ; no end-kind is allowed for a begin block
(list 'syntax-error
"bad closing for begin block" anchor end-pos))
((sqlind-labels-match end-label block-label)
(list 'block-end (nth 1 syntax) block-label))
(t
(list 'syntax-error "mismatched end label for block"
anchor end-pos)))
anchor))))
((eq syntax-symbol 'in-block)
(let ((block-kind (nth 1 syntax))
(block-label (nth 2 syntax)))
(cond
((eq block-kind 'exception)
(goto-char anchor)
(throw 'done
(sqlind-refine-end-syntax
end-kind end-label end-pos (sqlind-syntax-of-line))))
((eq block-kind 'loop)
(throw 'done
(cons
(cond ((not (eq end-kind 'loop))
(list 'syntax-error "bad closing for loop block"
anchor end-pos))
((not (sqlind-labels-match end-label block-label))
(list 'syntax-error "mismatched end label for loop"
anchor end-pos))
(t
(list 'block-end block-kind block-label)))
anchor)))
((eq block-kind 'then)
(goto-char anchor)
(catch 'found
(while t
(let ((then-context (sqlind-syntax-of-line)))
(goto-char (cdar then-context))
(cond
((looking-at "when\\_>\\|then\\_>") t)
((looking-at "\\(?:<<\\([a-z0-9_]+\\)>>[ \t\r\n\f]*\\)?\\_<\\(if\\|case\\)\\_>")
(throw 'found t))
(t
(throw 'done
(cons
(list 'syntax-error "bad syntax start for then keyword"
(point) (point))
anchor)))))))
(let ((start-label (or (sqlind-match-string 1) ""))
(start-kind (intern (sqlind-match-string 2))))
(throw 'done
(cons
(cond ((not (or (null end-kind) (eq end-kind start-kind)))
(list 'syntax-error "bad closing for if/case block"
(point) end-pos))
((not (sqlind-labels-match end-label start-label))
(list 'syntax-error "mismatched labels for if/case block"
(point) end-pos))
(t
(list 'block-end start-kind start-label)))
anchor))))
((memq block-kind '(else elsif elseif))
;; search the enclosing then context and refine form there. The
;; `cdr' in sqlind-syntax-of-line is used to remove the
;; block-start context for the else clause
(goto-char anchor)
(throw 'done
(sqlind-refine-end-syntax
end-kind end-label end-pos (cdr (sqlind-syntax-of-line)))))
((memq block-kind '(if case))
(throw 'done
(cons
(cond ((not (eq end-kind block-kind))
(list 'syntax-error "bad closing for if/case block"
anchor end-pos))
((not (sqlind-labels-match end-label block-label))
(list 'syntax-error
"bad closing for if/case block (label mismatch)"
anchor end-pos))
(t (list 'block-end block-kind block-label)))
anchor)))
)))
((memq syntax-symbol '(block-start comment-start))
;; there is a more generic context following one of these
(throw 'done
(sqlind-refine-end-syntax
end-kind end-label end-pos (cdr context))))
((eq syntax-symbol 'defun-start)
(throw 'done
(cons
(if (and (null end-kind)
(sqlind-labels-match end-label (nth 1 syntax)))
(list 'block-end 'defun end-label)
(list 'syntax-error "mismatched end label for defun"
anchor end-pos))
anchor)))
((eq syntax-symbol 'block-end)
(goto-char anchor)
(forward-line -1)
(throw 'done
(sqlind-refine-end-syntax
end-kind end-label end-pos (sqlind-syntax-of-line)))))
;; if the above cond fell through, we have a syntax error
(cons (list 'syntax-error "end statement closes nothing"
end-pos end-pos)
anchor))))
;;;;; sqlind-syntax-of-line
(defun sqlind-refine-syntax (context pos have-block-context)
"Refine a basic syntax CONTEXT at POS.
CONTEXT is a syntactic context obtained by looking at the
statement start and block start, see `sqlind-syntax-of-line'. We
refine it by looking at the contents of the current line and the
contents of the anchor.
HAVE-BLOCK-CONTEXT indicates that we are indenting a statement,
not a statement-continuation POS is the same as the
`sqlind-beginning-of-statement'."
(let ((syntax (sqlind-syntax context))
(anchor (sqlind-anchor-point context))
(syntax-symbol (sqlind-syntax-symbol context)))
(goto-char pos)
(cond
;; do we start a comment?
((and (not (eq syntax-symbol 'comment-continuation))
(looking-at sqlind-comment-start-skip))
(push (cons 'comment-start anchor) context))
;; Refine a statement continuation
((memq syntax-symbol '(statement-continuation nested-statement-continuation))
;; a (nested) statement continuation which starts with loop
;; or then is a block start
(if (and have-block-context (looking-at "\\(loop\\|then\\|when\\)\\_>"))
(push (cons (list 'block-start (intern (sqlind-match-string 0))) anchor)
context)
;; else
(goto-char anchor)
(when (eq syntax 'nested-statement-continuation)
(forward-char 1)
(sqlind-forward-syntactic-ws)
(setq anchor (point)))
;; when all we have before `pos' is a label, we have a
;; labeled-statement-start
(when (looking-at "<<\\([a-z0-9_]+\\)>>")
(goto-char (match-end 0))
(forward-char 1)
(sqlind-forward-syntactic-ws)
(when (eq (point) pos)
(push (cons 'labeled-statement-start anchor) context)))
(when (looking-at "when\\_>")
(let* ((acontext (sqlind-syntax-of-line))
(asyntax (sqlind-syntax acontext)))
(cond ((equal asyntax '(in-block exception ""))
(push (cons '(in-block exception-handler "") (point)) context))
((equal asyntax '(block-start when))
;; Refine again in the context of the when line
(setq context (sqlind-refine-syntax (cdr acontext) pos have-block-context))))))
;; maybe we have a DML statement (select, insert, update and
;; delete)
;; skip a cursor definition if it is before our point, in the
;; following format:
;;
;; CURSOR name IS
;; CURSOR name type IS
(when (looking-at "cursor\\b")
(let ((origin (point)))
(forward-sexp 1) ; skip "cursor"
(sqlind-forward-syntactic-ws)
(forward-sexp 1)
(sqlind-forward-syntactic-ws)
(if (looking-at "is\\b")
(progn
(goto-char (match-end 0))
(sqlind-forward-syntactic-ws))
(forward-sexp 1)
(sqlind-forward-syntactic-ws)
(when (looking-at "is\\b")
(goto-char (match-end 0))
(sqlind-forward-syntactic-ws)))
(unless (<= (point) pos)
(goto-char origin))))
;; Skip a PostgreSQL cursor declaration
(when (and (eq sql-product 'postgres)
(looking-at "\\(\\(declare\\)\\|\\(cursor\\)\\|\\(for\\)\\)\\b"))
(when (re-search-forward "\\b\\(select\\|update\\|delete\\|insert\\)\\b" pos 'noerror)
(goto-char (match-beginning 0))))
;; skip a forall statement if it is before our point
(when (looking-at "forall\\b")
(when (re-search-forward "\\b\\(select\\|update\\|delete\\|insert\\)\\b" pos 'noerror)
(goto-char (match-beginning 0))))
;; only check for syntax inside DML clauses if we are not
;; at the start of one.
(when (< (point) pos)
(cond
;; NOTE: We only catch here "CASE" expressions, not CASE
;; statements. We also catch assignments with case (var
;; := CASE ...)
((looking-at "\\(\\w+[ \t\r\n\f]+:=[ \t\r\n\f]+\\)?\\(case\\)")
(when (< (match-beginning 2) pos)
(push (sqlind-syntax-in-case pos (match-beginning 2)) context)))
((looking-at "with")
(push (sqlind-syntax-in-with pos (point)) context))
((looking-at "select")
(push (sqlind-syntax-in-select pos (point)) context))
((and (eq sql-product 'postgres)
(looking-at "perform"))
(push (sqlind-syntax-in-select pos (point)) context))
((looking-at "insert")
(push (sqlind-syntax-in-insert pos (point)) context))
((looking-at "delete")
(push (sqlind-syntax-in-delete pos (point)) context))
((looking-at "update")
(push (sqlind-syntax-in-update pos (point)) context))))
(when (eq (sqlind-syntax-symbol context) 'select-column-continuation)
(let ((cdef (sqlind-column-definition-start pos (sqlind-anchor-point context))))
(when cdef
(save-excursion
(goto-char cdef)
(when (looking-at "case")
(push (sqlind-syntax-in-case pos (point)) context))))))
(when (eq (sqlind-syntax-symbol context) 'nested-statement-continuation)
(save-excursion
;; Look for a join expression inside a nested statement, see #70
(goto-char pos)
(when (or (looking-at sqlind-join-condition-regexp)
(progn (forward-word -1) (looking-at sqlind-join-condition-regexp)))
;; look for the join start, that will be the anchor
(let ((jstart (sqlind-find-join-start (point) anchor)))
(when jstart
(push (cons 'select-join-condition jstart) context))))))
))
;; create block start syntax if needed
((and (eq syntax-symbol 'in-block)
(memq (nth 1 syntax) '(if elsif elseif then case))
(looking-at "\\(then\\|\\(els\\(e\\|e?if\\)\\)\\)\\_>"))
(let ((what (intern (sqlind-match-string 0))))
;; the only invalid combination is a then statement in
;; an (in-block "then") context
(unless (and (eq what 'then) (equal (nth 1 syntax) 'then))
(push (cons (list 'block-start what) anchor) context))))
((and (eq syntax-symbol 'in-block)
(eq (nth 1 syntax) 'exception)
(not (looking-at "\\(when\\|end\\)\\_>")))
(save-excursion
(when (sqlind-search-backward pos "when\\_>" anchor)
(push (cons (list 'in-block 'exception-handler) (point)) context))))
;; note that begin is not a block-start in a 'in-begin-block
;; context
((and (memq syntax-symbol '(defun-start declare-statement toplevel
package package-body))
(or (looking-at "begin\\_>")
(and (eq sql-product 'postgres) (looking-at "\\$\\$"))))
(push (cons (list 'block-start 'begin) anchor) context))
((and (memq syntax-symbol '(defun-start package package-body))
(looking-at "\\(is\\|as\\)\\_>"))
(push (cons (list 'block-start 'is-or-as) anchor) context))
((and (memq syntax-symbol '(in-begin-block in-block))
(looking-at "exception\\_>"))
(push (cons (list 'block-start 'exception) anchor) context))
((and (eq syntax-symbol 'in-block)
(memq (nth 1 syntax) '(then case))
(not (looking-at "end\\s-*\\_<\\(if\\|case\\)\\_>")))
(if (looking-at "when\\_>")
(push (cons (list 'block-start 'when) anchor) context)
;; NOTE: the "when" case is handed above
(when (sqlind-search-backward pos "when\\_>" anchor)
(push (cons '(in-block when) (point)) context))))
;; indenting the select clause inside a view or a "create table as"
;; statement.
((and (eq syntax-symbol 'create-statement)
(memq (nth 1 syntax) '(view table)))
(goto-char anchor)
(catch 'done
(while (re-search-forward "\\bselect\\b" pos 'noerror)
(goto-char (match-beginning 0))
(when (sqlind-same-level-statement (point) anchor)
(push (sqlind-syntax-in-select pos (point)) context)
(throw 'done nil))
(goto-char (match-end 0)))))
;; create a block-end syntax if needed
((and (not (eq syntax-symbol 'comment-continuation))
(looking-at "end[ \t\r\n\f]*\\(\\_<\\(?:if\\|loop\\|case\\)\\_>\\)?[ \t\r\n\f]*\\(\\_<\\(?:[a-z0-9_]+\\)\\_>\\)?"))
;; so we see the syntax which closes the current block. We still
;; need to check if the current end is a valid closing block
(let ((kind (or (sqlind-match-string 1) ""))
(label (or (sqlind-match-string 2) "")))
(push (sqlind-refine-end-syntax
(if (equal kind "") nil (intern kind))
label (point) context)
context)))
((and (eq sql-product 'postgres)
(not (eq syntax-symbol 'comment-continuation))
(looking-at "\\$\\$"))
(push (sqlind-refine-end-syntax
nil "" (point) context)
context))
;; See #92 and pr92b.sql, no such thing as a nested declare statement, use
;; the context of the previous declare-statement!
((and (eq sql-product 'postgres)
(eq syntax-symbol 'declare-statement)
(looking-at "declare\\_>"))
(goto-char anchor)
(setq context (sqlind-syntax-of-line)))
)
context))
(defun sqlind-syntax-of-line ()
"Return the syntax at the start of the current line.
The function returns a list of (SYNTAX . ANCHOR) cons cells.
SYNTAX is either a symbol or a list starting with a symbol,
ANCHOR is a buffer position which is the reference for the
SYNTAX. `sqlind-indentation-syntax-symbols' lists the syntax
symbols and their meaning.
The first element in the list is the most specific syntax for the
line, the remaining elemens are more generic ones. For example,
a line can be inside an SELECT clause which itself is inside a
procedure block."
(save-excursion
(with-syntax-table sqlind-syntax-table
(let* ((pos (progn (back-to-indentation) (point)))
(sqlind-search-limit (sqlind-beginning-of-directive))
(context-start (progn (sqlind-beginning-of-statement) (point)))
(context (list (cons 'statement-continuation context-start)))
(have-block-context nil))
(goto-char context-start)
(when (or (>= context-start pos)
(and (looking-at sqlind-start-block-regexp)
;; create table/view/index statements are not block
;; contexts
(or (not (looking-at "\\(create\\)\\|\\(alter\\)"))
(catch 'finished (sqlind-maybe-create-statement) nil))
;; A declare statement may or may not be a block context
(or (not (looking-at "declare"))
(catch 'finished (sqlind-maybe-declare-statement) nil))
(not (sqlind-looking-at-begin-transaction))))
(goto-char pos)
;; if we are at the start of a statement, or the nearest statement
;; starts after us, make the enclosing block the starting context
(setq have-block-context t)
(let ((block-info (sqlind-beginning-of-block)))
;; certain kind of blocks end within a statement
;; (e.g. create view). If we found one of those blocks and
;; it is not within our statement, we ignore the block info.
(if (and (listp block-info)
(eq (nth 0 block-info) 'create-statement)
(not (memq (nth 1 block-info) '(function procedure)))
(not (eql context-start (point))))
(progn
(setq context-start (point-min))
(setq context (list (cons 'toplevel context-start))))
;; else
(setq context-start (point))
(setq context (list (cons block-info context-start))))))
(goto-char context-start)
(when (and (eq 'statement-continuation (sqlind-syntax-symbol context))
(looking-at "\\(create\\)\\|\\(alter\\)"))
(let ((create-info (catch 'finished (sqlind-maybe-create-statement t) nil)))
(when create-info
(pop context) ; remove the statement continuation syntax
(push (cons create-info context-start) context))))
(let ((parse-info (syntax-ppss pos)))
(cond ((nth 4 parse-info) ; inside a comment
(push (cons 'comment-continuation (nth 8 parse-info)) context))
((nth 3 parse-info) ; inside a string
(push (cons 'string-continuation (nth 8 parse-info)) context))
((> (nth 0 parse-info) 0) ; nesting
(let ((start (nth 1 parse-info)))
(goto-char (1+ start))
(skip-chars-forward " \t\r\n\f\v" pos)
(if (eq (point) pos)
(push (cons 'nested-statement-open start) context)
(goto-char pos)
(if (looking-at ")")
(push (cons 'nested-statement-close start) context)
(push (cons 'nested-statement-continuation start) context)))))))
;; now let's refine the syntax by adding info about the current line
;; into the mix.
(sqlind-refine-syntax context pos have-block-context)))))
(defun sqlind-show-syntax-of-line ()
"Print the syntax of the current line."
(interactive)
(prin1 (sqlind-syntax-of-line)))
;;;; Indentation of SQL code
;;;;; Indentation calculation routines
(defvar sqlind-basic-offset 2
"The basic indentaion amount for SQL code.
Indentation is usually done in multiples of this amount, but
special indentation functions can do other types of indentation
such as aligning. See also `sqlind-indentation-offsets-alist'.")
(make-variable-buffer-local 'sqlind-basic-offset)
(defvar sqlind-indentation-syntax-symbols '()
"This variable exists just for its documentation.
The the SQL parsing code returns a syntax definition (either a
symbol or a list) and an anchor point, which is a buffer
position. The syntax symbols can be used to define how to indent
each line, see `sqlind-indentation-offsets-alist'
The following syntax symbols are defined for SQL code:
- (syntax-error MESSAGE START END) -- this is returned when the
parse failed. MESSAGE is an informative message, START and END
are buffer locations denoting the problematic region. ANCHOR
is undefined for this syntax info
- `in-comment' -- line is inside a multi line comment, ANCHOR is
the start of the comment.
- `comment-start' -- line starts with a comment. ANCHOR is the
start of the enclosing block.
- `in-string' -- line is inside a string, ANCHOR denotes the start
of the string.
- `toplevel' -- line is at toplevel (not inside any programming
construct). ANCHOR is usually (point-min).
- (in-block BLOCK-KIND LABEL) -- line is inside a block
construct. BLOCK-KIND (a symbol) is the actual block type and
can be one of \"if\", \"case\", \"exception\", \"loop\" etc.
If the block is labeled, LABEL contains the label. ANCHOR is
the start of the block.
- (in-begin-block KIND LABEL) -- line is inside a block started
by a begin statement. KIND (a symbol) is \"toplevel-block\"
for a begin at toplevel, \"defun\" for a begin that starts the
body of a procedure or function, \"package\" for a begin that
starts the body of a package, or nil for a begin that is none
of the previous. For a \"defun\" or \"package\", LABEL is the
name of the procedure, function or package, for the other block
types LABEL contains the block label, or the empty string if
the block has no label. ANCHOR is the start of the block.
- (block-start KIND) -- line begins with a statement that starts
a block. KIND (a symbol) can be one of \"then\", \"else\" or
\"loop\". ANCHOR is the reference point for the block
start (the coresponding if, case, etc).
- (block-end KIND LABEL) -- the line contains an end statement.
KIND (a symbol) is the type of block we are closing, LABEL (a
string) is the block label (or procedure name for an end
defun).
- declare-statement -- line is after a declare keyword, but
before the begin. ANCHOR is the start of the declare
statement.
- (package NAME) -- line is inside a package definition. NAME is
the name of the package, ANCHOR is the start of the package.
- (package-body NAME) -- line is inside a package body. NAME is
the name of the package, ANCHOR is the start of the package
body.
- (create-statement WHAT NAME) -- line is inside a CREATE
statement (other than create procedure or function). WHAT is
the thing being created, NAME is its name. ANCHOR is the start
of the create statement.
- (defun-start NAME) -- line is inside a procedure of function
definition but before the begin block that starts the body.
NAME is the name of the procedure/function, ANCHOR is the start
of the procedure/function definition.
The following SYNTAX-es are for SQL statements. For all of
them ANCHOR points to the start of a statement itself.
- labeled-statement-start -- line is just after a label.
- statement-continuation -- line is inside a statement which
starts on a previous line.
- nested-statement-open -- line is just inside an opening
bracket, but the actual bracket is on a previous line.
- nested-statement-continuation -- line is inside an opening
bracket, but not the first element after the bracket.
- nested-statement-close -- line is inside an opening bracket and
the line contains the closing bracket as the first character.
The following SYNTAX-es are for statements which are SQL
code (DML statements). They are pecialisations on the previous
statement syntaxes and for all of them a previous generic
statement syntax is present earlier in the SYNTAX list. Unless
otherwise specified, ANCHOR points to the start of the
clause (select, from, where, etc) in which the current point is.
- with-clause -- line is inside a WITH clause, but before the
main SELECT clause.
- with-clause-cte -- line is inside a with clause before a
CTE (common table expression) declaration
- with-clause-cte-cont -- line is inside a with clause before a
CTE definition
- case-clause -- line is on a CASE expression (WHEN or END
clauses). ANCHOR is the start of the CASE expression.
- case-clause-item -- line is on a CASE expression (THEN and ELSE
clauses). ANCHOR is the position of the case clause.
- case-clause-item-cont -- line is on a CASE expression but not
on one of the CASE sub-keywords. ANCHOR points to the case
keyword that this line is a continuation of.
- select-clause -- line is inside a select statement, right
before one of its clauses (from, where, order by, etc).
- select-column -- line is inside the select column section,
after a full column was defined (and a new column definition is
about to start).
- select-column-continuation -- line is inside the select column
section, but in the middle of a column definition. The defined
column starts on a previous like. Note that ANCHOR still
points to the start of the select statement itself.
- select-join-condition -- line is right before or just after the ON clause
for an INNER, LEFT or RIGHT join. ANCHOR points to the join statement
for which the ON is defined.
- select-table -- line is inside the from clause, just after a
table was defined and a new one is about to start.
- select-table-continuation -- line is inside the from clause,
inside a table definition which starts on a previous line. Note
that ANCHOR still points to the start of the select statement
itself.
- (in-select-clause CLAUSE) -- line is inside the select CLAUSE,
which can be \"where\", \"order by\", \"group by\" or
\"having\". Note that CLAUSE can never be \"select\" and
\"from\", because we have special syntaxes inside those
clauses.
- insert-clause -- line is inside an insert statement, right
before one of its clauses (values, select).
- (in-insert-clause CLAUSE) -- line is inside the insert CLAUSE,
which can be \"insert into\" or \"values\".
- delete-clause -- line is inside a delete statement right before
one of its clauses.
- (in-delete-clause CLAUSE) -- line is inside a delete CLAUSE,
which can be \"delete from\" or \"where\".
- update-clause -- line is inside an update statement right
before one of its clauses.
- (in-update-clause CLAUSE) -- line is inside an update CLAUSE,
which can be \"update\", \"set\" or \"where\".")
(defconst sqlind-default-indentation-offsets-alist
'((syntax-error sqlind-report-sytax-error)
(in-string sqlind-report-runaway-string)
(comment-continuation sqlind-indent-comment-continuation)
(comment-start sqlind-indent-comment-start)
(toplevel 0)
(in-block +)
(in-begin-block +)
(block-start 0)
(block-end 0)
(declare-statement +)
(package ++)
(package-body 0)
(create-statement +)
(defun-start +)
(labeled-statement-start 0)
(statement-continuation +)
(nested-statement-open sqlind-use-anchor-indentation +)
(nested-statement-continuation sqlind-use-previous-line-indentation)
(nested-statement-close sqlind-use-anchor-indentation)
(with-clause sqlind-use-anchor-indentation)
(with-clause-cte +)
(with-clause-cte-cont ++)
(case-clause 0)
(case-clause-item sqlind-use-anchor-indentation +)
(case-clause-item-cont sqlind-right-justify-clause)
(select-clause sqlind-right-justify-clause)
(select-column sqlind-indent-select-column)
(select-column-continuation sqlind-indent-select-column +)
(select-join-condition ++)
(select-table sqlind-indent-select-table)
(select-table-continuation sqlind-indent-select-table +)
(in-select-clause sqlind-lineup-to-clause-end
sqlind-right-justify-logical-operator)
(insert-clause sqlind-right-justify-clause)
(in-insert-clause sqlind-lineup-to-clause-end
sqlind-right-justify-logical-operator)
(delete-clause sqlind-right-justify-clause)
(in-delete-clause sqlind-lineup-to-clause-end
sqlind-right-justify-logical-operator)
(update-clause sqlind-right-justify-clause)
(in-update-clause sqlind-lineup-to-clause-end
sqlind-right-justify-logical-operator))
"Define the indentation amount for each syntactic symbol.
The value of this variable is an ALIST with the format:
((SYNTACTIC-SYMBOL . INDENTATION-OFFSETS) ... )
`sqlind-indentation-syntax-symbols' documents the list of possible
SYNTACTIC-SYMBOL values.
INDENTATION-OFFSETS defines the adjustments made to the
indentation for each syntactic-symbol. It is a list of:
a NUMBER -- the NUMBER will be added to the indentation offset.
'+ -- the current indentation offset is incremented by
`sqlind-basic-offset'
'++ -- the current indentation offset is indentation by 2 *
`sqlind-basic-offset'
'- -- the current indentation offset is decremented by
`sqlind-basic-offset'
'-- -- the current indentation offset is decremented by 2 *
`sqlind-basic-offset'
a FUNCTION -- the syntax and current indentation offset is
passed to the function and its result is used as the new
indentation offset.
See `sqlind-calculate-indentation' for how the indentation offset
is calculated.")
(defvar sqlind-indentation-offsets-alist
sqlind-default-indentation-offsets-alist
"Define the indentation amount for each syntactic symbol.
See also `sqlind-default-indentation-offsets-alist',
`sqlind-indentation-syntax-symbols' and
`sqlind-calculate-indentation'")
(make-variable-buffer-local 'sqlind-indentation-offsets-alist)
(defun sqlind-calculate-indentation (syntax &optional base-indentation)
"Return the indentation that should be applied to the current line.
SYNTAX is the syntaxtic information as returned by
`sqlind-syntax-of-line', BASE-INDENTATION is an indentation offset
to start with. When BASE-INDENTATION is nil, it is initialised
to the column of the anchor.
The indentation is done as follows: first, the indentation
offsets for the current syntactic symbol is looked up in
`sqlind-indentation-offsets-alist'. Than, for each indentation
offset, BASE-INDENTATION is adjusted according to that
indentation offset. The final value of BASE-INDENTATION is than
returned."
(if (null syntax)
base-indentation
;; else
;; when the user did not specify a base-indentation, we use the
;; column of the anchor as a starting point
(when (null base-indentation)
(setq base-indentation (save-excursion
(goto-char (cdar syntax))
(current-column))))
(let* ((syntax-symbol (sqlind-syntax-symbol syntax))
(indent-info (cdr (assoc syntax-symbol
sqlind-indentation-offsets-alist)))
(new-indentation base-indentation))
;; the funcall below can create a nil indentation symbol to
;; abort the indentation process
(while (and new-indentation indent-info)
(let ((i (car indent-info)))
(setq new-indentation
(cond
((eq i '+) (+ new-indentation sqlind-basic-offset))
((eq i '++) (+ new-indentation (* 2 sqlind-basic-offset)))
((eq i '-) (- new-indentation sqlind-basic-offset))
((eq i '--) (- new-indentation (* 2 sqlind-basic-offset)))
((integerp i) (+ new-indentation i))
((functionp i) (funcall i syntax new-indentation))
;; ignore unknown symbols by default
(t new-indentation))))
(setq indent-info (cdr indent-info)))
new-indentation)))
;;;;; Indentation helper functions
(defun sqlind-report-sytax-error (syntax _base-indentation)
"Report a syntax error for a \\='syntax-error SYNTAX."
(cl-destructuring-bind (_sym msg start end) (sqlind-syntax syntax)
(message "%s (%d %d)" msg start end))
nil)
(defun sqlind-report-runaway-string (_syntax _base-indentation)
"Report an error for a runaway string.
This is a string that extends over multiple lines. This is not
supported in SQL."
(message "runaway string constant")
nil)
(defun sqlind-use-anchor-indentation (syntax _base-indentation)
"Return the indentation of the line containing anchor of SYNTAX.
By default, the column of the anchor position is uses as a base
indentation. You can use this function to switch to using the
indentation of the anchor as the base indentation."
(save-excursion
(goto-char (sqlind-anchor-point syntax))
(current-indentation)))
(defun sqlind-lineup-to-anchor (syntax _base-indentation)
"Return the column of the anchor point of SYNTAX.
This need not be the indentation of the actual line that contains
anchor."
(save-excursion
(goto-char (sqlind-anchor-point syntax))
(current-column)))
(defun sqlind-use-previous-line-indentation (syntax _base-indentation)
"Return the indentation of the previous non-empty line.
If the start of the previous line is before the anchor of SYNTAX,
use the column of the anchor + 1."
(let ((anchor (sqlind-anchor-point syntax)))
(save-excursion
(forward-line -1)
(beginning-of-line)
(while (and (looking-at "^\\s-*$") (> (point) anchor)) ; empty line, skip it
(forward-line -1)
(beginning-of-line))
(back-to-indentation)
(if (< (point) anchor)
(progn
(goto-char anchor)
(1+ (current-column)))
(current-column)))))
(defun sqlind-indent-comment-continuation (syntax _base-indentation)
"Return the indentation for a line inside a comment SYNTAX.
If the current line matches `sqlind-comment-prefix' or
`sqlind-comment-end', we indent to one plus the column of the
comment start, which will make comments line up nicely, like
this:
/* Some comment line
* another comment line
*/
When the current line does not match `sqlind-comment-prefix', we
indent it so it lines up with the text of the start of the
comment, like this:
/* Some comment line
Some other comment line
*/"
(save-excursion
(back-to-indentation)
(if (or (looking-at sqlind-comment-prefix)
(looking-at sqlind-comment-end))
(progn
(goto-char (sqlind-anchor-point syntax))
(1+ (current-column)))
;; else
(goto-char (sqlind-anchor-point syntax))
(when (looking-at sqlind-comment-start-skip)
(goto-char (match-end 0)))
(current-column))))
(defun sqlind-indent-comment-start (syntax base-indentation)
"Return the indentation for a comment start SYNTAX.
If we start a line comment (--) and the previous line also has a
line comment, we line up the two comments. Otherwise we indent
in the previous context (cdr SYNTAX) starting at
BASE-INDENTATION."
(save-excursion
(back-to-indentation)
(if (and (looking-at "\\s *--")
(progn
(forward-line -1)
(re-search-forward "--" (line-end-position) t)))
(progn
(goto-char (match-beginning 0))
(current-column))
(sqlind-calculate-indentation
(sqlind-outer-context syntax) base-indentation))))
(defun sqlind-indent-select-column (syntax base-indentation)
"Return the indentation for a column of a SELECT clause.
SYNTAX is the syntax of the current line, BASE-INDENTATION is the
current indentation, which we need to update.
We try to align to the previous column start, but if we are the
first column after the SELECT clause we simply add
`sqlind-basic-offset'."
(save-excursion
(goto-char (sqlind-anchor-point syntax))
(when (or (looking-at "select\\s *\\(top\\s +[0-9]+\\|distinct\\|unique\\)?")
(and (eq sql-product 'postgres) (looking-at "perform\\_>")))
(goto-char (match-end 0)))
(skip-syntax-forward " ")
(if (or (looking-at sqlind-comment-start-skip)
(eolp))
(+ base-indentation sqlind-basic-offset)
(current-column))))
(defun sqlind-indent-select-table (syntax base-indentation)
"Return the indentation for a table in the FROM section.
SYNTAX is the syntax of the current line, BASE-INDENTATION is the
current indentation, which we need to update.
We try to align to the first table, but if we are the first
table, we simply add `sqlind-basic-offset'."
(save-excursion
(goto-char (sqlind-anchor-point syntax))
(when (looking-at "from")
(goto-char (match-end 0)))
(skip-syntax-forward " ")
(if (or (looking-at sqlind-comment-start-skip)
(eolp))
(+ base-indentation sqlind-basic-offset)
(current-column))))
(defun sqlind-lineup-to-clause-end (syntax base-indentation)
"Line up the current line with the end of a query clause.
This assumes SYNTAX is one of in-select-clause, in-update-clause,
in-insert-clause or in-delete-clause. It will return an
indentation so that:
If the clause is on a line by itself, the current line is
indented by `sqlind-basic-offset', otherwise the current line is
indented so that it starts in next column from where the clause
keyword ends.
Argument BASE-INDENTATION is updated."
(cl-destructuring-bind ((_sym clause) . anchor) (car syntax)
(save-excursion
(goto-char anchor)
(forward-char (1+ (length clause)))
(skip-syntax-forward " ")
(if (or (looking-at sqlind-comment-start-skip)
(eolp))
;; if the clause is on a line by itself, indent this line with a
;; sqlind-basic-offset
(+ base-indentation sqlind-basic-offset)
;; otherwise, align to the end of the clause, with a few exceptions
(current-column)))))
(defun sqlind-right-justify-logical-operator (syntax base-indentation)
"Align an AND, OR or NOT operator with the end of the WHERE clause.
SYNTAX is the syntax of the current line, BASE-INDENTATION is the
current indentation, which we need to update.
If this rule is added to the \\='in-select-clause syntax after
the `sqlind-lineup-to-clause-end' rule, it will adjust lines
starting with AND, OR or NOT to be aligned so they sit under the
WHERE clause."
(save-excursion
(back-to-indentation)
(cl-destructuring-bind ((_sym clause) . anchor) (car syntax)
(if (and (equal clause "where")
(looking-at "and\\|or\\|not"))
(progn
(goto-char anchor)
(+ (current-column)
(- (length clause) (- (match-end 0) (match-beginning 0)))))
base-indentation))))
(defun sqlind-left-justify-logical-operator (syntax base-indentation)
"Align an AND, OR or NOT operator with the start of the WHERE clause.
SYNTAX is the syntax of the current line, BASE-INDENTATION is the
current indentation, which we need to update.
If this rule is added to the \\='in-select-clause syntax after
the `sqlind-lineup-to-clause-end' rule, it will adjust lines
starting with AND, OR or NOT to be aligned so they sit left under
the WHERE clause."
(save-excursion
(back-to-indentation)
(cl-destructuring-bind ((_sym clause) . anchor) (car syntax)
(if (and (equal clause "where")
(looking-at "and\\|or\\|not"))
(progn (goto-char anchor) (current-column))
base-indentation))))
(defconst sqlind-operator-regexp
(concat (regexp-opt '("||" "*" "/" "%" "+" "-" "<<" ">>" "&" "|"
"<" "<=" ">" ">=" "=" "==" "!=" "<>")
t)
"\\s-*")
"Regexp to match a SQL expression operator.")
(defun sqlind-adjust-operator (syntax base-indentation)
"Adjust the indentation for operators in select clauses.
If the line to be indented starts with an operator, the
right-hand operand is lined up with the left hand operand on the
previous line. Otherwise, BASE-INDENTATION is returned. For
example:
select col1, col2
|| col3 as composed_column,
col4
|| col5 as composed_column2
from my_table
where cond1 = 1
and cond2 = 2;
This is an indentation adjuster and needs to be added to the
`sqlind-indentation-offsets-alist`"
(save-excursion
(with-syntax-table sqlind-syntax-table
(back-to-indentation)
;; If there are non-word constituents at the beginning if the line,
;; consider them an operator and line up the line to the first word of the
;; line, not the operator
(cond ((looking-at sqlind-operator-regexp)
(let ((ofs (length (match-string 0))))
(if (eq (sqlind-syntax-symbol syntax)
'select-column-continuation)
(goto-char (sqlind-column-definition-start
(point) (sqlind-anchor-point syntax)))
(forward-line -1)
(end-of-line)
(sqlind-backward-syntactic-ws)
;; Previous function leaves us on the first non-white-space
;; character. This might be a string terminator (') char, move
;; the cursor one to the left, so 'forward-sexp' works correctly.
(ignore-errors (forward-char 1))
(forward-sexp -1))
(max 0 (- (current-column) ofs))))
('t base-indentation)))))
(defun sqlind-lone-semicolon (syntax base-indentation)
"Indent a lone semicolon with the statement start. For example:
If the current line contains a single semicolon ';', it will be
indented at the same level as the anhcor of SYNTAX. Otherwise,
BASE-INDENTATION is returned unchanged. For example:
select col
from my_table
;
This is an indentation adjuster and needs to be added to the
`sqlind-indentation-offsets-alist`"
(save-excursion
(back-to-indentation)
(if (looking-at ";")
(sqlind-use-anchor-indentation syntax base-indentation)
base-indentation)))
(defun sqlind-right-justify-clause (syntax base-indentation)
"Return an indentation which right-aligns the first word at
anchor of SYNTAX with the first word in the curent line.
This is intended to be used as an indentation function for
select-clause, update-clause, insert-clause and update-clause
syntaxes"
(save-excursion
(let ((clause-length 0)
(statement-keyword-length 0)
offset)
(back-to-indentation)
(when (looking-at "\\sw+\\b")
(setq clause-length (- (match-end 0) (match-beginning 0))))
(goto-char (cdar syntax)) ; move to ANCHOR
(when (looking-at "\\sw+\\b")
(setq statement-keyword-length (- (match-end 0) (match-beginning 0))))
(setq offset (- statement-keyword-length clause-length))
(if (> offset 0)
(+ base-indentation offset)
base-indentation))))
(defun sqlind-lineup-joins-to-anchor (syntax base-indentation)
"Align JOIN keywords with the anchor point of SYNTAX.
If the line starts with an INNER,OUTER or CROSS JOIN keyword,
return the column of the anchor point, otherwise return
BASE-INDENTATION.
If this rule is added to `select-table-continuation' indentation,
it will indent lines starting with JOIN keywords to line up with
the FROM keyword."
(save-excursion
(back-to-indentation)
;; NOTE: we are a bit loose here as we only look for the first keyword
;; which might indicate a join regexp, e.g. we are happy to see "left"
;; even though, the correct statement is "left outer? join"
(if (or (looking-at sqlind-select-join-regexp)
(looking-at "\\bjoin\\b"))
(sqlind-lineup-to-anchor syntax base-indentation)
base-indentation)))
(defun sqlind-lineup-open-paren-to-anchor (syntax base-indentation)
"Align an open paranthesis with the anchor point of SYNTAX.
If the line starts with an open paren \\='(\\=', return the
column of the anchor point. If line does not start with an open
paren, the function returns BASE-INDENTATION, acting as a no-op."
(save-excursion
(back-to-indentation)
(if (looking-at "(")
(sqlind-lineup-to-anchor syntax base-indentation)
base-indentation)))
(defun sqlind-adjust-comma (_syntax base-indentation)
"Lineup lines starting with a comma ',' to the word start.
Adjust BASE-INDENTATION so that the actual word is lined up. For
example:
SELECT col1
, col2 -- ignore the comma and align the actual word."
(save-excursion
(back-to-indentation)
(let ((ofs (if (looking-at ",\\s-*") (length (match-string 0)) 0)))
(max 0 (- base-indentation ofs)))))
(defun sqlind-lineup-into-nested-statement (syntax _base-indentation)
"Align the line to the first word inside a nested statement.
Return the column of the first non-whitespace char in a nested
statement. For example:
( a,
b, -- b is always aligned with \\='a\\='
)
This function only makes sense in a
\\='nested-statement-continuation SYTNAX indentation rule."
(save-excursion
(goto-char (sqlind-anchor-point syntax))
(end-of-line)
(let ((limit (point)))
(goto-char (sqlind-anchor-point syntax))
(forward-char 1)
(sqlind-forward-syntactic-ws)
(if (< (point) limit)
(current-column)
(progn
(goto-char (sqlind-anchor-point syntax))
(back-to-indentation)
(+ (current-column) sqlind-basic-offset))))))
;;;;; sqlind-indent-line
(defun sqlind-indent-line ()
"Indent the current line according to SQL conventions.
`sqlind-basic-offset' defined the number of spaces in the basic
indentation unit and `sqlind-indentation-offsets-alist' is used to
determine how to indent each type of syntactic element."
(let* ((syntax (sqlind-syntax-of-line))
(base-column (current-column))
(indent-column (sqlind-calculate-indentation syntax)))
(when indent-column
(back-to-indentation)
(let ((offset (- base-column (current-column))))
;; avoid modifying the buffer when the indentation does not
;; have to change
(unless (eq (current-column) indent-column)
(indent-line-to indent-column))
(when (> offset 0)
(forward-char offset))))))
;;;; Alignment rules
(defvar sqlind-align-rules
`(;; Line up the two side of arrow =>
(sql-arrow-lineup
(regexp . "\\(\\s-*\\)=>\\(\\s-*\\)")
(modes quote (sql-mode))
(group 1 2)
(case-fold . t)
(repeat . t))
;; Line up the two sides of an assigment
(sql-assign-lineup
(regexp . "^\\s-*\\S-+\\(\\s-*\\):=\\(\\s-*\\)")
(modes quote (sql-mode))
(group 1 2)
(case-fold . t)
(repeat . t))
;; lineup a variable declaration with an assignment
(sql-assign-lineup-2
(regexp . "^\\s-*\\S-+\\(\\s-+\\)\\S-+\\(\\s-*\\):=\\(\\s-*\\)")
(modes quote (sql-mode))
(group 1 2 3)
(case-fold . t)
(repeat . t))
;; Line up the two sides of in / out / in out parameter
(sql-param-lineup-in-out
(regexp . "\\(\\s-+\\)\\(in out\\|in\\|out\\)\\(\\s-+\\)")
(modes quote (sql-mode))
(group 1 3)
(case-fold . t)
(repeat . t))
;; Line up the two sides of an equal sign in an update expression
(sql-equals
(regexp . "[^:<>!]\\(\\s-*\\)=\\(\\s-*\\)[^>]")
(modes quote (sql-mode))
(group 1 2)
(case-fold . t)
(valid . ,(function (lambda ()
(save-excursion
(goto-char (match-end 1))
(not (nth 3 (syntax-ppss (point))))))))
(repeat . t))
(sql-comparison-operators ; see issue #47
(regexp . "[^:]\\(\\s-*\\)[<>=!]+\\(\\s-*\\)[^>]")
(modes quote (sql-mode))
(group 1 2)
(case-fold . t)
(valid . ,(function (lambda ()
(save-excursion
(goto-char (match-end 1))
(not (nth 3 (syntax-ppss (point))))))))
(repeat . t))
;; Line up the two sides of piped string
(sql-pipes
(regexp . "[^:]\\(\\s-*\\)||\\(\\s-*\\)[^>]")
(modes quote (sql-mode))
(group 1 2)
(case-fold . t)
(repeat . t))
;; lineup the column aliases (the "as name" part) in a select statement
(sql-select-lineup-column-names
(regexp . ".*?\\(\\s +\\)as\\(\\s +\\).*")
(modes quote (sql-mode))
(group 1 2)
(case-fold . t)
(repeat . t)))
"Align rules for SQL codes.
These rules help aligning some SQL statements, such as the column
names in select queries, or equal signs in update statements or
where clauses.
To use it, select the region to be aligned and run \\[align].
See also `align' and `align-rules-list'")
;;;; sqlind-minor-mode, sqlind-setup
(defvar sqlind-minor-mode-map
(let ((map (make-sparse-keymap)))
(define-key map [remap beginning-of-defun] 'sqlind-beginning-of-block)
map))
(defvar align-mode-rules-list)
;;;###autoload
(define-minor-mode sqlind-minor-mode
"Toggle SQL syntactic indentation on or off.
With syntactic indentation, hitting TAB on a line in a SQL buffer
will indent the line according to the syntactic context of the
SQL statement being edited.
A set of alignment rules are also enabled with this minor mode.
Selecting a region of text and typing `M-x align RET' will align
the statements. This can be used, for example, to align the `as'
column aliases in select statements."
:lighter " sqlind"
;; :group 'sqlind ;;FIXME: There's no such group!
:global nil
:init-value nil
(if sqlind-minor-mode
(progn
(set (make-local-variable 'indent-line-function) #'sqlind-indent-line)
(set (make-local-variable 'align-mode-rules-list) sqlind-align-rules))
(progn
(kill-local-variable 'indent-line-function)
(kill-local-variable 'align-mode-rules-list))))
;;;###autoload
(defun sqlind-setup ()
"Enable SQL syntactic indentation unconditionally.
This function is deprecated, consider using the function
`sqlind-minor-mode' instead."
(set (make-local-variable 'indent-line-function) 'sqlind-indent-line)
(define-key sql-mode-map [remap beginning-of-defun] 'sqlind-beginning-of-statement)
(setq align-mode-rules-list sqlind-align-rules))
;; Local Variables:
;; mode: emacs-lisp
;; mode: outline-minor
;; outline-regexp: ";;;;+"
;; End:
(provide 'sql-indent)
;;; sql-indent.el ends here