1 // Scintilla source code edit control
3 ** Lexer for SQL, including PL/SQL and SQL*Plus.
5 // Copyright 1998-2005 by Neil Hodgson <neilh@scintilla.org>
6 // The License.txt file describes the conditions under which this software may be distributed.
18 #include "StyleContext.h"
20 #include "Scintilla.h"
23 static inline bool IsAWordChar(int ch
) {
24 return (ch
< 0x80) && (isalnum(ch
) || ch
== '.' || ch
== '_');
27 static inline bool IsAWordStart(int ch
) {
28 return (ch
< 0x80) && (isalpha(ch
) || ch
== '_');
31 static inline bool IsADoxygenChar(int ch
) {
32 return (islower(ch
) || ch
== '$' || ch
== '@' ||
33 ch
== '\\' || ch
== '&' || ch
== '<' ||
34 ch
== '>' || ch
== '#' || ch
== '{' ||
35 ch
== '}' || ch
== '[' || ch
== ']');
38 static inline bool IsANumberChar(int ch
) {
39 // Not exactly following number definition (several dots are seen as OK, etc.)
40 // but probably enough in most cases.
42 (isdigit(ch
) || toupper(ch
) == 'E' ||
43 ch
== '.' || ch
== '-' || ch
== '+');
46 static void ColouriseSQLDoc(unsigned int startPos
, int length
, int initStyle
, WordList
*keywordlists
[],
49 WordList
&keywords1
= *keywordlists
[0];
50 WordList
&keywords2
= *keywordlists
[1];
51 WordList
&kw_pldoc
= *keywordlists
[2];
52 WordList
&kw_sqlplus
= *keywordlists
[3];
53 WordList
&kw_user1
= *keywordlists
[4];
54 WordList
&kw_user2
= *keywordlists
[5];
55 WordList
&kw_user3
= *keywordlists
[6];
56 WordList
&kw_user4
= *keywordlists
[7];
58 StyleContext
sc(startPos
, length
, initStyle
, styler
);
60 bool sqlBackslashEscapes
= styler
.GetPropertyInt("sql.backslash.escapes", 0) != 0;
61 bool sqlBackticksIdentifier
= styler
.GetPropertyInt("lexer.sql.backticks.identifier", 0) != 0;
62 int styleBeforeDCKeyword
= SCE_SQL_DEFAULT
;
63 for (; sc
.More(); sc
.Forward()) {
64 // Determine if the current state should terminate.
66 case SCE_SQL_OPERATOR
:
67 sc
.SetState(SCE_SQL_DEFAULT
);
70 // We stop the number definition on non-numerical non-dot non-eE non-sign char
71 if (!IsANumberChar(sc
.ch
)) {
72 sc
.SetState(SCE_SQL_DEFAULT
);
75 case SCE_SQL_IDENTIFIER
:
76 if (!IsAWordChar(sc
.ch
)) {
77 int nextState
= SCE_SQL_DEFAULT
;
79 sc
.GetCurrentLowered(s
, sizeof(s
));
80 if (keywords1
.InList(s
)) {
81 sc
.ChangeState(SCE_SQL_WORD
);
82 } else if (keywords2
.InList(s
)) {
83 sc
.ChangeState(SCE_SQL_WORD2
);
84 } else if (kw_sqlplus
.InListAbbreviated(s
, '~')) {
85 sc
.ChangeState(SCE_SQL_SQLPLUS
);
86 if (strncmp(s
, "rem", 3) == 0) {
87 nextState
= SCE_SQL_SQLPLUS_COMMENT
;
88 } else if (strncmp(s
, "pro", 3) == 0) {
89 nextState
= SCE_SQL_SQLPLUS_PROMPT
;
91 } else if (kw_user1
.InList(s
)) {
92 sc
.ChangeState(SCE_SQL_USER1
);
93 } else if (kw_user2
.InList(s
)) {
94 sc
.ChangeState(SCE_SQL_USER2
);
95 } else if (kw_user3
.InList(s
)) {
96 sc
.ChangeState(SCE_SQL_USER3
);
97 } else if (kw_user4
.InList(s
)) {
98 sc
.ChangeState(SCE_SQL_USER4
);
100 sc
.SetState(nextState
);
103 case SCE_SQL_QUOTEDIDENTIFIER
:
105 if (sc
.chNext
== 0x60) {
106 sc
.Forward(); // Ignore it
108 sc
.ForwardSetState(SCE_SQL_DEFAULT
);
112 case SCE_SQL_COMMENT
:
113 if (sc
.Match('*', '/')) {
115 sc
.ForwardSetState(SCE_SQL_DEFAULT
);
118 case SCE_SQL_COMMENTDOC
:
119 if (sc
.Match('*', '/')) {
121 sc
.ForwardSetState(SCE_SQL_DEFAULT
);
122 } else if (sc
.ch
== '@' || sc
.ch
== '\\') { // Doxygen support
123 // Verify that we have the conditions to mark a comment-doc-keyword
124 if ((IsASpace(sc
.chPrev
) || sc
.chPrev
== '*') && (!IsASpace(sc
.chNext
))) {
125 styleBeforeDCKeyword
= SCE_SQL_COMMENTDOC
;
126 sc
.SetState(SCE_SQL_COMMENTDOCKEYWORD
);
130 case SCE_SQL_COMMENTLINE
:
131 case SCE_SQL_COMMENTLINEDOC
:
132 case SCE_SQL_SQLPLUS_COMMENT
:
133 case SCE_SQL_SQLPLUS_PROMPT
:
134 if (sc
.atLineStart
) {
135 sc
.SetState(SCE_SQL_DEFAULT
);
138 case SCE_SQL_COMMENTDOCKEYWORD
:
139 if ((styleBeforeDCKeyword
== SCE_SQL_COMMENTDOC
) && sc
.Match('*', '/')) {
140 sc
.ChangeState(SCE_SQL_COMMENTDOCKEYWORDERROR
);
142 sc
.ForwardSetState(SCE_SQL_DEFAULT
);
143 } else if (!IsADoxygenChar(sc
.ch
)) {
145 sc
.GetCurrentLowered(s
, sizeof(s
));
146 if (!isspace(sc
.ch
) || !kw_pldoc
.InList(s
+ 1)) {
147 sc
.ChangeState(SCE_SQL_COMMENTDOCKEYWORDERROR
);
149 sc
.SetState(styleBeforeDCKeyword
);
152 case SCE_SQL_CHARACTER
:
153 if (sqlBackslashEscapes
&& sc
.ch
== '\\') {
155 } else if (sc
.ch
== '\'') {
156 if (sc
.chNext
== '\"') {
159 sc
.ForwardSetState(SCE_SQL_DEFAULT
);
167 } else if (sc
.ch
== '\"') {
168 if (sc
.chNext
== '\"') {
171 sc
.ForwardSetState(SCE_SQL_DEFAULT
);
177 // Determine if a new state should be entered.
178 if (sc
.state
== SCE_SQL_DEFAULT
) {
179 if (IsADigit(sc
.ch
) || (sc
.ch
== '.' && IsADigit(sc
.chNext
))) {
180 sc
.SetState(SCE_SQL_NUMBER
);
181 } else if (IsAWordStart(sc
.ch
)) {
182 sc
.SetState(SCE_SQL_IDENTIFIER
);
183 } else if (sc
.ch
== 0x60 && sqlBackticksIdentifier
) {
184 sc
.SetState(SCE_SQL_QUOTEDIDENTIFIER
);
185 } else if (sc
.Match('/', '*')) {
186 if (sc
.Match("/**") || sc
.Match("/*!")) { // Support of Doxygen doc. style
187 sc
.SetState(SCE_SQL_COMMENTDOC
);
189 sc
.SetState(SCE_SQL_COMMENT
);
191 sc
.Forward(); // Eat the * so it isn't used for the end of the comment
192 } else if (sc
.Match('-', '-')) {
193 // MySQL requires a space or control char after --
194 // http://dev.mysql.com/doc/mysql/en/ansi-diff-comments.html
195 // Perhaps we should enforce that with proper property:
196 //~ } else if (sc.Match("-- ")) {
197 sc
.SetState(SCE_SQL_COMMENTLINE
);
198 } else if (sc
.ch
== '#') {
199 sc
.SetState(SCE_SQL_COMMENTLINEDOC
);
200 } else if (sc
.ch
== '\'') {
201 sc
.SetState(SCE_SQL_CHARACTER
);
202 } else if (sc
.ch
== '\"') {
203 sc
.SetState(SCE_SQL_STRING
);
204 } else if (isoperator(static_cast<char>(sc
.ch
))) {
205 sc
.SetState(SCE_SQL_OPERATOR
);
212 static bool IsStreamCommentStyle(int style
) {
213 return style
== SCE_SQL_COMMENT
||
214 style
== SCE_SQL_COMMENTDOC
||
215 style
== SCE_SQL_COMMENTDOCKEYWORD
||
216 style
== SCE_SQL_COMMENTDOCKEYWORDERROR
;
219 // Store both the current line's fold level and the next lines in the
220 // level store to make it easy to pick up with each increment.
221 static void FoldSQLDoc(unsigned int startPos
, int length
, int initStyle
,
222 WordList
*[], Accessor
&styler
) {
223 bool foldComment
= styler
.GetPropertyInt("fold.comment") != 0;
224 bool foldCompact
= styler
.GetPropertyInt("fold.compact", 1) != 0;
225 bool foldOnlyBegin
= styler
.GetPropertyInt("fold.sql.only.begin", 0) != 0;
227 unsigned int endPos
= startPos
+ length
;
228 int visibleChars
= 0;
229 int lineCurrent
= styler
.GetLine(startPos
);
230 int levelCurrent
= SC_FOLDLEVELBASE
;
231 if (lineCurrent
> 0) {
232 levelCurrent
= styler
.LevelAt(lineCurrent
- 1) >> 16;
234 int levelNext
= levelCurrent
;
235 char chNext
= styler
[startPos
];
236 int styleNext
= styler
.StyleAt(startPos
);
237 int style
= initStyle
;
238 bool endFound
= false;
239 for (unsigned int i
= startPos
; i
< endPos
; i
++) {
241 chNext
= styler
.SafeGetCharAt(i
+ 1);
242 int stylePrev
= style
;
244 styleNext
= styler
.StyleAt(i
+ 1);
245 bool atEOL
= (ch
== '\r' && chNext
!= '\n') || (ch
== '\n');
246 if (foldComment
&& IsStreamCommentStyle(style
)) {
247 if (!IsStreamCommentStyle(stylePrev
)) {
249 } else if (!IsStreamCommentStyle(styleNext
) && !atEOL
) {
250 // Comments don't end at end of line and the next character may be unstyled.
254 if (foldComment
&& (style
== SCE_SQL_COMMENTLINE
)) {
255 // MySQL needs -- comments to be followed by space or control char
256 if ((ch
== '-') && (chNext
== '-')) {
257 char chNext2
= styler
.SafeGetCharAt(i
+ 2);
258 char chNext3
= styler
.SafeGetCharAt(i
+ 3);
259 if (chNext2
== '{' || chNext3
== '{') {
261 } else if (chNext2
== '}' || chNext3
== '}') {
266 if (style
== SCE_SQL_OPERATOR
) {
269 } else if (ch
== ')') {
273 // If new keyword (cannot trigger on elseif or nullif, does less tests)
274 if (style
== SCE_SQL_WORD
&& stylePrev
!= SCE_SQL_WORD
) {
275 const int MAX_KW_LEN
= 6; // Maximum length of folding keywords
276 char s
[MAX_KW_LEN
+ 2];
278 for (; j
< MAX_KW_LEN
+ 1; j
++) {
279 if (!iswordchar(styler
[i
+ j
])) {
282 s
[j
] = static_cast<char>(tolower(styler
[i
+ j
]));
284 if (j
== MAX_KW_LEN
+ 1) {
285 // Keyword too long, don't test it
290 if ((!foldOnlyBegin
) && (strcmp(s
, "if") == 0 || strcmp(s
, "loop") == 0)) {
297 } else if (strcmp(s
, "begin") == 0) {
299 } else if (strcmp(s
, "end") == 0 ||
300 // DROP TABLE IF EXISTS or CREATE TABLE IF NOT EXISTS
301 strcmp(s
, "exists") == 0) {
304 if (levelNext
< SC_FOLDLEVELBASE
) {
305 levelNext
= SC_FOLDLEVELBASE
;
310 int levelUse
= levelCurrent
;
311 int lev
= levelUse
| levelNext
<< 16;
312 if (visibleChars
== 0 && foldCompact
)
313 lev
|= SC_FOLDLEVELWHITEFLAG
;
314 if (levelUse
< levelNext
)
315 lev
|= SC_FOLDLEVELHEADERFLAG
;
316 if (lev
!= styler
.LevelAt(lineCurrent
)) {
317 styler
.SetLevel(lineCurrent
, lev
);
320 levelCurrent
= levelNext
;
324 if (!isspacechar(ch
)) {
330 static const char * const sqlWordListDesc
[] = {
342 LexerModule
lmSQL(SCLEX_SQL
, ColouriseSQLDoc
, "sql", FoldSQLDoc
, sqlWordListDesc
);