569 lines
17 KiB
C++
569 lines
17 KiB
C++
/** @file LexD.cxx
|
|
** Lexer for D.
|
|
**
|
|
** Copyright (c) 2006 by Waldemar Augustyn <waldemar@wdmsys.com>
|
|
** Converted to lexer object and added further folding features/properties by "Udo Lechner" <dlchnr(at)gmx(dot)net>
|
|
**/
|
|
// Copyright 1998-2005 by Neil Hodgson <neilh@scintilla.org>
|
|
// The License.txt file describes the conditions under which this software may be distributed.
|
|
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <stdio.h>
|
|
#include <stdarg.h>
|
|
#include <assert.h>
|
|
#include <ctype.h>
|
|
|
|
#include <string>
|
|
#include <map>
|
|
|
|
#include "ILexer.h"
|
|
#include "Scintilla.h"
|
|
#include "SciLexer.h"
|
|
|
|
#include "WordList.h"
|
|
#include "LexAccessor.h"
|
|
#include "StyleContext.h"
|
|
#include "CharacterSet.h"
|
|
#include "LexerModule.h"
|
|
#include "OptionSet.h"
|
|
|
|
#ifdef SCI_NAMESPACE
|
|
using namespace Scintilla;
|
|
#endif
|
|
|
|
/* Nested comments require keeping the value of the nesting level for every
|
|
position in the document. But since scintilla always styles line by line,
|
|
we only need to store one value per line. The non-negative number indicates
|
|
nesting level at the end of the line.
|
|
*/
|
|
|
|
// Underscore, letter, digit and universal alphas from C99 Appendix D.
|
|
|
|
static bool IsWordStart(int ch) {
|
|
return (isascii(ch) && (isalpha(ch) || ch == '_')) || !isascii(ch);
|
|
}
|
|
|
|
static bool IsWord(int ch) {
|
|
return (isascii(ch) && (isalnum(ch) || ch == '_')) || !isascii(ch);
|
|
}
|
|
|
|
static bool IsDoxygen(int ch) {
|
|
if (isascii(ch) && islower(ch))
|
|
return true;
|
|
if (ch == '$' || ch == '@' || ch == '\\' ||
|
|
ch == '&' || ch == '#' || ch == '<' || ch == '>' ||
|
|
ch == '{' || ch == '}' || ch == '[' || ch == ']')
|
|
return true;
|
|
return false;
|
|
}
|
|
|
|
static bool IsStringSuffix(int ch) {
|
|
return ch == 'c' || ch == 'w' || ch == 'd';
|
|
}
|
|
|
|
static bool IsStreamCommentStyle(int style) {
|
|
return style == SCE_D_COMMENT ||
|
|
style == SCE_D_COMMENTDOC ||
|
|
style == SCE_D_COMMENTDOCKEYWORD ||
|
|
style == SCE_D_COMMENTDOCKEYWORDERROR;
|
|
}
|
|
|
|
// An individual named option for use in an OptionSet
|
|
|
|
// Options used for LexerD
|
|
struct OptionsD {
|
|
bool fold;
|
|
bool foldSyntaxBased;
|
|
bool foldComment;
|
|
bool foldCommentMultiline;
|
|
bool foldCommentExplicit;
|
|
std::string foldExplicitStart;
|
|
std::string foldExplicitEnd;
|
|
bool foldExplicitAnywhere;
|
|
bool foldCompact;
|
|
int foldAtElseInt;
|
|
bool foldAtElse;
|
|
OptionsD() {
|
|
fold = false;
|
|
foldSyntaxBased = true;
|
|
foldComment = false;
|
|
foldCommentMultiline = true;
|
|
foldCommentExplicit = true;
|
|
foldExplicitStart = "";
|
|
foldExplicitEnd = "";
|
|
foldExplicitAnywhere = false;
|
|
foldCompact = true;
|
|
foldAtElseInt = -1;
|
|
foldAtElse = false;
|
|
}
|
|
};
|
|
|
|
static const char * const dWordLists[] = {
|
|
"Primary keywords and identifiers",
|
|
"Secondary keywords and identifiers",
|
|
"Documentation comment keywords",
|
|
"Type definitions and aliases",
|
|
"Keywords 5",
|
|
"Keywords 6",
|
|
"Keywords 7",
|
|
0,
|
|
};
|
|
|
|
struct OptionSetD : public OptionSet<OptionsD> {
|
|
OptionSetD() {
|
|
DefineProperty("fold", &OptionsD::fold);
|
|
|
|
DefineProperty("fold.d.syntax.based", &OptionsD::foldSyntaxBased,
|
|
"Set this property to 0 to disable syntax based folding.");
|
|
|
|
DefineProperty("fold.comment", &OptionsD::foldComment);
|
|
|
|
DefineProperty("fold.d.comment.multiline", &OptionsD::foldCommentMultiline,
|
|
"Set this property to 0 to disable folding multi-line comments when fold.comment=1.");
|
|
|
|
DefineProperty("fold.d.comment.explicit", &OptionsD::foldCommentExplicit,
|
|
"Set this property to 0 to disable folding explicit fold points when fold.comment=1.");
|
|
|
|
DefineProperty("fold.d.explicit.start", &OptionsD::foldExplicitStart,
|
|
"The string to use for explicit fold start points, replacing the standard //{.");
|
|
|
|
DefineProperty("fold.d.explicit.end", &OptionsD::foldExplicitEnd,
|
|
"The string to use for explicit fold end points, replacing the standard //}.");
|
|
|
|
DefineProperty("fold.d.explicit.anywhere", &OptionsD::foldExplicitAnywhere,
|
|
"Set this property to 1 to enable explicit fold points anywhere, not just in line comments.");
|
|
|
|
DefineProperty("fold.compact", &OptionsD::foldCompact);
|
|
|
|
DefineProperty("lexer.d.fold.at.else", &OptionsD::foldAtElseInt,
|
|
"This option enables D folding on a \"} else {\" line of an if statement.");
|
|
|
|
DefineProperty("fold.at.else", &OptionsD::foldAtElse);
|
|
|
|
DefineWordListSets(dWordLists);
|
|
}
|
|
};
|
|
|
|
class LexerD : public ILexer {
|
|
bool caseSensitive;
|
|
WordList keywords;
|
|
WordList keywords2;
|
|
WordList keywords3;
|
|
WordList keywords4;
|
|
WordList keywords5;
|
|
WordList keywords6;
|
|
WordList keywords7;
|
|
OptionsD options;
|
|
OptionSetD osD;
|
|
public:
|
|
LexerD(bool caseSensitive_) :
|
|
caseSensitive(caseSensitive_) {
|
|
}
|
|
virtual ~LexerD() {
|
|
}
|
|
void SCI_METHOD Release() {
|
|
delete this;
|
|
}
|
|
int SCI_METHOD Version() const {
|
|
return lvOriginal;
|
|
}
|
|
const char * SCI_METHOD PropertyNames() {
|
|
return osD.PropertyNames();
|
|
}
|
|
int SCI_METHOD PropertyType(const char *name) {
|
|
return osD.PropertyType(name);
|
|
}
|
|
const char * SCI_METHOD DescribeProperty(const char *name) {
|
|
return osD.DescribeProperty(name);
|
|
}
|
|
int SCI_METHOD PropertySet(const char *key, const char *val);
|
|
const char * SCI_METHOD DescribeWordListSets() {
|
|
return osD.DescribeWordListSets();
|
|
}
|
|
int SCI_METHOD WordListSet(int n, const char *wl);
|
|
void SCI_METHOD Lex(unsigned int startPos, int length, int initStyle, IDocument *pAccess);
|
|
void SCI_METHOD Fold(unsigned int startPos, int length, int initStyle, IDocument *pAccess);
|
|
|
|
void * SCI_METHOD PrivateCall(int, void *) {
|
|
return 0;
|
|
}
|
|
|
|
static ILexer *LexerFactoryD() {
|
|
return new LexerD(true);
|
|
}
|
|
static ILexer *LexerFactoryDInsensitive() {
|
|
return new LexerD(false);
|
|
}
|
|
};
|
|
|
|
int SCI_METHOD LexerD::PropertySet(const char *key, const char *val) {
|
|
if (osD.PropertySet(&options, key, val)) {
|
|
return 0;
|
|
}
|
|
return -1;
|
|
}
|
|
|
|
int SCI_METHOD LexerD::WordListSet(int n, const char *wl) {
|
|
WordList *wordListN = 0;
|
|
switch (n) {
|
|
case 0:
|
|
wordListN = &keywords;
|
|
break;
|
|
case 1:
|
|
wordListN = &keywords2;
|
|
break;
|
|
case 2:
|
|
wordListN = &keywords3;
|
|
break;
|
|
case 3:
|
|
wordListN = &keywords4;
|
|
break;
|
|
case 4:
|
|
wordListN = &keywords5;
|
|
break;
|
|
case 5:
|
|
wordListN = &keywords6;
|
|
break;
|
|
case 6:
|
|
wordListN = &keywords7;
|
|
break;
|
|
}
|
|
int firstModification = -1;
|
|
if (wordListN) {
|
|
WordList wlNew;
|
|
wlNew.Set(wl);
|
|
if (*wordListN != wlNew) {
|
|
wordListN->Set(wl);
|
|
firstModification = 0;
|
|
}
|
|
}
|
|
return firstModification;
|
|
}
|
|
|
|
void SCI_METHOD LexerD::Lex(unsigned int startPos, int length, int initStyle, IDocument *pAccess) {
|
|
LexAccessor styler(pAccess);
|
|
|
|
int styleBeforeDCKeyword = SCE_D_DEFAULT;
|
|
|
|
StyleContext sc(startPos, length, initStyle, styler);
|
|
|
|
int curLine = styler.GetLine(startPos);
|
|
int curNcLevel = curLine > 0? styler.GetLineState(curLine-1): 0;
|
|
bool numFloat = false; // Float literals have '+' and '-' signs
|
|
bool numHex = false;
|
|
|
|
for (; sc.More(); sc.Forward()) {
|
|
|
|
if (sc.atLineStart) {
|
|
curLine = styler.GetLine(sc.currentPos);
|
|
styler.SetLineState(curLine, curNcLevel);
|
|
}
|
|
|
|
// Determine if the current state should terminate.
|
|
switch (sc.state) {
|
|
case SCE_D_OPERATOR:
|
|
sc.SetState(SCE_D_DEFAULT);
|
|
break;
|
|
case SCE_D_NUMBER:
|
|
// We accept almost anything because of hex. and number suffixes
|
|
if (isascii(sc.ch) && (isalnum(sc.ch) || sc.ch == '_')) {
|
|
continue;
|
|
} else if (sc.ch == '.' && sc.chNext != '.' && !numFloat) {
|
|
// Don't parse 0..2 as number.
|
|
numFloat=true;
|
|
continue;
|
|
} else if ( ( sc.ch == '-' || sc.ch == '+' ) && ( /*sign and*/
|
|
( !numHex && ( sc.chPrev == 'e' || sc.chPrev == 'E' ) ) || /*decimal or*/
|
|
( sc.chPrev == 'p' || sc.chPrev == 'P' ) ) ) { /*hex*/
|
|
// Parse exponent sign in float literals: 2e+10 0x2e+10
|
|
continue;
|
|
} else {
|
|
sc.SetState(SCE_D_DEFAULT);
|
|
}
|
|
break;
|
|
case SCE_D_IDENTIFIER:
|
|
if (!IsWord(sc.ch)) {
|
|
char s[1000];
|
|
if (caseSensitive) {
|
|
sc.GetCurrent(s, sizeof(s));
|
|
} else {
|
|
sc.GetCurrentLowered(s, sizeof(s));
|
|
}
|
|
if (keywords.InList(s)) {
|
|
sc.ChangeState(SCE_D_WORD);
|
|
} else if (keywords2.InList(s)) {
|
|
sc.ChangeState(SCE_D_WORD2);
|
|
} else if (keywords4.InList(s)) {
|
|
sc.ChangeState(SCE_D_TYPEDEF);
|
|
} else if (keywords5.InList(s)) {
|
|
sc.ChangeState(SCE_D_WORD5);
|
|
} else if (keywords6.InList(s)) {
|
|
sc.ChangeState(SCE_D_WORD6);
|
|
} else if (keywords7.InList(s)) {
|
|
sc.ChangeState(SCE_D_WORD7);
|
|
}
|
|
sc.SetState(SCE_D_DEFAULT);
|
|
}
|
|
break;
|
|
case SCE_D_COMMENT:
|
|
if (sc.Match('*', '/')) {
|
|
sc.Forward();
|
|
sc.ForwardSetState(SCE_D_DEFAULT);
|
|
}
|
|
break;
|
|
case SCE_D_COMMENTDOC:
|
|
if (sc.Match('*', '/')) {
|
|
sc.Forward();
|
|
sc.ForwardSetState(SCE_D_DEFAULT);
|
|
} else if (sc.ch == '@' || sc.ch == '\\') { // JavaDoc and Doxygen support
|
|
// Verify that we have the conditions to mark a comment-doc-keyword
|
|
if ((IsASpace(sc.chPrev) || sc.chPrev == '*') && (!IsASpace(sc.chNext))) {
|
|
styleBeforeDCKeyword = SCE_D_COMMENTDOC;
|
|
sc.SetState(SCE_D_COMMENTDOCKEYWORD);
|
|
}
|
|
}
|
|
break;
|
|
case SCE_D_COMMENTLINE:
|
|
if (sc.atLineStart) {
|
|
sc.SetState(SCE_D_DEFAULT);
|
|
}
|
|
break;
|
|
case SCE_D_COMMENTLINEDOC:
|
|
if (sc.atLineStart) {
|
|
sc.SetState(SCE_D_DEFAULT);
|
|
} else if (sc.ch == '@' || sc.ch == '\\') { // JavaDoc and Doxygen support
|
|
// Verify that we have the conditions to mark a comment-doc-keyword
|
|
if ((IsASpace(sc.chPrev) || sc.chPrev == '/' || sc.chPrev == '!') && (!IsASpace(sc.chNext))) {
|
|
styleBeforeDCKeyword = SCE_D_COMMENTLINEDOC;
|
|
sc.SetState(SCE_D_COMMENTDOCKEYWORD);
|
|
}
|
|
}
|
|
break;
|
|
case SCE_D_COMMENTDOCKEYWORD:
|
|
if ((styleBeforeDCKeyword == SCE_D_COMMENTDOC) && sc.Match('*', '/')) {
|
|
sc.ChangeState(SCE_D_COMMENTDOCKEYWORDERROR);
|
|
sc.Forward();
|
|
sc.ForwardSetState(SCE_D_DEFAULT);
|
|
} else if (!IsDoxygen(sc.ch)) {
|
|
char s[100];
|
|
if (caseSensitive) {
|
|
sc.GetCurrent(s, sizeof(s));
|
|
} else {
|
|
sc.GetCurrentLowered(s, sizeof(s));
|
|
}
|
|
if (!IsASpace(sc.ch) || !keywords3.InList(s + 1)) {
|
|
sc.ChangeState(SCE_D_COMMENTDOCKEYWORDERROR);
|
|
}
|
|
sc.SetState(styleBeforeDCKeyword);
|
|
}
|
|
break;
|
|
case SCE_D_COMMENTNESTED:
|
|
if (sc.Match('+', '/')) {
|
|
if (curNcLevel > 0)
|
|
curNcLevel -= 1;
|
|
curLine = styler.GetLine(sc.currentPos);
|
|
styler.SetLineState(curLine, curNcLevel);
|
|
sc.Forward();
|
|
if (curNcLevel == 0) {
|
|
sc.ForwardSetState(SCE_D_DEFAULT);
|
|
}
|
|
} else if (sc.Match('/','+')) {
|
|
curNcLevel += 1;
|
|
curLine = styler.GetLine(sc.currentPos);
|
|
styler.SetLineState(curLine, curNcLevel);
|
|
sc.Forward();
|
|
}
|
|
break;
|
|
case SCE_D_STRING:
|
|
if (sc.ch == '\\') {
|
|
if (sc.chNext == '"' || sc.chNext == '\\') {
|
|
sc.Forward();
|
|
}
|
|
} else if (sc.ch == '"') {
|
|
if(IsStringSuffix(sc.chNext))
|
|
sc.Forward();
|
|
sc.ForwardSetState(SCE_D_DEFAULT);
|
|
}
|
|
break;
|
|
case SCE_D_CHARACTER:
|
|
if (sc.atLineEnd) {
|
|
sc.ChangeState(SCE_D_STRINGEOL);
|
|
} else if (sc.ch == '\\') {
|
|
if (sc.chNext == '\'' || sc.chNext == '\\') {
|
|
sc.Forward();
|
|
}
|
|
} else if (sc.ch == '\'') {
|
|
// Char has no suffixes
|
|
sc.ForwardSetState(SCE_D_DEFAULT);
|
|
}
|
|
break;
|
|
case SCE_D_STRINGEOL:
|
|
if (sc.atLineStart) {
|
|
sc.SetState(SCE_D_DEFAULT);
|
|
}
|
|
break;
|
|
case SCE_D_STRINGB:
|
|
if (sc.ch == '`') {
|
|
if(IsStringSuffix(sc.chNext))
|
|
sc.Forward();
|
|
sc.ForwardSetState(SCE_D_DEFAULT);
|
|
}
|
|
break;
|
|
case SCE_D_STRINGR:
|
|
if (sc.ch == '"') {
|
|
if(IsStringSuffix(sc.chNext))
|
|
sc.Forward();
|
|
sc.ForwardSetState(SCE_D_DEFAULT);
|
|
}
|
|
break;
|
|
}
|
|
|
|
// Determine if a new state should be entered.
|
|
if (sc.state == SCE_D_DEFAULT) {
|
|
if (IsADigit(sc.ch) || (sc.ch == '.' && IsADigit(sc.chNext))) {
|
|
sc.SetState(SCE_D_NUMBER);
|
|
numFloat = sc.ch == '.';
|
|
// Remember hex literal
|
|
numHex = sc.ch == '0' && ( sc.chNext == 'x' || sc.chNext == 'X' );
|
|
} else if ( (sc.ch == 'r' || sc.ch == 'x' || sc.ch == 'q')
|
|
&& sc.chNext == '"' ) {
|
|
// Limited support for hex and delimited strings: parse as r""
|
|
sc.SetState(SCE_D_STRINGR);
|
|
sc.Forward();
|
|
} else if (IsWordStart(sc.ch) || sc.ch == '$') {
|
|
sc.SetState(SCE_D_IDENTIFIER);
|
|
} else if (sc.Match('/','+')) {
|
|
curNcLevel += 1;
|
|
curLine = styler.GetLine(sc.currentPos);
|
|
styler.SetLineState(curLine, curNcLevel);
|
|
sc.SetState(SCE_D_COMMENTNESTED);
|
|
sc.Forward();
|
|
} else if (sc.Match('/', '*')) {
|
|
if (sc.Match("/**") || sc.Match("/*!")) { // Support of Qt/Doxygen doc. style
|
|
sc.SetState(SCE_D_COMMENTDOC);
|
|
} else {
|
|
sc.SetState(SCE_D_COMMENT);
|
|
}
|
|
sc.Forward(); // Eat the * so it isn't used for the end of the comment
|
|
} else if (sc.Match('/', '/')) {
|
|
if ((sc.Match("///") && !sc.Match("////")) || sc.Match("//!"))
|
|
// Support of Qt/Doxygen doc. style
|
|
sc.SetState(SCE_D_COMMENTLINEDOC);
|
|
else
|
|
sc.SetState(SCE_D_COMMENTLINE);
|
|
} else if (sc.ch == '"') {
|
|
sc.SetState(SCE_D_STRING);
|
|
} else if (sc.ch == '\'') {
|
|
sc.SetState(SCE_D_CHARACTER);
|
|
} else if (sc.ch == '`') {
|
|
sc.SetState(SCE_D_STRINGB);
|
|
} else if (isoperator(static_cast<char>(sc.ch))) {
|
|
sc.SetState(SCE_D_OPERATOR);
|
|
if (sc.ch == '.' && sc.chNext == '.') sc.Forward(); // Range operator
|
|
}
|
|
}
|
|
}
|
|
sc.Complete();
|
|
}
|
|
|
|
// Store both the current line's fold level and the next lines in the
|
|
// level store to make it easy to pick up with each increment
|
|
// and to make it possible to fiddle the current level for "} else {".
|
|
|
|
void SCI_METHOD LexerD::Fold(unsigned int startPos, int length, int initStyle, IDocument *pAccess) {
|
|
|
|
if (!options.fold)
|
|
return;
|
|
|
|
LexAccessor styler(pAccess);
|
|
|
|
unsigned int endPos = startPos + length;
|
|
int visibleChars = 0;
|
|
int lineCurrent = styler.GetLine(startPos);
|
|
int levelCurrent = SC_FOLDLEVELBASE;
|
|
if (lineCurrent > 0)
|
|
levelCurrent = styler.LevelAt(lineCurrent-1) >> 16;
|
|
int levelMinCurrent = levelCurrent;
|
|
int levelNext = levelCurrent;
|
|
char chNext = styler[startPos];
|
|
int styleNext = styler.StyleAt(startPos);
|
|
int style = initStyle;
|
|
bool foldAtElse = options.foldAtElseInt >= 0 ? options.foldAtElseInt != 0 : options.foldAtElse;
|
|
const bool userDefinedFoldMarkers = !options.foldExplicitStart.empty() && !options.foldExplicitEnd.empty();
|
|
for (unsigned int i = startPos; i < endPos; i++) {
|
|
char ch = chNext;
|
|
chNext = styler.SafeGetCharAt(i + 1);
|
|
int stylePrev = style;
|
|
style = styleNext;
|
|
styleNext = styler.StyleAt(i + 1);
|
|
bool atEOL = (ch == '\r' && chNext != '\n') || (ch == '\n');
|
|
if (options.foldComment && options.foldCommentMultiline && IsStreamCommentStyle(style)) {
|
|
if (!IsStreamCommentStyle(stylePrev)) {
|
|
levelNext++;
|
|
} else if (!IsStreamCommentStyle(styleNext) && !atEOL) {
|
|
// Comments don't end at end of line and the next character may be unstyled.
|
|
levelNext--;
|
|
}
|
|
}
|
|
if (options.foldComment && options.foldCommentExplicit && ((style == SCE_D_COMMENTLINE) || options.foldExplicitAnywhere)) {
|
|
if (userDefinedFoldMarkers) {
|
|
if (styler.Match(i, options.foldExplicitStart.c_str())) {
|
|
levelNext++;
|
|
} else if (styler.Match(i, options.foldExplicitEnd.c_str())) {
|
|
levelNext--;
|
|
}
|
|
} else {
|
|
if ((ch == '/') && (chNext == '/')) {
|
|
char chNext2 = styler.SafeGetCharAt(i + 2);
|
|
if (chNext2 == '{') {
|
|
levelNext++;
|
|
} else if (chNext2 == '}') {
|
|
levelNext--;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
if (options.foldSyntaxBased && (style == SCE_D_OPERATOR)) {
|
|
if (ch == '{') {
|
|
// Measure the minimum before a '{' to allow
|
|
// folding on "} else {"
|
|
if (levelMinCurrent > levelNext) {
|
|
levelMinCurrent = levelNext;
|
|
}
|
|
levelNext++;
|
|
} else if (ch == '}') {
|
|
levelNext--;
|
|
}
|
|
}
|
|
if (atEOL || (i == endPos-1)) {
|
|
if (options.foldComment && options.foldCommentMultiline) { // Handle nested comments
|
|
int nc;
|
|
nc = styler.GetLineState(lineCurrent);
|
|
nc -= lineCurrent>0? styler.GetLineState(lineCurrent-1): 0;
|
|
levelNext += nc;
|
|
}
|
|
int levelUse = levelCurrent;
|
|
if (options.foldSyntaxBased && foldAtElse) {
|
|
levelUse = levelMinCurrent;
|
|
}
|
|
int lev = levelUse | levelNext << 16;
|
|
if (visibleChars == 0 && options.foldCompact)
|
|
lev |= SC_FOLDLEVELWHITEFLAG;
|
|
if (levelUse < levelNext)
|
|
lev |= SC_FOLDLEVELHEADERFLAG;
|
|
if (lev != styler.LevelAt(lineCurrent)) {
|
|
styler.SetLevel(lineCurrent, lev);
|
|
}
|
|
lineCurrent++;
|
|
levelCurrent = levelNext;
|
|
levelMinCurrent = levelCurrent;
|
|
visibleChars = 0;
|
|
}
|
|
if (!IsASpace(ch))
|
|
visibleChars++;
|
|
}
|
|
}
|
|
|
|
LexerModule lmD(SCLEX_D, LexerD::LexerFactoryD, "d", dWordLists);
|