2022-01-04 23:07:50 +00:00
|
|
|
// Lexilla lexer library
|
2021-02-21 04:53:09 +00:00
|
|
|
/** @file TestDocument.cxx
|
|
|
|
** Lexer testing.
|
|
|
|
**/
|
|
|
|
// Copyright 2019 by Neil Hodgson <neilh@scintilla.org>
|
|
|
|
// The License.txt file describes the conditions under which this software may be distributed.
|
|
|
|
|
|
|
|
#include <cassert>
|
|
|
|
|
|
|
|
#include <string>
|
|
|
|
#include <string_view>
|
|
|
|
#include <vector>
|
|
|
|
#include <algorithm>
|
|
|
|
|
|
|
|
#include <iostream>
|
|
|
|
|
|
|
|
#include "ILexer.h"
|
|
|
|
|
|
|
|
#include "TestDocument.h"
|
|
|
|
|
|
|
|
namespace {
|
|
|
|
|
|
|
|
const unsigned char UTF8BytesOfLead[256] = {
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 00 - 0F
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 10 - 1F
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 20 - 2F
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 30 - 3F
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 40 - 4F
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 50 - 5F
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 60 - 6F
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 70 - 7F
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 80 - 8F
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 90 - 9F
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // A0 - AF
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // B0 - BF
|
|
|
|
1, 1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, // C0 - CF
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, // D0 - DF
|
|
|
|
3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, // E0 - EF
|
|
|
|
4, 4, 4, 4, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // F0 - FF
|
|
|
|
};
|
|
|
|
|
|
|
|
int UnicodeFromUTF8(const unsigned char *us) noexcept {
|
2022-04-13 11:10:12 +00:00
|
|
|
assert(us);
|
2021-02-21 04:53:09 +00:00
|
|
|
switch (UTF8BytesOfLead[us[0]]) {
|
|
|
|
case 1:
|
|
|
|
return us[0];
|
|
|
|
case 2:
|
|
|
|
return ((us[0] & 0x1F) << 6) + (us[1] & 0x3F);
|
|
|
|
case 3:
|
|
|
|
return ((us[0] & 0xF) << 12) + ((us[1] & 0x3F) << 6) + (us[2] & 0x3F);
|
|
|
|
default:
|
|
|
|
return ((us[0] & 0x7) << 18) + ((us[1] & 0x3F) << 12) + ((us[2] & 0x3F) << 6) + (us[3] & 0x3F);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
inline constexpr bool UTF8IsTrailByte(unsigned char ch) noexcept {
|
|
|
|
return (ch >= 0x80) && (ch < 0xc0);
|
|
|
|
}
|
|
|
|
|
2022-04-13 11:10:12 +00:00
|
|
|
constexpr unsigned char TrailByteValue(unsigned char c) {
|
|
|
|
// The top 2 bits are 0b10 to indicate a trail byte.
|
|
|
|
// The lower 6 bits contain the value.
|
|
|
|
return c & 0b0011'1111;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
std::u32string UTF32FromUTF8(std::string_view svu8) {
|
|
|
|
std::u32string ret;
|
|
|
|
for (size_t i = 0; i < svu8.length();) {
|
|
|
|
unsigned char ch = svu8.at(i);
|
|
|
|
const unsigned int byteCount = UTF8BytesOfLead[ch];
|
|
|
|
unsigned int value = 0;
|
|
|
|
|
|
|
|
if (i + byteCount > svu8.length()) {
|
|
|
|
// Trying to read past end
|
|
|
|
ret.push_back(ch);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
i++;
|
|
|
|
switch (byteCount) {
|
|
|
|
case 1:
|
|
|
|
value = ch;
|
|
|
|
break;
|
|
|
|
case 2:
|
|
|
|
value = (ch & 0x1F) << 6;
|
|
|
|
ch = svu8.at(i++);
|
|
|
|
value += TrailByteValue(ch);
|
|
|
|
break;
|
|
|
|
case 3:
|
|
|
|
value = (ch & 0xF) << 12;
|
|
|
|
ch = svu8.at(i++);
|
|
|
|
value += TrailByteValue(ch) << 6;
|
|
|
|
ch = svu8.at(i++);
|
|
|
|
value += TrailByteValue(ch);
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
value = (ch & 0x7) << 18;
|
|
|
|
ch = svu8.at(i++);
|
|
|
|
value += TrailByteValue(ch) << 12;
|
|
|
|
ch = svu8.at(i++);
|
|
|
|
value += TrailByteValue(ch) << 6;
|
|
|
|
ch = svu8.at(i++);
|
|
|
|
value += TrailByteValue(ch);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
ret.push_back(value);
|
|
|
|
}
|
|
|
|
return ret;
|
2021-02-21 04:53:09 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void TestDocument::Set(std::string_view sv) {
|
|
|
|
text = sv;
|
2022-01-04 23:07:50 +00:00
|
|
|
textStyles.resize(text.size() + 1);
|
2021-02-21 04:53:09 +00:00
|
|
|
lineStarts.clear();
|
|
|
|
endStyled = 0;
|
|
|
|
lineStarts.push_back(0);
|
|
|
|
for (size_t pos = 0; pos < text.length(); pos++) {
|
2022-04-13 11:10:12 +00:00
|
|
|
if (text.at(pos) == '\n') {
|
2021-02-21 04:53:09 +00:00
|
|
|
lineStarts.push_back(pos + 1);
|
|
|
|
}
|
|
|
|
}
|
Update scintilla 5.3.4 and lexilla 5.2.4 with:
https://www.scintilla.org/scintilla534.zip
Released 8 March 2023.
Add multithreaded wrap to significantly improve performance of wrapping large files.
More typesafe bindings of *Full APIs in ScintillaCall. Feature #1477.
Fix overlapping of text with line end wrap marker. Bug #2378.
Fix clipping of line end wrap symbol for SC_WRAPVISUALFLAGLOC_END_BY_TEXT.
Where a multi-byte character contains multiple styles, display each byte as a representation. This makes it easier to see and fix lexers that change styles mid-character, commonly because they use fixed size buffers.
Fix a potential crash with autocompletion list fill-ups where a SCN_CHARADDED handler retriggered an autocompletion list, but with no items that match the typed character.
lexilla523
Released 8 March 2023.
Add scripts/PromoteNew.bat script to promote .new files after checking.
Makefile: Remove 1024-byte line length limit..
Ruby: Add new lexical classes for % literals SCE_RB_STRING_W (%w non-interpolable string array), SCE_RB_STRING_I (%i non-interpolable symbol array), SCE_RB_STRING_QI (%I interpolable symbol array), and SCE_RB_STRING_QS (%s symbol). Issue #124.
Ruby: Disambiguate %= which may be a quote or modulo assignment. Issue #124, Bug #1255, Bug #2182.
Ruby: Fix additional fold level for single character in SCE_RB_STRING_QW. Issue #132.
Ruby: Set SCE_RB_HERE_QQ for unquoted and double-quoted heredocs and SCE_RB_HERE_QX for backticks-quoted heredocs. Issue #134.
Ruby: Recognise #{} inside SCE_RB_HERE_QQ and SCE_RB_HERE_QX. Issue #134.
Ruby: Improve regex and heredoc recognition. Issue #136.
Ruby: Highlight #@, #@@ and #$ style interpolation. Issue #140.
Ruby: Fix folding for multiple heredocs started on one line. Fix folding when there is a space after heredoc opening delimiter. Issue #135.
YAML: Remove 1024-byte line length limit.
https://www.scintilla.org/lexilla524.zip
Released 13 March 2023.
C++: Fix failure to recognize keywords containing upper case. Issue #149.
GDScript: Support % and $ node paths. Issue #145, Pull request #146.
Close #13338
2023-03-10 02:37:21 +00:00
|
|
|
if (lineStarts.back() != Length()) {
|
|
|
|
lineStarts.push_back(Length());
|
|
|
|
}
|
2023-09-22 09:32:35 +00:00
|
|
|
lineStates.resize(lineStarts.size() + 1);
|
2022-01-04 23:07:50 +00:00
|
|
|
lineLevels.resize(lineStarts.size(), 0x400);
|
2021-02-21 04:53:09 +00:00
|
|
|
}
|
|
|
|
|
2023-02-09 16:57:24 +00:00
|
|
|
#if defined(_MSC_VER)
|
2022-01-04 23:07:50 +00:00
|
|
|
// IDocument interface does not specify noexcept so best to not add it to implementation
|
|
|
|
#pragma warning(disable: 26440)
|
|
|
|
#endif
|
|
|
|
|
Update scintilla 5.3.4 and lexilla 5.2.4 with:
https://www.scintilla.org/scintilla534.zip
Released 8 March 2023.
Add multithreaded wrap to significantly improve performance of wrapping large files.
More typesafe bindings of *Full APIs in ScintillaCall. Feature #1477.
Fix overlapping of text with line end wrap marker. Bug #2378.
Fix clipping of line end wrap symbol for SC_WRAPVISUALFLAGLOC_END_BY_TEXT.
Where a multi-byte character contains multiple styles, display each byte as a representation. This makes it easier to see and fix lexers that change styles mid-character, commonly because they use fixed size buffers.
Fix a potential crash with autocompletion list fill-ups where a SCN_CHARADDED handler retriggered an autocompletion list, but with no items that match the typed character.
lexilla523
Released 8 March 2023.
Add scripts/PromoteNew.bat script to promote .new files after checking.
Makefile: Remove 1024-byte line length limit..
Ruby: Add new lexical classes for % literals SCE_RB_STRING_W (%w non-interpolable string array), SCE_RB_STRING_I (%i non-interpolable symbol array), SCE_RB_STRING_QI (%I interpolable symbol array), and SCE_RB_STRING_QS (%s symbol). Issue #124.
Ruby: Disambiguate %= which may be a quote or modulo assignment. Issue #124, Bug #1255, Bug #2182.
Ruby: Fix additional fold level for single character in SCE_RB_STRING_QW. Issue #132.
Ruby: Set SCE_RB_HERE_QQ for unquoted and double-quoted heredocs and SCE_RB_HERE_QX for backticks-quoted heredocs. Issue #134.
Ruby: Recognise #{} inside SCE_RB_HERE_QQ and SCE_RB_HERE_QX. Issue #134.
Ruby: Improve regex and heredoc recognition. Issue #136.
Ruby: Highlight #@, #@@ and #$ style interpolation. Issue #140.
Ruby: Fix folding for multiple heredocs started on one line. Fix folding when there is a space after heredoc opening delimiter. Issue #135.
YAML: Remove 1024-byte line length limit.
https://www.scintilla.org/lexilla524.zip
Released 13 March 2023.
C++: Fix failure to recognize keywords containing upper case. Issue #149.
GDScript: Support % and $ node paths. Issue #145, Pull request #146.
Close #13338
2023-03-10 02:37:21 +00:00
|
|
|
Sci_Position TestDocument::MaxLine() const noexcept {
|
|
|
|
return lineStarts.size() - 1;
|
|
|
|
}
|
|
|
|
|
2021-02-21 04:53:09 +00:00
|
|
|
int SCI_METHOD TestDocument::Version() const {
|
|
|
|
return Scintilla::dvRelease4;
|
|
|
|
}
|
|
|
|
|
|
|
|
void SCI_METHOD TestDocument::SetErrorStatus(int) {
|
|
|
|
}
|
|
|
|
|
|
|
|
Sci_Position SCI_METHOD TestDocument::Length() const {
|
|
|
|
return text.length();
|
|
|
|
}
|
|
|
|
|
|
|
|
void SCI_METHOD TestDocument::GetCharRange(char *buffer, Sci_Position position, Sci_Position lengthRetrieve) const {
|
|
|
|
text.copy(buffer, lengthRetrieve, position);
|
|
|
|
}
|
|
|
|
|
|
|
|
char SCI_METHOD TestDocument::StyleAt(Sci_Position position) const {
|
2022-01-04 23:07:50 +00:00
|
|
|
if (position < 0) {
|
|
|
|
return 0;
|
|
|
|
}
|
2021-02-21 04:53:09 +00:00
|
|
|
return textStyles.at(position);
|
|
|
|
}
|
|
|
|
|
|
|
|
Sci_Position SCI_METHOD TestDocument::LineFromPosition(Sci_Position position) const {
|
Update scintilla 5.3.4 and lexilla 5.2.4 with:
https://www.scintilla.org/scintilla534.zip
Released 8 March 2023.
Add multithreaded wrap to significantly improve performance of wrapping large files.
More typesafe bindings of *Full APIs in ScintillaCall. Feature #1477.
Fix overlapping of text with line end wrap marker. Bug #2378.
Fix clipping of line end wrap symbol for SC_WRAPVISUALFLAGLOC_END_BY_TEXT.
Where a multi-byte character contains multiple styles, display each byte as a representation. This makes it easier to see and fix lexers that change styles mid-character, commonly because they use fixed size buffers.
Fix a potential crash with autocompletion list fill-ups where a SCN_CHARADDED handler retriggered an autocompletion list, but with no items that match the typed character.
lexilla523
Released 8 March 2023.
Add scripts/PromoteNew.bat script to promote .new files after checking.
Makefile: Remove 1024-byte line length limit..
Ruby: Add new lexical classes for % literals SCE_RB_STRING_W (%w non-interpolable string array), SCE_RB_STRING_I (%i non-interpolable symbol array), SCE_RB_STRING_QI (%I interpolable symbol array), and SCE_RB_STRING_QS (%s symbol). Issue #124.
Ruby: Disambiguate %= which may be a quote or modulo assignment. Issue #124, Bug #1255, Bug #2182.
Ruby: Fix additional fold level for single character in SCE_RB_STRING_QW. Issue #132.
Ruby: Set SCE_RB_HERE_QQ for unquoted and double-quoted heredocs and SCE_RB_HERE_QX for backticks-quoted heredocs. Issue #134.
Ruby: Recognise #{} inside SCE_RB_HERE_QQ and SCE_RB_HERE_QX. Issue #134.
Ruby: Improve regex and heredoc recognition. Issue #136.
Ruby: Highlight #@, #@@ and #$ style interpolation. Issue #140.
Ruby: Fix folding for multiple heredocs started on one line. Fix folding when there is a space after heredoc opening delimiter. Issue #135.
YAML: Remove 1024-byte line length limit.
https://www.scintilla.org/lexilla524.zip
Released 13 March 2023.
C++: Fix failure to recognize keywords containing upper case. Issue #149.
GDScript: Support % and $ node paths. Issue #145, Pull request #146.
Close #13338
2023-03-10 02:37:21 +00:00
|
|
|
if (position >= Length()) {
|
|
|
|
return MaxLine();
|
2021-02-21 04:53:09 +00:00
|
|
|
}
|
|
|
|
|
2022-01-04 23:07:50 +00:00
|
|
|
const std::vector<Sci_Position>::const_iterator it = std::lower_bound(lineStarts.begin(), lineStarts.end(), position);
|
2021-02-21 04:53:09 +00:00
|
|
|
Sci_Position line = it - lineStarts.begin();
|
|
|
|
if (*it > position)
|
|
|
|
line--;
|
|
|
|
return line;
|
|
|
|
}
|
|
|
|
|
|
|
|
Sci_Position SCI_METHOD TestDocument::LineStart(Sci_Position line) const {
|
2022-01-04 23:07:50 +00:00
|
|
|
if (line < 0) {
|
|
|
|
return 0;
|
|
|
|
}
|
2021-02-21 04:53:09 +00:00
|
|
|
if (line >= static_cast<Sci_Position>(lineStarts.size())) {
|
Update scintilla 5.3.4 and lexilla 5.2.4 with:
https://www.scintilla.org/scintilla534.zip
Released 8 March 2023.
Add multithreaded wrap to significantly improve performance of wrapping large files.
More typesafe bindings of *Full APIs in ScintillaCall. Feature #1477.
Fix overlapping of text with line end wrap marker. Bug #2378.
Fix clipping of line end wrap symbol for SC_WRAPVISUALFLAGLOC_END_BY_TEXT.
Where a multi-byte character contains multiple styles, display each byte as a representation. This makes it easier to see and fix lexers that change styles mid-character, commonly because they use fixed size buffers.
Fix a potential crash with autocompletion list fill-ups where a SCN_CHARADDED handler retriggered an autocompletion list, but with no items that match the typed character.
lexilla523
Released 8 March 2023.
Add scripts/PromoteNew.bat script to promote .new files after checking.
Makefile: Remove 1024-byte line length limit..
Ruby: Add new lexical classes for % literals SCE_RB_STRING_W (%w non-interpolable string array), SCE_RB_STRING_I (%i non-interpolable symbol array), SCE_RB_STRING_QI (%I interpolable symbol array), and SCE_RB_STRING_QS (%s symbol). Issue #124.
Ruby: Disambiguate %= which may be a quote or modulo assignment. Issue #124, Bug #1255, Bug #2182.
Ruby: Fix additional fold level for single character in SCE_RB_STRING_QW. Issue #132.
Ruby: Set SCE_RB_HERE_QQ for unquoted and double-quoted heredocs and SCE_RB_HERE_QX for backticks-quoted heredocs. Issue #134.
Ruby: Recognise #{} inside SCE_RB_HERE_QQ and SCE_RB_HERE_QX. Issue #134.
Ruby: Improve regex and heredoc recognition. Issue #136.
Ruby: Highlight #@, #@@ and #$ style interpolation. Issue #140.
Ruby: Fix folding for multiple heredocs started on one line. Fix folding when there is a space after heredoc opening delimiter. Issue #135.
YAML: Remove 1024-byte line length limit.
https://www.scintilla.org/lexilla524.zip
Released 13 March 2023.
C++: Fix failure to recognize keywords containing upper case. Issue #149.
GDScript: Support % and $ node paths. Issue #145, Pull request #146.
Close #13338
2023-03-10 02:37:21 +00:00
|
|
|
return Length();
|
2021-02-21 04:53:09 +00:00
|
|
|
}
|
|
|
|
return lineStarts.at(line);
|
|
|
|
}
|
|
|
|
|
2022-01-04 23:07:50 +00:00
|
|
|
int SCI_METHOD TestDocument::GetLevel(Sci_Position line) const {
|
|
|
|
return lineLevels.at(line);
|
2021-02-21 04:53:09 +00:00
|
|
|
}
|
|
|
|
|
2022-01-04 23:07:50 +00:00
|
|
|
int SCI_METHOD TestDocument::SetLevel(Sci_Position line, int level) {
|
Update scintilla 5.3.4 and lexilla 5.2.4 with:
https://www.scintilla.org/scintilla534.zip
Released 8 March 2023.
Add multithreaded wrap to significantly improve performance of wrapping large files.
More typesafe bindings of *Full APIs in ScintillaCall. Feature #1477.
Fix overlapping of text with line end wrap marker. Bug #2378.
Fix clipping of line end wrap symbol for SC_WRAPVISUALFLAGLOC_END_BY_TEXT.
Where a multi-byte character contains multiple styles, display each byte as a representation. This makes it easier to see and fix lexers that change styles mid-character, commonly because they use fixed size buffers.
Fix a potential crash with autocompletion list fill-ups where a SCN_CHARADDED handler retriggered an autocompletion list, but with no items that match the typed character.
lexilla523
Released 8 March 2023.
Add scripts/PromoteNew.bat script to promote .new files after checking.
Makefile: Remove 1024-byte line length limit..
Ruby: Add new lexical classes for % literals SCE_RB_STRING_W (%w non-interpolable string array), SCE_RB_STRING_I (%i non-interpolable symbol array), SCE_RB_STRING_QI (%I interpolable symbol array), and SCE_RB_STRING_QS (%s symbol). Issue #124.
Ruby: Disambiguate %= which may be a quote or modulo assignment. Issue #124, Bug #1255, Bug #2182.
Ruby: Fix additional fold level for single character in SCE_RB_STRING_QW. Issue #132.
Ruby: Set SCE_RB_HERE_QQ for unquoted and double-quoted heredocs and SCE_RB_HERE_QX for backticks-quoted heredocs. Issue #134.
Ruby: Recognise #{} inside SCE_RB_HERE_QQ and SCE_RB_HERE_QX. Issue #134.
Ruby: Improve regex and heredoc recognition. Issue #136.
Ruby: Highlight #@, #@@ and #$ style interpolation. Issue #140.
Ruby: Fix folding for multiple heredocs started on one line. Fix folding when there is a space after heredoc opening delimiter. Issue #135.
YAML: Remove 1024-byte line length limit.
https://www.scintilla.org/lexilla524.zip
Released 13 March 2023.
C++: Fix failure to recognize keywords containing upper case. Issue #149.
GDScript: Support % and $ node paths. Issue #145, Pull request #146.
Close #13338
2023-03-10 02:37:21 +00:00
|
|
|
if (line == static_cast<Sci_Position>(lineLevels.size())) {
|
|
|
|
return 0x400;
|
|
|
|
}
|
2022-01-04 23:07:50 +00:00
|
|
|
return lineLevels.at(line) = level;
|
2021-02-21 04:53:09 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
int SCI_METHOD TestDocument::GetLineState(Sci_Position line) const {
|
|
|
|
return lineStates.at(line);
|
|
|
|
}
|
|
|
|
|
|
|
|
int SCI_METHOD TestDocument::SetLineState(Sci_Position line, int state) {
|
|
|
|
return lineStates.at(line) = state;
|
|
|
|
}
|
|
|
|
|
|
|
|
void SCI_METHOD TestDocument::StartStyling(Sci_Position position) {
|
|
|
|
endStyled = position;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool SCI_METHOD TestDocument::SetStyleFor(Sci_Position length, char style) {
|
|
|
|
for (Sci_Position i = 0; i < length; i++) {
|
2022-04-13 11:10:12 +00:00
|
|
|
textStyles.at(endStyled) = style;
|
2021-02-21 04:53:09 +00:00
|
|
|
endStyled++;
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool SCI_METHOD TestDocument::SetStyles(Sci_Position length, const char *styles) {
|
2022-04-13 11:10:12 +00:00
|
|
|
assert(styles);
|
2021-02-21 04:53:09 +00:00
|
|
|
for (Sci_Position i = 0; i < length; i++) {
|
2022-04-13 11:10:12 +00:00
|
|
|
textStyles.at(endStyled) = styles[i];
|
2021-02-21 04:53:09 +00:00
|
|
|
endStyled++;
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
void SCI_METHOD TestDocument::DecorationSetCurrentIndicator(int) {
|
|
|
|
// Not implemented as no way to read decorations
|
|
|
|
}
|
|
|
|
|
|
|
|
void SCI_METHOD TestDocument::DecorationFillRange(Sci_Position, int, Sci_Position) {
|
|
|
|
// Not implemented as no way to read decorations
|
|
|
|
}
|
|
|
|
|
|
|
|
void SCI_METHOD TestDocument::ChangeLexerState(Sci_Position, Sci_Position) {
|
|
|
|
// Not implemented as no watcher to trigger
|
|
|
|
}
|
|
|
|
|
|
|
|
int SCI_METHOD TestDocument::CodePage() const {
|
|
|
|
// Always UTF-8 for now
|
|
|
|
return 65001;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool SCI_METHOD TestDocument::IsDBCSLeadByte(char) const {
|
|
|
|
// Always UTF-8 for now
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
const char *SCI_METHOD TestDocument::BufferPointer() {
|
|
|
|
return text.c_str();
|
|
|
|
}
|
|
|
|
|
|
|
|
int SCI_METHOD TestDocument::GetLineIndentation(Sci_Position) {
|
|
|
|
// Never actually called - lexers use Accessor::IndentAmount
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
Sci_Position SCI_METHOD TestDocument::LineEnd(Sci_Position line) const {
|
Update scintilla 5.3.4 and lexilla 5.2.4 with:
https://www.scintilla.org/scintilla534.zip
Released 8 March 2023.
Add multithreaded wrap to significantly improve performance of wrapping large files.
More typesafe bindings of *Full APIs in ScintillaCall. Feature #1477.
Fix overlapping of text with line end wrap marker. Bug #2378.
Fix clipping of line end wrap symbol for SC_WRAPVISUALFLAGLOC_END_BY_TEXT.
Where a multi-byte character contains multiple styles, display each byte as a representation. This makes it easier to see and fix lexers that change styles mid-character, commonly because they use fixed size buffers.
Fix a potential crash with autocompletion list fill-ups where a SCN_CHARADDED handler retriggered an autocompletion list, but with no items that match the typed character.
lexilla523
Released 8 March 2023.
Add scripts/PromoteNew.bat script to promote .new files after checking.
Makefile: Remove 1024-byte line length limit..
Ruby: Add new lexical classes for % literals SCE_RB_STRING_W (%w non-interpolable string array), SCE_RB_STRING_I (%i non-interpolable symbol array), SCE_RB_STRING_QI (%I interpolable symbol array), and SCE_RB_STRING_QS (%s symbol). Issue #124.
Ruby: Disambiguate %= which may be a quote or modulo assignment. Issue #124, Bug #1255, Bug #2182.
Ruby: Fix additional fold level for single character in SCE_RB_STRING_QW. Issue #132.
Ruby: Set SCE_RB_HERE_QQ for unquoted and double-quoted heredocs and SCE_RB_HERE_QX for backticks-quoted heredocs. Issue #134.
Ruby: Recognise #{} inside SCE_RB_HERE_QQ and SCE_RB_HERE_QX. Issue #134.
Ruby: Improve regex and heredoc recognition. Issue #136.
Ruby: Highlight #@, #@@ and #$ style interpolation. Issue #140.
Ruby: Fix folding for multiple heredocs started on one line. Fix folding when there is a space after heredoc opening delimiter. Issue #135.
YAML: Remove 1024-byte line length limit.
https://www.scintilla.org/lexilla524.zip
Released 13 March 2023.
C++: Fix failure to recognize keywords containing upper case. Issue #149.
GDScript: Support % and $ node paths. Issue #145, Pull request #146.
Close #13338
2023-03-10 02:37:21 +00:00
|
|
|
const Sci_Position maxLine = MaxLine();
|
|
|
|
if (line == maxLine || line == maxLine+1) {
|
|
|
|
return text.length();
|
|
|
|
}
|
|
|
|
assert(line < maxLine);
|
2021-02-21 04:53:09 +00:00
|
|
|
Sci_Position position = LineStart(line + 1);
|
|
|
|
position--; // Back over CR or LF
|
|
|
|
// When line terminator is CR+LF, may need to go back one more
|
|
|
|
if ((position > LineStart(line)) && (text.at(position - 1) == '\r')) {
|
|
|
|
position--;
|
|
|
|
}
|
|
|
|
return position;
|
|
|
|
}
|
|
|
|
|
|
|
|
Sci_Position SCI_METHOD TestDocument::GetRelativePosition(Sci_Position positionStart, Sci_Position characterOffset) const {
|
|
|
|
Sci_Position pos = positionStart;
|
|
|
|
if (characterOffset < 0) {
|
|
|
|
while (characterOffset < 0) {
|
|
|
|
if (pos <= 0) {
|
2023-09-22 09:32:35 +00:00
|
|
|
return -1;
|
2021-02-21 04:53:09 +00:00
|
|
|
}
|
|
|
|
unsigned char previousByte = text.at(pos - 1);
|
|
|
|
if (previousByte < 0x80) {
|
|
|
|
pos--;
|
|
|
|
characterOffset++;
|
|
|
|
} else {
|
|
|
|
while ((pos > 1) && UTF8IsTrailByte(previousByte)) {
|
|
|
|
pos--;
|
|
|
|
previousByte = text.at(pos - 1);
|
|
|
|
}
|
|
|
|
pos--;
|
|
|
|
// text[pos] is now a character start
|
|
|
|
characterOffset++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return pos;
|
|
|
|
}
|
|
|
|
assert(characterOffset >= 0);
|
|
|
|
// TODO: invalid UTF-8
|
|
|
|
while (characterOffset > 0) {
|
|
|
|
Sci_Position width = 0;
|
|
|
|
GetCharacterAndWidth(pos, &width);
|
|
|
|
pos += width;
|
|
|
|
characterOffset--;
|
|
|
|
}
|
|
|
|
return pos;
|
|
|
|
}
|
|
|
|
|
|
|
|
int SCI_METHOD TestDocument::GetCharacterAndWidth(Sci_Position position, Sci_Position *pWidth) const {
|
|
|
|
// TODO: invalid UTF-8
|
2023-09-22 09:32:35 +00:00
|
|
|
if ((position < 0) || (position >= Length())) {
|
|
|
|
// Return NULs before document start and after document end
|
2021-02-21 04:53:09 +00:00
|
|
|
if (pWidth) {
|
|
|
|
*pWidth = 1;
|
|
|
|
}
|
|
|
|
return '\0';
|
|
|
|
}
|
|
|
|
const unsigned char leadByte = text.at(position);
|
2022-01-04 23:07:50 +00:00
|
|
|
if (leadByte < 0x80) {
|
|
|
|
if (pWidth) {
|
|
|
|
*pWidth = 1;
|
|
|
|
}
|
|
|
|
return leadByte;
|
|
|
|
}
|
2021-02-21 04:53:09 +00:00
|
|
|
const int widthCharBytes = UTF8BytesOfLead[leadByte];
|
|
|
|
unsigned char charBytes[] = { leadByte,0,0,0 };
|
2022-04-13 11:10:12 +00:00
|
|
|
for (int b = 1; b < widthCharBytes; b++) {
|
|
|
|
charBytes[b] = text.at(position + b);
|
|
|
|
}
|
2021-02-21 04:53:09 +00:00
|
|
|
|
|
|
|
if (pWidth) {
|
|
|
|
*pWidth = widthCharBytes;
|
|
|
|
}
|
|
|
|
return UnicodeFromUTF8(charBytes);
|
|
|
|
}
|