// Scintilla source code edit control
/** @file CharacterSet.h
 ** Encapsulates a set of characters. Used to test if a character is within a set.
 **/
// Copyright 2007 by Neil Hodgson <neilh@scintilla.org>
// The License.txt file describes the conditions under which this software may be distributed.
|
|
|
|
|
|
|
|
#ifndef CHARACTERSET_H
|
|
|
|
#define CHARACTERSET_H
|
|
|
|
|
|
|
|
namespace Scintilla {
|
|
|
|
|
|
|
|
/**
 * A set of character values stored as a heap-allocated array of flags.
 *
 * Values in the range [0, size) have an individual flag in bset.
 * Contains() answers valueAfter for any value at or beyond size and
 * false for negative values.
 *
 * The class owns bset, so it defines all five special member functions:
 * copies duplicate the flag array, moves steal it and leave the source
 * with a null array and a size of 0.
 */
class CharacterSet {
	int size;
	bool valueAfter;
	bool *bset;
public:
	/** Bit flags selecting predefined ASCII ranges to add on construction. */
	enum setBase {
		setNone=0,
		setLower=1,
		setUpper=2,
		setDigits=4,
		setAlpha=setLower|setUpper,
		setAlphaNum=setAlpha|setDigits
	};

	/**
	 * Build a set of size_ flags, all initially false, then add every
	 * character of initialSet followed by the ranges selected by base.
	 * @param base        Combination of setBase flags (a-z, A-Z, 0-9).
	 * @param initialSet  NUL-terminated string of extra characters to add.
	 * @param size_       Number of individually tracked values.
	 * @param valueAfter_ Result of Contains() for values >= size_.
	 */
	CharacterSet(setBase base=setNone, const char *initialSet="", int size_=0x80, bool valueAfter_=false) :
		size(size_),
		valueAfter(valueAfter_),
		bset(new bool[size_]()) {	// () value-initialises every flag to false
		AddString(initialSet);
		if (base & setLower)
			AddString("abcdefghijklmnopqrstuvwxyz");
		if (base & setUpper)
			AddString("ABCDEFGHIJKLMNOPQRSTUVWXYZ");
		if (base & setDigits)
			AddString("0123456789");
	}

	/** Copy constructor: allocates a new flag array and copies other's flags. */
	CharacterSet(const CharacterSet &other) :
		size(other.size),
		valueAfter(other.valueAfter),
		bset(new bool[other.size]) {
		for (int i=0; i < size; i++) {
			bset[i] = other.bset[i];
		}
	}

	/** Move constructor: takes over other's array, leaving other empty. */
	CharacterSet(CharacterSet &&other) noexcept :
		size(other.size),
		valueAfter(other.valueAfter),
		bset(other.bset) {
		other.size = 0;
		other.bset = nullptr;
	}

	/** Copy assignment: replaces the contents with a copy of other. */
	CharacterSet &operator=(const CharacterSet &other) {
		if (this != &other) {
			// Allocate and fill the replacement before releasing the old
			// array so a failed allocation leaves this object unchanged.
			bool *bsetNew = new bool[other.size];
			for (int i = 0; i < other.size; i++) {
				bsetNew[i] = other.bset[i];
			}
			delete []bset;
			size = other.size;
			valueAfter = other.valueAfter;
			bset = bsetNew;
		}
		return *this;
	}

	/** Move assignment: frees the current array and takes over other's. */
	CharacterSet &operator=(CharacterSet &&other) noexcept {
		if (this != &other) {
			delete []bset;
			size = other.size;
			valueAfter = other.valueAfter;
			bset = other.bset;
			other.size = 0;
			other.bset = nullptr;
		}
		return *this;
	}

	/** Releases the flag array. */
	~CharacterSet() {
		delete []bset;
		bset = nullptr;
		size = 0;
	}

	/**
	 * Add a single value to the set.
	 * val must be in [0, size): this is asserted, and an out-of-range
	 * value is additionally ignored so that builds with assertions
	 * disabled never write outside the flag array.
	 */
	void Add(int val) {
		assert(val >= 0);
		assert(val < size);
		if ((val >= 0) && (val < size)) {
			bset[val] = true;
		}
	}

	/**
	 * Add every character of the NUL-terminated string setToAdd.
	 * Each character is treated as an unsigned char. Characters must be
	 * below size: this is asserted, and an out-of-range character is
	 * additionally skipped so that builds with assertions disabled never
	 * write outside the flag array.
	 */
	void AddString(const char *setToAdd) {
		for (const char *cp=setToAdd; *cp; cp++) {
			const unsigned char uch = *cp;
			assert(uch < size);
			if (uch < size) {
				bset[uch] = true;
			}
		}
	}

	/**
	 * Test whether val is in the set.
	 * @return false for negative val (also asserted), the stored flag for
	 *         val < size, otherwise valueAfter.
	 */
	bool Contains(int val) const noexcept {
		assert(val >= 0);
		if (val < 0) return false;
		return (val < size) ? bset[val] : valueAfter;
	}

	/** Test whether ch is in the set. */
	bool Contains(char ch) const noexcept {
		// Overload char as char may be signed
		const unsigned char uch = ch;
		return Contains(static_cast<int>(uch));
	}
};
|
|
|
|
|
|
|
|
// Functions for classifying characters
|
|
|
|
|
2021-02-21 04:53:09 +00:00
|
|
|
/**
 * Report whether ch is the space character or one of the values in the
 * range 0x09 to 0x0d inclusive.
 */
constexpr bool IsASpace(int ch) noexcept {
	return (ch == ' ') || ((ch >= 0x09) && (ch <= 0x0d));
}
|
|
|
|
|
2021-02-21 04:53:09 +00:00
|
|
|
/** Report whether ch is the space character or a horizontal tab. */
constexpr bool IsASpaceOrTab(int ch) noexcept {
	return (ch == ' ') || (ch == '\t');
}
|
|
|
|
|
2021-02-21 04:53:09 +00:00
|
|
|
/** Report whether ch is a decimal digit, '0' to '9'. */
constexpr bool IsADigit(int ch) noexcept {
	return (ch >= '0') && (ch <= '9');
}
|
|
|
|
|
2021-02-21 04:53:09 +00:00
|
|
|
/**
 * Report whether ch is a digit in the given number base.
 *
 * For base <= 10 only the first base characters starting at '0' count.
 * For larger bases '0'-'9' count, together with the first (base - 10)
 * letters starting at 'A' and at 'a'.
 * No upper limit is placed on base, so for base > 36 the accepted
 * ranges extend past 'Z' and 'z'.
 */
constexpr bool IsADigit(int ch, int base) noexcept {
	if (base <= 10) {
		return (ch >= '0') && (ch < '0' + base);
	} else {
		return ((ch >= '0') && (ch <= '9')) ||
		       ((ch >= 'A') && (ch < 'A' + base - 10)) ||
		       ((ch >= 'a') && (ch < 'a' + base - 10));
	}
}
|
|
|
|
|
2021-02-21 04:53:09 +00:00
|
|
|
/** Report whether ch lies in the 7-bit range 0 to 0x7f inclusive. */
constexpr bool IsASCII(int ch) noexcept {
	return (ch >= 0) && (ch < 0x80);
}
|
|
|
|
|
2021-02-21 04:53:09 +00:00
|
|
|
/** Report whether ch is a lower case letter, 'a' to 'z'. */
constexpr bool IsLowerCase(int ch) noexcept {
	return (ch >= 'a') && (ch <= 'z');
}
|
|
|
|
|
2021-02-21 04:53:09 +00:00
|
|
|
/** Report whether ch is an upper case letter, 'A' to 'Z'. */
constexpr bool IsUpperCase(int ch) noexcept {
	return (ch >= 'A') && (ch <= 'Z');
}
|
|
|
|
|
2021-02-21 04:53:09 +00:00
|
|
|
constexpr bool IsUpperOrLowerCase(int ch) noexcept {
|
2019-07-21 13:26:02 +00:00
|
|
|
return IsUpperCase(ch) || IsLowerCase(ch);
|
|
|
|
}
|
|
|
|
|
2021-02-21 04:53:09 +00:00
|
|
|
/**
 * Report whether ch is a decimal digit ('0'-'9'), a lower case letter
 * ('a'-'z') or an upper case letter ('A'-'Z').
 */
constexpr bool IsAlphaNumeric(int ch) noexcept {
	return
		((ch >= '0') && (ch <= '9')) ||
		((ch >= 'a') && (ch <= 'z')) ||
		((ch >= 'A') && (ch <= 'Z'));
}
|
|
|
|
|
|
|
|
/**
 * Check if a character is a space.
 * This is ASCII specific but is safe with chars >= 0x80.
 * Accepts the space character and the values 0x09 to 0x0d inclusive.
 */
constexpr bool isspacechar(int ch) noexcept {
	return (ch == ' ') || ((ch >= 0x09) && (ch <= 0x0d));
}
|
|
|
|
|
2021-02-21 04:53:09 +00:00
|
|
|
constexpr bool iswordchar(int ch) noexcept {
|
2013-08-28 00:44:27 +00:00
|
|
|
return IsAlphaNumeric(ch) || ch == '.' || ch == '_';
|
2010-08-21 23:59:56 +00:00
|
|
|
}
|
|
|
|
|
2021-02-21 04:53:09 +00:00
|
|
|
constexpr bool iswordstart(int ch) noexcept {
|
2013-08-28 00:44:27 +00:00
|
|
|
return IsAlphaNumeric(ch) || ch == '_';
|
2010-08-21 23:59:56 +00:00
|
|
|
}
|
|
|
|
|
2021-02-21 04:53:09 +00:00
|
|
|
constexpr bool isoperator(int ch) noexcept {
|
2013-08-28 00:44:27 +00:00
|
|
|
if (IsAlphaNumeric(ch))
|
2010-08-21 23:59:56 +00:00
|
|
|
return false;
|
|
|
|
if (ch == '%' || ch == '^' || ch == '&' || ch == '*' ||
|
|
|
|
ch == '(' || ch == ')' || ch == '-' || ch == '+' ||
|
|
|
|
ch == '=' || ch == '|' || ch == '{' || ch == '}' ||
|
|
|
|
ch == '[' || ch == ']' || ch == ':' || ch == ';' ||
|
|
|
|
ch == '<' || ch == '>' || ch == ',' || ch == '/' ||
|
|
|
|
ch == '?' || ch == '!' || ch == '.' || ch == '~')
|
|
|
|
return true;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2019-05-04 18:14:48 +00:00
|
|
|
// Simple case functions for ASCII supersets.
|
2010-08-21 23:59:56 +00:00
|
|
|
|
2019-05-04 18:14:48 +00:00
|
|
|
/**
 * Convert a lower case letter 'a'-'z' to the matching upper case letter.
 * Any other value is returned unchanged.
 * @tparam T Character-like type; the result is converted back to T.
 */
template <typename T>
constexpr T MakeUpperCase(T ch) noexcept {
	if (ch < 'a' || ch > 'z')
		return ch;
	else
		// The arithmetic may be carried out in a wider type than T, so
		// the narrowing back to T is spelled out.
		return static_cast<T>(ch - 'a' + 'A');
}
|
|
|
|
|
|
|
|
/**
 * Convert an upper case letter 'A'-'Z' to the matching lower case letter.
 * Any other value is returned unchanged.
 * @tparam T Character-like type; the result is converted back to T.
 */
template <typename T>
constexpr T MakeLowerCase(T ch) noexcept {
	if (ch < 'A' || ch > 'Z')
		return ch;
	else
		// The arithmetic may be carried out in a wider type than T, so
		// the narrowing back to T is spelled out.
		return static_cast<T>(ch - 'A' + 'a');
}
|
|
|
|
|
2021-02-21 04:53:09 +00:00
|
|
|
// Declaration only; no definition is visible in this header.
// NOTE(review): judging by the name this compares two C strings ignoring
// case and presumably returns a strcmp-style ordering value - confirm
// against the implementation.
int CompareCaseInsensitive(const char *a, const char *b) noexcept;
|
|
|
|
// Declaration only; no definition is visible in this header.
// NOTE(review): judging by the name and the len parameter this is a
// length-limited case-insensitive comparison of two C strings - confirm
// the exact semantics of len and the return value against the implementation.
// NOTE(review): size_t is used without an include in this header, so it
// appears to rely on the including file - confirm.
int CompareNCaseInsensitive(const char *a, const char *b, size_t len) noexcept;
|
2010-08-21 23:59:56 +00:00
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
#endif
|