You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
50 lines
1.3 KiB
50 lines
1.3 KiB
// Scintilla source code edit control |
|
/** @file CharacterCategory.h |
|
** Returns the Unicode general category of a character. |
|
**/ |
|
// Copyright 2013 by Neil Hodgson <neilh@scintilla.org> |
|
// The License.txt file describes the conditions under which this software may be distributed. |
|
|
|
#ifndef CHARACTERCATEGORY_H |
|
#define CHARACTERCATEGORY_H |
|
|
|
namespace Lexilla { |
|
|
|
enum CharacterCategory { |
|
ccLu, ccLl, ccLt, ccLm, ccLo, |
|
ccMn, ccMc, ccMe, |
|
ccNd, ccNl, ccNo, |
|
ccPc, ccPd, ccPs, ccPe, ccPi, ccPf, ccPo, |
|
ccSm, ccSc, ccSk, ccSo, |
|
ccZs, ccZl, ccZp, |
|
ccCc, ccCf, ccCs, ccCo, ccCn |
|
}; |
|
|
|
CharacterCategory CategoriseCharacter(int character) noexcept; |
|
|
|
// Common definitions of allowable characters in identifiers from UAX #31. |
|
bool IsIdStart(int character) noexcept; |
|
bool IsIdContinue(int character) noexcept; |
|
bool IsXidStart(int character) noexcept; |
|
bool IsXidContinue(int character) noexcept; |
|
|
|
class CharacterCategoryMap { |
|
private: |
|
std::vector<unsigned char> dense; |
|
public: |
|
CharacterCategoryMap(); |
|
CharacterCategory CategoryFor(int character) const noexcept { |
|
if (static_cast<size_t>(character) < dense.size()) { |
|
return static_cast<CharacterCategory>(dense[character]); |
|
} else { |
|
// binary search through ranges |
|
return CategoriseCharacter(character); |
|
} |
|
} |
|
int Size() const noexcept; |
|
void Optimize(int countCharacters); |
|
}; |
|
|
|
} |
|
|
|
#endif
|
|
|