#!/usr/bin/env python3
# -*- coding: utf-8 -*-
# Requires Python 2.7 or later

import io
import os
import sys
import unittest

# Select the Xite module for this platform: XiteWin on win32, XiteQt elsewhere.
if sys.platform == "win32":
    import XiteWin as Xite
else:
    import XiteQt as Xite

# Keyword lists handed to the "hypertext" lexer by the HTML, ASP and PHP tests.
# Item i of the list is passed to SetKeyWords(i, ...).
keywordsHTML = [
    b" ".join((
        b"b body content head href html link meta",
        b"name rel script strong title type xmlns",
    )),
    b"function",
    b"sub",
]

# Single keyword list handed to the "perl" lexer by the Perl tests.
# The words are kept in rows for readability and joined with one space each.
keywordsPerl = [
    b" ".join((
        b"NULL __FILE__ __LINE__ __PACKAGE__ __DATA__ __END__ AUTOLOAD",
        b"BEGIN CORE DESTROY END EQ GE GT INIT LE LT NE CHECK abs accept",
        b"alarm and atan2 bind binmode bless caller chdir chmod chomp chop",
        b"chown chr chroot close closedir cmp connect continue cos crypt",
        b"dbmclose dbmopen defined delete die do dump each else elsif endgrent",
        b"endhostent endnetent endprotoent endpwent endservent eof eq eval",
        b"exec exists exit exp fcntl fileno flock for foreach fork format",
        b"formline ge getc getgrent getgrgid getgrnam gethostbyaddr gethostbyname",
        b"gethostent getlogin getnetbyaddr getnetbyname getnetent getpeername",
        b"getpgrp getppid getpriority getprotobyname getprotobynumber getprotoent",
        b"getpwent getpwnam getpwuid getservbyname getservbyport getservent",
        b"getsockname getsockopt glob gmtime goto grep gt hex if index",
        b"int ioctl join keys kill last lc lcfirst le length link listen",
        b"local localtime lock log lstat lt map mkdir msgctl msgget msgrcv",
        b"msgsnd my ne next no not oct open opendir or ord our pack package",
        b"pipe pop pos print printf prototype push quotemeta qu",
        b"rand read readdir readline readlink readpipe recv redo",
        b"ref rename require reset return reverse rewinddir rindex rmdir",
        b"scalar seek seekdir select semctl semget semop send setgrent",
        b"sethostent setnetent setpgrp setpriority setprotoent setpwent",
        b"setservent setsockopt shift shmctl shmget shmread shmwrite shutdown",
        b"sin sleep socket socketpair sort splice split sprintf sqrt srand",
        b"stat study sub substr symlink syscall sysopen sysread sysseek",
        b"system syswrite tell telldir tie tied time times truncate",
        b"uc ucfirst umask undef unless unlink unpack unshift untie until",
        b"use utime values vec wait waitpid wantarray warn while write",
        b"xor",
        b"given when default break say state UNITCHECK __SUB__ fc",
    )),
]

class TestLexers(unittest.TestCase):
|
|
|
|
def setUp(self):
|
|
self.xite = Xite.xiteFrame
|
|
self.ed = self.xite.ed
|
|
self.ed.ClearAll()
|
|
self.ed.EmptyUndoBuffer()
|
|
|
|
def AsStyled(self, withWindowsLineEnds):
|
|
text = self.ed.Contents()
|
|
data = io.BytesIO()
|
|
prevStyle = -1
|
|
for o in range(self.ed.Length):
|
|
styleNow = self.ed.GetStyleAt(o)
|
|
if styleNow != prevStyle:
|
|
styleBuf = "{%0d}" % styleNow
|
|
data.write(styleBuf.encode('utf-8'))
|
|
prevStyle = styleNow
|
|
data.write(text[o:o+1])
|
|
if withWindowsLineEnds:
|
|
return data.getvalue().replace(b"\n", b"\r\n")
|
|
else:
|
|
return data.getvalue()
|
|
|
|
def LexExample(self, name, lexerName, keywords, fileMode="b"):
|
|
self.ed.ClearAll()
|
|
self.ed.EmptyUndoBuffer()
|
|
self.ed.SetCodePage(65001)
|
|
self.ed.LexerLanguage = lexerName
|
|
mask = 0xff
|
|
for i in range(len(keywords)):
|
|
self.ed.SetKeyWords(i, keywords[i])
|
|
|
|
nameExample = os.path.join("examples", name)
|
|
namePrevious = nameExample +".styled"
|
|
nameNew = nameExample +".new"
|
|
with open(nameExample, "rb") as f:
|
|
prog = f.read()
|
|
if fileMode == "t" and sys.platform == "win32":
|
|
prog = prog.replace(b"\r\n", b"\n")
|
|
BOM = b"\xEF\xBB\xBF"
|
|
if prog.startswith(BOM):
|
|
prog = prog[len(BOM):]
|
|
lenDocument = len(prog)
|
|
self.ed.AddText(lenDocument, prog)
|
|
self.ed.Colourise(0, lenDocument)
|
|
self.assertEquals(self.ed.EndStyled, lenDocument)
|
|
try:
|
|
with open(namePrevious, "rb") as f:
|
|
prevStyled = f.read()
|
|
if fileMode == "t" and sys.platform == "win32":
|
|
prog = prog.replace(b"\r\n", b"\n")
|
|
except EnvironmentError:
|
|
prevStyled = ""
|
|
progStyled = self.AsStyled(fileMode == "t" and sys.platform == "win32")
|
|
if progStyled != prevStyled:
|
|
with open(nameNew, "wb") as f:
|
|
f.write(progStyled)
|
|
print("Incorrect lex for " + name)
|
|
print(progStyled)
|
|
print(prevStyled)
|
|
self.assertEquals(progStyled, prevStyled)
|
|
# The whole file doesn't parse like it did before so don't try line by line
|
|
# as that is likely to fail many times.
|
|
return
|
|
|
|
if fileMode == "b": # "t" files are large and this is a quadratic check
|
|
# Try partial lexes from the start of every line which should all be identical.
|
|
for line in range(self.ed.LineCount):
|
|
lineStart = self.ed.PositionFromLine(line)
|
|
self.ed.StartStyling(lineStart, mask)
|
|
self.assertEquals(self.ed.EndStyled, lineStart)
|
|
self.ed.Colourise(lineStart, lenDocument)
|
|
progStyled = self.AsStyled(fileMode == "t" and sys.platform == "win32")
|
|
if progStyled != prevStyled:
|
|
print("Incorrect partial lex for " + name + " at line " + line)
|
|
with open(nameNew, "wb") as f:
|
|
f.write(progStyled)
|
|
self.assertEquals(progStyled, prevStyled)
|
|
# Give up after one failure
|
|
return
|
|
|
|
# Test lexing just once from beginning to end in text form.
|
|
# This is used for test cases that are too long to be exhaustively tested by lines and
|
|
# may be sensitive to line ends so are tested as if using Unix LF line ends.
|
|
def LexLongCase(self, name, lexerName, keywords, fileMode="b"):
|
|
self.LexExample(name, lexerName, keywords, "t")
|
|
|
|
def testCXX(self):
|
|
self.LexExample("x.cxx", b"cpp", [b"int"])
|
|
|
|
def testPython(self):
|
|
self.LexExample("x.py", b"python",
|
|
[b"class def else for if import in print return while"])
|
|
|
|
def testHTML(self):
|
|
self.LexExample("x.html", b"hypertext", keywordsHTML)
|
|
|
|
def testASP(self):
|
|
self.LexExample("x.asp", b"hypertext", keywordsHTML)
|
|
|
|
def testPHP(self):
|
|
self.LexExample("x.php", b"hypertext", keywordsHTML)
|
|
|
|
def testVB(self):
|
|
self.LexExample("x.vb", b"vb", [b"as dim or string"])
|
|
|
|
def testLua(self):
|
|
self.LexExample("x.lua", b"lua", [b"function end"])
|
|
|
|
def testNim(self):
|
|
self.LexExample("x.nim", b"nim", [b"else end if let proc"])
|
|
|
|
def testRuby(self):
|
|
self.LexExample("x.rb", b"ruby", [b"class def end"])
|
|
|
|
def testPerl(self):
|
|
self.LexExample("x.pl", b"perl", keywordsPerl)
|
|
|
|
def testPerl52(self):
|
|
self.LexLongCase("perl-test-5220delta.pl", b"perl", keywordsPerl)
|
|
|
|
def testPerlPrototypes(self):
|
|
self.LexLongCase("perl-test-sub-prototypes.pl", b"perl", keywordsPerl)
|
|
|
|
def testD(self):
|
|
self.LexExample("x.d", b"d",
|
|
[b"keyword1", b"keyword2", b"", b"keyword4", b"keyword5",
|
|
b"keyword6", b"keyword7"])
|
|
|
|
def testTCL(self):
|
|
self.LexExample("x.tcl", b"tcl", [b"proc set socket vwait"])
|
|
|
|
if __name__ == "__main__":
    # When run as a script, call Xite.main with the name "lexTests".
    Xite.main("lexTests")