263 lines
6.2 KiB
Go
263 lines
6.2 KiB
Go
package scanner_test
|
||
|
||
import (
|
||
"fmt"
|
||
"math/rand"
|
||
"strings"
|
||
"testing"
|
||
"time"
|
||
|
||
"github.com/d5/tengo/assert"
|
||
"github.com/d5/tengo/scanner"
|
||
"github.com/d5/tengo/source"
|
||
"github.com/d5/tengo/token"
|
||
)
|
||
|
||
// testFileSet is the package-level file set used by these tests; scanExpect
// adds one file to it for every input it scans.
var testFileSet = source.NewFileSet()
|
||
|
||
type scanResult struct {
|
||
Token token.Token
|
||
Literal string
|
||
Line int
|
||
Column int
|
||
}
|
||
|
||
func TestScanner_Scan(t *testing.T) {
|
||
var testCases = [...]struct {
|
||
token token.Token
|
||
literal string
|
||
}{
|
||
{token.Comment, "/* a comment */"},
|
||
{token.Comment, "// a comment \n"},
|
||
{token.Comment, "/*\r*/"},
|
||
{token.Comment, "/**\r/*/"},
|
||
{token.Comment, "/**\r\r/*/"},
|
||
{token.Comment, "//\r\n"},
|
||
{token.Ident, "foobar"},
|
||
{token.Ident, "a۰۱۸"},
|
||
{token.Ident, "foo६४"},
|
||
{token.Ident, "bar9876"},
|
||
{token.Ident, "ŝ"},
|
||
{token.Ident, "ŝfoo"},
|
||
{token.Int, "0"},
|
||
{token.Int, "1"},
|
||
{token.Int, "123456789012345678890"},
|
||
{token.Int, "01234567"},
|
||
{token.Int, "0xcafebabe"},
|
||
{token.Float, "0."},
|
||
{token.Float, ".0"},
|
||
{token.Float, "3.14159265"},
|
||
{token.Float, "1e0"},
|
||
{token.Float, "1e+100"},
|
||
{token.Float, "1e-100"},
|
||
{token.Float, "2.71828e-1000"},
|
||
{token.Char, "'a'"},
|
||
{token.Char, "'\\000'"},
|
||
{token.Char, "'\\xFF'"},
|
||
{token.Char, "'\\uff16'"},
|
||
{token.Char, "'\\U0000ff16'"},
|
||
{token.String, "`foobar`"},
|
||
{token.String, "`" + `foo
|
||
bar` +
|
||
"`",
|
||
},
|
||
{token.String, "`\r`"},
|
||
{token.String, "`foo\r\nbar`"},
|
||
{token.Add, "+"},
|
||
{token.Sub, "-"},
|
||
{token.Mul, "*"},
|
||
{token.Quo, "/"},
|
||
{token.Rem, "%"},
|
||
{token.And, "&"},
|
||
{token.Or, "|"},
|
||
{token.Xor, "^"},
|
||
{token.Shl, "<<"},
|
||
{token.Shr, ">>"},
|
||
{token.AndNot, "&^"},
|
||
{token.AddAssign, "+="},
|
||
{token.SubAssign, "-="},
|
||
{token.MulAssign, "*="},
|
||
{token.QuoAssign, "/="},
|
||
{token.RemAssign, "%="},
|
||
{token.AndAssign, "&="},
|
||
{token.OrAssign, "|="},
|
||
{token.XorAssign, "^="},
|
||
{token.ShlAssign, "<<="},
|
||
{token.ShrAssign, ">>="},
|
||
{token.AndNotAssign, "&^="},
|
||
{token.LAnd, "&&"},
|
||
{token.LOr, "||"},
|
||
{token.Inc, "++"},
|
||
{token.Dec, "--"},
|
||
{token.Equal, "=="},
|
||
{token.Less, "<"},
|
||
{token.Greater, ">"},
|
||
{token.Assign, "="},
|
||
{token.Not, "!"},
|
||
{token.NotEqual, "!="},
|
||
{token.LessEq, "<="},
|
||
{token.GreaterEq, ">="},
|
||
{token.Define, ":="},
|
||
{token.Ellipsis, "..."},
|
||
{token.LParen, "("},
|
||
{token.LBrack, "["},
|
||
{token.LBrace, "{"},
|
||
{token.Comma, ","},
|
||
{token.Period, "."},
|
||
{token.RParen, ")"},
|
||
{token.RBrack, "]"},
|
||
{token.RBrace, "}"},
|
||
{token.Semicolon, ";"},
|
||
{token.Colon, ":"},
|
||
{token.Break, "break"},
|
||
{token.Case, "case"},
|
||
{token.Continue, "continue"},
|
||
{token.Default, "default"},
|
||
{token.Else, "else"},
|
||
{token.For, "for"},
|
||
{token.Func, "func"},
|
||
{token.If, "if"},
|
||
{token.Return, "return"},
|
||
{token.Switch, "switch"},
|
||
{token.Var, "var"},
|
||
}
|
||
|
||
// combine
|
||
var lines []string
|
||
var lineSum int
|
||
lineNos := make([]int, len(testCases))
|
||
columnNos := make([]int, len(testCases))
|
||
for i, tc := range testCases {
|
||
// add 0-2 lines before each test case
|
||
emptyLines := rand.Intn(3)
|
||
for j := 0; j < emptyLines; j++ {
|
||
lines = append(lines, strings.Repeat(" ", rand.Intn(10)))
|
||
}
|
||
|
||
// add test case line with some whitespaces around it
|
||
emptyColumns := rand.Intn(10)
|
||
lines = append(lines, fmt.Sprintf("%s%s%s",
|
||
strings.Repeat(" ", emptyColumns),
|
||
tc.literal,
|
||
strings.Repeat(" ", rand.Intn(10))))
|
||
|
||
lineNos[i] = lineSum + emptyLines + 1
|
||
lineSum += emptyLines + countLines(tc.literal)
|
||
columnNos[i] = emptyColumns + 1
|
||
}
|
||
|
||
// expected results
|
||
var expected []scanResult
|
||
var expectedSkipComments []scanResult
|
||
for i, tc := range testCases {
|
||
// expected literal
|
||
var expectedLiteral string
|
||
switch tc.token {
|
||
case token.Comment:
|
||
// strip CRs in comments
|
||
expectedLiteral = string(scanner.StripCR([]byte(tc.literal), tc.literal[1] == '*'))
|
||
|
||
//-style comment literal doesn't contain newline
|
||
if expectedLiteral[1] == '/' {
|
||
expectedLiteral = expectedLiteral[:len(expectedLiteral)-1]
|
||
}
|
||
case token.Ident:
|
||
expectedLiteral = tc.literal
|
||
case token.Semicolon:
|
||
expectedLiteral = ";"
|
||
default:
|
||
if tc.token.IsLiteral() {
|
||
// strip CRs in raw string
|
||
expectedLiteral = tc.literal
|
||
if expectedLiteral[0] == '`' {
|
||
expectedLiteral = string(scanner.StripCR([]byte(expectedLiteral), false))
|
||
}
|
||
} else if tc.token.IsKeyword() {
|
||
expectedLiteral = tc.literal
|
||
}
|
||
}
|
||
|
||
res := scanResult{
|
||
Token: tc.token,
|
||
Literal: expectedLiteral,
|
||
Line: lineNos[i],
|
||
Column: columnNos[i],
|
||
}
|
||
|
||
expected = append(expected, res)
|
||
if tc.token != token.Comment {
|
||
expectedSkipComments = append(expectedSkipComments, res)
|
||
}
|
||
}
|
||
|
||
scanExpect(t, strings.Join(lines, "\n"), scanner.ScanComments|scanner.DontInsertSemis, expected...)
|
||
scanExpect(t, strings.Join(lines, "\n"), scanner.DontInsertSemis, expectedSkipComments...)
|
||
}
|
||
|
||
func TestStripCR(t *testing.T) {
|
||
for _, tc := range []struct {
|
||
input string
|
||
expect string
|
||
}{
|
||
{"//\n", "//\n"},
|
||
{"//\r\n", "//\n"},
|
||
{"//\r\r\r\n", "//\n"},
|
||
{"//\r*\r/\r\n", "//*/\n"},
|
||
{"/**/", "/**/"},
|
||
{"/*\r/*/", "/*/*/"},
|
||
{"/*\r*/", "/**/"},
|
||
{"/**\r/*/", "/**\r/*/"},
|
||
{"/*\r/\r*\r/*/", "/*/*\r/*/"},
|
||
{"/*\r\r\r\r*/", "/**/"},
|
||
} {
|
||
actual := string(scanner.StripCR([]byte(tc.input), len(tc.input) >= 2 && tc.input[1] == '*'))
|
||
assert.Equal(t, tc.expect, actual)
|
||
}
|
||
}
|
||
|
||
func scanExpect(t *testing.T, input string, mode scanner.Mode, expected ...scanResult) bool {
|
||
testFile := testFileSet.AddFile("", testFileSet.Base(), len(input))
|
||
|
||
s := scanner.NewScanner(
|
||
testFile,
|
||
[]byte(input),
|
||
func(_ source.FilePos, msg string) { assert.Fail(t, msg) },
|
||
mode)
|
||
|
||
for idx, e := range expected {
|
||
tok, literal, pos := s.Scan()
|
||
|
||
filePos := testFile.Position(pos)
|
||
|
||
if !assert.Equal(t, e.Token, tok, "[%d] expected: %s, actual: %s", idx, e.Token.String(), tok.String()) ||
|
||
!assert.Equal(t, e.Literal, literal) ||
|
||
!assert.Equal(t, e.Line, filePos.Line) ||
|
||
!assert.Equal(t, e.Column, filePos.Column) {
|
||
return false
|
||
}
|
||
}
|
||
|
||
tok, _, _ := s.Scan()
|
||
assert.Equal(t, token.EOF, tok, "more tokens left")
|
||
|
||
return assert.Equal(t, 0, s.ErrorCount())
|
||
}
|
||
|
||
// countLines returns the number of lines s occupies: 0 for the empty string,
// otherwise one more than the number of '\n' bytes in s (so a trailing
// newline counts as starting a further line).
func countLines(s string) int {
	if s == "" {
		return 0
	}

	return strings.Count(s, "\n") + 1
}
|
||
|
||
// init seeds math/rand's global generator from the current wall-clock time,
// so the random blank lines and padding used by TestScanner_Scan differ from
// run to run.
func init() {
	seed := time.Now().UnixNano()
	rand.Seed(seed)
}
|