mirror of
https://github.com/caddyserver/caddy.git
synced 2025-01-13 22:51:08 -05:00
c12bf4054c
Newlines (\n) can be escaped outside of quoted areas and the newline will be treated as whitespace but not as an actual line break. Escaping newlines inside a quoted area is not necessary, and because quotes trigger literal interpretation of the contents, the escaping backslash will be parsed as a literal backslash, and the newline will not be escaped. Caveat: When a newline is escaped, tokens after it until an unescaped newline will appear to the parser be on the same line as the initial token after the last unescaped newline. This may technically lead to some false line numbers if errors are given, but escaped newlines are counted so that the next token after an unescaped newline is correct. See #2766
232 lines
5.1 KiB
Go
Executable file
232 lines
5.1 KiB
Go
Executable file
// Copyright 2015 Light Code Labs, LLC
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package caddyfile
|
|
|
|
import (
|
|
"log"
|
|
"strings"
|
|
"testing"
|
|
)
|
|
|
|
type lexerTestCase struct {
|
|
input string
|
|
expected []Token
|
|
}
|
|
|
|
func TestLexer(t *testing.T) {
|
|
testCases := []lexerTestCase{
|
|
{
|
|
input: `host:123`,
|
|
expected: []Token{
|
|
{Line: 1, Text: "host:123"},
|
|
},
|
|
},
|
|
{
|
|
input: `host:123
|
|
|
|
directive`,
|
|
expected: []Token{
|
|
{Line: 1, Text: "host:123"},
|
|
{Line: 3, Text: "directive"},
|
|
},
|
|
},
|
|
{
|
|
input: `host:123 {
|
|
directive
|
|
}`,
|
|
expected: []Token{
|
|
{Line: 1, Text: "host:123"},
|
|
{Line: 1, Text: "{"},
|
|
{Line: 2, Text: "directive"},
|
|
{Line: 3, Text: "}"},
|
|
},
|
|
},
|
|
{
|
|
input: `host:123 { directive }`,
|
|
expected: []Token{
|
|
{Line: 1, Text: "host:123"},
|
|
{Line: 1, Text: "{"},
|
|
{Line: 1, Text: "directive"},
|
|
{Line: 1, Text: "}"},
|
|
},
|
|
},
|
|
{
|
|
input: `host:123 {
|
|
#comment
|
|
directive
|
|
# comment
|
|
foobar # another comment
|
|
}`,
|
|
expected: []Token{
|
|
{Line: 1, Text: "host:123"},
|
|
{Line: 1, Text: "{"},
|
|
{Line: 3, Text: "directive"},
|
|
{Line: 5, Text: "foobar"},
|
|
{Line: 6, Text: "}"},
|
|
},
|
|
},
|
|
{
|
|
input: `a "quoted value" b
|
|
foobar`,
|
|
expected: []Token{
|
|
{Line: 1, Text: "a"},
|
|
{Line: 1, Text: "quoted value"},
|
|
{Line: 1, Text: "b"},
|
|
{Line: 2, Text: "foobar"},
|
|
},
|
|
},
|
|
{
|
|
input: `A "quoted \"value\" inside" B`,
|
|
expected: []Token{
|
|
{Line: 1, Text: "A"},
|
|
{Line: 1, Text: `quoted "value" inside`},
|
|
{Line: 1, Text: "B"},
|
|
},
|
|
},
|
|
{
|
|
input: "An escaped \"newline\\\ninside\" quotes",
|
|
expected: []Token{
|
|
{Line: 1, Text: "An"},
|
|
{Line: 1, Text: "escaped"},
|
|
{Line: 1, Text: "newline\\\ninside"},
|
|
{Line: 2, Text: "quotes"},
|
|
},
|
|
},
|
|
{
|
|
input: "An escaped newline\\\noutside quotes",
|
|
expected: []Token{
|
|
{Line: 1, Text: "An"},
|
|
{Line: 1, Text: "escaped"},
|
|
{Line: 1, Text: "newline"},
|
|
{Line: 1, Text: "outside"},
|
|
{Line: 1, Text: "quotes"},
|
|
},
|
|
},
|
|
{
|
|
input: "line1\\\nescaped\nline2\nline3",
|
|
expected: []Token{
|
|
{Line: 1, Text: "line1"},
|
|
{Line: 1, Text: "escaped"},
|
|
{Line: 3, Text: "line2"},
|
|
{Line: 4, Text: "line3"},
|
|
},
|
|
},
|
|
{
|
|
input: "line1\\\nescaped1\\\nescaped2\nline4\nline5",
|
|
expected: []Token{
|
|
{Line: 1, Text: "line1"},
|
|
{Line: 1, Text: "escaped1"},
|
|
{Line: 1, Text: "escaped2"},
|
|
{Line: 4, Text: "line4"},
|
|
{Line: 5, Text: "line5"},
|
|
},
|
|
},
|
|
{
|
|
input: `"unescapable\ in quotes"`,
|
|
expected: []Token{
|
|
{Line: 1, Text: `unescapable\ in quotes`},
|
|
},
|
|
},
|
|
{
|
|
input: `"don't\escape"`,
|
|
expected: []Token{
|
|
{Line: 1, Text: `don't\escape`},
|
|
},
|
|
},
|
|
{
|
|
input: `"don't\\escape"`,
|
|
expected: []Token{
|
|
{Line: 1, Text: `don't\\escape`},
|
|
},
|
|
},
|
|
{
|
|
input: `A "quoted value with line
|
|
break inside" {
|
|
foobar
|
|
}`,
|
|
expected: []Token{
|
|
{Line: 1, Text: "A"},
|
|
{Line: 1, Text: "quoted value with line\n\t\t\t\t\tbreak inside"},
|
|
{Line: 2, Text: "{"},
|
|
{Line: 3, Text: "foobar"},
|
|
{Line: 4, Text: "}"},
|
|
},
|
|
},
|
|
{
|
|
input: `"C:\php\php-cgi.exe"`,
|
|
expected: []Token{
|
|
{Line: 1, Text: `C:\php\php-cgi.exe`},
|
|
},
|
|
},
|
|
{
|
|
input: `empty "" string`,
|
|
expected: []Token{
|
|
{Line: 1, Text: `empty`},
|
|
{Line: 1, Text: ``},
|
|
{Line: 1, Text: `string`},
|
|
},
|
|
},
|
|
{
|
|
input: "skip those\r\nCR characters",
|
|
expected: []Token{
|
|
{Line: 1, Text: "skip"},
|
|
{Line: 1, Text: "those"},
|
|
{Line: 2, Text: "CR"},
|
|
{Line: 2, Text: "characters"},
|
|
},
|
|
},
|
|
{
|
|
input: "\xEF\xBB\xBF:8080", // test with leading byte order mark
|
|
expected: []Token{
|
|
{Line: 1, Text: ":8080"},
|
|
},
|
|
},
|
|
}
|
|
|
|
for i, testCase := range testCases {
|
|
actual := tokenize(testCase.input)
|
|
lexerCompare(t, i, testCase.expected, actual)
|
|
}
|
|
}
|
|
|
|
func tokenize(input string) (tokens []Token) {
|
|
l := lexer{}
|
|
if err := l.load(strings.NewReader(input)); err != nil {
|
|
log.Printf("[ERROR] load failed: %v", err)
|
|
}
|
|
for l.next() {
|
|
tokens = append(tokens, l.token)
|
|
}
|
|
return
|
|
}
|
|
|
|
func lexerCompare(t *testing.T, n int, expected, actual []Token) {
|
|
if len(expected) != len(actual) {
|
|
t.Errorf("Test case %d: expected %d token(s) but got %d", n, len(expected), len(actual))
|
|
}
|
|
|
|
for i := 0; i < len(actual) && i < len(expected); i++ {
|
|
if actual[i].Line != expected[i].Line {
|
|
t.Errorf("Test case %d token %d ('%s'): expected line %d but was line %d",
|
|
n, i, expected[i].Text, expected[i].Line, actual[i].Line)
|
|
break
|
|
}
|
|
if actual[i].Text != expected[i].Text {
|
|
t.Errorf("Test case %d token %d: expected text '%s' but was '%s'",
|
|
n, i, expected[i].Text, actual[i].Text)
|
|
break
|
|
}
|
|
}
|
|
}
|