goparsify/literals.go
2017-08-08 20:52:25 +10:00

174 lines
3.2 KiB
Go

package goparsify
import (
"bytes"
"strconv"
"unicode/utf8"
)
func StringLit(allowedQuotes string) Parser {
return NewParser("string literal", func(ps *State) Node {
ps.AutoWS()
for i := 0; i < len(allowedQuotes); i++ {
if ps.Input[ps.Pos] == allowedQuotes[i] {
}
}
if !stringContainsByte(allowedQuotes, ps.Input[ps.Pos]) {
ps.ErrorHere(allowedQuotes)
return Node{}
}
quote := ps.Input[ps.Pos]
var end int = ps.Pos + 1
inputLen := len(ps.Input)
var buf *bytes.Buffer
for end < inputLen {
switch ps.Input[end] {
case '\\':
if end+1 >= inputLen {
ps.ErrorHere(string(quote))
return Node{}
}
if buf == nil {
buf = bytes.NewBufferString(ps.Input[ps.Pos+1 : end])
}
c := ps.Input[end+1]
if c == 'u' {
if end+6 >= inputLen {
ps.Error.Expected = "[a-f0-9]{4}"
ps.Error.pos = end + 2
return Node{}
}
r, ok := unhex(ps.Input[end+2 : end+6])
if !ok {
ps.Error.Expected = "[a-f0-9]"
ps.Error.pos = end + 2
return Node{}
}
buf.WriteRune(r)
end += 6
} else {
buf.WriteByte(c)
end += 2
}
case quote:
if buf == nil {
result := ps.Input[ps.Pos+1 : end]
ps.Pos = end + 1
return Node{Result: result}
}
ps.Pos = end + 1
return Node{Result: buf.String()}
default:
if buf == nil {
if ps.Input[end] < 127 {
end++
} else {
_, w := utf8.DecodeRuneInString(ps.Input[end:])
end += w
}
} else {
r, w := utf8.DecodeRuneInString(ps.Input[end:])
end += w
buf.WriteRune(r)
}
}
}
ps.ErrorHere(string(quote))
return Node{}
})
}
func NumberLit() Parser {
return NewParser("number literal", func(ps *State) Node {
ps.AutoWS()
end := ps.Pos
float := false
inputLen := len(ps.Input)
if end < inputLen && (ps.Input[end] == '-' || ps.Input[end] == '+') {
end++
}
for end < inputLen && ps.Input[end] >= '0' && ps.Input[end] <= '9' {
end++
}
if end < inputLen && ps.Input[end] == '.' {
float = true
end++
}
for end < inputLen && ps.Input[end] >= '0' && ps.Input[end] <= '9' {
end++
}
if end < inputLen && (ps.Input[end] == 'e' || ps.Input[end] == 'E') {
end++
float = true
if end < inputLen && (ps.Input[end] == '-' || ps.Input[end] == '+') {
end++
}
for end < inputLen && ps.Input[end] >= '0' && ps.Input[end] <= '9' {
end++
}
}
if end == ps.Pos {
ps.ErrorHere("number")
return Node{}
}
var result interface{}
var err error
if float {
result, err = strconv.ParseFloat(ps.Input[ps.Pos:end], 10)
} else {
result, err = strconv.ParseInt(ps.Input[ps.Pos:end], 10, 64)
}
if err != nil {
ps.ErrorHere("number")
return Node{}
}
ps.Pos = end
return Node{Result: result}
})
}
func stringContainsByte(s string, b byte) bool {
for i := 0; i < len(s); i++ {
if b == s[i] {
return true
}
}
return false
}
func unhex(b string) (v rune, ok bool) {
for _, c := range b {
v <<= 4
switch {
case '0' <= c && c <= '9':
v |= c - '0'
case 'a' <= c && c <= 'f':
v |= c - 'a' + 10
case 'A' <= c && c <= 'F':
v |= c - 'A' + 10
default:
return 0, false
}
}
return v, true
}