forked from Shiloh/githaven
836 lines
17 KiB
Go
836 lines
17 KiB
Go
|
// Package cascadia is an implementation of CSS selectors.
|
||
|
package cascadia
|
||
|
|
||
|
import (
|
||
|
"errors"
|
||
|
"fmt"
|
||
|
"regexp"
|
||
|
"strconv"
|
||
|
"strings"
|
||
|
|
||
|
"golang.org/x/net/html"
|
||
|
)
|
||
|
|
||
|
// parser holds the state of a scan over a CSS selector string.
type parser struct {
	// s is the complete selector source text.
	s string
	// i is the byte offset in s of the next character to be read.
	i int
}
|
||
|
|
||
|
// parseEscape parses a backslash escape.
|
||
|
func (p *parser) parseEscape() (result string, err error) {
|
||
|
if len(p.s) < p.i+2 || p.s[p.i] != '\\' {
|
||
|
return "", errors.New("invalid escape sequence")
|
||
|
}
|
||
|
|
||
|
start := p.i + 1
|
||
|
c := p.s[start]
|
||
|
switch {
|
||
|
case c == '\r' || c == '\n' || c == '\f':
|
||
|
return "", errors.New("escaped line ending outside string")
|
||
|
case hexDigit(c):
|
||
|
// unicode escape (hex)
|
||
|
var i int
|
||
|
for i = start; i < p.i+6 && i < len(p.s) && hexDigit(p.s[i]); i++ {
|
||
|
// empty
|
||
|
}
|
||
|
v, _ := strconv.ParseUint(p.s[start:i], 16, 21)
|
||
|
if len(p.s) > i {
|
||
|
switch p.s[i] {
|
||
|
case '\r':
|
||
|
i++
|
||
|
if len(p.s) > i && p.s[i] == '\n' {
|
||
|
i++
|
||
|
}
|
||
|
case ' ', '\t', '\n', '\f':
|
||
|
i++
|
||
|
}
|
||
|
}
|
||
|
p.i = i
|
||
|
return string(rune(v)), nil
|
||
|
}
|
||
|
|
||
|
// Return the literal character after the backslash.
|
||
|
result = p.s[start : start+1]
|
||
|
p.i += 2
|
||
|
return result, nil
|
||
|
}
|
||
|
|
||
|
// hexDigit reports whether c is an ASCII hexadecimal digit
// (0-9, a-f or A-F).
func hexDigit(c byte) bool {
	switch {
	case c >= '0' && c <= '9':
		return true
	case c >= 'a' && c <= 'f':
		return true
	case c >= 'A' && c <= 'F':
		return true
	}
	return false
}
|
||
|
|
||
|
// nameStart reports whether the byte c may begin an identifier: an ASCII
// letter, an underscore, or any byte above 127. A leading hyphen and escape
// sequences are not handled here.
func nameStart(c byte) bool {
	switch {
	case c == '_', c > 127:
		return true
	case c >= 'a' && c <= 'z', c >= 'A' && c <= 'Z':
		return true
	}
	return false
}
|
||
|
|
||
|
// nameChar reports whether the byte c may appear inside an identifier: an
// ASCII letter or digit, an underscore, a hyphen, or any byte above 127.
// Escape sequences are not handled here.
func nameChar(c byte) bool {
	switch {
	case c == '_', c == '-', c > 127:
		return true
	case c >= '0' && c <= '9':
		return true
	case c >= 'a' && c <= 'z', c >= 'A' && c <= 'Z':
		return true
	}
	return false
}
|
||
|
|
||
|
// parseIdentifier parses an identifier.
|
||
|
func (p *parser) parseIdentifier() (result string, err error) {
|
||
|
startingDash := false
|
||
|
if len(p.s) > p.i && p.s[p.i] == '-' {
|
||
|
startingDash = true
|
||
|
p.i++
|
||
|
}
|
||
|
|
||
|
if len(p.s) <= p.i {
|
||
|
return "", errors.New("expected identifier, found EOF instead")
|
||
|
}
|
||
|
|
||
|
if c := p.s[p.i]; !(nameStart(c) || c == '\\') {
|
||
|
return "", fmt.Errorf("expected identifier, found %c instead", c)
|
||
|
}
|
||
|
|
||
|
result, err = p.parseName()
|
||
|
if startingDash && err == nil {
|
||
|
result = "-" + result
|
||
|
}
|
||
|
return
|
||
|
}
|
||
|
|
||
|
// parseName parses a name (which is like an identifier, but doesn't have
|
||
|
// extra restrictions on the first character).
|
||
|
func (p *parser) parseName() (result string, err error) {
|
||
|
i := p.i
|
||
|
loop:
|
||
|
for i < len(p.s) {
|
||
|
c := p.s[i]
|
||
|
switch {
|
||
|
case nameChar(c):
|
||
|
start := i
|
||
|
for i < len(p.s) && nameChar(p.s[i]) {
|
||
|
i++
|
||
|
}
|
||
|
result += p.s[start:i]
|
||
|
case c == '\\':
|
||
|
p.i = i
|
||
|
val, err := p.parseEscape()
|
||
|
if err != nil {
|
||
|
return "", err
|
||
|
}
|
||
|
i = p.i
|
||
|
result += val
|
||
|
default:
|
||
|
break loop
|
||
|
}
|
||
|
}
|
||
|
|
||
|
if result == "" {
|
||
|
return "", errors.New("expected name, found EOF instead")
|
||
|
}
|
||
|
|
||
|
p.i = i
|
||
|
return result, nil
|
||
|
}
|
||
|
|
||
|
// parseString parses a single- or double-quoted string.
|
||
|
func (p *parser) parseString() (result string, err error) {
|
||
|
i := p.i
|
||
|
if len(p.s) < i+2 {
|
||
|
return "", errors.New("expected string, found EOF instead")
|
||
|
}
|
||
|
|
||
|
quote := p.s[i]
|
||
|
i++
|
||
|
|
||
|
loop:
|
||
|
for i < len(p.s) {
|
||
|
switch p.s[i] {
|
||
|
case '\\':
|
||
|
if len(p.s) > i+1 {
|
||
|
switch c := p.s[i+1]; c {
|
||
|
case '\r':
|
||
|
if len(p.s) > i+2 && p.s[i+2] == '\n' {
|
||
|
i += 3
|
||
|
continue loop
|
||
|
}
|
||
|
fallthrough
|
||
|
case '\n', '\f':
|
||
|
i += 2
|
||
|
continue loop
|
||
|
}
|
||
|
}
|
||
|
p.i = i
|
||
|
val, err := p.parseEscape()
|
||
|
if err != nil {
|
||
|
return "", err
|
||
|
}
|
||
|
i = p.i
|
||
|
result += val
|
||
|
case quote:
|
||
|
break loop
|
||
|
case '\r', '\n', '\f':
|
||
|
return "", errors.New("unexpected end of line in string")
|
||
|
default:
|
||
|
start := i
|
||
|
for i < len(p.s) {
|
||
|
if c := p.s[i]; c == quote || c == '\\' || c == '\r' || c == '\n' || c == '\f' {
|
||
|
break
|
||
|
}
|
||
|
i++
|
||
|
}
|
||
|
result += p.s[start:i]
|
||
|
}
|
||
|
}
|
||
|
|
||
|
if i >= len(p.s) {
|
||
|
return "", errors.New("EOF in string")
|
||
|
}
|
||
|
|
||
|
// Consume the final quote.
|
||
|
i++
|
||
|
|
||
|
p.i = i
|
||
|
return result, nil
|
||
|
}
|
||
|
|
||
|
// parseRegex parses a regular expression; the end is defined by encountering an
|
||
|
// unmatched closing ')' or ']' which is not consumed
|
||
|
func (p *parser) parseRegex() (rx *regexp.Regexp, err error) {
|
||
|
i := p.i
|
||
|
if len(p.s) < i+2 {
|
||
|
return nil, errors.New("expected regular expression, found EOF instead")
|
||
|
}
|
||
|
|
||
|
// number of open parens or brackets;
|
||
|
// when it becomes negative, finished parsing regex
|
||
|
open := 0
|
||
|
|
||
|
loop:
|
||
|
for i < len(p.s) {
|
||
|
switch p.s[i] {
|
||
|
case '(', '[':
|
||
|
open++
|
||
|
case ')', ']':
|
||
|
open--
|
||
|
if open < 0 {
|
||
|
break loop
|
||
|
}
|
||
|
}
|
||
|
i++
|
||
|
}
|
||
|
|
||
|
if i >= len(p.s) {
|
||
|
return nil, errors.New("EOF in regular expression")
|
||
|
}
|
||
|
rx, err = regexp.Compile(p.s[p.i:i])
|
||
|
p.i = i
|
||
|
return rx, err
|
||
|
}
|
||
|
|
||
|
// skipWhitespace consumes whitespace characters and comments.
|
||
|
// It returns true if there was actually anything to skip.
|
||
|
func (p *parser) skipWhitespace() bool {
|
||
|
i := p.i
|
||
|
for i < len(p.s) {
|
||
|
switch p.s[i] {
|
||
|
case ' ', '\t', '\r', '\n', '\f':
|
||
|
i++
|
||
|
continue
|
||
|
case '/':
|
||
|
if strings.HasPrefix(p.s[i:], "/*") {
|
||
|
end := strings.Index(p.s[i+len("/*"):], "*/")
|
||
|
if end != -1 {
|
||
|
i += end + len("/**/")
|
||
|
continue
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
break
|
||
|
}
|
||
|
|
||
|
if i > p.i {
|
||
|
p.i = i
|
||
|
return true
|
||
|
}
|
||
|
|
||
|
return false
|
||
|
}
|
||
|
|
||
|
// consumeParenthesis consumes an opening parenthesis and any following
|
||
|
// whitespace. It returns true if there was actually a parenthesis to skip.
|
||
|
func (p *parser) consumeParenthesis() bool {
|
||
|
if p.i < len(p.s) && p.s[p.i] == '(' {
|
||
|
p.i++
|
||
|
p.skipWhitespace()
|
||
|
return true
|
||
|
}
|
||
|
return false
|
||
|
}
|
||
|
|
||
|
// consumeClosingParenthesis consumes a closing parenthesis and any preceding
|
||
|
// whitespace. It returns true if there was actually a parenthesis to skip.
|
||
|
func (p *parser) consumeClosingParenthesis() bool {
|
||
|
i := p.i
|
||
|
p.skipWhitespace()
|
||
|
if p.i < len(p.s) && p.s[p.i] == ')' {
|
||
|
p.i++
|
||
|
return true
|
||
|
}
|
||
|
p.i = i
|
||
|
return false
|
||
|
}
|
||
|
|
||
|
// parseTypeSelector parses a type selector (one that matches by tag name).
|
||
|
func (p *parser) parseTypeSelector() (result Selector, err error) {
|
||
|
tag, err := p.parseIdentifier()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
|
||
|
return typeSelector(tag), nil
|
||
|
}
|
||
|
|
||
|
// parseIDSelector parses a selector that matches by id attribute.
|
||
|
func (p *parser) parseIDSelector() (Selector, error) {
|
||
|
if p.i >= len(p.s) {
|
||
|
return nil, fmt.Errorf("expected id selector (#id), found EOF instead")
|
||
|
}
|
||
|
if p.s[p.i] != '#' {
|
||
|
return nil, fmt.Errorf("expected id selector (#id), found '%c' instead", p.s[p.i])
|
||
|
}
|
||
|
|
||
|
p.i++
|
||
|
id, err := p.parseName()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
|
||
|
return attributeEqualsSelector("id", id), nil
|
||
|
}
|
||
|
|
||
|
// parseClassSelector parses a selector that matches by class attribute.
|
||
|
func (p *parser) parseClassSelector() (Selector, error) {
|
||
|
if p.i >= len(p.s) {
|
||
|
return nil, fmt.Errorf("expected class selector (.class), found EOF instead")
|
||
|
}
|
||
|
if p.s[p.i] != '.' {
|
||
|
return nil, fmt.Errorf("expected class selector (.class), found '%c' instead", p.s[p.i])
|
||
|
}
|
||
|
|
||
|
p.i++
|
||
|
class, err := p.parseIdentifier()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
|
||
|
return attributeIncludesSelector("class", class), nil
|
||
|
}
|
||
|
|
||
|
// parseAttributeSelector parses a selector that matches by attribute value.
|
||
|
func (p *parser) parseAttributeSelector() (Selector, error) {
|
||
|
if p.i >= len(p.s) {
|
||
|
return nil, fmt.Errorf("expected attribute selector ([attribute]), found EOF instead")
|
||
|
}
|
||
|
if p.s[p.i] != '[' {
|
||
|
return nil, fmt.Errorf("expected attribute selector ([attribute]), found '%c' instead", p.s[p.i])
|
||
|
}
|
||
|
|
||
|
p.i++
|
||
|
p.skipWhitespace()
|
||
|
key, err := p.parseIdentifier()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
|
||
|
p.skipWhitespace()
|
||
|
if p.i >= len(p.s) {
|
||
|
return nil, errors.New("unexpected EOF in attribute selector")
|
||
|
}
|
||
|
|
||
|
if p.s[p.i] == ']' {
|
||
|
p.i++
|
||
|
return attributeExistsSelector(key), nil
|
||
|
}
|
||
|
|
||
|
if p.i+2 >= len(p.s) {
|
||
|
return nil, errors.New("unexpected EOF in attribute selector")
|
||
|
}
|
||
|
|
||
|
op := p.s[p.i : p.i+2]
|
||
|
if op[0] == '=' {
|
||
|
op = "="
|
||
|
} else if op[1] != '=' {
|
||
|
return nil, fmt.Errorf(`expected equality operator, found "%s" instead`, op)
|
||
|
}
|
||
|
p.i += len(op)
|
||
|
|
||
|
p.skipWhitespace()
|
||
|
if p.i >= len(p.s) {
|
||
|
return nil, errors.New("unexpected EOF in attribute selector")
|
||
|
}
|
||
|
var val string
|
||
|
var rx *regexp.Regexp
|
||
|
if op == "#=" {
|
||
|
rx, err = p.parseRegex()
|
||
|
} else {
|
||
|
switch p.s[p.i] {
|
||
|
case '\'', '"':
|
||
|
val, err = p.parseString()
|
||
|
default:
|
||
|
val, err = p.parseIdentifier()
|
||
|
}
|
||
|
}
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
|
||
|
p.skipWhitespace()
|
||
|
if p.i >= len(p.s) {
|
||
|
return nil, errors.New("unexpected EOF in attribute selector")
|
||
|
}
|
||
|
if p.s[p.i] != ']' {
|
||
|
return nil, fmt.Errorf("expected ']', found '%c' instead", p.s[p.i])
|
||
|
}
|
||
|
p.i++
|
||
|
|
||
|
switch op {
|
||
|
case "=":
|
||
|
return attributeEqualsSelector(key, val), nil
|
||
|
case "!=":
|
||
|
return attributeNotEqualSelector(key, val), nil
|
||
|
case "~=":
|
||
|
return attributeIncludesSelector(key, val), nil
|
||
|
case "|=":
|
||
|
return attributeDashmatchSelector(key, val), nil
|
||
|
case "^=":
|
||
|
return attributePrefixSelector(key, val), nil
|
||
|
case "$=":
|
||
|
return attributeSuffixSelector(key, val), nil
|
||
|
case "*=":
|
||
|
return attributeSubstringSelector(key, val), nil
|
||
|
case "#=":
|
||
|
return attributeRegexSelector(key, rx), nil
|
||
|
}
|
||
|
|
||
|
return nil, fmt.Errorf("attribute operator %q is not supported", op)
|
||
|
}
|
||
|
|
||
|
// Sentinel errors reported by the pseudoclass parser for missing or
// unbalanced parentheses.
var (
	errExpectedParenthesis        = errors.New("expected '(' but didn't find it")
	errExpectedClosingParenthesis = errors.New("expected ')' but didn't find it")
	errUnmatchedParenthesis       = errors.New("unmatched '('")
)
|
||
|
|
||
|
// parsePseudoclassSelector parses a pseudoclass selector like :not(p).
|
||
|
func (p *parser) parsePseudoclassSelector() (Selector, error) {
|
||
|
if p.i >= len(p.s) {
|
||
|
return nil, fmt.Errorf("expected pseudoclass selector (:pseudoclass), found EOF instead")
|
||
|
}
|
||
|
if p.s[p.i] != ':' {
|
||
|
return nil, fmt.Errorf("expected attribute selector (:pseudoclass), found '%c' instead", p.s[p.i])
|
||
|
}
|
||
|
|
||
|
p.i++
|
||
|
name, err := p.parseIdentifier()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
name = toLowerASCII(name)
|
||
|
|
||
|
switch name {
|
||
|
case "not", "has", "haschild":
|
||
|
if !p.consumeParenthesis() {
|
||
|
return nil, errExpectedParenthesis
|
||
|
}
|
||
|
sel, parseErr := p.parseSelectorGroup()
|
||
|
if parseErr != nil {
|
||
|
return nil, parseErr
|
||
|
}
|
||
|
if !p.consumeClosingParenthesis() {
|
||
|
return nil, errExpectedClosingParenthesis
|
||
|
}
|
||
|
|
||
|
switch name {
|
||
|
case "not":
|
||
|
return negatedSelector(sel), nil
|
||
|
case "has":
|
||
|
return hasDescendantSelector(sel), nil
|
||
|
case "haschild":
|
||
|
return hasChildSelector(sel), nil
|
||
|
}
|
||
|
|
||
|
case "contains", "containsown":
|
||
|
if !p.consumeParenthesis() {
|
||
|
return nil, errExpectedParenthesis
|
||
|
}
|
||
|
if p.i == len(p.s) {
|
||
|
return nil, errUnmatchedParenthesis
|
||
|
}
|
||
|
var val string
|
||
|
switch p.s[p.i] {
|
||
|
case '\'', '"':
|
||
|
val, err = p.parseString()
|
||
|
default:
|
||
|
val, err = p.parseIdentifier()
|
||
|
}
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
val = strings.ToLower(val)
|
||
|
p.skipWhitespace()
|
||
|
if p.i >= len(p.s) {
|
||
|
return nil, errors.New("unexpected EOF in pseudo selector")
|
||
|
}
|
||
|
if !p.consumeClosingParenthesis() {
|
||
|
return nil, errExpectedClosingParenthesis
|
||
|
}
|
||
|
|
||
|
switch name {
|
||
|
case "contains":
|
||
|
return textSubstrSelector(val), nil
|
||
|
case "containsown":
|
||
|
return ownTextSubstrSelector(val), nil
|
||
|
}
|
||
|
|
||
|
case "matches", "matchesown":
|
||
|
if !p.consumeParenthesis() {
|
||
|
return nil, errExpectedParenthesis
|
||
|
}
|
||
|
rx, err := p.parseRegex()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
if p.i >= len(p.s) {
|
||
|
return nil, errors.New("unexpected EOF in pseudo selector")
|
||
|
}
|
||
|
if !p.consumeClosingParenthesis() {
|
||
|
return nil, errExpectedClosingParenthesis
|
||
|
}
|
||
|
|
||
|
switch name {
|
||
|
case "matches":
|
||
|
return textRegexSelector(rx), nil
|
||
|
case "matchesown":
|
||
|
return ownTextRegexSelector(rx), nil
|
||
|
}
|
||
|
|
||
|
case "nth-child", "nth-last-child", "nth-of-type", "nth-last-of-type":
|
||
|
if !p.consumeParenthesis() {
|
||
|
return nil, errExpectedParenthesis
|
||
|
}
|
||
|
a, b, err := p.parseNth()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
if !p.consumeClosingParenthesis() {
|
||
|
return nil, errExpectedClosingParenthesis
|
||
|
}
|
||
|
if a == 0 {
|
||
|
switch name {
|
||
|
case "nth-child":
|
||
|
return simpleNthChildSelector(b, false), nil
|
||
|
case "nth-of-type":
|
||
|
return simpleNthChildSelector(b, true), nil
|
||
|
case "nth-last-child":
|
||
|
return simpleNthLastChildSelector(b, false), nil
|
||
|
case "nth-last-of-type":
|
||
|
return simpleNthLastChildSelector(b, true), nil
|
||
|
}
|
||
|
}
|
||
|
return nthChildSelector(a, b,
|
||
|
name == "nth-last-child" || name == "nth-last-of-type",
|
||
|
name == "nth-of-type" || name == "nth-last-of-type"),
|
||
|
nil
|
||
|
|
||
|
case "first-child":
|
||
|
return simpleNthChildSelector(1, false), nil
|
||
|
case "last-child":
|
||
|
return simpleNthLastChildSelector(1, false), nil
|
||
|
case "first-of-type":
|
||
|
return simpleNthChildSelector(1, true), nil
|
||
|
case "last-of-type":
|
||
|
return simpleNthLastChildSelector(1, true), nil
|
||
|
case "only-child":
|
||
|
return onlyChildSelector(false), nil
|
||
|
case "only-of-type":
|
||
|
return onlyChildSelector(true), nil
|
||
|
case "input":
|
||
|
return inputSelector, nil
|
||
|
case "empty":
|
||
|
return emptyElementSelector, nil
|
||
|
case "root":
|
||
|
return rootSelector, nil
|
||
|
}
|
||
|
|
||
|
return nil, fmt.Errorf("unknown pseudoclass :%s", name)
|
||
|
}
|
||
|
|
||
|
// parseInteger parses a decimal integer.
|
||
|
func (p *parser) parseInteger() (int, error) {
|
||
|
i := p.i
|
||
|
start := i
|
||
|
for i < len(p.s) && '0' <= p.s[i] && p.s[i] <= '9' {
|
||
|
i++
|
||
|
}
|
||
|
if i == start {
|
||
|
return 0, errors.New("expected integer, but didn't find it")
|
||
|
}
|
||
|
p.i = i
|
||
|
|
||
|
val, err := strconv.Atoi(p.s[start:i])
|
||
|
if err != nil {
|
||
|
return 0, err
|
||
|
}
|
||
|
|
||
|
return val, nil
|
||
|
}
|
||
|
|
||
|
// parseNth parses the argument for :nth-child (normally of the form an+b).
|
||
|
func (p *parser) parseNth() (a, b int, err error) {
|
||
|
// initial state
|
||
|
if p.i >= len(p.s) {
|
||
|
goto eof
|
||
|
}
|
||
|
switch p.s[p.i] {
|
||
|
case '-':
|
||
|
p.i++
|
||
|
goto negativeA
|
||
|
case '+':
|
||
|
p.i++
|
||
|
goto positiveA
|
||
|
case '0', '1', '2', '3', '4', '5', '6', '7', '8', '9':
|
||
|
goto positiveA
|
||
|
case 'n', 'N':
|
||
|
a = 1
|
||
|
p.i++
|
||
|
goto readN
|
||
|
case 'o', 'O', 'e', 'E':
|
||
|
id, nameErr := p.parseName()
|
||
|
if nameErr != nil {
|
||
|
return 0, 0, nameErr
|
||
|
}
|
||
|
id = toLowerASCII(id)
|
||
|
if id == "odd" {
|
||
|
return 2, 1, nil
|
||
|
}
|
||
|
if id == "even" {
|
||
|
return 2, 0, nil
|
||
|
}
|
||
|
return 0, 0, fmt.Errorf("expected 'odd' or 'even', but found '%s' instead", id)
|
||
|
default:
|
||
|
goto invalid
|
||
|
}
|
||
|
|
||
|
positiveA:
|
||
|
if p.i >= len(p.s) {
|
||
|
goto eof
|
||
|
}
|
||
|
switch p.s[p.i] {
|
||
|
case '0', '1', '2', '3', '4', '5', '6', '7', '8', '9':
|
||
|
a, err = p.parseInteger()
|
||
|
if err != nil {
|
||
|
return 0, 0, err
|
||
|
}
|
||
|
goto readA
|
||
|
case 'n', 'N':
|
||
|
a = 1
|
||
|
p.i++
|
||
|
goto readN
|
||
|
default:
|
||
|
goto invalid
|
||
|
}
|
||
|
|
||
|
negativeA:
|
||
|
if p.i >= len(p.s) {
|
||
|
goto eof
|
||
|
}
|
||
|
switch p.s[p.i] {
|
||
|
case '0', '1', '2', '3', '4', '5', '6', '7', '8', '9':
|
||
|
a, err = p.parseInteger()
|
||
|
if err != nil {
|
||
|
return 0, 0, err
|
||
|
}
|
||
|
a = -a
|
||
|
goto readA
|
||
|
case 'n', 'N':
|
||
|
a = -1
|
||
|
p.i++
|
||
|
goto readN
|
||
|
default:
|
||
|
goto invalid
|
||
|
}
|
||
|
|
||
|
readA:
|
||
|
if p.i >= len(p.s) {
|
||
|
goto eof
|
||
|
}
|
||
|
switch p.s[p.i] {
|
||
|
case 'n', 'N':
|
||
|
p.i++
|
||
|
goto readN
|
||
|
default:
|
||
|
// The number we read as a is actually b.
|
||
|
return 0, a, nil
|
||
|
}
|
||
|
|
||
|
readN:
|
||
|
p.skipWhitespace()
|
||
|
if p.i >= len(p.s) {
|
||
|
goto eof
|
||
|
}
|
||
|
switch p.s[p.i] {
|
||
|
case '+':
|
||
|
p.i++
|
||
|
p.skipWhitespace()
|
||
|
b, err = p.parseInteger()
|
||
|
if err != nil {
|
||
|
return 0, 0, err
|
||
|
}
|
||
|
return a, b, nil
|
||
|
case '-':
|
||
|
p.i++
|
||
|
p.skipWhitespace()
|
||
|
b, err = p.parseInteger()
|
||
|
if err != nil {
|
||
|
return 0, 0, err
|
||
|
}
|
||
|
return a, -b, nil
|
||
|
default:
|
||
|
return a, 0, nil
|
||
|
}
|
||
|
|
||
|
eof:
|
||
|
return 0, 0, errors.New("unexpected EOF while attempting to parse expression of form an+b")
|
||
|
|
||
|
invalid:
|
||
|
return 0, 0, errors.New("unexpected character while attempting to parse expression of form an+b")
|
||
|
}
|
||
|
|
||
|
// parseSimpleSelectorSequence parses a selector sequence that applies to
|
||
|
// a single element.
|
||
|
func (p *parser) parseSimpleSelectorSequence() (Selector, error) {
|
||
|
var result Selector
|
||
|
|
||
|
if p.i >= len(p.s) {
|
||
|
return nil, errors.New("expected selector, found EOF instead")
|
||
|
}
|
||
|
|
||
|
switch p.s[p.i] {
|
||
|
case '*':
|
||
|
// It's the universal selector. Just skip over it, since it doesn't affect the meaning.
|
||
|
p.i++
|
||
|
case '#', '.', '[', ':':
|
||
|
// There's no type selector. Wait to process the other till the main loop.
|
||
|
default:
|
||
|
r, err := p.parseTypeSelector()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
result = r
|
||
|
}
|
||
|
|
||
|
loop:
|
||
|
for p.i < len(p.s) {
|
||
|
var ns Selector
|
||
|
var err error
|
||
|
switch p.s[p.i] {
|
||
|
case '#':
|
||
|
ns, err = p.parseIDSelector()
|
||
|
case '.':
|
||
|
ns, err = p.parseClassSelector()
|
||
|
case '[':
|
||
|
ns, err = p.parseAttributeSelector()
|
||
|
case ':':
|
||
|
ns, err = p.parsePseudoclassSelector()
|
||
|
default:
|
||
|
break loop
|
||
|
}
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
if result == nil {
|
||
|
result = ns
|
||
|
} else {
|
||
|
result = intersectionSelector(result, ns)
|
||
|
}
|
||
|
}
|
||
|
|
||
|
if result == nil {
|
||
|
result = func(n *html.Node) bool {
|
||
|
return n.Type == html.ElementNode
|
||
|
}
|
||
|
}
|
||
|
|
||
|
return result, nil
|
||
|
}
|
||
|
|
||
|
// parseSelector parses a selector that may include combinators.
|
||
|
func (p *parser) parseSelector() (result Selector, err error) {
|
||
|
p.skipWhitespace()
|
||
|
result, err = p.parseSimpleSelectorSequence()
|
||
|
if err != nil {
|
||
|
return
|
||
|
}
|
||
|
|
||
|
for {
|
||
|
var combinator byte
|
||
|
if p.skipWhitespace() {
|
||
|
combinator = ' '
|
||
|
}
|
||
|
if p.i >= len(p.s) {
|
||
|
return
|
||
|
}
|
||
|
|
||
|
switch p.s[p.i] {
|
||
|
case '+', '>', '~':
|
||
|
combinator = p.s[p.i]
|
||
|
p.i++
|
||
|
p.skipWhitespace()
|
||
|
case ',', ')':
|
||
|
// These characters can't begin a selector, but they can legally occur after one.
|
||
|
return
|
||
|
}
|
||
|
|
||
|
if combinator == 0 {
|
||
|
return
|
||
|
}
|
||
|
|
||
|
c, err := p.parseSimpleSelectorSequence()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
|
||
|
switch combinator {
|
||
|
case ' ':
|
||
|
result = descendantSelector(result, c)
|
||
|
case '>':
|
||
|
result = childSelector(result, c)
|
||
|
case '+':
|
||
|
result = siblingSelector(result, c, true)
|
||
|
case '~':
|
||
|
result = siblingSelector(result, c, false)
|
||
|
}
|
||
|
}
|
||
|
|
||
|
panic("unreachable")
|
||
|
}
|
||
|
|
||
|
// parseSelectorGroup parses a group of selectors, separated by commas.
|
||
|
func (p *parser) parseSelectorGroup() (result Selector, err error) {
|
||
|
result, err = p.parseSelector()
|
||
|
if err != nil {
|
||
|
return
|
||
|
}
|
||
|
|
||
|
for p.i < len(p.s) {
|
||
|
if p.s[p.i] != ',' {
|
||
|
return result, nil
|
||
|
}
|
||
|
p.i++
|
||
|
c, err := p.parseSelector()
|
||
|
if err != nil {
|
||
|
return nil, err
|
||
|
}
|
||
|
result = unionSelector(result, c)
|
||
|
}
|
||
|
|
||
|
return
|
||
|
}
|