githaven/vendor/github.com/yuin/goldmark/parser/raw_html.go

package parser

import (
	"bytes"
	"regexp"

	"github.com/yuin/goldmark/ast"
	"github.com/yuin/goldmark/text"
	"github.com/yuin/goldmark/util"
)

type rawHTMLParser struct {
}

var defaultRawHTMLParser = &rawHTMLParser{}

// NewRawHTMLParser return a new InlineParser that can parse
// inline htmls
func NewRawHTMLParser() InlineParser {
	return defaultRawHTMLParser
}

func (s *rawHTMLParser) Trigger() []byte {
	return []byte{'<'}
}

func (s *rawHTMLParser) Parse(parent ast.Node, block text.Reader, pc Context) ast.Node {
	line, _ := block.PeekLine()
	if len(line) > 1 && util.IsAlphaNumeric(line[1]) {
		return s.parseMultiLineRegexp(openTagRegexp, block, pc)
	}
	if len(line) > 2 && line[1] == '/' && util.IsAlphaNumeric(line[2]) {
		return s.parseMultiLineRegexp(closeTagRegexp, block, pc)
	}
	if bytes.HasPrefix(line, []byte("<!--")) {
		return s.parseMultiLineRegexp(commentRegexp, block, pc)
	}
	if bytes.HasPrefix(line, []byte("<?")) {
		return s.parseSingleLineRegexp(processingInstructionRegexp, block, pc)
	}
	if len(line) > 2 && line[1] == '!' && line[2] >= 'A' && line[2] <= 'Z' {
		return s.parseSingleLineRegexp(declRegexp, block, pc)
	}
	if bytes.HasPrefix(line, []byte("<![CDATA[")) {
		return s.parseMultiLineRegexp(cdataRegexp, block, pc)
	}
	return nil
}

var tagnamePattern = `([A-Za-z][A-Za-z0-9-]*)`
var attributePattern = `(?:\s+[a-zA-Z_:][a-zA-Z0-9:._-]*(?:\s*=\s*(?:[^\"'=<>` + "`" + `\x00-\x20]+|'[^']*'|"[^"]*"))?)`
var openTagRegexp = regexp.MustCompile("^<" + tagnamePattern + attributePattern + `*\s*/?>`)
var closeTagRegexp = regexp.MustCompile("^</" + tagnamePattern + `\s*>`)
var commentRegexp = regexp.MustCompile(`^<!---->|<!--(?:-?[^>-])(?:-?[^-])*-->`)
var processingInstructionRegexp = regexp.MustCompile(`^(?:<\?).*?(?:\?>)`)
var declRegexp = regexp.MustCompile(`^<![A-Z]+\s+[^>]*>`)
var cdataRegexp = regexp.MustCompile(`<!\[CDATA\[[\s\S]*?\]\]>`)

func (s *rawHTMLParser) parseSingleLineRegexp(reg *regexp.Regexp, block text.Reader, pc Context) ast.Node {
	line, segment := block.PeekLine()
	match := reg.FindSubmatchIndex(line)
	if match == nil {
		return nil
	}
	node := ast.NewRawHTML()
	node.Segments.Append(segment.WithStop(segment.Start + match[1]))
	block.Advance(match[1])
	return node
}

func (s *rawHTMLParser) parseMultiLineRegexp(reg *regexp.Regexp, block text.Reader, pc Context) ast.Node {
	sline, ssegment := block.Position()
	if block.Match(reg) {
		node := ast.NewRawHTML()
		eline, esegment := block.Position()
		block.SetPosition(sline, ssegment)
		for {
			line, segment := block.PeekLine()
			if line == nil {
				break
			}
			l, _ := block.Position()
			start := segment.Start
			if l == sline {
				start = ssegment.Start
			}
			end := segment.Stop
			if l == eline {
				end = esegment.Start
			}

			node.Segments.Append(text.NewSegment(start, end))
			if l == eline {
				block.Advance(end - start)
				break
			} else {
				block.AdvanceLine()
			}
		}
		return node
	}
	return nil
}
Change markdown rendering from blackfriday to goldmark (#9533) * Move to goldmark Markdown rendering moved from blackfriday to the goldmark. Multiple subtle changes required to the goldmark extensions to keep current rendering and defaults. Can go further with goldmark linkify and have this work within markdown rendering making the link processor unnecessary. Need to think about how to go about allowing extensions - at present it seems that these would be hard to do without recompilation. * linter fixes Co-authored-by: Lauris BH <lauris@nix.lv> 2019-12-31 01:53:28 +00:00			`package parser`

			`import (`
			`"bytes"`
Vendor Update (#14496) * update code.gitea.io/sdk/gitea v0.13.1 -> v0.13.2 * update github.com/go-swagger/go-swagger v0.25.0 -> v0.26.0 * update github.com/google/uuid v1.1.2 -> v1.2.0 * update github.com/klauspost/compress v1.11.3 -> v1.11.7 * update github.com/lib/pq 083382b7e6fc -> v1.9.0 * update github.com/markbates/goth v1.65.0 -> v1.66.1 * update github.com/mattn/go-sqlite3 v1.14.4 -> v1.14.6 * update github.com/mgechev/revive 246eac737dc7 -> v1.0.3 * update github.com/minio/minio-go/v7 v7.0.6 -> v7.0.7 * update github.com/niklasfasching/go-org v1.3.2 -> v1.4.0 * update github.com/olivere/elastic/v7 v7.0.21 -> v7.0.22 * update github.com/pquerna/otp v1.2.0 -> v1.3.0 * update github.com/xanzy/go-gitlab v0.39.0 -> v0.42.0 * update github.com/yuin/goldmark v1.2.1 -> v1.3.1 2021-01-28 16:56:38 +00:00			`"regexp"`

Change markdown rendering from blackfriday to goldmark (#9533) * Move to goldmark Markdown rendering moved from blackfriday to the goldmark. Multiple subtle changes required to the goldmark extensions to keep current rendering and defaults. Can go further with goldmark linkify and have this work within markdown rendering making the link processor unnecessary. Need to think about how to go about allowing extensions - at present it seems that these would be hard to do without recompilation. * linter fixes Co-authored-by: Lauris BH <lauris@nix.lv> 2019-12-31 01:53:28 +00:00			`"github.com/yuin/goldmark/ast"`
			`"github.com/yuin/goldmark/text"`
			`"github.com/yuin/goldmark/util"`
			`)`

			`type rawHTMLParser struct {`
			`}`

			`var defaultRawHTMLParser = &rawHTMLParser{}`

			`// NewRawHTMLParser return a new InlineParser that can parse`
			`// inline htmls`
			`func NewRawHTMLParser() InlineParser {`
			`return defaultRawHTMLParser`
			`}`

			`func (s *rawHTMLParser) Trigger() []byte {`
			`return []byte{'<'}`
			`}`

			`func (s *rawHTMLParser) Parse(parent ast.Node, block text.Reader, pc Context) ast.Node {`
			`line, _ := block.PeekLine()`
			`if len(line) > 1 && util.IsAlphaNumeric(line[1]) {`
			`return s.parseMultiLineRegexp(openTagRegexp, block, pc)`
			`}`
			`if len(line) > 2 && line[1] == '/' && util.IsAlphaNumeric(line[2]) {`
			`return s.parseMultiLineRegexp(closeTagRegexp, block, pc)`
			`}`
			`if bytes.HasPrefix(line, []byte("<!--")) {`
			`return s.parseMultiLineRegexp(commentRegexp, block, pc)`
			`}`
			`if bytes.HasPrefix(line, []byte("<?")) {`
			`return s.parseSingleLineRegexp(processingInstructionRegexp, block, pc)`
			`}`
			`if len(line) > 2 && line[1] == '!' && line[2] >= 'A' && line[2] <= 'Z' {`
			`return s.parseSingleLineRegexp(declRegexp, block, pc)`
			`}`
			`if bytes.HasPrefix(line, []byte("<![CDATA[")) {`
			`return s.parseMultiLineRegexp(cdataRegexp, block, pc)`
			`}`
			`return nil`
			`}`

			var tagnamePattern = `([A-Za-z][A-Za-z0-9-]*)`
			var attributePattern = `(?:\s+[a-zA-Z_:][a-zA-Z0-9:._-](?:\s=\s(?:[^\"'=<>` + "`" + `\x00-\x20]+\|'[^']'\|"[^"]*"))?)`
			var openTagRegexp = regexp.MustCompile("^<" + tagnamePattern + attributePattern + `\s/?>`)
			var closeTagRegexp = regexp.MustCompile("^</" + tagnamePattern + `\s*>`)
			var commentRegexp = regexp.MustCompile(`^<!---->\|<!--(?:-?[^>-])(?:-?[^-])*-->`)
			var processingInstructionRegexp = regexp.MustCompile(`^(?:<\?).*?(?:\?>)`)
			var declRegexp = regexp.MustCompile(`^<![A-Z]+\s+[^>]*>`)
			var cdataRegexp = regexp.MustCompile(`<!\[CDATA\[[\s\S]*?\]\]>`)

			`func (s rawHTMLParser) parseSingleLineRegexp(reg regexp.Regexp, block text.Reader, pc Context) ast.Node {`
			`line, segment := block.PeekLine()`
			`match := reg.FindSubmatchIndex(line)`
			`if match == nil {`
			`return nil`
			`}`
			`node := ast.NewRawHTML()`
			`node.Segments.Append(segment.WithStop(segment.Start + match[1]))`
			`block.Advance(match[1])`
			`return node`
			`}`

			`func (s rawHTMLParser) parseMultiLineRegexp(reg regexp.Regexp, block text.Reader, pc Context) ast.Node {`
			`sline, ssegment := block.Position()`
			`if block.Match(reg) {`
			`node := ast.NewRawHTML()`
			`eline, esegment := block.Position()`
			`block.SetPosition(sline, ssegment)`
			`for {`
			`line, segment := block.PeekLine()`
			`if line == nil {`
			`break`
			`}`
			`l, _ := block.Position()`
			`start := segment.Start`
			`if l == sline {`
			`start = ssegment.Start`
			`}`
			`end := segment.Stop`
			`if l == eline {`
			`end = esegment.Start`
			`}`

			`node.Segments.Append(text.NewSegment(start, end))`
			`if l == eline {`
			`block.Advance(end - start)`
			`break`
			`} else {`
			`block.AdvanceLine()`
			`}`
			`}`
			`return node`
			`}`
			`return nil`
			`}`