mirror of
				https://github.com/go-gitea/gitea
				synced 2025-10-26 17:08:25 +00:00 
			
		
		
		
	* Move to goldmark Markdown rendering moved from blackfriday to the goldmark. Multiple subtle changes required to the goldmark extensions to keep current rendering and defaults. Can go further with goldmark linkify and have this work within markdown rendering making the link processor unnecessary. Need to think about how to go about allowing extensions - at present it seems that these would be hard to do without recompilation. * linter fixes Co-authored-by: Lauris BH <lauris@nix.lv>
		
			
				
	
	
		
			868 lines
		
	
	
		
			25 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
			
		
		
	
	
			868 lines
		
	
	
		
			25 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
| // Copyright 2017 The Gitea Authors. All rights reserved.
 | ||
| // Use of this source code is governed by a MIT-style
 | ||
| // license that can be found in the LICENSE file.
 | ||
| 
 | ||
| package markup
 | ||
| 
 | ||
| import (
 | ||
| 	"bytes"
 | ||
| 	"net/url"
 | ||
| 	"path"
 | ||
| 	"path/filepath"
 | ||
| 	"regexp"
 | ||
| 	"strings"
 | ||
| 
 | ||
| 	"code.gitea.io/gitea/modules/base"
 | ||
| 	"code.gitea.io/gitea/modules/git"
 | ||
| 	"code.gitea.io/gitea/modules/log"
 | ||
| 	"code.gitea.io/gitea/modules/markup/common"
 | ||
| 	"code.gitea.io/gitea/modules/references"
 | ||
| 	"code.gitea.io/gitea/modules/setting"
 | ||
| 	"code.gitea.io/gitea/modules/util"
 | ||
| 
 | ||
| 	"github.com/unknwon/com"
 | ||
| 	"golang.org/x/net/html"
 | ||
| 	"golang.org/x/net/html/atom"
 | ||
| 	"mvdan.cc/xurls/v2"
 | ||
| )
 | ||
| 
 | ||
| // Issue name styles
 | ||
| const (
 | ||
| 	IssueNameStyleNumeric      = "numeric"
 | ||
| 	IssueNameStyleAlphanumeric = "alphanumeric"
 | ||
| )
 | ||
| 
 | ||
| var (
 | ||
| 	// NOTE: All below regex matching do not perform any extra validation.
 | ||
| 	// Thus a link is produced even if the linked entity does not exist.
 | ||
| 	// While fast, this is also incorrect and lead to false positives.
 | ||
| 	// TODO: fix invalid linking issue
 | ||
| 
 | ||
| 	// sha1CurrentPattern matches string that represents a commit SHA, e.g. d8a994ef243349f321568f9e36d5c3f444b99cae
 | ||
| 	// Although SHA1 hashes are 40 chars long, the regex matches the hash from 7 to 40 chars in length
 | ||
| 	// so that abbreviated hash links can be used as well. This matches git and github useability.
 | ||
| 	sha1CurrentPattern = regexp.MustCompile(`(?:\s|^|\(|\[)([0-9a-f]{7,40})(?:\s|$|\)|\]|\.(\s|$))`)
 | ||
| 
 | ||
| 	// shortLinkPattern matches short but difficult to parse [[name|link|arg=test]] syntax
 | ||
| 	shortLinkPattern = regexp.MustCompile(`\[\[(.*?)\]\](\w*)`)
 | ||
| 
 | ||
| 	// anySHA1Pattern allows to split url containing SHA into parts
 | ||
| 	anySHA1Pattern = regexp.MustCompile(`https?://(?:\S+/){4}([0-9a-f]{40})(/[^#\s]+)?(#\S+)?`)
 | ||
| 
 | ||
| 	validLinksPattern = regexp.MustCompile(`^[a-z][\w-]+://`)
 | ||
| 
 | ||
| 	// While this email regex is definitely not perfect and I'm sure you can come up
 | ||
| 	// with edge cases, it is still accepted by the CommonMark specification, as
 | ||
| 	// well as the HTML5 spec:
 | ||
| 	//   http://spec.commonmark.org/0.28/#email-address
 | ||
| 	//   https://html.spec.whatwg.org/multipage/input.html#e-mail-state-(type%3Demail)
 | ||
| 	emailRegex = regexp.MustCompile("(?:\\s|^|\\(|\\[)([a-zA-Z0-9.!#$%&'*+\\/=?^_`{|}~-]+@[a-zA-Z0-9](?:[a-zA-Z0-9-]{0,61}[a-zA-Z0-9])?(?:\\.[a-zA-Z0-9]{2,}(?:[a-zA-Z0-9-]{0,61}[a-zA-Z0-9])?)+)(?:\\s|$|\\)|\\]|\\.(\\s|$))")
 | ||
| 
 | ||
| 	// blackfriday extensions create IDs like fn:user-content-footnote
 | ||
| 	blackfridayExtRegex = regexp.MustCompile(`[^:]*:user-content-`)
 | ||
| )
 | ||
| 
 | ||
| // CSS class for action keywords (e.g. "closes: #1")
 | ||
| const keywordClass = "issue-keyword"
 | ||
| 
 | ||
| // regexp for full links to issues/pulls
 | ||
| var issueFullPattern *regexp.Regexp
 | ||
| 
 | ||
| // IsLink reports whether link fits valid format.
 | ||
| func IsLink(link []byte) bool {
 | ||
| 	return isLink(link)
 | ||
| }
 | ||
| 
 | ||
| // isLink reports whether link fits valid format.
 | ||
| func isLink(link []byte) bool {
 | ||
| 	return validLinksPattern.Match(link)
 | ||
| }
 | ||
| 
 | ||
| func isLinkStr(link string) bool {
 | ||
| 	return validLinksPattern.MatchString(link)
 | ||
| }
 | ||
| 
 | ||
| func getIssueFullPattern() *regexp.Regexp {
 | ||
| 	if issueFullPattern == nil {
 | ||
| 		appURL := setting.AppURL
 | ||
| 		if len(appURL) > 0 && appURL[len(appURL)-1] != '/' {
 | ||
| 			appURL += "/"
 | ||
| 		}
 | ||
| 		issueFullPattern = regexp.MustCompile(appURL +
 | ||
| 			`\w+/\w+/(?:issues|pulls)/((?:\w{1,10}-)?[1-9][0-9]*)([\?|#]\S+.(\S+)?)?\b`)
 | ||
| 	}
 | ||
| 	return issueFullPattern
 | ||
| }
 | ||
| 
 | ||
| // CustomLinkURLSchemes allows for additional schemes to be detected when parsing links within text
 | ||
| func CustomLinkURLSchemes(schemes []string) {
 | ||
| 	schemes = append(schemes, "http", "https")
 | ||
| 	withAuth := make([]string, 0, len(schemes))
 | ||
| 	validScheme := regexp.MustCompile(`^[a-z]+$`)
 | ||
| 	for _, s := range schemes {
 | ||
| 		if !validScheme.MatchString(s) {
 | ||
| 			continue
 | ||
| 		}
 | ||
| 		without := false
 | ||
| 		for _, sna := range xurls.SchemesNoAuthority {
 | ||
| 			if s == sna {
 | ||
| 				without = true
 | ||
| 				break
 | ||
| 			}
 | ||
| 		}
 | ||
| 		if without {
 | ||
| 			s += ":"
 | ||
| 		} else {
 | ||
| 			s += "://"
 | ||
| 		}
 | ||
| 		withAuth = append(withAuth, s)
 | ||
| 	}
 | ||
| 	common.LinkRegex, _ = xurls.StrictMatchingScheme(strings.Join(withAuth, "|"))
 | ||
| }
 | ||
| 
 | ||
| // IsSameDomain checks if given url string has the same hostname as current Gitea instance
 | ||
| func IsSameDomain(s string) bool {
 | ||
| 	if strings.HasPrefix(s, "/") {
 | ||
| 		return true
 | ||
| 	}
 | ||
| 	if uapp, err := url.Parse(setting.AppURL); err == nil {
 | ||
| 		if u, err := url.Parse(s); err == nil {
 | ||
| 			return u.Host == uapp.Host
 | ||
| 		}
 | ||
| 		return false
 | ||
| 	}
 | ||
| 	return false
 | ||
| }
 | ||
| 
 | ||
| type postProcessError struct {
 | ||
| 	context string
 | ||
| 	err     error
 | ||
| }
 | ||
| 
 | ||
| func (p *postProcessError) Error() string {
 | ||
| 	return "PostProcess: " + p.context + ", " + p.err.Error()
 | ||
| }
 | ||
| 
 | ||
| type processor func(ctx *postProcessCtx, node *html.Node)
 | ||
| 
 | ||
| var defaultProcessors = []processor{
 | ||
| 	fullIssuePatternProcessor,
 | ||
| 	fullSha1PatternProcessor,
 | ||
| 	shortLinkProcessor,
 | ||
| 	linkProcessor,
 | ||
| 	mentionProcessor,
 | ||
| 	issueIndexPatternProcessor,
 | ||
| 	sha1CurrentPatternProcessor,
 | ||
| 	emailAddressProcessor,
 | ||
| }
 | ||
| 
 | ||
| type postProcessCtx struct {
 | ||
| 	metas          map[string]string
 | ||
| 	urlPrefix      string
 | ||
| 	isWikiMarkdown bool
 | ||
| 
 | ||
| 	// processors used by this context.
 | ||
| 	procs []processor
 | ||
| }
 | ||
| 
 | ||
| // PostProcess does the final required transformations to the passed raw HTML
 | ||
| // data, and ensures its validity. Transformations include: replacing links and
 | ||
| // emails with HTML links, parsing shortlinks in the format of [[Link]], like
 | ||
| // MediaWiki, linking issues in the format #ID, and mentions in the format
 | ||
| // @user, and others.
 | ||
| func PostProcess(
 | ||
| 	rawHTML []byte,
 | ||
| 	urlPrefix string,
 | ||
| 	metas map[string]string,
 | ||
| 	isWikiMarkdown bool,
 | ||
| ) ([]byte, error) {
 | ||
| 	// create the context from the parameters
 | ||
| 	ctx := &postProcessCtx{
 | ||
| 		metas:          metas,
 | ||
| 		urlPrefix:      urlPrefix,
 | ||
| 		isWikiMarkdown: isWikiMarkdown,
 | ||
| 		procs:          defaultProcessors,
 | ||
| 	}
 | ||
| 	return ctx.postProcess(rawHTML)
 | ||
| }
 | ||
| 
 | ||
| var commitMessageProcessors = []processor{
 | ||
| 	fullIssuePatternProcessor,
 | ||
| 	fullSha1PatternProcessor,
 | ||
| 	linkProcessor,
 | ||
| 	mentionProcessor,
 | ||
| 	issueIndexPatternProcessor,
 | ||
| 	sha1CurrentPatternProcessor,
 | ||
| 	emailAddressProcessor,
 | ||
| }
 | ||
| 
 | ||
| // RenderCommitMessage will use the same logic as PostProcess, but will disable
 | ||
| // the shortLinkProcessor and will add a defaultLinkProcessor if defaultLink is
 | ||
| // set, which changes every text node into a link to the passed default link.
 | ||
| func RenderCommitMessage(
 | ||
| 	rawHTML []byte,
 | ||
| 	urlPrefix, defaultLink string,
 | ||
| 	metas map[string]string,
 | ||
| ) ([]byte, error) {
 | ||
| 	ctx := &postProcessCtx{
 | ||
| 		metas:     metas,
 | ||
| 		urlPrefix: urlPrefix,
 | ||
| 		procs:     commitMessageProcessors,
 | ||
| 	}
 | ||
| 	if defaultLink != "" {
 | ||
| 		// we don't have to fear data races, because being
 | ||
| 		// commitMessageProcessors of fixed len and cap, every time we append
 | ||
| 		// something to it the slice is realloc+copied, so append always
 | ||
| 		// generates the slice ex-novo.
 | ||
| 		ctx.procs = append(ctx.procs, genDefaultLinkProcessor(defaultLink))
 | ||
| 	}
 | ||
| 	return ctx.postProcess(rawHTML)
 | ||
| }
 | ||
| 
 | ||
| var commitMessageSubjectProcessors = []processor{
 | ||
| 	fullIssuePatternProcessor,
 | ||
| 	fullSha1PatternProcessor,
 | ||
| 	linkProcessor,
 | ||
| 	mentionProcessor,
 | ||
| 	issueIndexPatternProcessor,
 | ||
| 	sha1CurrentPatternProcessor,
 | ||
| }
 | ||
| 
 | ||
| // RenderCommitMessageSubject will use the same logic as PostProcess and
 | ||
| // RenderCommitMessage, but will disable the shortLinkProcessor and
 | ||
| // emailAddressProcessor, will add a defaultLinkProcessor if defaultLink is set,
 | ||
| // which changes every text node into a link to the passed default link.
 | ||
| func RenderCommitMessageSubject(
 | ||
| 	rawHTML []byte,
 | ||
| 	urlPrefix, defaultLink string,
 | ||
| 	metas map[string]string,
 | ||
| ) ([]byte, error) {
 | ||
| 	ctx := &postProcessCtx{
 | ||
| 		metas:     metas,
 | ||
| 		urlPrefix: urlPrefix,
 | ||
| 		procs:     commitMessageSubjectProcessors,
 | ||
| 	}
 | ||
| 	if defaultLink != "" {
 | ||
| 		// we don't have to fear data races, because being
 | ||
| 		// commitMessageSubjectProcessors of fixed len and cap, every time we
 | ||
| 		// append something to it the slice is realloc+copied, so append always
 | ||
| 		// generates the slice ex-novo.
 | ||
| 		ctx.procs = append(ctx.procs, genDefaultLinkProcessor(defaultLink))
 | ||
| 	}
 | ||
| 	return ctx.postProcess(rawHTML)
 | ||
| }
 | ||
| 
 | ||
| // RenderDescriptionHTML will use similar logic as PostProcess, but will
 | ||
| // use a single special linkProcessor.
 | ||
| func RenderDescriptionHTML(
 | ||
| 	rawHTML []byte,
 | ||
| 	urlPrefix string,
 | ||
| 	metas map[string]string,
 | ||
| ) ([]byte, error) {
 | ||
| 	ctx := &postProcessCtx{
 | ||
| 		metas:     metas,
 | ||
| 		urlPrefix: urlPrefix,
 | ||
| 		procs: []processor{
 | ||
| 			descriptionLinkProcessor,
 | ||
| 		},
 | ||
| 	}
 | ||
| 	return ctx.postProcess(rawHTML)
 | ||
| }
 | ||
| 
 | ||
| var byteBodyTag = []byte("<body>")
 | ||
| var byteBodyTagClosing = []byte("</body>")
 | ||
| 
 | ||
| func (ctx *postProcessCtx) postProcess(rawHTML []byte) ([]byte, error) {
 | ||
| 	if ctx.procs == nil {
 | ||
| 		ctx.procs = defaultProcessors
 | ||
| 	}
 | ||
| 
 | ||
| 	// give a generous extra 50 bytes
 | ||
| 	res := make([]byte, 0, len(rawHTML)+50)
 | ||
| 	res = append(res, byteBodyTag...)
 | ||
| 	res = append(res, rawHTML...)
 | ||
| 	res = append(res, byteBodyTagClosing...)
 | ||
| 
 | ||
| 	// parse the HTML
 | ||
| 	nodes, err := html.ParseFragment(bytes.NewReader(res), nil)
 | ||
| 	if err != nil {
 | ||
| 		return nil, &postProcessError{"invalid HTML", err}
 | ||
| 	}
 | ||
| 
 | ||
| 	for _, node := range nodes {
 | ||
| 		ctx.visitNode(node)
 | ||
| 	}
 | ||
| 
 | ||
| 	// Create buffer in which the data will be placed again. We know that the
 | ||
| 	// length will be at least that of res; to spare a few alloc+copy, we
 | ||
| 	// reuse res, resetting its length to 0.
 | ||
| 	buf := bytes.NewBuffer(res[:0])
 | ||
| 	// Render everything to buf.
 | ||
| 	for _, node := range nodes {
 | ||
| 		err = html.Render(buf, node)
 | ||
| 		if err != nil {
 | ||
| 			return nil, &postProcessError{"error rendering processed HTML", err}
 | ||
| 		}
 | ||
| 	}
 | ||
| 
 | ||
| 	// remove initial parts - because Render creates a whole HTML page.
 | ||
| 	res = buf.Bytes()
 | ||
| 	res = res[bytes.Index(res, byteBodyTag)+len(byteBodyTag) : bytes.LastIndex(res, byteBodyTagClosing)]
 | ||
| 
 | ||
| 	// Everything done successfully, return parsed data.
 | ||
| 	return res, nil
 | ||
| }
 | ||
| 
 | ||
| func (ctx *postProcessCtx) visitNode(node *html.Node) {
 | ||
| 	// Add user-content- to IDs if they don't already have them
 | ||
| 	for idx, attr := range node.Attr {
 | ||
| 		if attr.Key == "id" && !(strings.HasPrefix(attr.Val, "user-content-") || blackfridayExtRegex.MatchString(attr.Val)) {
 | ||
| 			node.Attr[idx].Val = "user-content-" + attr.Val
 | ||
| 		}
 | ||
| 	}
 | ||
| 	// We ignore code, pre and already generated links.
 | ||
| 	switch node.Type {
 | ||
| 	case html.TextNode:
 | ||
| 		ctx.textNode(node)
 | ||
| 	case html.ElementNode:
 | ||
| 		if node.Data == "a" || node.Data == "code" || node.Data == "pre" {
 | ||
| 			return
 | ||
| 		}
 | ||
| 		for n := node.FirstChild; n != nil; n = n.NextSibling {
 | ||
| 			ctx.visitNode(n)
 | ||
| 		}
 | ||
| 	}
 | ||
| 	// ignore everything else
 | ||
| }
 | ||
| 
 | ||
| // textNode runs the passed node through various processors, in order to handle
 | ||
| // all kinds of special links handled by the post-processing.
 | ||
| func (ctx *postProcessCtx) textNode(node *html.Node) {
 | ||
| 	for _, processor := range ctx.procs {
 | ||
| 		processor(ctx, node)
 | ||
| 	}
 | ||
| }
 | ||
| 
 | ||
| // createKeyword() renders a highlighted version of an action keyword
 | ||
| func createKeyword(content string) *html.Node {
 | ||
| 	span := &html.Node{
 | ||
| 		Type: html.ElementNode,
 | ||
| 		Data: atom.Span.String(),
 | ||
| 		Attr: []html.Attribute{},
 | ||
| 	}
 | ||
| 	span.Attr = append(span.Attr, html.Attribute{Key: "class", Val: keywordClass})
 | ||
| 
 | ||
| 	text := &html.Node{
 | ||
| 		Type: html.TextNode,
 | ||
| 		Data: content,
 | ||
| 	}
 | ||
| 	span.AppendChild(text)
 | ||
| 
 | ||
| 	return span
 | ||
| }
 | ||
| 
 | ||
| func createLink(href, content, class string) *html.Node {
 | ||
| 	a := &html.Node{
 | ||
| 		Type: html.ElementNode,
 | ||
| 		Data: atom.A.String(),
 | ||
| 		Attr: []html.Attribute{{Key: "href", Val: href}},
 | ||
| 	}
 | ||
| 
 | ||
| 	if class != "" {
 | ||
| 		a.Attr = append(a.Attr, html.Attribute{Key: "class", Val: class})
 | ||
| 	}
 | ||
| 
 | ||
| 	text := &html.Node{
 | ||
| 		Type: html.TextNode,
 | ||
| 		Data: content,
 | ||
| 	}
 | ||
| 
 | ||
| 	a.AppendChild(text)
 | ||
| 	return a
 | ||
| }
 | ||
| 
 | ||
| func createCodeLink(href, content, class string) *html.Node {
 | ||
| 	a := &html.Node{
 | ||
| 		Type: html.ElementNode,
 | ||
| 		Data: atom.A.String(),
 | ||
| 		Attr: []html.Attribute{{Key: "href", Val: href}},
 | ||
| 	}
 | ||
| 
 | ||
| 	if class != "" {
 | ||
| 		a.Attr = append(a.Attr, html.Attribute{Key: "class", Val: class})
 | ||
| 	}
 | ||
| 
 | ||
| 	text := &html.Node{
 | ||
| 		Type: html.TextNode,
 | ||
| 		Data: content,
 | ||
| 	}
 | ||
| 
 | ||
| 	code := &html.Node{
 | ||
| 		Type: html.ElementNode,
 | ||
| 		Data: atom.Code.String(),
 | ||
| 		Attr: []html.Attribute{{Key: "class", Val: "nohighlight"}},
 | ||
| 	}
 | ||
| 
 | ||
| 	code.AppendChild(text)
 | ||
| 	a.AppendChild(code)
 | ||
| 	return a
 | ||
| }
 | ||
| 
 | ||
| // replaceContent takes text node, and in its content it replaces a section of
 | ||
| // it with the specified newNode.
 | ||
| func replaceContent(node *html.Node, i, j int, newNode *html.Node) {
 | ||
| 	replaceContentList(node, i, j, []*html.Node{newNode})
 | ||
| }
 | ||
| 
 | ||
| // replaceContentList takes text node, and in its content it replaces a section of
 | ||
| // it with the specified newNodes. An example to visualize how this can work can
 | ||
| // be found here: https://play.golang.org/p/5zP8NnHZ03s
 | ||
| func replaceContentList(node *html.Node, i, j int, newNodes []*html.Node) {
 | ||
| 	// get the data before and after the match
 | ||
| 	before := node.Data[:i]
 | ||
| 	after := node.Data[j:]
 | ||
| 
 | ||
| 	// Replace in the current node the text, so that it is only what it is
 | ||
| 	// supposed to have.
 | ||
| 	node.Data = before
 | ||
| 
 | ||
| 	// Get the current next sibling, before which we place the replaced data,
 | ||
| 	// and after that we place the new text node.
 | ||
| 	nextSibling := node.NextSibling
 | ||
| 	for _, n := range newNodes {
 | ||
| 		node.Parent.InsertBefore(n, nextSibling)
 | ||
| 	}
 | ||
| 	if after != "" {
 | ||
| 		node.Parent.InsertBefore(&html.Node{
 | ||
| 			Type: html.TextNode,
 | ||
| 			Data: after,
 | ||
| 		}, nextSibling)
 | ||
| 	}
 | ||
| }
 | ||
| 
 | ||
| func mentionProcessor(ctx *postProcessCtx, node *html.Node) {
 | ||
| 	// We replace only the first mention; other mentions will be addressed later
 | ||
| 	found, loc := references.FindFirstMentionBytes([]byte(node.Data))
 | ||
| 	if !found {
 | ||
| 		return
 | ||
| 	}
 | ||
| 	mention := node.Data[loc.Start:loc.End]
 | ||
| 	var teams string
 | ||
| 	teams, ok := ctx.metas["teams"]
 | ||
| 	if ok && strings.Contains(teams, ","+strings.ToLower(mention[1:])+",") {
 | ||
| 		replaceContent(node, loc.Start, loc.End, createLink(util.URLJoin(setting.AppURL, "org", ctx.metas["org"], "teams", mention[1:]), mention, "mention"))
 | ||
| 	} else {
 | ||
| 		replaceContent(node, loc.Start, loc.End, createLink(util.URLJoin(setting.AppURL, mention[1:]), mention, "mention"))
 | ||
| 	}
 | ||
| }
 | ||
| 
 | ||
| func shortLinkProcessor(ctx *postProcessCtx, node *html.Node) {
 | ||
| 	shortLinkProcessorFull(ctx, node, false)
 | ||
| }
 | ||
| 
 | ||
| func shortLinkProcessorFull(ctx *postProcessCtx, node *html.Node, noLink bool) {
 | ||
| 	m := shortLinkPattern.FindStringSubmatchIndex(node.Data)
 | ||
| 	if m == nil {
 | ||
| 		return
 | ||
| 	}
 | ||
| 
 | ||
| 	content := node.Data[m[2]:m[3]]
 | ||
| 	tail := node.Data[m[4]:m[5]]
 | ||
| 	props := make(map[string]string)
 | ||
| 
 | ||
| 	// MediaWiki uses [[link|text]], while GitHub uses [[text|link]]
 | ||
| 	// It makes page handling terrible, but we prefer GitHub syntax
 | ||
| 	// And fall back to MediaWiki only when it is obvious from the look
 | ||
| 	// Of text and link contents
 | ||
| 	sl := strings.Split(content, "|")
 | ||
| 	for _, v := range sl {
 | ||
| 		if equalPos := strings.IndexByte(v, '='); equalPos == -1 {
 | ||
| 			// There is no equal in this argument; this is a mandatory arg
 | ||
| 			if props["name"] == "" {
 | ||
| 				if isLinkStr(v) {
 | ||
| 					// If we clearly see it is a link, we save it so
 | ||
| 
 | ||
| 					// But first we need to ensure, that if both mandatory args provided
 | ||
| 					// look like links, we stick to GitHub syntax
 | ||
| 					if props["link"] != "" {
 | ||
| 						props["name"] = props["link"]
 | ||
| 					}
 | ||
| 
 | ||
| 					props["link"] = strings.TrimSpace(v)
 | ||
| 				} else {
 | ||
| 					props["name"] = v
 | ||
| 				}
 | ||
| 			} else {
 | ||
| 				props["link"] = strings.TrimSpace(v)
 | ||
| 			}
 | ||
| 		} else {
 | ||
| 			// There is an equal; optional argument.
 | ||
| 
 | ||
| 			sep := strings.IndexByte(v, '=')
 | ||
| 			key, val := v[:sep], html.UnescapeString(v[sep+1:])
 | ||
| 
 | ||
| 			// When parsing HTML, x/net/html will change all quotes which are
 | ||
| 			// not used for syntax into UTF-8 quotes. So checking val[0] won't
 | ||
| 			// be enough, since that only checks a single byte.
 | ||
| 			if (strings.HasPrefix(val, "“") && strings.HasSuffix(val, "”")) ||
 | ||
| 				(strings.HasPrefix(val, "‘") && strings.HasSuffix(val, "’")) {
 | ||
| 				const lenQuote = len("‘")
 | ||
| 				val = val[lenQuote : len(val)-lenQuote]
 | ||
| 			} else if (strings.HasPrefix(val, "\"") && strings.HasSuffix(val, "\"")) ||
 | ||
| 				(strings.HasPrefix(val, "'") && strings.HasSuffix(val, "'")) {
 | ||
| 				val = val[1 : len(val)-1]
 | ||
| 			} else if strings.HasPrefix(val, "'") && strings.HasSuffix(val, "’") {
 | ||
| 				const lenQuote = len("‘")
 | ||
| 				val = val[1 : len(val)-lenQuote]
 | ||
| 			}
 | ||
| 			props[key] = val
 | ||
| 		}
 | ||
| 	}
 | ||
| 
 | ||
| 	var name, link string
 | ||
| 	if props["link"] != "" {
 | ||
| 		link = props["link"]
 | ||
| 	} else if props["name"] != "" {
 | ||
| 		link = props["name"]
 | ||
| 	}
 | ||
| 	if props["title"] != "" {
 | ||
| 		name = props["title"]
 | ||
| 	} else if props["name"] != "" {
 | ||
| 		name = props["name"]
 | ||
| 	} else {
 | ||
| 		name = link
 | ||
| 	}
 | ||
| 
 | ||
| 	name += tail
 | ||
| 	image := false
 | ||
| 	switch ext := filepath.Ext(link); ext {
 | ||
| 	// fast path: empty string, ignore
 | ||
| 	case "":
 | ||
| 		break
 | ||
| 	case ".jpg", ".jpeg", ".png", ".tif", ".tiff", ".webp", ".gif", ".bmp", ".ico", ".svg":
 | ||
| 		image = true
 | ||
| 	}
 | ||
| 
 | ||
| 	childNode := &html.Node{}
 | ||
| 	linkNode := &html.Node{
 | ||
| 		FirstChild: childNode,
 | ||
| 		LastChild:  childNode,
 | ||
| 		Type:       html.ElementNode,
 | ||
| 		Data:       "a",
 | ||
| 		DataAtom:   atom.A,
 | ||
| 	}
 | ||
| 	childNode.Parent = linkNode
 | ||
| 	absoluteLink := isLinkStr(link)
 | ||
| 	if !absoluteLink {
 | ||
| 		if image {
 | ||
| 			link = strings.Replace(link, " ", "+", -1)
 | ||
| 		} else {
 | ||
| 			link = strings.Replace(link, " ", "-", -1)
 | ||
| 		}
 | ||
| 		if !strings.Contains(link, "/") {
 | ||
| 			link = url.PathEscape(link)
 | ||
| 		}
 | ||
| 	}
 | ||
| 	urlPrefix := ctx.urlPrefix
 | ||
| 	if image {
 | ||
| 		if !absoluteLink {
 | ||
| 			if IsSameDomain(urlPrefix) {
 | ||
| 				urlPrefix = strings.Replace(urlPrefix, "/src/", "/raw/", 1)
 | ||
| 			}
 | ||
| 			if ctx.isWikiMarkdown {
 | ||
| 				link = util.URLJoin("wiki", "raw", link)
 | ||
| 			}
 | ||
| 			link = util.URLJoin(urlPrefix, link)
 | ||
| 		}
 | ||
| 		title := props["title"]
 | ||
| 		if title == "" {
 | ||
| 			title = props["alt"]
 | ||
| 		}
 | ||
| 		if title == "" {
 | ||
| 			title = path.Base(name)
 | ||
| 		}
 | ||
| 		alt := props["alt"]
 | ||
| 		if alt == "" {
 | ||
| 			alt = name
 | ||
| 		}
 | ||
| 
 | ||
| 		// make the childNode an image - if we can, we also place the alt
 | ||
| 		childNode.Type = html.ElementNode
 | ||
| 		childNode.Data = "img"
 | ||
| 		childNode.DataAtom = atom.Img
 | ||
| 		childNode.Attr = []html.Attribute{
 | ||
| 			{Key: "src", Val: link},
 | ||
| 			{Key: "title", Val: title},
 | ||
| 			{Key: "alt", Val: alt},
 | ||
| 		}
 | ||
| 		if alt == "" {
 | ||
| 			childNode.Attr = childNode.Attr[:2]
 | ||
| 		}
 | ||
| 	} else {
 | ||
| 		if !absoluteLink {
 | ||
| 			if ctx.isWikiMarkdown {
 | ||
| 				link = util.URLJoin("wiki", link)
 | ||
| 			}
 | ||
| 			link = util.URLJoin(urlPrefix, link)
 | ||
| 		}
 | ||
| 		childNode.Type = html.TextNode
 | ||
| 		childNode.Data = name
 | ||
| 	}
 | ||
| 	if noLink {
 | ||
| 		linkNode = childNode
 | ||
| 	} else {
 | ||
| 		linkNode.Attr = []html.Attribute{{Key: "href", Val: link}}
 | ||
| 	}
 | ||
| 	replaceContent(node, m[0], m[1], linkNode)
 | ||
| }
 | ||
| 
 | ||
| func fullIssuePatternProcessor(ctx *postProcessCtx, node *html.Node) {
 | ||
| 	if ctx.metas == nil {
 | ||
| 		return
 | ||
| 	}
 | ||
| 	m := getIssueFullPattern().FindStringSubmatchIndex(node.Data)
 | ||
| 	if m == nil {
 | ||
| 		return
 | ||
| 	}
 | ||
| 	link := node.Data[m[0]:m[1]]
 | ||
| 	id := "#" + node.Data[m[2]:m[3]]
 | ||
| 
 | ||
| 	// extract repo and org name from matched link like
 | ||
| 	// http://localhost:3000/gituser/myrepo/issues/1
 | ||
| 	linkParts := strings.Split(path.Clean(link), "/")
 | ||
| 	matchOrg := linkParts[len(linkParts)-4]
 | ||
| 	matchRepo := linkParts[len(linkParts)-3]
 | ||
| 
 | ||
| 	if matchOrg == ctx.metas["user"] && matchRepo == ctx.metas["repo"] {
 | ||
| 		// TODO if m[4]:m[5] is not nil, then link is to a comment,
 | ||
| 		// and we should indicate that in the text somehow
 | ||
| 		replaceContent(node, m[0], m[1], createLink(link, id, "issue"))
 | ||
| 
 | ||
| 	} else {
 | ||
| 		orgRepoID := matchOrg + "/" + matchRepo + id
 | ||
| 		replaceContent(node, m[0], m[1], createLink(link, orgRepoID, "issue"))
 | ||
| 	}
 | ||
| }
 | ||
| 
 | ||
| func issueIndexPatternProcessor(ctx *postProcessCtx, node *html.Node) {
 | ||
| 	if ctx.metas == nil {
 | ||
| 		return
 | ||
| 	}
 | ||
| 
 | ||
| 	var (
 | ||
| 		found bool
 | ||
| 		ref   *references.RenderizableReference
 | ||
| 	)
 | ||
| 
 | ||
| 	_, exttrack := ctx.metas["format"]
 | ||
| 	alphanum := ctx.metas["style"] == IssueNameStyleAlphanumeric
 | ||
| 
 | ||
| 	// Repos with external issue trackers might still need to reference local PRs
 | ||
| 	// We need to concern with the first one that shows up in the text, whichever it is
 | ||
| 	found, ref = references.FindRenderizableReferenceNumeric(node.Data, exttrack && alphanum)
 | ||
| 	if exttrack && alphanum {
 | ||
| 		if found2, ref2 := references.FindRenderizableReferenceAlphanumeric(node.Data); found2 {
 | ||
| 			if !found || ref2.RefLocation.Start < ref.RefLocation.Start {
 | ||
| 				found = true
 | ||
| 				ref = ref2
 | ||
| 			}
 | ||
| 		}
 | ||
| 	}
 | ||
| 	if !found {
 | ||
| 		return
 | ||
| 	}
 | ||
| 
 | ||
| 	var link *html.Node
 | ||
| 	reftext := node.Data[ref.RefLocation.Start:ref.RefLocation.End]
 | ||
| 	if exttrack && !ref.IsPull {
 | ||
| 		ctx.metas["index"] = ref.Issue
 | ||
| 		link = createLink(com.Expand(ctx.metas["format"], ctx.metas), reftext, "issue")
 | ||
| 	} else {
 | ||
| 		// Path determines the type of link that will be rendered. It's unknown at this point whether
 | ||
| 		// the linked item is actually a PR or an issue. Luckily it's of no real consequence because
 | ||
| 		// Gitea will redirect on click as appropriate.
 | ||
| 		path := "issues"
 | ||
| 		if ref.IsPull {
 | ||
| 			path = "pulls"
 | ||
| 		}
 | ||
| 		if ref.Owner == "" {
 | ||
| 			link = createLink(util.URLJoin(setting.AppURL, ctx.metas["user"], ctx.metas["repo"], path, ref.Issue), reftext, "issue")
 | ||
| 		} else {
 | ||
| 			link = createLink(util.URLJoin(setting.AppURL, ref.Owner, ref.Name, path, ref.Issue), reftext, "issue")
 | ||
| 		}
 | ||
| 	}
 | ||
| 
 | ||
| 	if ref.Action == references.XRefActionNone {
 | ||
| 		replaceContent(node, ref.RefLocation.Start, ref.RefLocation.End, link)
 | ||
| 		return
 | ||
| 	}
 | ||
| 
 | ||
| 	// Decorate action keywords if actionable
 | ||
| 	var keyword *html.Node
 | ||
| 	if references.IsXrefActionable(ref, exttrack, alphanum) {
 | ||
| 		keyword = createKeyword(node.Data[ref.ActionLocation.Start:ref.ActionLocation.End])
 | ||
| 	} else {
 | ||
| 		keyword = &html.Node{
 | ||
| 			Type: html.TextNode,
 | ||
| 			Data: node.Data[ref.ActionLocation.Start:ref.ActionLocation.End],
 | ||
| 		}
 | ||
| 	}
 | ||
| 	spaces := &html.Node{
 | ||
| 		Type: html.TextNode,
 | ||
| 		Data: node.Data[ref.ActionLocation.End:ref.RefLocation.Start],
 | ||
| 	}
 | ||
| 	replaceContentList(node, ref.ActionLocation.Start, ref.RefLocation.End, []*html.Node{keyword, spaces, link})
 | ||
| }
 | ||
| 
 | ||
| // fullSha1PatternProcessor renders SHA containing URLs
 | ||
| func fullSha1PatternProcessor(ctx *postProcessCtx, node *html.Node) {
 | ||
| 	if ctx.metas == nil {
 | ||
| 		return
 | ||
| 	}
 | ||
| 	m := anySHA1Pattern.FindStringSubmatchIndex(node.Data)
 | ||
| 	if m == nil {
 | ||
| 		return
 | ||
| 	}
 | ||
| 
 | ||
| 	urlFull := node.Data[m[0]:m[1]]
 | ||
| 	text := base.ShortSha(node.Data[m[2]:m[3]])
 | ||
| 
 | ||
| 	// 3rd capture group matches a optional path
 | ||
| 	subpath := ""
 | ||
| 	if m[5] > 0 {
 | ||
| 		subpath = node.Data[m[4]:m[5]]
 | ||
| 	}
 | ||
| 
 | ||
| 	// 4th capture group matches a optional url hash
 | ||
| 	hash := ""
 | ||
| 	if m[7] > 0 {
 | ||
| 		hash = node.Data[m[6]:m[7]][1:]
 | ||
| 	}
 | ||
| 
 | ||
| 	start := m[0]
 | ||
| 	end := m[1]
 | ||
| 
 | ||
| 	// If url ends in '.', it's very likely that it is not part of the
 | ||
| 	// actual url but used to finish a sentence.
 | ||
| 	if strings.HasSuffix(urlFull, ".") {
 | ||
| 		end--
 | ||
| 		urlFull = urlFull[:len(urlFull)-1]
 | ||
| 		if hash != "" {
 | ||
| 			hash = hash[:len(hash)-1]
 | ||
| 		} else if subpath != "" {
 | ||
| 			subpath = subpath[:len(subpath)-1]
 | ||
| 		}
 | ||
| 	}
 | ||
| 
 | ||
| 	if subpath != "" {
 | ||
| 		text += subpath
 | ||
| 	}
 | ||
| 
 | ||
| 	if hash != "" {
 | ||
| 		text += " (" + hash + ")"
 | ||
| 	}
 | ||
| 
 | ||
| 	replaceContent(node, start, end, createCodeLink(urlFull, text, "commit"))
 | ||
| }
 | ||
| 
 | ||
| // sha1CurrentPatternProcessor renders SHA1 strings to corresponding links that
 | ||
| // are assumed to be in the same repository.
 | ||
| func sha1CurrentPatternProcessor(ctx *postProcessCtx, node *html.Node) {
 | ||
| 	if ctx.metas == nil || ctx.metas["user"] == "" || ctx.metas["repo"] == "" || ctx.metas["repoPath"] == "" {
 | ||
| 		return
 | ||
| 	}
 | ||
| 	m := sha1CurrentPattern.FindStringSubmatchIndex(node.Data)
 | ||
| 	if m == nil {
 | ||
| 		return
 | ||
| 	}
 | ||
| 	hash := node.Data[m[2]:m[3]]
 | ||
| 	// The regex does not lie, it matches the hash pattern.
 | ||
| 	// However, a regex cannot know if a hash actually exists or not.
 | ||
| 	// We could assume that a SHA1 hash should probably contain alphas AND numerics
 | ||
| 	// but that is not always the case.
 | ||
| 	// Although unlikely, deadbeef and 1234567 are valid short forms of SHA1 hash
 | ||
| 	// as used by git and github for linking and thus we have to do similar.
 | ||
| 	// Because of this, we check to make sure that a matched hash is actually
 | ||
| 	// a commit in the repository before making it a link.
 | ||
| 	if _, err := git.NewCommand("rev-parse", "--verify", hash).RunInDirBytes(ctx.metas["repoPath"]); err != nil {
 | ||
| 		if !strings.Contains(err.Error(), "fatal: Needed a single revision") {
 | ||
| 			log.Debug("sha1CurrentPatternProcessor git rev-parse: %v", err)
 | ||
| 		}
 | ||
| 		return
 | ||
| 	}
 | ||
| 
 | ||
| 	replaceContent(node, m[2], m[3],
 | ||
| 		createCodeLink(util.URLJoin(setting.AppURL, ctx.metas["user"], ctx.metas["repo"], "commit", hash), base.ShortSha(hash), "commit"))
 | ||
| }
 | ||
| 
 | ||
| // emailAddressProcessor replaces raw email addresses with a mailto: link.
 | ||
| func emailAddressProcessor(ctx *postProcessCtx, node *html.Node) {
 | ||
| 	m := emailRegex.FindStringSubmatchIndex(node.Data)
 | ||
| 	if m == nil {
 | ||
| 		return
 | ||
| 	}
 | ||
| 	mail := node.Data[m[2]:m[3]]
 | ||
| 	replaceContent(node, m[2], m[3], createLink("mailto:"+mail, mail, "mailto"))
 | ||
| }
 | ||
| 
 | ||
| // linkProcessor creates links for any HTTP or HTTPS URL not captured by
 | ||
| // markdown.
 | ||
| func linkProcessor(ctx *postProcessCtx, node *html.Node) {
 | ||
| 	m := common.LinkRegex.FindStringIndex(node.Data)
 | ||
| 	if m == nil {
 | ||
| 		return
 | ||
| 	}
 | ||
| 	uri := node.Data[m[0]:m[1]]
 | ||
| 	replaceContent(node, m[0], m[1], createLink(uri, uri, "link"))
 | ||
| }
 | ||
| 
 | ||
| func genDefaultLinkProcessor(defaultLink string) processor {
 | ||
| 	return func(ctx *postProcessCtx, node *html.Node) {
 | ||
| 		ch := &html.Node{
 | ||
| 			Parent: node,
 | ||
| 			Type:   html.TextNode,
 | ||
| 			Data:   node.Data,
 | ||
| 		}
 | ||
| 
 | ||
| 		node.Type = html.ElementNode
 | ||
| 		node.Data = "a"
 | ||
| 		node.DataAtom = atom.A
 | ||
| 		node.Attr = []html.Attribute{
 | ||
| 			{Key: "href", Val: defaultLink},
 | ||
| 			{Key: "class", Val: "default-link"},
 | ||
| 		}
 | ||
| 		node.FirstChild, node.LastChild = ch, ch
 | ||
| 	}
 | ||
| }
 | ||
| 
 | ||
| // descriptionLinkProcessor creates links for DescriptionHTML
 | ||
| func descriptionLinkProcessor(ctx *postProcessCtx, node *html.Node) {
 | ||
| 	m := common.LinkRegex.FindStringIndex(node.Data)
 | ||
| 	if m == nil {
 | ||
| 		return
 | ||
| 	}
 | ||
| 	uri := node.Data[m[0]:m[1]]
 | ||
| 	replaceContent(node, m[0], m[1], createDescriptionLink(uri, uri))
 | ||
| }
 | ||
| 
 | ||
| func createDescriptionLink(href, content string) *html.Node {
 | ||
| 	textNode := &html.Node{
 | ||
| 		Type: html.TextNode,
 | ||
| 		Data: content,
 | ||
| 	}
 | ||
| 	linkNode := &html.Node{
 | ||
| 		FirstChild: textNode,
 | ||
| 		LastChild:  textNode,
 | ||
| 		Type:       html.ElementNode,
 | ||
| 		Data:       "a",
 | ||
| 		DataAtom:   atom.A,
 | ||
| 		Attr: []html.Attribute{
 | ||
| 			{Key: "href", Val: href},
 | ||
| 			{Key: "target", Val: "_blank"},
 | ||
| 			{Key: "rel", Val: "noopener noreferrer"},
 | ||
| 		},
 | ||
| 	}
 | ||
| 	textNode.Parent = linkNode
 | ||
| 	return linkNode
 | ||
| }
 |