2017-09-16 20:17:57 +03:00
// Copyright 2017 The Gitea Authors. All rights reserved.
// Use of this source code is governed by a MIT-style
// license that can be found in the LICENSE file.
package markup
import (
"bytes"
2021-04-20 01:25:08 +03:00
"io"
2017-09-16 20:17:57 +03:00
"net/url"
"path"
"path/filepath"
"regexp"
"strings"
2021-07-15 23:33:56 +03:00
"sync"
2017-09-16 20:17:57 +03:00
"code.gitea.io/gitea/modules/base"
2020-04-28 21:05:39 +03:00
"code.gitea.io/gitea/modules/emoji"
2019-08-14 11:04:55 +03:00
"code.gitea.io/gitea/modules/git"
"code.gitea.io/gitea/modules/log"
2019-12-31 04:53:28 +03:00
"code.gitea.io/gitea/modules/markup/common"
2019-10-14 01:29:10 +03:00
"code.gitea.io/gitea/modules/references"
2022-06-10 08:39:53 +03:00
"code.gitea.io/gitea/modules/regexplru"
2017-09-16 20:17:57 +03:00
"code.gitea.io/gitea/modules/setting"
2022-04-01 11:47:50 +03:00
"code.gitea.io/gitea/modules/templates/vars"
2018-02-20 15:50:42 +03:00
"code.gitea.io/gitea/modules/util"
2017-09-16 20:17:57 +03:00
"golang.org/x/net/html"
2018-02-27 10:09:18 +03:00
"golang.org/x/net/html/atom"
2019-03-27 14:15:23 +03:00
"mvdan.cc/xurls/v2"
2017-09-16 20:17:57 +03:00
)
// Issue name styles. The value is read from the "style" entry of the render
// metas and selects how issue references are looked up in text.
const (
	// IssueNameStyleNumeric selects numeric references; an empty style is
	// treated the same way.
	IssueNameStyleNumeric = "numeric"
	// IssueNameStyleAlphanumeric selects alphanumeric references.
	IssueNameStyleAlphanumeric = "alphanumeric"
	// IssueNameStyleRegexp selects references matched by the pattern stored
	// in the "regexp" entry of the render metas.
	IssueNameStyleRegexp = "regexp"
)
var (
	// NOTE: None of the regular expressions below perform any extra validation.
	// Thus a link is produced even if the linked entity does not exist.
	// While fast, this is also incorrect and leads to false positives.
	// TODO: fix invalid linking issue

	// valid chars in encoded path and parameter: [-+~_%.a-zA-Z0-9/]

	// sha1CurrentPattern matches string that represents a commit SHA, e.g. d8a994ef243349f321568f9e36d5c3f444b99cae
	// Although SHA1 hashes are 40 chars long, the regex matches the hash from 7 to 40 chars in length
	// so that abbreviated hash links can be used as well. This matches git and GitHub usability.
	sha1CurrentPattern = regexp.MustCompile(`(?:\s|^|\(|\[)([0-9a-f]{7,40})(?:\s|$|\)|\]|[.,](\s|$))`)

	// shortLinkPattern matches short but difficult to parse [[name|link|arg=test]] syntax
	shortLinkPattern = regexp.MustCompile(`\[\[(.*?)\]\](\w*)`)

	// anySHA1Pattern splits url containing SHA into parts
	anySHA1Pattern = regexp.MustCompile(`https?://(?:\S+/){4,5}([0-9a-f]{40})(/[-+~_%.a-zA-Z0-9/]+)?(#[-+~_%.a-zA-Z0-9]+)?`)

	// comparePattern matches "http://domain/org/repo/compare/COMMIT1...COMMIT2#hash"
	comparePattern = regexp.MustCompile(`https?://(?:\S+/){4,5}([0-9a-f]{7,40})(\.\.\.?)([0-9a-f]{7,40})?(#[-+~_%.a-zA-Z0-9]+)?`)

	// validLinksPattern matches the "scheme://" prefix of an absolute link
	validLinksPattern = regexp.MustCompile(`^[a-z][\w-]+://`)

	// While this email regex is definitely not perfect and I'm sure you can come up
	// with edge cases, it is still accepted by the CommonMark specification, as
	// well as the HTML5 spec:
	//   http://spec.commonmark.org/0.28/#email-address
	//   https://html.spec.whatwg.org/multipage/input.html#e-mail-state-(type%3Demail)
	emailRegex = regexp.MustCompile("(?:\\s|^|\\(|\\[)([a-zA-Z0-9.!#$%&'*+\\/=?^_`{|}~-]+@[a-zA-Z0-9](?:[a-zA-Z0-9-]{0,61}[a-zA-Z0-9])?(?:\\.[a-zA-Z0-9]{2,}(?:[a-zA-Z0-9-]{0,61}[a-zA-Z0-9])?)+)(?:\\s|$|\\)|\\]|\\.(\\s|$))")

	// blackfriday extensions create IDs like fn:user-content-footnote
	blackfridayExtRegex = regexp.MustCompile(`[^:]*:user-content-`)

	// EmojiShortCodeRegex find emoji by alias like :smile:
	EmojiShortCodeRegex = regexp.MustCompile(`:[-+\w]+:`)
)
2019-10-14 01:29:10 +03:00
// keywordClass is the CSS class put on highlighted action keywords
// (e.g. "closes: #1").
const (
	keywordClass = "issue-keyword"
)
2017-09-16 20:17:57 +03:00
// IsLink reports whether link fits valid format.
func IsLink ( link [ ] byte ) bool {
return isLink ( link )
}
// isLink is the package-internal, byte-slice check for a valid link: it
// reports whether link matches validLinksPattern.
func isLink(link []byte) bool {
	matched := validLinksPattern.Match(link)
	return matched
}
2018-02-27 10:09:18 +03:00
// isLinkStr is the string counterpart of isLink: it reports whether link
// matches validLinksPattern.
func isLinkStr(link string) bool {
	matched := validLinksPattern.MatchString(link)
	return matched
}
2021-07-15 23:33:56 +03:00
// regexp for full links to issues/pulls
var issueFullPattern * regexp . Regexp
// Once for to prevent races
var issueFullPatternOnce sync . Once
2017-09-16 20:17:57 +03:00
func getIssueFullPattern ( ) * regexp . Regexp {
2021-07-15 23:33:56 +03:00
issueFullPatternOnce . Do ( func ( ) {
2021-02-20 00:36:43 +03:00
issueFullPattern = regexp . MustCompile ( regexp . QuoteMeta ( setting . AppURL ) +
2022-02-26 02:26:43 +03:00
` [\w_.-]+/[\w_.-]+/(?:issues|pulls)/((?:\w { 1,10}-)?[1-9][0-9]*)([\?|#](\S+)?)?\b ` )
2021-07-15 23:33:56 +03:00
} )
2017-09-16 20:17:57 +03:00
return issueFullPattern
}
2019-10-15 04:31:09 +03:00
// CustomLinkURLSchemes allows for additional schemes to be detected when parsing links within text
func CustomLinkURLSchemes ( schemes [ ] string ) {
schemes = append ( schemes , "http" , "https" )
withAuth := make ( [ ] string , 0 , len ( schemes ) )
validScheme := regexp . MustCompile ( ` ^[a-z]+$ ` )
for _ , s := range schemes {
if ! validScheme . MatchString ( s ) {
continue
}
without := false
for _ , sna := range xurls . SchemesNoAuthority {
if s == sna {
without = true
break
}
}
if without {
s += ":"
} else {
s += "://"
}
withAuth = append ( withAuth , s )
}
2019-12-31 04:53:28 +03:00
common . LinkRegex , _ = xurls . StrictMatchingScheme ( strings . Join ( withAuth , "|" ) )
2019-10-15 04:31:09 +03:00
}
2017-09-16 20:17:57 +03:00
// IsSameDomain checks if given url string has the same hostname as current Gitea instance.
// Strings starting with "/" are always considered to be on the same domain.
// If either s or setting.AppURL cannot be parsed the result is false.
func IsSameDomain(s string) bool {
	if strings.HasPrefix(s, "/") {
		return true
	}

	appURL, err := url.Parse(setting.AppURL)
	if err != nil {
		return false
	}
	target, err := url.Parse(s)
	if err != nil {
		return false
	}
	return target.Host == appURL.Host
}
2018-02-27 10:09:18 +03:00
// postProcessError is the error returned when post-processing fails. It
// carries a short description of the failing step next to the causing error.
type postProcessError struct {
	context string
	err     error
}

// Error implements the error interface.
func (p *postProcessError) Error() string {
	return "PostProcess: " + p.context + ", " + p.err.Error()
}

// Unwrap returns the causing error so that errors.Is and errors.As can look
// through a postProcessError.
func (p *postProcessError) Unwrap() error {
	return p.err
}
2021-04-20 01:25:08 +03:00
// processor is one step of the post-processing pipeline. It receives the
// render context and a node of the parsed HTML tree; in this file processors
// are invoked on text nodes by textNode.
type processor func ( ctx * RenderContext , node * html . Node )
2018-02-27 10:09:18 +03:00
var defaultProcessors = [ ] processor {
fullIssuePatternProcessor ,
2021-12-11 20:21:36 +03:00
comparePatternProcessor ,
2019-03-27 18:37:54 +03:00
fullSha1PatternProcessor ,
shortLinkProcessor ,
linkProcessor ,
mentionProcessor ,
2018-02-27 10:09:18 +03:00
issueIndexPatternProcessor ,
sha1CurrentPatternProcessor ,
emailAddressProcessor ,
2020-04-28 21:05:39 +03:00
emojiProcessor ,
emojiShortCodeProcessor ,
2018-02-27 10:09:18 +03:00
}
// PostProcess does the final required transformations to the passed raw HTML
// data, and ensures its validity. Transformations include: replacing links and
// emails with HTML links, parsing shortlinks in the format of [[Link]], like
// MediaWiki, linking issues in the format #ID, and mentions in the format
// @user, and others.
func PostProcess (
2021-04-20 01:25:08 +03:00
ctx * RenderContext ,
input io . Reader ,
output io . Writer ,
) error {
return postProcess ( ctx , defaultProcessors , input , output )
2018-02-27 10:09:18 +03:00
}
var commitMessageProcessors = [ ] processor {
fullIssuePatternProcessor ,
2021-12-11 20:21:36 +03:00
comparePatternProcessor ,
2019-03-27 18:37:54 +03:00
fullSha1PatternProcessor ,
linkProcessor ,
mentionProcessor ,
2018-02-27 10:09:18 +03:00
issueIndexPatternProcessor ,
sha1CurrentPatternProcessor ,
emailAddressProcessor ,
2020-04-28 21:05:39 +03:00
emojiProcessor ,
emojiShortCodeProcessor ,
2018-02-27 10:09:18 +03:00
}
// RenderCommitMessage will use the same logic as PostProcess, but will disable
// the shortLinkProcessor and will add a defaultLinkProcessor if defaultLink is
// set, which changes every text node into a link to the passed default link.
func RenderCommitMessage (
2021-04-20 01:25:08 +03:00
ctx * RenderContext ,
content string ,
) ( string , error ) {
2022-01-20 20:46:10 +03:00
procs := commitMessageProcessors
2021-04-20 01:25:08 +03:00
if ctx . DefaultLink != "" {
2018-02-27 10:09:18 +03:00
// we don't have to fear data races, because being
// commitMessageProcessors of fixed len and cap, every time we append
// something to it the slice is realloc+copied, so append always
// generates the slice ex-novo.
2021-04-20 01:25:08 +03:00
procs = append ( procs , genDefaultLinkProcessor ( ctx . DefaultLink ) )
2018-02-27 10:09:18 +03:00
}
2021-04-20 01:25:08 +03:00
return renderProcessString ( ctx , procs , content )
2018-02-27 10:09:18 +03:00
}
2019-09-10 12:03:30 +03:00
var commitMessageSubjectProcessors = [ ] processor {
fullIssuePatternProcessor ,
2021-12-11 20:21:36 +03:00
comparePatternProcessor ,
2019-09-10 12:03:30 +03:00
fullSha1PatternProcessor ,
linkProcessor ,
mentionProcessor ,
issueIndexPatternProcessor ,
sha1CurrentPatternProcessor ,
2020-04-28 21:05:39 +03:00
emojiShortCodeProcessor ,
emojiProcessor ,
}
var emojiProcessors = [ ] processor {
emojiShortCodeProcessor ,
emojiProcessor ,
2019-09-10 12:03:30 +03:00
}
// RenderCommitMessageSubject will use the same logic as PostProcess and
// RenderCommitMessage, but will disable the shortLinkProcessor and
// emailAddressProcessor, will add a defaultLinkProcessor if defaultLink is set,
// which changes every text node into a link to the passed default link.
func RenderCommitMessageSubject (
2021-04-20 01:25:08 +03:00
ctx * RenderContext ,
content string ,
) ( string , error ) {
2022-01-20 20:46:10 +03:00
procs := commitMessageSubjectProcessors
2021-04-20 01:25:08 +03:00
if ctx . DefaultLink != "" {
2019-09-10 12:03:30 +03:00
// we don't have to fear data races, because being
// commitMessageSubjectProcessors of fixed len and cap, every time we
// append something to it the slice is realloc+copied, so append always
// generates the slice ex-novo.
2021-04-20 01:25:08 +03:00
procs = append ( procs , genDefaultLinkProcessor ( ctx . DefaultLink ) )
2019-09-10 12:03:30 +03:00
}
2021-04-20 01:25:08 +03:00
return renderProcessString ( ctx , procs , content )
2019-09-10 12:03:30 +03:00
}
2020-12-03 13:50:47 +03:00
// RenderIssueTitle to process title on individual issue/pull page
func RenderIssueTitle (
2021-04-20 01:25:08 +03:00
ctx * RenderContext ,
title string ,
) ( string , error ) {
return renderProcessString ( ctx , [ ] processor {
issueIndexPatternProcessor ,
sha1CurrentPatternProcessor ,
emojiShortCodeProcessor ,
emojiProcessor ,
} , title )
}
func renderProcessString ( ctx * RenderContext , procs [ ] processor , content string ) ( string , error ) {
var buf strings . Builder
if err := postProcess ( ctx , procs , strings . NewReader ( content ) , & buf ) ; err != nil {
return "" , err
2020-12-03 13:50:47 +03:00
}
2021-04-20 01:25:08 +03:00
return buf . String ( ) , nil
2020-12-03 13:50:47 +03:00
}
2019-03-12 05:23:34 +03:00
// RenderDescriptionHTML will use similar logic as PostProcess, but will
// use a single special linkProcessor.
func RenderDescriptionHTML (
2021-04-20 01:25:08 +03:00
ctx * RenderContext ,
content string ,
) ( string , error ) {
return renderProcessString ( ctx , [ ] processor {
descriptionLinkProcessor ,
emojiShortCodeProcessor ,
emojiProcessor ,
} , content )
2019-03-12 05:23:34 +03:00
}
2020-04-28 21:05:39 +03:00
// RenderEmoji for when we want to just process emoji and shortcodes
2021-07-08 14:38:13 +03:00
// in various places it isn't already run through the normal markdown processor
2020-04-28 21:05:39 +03:00
func RenderEmoji (
2021-04-20 01:25:08 +03:00
content string ,
) ( string , error ) {
return renderProcessString ( & RenderContext { } , emojiProcessors , content )
2020-04-28 21:05:39 +03:00
}
2022-01-20 20:46:10 +03:00
var (
tagCleaner = regexp . MustCompile ( ` <((?:/?\w+/\w+)|(?:/[\w ]+/)|(/?[hH][tT][mM][lL]\b)|(/?[hH][eE][aA][dD]\b)) ` )
nulCleaner = strings . NewReplacer ( "\000" , "" )
)
2021-03-16 02:20:05 +03:00
2021-04-20 01:25:08 +03:00
func postProcess ( ctx * RenderContext , procs [ ] processor , input io . Reader , output io . Writer ) error {
2021-06-21 01:39:12 +03:00
defer ctx . Cancel ( )
2021-04-20 01:25:08 +03:00
// FIXME: don't read all content to memory
2021-09-22 08:38:34 +03:00
rawHTML , err := io . ReadAll ( input )
2021-04-20 01:25:08 +03:00
if err != nil {
return err
2018-02-27 10:09:18 +03:00
}
2021-03-16 02:20:05 +03:00
res := bytes . NewBuffer ( make ( [ ] byte , 0 , len ( rawHTML ) + 50 ) )
2021-02-18 04:32:14 +03:00
// prepend "<html><body>"
2021-03-16 02:20:05 +03:00
_ , _ = res . WriteString ( "<html><body>" )
2021-02-18 04:32:14 +03:00
// Strip out nuls - they're always invalid
2021-03-22 04:45:01 +03:00
_ , _ = res . Write ( tagCleaner . ReplaceAll ( [ ] byte ( nulCleaner . Replace ( string ( rawHTML ) ) ) , [ ] byte ( "<$1" ) ) )
2021-02-18 04:32:14 +03:00
// close the tags
2021-03-16 02:20:05 +03:00
_ , _ = res . WriteString ( "</body></html>" )
2018-02-27 10:09:18 +03:00
// parse the HTML
2021-06-22 01:12:22 +03:00
node , err := html . Parse ( res )
2018-02-27 10:09:18 +03:00
if err != nil {
2021-04-20 01:25:08 +03:00
return & postProcessError { "invalid HTML" , err }
2018-02-27 10:09:18 +03:00
}
2021-06-22 01:12:22 +03:00
if node . Type == html . DocumentNode {
node = node . FirstChild
2018-02-27 10:09:18 +03:00
}
2021-12-16 02:49:12 +03:00
visitNode ( ctx , procs , procs , node )
2021-01-20 18:10:50 +03:00
2021-06-22 01:12:22 +03:00
newNodes := make ( [ ] * html . Node , 0 , 5 )
if node . Data == "html" {
node = node . FirstChild
for node != nil && node . Data != "body" {
node = node . NextSibling
2021-01-20 18:10:50 +03:00
}
2021-06-22 01:12:22 +03:00
}
if node != nil {
2021-01-20 18:10:50 +03:00
if node . Data == "body" {
child := node . FirstChild
for child != nil {
newNodes = append ( newNodes , child )
child = child . NextSibling
}
} else {
newNodes = append ( newNodes , node )
}
}
2018-02-27 10:09:18 +03:00
// Render everything to buf.
2021-04-20 01:25:08 +03:00
for _ , node := range newNodes {
2022-03-17 21:04:36 +03:00
if err := html . Render ( output , node ) ; err != nil {
2021-04-20 01:25:08 +03:00
return & postProcessError { "error rendering processed HTML" , err }
2017-09-16 20:17:57 +03:00
}
2018-02-27 10:09:18 +03:00
}
2021-04-20 01:25:08 +03:00
return nil
2018-02-27 10:09:18 +03:00
}
2021-12-16 02:49:12 +03:00
func visitNode ( ctx * RenderContext , procs , textProcs [ ] processor , node * html . Node ) {
2019-12-24 01:38:50 +03:00
// Add user-content- to IDs if they don't already have them
for idx , attr := range node . Attr {
if attr . Key == "id" && ! ( strings . HasPrefix ( attr . Val , "user-content-" ) || blackfridayExtRegex . MatchString ( attr . Val ) ) {
node . Attr [ idx ] . Val = "user-content-" + attr . Val
}
2020-04-28 21:05:39 +03:00
if attr . Key == "class" && attr . Val == "emoji" {
2021-12-16 02:49:12 +03:00
textProcs = nil
2020-04-28 21:05:39 +03:00
}
2019-12-24 01:38:50 +03:00
}
2020-04-28 21:05:39 +03:00
2021-12-16 02:49:12 +03:00
// We ignore code and pre.
2018-02-27 10:09:18 +03:00
switch node . Type {
case html . TextNode :
2021-12-16 02:49:12 +03:00
textNode ( ctx , textProcs , node )
2018-02-27 10:09:18 +03:00
case html . ElementNode :
2020-02-28 07:16:05 +03:00
if node . Data == "img" {
2021-07-04 12:26:04 +03:00
for i , attr := range node . Attr {
2020-02-28 07:16:05 +03:00
if attr . Key != "src" {
continue
}
2021-06-07 19:55:26 +03:00
if len ( attr . Val ) > 0 && ! isLinkStr ( attr . Val ) && ! strings . HasPrefix ( attr . Val , "data:image/" ) {
2021-04-20 01:25:08 +03:00
prefix := ctx . URLPrefix
if ctx . IsWiki {
2020-02-28 07:16:05 +03:00
prefix = util . URLJoin ( prefix , "wiki" , "raw" )
}
prefix = strings . Replace ( prefix , "/src/" , "/media/" , 1 )
2021-06-07 19:55:26 +03:00
attr . Val = util . URLJoin ( prefix , attr . Val )
2020-02-28 07:16:05 +03:00
}
2022-03-29 11:27:37 +03:00
attr . Val = camoHandleLink ( attr . Val )
2021-07-04 12:26:04 +03:00
node . Attr [ i ] = attr
2020-02-28 07:16:05 +03:00
}
} else if node . Data == "a" {
2021-12-16 02:49:12 +03:00
// Restrict text in links to emojis
textProcs = emojiProcessors
2020-02-28 07:16:05 +03:00
} else if node . Data == "code" || node . Data == "pre" {
2018-02-27 10:09:18 +03:00
return
2020-04-24 16:22:36 +03:00
} else if node . Data == "i" {
for _ , attr := range node . Attr {
if attr . Key != "class" {
continue
}
classes := strings . Split ( attr . Val , " " )
for i , class := range classes {
if class == "icon" {
classes [ 0 ] , classes [ i ] = classes [ i ] , classes [ 0 ]
attr . Val = strings . Join ( classes , " " )
// Remove all children of icons
child := node . FirstChild
for child != nil {
node . RemoveChild ( child )
child = node . FirstChild
}
break
}
}
}
2017-09-16 20:17:57 +03:00
}
2018-02-27 10:09:18 +03:00
for n := node . FirstChild ; n != nil ; n = n . NextSibling {
2021-12-16 02:49:12 +03:00
visitNode ( ctx , procs , textProcs , n )
2017-09-16 20:17:57 +03:00
}
2018-02-27 10:09:18 +03:00
}
// ignore everything else
}
// textNode runs the passed node through various processors, in order to handle
// all kinds of special links handled by the post-processing.
2021-04-20 01:25:08 +03:00
func textNode ( ctx * RenderContext , procs [ ] processor , node * html . Node ) {
for _ , processor := range procs {
2018-02-27 10:09:18 +03:00
processor ( ctx , node )
}
2017-09-16 20:17:57 +03:00
}
2019-10-14 01:29:10 +03:00
// createKeyword renders a highlighted version of an action keyword: a <span>
// carrying the keywordClass class with content as its only text child.
func createKeyword(content string) *html.Node {
	keyword := &html.Node{
		Type: html.ElementNode,
		Data: atom.Span.String(),
		Attr: []html.Attribute{{Key: "class", Val: keywordClass}},
	}
	keyword.AppendChild(&html.Node{
		Type: html.TextNode,
		Data: content,
	})
	return keyword
}
2020-04-28 21:05:39 +03:00
// createEmoji returns a <span> with content as its only text child. A
// non-empty class becomes the class attribute and a non-empty name the
// aria-label attribute of the span.
func createEmoji(content, class, name string) *html.Node {
	attrs := make([]html.Attribute, 0, 2)
	if class != "" {
		attrs = append(attrs, html.Attribute{Key: "class", Val: class})
	}
	if name != "" {
		attrs = append(attrs, html.Attribute{Key: "aria-label", Val: name})
	}

	emojiSpan := &html.Node{
		Type: html.ElementNode,
		Data: atom.Span.String(),
		Attr: attrs,
	}
	emojiSpan.AppendChild(&html.Node{
		Type: html.TextNode,
		Data: content,
	})
	return emojiSpan
}
2021-06-29 17:28:38 +03:00
func createCustomEmoji ( alias string ) * html . Node {
2020-04-28 21:05:39 +03:00
span := & html . Node {
Type : html . ElementNode ,
Data : atom . Span . String ( ) ,
Attr : [ ] html . Attribute { } ,
}
2021-06-29 17:28:38 +03:00
span . Attr = append ( span . Attr , html . Attribute { Key : "class" , Val : "emoji" } )
span . Attr = append ( span . Attr , html . Attribute { Key : "aria-label" , Val : alias } )
2020-04-28 21:05:39 +03:00
img := & html . Node {
Type : html . ElementNode ,
DataAtom : atom . Img ,
Data : "img" ,
Attr : [ ] html . Attribute { } ,
}
2021-06-29 17:28:38 +03:00
img . Attr = append ( img . Attr , html . Attribute { Key : "alt" , Val : ":" + alias + ":" } )
img . Attr = append ( img . Attr , html . Attribute { Key : "src" , Val : setting . StaticURLPrefix + "/assets/img/emoji/" + alias + ".png" } )
2020-04-28 21:05:39 +03:00
span . AppendChild ( img )
return span
}
2019-09-10 12:03:30 +03:00
func createLink ( href , content , class string ) * html . Node {
2019-04-09 06:18:48 +03:00
a := & html . Node {
Type : html . ElementNode ,
Data : atom . A . String ( ) ,
Attr : [ ] html . Attribute { { Key : "href" , Val : href } } ,
}
2019-09-10 12:03:30 +03:00
if class != "" {
a . Attr = append ( a . Attr , html . Attribute { Key : "class" , Val : class } )
}
2019-04-09 06:18:48 +03:00
text := & html . Node {
2018-02-27 10:09:18 +03:00
Type : html . TextNode ,
Data : content ,
}
2019-04-09 06:18:48 +03:00
a . AppendChild ( text )
return a
}
2019-09-10 12:03:30 +03:00
func createCodeLink ( href , content , class string ) * html . Node {
2019-04-09 06:18:48 +03:00
a := & html . Node {
Type : html . ElementNode ,
Data : atom . A . String ( ) ,
Attr : [ ] html . Attribute { { Key : "href" , Val : href } } ,
}
2019-09-10 12:03:30 +03:00
if class != "" {
a . Attr = append ( a . Attr , html . Attribute { Key : "class" , Val : class } )
}
2019-04-09 06:18:48 +03:00
text := & html . Node {
Type : html . TextNode ,
Data : content ,
2017-09-16 20:17:57 +03:00
}
2019-04-09 06:18:48 +03:00
code := & html . Node {
Type : html . ElementNode ,
Data : atom . Code . String ( ) ,
2019-06-19 01:31:31 +03:00
Attr : [ ] html . Attribute { { Key : "class" , Val : "nohighlight" } } ,
2019-04-09 06:18:48 +03:00
}
code . AppendChild ( text )
a . AppendChild ( code )
return a
2017-09-16 20:17:57 +03:00
}
2019-10-14 01:29:10 +03:00
// replaceContent takes text node, and in its content it replaces a section of
// it with the specified newNode.
2018-02-27 10:09:18 +03:00
func replaceContent ( node * html . Node , i , j int , newNode * html . Node ) {
2019-10-14 01:29:10 +03:00
replaceContentList ( node , i , j , [ ] * html . Node { newNode } )
}
// replaceContentList takes text node, and in its content it replaces a section of
// it with the specified newNodes. An example to visualize how this can work can
// be found here: https://play.golang.org/p/5zP8NnHZ03s
func replaceContentList ( node * html . Node , i , j int , newNodes [ ] * html . Node ) {
2018-02-27 10:09:18 +03:00
// get the data before and after the match
before := node . Data [ : i ]
after := node . Data [ j : ]
// Replace in the current node the text, so that it is only what it is
// supposed to have.
node . Data = before
// Get the current next sibling, before which we place the replaced data,
// and after that we place the new text node.
nextSibling := node . NextSibling
2019-10-14 01:29:10 +03:00
for _ , n := range newNodes {
node . Parent . InsertBefore ( n , nextSibling )
}
2018-02-27 10:09:18 +03:00
if after != "" {
node . Parent . InsertBefore ( & html . Node {
Type : html . TextNode ,
Data : after ,
} , nextSibling )
2017-09-16 20:17:57 +03:00
}
}
2021-04-20 01:25:08 +03:00
func mentionProcessor ( ctx * RenderContext , node * html . Node ) {
2021-06-17 13:35:05 +03:00
start := 0
next := node . NextSibling
for node != nil && node != next && start < len ( node . Data ) {
// We replace only the first mention; other mentions will be addressed later
found , loc := references . FindFirstMentionBytes ( [ ] byte ( node . Data [ start : ] ) )
if ! found {
return
2020-12-21 18:39:28 +03:00
}
2021-06-17 13:35:05 +03:00
loc . Start += start
loc . End += start
mention := node . Data [ loc . Start : loc . End ]
var teams string
teams , ok := ctx . Metas [ "teams" ]
// FIXME: util.URLJoin may not be necessary here:
// - setting.AppURL is defined to have a terminal '/' so unless mention[1:]
// is an AppSubURL link we can probably fallback to concatenation.
// team mention should follow @orgName/teamName style
if ok && strings . Contains ( mention , "/" ) {
mentionOrgAndTeam := strings . Split ( mention , "/" )
if mentionOrgAndTeam [ 0 ] [ 1 : ] == ctx . Metas [ "org" ] && strings . Contains ( teams , "," + strings . ToLower ( mentionOrgAndTeam [ 1 ] ) + "," ) {
replaceContent ( node , loc . Start , loc . End , createLink ( util . URLJoin ( setting . AppURL , "org" , ctx . Metas [ "org" ] , "teams" , mentionOrgAndTeam [ 1 ] ) , mention , "mention" ) )
node = node . NextSibling . NextSibling
start = 0
continue
}
start = loc . End
continue
}
replaceContent ( node , loc . Start , loc . End , createLink ( util . URLJoin ( setting . AppURL , mention [ 1 : ] ) , mention , "mention" ) )
node = node . NextSibling . NextSibling
start = 0
2019-11-24 19:34:44 +03:00
}
2018-02-27 10:09:18 +03:00
}
2021-04-20 01:25:08 +03:00
func shortLinkProcessor ( ctx * RenderContext , node * html . Node ) {
2018-02-27 10:09:18 +03:00
shortLinkProcessorFull ( ctx , node , false )
}
2021-04-20 01:25:08 +03:00
func shortLinkProcessorFull ( ctx * RenderContext , node * html . Node , noLink bool ) {
2021-06-17 13:35:05 +03:00
next := node . NextSibling
for node != nil && node != next {
m := shortLinkPattern . FindStringSubmatchIndex ( node . Data )
if m == nil {
return
}
2017-09-16 20:17:57 +03:00
2021-06-17 13:35:05 +03:00
content := node . Data [ m [ 2 ] : m [ 3 ] ]
tail := node . Data [ m [ 4 ] : m [ 5 ] ]
props := make ( map [ string ] string )
// MediaWiki uses [[link|text]], while GitHub uses [[text|link]]
// It makes page handling terrible, but we prefer GitHub syntax
// And fall back to MediaWiki only when it is obvious from the look
// Of text and link contents
sl := strings . Split ( content , "|" )
for _ , v := range sl {
if equalPos := strings . IndexByte ( v , '=' ) ; equalPos == - 1 {
// There is no equal in this argument; this is a mandatory arg
if props [ "name" ] == "" {
if isLinkStr ( v ) {
// If we clearly see it is a link, we save it so
// But first we need to ensure, that if both mandatory args provided
// look like links, we stick to GitHub syntax
if props [ "link" ] != "" {
props [ "name" ] = props [ "link" ]
}
2018-02-27 10:09:18 +03:00
2021-06-17 13:35:05 +03:00
props [ "link" ] = strings . TrimSpace ( v )
} else {
props [ "name" ] = v
}
2018-02-27 10:09:18 +03:00
} else {
2021-06-17 13:35:05 +03:00
props [ "link" ] = strings . TrimSpace ( v )
2017-09-16 20:17:57 +03:00
}
2018-02-27 10:09:18 +03:00
} else {
2021-06-17 13:35:05 +03:00
// There is an equal; optional argument.
sep := strings . IndexByte ( v , '=' )
key , val := v [ : sep ] , html . UnescapeString ( v [ sep + 1 : ] )
// When parsing HTML, x/net/html will change all quotes which are
// not used for syntax into UTF-8 quotes. So checking val[0] won't
// be enough, since that only checks a single byte.
if len ( val ) > 1 {
if ( strings . HasPrefix ( val , "“" ) && strings . HasSuffix ( val , "”" ) ) ||
( strings . HasPrefix ( val , "‘ " ) && strings . HasSuffix ( val , "’ " ) ) {
const lenQuote = len ( "‘ " )
val = val [ lenQuote : len ( val ) - lenQuote ]
} else if ( strings . HasPrefix ( val , "\"" ) && strings . HasSuffix ( val , "\"" ) ) ||
( strings . HasPrefix ( val , "'" ) && strings . HasSuffix ( val , "'" ) ) {
val = val [ 1 : len ( val ) - 1 ]
} else if strings . HasPrefix ( val , "'" ) && strings . HasSuffix ( val , "’ " ) {
const lenQuote = len ( "‘ " )
val = val [ 1 : len ( val ) - lenQuote ]
}
2020-12-04 05:01:42 +03:00
}
2021-06-17 13:35:05 +03:00
props [ key ] = val
2017-09-16 20:17:57 +03:00
}
}
2018-02-27 10:09:18 +03:00
2021-06-17 13:35:05 +03:00
var name , link string
if props [ "link" ] != "" {
link = props [ "link" ]
} else if props [ "name" ] != "" {
link = props [ "name" ]
}
if props [ "title" ] != "" {
name = props [ "title" ]
} else if props [ "name" ] != "" {
name = props [ "name" ]
2018-03-05 21:39:12 +03:00
} else {
2021-06-17 13:35:05 +03:00
name = link
2018-03-05 21:39:12 +03:00
}
2021-06-17 13:35:05 +03:00
name += tail
image := false
switch ext := filepath . Ext ( link ) ; ext {
// fast path: empty string, ignore
case "" :
// leave image as false
case ".jpg" , ".jpeg" , ".png" , ".tif" , ".tiff" , ".webp" , ".gif" , ".bmp" , ".ico" , ".svg" :
image = true
2018-06-15 15:42:49 +03:00
}
2021-06-17 13:35:05 +03:00
childNode := & html . Node { }
linkNode := & html . Node {
FirstChild : childNode ,
LastChild : childNode ,
Type : html . ElementNode ,
Data : "a" ,
DataAtom : atom . A ,
}
childNode . Parent = linkNode
absoluteLink := isLinkStr ( link )
2018-02-27 10:09:18 +03:00
if ! absoluteLink {
2021-06-17 13:35:05 +03:00
if image {
link = strings . ReplaceAll ( link , " " , "+" )
} else {
link = strings . ReplaceAll ( link , " " , "-" )
2018-02-27 10:09:18 +03:00
}
2021-06-17 13:35:05 +03:00
if ! strings . Contains ( link , "/" ) {
link = url . PathEscape ( link )
2018-02-27 10:09:18 +03:00
}
2017-09-16 20:17:57 +03:00
}
2021-06-17 13:35:05 +03:00
urlPrefix := ctx . URLPrefix
if image {
if ! absoluteLink {
if IsSameDomain ( urlPrefix ) {
urlPrefix = strings . Replace ( urlPrefix , "/src/" , "/raw/" , 1 )
}
if ctx . IsWiki {
link = util . URLJoin ( "wiki" , "raw" , link )
}
link = util . URLJoin ( urlPrefix , link )
}
title := props [ "title" ]
if title == "" {
title = props [ "alt" ]
}
if title == "" {
title = path . Base ( name )
}
alt := props [ "alt" ]
if alt == "" {
alt = name
}
2017-09-16 20:17:57 +03:00
2021-06-17 13:35:05 +03:00
// make the childNode an image - if we can, we also place the alt
childNode . Type = html . ElementNode
childNode . Data = "img"
childNode . DataAtom = atom . Img
childNode . Attr = [ ] html . Attribute {
{ Key : "src" , Val : link } ,
{ Key : "title" , Val : title } ,
{ Key : "alt" , Val : alt } ,
}
if alt == "" {
childNode . Attr = childNode . Attr [ : 2 ]
2017-09-16 20:17:57 +03:00
}
2021-06-17 13:35:05 +03:00
} else {
if ! absoluteLink {
if ctx . IsWiki {
link = util . URLJoin ( "wiki" , link )
}
link = util . URLJoin ( urlPrefix , link )
}
childNode . Type = html . TextNode
childNode . Data = name
2017-09-16 20:17:57 +03:00
}
2021-06-17 13:35:05 +03:00
if noLink {
linkNode = childNode
} else {
linkNode . Attr = [ ] html . Attribute { { Key : "href" , Val : link } }
}
replaceContent ( node , m [ 0 ] , m [ 1 ] , linkNode )
node = node . NextSibling . NextSibling
2018-02-27 10:09:18 +03:00
}
2017-09-16 20:17:57 +03:00
}
2021-04-20 01:25:08 +03:00
func fullIssuePatternProcessor ( ctx * RenderContext , node * html . Node ) {
if ctx . Metas == nil {
2019-04-12 08:53:34 +03:00
return
}
2021-06-17 13:35:05 +03:00
next := node . NextSibling
for node != nil && node != next {
m := getIssueFullPattern ( ) . FindStringSubmatchIndex ( node . Data )
if m == nil {
return
}
link := node . Data [ m [ 0 ] : m [ 1 ] ]
id := "#" + node . Data [ m [ 2 ] : m [ 3 ] ]
// extract repo and org name from matched link like
// http://localhost:3000/gituser/myrepo/issues/1
2021-08-13 01:22:05 +03:00
linkParts := strings . Split ( link , "/" )
2021-06-17 13:35:05 +03:00
matchOrg := linkParts [ len ( linkParts ) - 4 ]
matchRepo := linkParts [ len ( linkParts ) - 3 ]
if matchOrg == ctx . Metas [ "user" ] && matchRepo == ctx . Metas [ "repo" ] {
// TODO if m[4]:m[5] is not nil, then link is to a comment,
// and we should indicate that in the text somehow
replaceContent ( node , m [ 0 ] , m [ 1 ] , createLink ( link , id , "ref-issue" ) )
} else {
orgRepoID := matchOrg + "/" + matchRepo + id
replaceContent ( node , m [ 0 ] , m [ 1 ] , createLink ( link , orgRepoID , "ref-issue" ) )
}
node = node . NextSibling . NextSibling
2019-04-12 08:53:34 +03:00
}
2018-02-27 10:09:18 +03:00
}
2017-09-16 20:17:57 +03:00
2021-04-20 01:25:08 +03:00
func issueIndexPatternProcessor ( ctx * RenderContext , node * html . Node ) {
if ctx . Metas == nil {
2019-04-12 08:53:34 +03:00
return
}
2019-10-14 01:29:10 +03:00
var (
found bool
ref * references . RenderizableReference
)
2021-06-17 13:35:05 +03:00
next := node . NextSibling
2022-06-10 08:39:53 +03:00
2021-06-17 13:35:05 +03:00
for node != nil && node != next {
2022-06-10 08:39:53 +03:00
_ , hasExtTrackFormat := ctx . Metas [ "format" ]
2021-06-17 13:35:05 +03:00
// Repos with external issue trackers might still need to reference local PRs
// We need to concern with the first one that shows up in the text, whichever it is
2022-06-10 08:39:53 +03:00
isNumericStyle := ctx . Metas [ "style" ] == "" || ctx . Metas [ "style" ] == IssueNameStyleNumeric
foundNumeric , refNumeric := references . FindRenderizableReferenceNumeric ( node . Data , hasExtTrackFormat && ! isNumericStyle )
switch ctx . Metas [ "style" ] {
case "" , IssueNameStyleNumeric :
found , ref = foundNumeric , refNumeric
case IssueNameStyleAlphanumeric :
found , ref = references . FindRenderizableReferenceAlphanumeric ( node . Data )
case IssueNameStyleRegexp :
pattern , err := regexplru . GetCompiled ( ctx . Metas [ "regexp" ] )
if err != nil {
return
}
found , ref = references . FindRenderizableReferenceRegexp ( node . Data , pattern )
}
// Repos with external issue trackers might still need to reference local PRs
// We need to concern with the first one that shows up in the text, whichever it is
2022-07-07 18:46:49 +03:00
if hasExtTrackFormat && ! isNumericStyle && refNumeric != nil {
2022-06-10 08:39:53 +03:00
// If numeric (PR) was found, and it was BEFORE the non-numeric pattern, use that
2022-07-07 18:46:49 +03:00
// Allow a free-pass when non-numeric pattern wasn't found.
if found && ( ref == nil || refNumeric . RefLocation . Start < ref . RefLocation . Start ) {
2022-06-10 08:39:53 +03:00
found = foundNumeric
ref = refNumeric
2019-12-01 16:57:05 +03:00
}
}
2021-06-17 13:35:05 +03:00
if ! found {
return
2019-12-01 16:57:05 +03:00
}
2021-06-17 13:35:05 +03:00
var link * html . Node
reftext := node . Data [ ref . RefLocation . Start : ref . RefLocation . End ]
2022-06-10 08:39:53 +03:00
if hasExtTrackFormat && ! ref . IsPull {
2021-06-17 13:35:05 +03:00
ctx . Metas [ "index" ] = ref . Issue
2022-04-01 11:47:50 +03:00
res , err := vars . Expand ( ctx . Metas [ "format" ] , ctx . Metas )
if err != nil {
// here we could just log the error and continue the rendering
log . Error ( "unable to expand template vars for ref %s, err: %v" , ref . Issue , err )
}
link = createLink ( res , reftext , "ref-issue ref-external-issue" )
2019-12-01 16:57:05 +03:00
} else {
2021-06-17 13:35:05 +03:00
// Path determines the type of link that will be rendered. It's unknown at this point whether
// the linked item is actually a PR or an issue. Luckily it's of no real consequence because
// Gitea will redirect on click as appropriate.
path := "issues"
if ref . IsPull {
path = "pulls"
}
if ref . Owner == "" {
link = createLink ( util . URLJoin ( setting . AppURL , ctx . Metas [ "user" ] , ctx . Metas [ "repo" ] , path , ref . Issue ) , reftext , "ref-issue" )
} else {
link = createLink ( util . URLJoin ( setting . AppURL , ref . Owner , ref . Name , path , ref . Issue ) , reftext , "ref-issue" )
}
2019-12-01 16:57:05 +03:00
}
2017-09-16 20:17:57 +03:00
2021-06-17 13:35:05 +03:00
if ref . Action == references . XRefActionNone {
replaceContent ( node , ref . RefLocation . Start , ref . RefLocation . End , link )
node = node . NextSibling . NextSibling
continue
}
2018-02-27 10:09:18 +03:00
2021-06-17 13:35:05 +03:00
// Decorate action keywords if actionable
var keyword * html . Node
2022-06-10 08:39:53 +03:00
if references . IsXrefActionable ( ref , hasExtTrackFormat ) {
2021-06-17 13:35:05 +03:00
keyword = createKeyword ( node . Data [ ref . ActionLocation . Start : ref . ActionLocation . End ] )
} else {
keyword = & html . Node {
Type : html . TextNode ,
Data : node . Data [ ref . ActionLocation . Start : ref . ActionLocation . End ] ,
}
}
spaces := & html . Node {
2019-11-18 16:13:07 +03:00
Type : html . TextNode ,
2021-06-17 13:35:05 +03:00
Data : node . Data [ ref . ActionLocation . End : ref . RefLocation . Start ] ,
2019-11-18 16:13:07 +03:00
}
2021-06-17 13:35:05 +03:00
replaceContentList ( node , ref . ActionLocation . Start , ref . RefLocation . End , [ ] * html . Node { keyword , spaces , link } )
node = node . NextSibling . NextSibling . NextSibling . NextSibling
2019-11-18 16:13:07 +03:00
}
2017-09-16 20:17:57 +03:00
}
2018-02-27 10:09:18 +03:00
// fullSha1PatternProcessor renders SHA containing URLs
2021-04-20 01:25:08 +03:00
func fullSha1PatternProcessor ( ctx * RenderContext , node * html . Node ) {
if ctx . Metas == nil {
2019-04-16 10:53:57 +03:00
return
}
2019-04-06 21:28:45 +03:00
2021-06-17 13:35:05 +03:00
next := node . NextSibling
for node != nil && node != next {
m := anySHA1Pattern . FindStringSubmatchIndex ( node . Data )
if m == nil {
return
}
2017-09-16 20:17:57 +03:00
2021-06-17 13:35:05 +03:00
urlFull := node . Data [ m [ 0 ] : m [ 1 ] ]
text := base . ShortSha ( node . Data [ m [ 2 ] : m [ 3 ] ] )
2017-09-16 20:17:57 +03:00
2021-06-17 13:35:05 +03:00
// 3rd capture group matches a optional path
subpath := ""
if m [ 5 ] > 0 {
subpath = node . Data [ m [ 4 ] : m [ 5 ] ]
}
2019-04-06 21:28:45 +03:00
2021-06-17 13:35:05 +03:00
// 4th capture group matches a optional url hash
hash := ""
if m [ 7 ] > 0 {
hash = node . Data [ m [ 6 ] : m [ 7 ] ] [ 1 : ]
}
2019-04-06 21:28:45 +03:00
2021-06-17 13:35:05 +03:00
start := m [ 0 ]
end := m [ 1 ]
// If url ends in '.', it's very likely that it is not part of the
// actual url but used to finish a sentence.
if strings . HasSuffix ( urlFull , "." ) {
end --
urlFull = urlFull [ : len ( urlFull ) - 1 ]
if hash != "" {
hash = hash [ : len ( hash ) - 1 ]
} else if subpath != "" {
subpath = subpath [ : len ( subpath ) - 1 ]
}
2019-04-06 21:28:45 +03:00
}
2017-09-16 20:17:57 +03:00
2021-06-17 13:35:05 +03:00
if subpath != "" {
text += subpath
}
2019-04-06 21:28:45 +03:00
2021-06-17 13:35:05 +03:00
if hash != "" {
text += " (" + hash + ")"
}
replaceContent ( node , start , end , createCodeLink ( urlFull , text , "commit" ) )
node = node . NextSibling . NextSibling
}
2018-02-27 10:09:18 +03:00
}
2017-09-16 20:17:57 +03:00
2021-12-11 20:21:36 +03:00
func comparePatternProcessor ( ctx * RenderContext , node * html . Node ) {
if ctx . Metas == nil {
return
}
next := node . NextSibling
for node != nil && node != next {
m := comparePattern . FindStringSubmatchIndex ( node . Data )
if m == nil {
return
}
2022-01-31 02:48:47 +03:00
// Ensure that every group (m[0]...m[7]) has a match
for i := 0 ; i < 8 ; i ++ {
if m [ i ] == - 1 {
return
}
}
2021-12-11 20:21:36 +03:00
urlFull := node . Data [ m [ 0 ] : m [ 1 ] ]
text1 := base . ShortSha ( node . Data [ m [ 2 ] : m [ 3 ] ] )
textDots := base . ShortSha ( node . Data [ m [ 4 ] : m [ 5 ] ] )
text2 := base . ShortSha ( node . Data [ m [ 6 ] : m [ 7 ] ] )
hash := ""
if m [ 9 ] > 0 {
hash = node . Data [ m [ 8 ] : m [ 9 ] ] [ 1 : ]
}
start := m [ 0 ]
end := m [ 1 ]
// If url ends in '.', it's very likely that it is not part of the
// actual url but used to finish a sentence.
if strings . HasSuffix ( urlFull , "." ) {
end --
urlFull = urlFull [ : len ( urlFull ) - 1 ]
if hash != "" {
hash = hash [ : len ( hash ) - 1 ]
} else if text2 != "" {
text2 = text2 [ : len ( text2 ) - 1 ]
}
}
text := text1 + textDots + text2
if hash != "" {
text += " (" + hash + ")"
}
replaceContent ( node , start , end , createCodeLink ( urlFull , text , "compare" ) )
node = node . NextSibling . NextSibling
}
}
2020-04-28 21:05:39 +03:00
// emojiShortCodeProcessor for rendering text like :smile: into emoji
2021-04-20 01:25:08 +03:00
func emojiShortCodeProcessor ( ctx * RenderContext , node * html . Node ) {
2021-06-17 13:35:05 +03:00
start := 0
next := node . NextSibling
for node != nil && node != next && start < len ( node . Data ) {
m := EmojiShortCodeRegex . FindStringSubmatchIndex ( node . Data [ start : ] )
if m == nil {
2020-04-28 21:05:39 +03:00
return
}
2021-06-17 13:35:05 +03:00
m [ 0 ] += start
m [ 1 ] += start
start = m [ 1 ]
alias := node . Data [ m [ 0 ] : m [ 1 ] ]
alias = strings . ReplaceAll ( alias , ":" , "" )
converted := emoji . FromAlias ( alias )
if converted == nil {
// check if this is a custom reaction
2021-06-29 17:28:38 +03:00
if _ , exist := setting . UI . CustomEmojisMap [ alias ] ; exist {
replaceContent ( node , m [ 0 ] , m [ 1 ] , createCustomEmoji ( alias ) )
2021-06-17 13:35:05 +03:00
node = node . NextSibling . NextSibling
start = 0
continue
}
continue
}
2020-04-28 21:05:39 +03:00
2021-06-17 13:35:05 +03:00
replaceContent ( node , m [ 0 ] , m [ 1 ] , createEmoji ( converted . Emoji , "emoji" , converted . Description ) )
node = node . NextSibling . NextSibling
start = 0
}
2020-04-28 21:05:39 +03:00
}
// emoji processor to match emoji and add emoji class
2021-04-20 01:25:08 +03:00
func emojiProcessor ( ctx * RenderContext , node * html . Node ) {
2021-06-17 13:35:05 +03:00
start := 0
next := node . NextSibling
for node != nil && node != next && start < len ( node . Data ) {
m := emoji . FindEmojiSubmatchIndex ( node . Data [ start : ] )
if m == nil {
return
}
m [ 0 ] += start
m [ 1 ] += start
codepoint := node . Data [ m [ 0 ] : m [ 1 ] ]
start = m [ 1 ]
val := emoji . FromCode ( codepoint )
if val != nil {
replaceContent ( node , m [ 0 ] , m [ 1 ] , createEmoji ( codepoint , "emoji" , val . Description ) )
node = node . NextSibling . NextSibling
start = 0
}
2020-04-28 21:05:39 +03:00
}
}
2018-02-27 10:09:18 +03:00
// sha1CurrentPatternProcessor renders SHA1 strings to corresponding links that
// are assumed to be in the same repository.
2021-04-20 01:25:08 +03:00
func sha1CurrentPatternProcessor ( ctx * RenderContext , node * html . Node ) {
if ctx . Metas == nil || ctx . Metas [ "user" ] == "" || ctx . Metas [ "repo" ] == "" || ctx . Metas [ "repoPath" ] == "" {
2019-08-14 11:04:55 +03:00
return
}
2021-06-17 13:35:05 +03:00
start := 0
next := node . NextSibling
2021-06-21 01:39:12 +03:00
if ctx . ShaExistCache == nil {
ctx . ShaExistCache = make ( map [ string ] bool )
}
2021-06-17 13:35:05 +03:00
for node != nil && node != next && start < len ( node . Data ) {
m := sha1CurrentPattern . FindStringSubmatchIndex ( node . Data [ start : ] )
if m == nil {
return
}
m [ 2 ] += start
m [ 3 ] += start
hash := node . Data [ m [ 2 ] : m [ 3 ] ]
// The regex does not lie, it matches the hash pattern.
// However, a regex cannot know if a hash actually exists or not.
// We could assume that a SHA1 hash should probably contain alphas AND numerics
// but that is not always the case.
// Although unlikely, deadbeef and 1234567 are valid short forms of SHA1 hash
// as used by git and github for linking and thus we have to do similar.
// Because of this, we check to make sure that a matched hash is actually
// a commit in the repository before making it a link.
2021-06-21 01:39:12 +03:00
// check cache first
exist , inCache := ctx . ShaExistCache [ hash ]
if ! inCache {
if ctx . GitRepo == nil {
var err error
2022-03-29 22:13:41 +03:00
ctx . GitRepo , err = git . OpenRepository ( ctx . Ctx , ctx . Metas [ "repoPath" ] )
2021-06-21 01:39:12 +03:00
if err != nil {
log . Error ( "unable to open repository: %s Error: %v" , ctx . Metas [ "repoPath" ] , err )
return
}
ctx . AddCancel ( func ( ) {
ctx . GitRepo . Close ( )
ctx . GitRepo = nil
} )
2021-06-17 13:35:05 +03:00
}
2021-06-21 01:39:12 +03:00
exist = ctx . GitRepo . IsObjectExist ( hash )
ctx . ShaExistCache [ hash ] = exist
}
if ! exist {
2021-06-17 13:35:05 +03:00
start = m [ 3 ]
continue
2019-08-14 11:04:55 +03:00
}
2021-12-11 20:21:36 +03:00
link := util . URLJoin ( setting . AppURL , ctx . Metas [ "user" ] , ctx . Metas [ "repo" ] , "commit" , hash )
replaceContent ( node , m [ 2 ] , m [ 3 ] , createCodeLink ( link , base . ShortSha ( hash ) , "commit" ) )
2021-06-17 13:35:05 +03:00
start = 0
node = node . NextSibling . NextSibling
}
2018-02-27 10:09:18 +03:00
}
2017-09-16 20:17:57 +03:00
2018-02-27 10:09:18 +03:00
// emailAddressProcessor replaces raw email addresses with a mailto: link.
2021-04-20 01:25:08 +03:00
func emailAddressProcessor ( ctx * RenderContext , node * html . Node ) {
2021-06-17 13:35:05 +03:00
next := node . NextSibling
for node != nil && node != next {
m := emailRegex . FindStringSubmatchIndex ( node . Data )
if m == nil {
return
}
mail := node . Data [ m [ 2 ] : m [ 3 ] ]
replaceContent ( node , m [ 2 ] , m [ 3 ] , createLink ( "mailto:" + mail , mail , "mailto" ) )
node = node . NextSibling . NextSibling
2017-09-16 20:17:57 +03:00
}
2018-02-27 10:09:18 +03:00
}
2017-09-16 20:17:57 +03:00
2018-02-27 10:09:18 +03:00
// linkProcessor creates links for any HTTP or HTTPS URL not captured by
// markdown.
2021-04-20 01:25:08 +03:00
func linkProcessor ( ctx * RenderContext , node * html . Node ) {
2021-06-17 13:35:05 +03:00
next := node . NextSibling
for node != nil && node != next {
m := common . LinkRegex . FindStringIndex ( node . Data )
if m == nil {
return
}
uri := node . Data [ m [ 0 ] : m [ 1 ] ]
replaceContent ( node , m [ 0 ] , m [ 1 ] , createLink ( uri , uri , "link" ) )
node = node . NextSibling . NextSibling
2017-09-16 20:17:57 +03:00
}
2018-02-27 10:09:18 +03:00
}
func genDefaultLinkProcessor ( defaultLink string ) processor {
2021-04-20 01:25:08 +03:00
return func ( ctx * RenderContext , node * html . Node ) {
2018-02-27 10:09:18 +03:00
ch := & html . Node {
Parent : node ,
Type : html . TextNode ,
Data : node . Data ,
}
2017-09-16 20:17:57 +03:00
2018-02-27 10:09:18 +03:00
node . Type = html . ElementNode
node . Data = "a"
node . DataAtom = atom . A
2019-09-10 12:03:30 +03:00
node . Attr = [ ] html . Attribute {
{ Key : "href" , Val : defaultLink } ,
{ Key : "class" , Val : "default-link" } ,
}
2018-02-27 10:09:18 +03:00
node . FirstChild , node . LastChild = ch , ch
}
2017-09-16 20:17:57 +03:00
}
2019-03-12 05:23:34 +03:00
// descriptionLinkProcessor creates links for DescriptionHTML
2021-04-20 01:25:08 +03:00
func descriptionLinkProcessor ( ctx * RenderContext , node * html . Node ) {
2021-06-17 13:35:05 +03:00
next := node . NextSibling
for node != nil && node != next {
m := common . LinkRegex . FindStringIndex ( node . Data )
if m == nil {
return
}
uri := node . Data [ m [ 0 ] : m [ 1 ] ]
replaceContent ( node , m [ 0 ] , m [ 1 ] , createDescriptionLink ( uri , uri ) )
node = node . NextSibling . NextSibling
2019-03-12 05:23:34 +03:00
}
}
// createDescriptionLink builds an <a> element with the given href and
// target="_blank" rel="noopener noreferrer", containing a single text node
// with the given content.
func createDescriptionLink(href, content string) *html.Node {
	anchor := &html.Node{
		Type:     html.ElementNode,
		Data:     "a",
		DataAtom: atom.A,
		Attr: []html.Attribute{
			{Key: "href", Val: href},
			{Key: "target", Val: "_blank"},
			{Key: "rel", Val: "noopener noreferrer"},
		},
	}

	// The text node is the anchor's only child.
	label := &html.Node{
		Parent: anchor,
		Type:   html.TextNode,
		Data:   content,
	}
	anchor.FirstChild = label
	anchor.LastChild = label

	return anchor
}