2019-12-31 01:53:28 +00:00
// Copyright 2019 The Gitea Authors. All rights reserved.
2022-11-27 13:20:29 -05:00
// SPDX-License-Identifier: MIT
2019-12-31 01:53:28 +00:00
package markdown
import (
"bytes"
"fmt"
2020-04-24 14:22:36 +01:00
"regexp"
2019-12-31 01:53:28 +00:00
"strings"
2022-10-12 07:18:26 +02:00
"code.gitea.io/gitea/modules/container"
2019-12-31 01:53:28 +00:00
"code.gitea.io/gitea/modules/markup"
"code.gitea.io/gitea/modules/markup/common"
2020-04-24 14:22:36 +01:00
"code.gitea.io/gitea/modules/setting"
2022-11-09 02:11:26 +02:00
"code.gitea.io/gitea/modules/svg"
2019-12-31 01:53:28 +00:00
giteautil "code.gitea.io/gitea/modules/util"
2022-10-21 15:00:53 +03:00
"github.com/microcosm-cc/bluemonday/css"
2019-12-31 01:53:28 +00:00
"github.com/yuin/goldmark/ast"
east "github.com/yuin/goldmark/extension/ast"
"github.com/yuin/goldmark/parser"
"github.com/yuin/goldmark/renderer"
"github.com/yuin/goldmark/renderer/html"
"github.com/yuin/goldmark/text"
"github.com/yuin/goldmark/util"
)
var byteMailto = [ ] byte ( "mailto:" )
2020-04-24 14:22:36 +01:00
// ASTTransformer is a default transformer of the goldmark tree.
type ASTTransformer struct { }
2019-12-31 01:53:28 +00:00
// Transform transforms the given AST tree.
2020-04-24 14:22:36 +01:00
func ( g * ASTTransformer ) Transform ( node * ast . Document , reader text . Reader , pc parser . Context ) {
firstChild := node . FirstChild ( )
2023-04-18 03:05:19 +08:00
tocMode := ""
2022-06-08 09:59:16 +01:00
ctx := pc . Get ( renderContextKey ) . ( * markup . RenderContext )
2022-09-13 17:33:37 +01:00
rc := pc . Get ( renderConfigKey ) . ( * RenderConfig )
2023-04-18 03:05:19 +08:00
tocList := make ( [ ] markup . Header , 0 , 20 )
2022-09-13 17:33:37 +01:00
if rc . yamlNode != nil {
metaNode := rc . toMetaNode ( )
2020-04-24 14:22:36 +01:00
if metaNode != nil {
node . InsertBefore ( node , firstChild , metaNode )
}
2023-04-18 03:05:19 +08:00
tocMode = rc . TOC
2020-04-24 14:22:36 +01:00
}
2023-05-20 23:02:52 +02:00
applyElementDir := func ( n ast . Node ) {
if markup . DefaultProcessorHelper . ElementDir != "" {
n . SetAttributeString ( "dir" , [ ] byte ( markup . DefaultProcessorHelper . ElementDir ) )
}
}
2022-11-09 02:11:26 +02:00
attentionMarkedBlockquotes := make ( container . Set [ * ast . Blockquote ] )
2019-12-31 01:53:28 +00:00
_ = ast . Walk ( node , func ( n ast . Node , entering bool ) ( ast . WalkStatus , error ) {
if ! entering {
return ast . WalkContinue , nil
}
switch v := n . ( type ) {
2020-04-24 14:22:36 +01:00
case * ast . Heading :
2022-06-08 09:59:16 +01:00
for _ , attr := range v . Attributes ( ) {
if _ , ok := attr . Value . ( [ ] byte ) ; ! ok {
v . SetAttribute ( attr . Name , [ ] byte ( fmt . Sprintf ( "%v" , attr . Value ) ) )
2021-03-15 23:20:05 +00:00
}
2020-04-24 14:22:36 +01:00
}
2023-04-18 03:05:19 +08:00
txt := n . Text ( reader . Source ( ) )
2022-06-08 09:59:16 +01:00
header := markup . Header {
2023-04-18 03:05:19 +08:00
Text : util . BytesToReadOnlyString ( txt ) ,
2022-06-08 09:59:16 +01:00
Level : v . Level ,
}
if id , found := v . AttributeString ( "id" ) ; found {
header . ID = util . BytesToReadOnlyString ( id . ( [ ] byte ) )
}
2023-04-18 03:05:19 +08:00
tocList = append ( tocList , header )
2023-05-20 23:02:52 +02:00
applyElementDir ( v )
case * ast . Paragraph :
applyElementDir ( v )
2019-12-31 01:53:28 +00:00
case * ast . Image :
// Images need two things:
//
// 1. Their src needs to munged to be a real value
// 2. If they're not wrapped with a link they need a link wrapper
// Check if the destination is a real link
link := v . Destination
if len ( link ) > 0 && ! markup . IsLink ( link ) {
prefix := pc . Get ( urlPrefixKey ) . ( string )
if pc . Get ( isWikiKey ) . ( bool ) {
prefix = giteautil . URLJoin ( prefix , "wiki" , "raw" )
}
prefix = strings . Replace ( prefix , "/src/" , "/media/" , 1 )
2021-04-10 17:26:28 +01:00
lnk := strings . TrimLeft ( string ( link ) , "/" )
2019-12-31 01:53:28 +00:00
lnk = giteautil . URLJoin ( prefix , lnk )
link = [ ] byte ( lnk )
}
v . Destination = link
parent := n . Parent ( )
// Create a link around image only if parent is not already a link
if _ , ok := parent . ( * ast . Link ) ; ! ok && parent != nil {
2021-03-14 16:36:51 +00:00
next := n . NextSibling ( )
// Create a link wrapper
2019-12-31 01:53:28 +00:00
wrap := ast . NewLink ( )
wrap . Destination = link
wrap . Title = v . Title
2021-10-11 20:12:06 +08:00
wrap . SetAttributeString ( "target" , [ ] byte ( "_blank" ) )
2021-03-14 16:36:51 +00:00
// Duplicate the current image node
image := ast . NewImage ( ast . NewLink ( ) )
image . Destination = link
image . Title = v . Title
for _ , attr := range v . Attributes ( ) {
image . SetAttribute ( attr . Name , attr . Value )
}
for child := v . FirstChild ( ) ; child != nil ; {
next := child . NextSibling ( )
image . AppendChild ( image , child )
child = next
}
// Append our duplicate image to the wrapper link
wrap . AppendChild ( wrap , image )
// Wire in the next sibling
wrap . SetNextSibling ( next )
// Replace the current node with the wrapper link
2019-12-31 01:53:28 +00:00
parent . ReplaceChild ( parent , n , wrap )
2021-03-14 16:36:51 +00:00
// But most importantly ensure the next sibling is still on the old image too
v . SetNextSibling ( next )
2019-12-31 01:53:28 +00:00
}
case * ast . Link :
// Links need their href to munged to be a real value
link := v . Destination
if len ( link ) > 0 && ! markup . IsLink ( link ) &&
link [ 0 ] != '#' && ! bytes . HasPrefix ( link , byteMailto ) {
// special case: this is not a link, a hash link or a mailto:, so it's a
// relative URL
lnk := string ( link )
if pc . Get ( isWikiKey ) . ( bool ) {
lnk = giteautil . URLJoin ( "wiki" , lnk )
}
link = [ ] byte ( giteautil . URLJoin ( pc . Get ( urlPrefixKey ) . ( string ) , lnk ) )
}
2020-01-16 12:23:48 +01:00
if len ( link ) > 0 && link [ 0 ] == '#' {
link = [ ] byte ( "#user-content-" + string ( link ) [ 1 : ] )
}
2019-12-31 01:53:28 +00:00
v . Destination = link
2020-03-22 22:25:38 +00:00
case * ast . List :
2020-05-11 00:14:49 +01:00
if v . HasChildren ( ) {
children := make ( [ ] ast . Node , 0 , v . ChildCount ( ) )
child := v . FirstChild ( )
for child != nil {
children = append ( children , child )
child = child . NextSibling ( )
}
v . RemoveChildren ( v )
for _ , child := range children {
listItem := child . ( * ast . ListItem )
if ! child . HasChildren ( ) || ! child . FirstChild ( ) . HasChildren ( ) {
v . AppendChild ( v , child )
continue
2020-04-26 06:09:08 +01:00
}
2020-05-11 00:14:49 +01:00
taskCheckBox , ok := child . FirstChild ( ) . FirstChild ( ) . ( * east . TaskCheckBox )
if ! ok {
v . AppendChild ( v , child )
continue
2020-04-26 06:09:08 +01:00
}
2020-05-11 00:14:49 +01:00
newChild := NewTaskCheckBoxListItem ( listItem )
newChild . IsChecked = taskCheckBox . IsChecked
newChild . SetAttributeString ( "class" , [ ] byte ( "task-list-item" ) )
2023-06-13 02:44:47 -04:00
segments := newChild . FirstChild ( ) . Lines ( )
if segments . Len ( ) > 0 {
segment := segments . At ( 0 )
newChild . SourcePosition = rc . metaLength + segment . Start
}
2020-05-11 00:14:49 +01:00
v . AppendChild ( v , newChild )
2020-03-22 22:25:38 +00:00
}
}
2023-05-20 23:02:52 +02:00
applyElementDir ( v )
2020-05-24 09:14:26 +01:00
case * ast . Text :
if v . SoftLineBreak ( ) && ! v . HardLineBreak ( ) {
renderMetas := pc . Get ( renderMetasKey ) . ( map [ string ] string )
mode := renderMetas [ "mode" ]
if mode != "document" {
v . SetHardLineBreak ( setting . Markdown . EnableHardLineBreakInComments )
} else {
v . SetHardLineBreak ( setting . Markdown . EnableHardLineBreakInDocuments )
}
}
2022-10-21 15:00:53 +03:00
case * ast . CodeSpan :
colorContent := n . Text ( reader . Source ( ) )
if css . ColorHandler ( strings . ToLower ( string ( colorContent ) ) ) {
v . AppendChild ( v , NewColorPreview ( colorContent ) )
}
2022-11-09 02:11:26 +02:00
case * ast . Emphasis :
// check if inside blockquote for attention, expected hierarchy is
// Emphasis < Paragraph < Blockquote
blockquote , isInBlockquote := n . Parent ( ) . Parent ( ) . ( * ast . Blockquote )
if isInBlockquote && ! attentionMarkedBlockquotes . Contains ( blockquote ) {
fullText := string ( n . Text ( reader . Source ( ) ) )
if fullText == AttentionNote || fullText == AttentionWarning {
v . SetAttributeString ( "class" , [ ] byte ( "attention-" + strings . ToLower ( fullText ) ) )
v . Parent ( ) . InsertBefore ( v . Parent ( ) , v , NewAttention ( fullText ) )
attentionMarkedBlockquotes . Add ( blockquote )
}
}
2019-12-31 01:53:28 +00:00
}
return ast . WalkContinue , nil
} )
2020-04-24 14:22:36 +01:00
2023-04-18 03:05:19 +08:00
showTocInMain := tocMode == "true" /* old behavior, in main view */ || tocMode == "main"
showTocInSidebar := ! showTocInMain && tocMode != "false" // not hidden, not main, then show it in sidebar
if len ( tocList ) > 0 && ( showTocInMain || showTocInSidebar ) {
if showTocInMain {
tocNode := createTOCNode ( tocList , rc . Lang , nil )
2020-04-24 14:22:36 +01:00
node . InsertBefore ( node , firstChild , tocNode )
2023-04-18 03:05:19 +08:00
} else {
tocNode := createTOCNode ( tocList , rc . Lang , map [ string ] string { "open" : "open" } )
ctx . SidebarTocNode = tocNode
2020-04-24 14:22:36 +01:00
}
}
if len ( rc . Lang ) > 0 {
node . SetAttributeString ( "lang" , [ ] byte ( rc . Lang ) )
}
2019-12-31 01:53:28 +00:00
}
type prefixedIDs struct {
2022-10-12 07:18:26 +02:00
values container . Set [ string ]
2019-12-31 01:53:28 +00:00
}
// Generate generates a new element id.
func ( p * prefixedIDs ) Generate ( value [ ] byte , kind ast . NodeKind ) [ ] byte {
dft := [ ] byte ( "id" )
if kind == ast . KindHeading {
dft = [ ] byte ( "heading" )
}
return p . GenerateWithDefault ( value , dft )
}
// Generate generates a new element id.
2021-12-20 05:41:31 +01:00
func ( p * prefixedIDs ) GenerateWithDefault ( value , dft [ ] byte ) [ ] byte {
2019-12-31 01:53:28 +00:00
result := common . CleanValue ( value )
if len ( result ) == 0 {
result = dft
}
if ! bytes . HasPrefix ( result , [ ] byte ( "user-content-" ) ) {
result = append ( [ ] byte ( "user-content-" ) , result ... )
}
2022-10-12 07:18:26 +02:00
if p . values . Add ( util . BytesToReadOnlyString ( result ) ) {
2019-12-31 01:53:28 +00:00
return result
}
for i := 1 ; ; i ++ {
newResult := fmt . Sprintf ( "%s-%d" , result , i )
2022-10-12 07:18:26 +02:00
if p . values . Add ( newResult ) {
2019-12-31 01:53:28 +00:00
return [ ] byte ( newResult )
}
}
}
// Put puts a given element id to the used ids table.
func ( p * prefixedIDs ) Put ( value [ ] byte ) {
2022-10-12 07:18:26 +02:00
p . values . Add ( util . BytesToReadOnlyString ( value ) )
2019-12-31 01:53:28 +00:00
}
func newPrefixedIDs ( ) * prefixedIDs {
return & prefixedIDs {
2022-10-12 07:18:26 +02:00
values : make ( container . Set [ string ] ) ,
2019-12-31 01:53:28 +00:00
}
}
2020-04-24 14:22:36 +01:00
// NewHTMLRenderer creates a HTMLRenderer to render
2019-12-31 01:53:28 +00:00
// in the gitea form.
2020-04-24 14:22:36 +01:00
func NewHTMLRenderer ( opts ... html . Option ) renderer . NodeRenderer {
r := & HTMLRenderer {
2019-12-31 01:53:28 +00:00
Config : html . NewConfig ( ) ,
}
for _ , opt := range opts {
opt . SetHTMLOption ( & r . Config )
}
return r
}
2020-04-24 14:22:36 +01:00
// HTMLRenderer is a renderer.NodeRenderer implementation that
// renders gitea specific features.
type HTMLRenderer struct {
2019-12-31 01:53:28 +00:00
html . Config
}
// RegisterFuncs implements renderer.NodeRenderer.RegisterFuncs.
2020-04-24 14:22:36 +01:00
func ( r * HTMLRenderer ) RegisterFuncs ( reg renderer . NodeRendererFuncRegisterer ) {
reg . Register ( ast . KindDocument , r . renderDocument )
reg . Register ( KindDetails , r . renderDetails )
reg . Register ( KindSummary , r . renderSummary )
reg . Register ( KindIcon , r . renderIcon )
2022-10-21 15:00:53 +03:00
reg . Register ( ast . KindCodeSpan , r . renderCodeSpan )
2022-11-09 02:11:26 +02:00
reg . Register ( KindAttention , r . renderAttention )
2020-04-26 06:09:08 +01:00
reg . Register ( KindTaskCheckBoxListItem , r . renderTaskCheckBoxListItem )
2019-12-31 01:53:28 +00:00
reg . Register ( east . KindTaskCheckBox , r . renderTaskCheckBox )
}
2022-10-21 15:00:53 +03:00
// renderCodeSpan renders CodeSpan elements (like goldmark upstream does) but also renders ColorPreview elements.
// See #21474 for reference
func ( r * HTMLRenderer ) renderCodeSpan ( w util . BufWriter , source [ ] byte , n ast . Node , entering bool ) ( ast . WalkStatus , error ) {
if entering {
if n . Attributes ( ) != nil {
_ , _ = w . WriteString ( "<code" )
html . RenderAttributes ( w , n , html . CodeAttributeFilter )
_ = w . WriteByte ( '>' )
} else {
_ , _ = w . WriteString ( "<code>" )
}
for c := n . FirstChild ( ) ; c != nil ; c = c . NextSibling ( ) {
switch v := c . ( type ) {
case * ast . Text :
segment := v . Segment
value := segment . Value ( source )
if bytes . HasSuffix ( value , [ ] byte ( "\n" ) ) {
r . Writer . RawWrite ( w , value [ : len ( value ) - 1 ] )
r . Writer . RawWrite ( w , [ ] byte ( " " ) )
} else {
r . Writer . RawWrite ( w , value )
}
case * ColorPreview :
_ , _ = w . WriteString ( fmt . Sprintf ( ` <span class="color-preview" style="background-color: %v"></span> ` , string ( v . Color ) ) )
}
}
return ast . WalkSkipChildren , nil
}
_ , _ = w . WriteString ( "</code>" )
return ast . WalkContinue , nil
}
2022-11-09 02:11:26 +02:00
// renderAttention renders a quote marked with i.e. "> **Note**" or "> **Warning**" with a corresponding svg
func ( r * HTMLRenderer ) renderAttention ( w util . BufWriter , source [ ] byte , node ast . Node , entering bool ) ( ast . WalkStatus , error ) {
if entering {
_ , _ = w . WriteString ( ` <span class="attention-icon attention- ` )
n := node . ( * Attention )
_ , _ = w . WriteString ( strings . ToLower ( n . AttentionType ) )
_ , _ = w . WriteString ( ` "> ` )
var octiconType string
switch n . AttentionType {
case AttentionNote :
octiconType = "info"
case AttentionWarning :
octiconType = "alert"
}
_ , _ = w . WriteString ( string ( svg . RenderHTML ( "octicon-" + octiconType ) ) )
} else {
_ , _ = w . WriteString ( "</span>\n" )
}
return ast . WalkContinue , nil
}
2020-04-24 14:22:36 +01:00
func ( r * HTMLRenderer ) renderDocument ( w util . BufWriter , source [ ] byte , node ast . Node , entering bool ) ( ast . WalkStatus , error ) {
n := node . ( * ast . Document )
if val , has := n . AttributeString ( "lang" ) ; has {
var err error
if entering {
_ , err = w . WriteString ( "<div" )
if err == nil {
_ , err = w . WriteString ( fmt . Sprintf ( ` lang=%q ` , val ) )
}
if err == nil {
_ , err = w . WriteRune ( '>' )
}
} else {
_ , err = w . WriteString ( "</div>" )
}
if err != nil {
return ast . WalkStop , err
}
}
return ast . WalkContinue , nil
}
func ( r * HTMLRenderer ) renderDetails ( w util . BufWriter , source [ ] byte , node ast . Node , entering bool ) ( ast . WalkStatus , error ) {
var err error
if entering {
2023-04-18 03:05:19 +08:00
if _ , err = w . WriteString ( "<details" ) ; err != nil {
return ast . WalkStop , err
}
html . RenderAttributes ( w , node , nil )
_ , err = w . WriteString ( ">" )
2020-04-24 14:22:36 +01:00
} else {
_ , err = w . WriteString ( "</details>" )
}
if err != nil {
return ast . WalkStop , err
}
return ast . WalkContinue , nil
}
func ( r * HTMLRenderer ) renderSummary ( w util . BufWriter , source [ ] byte , node ast . Node , entering bool ) ( ast . WalkStatus , error ) {
var err error
if entering {
_ , err = w . WriteString ( "<summary>" )
} else {
_ , err = w . WriteString ( "</summary>" )
}
if err != nil {
return ast . WalkStop , err
}
return ast . WalkContinue , nil
}
var validNameRE = regexp . MustCompile ( "^[a-z ]+$" )
func ( r * HTMLRenderer ) renderIcon ( w util . BufWriter , source [ ] byte , node ast . Node , entering bool ) ( ast . WalkStatus , error ) {
if ! entering {
return ast . WalkContinue , nil
}
n := node . ( * Icon )
name := strings . TrimSpace ( strings . ToLower ( string ( n . Name ) ) )
if len ( name ) == 0 {
// skip this
return ast . WalkContinue , nil
}
if ! validNameRE . MatchString ( name ) {
// skip this
return ast . WalkContinue , nil
}
var err error
_ , err = w . WriteString ( fmt . Sprintf ( ` <i class="icon %s"></i> ` , name ) )
if err != nil {
return ast . WalkStop , err
}
return ast . WalkContinue , nil
}
2020-04-26 06:09:08 +01:00
func ( r * HTMLRenderer ) renderTaskCheckBoxListItem ( w util . BufWriter , source [ ] byte , node ast . Node , entering bool ) ( ast . WalkStatus , error ) {
n := node . ( * TaskCheckBoxListItem )
if entering {
if n . Attributes ( ) != nil {
_ , _ = w . WriteString ( "<li" )
html . RenderAttributes ( w , n , html . ListItemAttributeFilter )
_ = w . WriteByte ( '>' )
} else {
_ , _ = w . WriteString ( "<li>" )
}
2023-06-13 02:44:47 -04:00
fmt . Fprintf ( w , ` <input type="checkbox" disabled="" data-source-position="%d" ` , n . SourcePosition )
2020-04-26 06:09:08 +01:00
if n . IsChecked {
2021-05-23 16:14:03 +02:00
_ , _ = w . WriteString ( ` checked="" ` )
2020-04-26 06:09:08 +01:00
}
2021-05-23 16:14:03 +02:00
if r . XHTML {
_ , _ = w . WriteString ( ` /> ` )
} else {
_ = w . WriteByte ( '>' )
2020-04-26 06:09:08 +01:00
}
fc := n . FirstChild ( )
if fc != nil {
if _ , ok := fc . ( * ast . TextBlock ) ; ! ok {
_ = w . WriteByte ( '\n' )
}
}
2019-12-31 01:53:28 +00:00
} else {
2020-12-13 02:05:50 +01:00
_ , _ = w . WriteString ( "</li>\n" )
2019-12-31 01:53:28 +00:00
}
return ast . WalkContinue , nil
}
2020-04-26 06:09:08 +01:00
func ( r * HTMLRenderer ) renderTaskCheckBox ( w util . BufWriter , source [ ] byte , node ast . Node , entering bool ) ( ast . WalkStatus , error ) {
return ast . WalkContinue , nil
}