mirror of
https://github.com/yuin/goldmark
synced 2025-03-04 23:04:52 +00:00
Note that this is a breaking change and will require new goldmark major version. I have tried to fix problem with leading tabs in fenced code blocks (and probably normal code blocks too). Important note - tabs do not behave like "just 4 spaces". They "finish" 4 space columns. So tab can behave like anything between 1 space to 4 spaces, depending on position. If you have MD like this (. represents space, [tb] , [t] or [] tabs) ``` *.some.text ..``` ..foo ..[]foo ..``` ``` you expect the tab to be kept in the code. This did not work properly in goldmark and I fixed that. However, if you have a code like this ``` *.some.text ..``` ..foo .[t]foo ..``` ``` what should happen? I decided that it should be two spaces, as the tab is not "completely" in the code block. Similarly, what should happen in this case ``` *.some.text ..``` ..foo .[t][tb]foo ..``` ``` I decided that it should be first three spaces and then tab. Not sure what even is the correct solution here... The crux of the fix is - text segments don't have just padding, but also remember what chars is the padding and then print that, if they are called to do so in the code blocks. In other cases, the paddingChars are ignored. This should fix #177 .
112 lines
3 KiB
Go
112 lines
3 KiB
Go
package parser
|
|
|
|
import (
|
|
"bytes"
|
|
|
|
"github.com/yuin/goldmark/ast"
|
|
"github.com/yuin/goldmark/text"
|
|
"github.com/yuin/goldmark/util"
|
|
)
|
|
|
|
type fencedCodeBlockParser struct {
|
|
}
|
|
|
|
var defaultFencedCodeBlockParser = &fencedCodeBlockParser{}
|
|
|
|
// NewFencedCodeBlockParser returns a new BlockParser that
|
|
// parses fenced code blocks.
|
|
func NewFencedCodeBlockParser() BlockParser {
|
|
return defaultFencedCodeBlockParser
|
|
}
|
|
|
|
type fenceData struct {
|
|
char byte
|
|
indent int
|
|
length int
|
|
node ast.Node
|
|
}
|
|
|
|
var fencedCodeBlockInfoKey = NewContextKey()
|
|
|
|
func (b *fencedCodeBlockParser) Trigger() []byte {
|
|
return []byte{'~', '`'}
|
|
}
|
|
|
|
func (b *fencedCodeBlockParser) Open(parent ast.Node, reader text.Reader, pc Context) (ast.Node, State) {
|
|
line, segment := reader.PeekLine()
|
|
pos := pc.BlockOffset()
|
|
if pos < 0 || (line[pos] != '`' && line[pos] != '~') {
|
|
return nil, NoChildren
|
|
}
|
|
findent := pos
|
|
fenceChar := line[pos]
|
|
i := pos
|
|
for ; i < len(line) && line[i] == fenceChar; i++ {
|
|
}
|
|
oFenceLength := i - pos
|
|
if oFenceLength < 3 {
|
|
return nil, NoChildren
|
|
}
|
|
var info *ast.Text
|
|
if i < len(line)-1 {
|
|
rest := line[i:]
|
|
left := util.TrimLeftSpaceLength(rest)
|
|
right := util.TrimRightSpaceLength(rest)
|
|
if left < len(rest)-right {
|
|
infoStart, infoStop := segment.Start-segment.Padding+i+left, segment.Stop-right
|
|
value := rest[left : len(rest)-right]
|
|
if fenceChar == '`' && bytes.IndexByte(value, '`') > -1 {
|
|
return nil, NoChildren
|
|
} else if infoStart != infoStop {
|
|
info = ast.NewTextSegment(text.NewSegment(infoStart, infoStop))
|
|
}
|
|
}
|
|
}
|
|
node := ast.NewFencedCodeBlock(info)
|
|
pc.Set(fencedCodeBlockInfoKey, &fenceData{fenceChar, findent, oFenceLength, node})
|
|
return node, NoChildren
|
|
|
|
}
|
|
|
|
func (b *fencedCodeBlockParser) Continue(node ast.Node, reader text.Reader, pc Context) State {
|
|
line, segment := reader.PeekLine()
|
|
|
|
fdata := pc.Get(fencedCodeBlockInfoKey).(*fenceData)
|
|
w, pos := util.IndentWidth(line, reader.LineOffset())
|
|
if w < 4 {
|
|
i := pos
|
|
for ; i < len(line) && line[i] == fdata.char; i++ {
|
|
}
|
|
length := i - pos
|
|
if length >= fdata.length && util.IsBlank(line[i:]) {
|
|
newline := 1
|
|
if line[len(line)-1] != '\n' {
|
|
newline = 0
|
|
}
|
|
reader.Advance(segment.Stop - segment.Start - newline - segment.Padding)
|
|
return Close
|
|
}
|
|
}
|
|
|
|
pos, padding, chars := util.DedentPositionPadding(line, reader.LineOffset(), segment.Padding, fdata.indent, segment.PaddingChars)
|
|
seg := text.NewSegmentPadding(segment.Start+pos, segment.Stop, padding, chars)
|
|
seg = seg.WithRenderPaddingTabs()
|
|
node.Lines().Append(seg)
|
|
reader.AdvanceAndSetPadding(segment.Stop-segment.Start-pos-1, padding, chars)
|
|
return Continue | NoChildren
|
|
}
|
|
|
|
func (b *fencedCodeBlockParser) Close(node ast.Node, reader text.Reader, pc Context) {
|
|
fdata := pc.Get(fencedCodeBlockInfoKey).(*fenceData)
|
|
if fdata.node == node {
|
|
pc.Set(fencedCodeBlockInfoKey, nil)
|
|
}
|
|
}
|
|
|
|
func (b *fencedCodeBlockParser) CanInterruptParagraph() bool {
|
|
return true
|
|
}
|
|
|
|
func (b *fencedCodeBlockParser) CanAcceptIndentedLine() bool {
|
|
return false
|
|
}
|