Skip to content

Commit 157d370

Browse files
bepjmooring
andcommitted
Add autoID for definition terms
Fixes #13403 See #11566 Co-authored-by: Joe Mooring <joe@mooring.com>
1 parent 9c2f8ec commit 157d370

File tree

9 files changed

+261
-46
lines changed

9 files changed

+261
-46
lines changed

‎markup/goldmark/autoid.go

+33-7
Original file line numberDiff line numberDiff line change
@@ -26,6 +26,7 @@ import (
2626
"github.com/gohugoio/hugo/common/text"
2727

2828
"github.com/yuin/goldmark/ast"
29+
east "github.com/yuin/goldmark/extension/ast"
2930
"github.com/yuin/goldmark/parser"
3031
"github.com/yuin/goldmark/util"
3132

@@ -43,11 +44,11 @@ func sanitizeAnchorName(b []byte, idType string) []byte {
4344
func sanitizeAnchorNameWithHook(b []byte, idType string, hook func(buf *bytes.Buffer)) []byte {
4445
buf := bp.GetBuffer()
4546

46-
if idType == goldmark_config.AutoHeadingIDTypeBlackfriday {
47+
if idType == goldmark_config.AutoIDTypeBlackfriday {
4748
// TODO(bep) make it more efficient.
4849
buf.WriteString(blackfriday.SanitizedAnchorName(string(b)))
4950
} else {
50-
asciiOnly := idType == goldmark_config.AutoHeadingIDTypeGitHubAscii
51+
asciiOnly := idType == goldmark_config.AutoIDTypeGitHubAscii
5152

5253
if asciiOnly {
5354
// Normalize it to preserve accents if possible.
@@ -90,8 +91,9 @@ func isAlphaNumeric(r rune) bool {
9091
var _ parser.IDs = (*idFactory)(nil)
9192

9293
type idFactory struct {
93-
idType string
94-
vals map[string]struct{}
94+
idType string
95+
vals map[string]struct{}
96+
duplicates []string
9597
}
9698

9799
func newIDFactory(idType string) *idFactory {
@@ -101,11 +103,28 @@ func newIDFactory(idType string) *idFactory {
101103
}
102104
}
103105

106+
type stringValuesProvider interface {
107+
StringValues() []string
108+
}
109+
110+
var _ stringValuesProvider = (*idFactory)(nil)
111+
112+
func (ids *idFactory) StringValues() []string {
113+
values := make([]string, 0, len(ids.vals))
114+
for k := range ids.vals {
115+
values = append(values, k)
116+
}
117+
values = append(values, ids.duplicates...)
118+
return values
119+
}
120+
104121
func (ids *idFactory) Generate(value []byte, kind ast.NodeKind) []byte {
105122
return sanitizeAnchorNameWithHook(value, ids.idType, func(buf *bytes.Buffer) {
106123
if buf.Len() == 0 {
107124
if kind == ast.KindHeading {
108125
buf.WriteString("heading")
126+
} else if kind == east.KindDefinitionTerm {
127+
buf.WriteString("term")
109128
} else {
110129
buf.WriteString("id")
111130
}
@@ -123,11 +142,18 @@ func (ids *idFactory) Generate(value []byte, kind ast.NodeKind) []byte {
123142
buf.Truncate(pos)
124143
}
125144
}
126-
127-
ids.vals[buf.String()] = struct{}{}
145+
ids.put(buf.String())
128146
})
129147
}
130148

149+
func (ids *idFactory) put(s string) {
150+
if _, found := ids.vals[s]; found {
151+
ids.duplicates = append(ids.duplicates, s)
152+
} else {
153+
ids.vals[s] = struct{}{}
154+
}
155+
}
156+
131157
func (ids *idFactory) Put(value []byte) {
132-
ids.vals[util.BytesToReadOnlyString(value)] = struct{}{}
158+
ids.put(string(value))
133159
}

‎markup/goldmark/autoid_test.go

+9-9
Original file line numberDiff line numberDiff line change
@@ -78,9 +78,9 @@ tabspace
7878
expect := expectlines[i]
7979
c.Run(input, func(c *qt.C) {
8080
b := []byte(input)
81-
got := string(sanitizeAnchorName(b, goldmark_config.AutoHeadingIDTypeGitHub))
81+
got := string(sanitizeAnchorName(b, goldmark_config.AutoIDTypeGitHub))
8282
c.Assert(got, qt.Equals, expect)
83-
c.Assert(sanitizeAnchorNameString(input, goldmark_config.AutoHeadingIDTypeGitHub), qt.Equals, expect)
83+
c.Assert(sanitizeAnchorNameString(input, goldmark_config.AutoIDTypeGitHub), qt.Equals, expect)
8484
c.Assert(string(b), qt.Equals, input)
8585
})
8686
}
@@ -89,20 +89,20 @@ tabspace
8989
func TestSanitizeAnchorNameAsciiOnly(t *testing.T) {
9090
c := qt.New(t)
9191

92-
c.Assert(sanitizeAnchorNameString("god is神真美好 good", goldmark_config.AutoHeadingIDTypeGitHubAscii), qt.Equals, "god-is-good")
93-
c.Assert(sanitizeAnchorNameString("Resumé", goldmark_config.AutoHeadingIDTypeGitHubAscii), qt.Equals, "resume")
92+
c.Assert(sanitizeAnchorNameString("god is神真美好 good", goldmark_config.AutoIDTypeGitHubAscii), qt.Equals, "god-is-good")
93+
c.Assert(sanitizeAnchorNameString("Resumé", goldmark_config.AutoIDTypeGitHubAscii), qt.Equals, "resume")
9494
}
9595

9696
func TestSanitizeAnchorNameBlackfriday(t *testing.T) {
9797
c := qt.New(t)
98-
c.Assert(sanitizeAnchorNameString("Let's try this, shall we?", goldmark_config.AutoHeadingIDTypeBlackfriday), qt.Equals, "let-s-try-this-shall-we")
98+
c.Assert(sanitizeAnchorNameString("Let's try this, shall we?", goldmark_config.AutoIDTypeBlackfriday), qt.Equals, "let-s-try-this-shall-we")
9999
}
100100

101101
func BenchmarkSanitizeAnchorName(b *testing.B) {
102102
input := []byte("God is good: 神真美好")
103103
b.ResetTimer()
104104
for i := 0; i < b.N; i++ {
105-
result := sanitizeAnchorName(input, goldmark_config.AutoHeadingIDTypeGitHub)
105+
result := sanitizeAnchorName(input, goldmark_config.AutoIDTypeGitHub)
106106
if len(result) != 24 {
107107
b.Fatalf("got %d", len(result))
108108
}
@@ -113,7 +113,7 @@ func BenchmarkSanitizeAnchorNameAsciiOnly(b *testing.B) {
113113
input := []byte("God is good: 神真美好")
114114
b.ResetTimer()
115115
for i := 0; i < b.N; i++ {
116-
result := sanitizeAnchorName(input, goldmark_config.AutoHeadingIDTypeGitHubAscii)
116+
result := sanitizeAnchorName(input, goldmark_config.AutoIDTypeGitHubAscii)
117117
if len(result) != 12 {
118118
b.Fatalf("got %d", len(result))
119119
}
@@ -124,7 +124,7 @@ func BenchmarkSanitizeAnchorNameBlackfriday(b *testing.B) {
124124
input := []byte("God is good: 神真美好")
125125
b.ResetTimer()
126126
for i := 0; i < b.N; i++ {
127-
result := sanitizeAnchorName(input, goldmark_config.AutoHeadingIDTypeBlackfriday)
127+
result := sanitizeAnchorName(input, goldmark_config.AutoIDTypeBlackfriday)
128128
if len(result) != 24 {
129129
b.Fatalf("got %d", len(result))
130130
}
@@ -135,7 +135,7 @@ func BenchmarkSanitizeAnchorNameString(b *testing.B) {
135135
input := "God is good: 神真美好"
136136
b.ResetTimer()
137137
for i := 0; i < b.N; i++ {
138-
result := sanitizeAnchorNameString(input, goldmark_config.AutoHeadingIDTypeGitHub)
138+
result := sanitizeAnchorNameString(input, goldmark_config.AutoIDTypeGitHub)
139139
if len(result) != 24 {
140140
b.Fatalf("got %d", len(result))
141141
}

‎markup/goldmark/convert.go

+4-8
Original file line numberDiff line numberDiff line change
@@ -61,7 +61,7 @@ func (p provide) New(cfg converter.ProviderConfig) (converter.Provider, error) {
6161
cfg: cfg,
6262
md: md,
6363
sanitizeAnchorName: func(s string) string {
64-
return sanitizeAnchorNameString(s, cfg.MarkupConfig().Goldmark.Parser.AutoHeadingIDType)
64+
return sanitizeAnchorNameString(s, cfg.MarkupConfig().Goldmark.Parser.AutoIDType)
6565
},
6666
}, nil
6767
}), nil
@@ -188,16 +188,12 @@ func newMarkdown(pcfg converter.ProviderConfig) goldmark.Markdown {
188188
extensions = append(extensions, emoji.Emoji)
189189
}
190190

191-
if cfg.Parser.AutoHeadingID {
192-
parserOptions = append(parserOptions, parser.WithAutoHeadingID())
193-
}
194-
195191
if cfg.Parser.Attribute.Title {
196192
parserOptions = append(parserOptions, parser.WithAttribute())
197193
}
198194

199-
if cfg.Parser.Attribute.Block {
200-
extensions = append(extensions, attributes.New())
195+
if cfg.Parser.Attribute.Block || cfg.Parser.AutoHeadingID || cfg.Parser.AutoDefinitionTermID {
196+
extensions = append(extensions, attributes.New(cfg.Parser))
201197
}
202198

203199
md := goldmark.New(
@@ -295,7 +291,7 @@ func (c *goldmarkConverter) Convert(ctx converter.RenderContext) (converter.Resu
295291
}
296292

297293
func (c *goldmarkConverter) newParserContext(rctx converter.RenderContext) *parserContext {
298-
ctx := parser.NewContext(parser.WithIDs(newIDFactory(c.cfg.MarkupConfig().Goldmark.Parser.AutoHeadingIDType)))
294+
ctx := parser.NewContext(parser.WithIDs(newIDFactory(c.cfg.MarkupConfig().Goldmark.Parser.AutoIDType)))
299295
ctx.Set(tocEnableKey, rctx.RenderTOC)
300296
return &parserContext{
301297
Context: ctx,

‎markup/goldmark/goldmark_config/config.go

+32-7
Original file line numberDiff line numberDiff line change
@@ -15,9 +15,9 @@
1515
package goldmark_config
1616

1717
const (
18-
AutoHeadingIDTypeGitHub = "github"
19-
AutoHeadingIDTypeGitHubAscii = "github-ascii"
20-
AutoHeadingIDTypeBlackfriday = "blackfriday"
18+
AutoIDTypeGitHub = "github"
19+
AutoIDTypeGitHubAscii = "github-ascii"
20+
AutoIDTypeBlackfriday = "blackfriday"
2121
)
2222

2323
// Default holds the default Goldmark configuration.
@@ -79,7 +79,8 @@ var Default = Config{
7979
},
8080
Parser: Parser{
8181
AutoHeadingID: true,
82-
AutoHeadingIDType: AutoHeadingIDTypeGitHub,
82+
AutoDefinitionTermID: false,
83+
AutoIDType: AutoIDTypeGitHub,
8384
WrapStandAloneImageWithinParagraph: true,
8485
Attribute: ParserAttribute{
8586
Title: true,
@@ -97,6 +98,16 @@ type Config struct {
9798
RenderHooks RenderHooks
9899
}
99100

101+
func (c *Config) Init() error {
102+
if err := c.Parser.Init(); err != nil {
103+
return err
104+
}
105+
if c.Parser.AutoDefinitionTermID && !c.Extensions.DefinitionList {
106+
c.Parser.AutoDefinitionTermID = false
107+
}
108+
return nil
109+
}
110+
100111
// RenderHooks contains configuration for Goldmark render hooks.
101112
type RenderHooks struct {
102113
Image ImageRenderHook
@@ -250,16 +261,30 @@ type Parser struct {
250261
// auto generated heading ids.
251262
AutoHeadingID bool
252263

253-
// The strategy to use when generating heading IDs.
254-
// Available options are "github", "github-ascii".
264+
// Enables auto definition term ids.
265+
AutoDefinitionTermID bool
266+
267+
// The strategy to use when generating IDs.
268+
// Available options are "github", "github-ascii", and "blackfriday".
255269
// Default is "github", which will create GitHub-compatible anchor names.
256-
AutoHeadingIDType string
270+
AutoIDType string
257271

258272
// Enables custom attributes.
259273
Attribute ParserAttribute
260274

261275
// Whether to wrap stand-alone images within a paragraph or not.
262276
WrapStandAloneImageWithinParagraph bool
277+
278+
// Renamed to AutoIDType in 0.144.0.
279+
AutoHeadingIDType string `json:"-"`
280+
}
281+
282+
func (p *Parser) Init() error {
283+
// Renamed from AutoHeadingIDType to AutoIDType in 0.144.0.
284+
if p.AutoHeadingIDType != "" {
285+
p.AutoIDType = p.AutoHeadingIDType
286+
}
287+
return nil
263288
}
264289

265290
type ParserAttribute struct {

‎markup/goldmark/internal/extensions/attributes/attributes.go

+79-12
Original file line numberDiff line numberDiff line change
@@ -1,8 +1,11 @@
11
package attributes
22

33
import (
4+
"github.com/gohugoio/hugo/markup/goldmark/goldmark_config"
5+
"github.com/gohugoio/hugo/markup/goldmark/internal/render"
46
"github.com/yuin/goldmark"
57
"github.com/yuin/goldmark/ast"
8+
east "github.com/yuin/goldmark/extension/ast"
69
"github.com/yuin/goldmark/parser"
710
"github.com/yuin/goldmark/text"
811
"github.com/yuin/goldmark/util"
@@ -14,24 +17,29 @@ import (
1417

1518
var (
1619
kindAttributesBlock = ast.NewNodeKind("AttributesBlock")
20+
attrNameID = []byte("id")
1721

18-
defaultParser = new(attrParser)
19-
defaultTransformer = new(transformer)
20-
attributes goldmark.Extender = new(attrExtension)
22+
defaultParser = new(attrParser)
2123
)
2224

23-
func New() goldmark.Extender {
24-
return attributes
25+
func New(cfg goldmark_config.Parser) goldmark.Extender {
26+
return &attrExtension{cfg: cfg}
2527
}
2628

27-
type attrExtension struct{}
29+
type attrExtension struct {
30+
cfg goldmark_config.Parser
31+
}
2832

2933
func (a *attrExtension) Extend(m goldmark.Markdown) {
34+
if a.cfg.Attribute.Block {
35+
m.Parser().AddOptions(
36+
parser.WithBlockParsers(
37+
util.Prioritized(defaultParser, 100)),
38+
)
39+
}
3040
m.Parser().AddOptions(
31-
parser.WithBlockParsers(
32-
util.Prioritized(defaultParser, 100)),
3341
parser.WithASTTransformers(
34-
util.Prioritized(defaultTransformer, 100),
42+
util.Prioritized(&transformer{cfg: a.cfg}, 100),
3543
),
3644
)
3745
}
@@ -92,18 +100,47 @@ func (a *attributesBlock) Kind() ast.NodeKind {
92100
return kindAttributesBlock
93101
}
94102

95-
type transformer struct{}
103+
type transformer struct {
104+
cfg goldmark_config.Parser
105+
}
106+
107+
func (a *transformer) isFragmentNode(n ast.Node) bool {
108+
switch n.Kind() {
109+
case east.KindDefinitionTerm, ast.KindHeading:
110+
return true
111+
default:
112+
return false
113+
}
114+
}
96115

97116
func (a *transformer) Transform(node *ast.Document, reader text.Reader, pc parser.Context) {
98-
attributes := make([]ast.Node, 0, 500)
117+
var attributes []ast.Node
118+
if a.cfg.Attribute.Block {
119+
attributes = make([]ast.Node, 0, 500)
120+
}
99121
ast.Walk(node, func(node ast.Node, entering bool) (ast.WalkStatus, error) {
100-
if entering && node.Kind() == kindAttributesBlock {
122+
if !entering {
123+
return ast.WalkContinue, nil
124+
}
125+
126+
if a.isFragmentNode(node) {
127+
if id, found := node.Attribute(attrNameID); !found {
128+
a.generateAutoID(node, reader, pc)
129+
} else {
130+
pc.IDs().Put(id.([]byte))
131+
}
132+
}
133+
134+
if a.cfg.Attribute.Block && node.Kind() == kindAttributesBlock {
101135
// Attributes for fenced code blocks are handled in their own extension,
102136
// but note that we currently only support code block attributes when
103137
// CodeFences=true.
104138
if node.PreviousSibling() != nil && node.PreviousSibling().Kind() != ast.KindFencedCodeBlock && !node.HasBlankPreviousLines() {
105139
attributes = append(attributes, node)
106140
return ast.WalkSkipChildren, nil
141+
} else {
142+
// remove attributes node
143+
node.Parent().RemoveChild(node.Parent(), node)
107144
}
108145
}
109146

@@ -123,3 +160,33 @@ func (a *transformer) Transform(node *ast.Document, reader text.Reader, pc parse
123160
attr.Parent().RemoveChild(attr.Parent(), attr)
124161
}
125162
}
163+
164+
func (a *transformer) generateAutoID(n ast.Node, reader text.Reader, pc parser.Context) {
165+
var text []byte
166+
switch n := n.(type) {
167+
case *ast.Heading:
168+
if a.cfg.AutoHeadingID {
169+
text = textHeadingID(n, reader)
170+
}
171+
case *east.DefinitionTerm:
172+
if a.cfg.AutoDefinitionTermID {
173+
text = []byte(render.TextPlain(n, reader.Source()))
174+
}
175+
}
176+
177+
if len(text) > 0 {
178+
headingID := pc.IDs().Generate(text, n.Kind())
179+
n.SetAttribute(attrNameID, headingID)
180+
}
181+
}
182+
183+
// Markdown settext headers can have multiple lines, use the last line for the ID.
184+
func textHeadingID(node *ast.Heading, reader text.Reader) []byte {
185+
var line []byte
186+
lastIndex := node.Lines().Len() - 1
187+
if lastIndex > -1 {
188+
lastLine := node.Lines().At(lastIndex)
189+
line = lastLine.Value(reader.Source())
190+
}
191+
return line
192+
}

0 commit comments

Comments
 (0)