2020-01-04 05:28:19 -05:00
|
|
|
// Copyright 2019 The Hugo Authors. All rights reserved.
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
|
|
|
package goldmark
|
|
|
|
|
|
|
|
import (
|
|
|
|
"bytes"
|
|
|
|
"strconv"
|
|
|
|
"unicode"
|
|
|
|
"unicode/utf8"
|
|
|
|
|
2020-01-05 05:52:00 -05:00
|
|
|
"github.com/gohugoio/hugo/markup/blackfriday"
|
|
|
|
|
2020-01-05 05:29:22 -05:00
|
|
|
"github.com/gohugoio/hugo/markup/goldmark/goldmark_config"
|
|
|
|
|
2020-01-04 05:28:19 -05:00
|
|
|
"github.com/gohugoio/hugo/common/text"
|
|
|
|
|
|
|
|
"github.com/yuin/goldmark/ast"
|
|
|
|
"github.com/yuin/goldmark/parser"
|
|
|
|
"github.com/yuin/goldmark/util"
|
|
|
|
|
|
|
|
bp "github.com/gohugoio/hugo/bufferpool"
|
|
|
|
)
|
|
|
|
|
2020-01-05 05:52:00 -05:00
|
|
|
func sanitizeAnchorNameString(s string, idType string) string {
|
|
|
|
return string(sanitizeAnchorName([]byte(s), idType))
|
2020-01-04 05:28:19 -05:00
|
|
|
}
|
|
|
|
|
2020-01-05 05:52:00 -05:00
|
|
|
func sanitizeAnchorName(b []byte, idType string) []byte {
|
|
|
|
return sanitizeAnchorNameWithHook(b, idType, nil)
|
2020-01-04 05:28:19 -05:00
|
|
|
}
|
|
|
|
|
2020-01-05 05:52:00 -05:00
|
|
|
func sanitizeAnchorNameWithHook(b []byte, idType string, hook func(buf *bytes.Buffer)) []byte {
|
2020-01-04 05:28:19 -05:00
|
|
|
buf := bp.GetBuffer()
|
|
|
|
|
2020-01-05 05:52:00 -05:00
|
|
|
if idType == goldmark_config.AutoHeadingIDTypeBlackfriday {
|
|
|
|
// TODO(bep) make it more efficient.
|
|
|
|
buf.WriteString(blackfriday.SanitizedAnchorName(string(b)))
|
|
|
|
} else {
|
|
|
|
asciiOnly := idType == goldmark_config.AutoHeadingIDTypeGitHubAscii
|
2020-01-04 05:28:19 -05:00
|
|
|
|
2020-01-05 05:52:00 -05:00
|
|
|
if asciiOnly {
|
|
|
|
// Normalize it to preserve accents if possible.
|
|
|
|
b = text.RemoveAccents(b)
|
2020-01-04 05:28:19 -05:00
|
|
|
}
|
|
|
|
|
2020-07-04 17:02:00 -04:00
|
|
|
b = bytes.TrimSpace(b)
|
|
|
|
|
2020-01-05 05:52:00 -05:00
|
|
|
for len(b) > 0 {
|
|
|
|
r, size := utf8.DecodeRune(b)
|
|
|
|
switch {
|
|
|
|
case asciiOnly && size != 1:
|
2020-01-05 09:58:14 -05:00
|
|
|
case r == '-' || r == ' ':
|
2020-01-05 05:52:00 -05:00
|
|
|
buf.WriteRune('-')
|
|
|
|
case isAlphaNumeric(r):
|
|
|
|
buf.WriteRune(unicode.ToLower(r))
|
|
|
|
default:
|
|
|
|
}
|
|
|
|
|
|
|
|
b = b[size:]
|
|
|
|
}
|
2020-01-04 05:28:19 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
if hook != nil {
|
|
|
|
hook(buf)
|
|
|
|
}
|
|
|
|
|
|
|
|
result := make([]byte, buf.Len())
|
|
|
|
copy(result, buf.Bytes())
|
|
|
|
|
|
|
|
bp.PutBuffer(buf)
|
|
|
|
|
|
|
|
return result
|
|
|
|
}
|
|
|
|
|
|
|
|
// isAlphaNumeric reports whether r may appear in a generated ID: an
// underscore, a Unicode letter or a Unicode decimal digit.
func isAlphaNumeric(r rune) bool {
	switch {
	case r == '_':
		return true
	case unicode.IsLetter(r):
		return true
	default:
		return unicode.IsDigit(r)
	}
}
|
|
|
|
|
|
|
|
var _ parser.IDs = (*idFactory)(nil)
|
|
|
|
|
|
|
|
type idFactory struct {
|
2020-01-05 05:52:00 -05:00
|
|
|
idType string
|
|
|
|
vals map[string]struct{}
|
2020-01-04 05:28:19 -05:00
|
|
|
}
|
|
|
|
|
2020-01-05 05:29:22 -05:00
|
|
|
func newIDFactory(idType string) *idFactory {
|
2020-01-04 05:28:19 -05:00
|
|
|
return &idFactory{
|
2020-01-05 05:52:00 -05:00
|
|
|
vals: make(map[string]struct{}),
|
|
|
|
idType: idType,
|
2020-01-04 05:28:19 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (ids *idFactory) Generate(value []byte, kind ast.NodeKind) []byte {
|
2020-01-05 05:52:00 -05:00
|
|
|
return sanitizeAnchorNameWithHook(value, ids.idType, func(buf *bytes.Buffer) {
|
2020-01-04 05:28:19 -05:00
|
|
|
if buf.Len() == 0 {
|
|
|
|
if kind == ast.KindHeading {
|
|
|
|
buf.WriteString("heading")
|
|
|
|
} else {
|
|
|
|
buf.WriteString("id")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if _, found := ids.vals[util.BytesToReadOnlyString(buf.Bytes())]; found {
|
2023-02-18 15:47:35 -05:00
|
|
|
// Append a hyphen and a number, starting with 1.
|
2020-01-04 05:28:19 -05:00
|
|
|
buf.WriteRune('-')
|
|
|
|
pos := buf.Len()
|
|
|
|
for i := 1; ; i++ {
|
|
|
|
buf.WriteString(strconv.Itoa(i))
|
|
|
|
if _, found := ids.vals[util.BytesToReadOnlyString(buf.Bytes())]; !found {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
buf.Truncate(pos)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
ids.vals[buf.String()] = struct{}{}
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
func (ids *idFactory) Put(value []byte) {
|
|
|
|
ids.vals[util.BytesToReadOnlyString(value)] = struct{}{}
|
|
|
|
}
|