mirror of
https://codeberg.org/davrot/forgejo.git
synced 2025-05-17 23:00:02 +02:00
feat: highlighted code search results (#4749)
Closes #4534.
<details><summary>Screenshots</summary></details>
Reviewed-on: https://codeberg.org/forgejo/forgejo/pulls/4749
Reviewed-by: 0ko <0ko@noreply.codeberg.org>
Co-authored-by: Shiny Nematoda <snematoda.751k2@aleeas.com>
Co-committed-by: Shiny Nematoda <snematoda.751k2@aleeas.com>
This commit is contained in:
parent
517637137c
commit
06d2e90fa4
10 changed files with 214 additions and 75 deletions
|
@ -337,7 +337,7 @@ func (diffSection *DiffSection) GetComputedInlineDiffFor(diffLine *DiffLine, loc
|
|||
return DiffInlineWithHighlightCode(diffSection.FileName, language, diffLine.Content, locale)
|
||||
}
|
||||
|
||||
hcd := newHighlightCodeDiff()
|
||||
hcd := NewHighlightCodeDiff()
|
||||
diffRecord := hcd.diffWithHighlight(diffSection.FileName, language, diff1[1:], diff2[1:])
|
||||
// it seems that Gitea doesn't need the line wrapper of Chroma, so do not add them back
|
||||
// if the line wrappers are still needed in the future, it can be added back by "diffToHTML(hcd.lineWrapperTags. ...)"
|
||||
|
|
|
@ -31,17 +31,17 @@ func extractHTMLToken(s string) (before, token, after string, valid bool) {
|
|||
return "", "", s, true
|
||||
}
|
||||
|
||||
// highlightCodeDiff is used to do diff with highlighted HTML code.
|
||||
// HighlightCodeDiff is used to do diff with highlighted HTML code.
|
||||
// It totally depends on Chroma's valid HTML output and its structure, do not use these functions for other purposes.
|
||||
// The HTML tags and entities will be replaced by Unicode placeholders: "<span>{TEXT}</span>" => "\uE000{TEXT}\uE001"
|
||||
// These Unicode placeholders are friendly to the diff.
|
||||
// Then after diff, the placeholders in diff result will be recovered to the HTML tags and entities.
|
||||
// It's guaranteed that the tags in final diff result are paired correctly.
|
||||
type highlightCodeDiff struct {
|
||||
type HighlightCodeDiff struct {
|
||||
placeholderBegin rune
|
||||
placeholderMaxCount int
|
||||
placeholderIndex int
|
||||
placeholderTokenMap map[rune]string
|
||||
PlaceholderTokenMap map[rune]string
|
||||
tokenPlaceholderMap map[string]rune
|
||||
|
||||
placeholderOverflowCount int
|
||||
|
@ -49,52 +49,52 @@ type highlightCodeDiff struct {
|
|||
lineWrapperTags []string
|
||||
}
|
||||
|
||||
func newHighlightCodeDiff() *highlightCodeDiff {
|
||||
return &highlightCodeDiff{
|
||||
func NewHighlightCodeDiff() *HighlightCodeDiff {
|
||||
return &HighlightCodeDiff{
|
||||
placeholderBegin: rune(0x100000), // Plane 16: Supplementary Private Use Area B (U+100000..U+10FFFD)
|
||||
placeholderMaxCount: 64000,
|
||||
placeholderTokenMap: map[rune]string{},
|
||||
PlaceholderTokenMap: map[rune]string{},
|
||||
tokenPlaceholderMap: map[string]rune{},
|
||||
}
|
||||
}
|
||||
|
||||
// nextPlaceholder returns 0 if no more placeholder can be used
|
||||
// NextPlaceholder returns 0 if no more placeholder can be used
|
||||
// the diff is done line by line, usually there are only a few (no more than 10) placeholders in one line
|
||||
// so the placeholderMaxCount is impossible to be exhausted in real cases.
|
||||
func (hcd *highlightCodeDiff) nextPlaceholder() rune {
|
||||
func (hcd *HighlightCodeDiff) NextPlaceholder() rune {
|
||||
for hcd.placeholderIndex < hcd.placeholderMaxCount {
|
||||
r := hcd.placeholderBegin + rune(hcd.placeholderIndex)
|
||||
hcd.placeholderIndex++
|
||||
// only use non-existing (not used by code) rune as placeholders
|
||||
if _, ok := hcd.placeholderTokenMap[r]; !ok {
|
||||
if _, ok := hcd.PlaceholderTokenMap[r]; !ok {
|
||||
return r
|
||||
}
|
||||
}
|
||||
return 0 // no more available placeholder
|
||||
}
|
||||
|
||||
func (hcd *highlightCodeDiff) isInPlaceholderRange(r rune) bool {
|
||||
func (hcd *HighlightCodeDiff) isInPlaceholderRange(r rune) bool {
|
||||
return hcd.placeholderBegin <= r && r < hcd.placeholderBegin+rune(hcd.placeholderMaxCount)
|
||||
}
|
||||
|
||||
func (hcd *highlightCodeDiff) collectUsedRunes(code string) {
|
||||
func (hcd *HighlightCodeDiff) CollectUsedRunes(code string) {
|
||||
for _, r := range code {
|
||||
if hcd.isInPlaceholderRange(r) {
|
||||
// put the existing rune (used by code) in map, then this rune won't be used as a placeholder anymore.
|
||||
hcd.placeholderTokenMap[r] = ""
|
||||
hcd.PlaceholderTokenMap[r] = ""
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
func (hcd *highlightCodeDiff) diffWithHighlight(filename, language, codeA, codeB string) []diffmatchpatch.Diff {
|
||||
hcd.collectUsedRunes(codeA)
|
||||
hcd.collectUsedRunes(codeB)
|
||||
func (hcd *HighlightCodeDiff) diffWithHighlight(filename, language, codeA, codeB string) []diffmatchpatch.Diff {
|
||||
hcd.CollectUsedRunes(codeA)
|
||||
hcd.CollectUsedRunes(codeB)
|
||||
|
||||
highlightCodeA, _ := highlight.Code(filename, language, codeA)
|
||||
highlightCodeB, _ := highlight.Code(filename, language, codeB)
|
||||
|
||||
convertedCodeA := hcd.convertToPlaceholders(string(highlightCodeA))
|
||||
convertedCodeB := hcd.convertToPlaceholders(string(highlightCodeB))
|
||||
convertedCodeA := hcd.ConvertToPlaceholders(string(highlightCodeA))
|
||||
convertedCodeB := hcd.ConvertToPlaceholders(string(highlightCodeB))
|
||||
|
||||
diffs := diffMatchPatch.DiffMain(convertedCodeA, convertedCodeB, true)
|
||||
diffs = diffMatchPatch.DiffCleanupEfficiency(diffs)
|
||||
|
@ -106,7 +106,7 @@ func (hcd *highlightCodeDiff) diffWithHighlight(filename, language, codeA, codeB
|
|||
}
|
||||
|
||||
// convertToPlaceholders totally depends on Chroma's valid HTML output and its structure, do not use these functions for other purposes.
|
||||
func (hcd *highlightCodeDiff) convertToPlaceholders(htmlCode string) string {
|
||||
func (hcd *HighlightCodeDiff) ConvertToPlaceholders(htmlCode string) string {
|
||||
var tagStack []string
|
||||
res := strings.Builder{}
|
||||
|
||||
|
@ -153,10 +153,10 @@ func (hcd *highlightCodeDiff) convertToPlaceholders(htmlCode string) string {
|
|||
// remember the placeholder and token in the map
|
||||
placeholder, ok := hcd.tokenPlaceholderMap[tokenInMap]
|
||||
if !ok {
|
||||
placeholder = hcd.nextPlaceholder()
|
||||
placeholder = hcd.NextPlaceholder()
|
||||
if placeholder != 0 {
|
||||
hcd.tokenPlaceholderMap[tokenInMap] = placeholder
|
||||
hcd.placeholderTokenMap[placeholder] = tokenInMap
|
||||
hcd.PlaceholderTokenMap[placeholder] = tokenInMap
|
||||
}
|
||||
}
|
||||
|
||||
|
@ -179,12 +179,16 @@ func (hcd *highlightCodeDiff) convertToPlaceholders(htmlCode string) string {
|
|||
return res.String()
|
||||
}
|
||||
|
||||
func (hcd *highlightCodeDiff) recoverOneDiff(diff *diffmatchpatch.Diff) {
|
||||
func (hcd *HighlightCodeDiff) recoverOneDiff(diff *diffmatchpatch.Diff) {
|
||||
diff.Text = hcd.Recover(diff.Text)
|
||||
}
|
||||
|
||||
func (hcd *HighlightCodeDiff) Recover(src string) string {
|
||||
sb := strings.Builder{}
|
||||
var tagStack []string
|
||||
|
||||
for _, r := range diff.Text {
|
||||
token, ok := hcd.placeholderTokenMap[r]
|
||||
for _, r := range src {
|
||||
token, ok := hcd.PlaceholderTokenMap[r]
|
||||
if !ok || token == "" {
|
||||
sb.WriteRune(r) // if the rune is not a placeholder, write it as it is
|
||||
continue
|
||||
|
@ -218,5 +222,5 @@ func (hcd *highlightCodeDiff) recoverOneDiff(diff *diffmatchpatch.Diff) {
|
|||
}
|
||||
}
|
||||
|
||||
diff.Text = sb.String()
|
||||
return sb.String()
|
||||
}
|
||||
|
|
|
@ -13,7 +13,7 @@ import (
|
|||
)
|
||||
|
||||
func TestDiffWithHighlight(t *testing.T) {
|
||||
hcd := newHighlightCodeDiff()
|
||||
hcd := NewHighlightCodeDiff()
|
||||
diffs := hcd.diffWithHighlight(
|
||||
"main.v", "",
|
||||
" run('<>')\n",
|
||||
|
@ -28,9 +28,9 @@ func TestDiffWithHighlight(t *testing.T) {
|
|||
output = diffToHTML(nil, diffs, DiffLineAdd)
|
||||
assert.Equal(t, expected, output)
|
||||
|
||||
hcd = newHighlightCodeDiff()
|
||||
hcd.placeholderTokenMap['O'] = "<span>"
|
||||
hcd.placeholderTokenMap['C'] = "</span>"
|
||||
hcd = NewHighlightCodeDiff()
|
||||
hcd.PlaceholderTokenMap['O'] = "<span>"
|
||||
hcd.PlaceholderTokenMap['C'] = "</span>"
|
||||
diff := diffmatchpatch.Diff{}
|
||||
|
||||
diff.Text = "OC"
|
||||
|
@ -47,20 +47,20 @@ func TestDiffWithHighlight(t *testing.T) {
|
|||
}
|
||||
|
||||
func TestDiffWithHighlightPlaceholder(t *testing.T) {
|
||||
hcd := newHighlightCodeDiff()
|
||||
hcd := NewHighlightCodeDiff()
|
||||
diffs := hcd.diffWithHighlight(
|
||||
"main.js", "",
|
||||
"a='\U00100000'",
|
||||
"a='\U0010FFFD''",
|
||||
)
|
||||
assert.Equal(t, "", hcd.placeholderTokenMap[0x00100000])
|
||||
assert.Equal(t, "", hcd.placeholderTokenMap[0x0010FFFD])
|
||||
assert.Equal(t, "", hcd.PlaceholderTokenMap[0x00100000])
|
||||
assert.Equal(t, "", hcd.PlaceholderTokenMap[0x0010FFFD])
|
||||
|
||||
expected := fmt.Sprintf(`<span class="nx">a</span><span class="o">=</span><span class="s1">'</span><span class="removed-code">%s</span>'`, "\U00100000")
|
||||
output := diffToHTML(hcd.lineWrapperTags, diffs, DiffLineDel)
|
||||
assert.Equal(t, expected, output)
|
||||
|
||||
hcd = newHighlightCodeDiff()
|
||||
hcd = NewHighlightCodeDiff()
|
||||
diffs = hcd.diffWithHighlight(
|
||||
"main.js", "",
|
||||
"a='\U00100000'",
|
||||
|
@ -72,7 +72,7 @@ func TestDiffWithHighlightPlaceholder(t *testing.T) {
|
|||
}
|
||||
|
||||
func TestDiffWithHighlightPlaceholderExhausted(t *testing.T) {
|
||||
hcd := newHighlightCodeDiff()
|
||||
hcd := NewHighlightCodeDiff()
|
||||
hcd.placeholderMaxCount = 0
|
||||
diffs := hcd.diffWithHighlight(
|
||||
"main.js", "",
|
||||
|
@ -83,7 +83,7 @@ func TestDiffWithHighlightPlaceholderExhausted(t *testing.T) {
|
|||
expected := fmt.Sprintf(`<span class="removed-code">%s#39;</span>`, "\uFFFD")
|
||||
assert.Equal(t, expected, output)
|
||||
|
||||
hcd = newHighlightCodeDiff()
|
||||
hcd = NewHighlightCodeDiff()
|
||||
hcd.placeholderMaxCount = 0
|
||||
diffs = hcd.diffWithHighlight(
|
||||
"main.js", "",
|
||||
|
@ -102,7 +102,7 @@ func TestDiffWithHighlightPlaceholderExhausted(t *testing.T) {
|
|||
func TestDiffWithHighlightTagMatch(t *testing.T) {
|
||||
totalOverflow := 0
|
||||
for i := 0; i < 100; i++ {
|
||||
hcd := newHighlightCodeDiff()
|
||||
hcd := NewHighlightCodeDiff()
|
||||
hcd.placeholderMaxCount = i
|
||||
diffs := hcd.diffWithHighlight(
|
||||
"main.js", "",
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue