1
1
mirror of https://github.com/go-gitea/gitea synced 2025-01-25 00:54:27 +00:00
gitea/modules/util/truncate.go

106 lines
3.2 KiB
Go
Raw Normal View History

// Copyright 2021 The Gitea Authors. All rights reserved.
// SPDX-License-Identifier: MIT
package util
import (
"strings"
"unicode/utf8"
)
// in UTF8 "…" is 3 bytes so doesn't really gain us anything...
const (
utf8Ellipsis = "…"
asciiEllipsis = "..."
)
2024-12-26 11:56:03 +08:00
func IsLikelyEllipsisLeftPart(s string) bool {
return strings.HasSuffix(s, utf8Ellipsis) || strings.HasSuffix(s, asciiEllipsis)
}
2024-12-26 11:56:03 +08:00
// EllipsisDisplayString returns a truncated short string for display purpose.
// The length is the approximate number of ASCII-width in the string (CJK/emoji are 2-ASCII width)
// It appends "…" or "..." at the end of truncated string.
// It guarantees the length of the returned runes doesn't exceed the limit.
func EllipsisDisplayString(str string, limit int) string {
s, _, _, _ := ellipsisDisplayString(str, limit)
return s
}
2024-12-26 11:56:03 +08:00
// EllipsisDisplayStringX works like EllipsisDisplayString while it also returns the right part
func EllipsisDisplayStringX(str string, limit int) (left, right string) {
left, offset, truncated, encounterInvalid := ellipsisDisplayString(str, limit)
if truncated {
right = str[offset:]
r, _ := utf8.DecodeRune(UnsafeStringToBytes(right))
encounterInvalid = encounterInvalid || r == utf8.RuneError
ellipsis := utf8Ellipsis
if encounterInvalid {
ellipsis = asciiEllipsis
}
2024-12-26 11:56:03 +08:00
right = ellipsis + right
}
2024-12-26 11:56:03 +08:00
return left, right
}
2024-12-26 11:56:03 +08:00
func ellipsisDisplayString(str string, limit int) (res string, offset int, truncated, encounterInvalid bool) {
if len(str) <= limit {
return str, len(str), false, false
}
// To future maintainers: this logic must guarantee that the length of the returned runes doesn't exceed the limit,
// because the returned string will also be used as database value. UTF-8 VARCHAR(10) could store 10 rune characters,
// So each rune must be countered as at least 1 width.
// Even if there are some special Unicode characters (zero-width, combining, etc.), they should NEVER be counted as zero.
pos, used := 0, 0
for i, r := range str {
encounterInvalid = encounterInvalid || r == utf8.RuneError
pos = i
runeWidth := 1
if r >= 128 {
runeWidth = 2 // CJK/emoji chars are considered as 2-ASCII width
}
if used+runeWidth+3 > limit {
break
}
2024-12-26 11:56:03 +08:00
used += runeWidth
offset += utf8.RuneLen(r)
}
// if the remaining are fewer than 3 runes, then maybe we could add them, no need to ellipse
if len(str)-pos <= 12 {
var nextCnt, nextWidth int
for _, r := range str[pos:] {
if nextCnt >= 4 {
break
}
nextWidth++
if r >= 128 {
nextWidth++ // CJK/emoji chars are considered as 2-ASCII width
}
nextCnt++
}
if nextCnt <= 3 && used+nextWidth <= limit {
return str, len(str), false, false
}
}
if limit < 3 {
// if the limit is so small, do not add ellipsis
return str[:offset], offset, true, false
}
2024-12-26 11:56:03 +08:00
ellipsis := utf8Ellipsis
if encounterInvalid {
ellipsis = asciiEllipsis
}
return str[:offset] + ellipsis, offset, true, encounterInvalid
}
2024-12-26 11:56:03 +08:00
// TruncateRunes returns a truncated string with given rune limit,
// it returns input string if its rune length doesn't exceed the limit.
func TruncateRunes(str string, limit int) string {
if utf8.RuneCountInString(str) < limit {
return str
}
return string([]rune(str)[:limit])
}