2021-07-25 03:59:27 +01:00
// Copyright 2021 The Gitea Authors. All rights reserved.
2022-11-27 13:20:29 -05:00
// SPDX-License-Identifier: MIT
2021-07-25 03:59:27 +01:00
package util
2023-06-05 09:00:12 +02:00
import (
"strings"
"unicode/utf8"
)
2021-07-25 03:59:27 +01:00
2021-12-09 13:41:17 +08:00
// in UTF8 "…" is 3 bytes so doesn't really gain us anything...
2022-01-20 18:46:10 +01:00
const (
utf8Ellipsis = "…"
asciiEllipsis = "..."
)
2021-12-09 13:41:17 +08:00
2021-07-25 03:59:27 +01:00
// SplitStringAtByteN splits a string at byte n accounting for rune boundaries. (Combining characters are not accounted for.)
func SplitStringAtByteN ( input string , n int ) ( left , right string ) {
if len ( input ) <= n {
2021-12-09 13:41:17 +08:00
return input , ""
2021-07-25 03:59:27 +01:00
}
if ! utf8 . ValidString ( input ) {
2021-12-09 13:41:17 +08:00
if n - 3 < 0 {
return input , ""
}
return input [ : n - 3 ] + asciiEllipsis , asciiEllipsis + input [ n - 3 : ]
2021-07-25 03:59:27 +01:00
}
end := 0
for end <= n - 3 {
_ , size := utf8 . DecodeRuneInString ( input [ end : ] )
if end + size > n - 3 {
break
}
end += size
}
2021-12-09 13:41:17 +08:00
return input [ : end ] + utf8Ellipsis , utf8Ellipsis + input [ end : ]
}
2023-06-05 09:00:12 +02:00
// SplitTrimSpace splits the string at given separator and trims leading and trailing space
func SplitTrimSpace ( input , sep string ) [ ] string {
2024-11-27 20:50:27 -06:00
// Trim initial leading & trailing space
input = strings . TrimSpace ( input )
2023-06-05 09:00:12 +02:00
// replace CRLF with LF
input = strings . ReplaceAll ( input , "\r\n" , "\n" )
var stringList [ ] string
for _ , s := range strings . Split ( input , sep ) {
// trim leading and trailing space
stringList = append ( stringList , strings . TrimSpace ( s ) )
}
return stringList
}