mirror of
https://github.com/coaidev/coai.git
synced 2025-05-20 13:30:13 +09:00
fix unicode
This commit is contained in:
parent
0d45c5bc0b
commit
86995a8a79
@ -90,7 +90,11 @@ func getRobustnessResult(chunk string) string {
|
|||||||
|
|
||||||
matches := compile.FindStringSubmatch(chunk)
|
matches := compile.FindStringSubmatch(chunk)
|
||||||
if len(matches) > 1 {
|
if len(matches) > 1 {
|
||||||
return matches[1]
|
partial := matches[1]
|
||||||
|
// if is the unicode character
|
||||||
|
if strings.HasPrefix(partial, "\\u") {
|
||||||
|
return utils.DecodeUnicode(partial)
|
||||||
|
}
|
||||||
} else {
|
} else {
|
||||||
return ""
|
return ""
|
||||||
}
|
}
|
||||||
|
@ -151,3 +151,17 @@ func ExtractImageUrls(data string) []string {
|
|||||||
re := regexp.MustCompile(`(https?://\S+\.(?:png|jpg|jpeg|gif|webp))`)
|
re := regexp.MustCompile(`(https?://\S+\.(?:png|jpg|jpeg|gif|webp))`)
|
||||||
return re.FindAllString(data, -1)
|
return re.FindAllString(data, -1)
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// unicodeEscapeRun matches one or more consecutive \uXXXX escapes. Matching a
// whole run (rather than a single escape) lets DecodeUnicode combine UTF-16
// surrogate pairs, which are always written as two adjacent escapes.
// Compiled once at package scope instead of on every call.
var unicodeEscapeRun = regexp.MustCompile(`(?:\\u[0-9a-fA-F]{4})+`)

// DecodeUnicode replaces every literal \uXXXX escape sequence in data with the
// UTF-8 encoding of the character it denotes and returns the resulting string.
//
// A high surrogate (\uD800-\uDBFF) immediately followed by a low surrogate
// (\uDC00-\uDFFF) is decoded as a single supplementary-plane code point.
// Unpaired surrogates do not denote a valid character, so their escape text is
// left untouched. Any text that is not a well-formed \uXXXX escape is returned
// unchanged.
func DecodeUnicode(data string) string {
	return unicodeEscapeRun.ReplaceAllStringFunc(data, func(run string) string {
		const width = 6 // len(`\uXXXX`); every run is a multiple of this

		out := make([]byte, 0, len(run))
		for i := 0; i < len(run); i += width {
			escape := run[i : i+width]

			unit, err := strconv.ParseUint(escape[2:], 16, 16)
			if err != nil {
				// The pattern guarantees four hex digits, so this is purely
				// defensive: keep the original text rather than drop it.
				out = append(out, escape...)
				continue
			}

			r := rune(unit)
			switch {
			case r >= 0xD800 && r <= 0xDBFF:
				// High surrogate: only meaningful together with the low
				// surrogate that must directly follow it.
				if i+2*width <= len(run) {
					low, lowErr := strconv.ParseUint(run[i+width+2:i+2*width], 16, 16)
					if lowErr == nil && low >= 0xDC00 && low <= 0xDFFF {
						r = 0x10000 + (r-0xD800)<<10 + (rune(low) - 0xDC00)
						out = append(out, string(r)...)
						i += width // the low surrogate has been consumed too
						continue
					}
				}
				out = append(out, escape...)
			case r >= 0xDC00 && r <= 0xDFFF:
				// Low surrogate without a preceding high surrogate.
				out = append(out, escape...)
			default:
				out = append(out, string(r)...)
			}
		}
		return string(out)
	})
}
|
||||||
|
Loading…
Reference in New Issue
Block a user