// Mirror of https://github.com/coaidev/coai.git, synced 2025-05-19 21:10:18 +09:00 (Go, 103 lines, 1.9 KiB).
package utils
|
|
|
|
import (
	"image"
	"image/gif"
	"image/jpeg"
	_ "image/png" // registers the PNG decoder used by image.Decode
	"io"
	"math"
	"net/http"
	"path"
	"strings"

	"chat/globals"

	"github.com/chai2010/webp"
)
|
|
|
|
type (
	// Image wraps a decoded picture so that helper methods can be attached
	// to it.
	Image struct {
		// Object is the decoded image the methods of Image operate on.
		Object image.Image
	}

	// Images is a slice of Image values.
	Images []Image
)
|
|
|
|
func NewImage(url string) (*Image, error) {
|
|
res, err := http.Get(url)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
defer res.Body.Close()
|
|
|
|
var img image.Image
|
|
suffix := strings.ToLower(path.Ext(url))
|
|
switch suffix {
|
|
case ".png":
|
|
if img, _, err = image.Decode(res.Body); err != nil {
|
|
return nil, err
|
|
}
|
|
case ".jpg", ".jpeg":
|
|
if img, err = jpeg.Decode(res.Body); err != nil {
|
|
return nil, err
|
|
}
|
|
case "webp":
|
|
if img, err = webp.Decode(res.Body); err != nil {
|
|
return nil, err
|
|
}
|
|
case "gif":
|
|
ticks, err := gif.DecodeAll(res.Body)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
img = ticks.Image[0]
|
|
}
|
|
|
|
return &Image{Object: img}, nil
|
|
}
|
|
|
|
func ConvertToBase64(url string) (string, error) {
|
|
res, err := http.Get(url)
|
|
if err != nil {
|
|
return "", err
|
|
}
|
|
|
|
defer res.Body.Close()
|
|
|
|
data, err := io.ReadAll(res.Body)
|
|
if err != nil {
|
|
return "", err
|
|
}
|
|
|
|
return Base64EncodeBytes(data), nil
|
|
}
|
|
|
|
func (i *Image) GetWidth() int {
|
|
return i.Object.Bounds().Max.X
|
|
}
|
|
|
|
func (i *Image) GetHeight() int {
|
|
return i.Object.Bounds().Max.Y
|
|
}
|
|
|
|
func (i *Image) GetPixel(x int, y int) (uint32, uint32, uint32, uint32) {
|
|
return i.Object.At(x, y).RGBA()
|
|
}
|
|
|
|
func (i *Image) GetPixelColor(x int, y int) (int, int, int) {
|
|
r, g, b, _ := i.GetPixel(x, y)
|
|
return int(r), int(g), int(b)
|
|
}
|
|
|
|
func (i *Image) CountTokens(model string) int {
|
|
if globals.IsGPT41106VisionPreview(model) {
|
|
// tile size is 512x512
|
|
// the max size of image is 2048x2048
|
|
// the image that is larger than 2048x2048 will be resized in 16 tiles
|
|
|
|
x := LimitMax(math.Ceil(float64(i.GetWidth())/512), 4)
|
|
y := LimitMax(math.Ceil(float64(i.GetHeight())/512), 4)
|
|
tiles := int(x) * int(y)
|
|
|
|
return 85 + 170*tiles
|
|
}
|
|
|
|
return 0
|
|
}
|