coai/utils/image.go

103 lines
1.9 KiB
Go

package utils
import (
	"image"
	"image/gif"
	"image/jpeg"
	_ "image/png" // registers the PNG decoder so image.Decode can handle .png input
	"io"
	"math"
	"net/http"
	"path"
	"strings"

	"chat/globals"

	"github.com/chai2010/webp"
)
type (
	// Image wraps a decoded image.Image so that size, pixel and token
	// helpers can be attached to it as methods.
	Image struct {
		// Object is the underlying decoded image.
		Object image.Image
	}

	// Images is a list of Image values.
	Images []Image
)
// NewImage downloads the resource at url and decodes it into an Image.
//
// The decoder is picked from the lower-cased file extension of url:
// .jpg/.jpeg, .webp and .gif use their dedicated decoders (for GIFs only
// the first frame is kept). Every other extension, including .png and a
// missing or unrecognised one, falls back to image.Decode, which sniffs
// the format from the data and succeeds only for formats registered with
// the image package.
//
// It returns an error when the request fails or the body cannot be
// decoded, so a successful call never yields an Image without a decoded
// Object.
func NewImage(url string) (*Image, error) {
	res, err := http.Get(url)
	if err != nil {
		return nil, err
	}
	defer res.Body.Close()

	var img image.Image
	// path.Ext keeps the leading dot, so every case label must include it.
	switch strings.ToLower(path.Ext(url)) {
	case ".jpg", ".jpeg":
		img, err = jpeg.Decode(res.Body)
	case ".webp":
		img, err = webp.Decode(res.Body)
	case ".gif":
		// gif.Decode returns the first embedded frame, which is all we keep.
		img, err = gif.Decode(res.Body)
	default:
		// Covers ".png" as well as unknown extensions: let the image
		// package detect the format instead of returning a nil image.
		img, _, err = image.Decode(res.Body)
	}
	if err != nil {
		return nil, err
	}
	return &Image{Object: img}, nil
}
// ConvertToBase64 fetches url with an HTTP GET, reads the whole response
// body into memory and returns it encoded by Base64EncodeBytes.
//
// An error is returned when the request or the body read fails. The HTTP
// status code is not inspected, so the body of an error response is
// encoded like any other.
func ConvertToBase64(url string) (string, error) {
	resp, err := http.Get(url)
	if err != nil {
		return "", err
	}
	defer resp.Body.Close()

	raw, err := io.ReadAll(resp.Body)
	if err != nil {
		return "", err
	}

	encoded := Base64EncodeBytes(raw)
	return encoded, nil
}
// GetWidth returns the width of the image in pixels. It returns 0 when
// the receiver is nil or holds no decoded image.
func (i *Image) GetWidth() int {
	if i == nil || i.Object == nil {
		return 0
	}
	// Dx is Max.X - Min.X, which stays correct for images whose bounds do
	// not start at the origin (e.g. sub-images); Max.X alone does not.
	return i.Object.Bounds().Dx()
}
// GetHeight returns the height of the image in pixels. It returns 0 when
// the receiver is nil or holds no decoded image.
func (i *Image) GetHeight() int {
	if i == nil || i.Object == nil {
		return 0
	}
	// Dy is Max.Y - Min.Y, which stays correct for images whose bounds do
	// not start at the origin (e.g. sub-images); Max.Y alone does not.
	return i.Object.Bounds().Dy()
}
// GetPixel looks up the color at (x, y) in the underlying image and
// returns its red, green, blue and alpha components as produced by the
// color's RGBA method (alpha-premultiplied, 16 bits per channel).
func (i *Image) GetPixel(x int, y int) (uint32, uint32, uint32, uint32) {
	pixel := i.Object.At(x, y)
	return pixel.RGBA()
}
// GetPixelColor returns the red, green and blue components of the pixel
// at (x, y) as ints, dropping alpha. The values are the ones GetPixel
// reports, converted without rescaling.
func (i *Image) GetPixelColor(x int, y int) (int, int, int) {
	red, green, blue, _ := i.GetPixel(x, y)
	return int(red), int(green), int(blue)
}
// CountTokens estimates how many tokens this image costs when sent to
// model. Models for which globals.IsOpenAIVisionModels reports false
// cost 0.
//
// For vision models the image is counted in 512x512 tiles: the number of
// tiles along each axis is the side length divided by 512, rounded up and
// passed through LimitMax with a limit of 4 (the original notes say images
// larger than 2048x2048 are resized to 16 tiles). The result is a base of
// 85 tokens plus 170 per tile.
func (i *Image) CountTokens(model string) int {
	if !globals.IsOpenAIVisionModels(model) {
		return 0
	}

	cols := LimitMax(math.Ceil(float64(i.GetWidth())/512), 4)
	rows := LimitMax(math.Ceil(float64(i.GetHeight())/512), 4)

	return 85 + 170*(int(cols)*int(rows))
}