Files
higress/plugins/wasm-go/extensions/ai-cache/embedding/huggingface.go
2025-03-29 18:08:37 +08:00

169 lines
4.0 KiB
Go

package embedding
import (
"encoding/json"
"errors"
"fmt"
"net/http"
"strconv"
"strings"
"github.com/alibaba/higress/plugins/wasm-go/pkg/log"
"github.com/alibaba/higress/plugins/wasm-go/pkg/wrapper"
"github.com/tidwall/gjson"
)
// Defaults and path template for the Hugging Face feature-extraction service.
const (
	// HUGGINGFACE_DOMAIN is the host applied when the provider config has no serviceHost.
	HUGGINGFACE_DOMAIN = "api-inference.huggingface.co"

	// HUGGINGFACE_PORT is the port applied when the provider config has servicePort == 0.
	HUGGINGFACE_PORT = 443

	// HUGGINGFACE_DEFAULT_MODEL_NAME is the model applied when the provider config names none.
	HUGGINGFACE_DEFAULT_MODEL_NAME = "sentence-transformers/all-MiniLM-L6-v2"

	// HUGGINGFACE_ENDPOINT is the request path template; the "{modelId}"
	// placeholder is substituted with the model name when a request is built.
	HUGGINGFACE_ENDPOINT = "/pipeline/feature-extraction/{modelId}"
)
// huggingfaceProviderInitializer is a field-less type whose methods load and
// validate the Hugging Face settings and construct the provider.
type huggingfaceProviderInitializer struct{}
// huggingfaceProviderConfig carries the settings specific to the Hugging Face
// embedding provider.
type huggingfaceProviderConfig struct {
	// apiKey is the API key for the text feature-extraction service; Hugging
	// Face refers to it as hf_token. The two annotation lines below are
	// locale-tagged (zh-CN) metadata and are kept verbatim.
	// @Title zh-CN 文本特征提取服务 API Key
	// @Description zh-CN 文本特征提取服务 API Key。在HuggingFace定义为 hf_token
	apiKey string
}

// huggingfaceConfig is the package-level instance of the Hugging Face settings
// shared by the initializer and the provider.
var huggingfaceConfig huggingfaceProviderConfig
// InitConfig reads the "apiKey" field from the given JSON configuration and
// stores its string form in the package-level huggingfaceConfig.
func (c *huggingfaceProviderInitializer) InitConfig(json gjson.Result) {
	apiKey := json.Get("apiKey")
	huggingfaceConfig.apiKey = apiKey.String()
}
// ValidateConfig returns an error when no API key has been loaded into
// huggingfaceConfig, and nil otherwise.
//
// The error names "apiKey" because that is the configuration field InitConfig
// reads; naming any other key would point users at a setting that is never
// consulted.
func (c *huggingfaceProviderInitializer) ValidateConfig() error {
	if huggingfaceConfig.apiKey == "" {
		return errors.New("[HuggingFace] apiKey is required")
	}
	return nil
}
// CreateProvider builds a HuggingFaceProvider from c.
//
// Unset fields of c are filled with the Hugging Face defaults first: an empty
// model, an empty serviceHost and a zero servicePort are replaced by
// HUGGINGFACE_DEFAULT_MODEL_NAME, HUGGINGFACE_DOMAIN and HUGGINGFACE_PORT
// respectively. c is received by value, so the caller's copy is not modified.
// The returned error is always nil.
func (t *huggingfaceProviderInitializer) CreateProvider(c ProviderConfig) (Provider, error) {
	if c.model == "" {
		c.model = HUGGINGFACE_DEFAULT_MODEL_NAME
	}
	if c.serviceHost == "" {
		c.serviceHost = HUGGINGFACE_DOMAIN
	}
	if c.servicePort == 0 {
		c.servicePort = HUGGINGFACE_PORT
	}

	// The HTTP client is bound to the cluster described by the (defaulted) config.
	cluster := wrapper.FQDNCluster{
		FQDN: c.serviceName,
		Host: c.serviceHost,
		Port: c.servicePort,
	}
	provider := &HuggingFaceProvider{
		config: c,
		client: wrapper.NewClusterClient(cluster),
	}
	return provider, nil
}
// GetProviderType returns the provider type identifier for Hugging Face,
// PROVIDER_TYPE_HUGGINGFACE.
func (t *HuggingFaceProvider) GetProviderType() string {
	return PROVIDER_TYPE_HUGGINGFACE
}
// HuggingFaceProvider requests text embeddings from a Hugging Face
// feature-extraction endpoint.
type HuggingFaceProvider struct {
	// config is the provider configuration captured when the provider was created.
	config ProviderConfig
	// client is the HTTP client used to send embedding requests.
	client wrapper.HttpClient
}
// HuggingFaceEmbeddingRequest is the JSON body sent to the feature-extraction
// endpoint.
type HuggingFaceEmbeddingRequest struct {
	// Inputs is the text to embed; serialized as "inputs".
	Inputs string `json:"inputs"`
	// Options holds request options; serialized as "options".
	Options struct {
		// WaitForModel is serialized as "wait_for_model".
		WaitForModel bool `json:"wait_for_model"`
	} `json:"options"`
}
// constructParameters builds everything needed for one embedding request.
//
// It returns, in order: the endpoint path (HUGGINGFACE_ENDPOINT with
// "{modelId}" replaced by the configured model, or the default model when none
// is configured), the request headers (bearer Authorization built from the
// package-level API key, plus a JSON Content-Type), and the JSON-encoded
// request body with wait_for_model enabled.
//
// An error is returned when text is empty or when the body cannot be
// marshalled; in both cases the other results are zero values.
func (t *HuggingFaceProvider) constructParameters(text string) (string, [][2]string, []byte, error) {
	if len(text) == 0 {
		return "", nil, nil, errors.New("queryString text cannot be empty")
	}

	var payload HuggingFaceEmbeddingRequest
	payload.Inputs = text
	payload.Options.WaitForModel = true

	body, err := json.Marshal(payload)
	if err != nil {
		log.Errorf("failed to marshal request data: %v", err)
		return "", nil, nil, err
	}

	model := t.config.model
	if model == "" {
		model = HUGGINGFACE_DEFAULT_MODEL_NAME
	}
	// Assemble the endpoint path by substituting the model into the template.
	path := strings.Replace(HUGGINGFACE_ENDPOINT, "{modelId}", model, 1)

	headers := [][2]string{
		{"Authorization", "Bearer " + huggingfaceConfig.apiKey},
		{"Content-Type", "application/json"},
	}
	return path, headers, body, nil
}
// parseTextEmbedding decodes responseBody as a flat JSON array of numbers and
// returns it as the embedding vector. Any decoding failure is returned as-is
// with a nil vector.
func (t *HuggingFaceProvider) parseTextEmbedding(responseBody []byte) ([]float64, error) {
	var vector []float64
	if err := json.Unmarshal(responseBody, &vector); err != nil {
		return nil, err
	}
	return vector, nil
}
// GetEmbedding requests the embedding of queryString and delivers the outcome
// through callback.
//
// Parameters:
//   - queryString: the text to embed; must not be empty.
//   - ctx: accepted for interface compatibility; not used by this implementation.
//   - callback: invoked from the HTTP response handler with either the
//     embedding and a nil error, or a nil embedding and the error.
//
// The returned error covers only failures to build or dispatch the request
// (parameter construction or the client's Post call). Failures observed in the
// response — a non-200 status, an undecodable body, or an empty embedding —
// are reported through callback only.
func (t *HuggingFaceProvider) GetEmbedding(
	queryString string,
	ctx wrapper.HttpContext,
	callback func(emb []float64, err error)) error {
	embUrl, embHeaders, embRequestBody, err := t.constructParameters(queryString)
	if err != nil {
		log.Errorf("failed to construct parameters: %v", err)
		return err
	}

	// The handler keeps its errors local: it must not write to this function's
	// err, which belongs to a call that may already have returned.
	onResponse := func(statusCode int, responseHeaders http.Header, responseBody []byte) {
		if statusCode != http.StatusOK {
			callback(nil, errors.New("failed to get embedding due to status code: "+strconv.Itoa(statusCode)))
			return
		}

		emb, parseErr := t.parseTextEmbedding(responseBody)
		if parseErr != nil {
			// %w keeps the decoding error reachable via errors.Is / errors.As.
			callback(nil, fmt.Errorf("failed to parse response: %w", parseErr))
			return
		}

		log.Debugf("get embedding response: %d, %s", statusCode, responseBody)

		if len(emb) == 0 {
			callback(nil, errors.New("no embedding found in response"))
			return
		}
		callback(emb, nil)
	}

	return t.client.Post(embUrl, embHeaders, embRequestBody, onResponse, t.config.timeout)
}