feature: add hunyuan llm support for plugins/ai-proxy (#1018)

Co-authored-by: Kent Dong <ch3cho@qq.com>
2026-06-09 04:37:31 +08:00 · 2024-06-06 18:11:51 +08:00
parent ed976c6d06
commit c6e3db95e0
4 changed files with 699 additions and 3 deletions
--- a/plugins/wasm-go/extensions/ai-proxy/README.md
+++ b/plugins/wasm-go/extensions/ai-proxy/README.md
@@ -106,6 +106,16 @@ Ollama 所对应的 `type` 为 `ollama`。它特有的配置字段如下：
 | `ollamaServerHost` | string | 必填   | -   | Ollama 服务器的主机地址 |
 | `ollamaServerPort` | number | 必填   | -   | Ollama 服务器的端口号，默认为11434 |
 #### 混元
 混元所对应的 `type` 为 `hunyuan`。它特有的配置字段如下：
 | 名称                | 数据类型   | 填写要求 | 默认值 | 描述                                           |
 |-------------------|--------|------|-----|----------------------------------------------|
 | `hunyuanAuthId` | string | 必填   | -   | 混元用于v3版本认证的id |
 | `hunyuanAuthKey` | string | 必填   | -   | 混元用于v3版本认证的key |
 ## 用法示例
 ### 使用 OpenAI 协议代理 Azure OpenAI 服务
@@ -546,6 +556,70 @@ provider:
  "stop_reason": "end_turn"
 }
 ```
 ### 使用 OpenAI 协议代理混元服务
 **配置信息**
 ```yaml
 provider:
  type: "hunyuan"
  hunyuanAuthKey: "<YOUR AUTH KEY>"
  apiTokens:
    - ""
  hunyuanAuthId: "<YOUR AUTH ID>"
  timeout: 1200000
  modelMapping:
    "*": "hunyuan-lite"
 ```
 **请求示例**
 请求脚本：
 ```sh
 curl --location 'http://<your higress domain>/v1/chat/completions' \
 --header 'Content-Type:  application/json' \
 --data '{
  "model": "gpt-3",
  "messages": [
    {
      "role": "system",
      "content": "你是一个名专业的开发人员！"
    },
    {
      "role": "user",
      "content": "你好，你是谁？"
    }
  ],
  "temperature": 0.3,
  "stream": false
 }'
 ```
 **响应示例**
 ```json
 {
    "id": "fd140c3e-0b69-4b19-849b-d354d32a6162",
    "choices": [
        {
            "index": 0,
            "delta": {
                "role": "assistant",
                "content": "你好！我是一名专业的开发人员。"
            },
            "finish_reason": "stop"
        }
    ],
    "created": 1717493117,
    "model": "hunyuan-lite",
    "object": "chat.completion",
    "usage": {
        "prompt_tokens": 15,
        "completion_tokens": 9,
        "total_tokens": 24
    }
 }
 ```
 ## 完整配置示例
@@ -619,4 +693,4 @@ curl "http://<YOUR-DOMAIN>/v1/chat/completions" -H "Content-Type: application/js
    }
  ]
 }'
-```
+```
--- a/plugins/wasm-go/extensions/ai-proxy/README_dev.md
+++ b/plugins/wasm-go/extensions/ai-proxy/README_dev.md
@@ -13,6 +13,52 @@ DOCKER_BUILDKIT=1; docker build --build-arg PLUGIN_NAME=ai-proxy --build-arg EXT
 ```powershell
 $env:DOCKER_BUILDKIT=1; docker build --build-arg PLUGIN_NAME=ai-proxy --build-arg EXTRA_TAGS=proxy_wasm_version_0_2_100 --build-arg BUILDER=higress-registry.cn-hangzhou.cr.aliyuncs.com/plugins/wasm-go-builder:go1.19-tinygo0.28.1-oras1.0.0 -t ai-proxy:0.0.1 --output .\out ..\..
 ```
 ## 本地运行
 参考：https://higress.io/zh-cn/docs/user/wasm-go
 需要注意的是，higress/plugins/wasm-go/extensions/ai-proxy/envoy.yaml中的clusters字段，记得改成你需要地址，比如混元的话：就会有如下的一个cluster的配置：
 ```yaml
 <省略>
 static_resources:
 <省略>
  clusters:
      load_assignment:
        cluster_name: moonshot
        endpoints:
          - lb_endpoints:
              - endpoint:
                  address:
                    socket_address:
                      address: hunyuan.tencentcloudapi.com
                      port_value: 443
      transport_socket:
        name: envoy.transport_sockets.tls
        typed_config:
          "@type": type.googleapis.com/envoy.extensions.transport_sockets.tls.v3.UpstreamTlsContext
          "sni": "hunyuan.tencentcloudapi.com"
 ```
 而后你就可以在本地的pod中查看相应的输出，请求样例如下：
 ```sh
 curl --location 'http://127.0.0.1:10000/v1/chat/completions' \
 --header 'Content-Type:  application/json' \
 --data '{
  "model": "gpt-3",
  "messages": [
    {
      "role": "system",
      "content": "你是一个名专业的开发人员！"
    },
    {
      "role": "user",
      "content": "你好，你是谁？"
    }
  ],
  "temperature": 0.3,
  "stream": false
 }'
 ```
 ## 测试须知
 由于 `ai-proxy` 插件使用了 Higress 对数据面定制的特殊功能，因此在测试时需要使用版本不低于 1.4.0-rc.1 的 Higress Gateway 镜像。
--- a/plugins/wasm-go/extensions/ai-proxy/provider/hunyuan.go
+++ b/plugins/wasm-go/extensions/ai-proxy/provider/hunyuan.go
@@ -0,0 +1,563 @@
 package provider
 import (
 	"bytes"
 	"crypto/hmac"
 	"crypto/sha256"
 	"encoding/hex"
 	"encoding/json"
 	"errors"
 	"fmt"
 	"strings"
 	"time"
 	"github.com/alibaba/higress/plugins/wasm-go/extensions/ai-proxy/util"
 	"github.com/alibaba/higress/plugins/wasm-go/pkg/wrapper"
 	"github.com/higress-group/proxy-wasm-go-sdk/proxywasm"
 	"github.com/higress-group/proxy-wasm-go-sdk/proxywasm/types"
 )
 // hunyuanProvider is the provider for hunyuan AI service.
 const (
 	hunyuanDomain                 = "hunyuan.tencentcloudapi.com"
 	hunyuanRequestPath            = "/"
 	hunyuanChatCompletionTCAction = "ChatCompletions"
 	// headers necessary for TC hunyuan api call:
 	// ref: https://cloud.tencent.com/document/api/1729/105701, https://cloud.tencent.com/document/api/1729/101842
 	actionKey        = "X-TC-Action"
 	timestampKey     = "X-TC-Timestamp"
 	authorizationKey = "Authorization"
 	versionKey       = "X-TC-Version"
 	versionValue     = "2023-09-01"
 	hostKey          = "Host"
 	ssePrefix            = "data: " // Server-Sent Events (SSE) 类型的流式响应的开始标记
 	hunyuanStreamEndMark = "stop"   // 混元的流式的finishReason为stop时，表示结束
 	hunyuanAuthKeyLen = 32
 	hunyuanAuthIdLen  = 36
 )
 type hunyuanProviderInitializer struct {
 }
 // ref: https://console.cloud.tencent.com/api/explorer?Product=hunyuan&Version=2023-09-01&Action=ChatCompletions
 type hunyuanTextGenRequest struct {
 	Model             string               `json:"Model"`
 	Messages          []hunyuanChatMessage `json:"Messages"`
 	Stream            bool                 `json:"Stream,omitempty"`
 	StreamModeration  bool                 `json:"StreamModeration,omitempty"`
 	TopP              float32              `json:"TopP,omitempty"`
 	Temperature       float32              `json:"Temperature,omitempty"`
 	EnableEnhancement bool                 `json:"EnableEnhancement,omitempty"`
 }
 type hunyuanTextGenResponseNonStreaming struct {
 	Response hunyuanTextGenDetailedResponseNonStreaming `json:"Response"`
 }
 type hunyuanTextGenDetailedResponseNonStreaming struct {
 	RequestId string                 `json:"RequestId,omitempty"`
 	Note      string                 `json:"Note"`
 	Choices   []hunyuanTextGenChoice `json:"Choices"`
 	Created   int64                  `json:"Created"`
 	Id        string                 `json:"Id"`
 	Usage     hunyuanTextGenUsage    `json:"Usage"`
 }
 type hunyuanTextGenChoice struct {
 	FinishReason string             `json:"FinishReason"`
 	Message      hunyuanChatMessage `json:"Message,omitempty"` // 当非流式返回时存储大模型生成文字
 	Delta        hunyuanChatMessage `json:"Delta,omitempty"`   // 流式返回时存储大模型生成文字
 }
 type hunyuanTextGenUsage struct {
 	PromptTokens     int `json:"PromptTokens"`
 	CompletionTokens int `json:"CompletionTokens"`
 	TotalTokens      int `json:"TotalTokens"`
 }
 type hunyuanChatMessage struct {
 	Role    string `json:"Role,omitempty"`
 	Content string `json:"Content,omitempty"`
 }
 func (m *hunyuanProviderInitializer) ValidateConfig(config ProviderConfig) error {
 	// 校验hunyuan id 和 key的合法性
 	if len(config.hunyuanAuthId) != hunyuanAuthIdLen || len(config.hunyuanAuthKey) != hunyuanAuthKeyLen {
 		return errors.New("hunyuanAuthId / hunyuanAuthKey is illegal in config file")
 	}
 	return nil
 }
 func (m *hunyuanProviderInitializer) CreateProvider(config ProviderConfig) (Provider, error) {
 	return &hunyuanProvider{
 		config: config,
 		client: wrapper.NewClusterClient(wrapper.RouteCluster{
 			Host: hunyuanDomain,
 		}),
 		contextCache: createContextCache(&config),
 	}, nil
 }
 type hunyuanProvider struct {
 	config ProviderConfig
 	client       wrapper.HttpClient
 	contextCache *contextCache
 }
 func (m *hunyuanProvider) GetProviderType() string {
 	return providerTypeHunyuan
 }
 func (m *hunyuanProvider) OnRequestHeaders(ctx wrapper.HttpContext, apiName ApiName, log wrapper.Log) (types.Action, error) {
 	// log.Debugf("hunyuanProvider.OnRequestHeaders called! hunyunSecretKey/id is: %s/%s", m.config.hunyuanAuthKey, m.config.hunyuanAuthId)
 	if apiName != ApiNameChatCompletion {
 		return types.ActionContinue, errUnsupportedApiName
 	}
 	_ = util.OverwriteRequestHost(hunyuanDomain)
 	_ = util.OverwriteRequestPath(hunyuanRequestPath)
 	// 添加hunyuan需要的自定义字段
 	_ = proxywasm.ReplaceHttpRequestHeader(actionKey, hunyuanChatCompletionTCAction)
 	_ = proxywasm.ReplaceHttpRequestHeader(versionKey, versionValue)
 	// 删除一些字段
 	_ = proxywasm.RemoveHttpRequestHeader("Accept-Encoding")
 	_ = proxywasm.RemoveHttpRequestHeader("Content-Length")
 	// Delay the header processing to allow changing streaming mode in OnRequestBody
 	return types.HeaderStopIteration, nil
 }
 func (m *hunyuanProvider) OnRequestBody(ctx wrapper.HttpContext, apiName ApiName, body []byte, log wrapper.Log) (types.Action, error) {
 	if apiName != ApiNameChatCompletion {
 		return types.ActionContinue, errUnsupportedApiName
 	}
 	// 为header添加时间戳字段 （因为需要根据body进行签名时依赖时间戳，故于body处理部分创建时间戳）
 	var timestamp int64 = time.Now().Unix()
 	_ = proxywasm.ReplaceHttpRequestHeader(timestampKey, fmt.Sprintf("%d", timestamp))
 	// log.Debugf("#debug nash5# OnRequestBody set timestamp header: ", timestamp)
 	// 使用混元本身接口的协议
 	if m.config.protocol == protocolOriginal {
 		request := &hunyuanTextGenRequest{}
 		if err := json.Unmarshal(body, request); err != nil {
 			return types.ActionContinue, fmt.Errorf("unable to unmarshal request: %v", err)
 		}
 		// 根据确定好的payload进行签名
 		hunyuanBody, _ := json.Marshal(request)
 		authorizedValueNew := GetTC3Authorizationcode(m.config.hunyuanAuthId, m.config.hunyuanAuthKey, timestamp, hunyuanDomain, hunyuanChatCompletionTCAction, string(hunyuanBody))
 		_ = proxywasm.ReplaceHttpRequestHeader(authorizationKey, authorizedValueNew)
 		_ = proxywasm.ReplaceHttpRequestHeader("Accept", "*/*")
 		// log.Debugf("#debug nash5# OnRequestBody call hunyuan api using original api! signature computation done!")
 		// 若无配置文件，直接返回
 		if m.config.context == nil {
 			return types.ActionContinue, replaceJsonRequestBody(request, log)
 		}
 		err := m.contextCache.GetContent(func(content string, err error) {
 			log.Debugf("#debug nash5# ctx file loaded! callback start, content is: %s", content)
 			defer func() {
 				_ = proxywasm.ResumeHttpRequest()
 			}()
 			if err != nil {
 				log.Errorf("failed to load context file: %v", err)
 				_ = util.SendResponse(500, util.MimeTypeTextPlain, fmt.Sprintf("failed to load context file: %v", err))
 			}
 			m.insertContextMessageIntoHunyuanRequest(request, content)
 			// 因为手动插入了context内容，这里需要重新计算签名
 			hunyuanBody, _ := json.Marshal(request)
 			authorizedValueNew := GetTC3Authorizationcode(m.config.hunyuanAuthId, m.config.hunyuanAuthKey, timestamp, hunyuanDomain, hunyuanChatCompletionTCAction, string(hunyuanBody))
 			_ = proxywasm.ReplaceHttpRequestHeader(authorizationKey, authorizedValueNew)
 			if err := replaceJsonRequestBody(request, log); err != nil {
 				_ = util.SendResponse(500, util.MimeTypeTextPlain, fmt.Sprintf("failed to replace request body: %v", err))
 			}
 		}, log)
 		if err == nil {
 			log.Debugf("#debug nash5# ctx file load success!")
 			return types.ActionPause, nil
 		}
 		log.Debugf("#debug nash5# ctx file load failed!")
 		return types.ActionContinue, replaceJsonRequestBody(request, log)
 	}
 	// 使用open ai接口协议
 	request := &chatCompletionRequest{}
 	if err := decodeChatCompletionRequest(body, request); err != nil {
 		return types.ActionContinue, err
 	}
 	// log.Debugf("#debug nash5# OnRequestBody call hunyuan api using openai's api!")
 	model := request.Model
 	if model == "" {
 		return types.ActionContinue, errors.New("missing model in chat completion request")
 	}
 	ctx.SetContext(ctxKeyOriginalRequestModel, model) // 设置原始请求的model，以便返回值使用
 	mappedModel := getMappedModel(model, m.config.modelMapping, log)
 	if mappedModel == "" {
 		return types.ActionContinue, errors.New("model becomes empty after applying the configured mapping")
 	}
 	request.Model = mappedModel
 	ctx.SetContext(ctxKeyFinalRequestModel, request.Model) // 设置真实请求的模型，以便返回值使用
 	// 看请求中的stream的设置，相应的我们更该http头
 	streaming := request.Stream
 	if streaming {
 		_ = proxywasm.ReplaceHttpRequestHeader("Accept", "text/event-stream")
 	} else {
 		_ = proxywasm.ReplaceHttpRequestHeader("Accept", "*/*")
 	}
 	// 若没有配置上下文，直接开始请求
 	if m.config.context == nil {
 		hunyuanRequest := m.buildHunyuanTextGenerationRequest(request)
 		// 根据确定好的payload进行签名：
 		body, _ := json.Marshal(hunyuanRequest)
 		authorizedValueNew := GetTC3Authorizationcode(
 			m.config.hunyuanAuthId,
 			m.config.hunyuanAuthKey,
 			timestamp,
 			hunyuanDomain,
 			hunyuanChatCompletionTCAction,
 			string(body),
 		)
 		_ = proxywasm.ReplaceHttpRequestHeader(authorizationKey, authorizedValueNew)
 		// log.Debugf("#debug nash5# OnRequestBody done, body is: ", string(body))
 		// // 打印所有的headers
 		// headers, err2 := proxywasm.GetHttpRequestHeaders()
 		// if err2 != nil {
 		// 	log.Errorf("failed to get request headers: %v", err2)
 		// } else {
 		// 	// 迭代并打印所有请求头
 		// 	for _, header := range headers {
 		// 		log.Infof("#debug nash5# inB Request header - %s: %s", header[0], header[1])
 		// 	}
 		// }
 		return types.ActionContinue, replaceJsonRequestBody(hunyuanRequest, log)
 	}
 	err := m.contextCache.GetContent(func(content string, err error) {
 		defer func() {
 			_ = proxywasm.ResumeHttpRequest()
 		}()
 		if err != nil {
 			log.Errorf("failed to load context file: %v", err)
 			_ = util.SendResponse(500, util.MimeTypeTextPlain, fmt.Sprintf("failed to load context file: %v", err))
 			return
 		}
 		insertContextMessage(request, content)
 		hunyuanRequest := m.buildHunyuanTextGenerationRequest(request)
 		// 因为手动插入了context内容，这里需要重新计算签名
 		hunyuanBody, _ := json.Marshal(hunyuanRequest)
 		authorizedValueNew := GetTC3Authorizationcode(m.config.hunyuanAuthId, m.config.hunyuanAuthKey, timestamp, hunyuanDomain, hunyuanChatCompletionTCAction, string(hunyuanBody))
 		_ = proxywasm.ReplaceHttpRequestHeader(authorizationKey, authorizedValueNew)
 		if err := replaceJsonRequestBody(hunyuanRequest, log); err != nil {
 			_ = util.SendResponse(500, util.MimeTypeTextPlain, fmt.Sprintf("failed to replace request body: %v", err))
 		}
 	}, log)
 	if err == nil {
 		return types.ActionPause, nil
 	}
 	return types.ActionContinue, err
 }
 func (m *hunyuanProvider) OnResponseHeaders(ctx wrapper.HttpContext, apiName ApiName, log wrapper.Log) (types.Action, error) {
 	_ = proxywasm.RemoveHttpResponseHeader("Content-Length")
 	return types.ActionContinue, nil
 }
 func (m *hunyuanProvider) OnStreamingResponseBody(ctx wrapper.HttpContext, name ApiName, chunk []byte, isLastChunk bool, log wrapper.Log) ([]byte, error) {
 	if m.config.protocol == protocolOriginal {
 		return chunk, nil
 	}
 	// hunyuan的流式返回:
 	//data: {"Note":"以上内容为AI生成，不代表开发者立场，请勿删除或修改本标记","Choices":[{"Delta":{"Role":"assistant","Content":"有助于"},"FinishReason":""}],"Created":1716359713,"Id":"086b6b19-8b2c-4def-a65c-db6a7bc86acd","Usage":{"PromptTokens":7,"CompletionTokens":145,"TotalTokens":152}}
 	// openai的流式返回
 	// data: {"id": "chatcmpl-7QyqpwdfhqwajicIEznoc6Q47XAyW", "object": "chat.completion.chunk", "created": 1677664795, "model": "gpt-3.5-turbo-0613", "choices": [{"delta": {"content": "The "}, "index": 0, "finish_reason": null}]}
 	// log.Debugf("#debug nash5# [OnStreamingResponseBody] chunk is: %s", string(chunk))
 	// 从上下文获取现有缓冲区数据
 	newBufferedBody := chunk
 	if bufferedBody, has := ctx.GetContext(ctxKeyStreamingBody).([]byte); has {
 		newBufferedBody = append(bufferedBody, chunk...)
 	}
 	// 初始化处理下标，以及将要返回的处理过的chunks
 	var newEventPivot = -1
 	var outputBuffer []byte
 	// 从buffer区取出若干完整的chunk，将其转为openAI格式后返回
 	// 处理可能包含多个事件的缓冲区
 	for {
 		eventStartIndex := bytes.Index(newBufferedBody, []byte(ssePrefix))
 		if eventStartIndex == -1 {
 			break // 没有找到新事件，跳出循环
 		}
 		// 移除缓冲区前面非事件部分
 		newBufferedBody = newBufferedBody[eventStartIndex+len(ssePrefix):]
 		// 查找事件结束的位置（即下一个事件的开始）
 		newEventPivot = bytes.Index(newBufferedBody, []byte("\n\n"))
 		if newEventPivot == -1 && !isLastChunk {
 			// 未找到事件结束标识，跳出循环等待更多数据，若是最后一个chunk，不一定有2个换行符
 			break
 		}
 		// 提取并处理一个完整的事件
 		eventData := newBufferedBody[:newEventPivot]
 		// log.Debugf("@@@ <<< ori chun is: %s", string(newBufferedBody[:newEventPivot]))
 		newBufferedBody = newBufferedBody[newEventPivot+2:] // 跳过结束标识
 		// 转换并追加到输出缓冲区
 		convertedData, _ := m.convertChunkFromHunyuanToOpenAI(ctx, eventData, log)
 		// log.Debugf("@@@ >>> converted one chunk: %s", string(convertedData))
 		outputBuffer = append(outputBuffer, convertedData...)
 	}
 	// 刷新剩余的不完整事件回到上下文缓冲区以便下次继续处理
 	ctx.SetContext(ctxKeyStreamingBody, newBufferedBody)
 	log.Debugf("=== modified response chunk: %s", string(outputBuffer))
 	return outputBuffer, nil
 }
 func (m *hunyuanProvider) convertChunkFromHunyuanToOpenAI(ctx wrapper.HttpContext, hunyuanChunk []byte, log wrapper.Log) ([]byte, error) {
 	// 将hunyuan的chunk转为openai的chunk
 	hunyuanFormattedChunk := &hunyuanTextGenDetailedResponseNonStreaming{}
 	if err := json.Unmarshal(hunyuanChunk, hunyuanFormattedChunk); err != nil {
 		return []byte(""), nil
 	}
 	openAIFormattedChunk := &chatCompletionResponse{
 		Id:                hunyuanFormattedChunk.Id,
 		Created:           time.Now().UnixMilli() / 1000,
 		Model:             ctx.GetContext(ctxKeyFinalRequestModel).(string),
 		SystemFingerprint: "",
 		Object:            objectChatCompletionChunk,
 		Usage: chatCompletionUsage{
 			PromptTokens:     hunyuanFormattedChunk.Usage.PromptTokens,
 			CompletionTokens: hunyuanFormattedChunk.Usage.CompletionTokens,
 			TotalTokens:      hunyuanFormattedChunk.Usage.TotalTokens,
 		},
 	}
 	// tmpStr3, _ := json.Marshal(hunyuanFormattedChunk)
 	// log.Debugf("@@@ --- 源数据是：: %s", tmpStr3)
 	// 是否为最后一个chunk？
 	if hunyuanFormattedChunk.Choices[0].FinishReason == hunyuanStreamEndMark {
 		// log.Debugf("@@@ --- 最后chunk: ")
 		openAIFormattedChunk.Choices = append(openAIFormattedChunk.Choices, chatCompletionChoice{
 			FinishReason: hunyuanFormattedChunk.Choices[0].FinishReason,
 		})
 	} else {
 		deltaMsg := chatMessage{
 			Name:      "",
 			Role:      hunyuanFormattedChunk.Choices[0].Delta.Role,
 			Content:   hunyuanFormattedChunk.Choices[0].Delta.Content,
 			ToolCalls: []toolCall{},
 		}
 		// tmpStr2, _ := json.Marshal(deltaMsg)
 		// log.Debugf("@@@ --- 中间chunk: choices.chatMsg 是: %s", tmpStr2)
 		openAIFormattedChunk.Choices = append(
 			openAIFormattedChunk.Choices,
 			chatCompletionChoice{Delta: &deltaMsg},
 		)
 		// tmpStr, _ := json.Marshal(openAIFormattedChunk.Choices)
 		// log.Debugf("@@@ --- 中间chunk: choices 是: %s", tmpStr)
 	}
 	// 返回的格式
 	openAIFormattedChunkBytes, _ := json.Marshal(openAIFormattedChunk)
 	var openAIChunk strings.Builder
 	openAIChunk.WriteString(ssePrefix)
 	openAIChunk.WriteString(string(openAIFormattedChunkBytes))
 	openAIChunk.WriteString("\n\n")
 	return []byte(openAIChunk.String()), nil
 }
 func (m *hunyuanProvider) OnResponseBody(ctx wrapper.HttpContext, apiName ApiName, body []byte, log wrapper.Log) (types.Action, error) {
 	log.Debugf("#debug nash5# onRespBody's resp is: %s", string(body))
 	hunyuanResponse := &hunyuanTextGenResponseNonStreaming{}
 	if err := json.Unmarshal(body, hunyuanResponse); err != nil {
 		return types.ActionContinue, fmt.Errorf("unable to unmarshal hunyuan response: %v", err)
 	}
 	if m.config.protocol == protocolOriginal {
 		return types.ActionContinue, replaceJsonResponseBody(hunyuanResponse, log)
 	}
 	response := m.buildChatCompletionResponse(ctx, hunyuanResponse)
 	return types.ActionContinue, replaceJsonResponseBody(response, log)
 }
 func (m *hunyuanProvider) insertContextMessageIntoHunyuanRequest(request *hunyuanTextGenRequest, content string) {
 	fileMessage := hunyuanChatMessage{
 		Role:    roleSystem,
 		Content: content,
 	}
 	messages := request.Messages
 	request.Messages = append([]hunyuanChatMessage{},
 		append([]hunyuanChatMessage{fileMessage}, messages...)...,
 	)
 }
 func (m *hunyuanProvider) buildHunyuanTextGenerationRequest(request *chatCompletionRequest) *hunyuanTextGenRequest {
 	hunyuanRequest := &hunyuanTextGenRequest{
 		Model:             request.Model,
 		Messages:          convertMessagesFromOpenAIToHunyuan(request.Messages),
 		Stream:            request.Stream,
 		StreamModeration:  false,
 		TopP:              float32(request.TopP),
 		Temperature:       float32(request.Temperature),
 		EnableEnhancement: false,
 	}
 	return hunyuanRequest
 }
 func convertMessagesFromOpenAIToHunyuan(openAIMessages []chatMessage) []hunyuanChatMessage {
 	// 将chatgpt的messages转换为hunyuan的messages
 	hunyuanChatMessages := make([]hunyuanChatMessage, 0, len(openAIMessages))
 	for _, msg := range openAIMessages {
 		hunyuanChatMessages = append(hunyuanChatMessages, hunyuanChatMessage{
 			Role:    msg.Role,
 			Content: msg.Content,
 		})
 	}
 	return hunyuanChatMessages
 }
 func (m *hunyuanProvider) buildChatCompletionResponse(ctx wrapper.HttpContext, hunyuanResponse *hunyuanTextGenResponseNonStreaming) *chatCompletionResponse {
 	choices := make([]chatCompletionChoice, 0, len(hunyuanResponse.Response.Choices))
 	for _, choice := range hunyuanResponse.Response.Choices {
 		choices = append(choices, chatCompletionChoice{
 			Message: &chatMessage{
 				Name:      "",
 				Role:      choice.Message.Role,
 				Content:   choice.Message.Content,
 				ToolCalls: nil,
 			},
 			FinishReason: choice.FinishReason,
 		})
 	}
 	return &chatCompletionResponse{
 		Id:                hunyuanResponse.Response.Id,
 		Created:           time.Now().UnixMilli() / 1000,
 		Model:             ctx.GetContext(ctxKeyFinalRequestModel).(string),
 		SystemFingerprint: "",
 		Object:            objectChatCompletion,
 		Choices:           choices,
 		Usage: chatCompletionUsage{
 			PromptTokens:     hunyuanResponse.Response.Usage.PromptTokens,
 			CompletionTokens: hunyuanResponse.Response.Usage.CompletionTokens,
 			TotalTokens:      hunyuanResponse.Response.Usage.TotalTokens,
 		},
 	}
 }
 func Sha256hex(s string) string {
 	b := sha256.Sum256([]byte(s))
 	return hex.EncodeToString(b[:])
 }
 func Hmacsha256(s, key string) string {
 	hashed := hmac.New(sha256.New, []byte(key))
 	hashed.Write([]byte(s))
 	return string(hashed.Sum(nil))
 }
 /**
 * @param secretId 秘钥id
 * @param secretKey 秘钥
 * @param timestamp 时间戳
 * @param host 目标域名
 * @param action 请求动作
 * @param payload 请求体
 * @return 签名
 */
 func GetTC3Authorizationcode(secretId string, secretKey string, timestamp int64, host string, action string, payload string) string {
 	algorithm := "TC3-HMAC-SHA256"
 	service := "hunyuan" // 注意，必须和域名中的产品名保持一致
 	// step 1: build canonical request string
 	httpRequestMethod := "POST"
 	canonicalURI := "/"
 	canonicalQueryString := ""
 	canonicalHeaders := fmt.Sprintf("content-type:%s\nhost:%s\nx-tc-action:%s\n",
 		"application/json", host, strings.ToLower(action))
 	signedHeaders := "content-type;host;x-tc-action"
 	// fmt.Println("payload is: %s", payload)
 	hashedRequestPayload := Sha256hex(payload)
 	canonicalRequest := fmt.Sprintf("%s\n%s\n%s\n%s\n%s\n%s",
 		httpRequestMethod,
 		canonicalURI,
 		canonicalQueryString,
 		canonicalHeaders,
 		signedHeaders,
 		hashedRequestPayload)
 	// fmt.Println(canonicalRequest)
 	// step 2: build string to sign
 	date := time.Unix(timestamp, 0).UTC().Format("2006-01-02")
 	credentialScope := fmt.Sprintf("%s/%s/tc3_request", date, service)
 	hashedCanonicalRequest := Sha256hex(canonicalRequest)
 	string2sign := fmt.Sprintf("%s\n%d\n%s\n%s",
 		algorithm,
 		timestamp,
 		credentialScope,
 		hashedCanonicalRequest)
 	// fmt.Println(string2sign)
 	// step 3: sign string
 	secretDate := Hmacsha256(date, "TC3"+secretKey)
 	secretService := Hmacsha256(service, secretDate)
 	secretSigning := Hmacsha256("tc3_request", secretService)
 	signature := hex.EncodeToString([]byte(Hmacsha256(string2sign, secretSigning)))
 	// fmt.Println(signature)
 	// step 4: build authorization
 	authorization := fmt.Sprintf("%s Credential=%s/%s, SignedHeaders=%s, Signature=%s",
 		algorithm,
 		secretId,
 		credentialScope,
 		signedHeaders,
 		signature)
 	// curl := fmt.Sprintf(`curl -X POST https://%s \
 	// 	-H "Authorization: %s" \
 	// 	-H "Content-Type: application/json" \
 	// 	-H "Host: %s" -H "X-TC-Action: %s" \
 	// 	-H "X-TC-Timestamp: %d" \
 	// 	-H "X-TC-Version: 2023-09-01" \
 	// 	-d '%s'`, host, authorization, host, action, timestamp, payload)
 	// fmt.Println(curl)
 	return authorization
 }
--- a/plugins/wasm-go/extensions/ai-proxy/provider/provider.go
+++ b/plugins/wasm-go/extensions/ai-proxy/provider/provider.go
@@ -25,13 +25,17 @@ const (
 	providerTypeDeepSeek = "deepseek"
 	providerTypeZhipuAi  = "zhipuai"
 	providerTypeOllama   = "ollama"
 	providerTypeHunyuan  = "hunyuan"
 	protocolOpenAI   = "openai"
 	protocolOriginal = "original"
-	roleSystem = "system"
+	roleSystem    = "system"
 	roleUser      = "user"
 	roleAssistant = "assistant"
 	ctxKeyIncrementalStreaming = "incrementalStreaming"
 	ctxKeyApiName              = "apiKey"
 	ctxKeyStreamingBody        = "streamingBody"
 	ctxKeyOriginalRequestModel = "originalRequestModel"
 	ctxKeyFinalRequestModel    = "finalRequestModel"
@@ -64,6 +68,7 @@ var (
 		providerTypeDeepSeek: &deepseekProviderInitializer{},
 		providerTypeZhipuAi:  &zhipuAiProviderInitializer{},
 		providerTypeOllama:   &ollamaProviderInitializer{},
 		providerTypeHunyuan:  &hunyuanProviderInitializer{},
 	}
 )
@@ -119,6 +124,12 @@ type ProviderConfig struct {
 	// @Title zh-CN Ollama Server Port
 	// @Description zh-CN 仅适用于 Ollama 服务。Ollama 服务器的端口号。
 	ollamaServerPort uint32 `required:"false" yaml:"ollamaServerPort" json:"ollamaServerPort"`
 	// @Title zh-CN hunyuan api key for authorization
 	// @Description zh-CN 仅适用于Hun Yuan AI服务鉴权，API key/id 参考：https://cloud.tencent.com/document/api/1729/101843#Golang
 	hunyuanAuthKey string `required:"false" yaml:"hunyuanAuthKey" json:"hunyuanAuthKey"`
 	// @Title zh-CN hunyuan api id for authorization
 	// @Description zh-CN 仅适用于Hun Yuan AI服务鉴权
 	hunyuanAuthId string `required:"false" yaml:"hunyuanAuthId" json:"hunyuanAuthId"`
 	// @Title zh-CN 模型名称映射表
 	// @Description zh-CN 用于将请求中的模型名称映射为目标AI服务商支持的模型名称。支持通过“*”来配置全局映射
 	modelMapping map[string]string `required:"false" yaml:"modelMapping" json:"modelMapping"`
@@ -162,6 +173,9 @@ func (c *ProviderConfig) FromJson(json gjson.Result) {
 		c.context = &ContextConfig{}
 		c.context.FromJson(contextJson)
 	}
 	c.hunyuanAuthId = json.Get("hunyuanAuthId").String()
 	c.hunyuanAuthKey = json.Get("hunyuanAuthKey").String()
 }
 func (c *ProviderConfig) Validate() error {
@@ -182,7 +196,6 @@ func (c *ProviderConfig) Validate() error {
 	if c.typ == "" {
 		return errors.New("missing type in provider config")
 	}
 	initializer, has := providerInitializers[c.typ]
 	if !has {