From c6e3db95e04af64ae2cc2c58ec892571f46c667d Mon Sep 17 00:00:00 2001 From: nash5 Date: Thu, 6 Jun 2024 18:11:51 +0800 Subject: [PATCH] feature: add hunyuan llm support for plugins/ai-proxy (#1018) Co-authored-by: Kent Dong --- plugins/wasm-go/extensions/ai-proxy/README.md | 76 ++- .../wasm-go/extensions/ai-proxy/README_dev.md | 46 ++ .../extensions/ai-proxy/provider/hunyuan.go | 563 ++++++++++++++++++ .../extensions/ai-proxy/provider/provider.go | 17 +- 4 files changed, 699 insertions(+), 3 deletions(-) create mode 100644 plugins/wasm-go/extensions/ai-proxy/provider/hunyuan.go diff --git a/plugins/wasm-go/extensions/ai-proxy/README.md b/plugins/wasm-go/extensions/ai-proxy/README.md index 1c101b381..96f0e4b84 100644 --- a/plugins/wasm-go/extensions/ai-proxy/README.md +++ b/plugins/wasm-go/extensions/ai-proxy/README.md @@ -106,6 +106,16 @@ Ollama 所对应的 `type` 为 `ollama`。它特有的配置字段如下: | `ollamaServerHost` | string | 必填 | - | Ollama 服务器的主机地址 | | `ollamaServerPort` | number | 必填 | - | Ollama 服务器的端口号,默认为11434 | +#### 混元 + +混元所对应的 `type` 为 `hunyuan`。它特有的配置字段如下: + +| 名称 | 数据类型 | 填写要求 | 默认值 | 描述 | +|-------------------|--------|------|-----|----------------------------------------------| +| `hunyuanAuthId` | string | 必填 | - | 混元用于v3版本认证的id | +| `hunyuanAuthKey` | string | 必填 | - | 混元用于v3版本认证的key | + + ## 用法示例 ### 使用 OpenAI 协议代理 Azure OpenAI 服务 @@ -546,6 +556,70 @@ provider: "stop_reason": "end_turn" } ``` +### 使用 OpenAI 协议代理混元服务 + +**配置信息** + +```yaml +provider: + type: "hunyuan" + hunyuanAuthKey: "" + apiTokens: + - "" + hunyuanAuthId: "" + timeout: 1200000 + modelMapping: + "*": "hunyuan-lite" +``` + +**请求示例** +请求脚本: +```sh + +curl --location 'http:///v1/chat/completions' \ +--header 'Content-Type: application/json' \ +--data '{ + "model": "gpt-3", + "messages": [ + { + "role": "system", + "content": "你是一个名专业的开发人员!" + }, + { + "role": "user", + "content": "你好,你是谁?" 
+ } + ], + "temperature": 0.3, + "stream": false +}' +``` + +**响应示例** + +```json +{ + "id": "fd140c3e-0b69-4b19-849b-d354d32a6162", + "choices": [ + { + "index": 0, + "delta": { + "role": "assistant", + "content": "你好!我是一名专业的开发人员。" + }, + "finish_reason": "stop" + } + ], + "created": 1717493117, + "model": "hunyuan-lite", + "object": "chat.completion", + "usage": { + "prompt_tokens": 15, + "completion_tokens": 9, + "total_tokens": 24 + } +} +``` ## 完整配置示例 @@ -619,4 +693,4 @@ curl "http:///v1/chat/completions" -H "Content-Type: application/js } ] }' -``` \ No newline at end of file +``` diff --git a/plugins/wasm-go/extensions/ai-proxy/README_dev.md b/plugins/wasm-go/extensions/ai-proxy/README_dev.md index 0d82655ab..70634fc88 100644 --- a/plugins/wasm-go/extensions/ai-proxy/README_dev.md +++ b/plugins/wasm-go/extensions/ai-proxy/README_dev.md @@ -13,6 +13,52 @@ DOCKER_BUILDKIT=1; docker build --build-arg PLUGIN_NAME=ai-proxy --build-arg EXT ```powershell $env:DOCKER_BUILDKIT=1; docker build --build-arg PLUGIN_NAME=ai-proxy --build-arg EXTRA_TAGS=proxy_wasm_version_0_2_100 --build-arg BUILDER=higress-registry.cn-hangzhou.cr.aliyuncs.com/plugins/wasm-go-builder:go1.19-tinygo0.28.1-oras1.0.0 -t ai-proxy:0.0.1 --output .\out ..\.. 
 ```
+
+## 本地运行
+参考:https://higress.io/zh-cn/docs/user/wasm-go
+需要注意的是,higress/plugins/wasm-go/extensions/ai-proxy/envoy.yaml中的clusters字段,记得改成你需要的地址,比如混元的话,就会有如下的一个cluster的配置:
+```yaml
+<省略>
+static_resources:
+<省略>
+  clusters:
+      load_assignment:
+        cluster_name: moonshot
+        endpoints:
+          - lb_endpoints:
+              - endpoint:
+                  address:
+                    socket_address:
+                      address: hunyuan.tencentcloudapi.com
+                      port_value: 443
+    transport_socket:
+      name: envoy.transport_sockets.tls
+      typed_config:
+        "@type": type.googleapis.com/envoy.extensions.transport_sockets.tls.v3.UpstreamTlsContext
+        "sni": "hunyuan.tencentcloudapi.com"
+```
+
+而后你就可以在本地的pod中查看相应的输出,请求样例如下:
+```sh
+curl --location 'http://127.0.0.1:10000/v1/chat/completions' \
+--header 'Content-Type: application/json' \
+--data '{
+    "model": "gpt-3",
+    "messages": [
+        {
+            "role": "system",
+            "content": "你是一名专业的开发人员!"
+        },
+        {
+            "role": "user",
+            "content": "你好,你是谁?"
+        }
+    ],
+    "temperature": 0.3,
+    "stream": false
+}'
+```
+
 ## 测试须知
 
 由于 `ai-proxy` 插件使用了 Higress 对数据面定制的特殊功能,因此在测试时需要使用版本不低于 1.4.0-rc.1 的 Higress Gateway 镜像。
\ No newline at end of file
diff --git a/plugins/wasm-go/extensions/ai-proxy/provider/hunyuan.go b/plugins/wasm-go/extensions/ai-proxy/provider/hunyuan.go
new file mode 100644
index 000000000..ae22a3ba7
--- /dev/null
+++ b/plugins/wasm-go/extensions/ai-proxy/provider/hunyuan.go
@@ -0,0 +1,563 @@
+package provider
+
+import (
+	"bytes"
+	"crypto/hmac"
+	"crypto/sha256"
+	"encoding/hex"
+	"encoding/json"
+	"errors"
+	"fmt"
+	"strings"
+	"time"
+
+	"github.com/alibaba/higress/plugins/wasm-go/extensions/ai-proxy/util"
+	"github.com/alibaba/higress/plugins/wasm-go/pkg/wrapper"
+	"github.com/higress-group/proxy-wasm-go-sdk/proxywasm"
+	"github.com/higress-group/proxy-wasm-go-sdk/proxywasm/types"
+)
+
+// hunyuanProvider is the provider for hunyuan AI service. 
+ +const ( + hunyuanDomain = "hunyuan.tencentcloudapi.com" + hunyuanRequestPath = "/" + hunyuanChatCompletionTCAction = "ChatCompletions" + + // headers necessary for TC hunyuan api call: + // ref: https://cloud.tencent.com/document/api/1729/105701, https://cloud.tencent.com/document/api/1729/101842 + actionKey = "X-TC-Action" + timestampKey = "X-TC-Timestamp" + authorizationKey = "Authorization" + versionKey = "X-TC-Version" + versionValue = "2023-09-01" + hostKey = "Host" + + ssePrefix = "data: " // Server-Sent Events (SSE) 类型的流式响应的开始标记 + hunyuanStreamEndMark = "stop" // 混元的流式的finishReason为stop时,表示结束 + + hunyuanAuthKeyLen = 32 + hunyuanAuthIdLen = 36 +) + +type hunyuanProviderInitializer struct { +} + +// ref: https://console.cloud.tencent.com/api/explorer?Product=hunyuan&Version=2023-09-01&Action=ChatCompletions +type hunyuanTextGenRequest struct { + Model string `json:"Model"` + Messages []hunyuanChatMessage `json:"Messages"` + Stream bool `json:"Stream,omitempty"` + StreamModeration bool `json:"StreamModeration,omitempty"` + TopP float32 `json:"TopP,omitempty"` + Temperature float32 `json:"Temperature,omitempty"` + EnableEnhancement bool `json:"EnableEnhancement,omitempty"` +} + +type hunyuanTextGenResponseNonStreaming struct { + Response hunyuanTextGenDetailedResponseNonStreaming `json:"Response"` +} + +type hunyuanTextGenDetailedResponseNonStreaming struct { + RequestId string `json:"RequestId,omitempty"` + Note string `json:"Note"` + Choices []hunyuanTextGenChoice `json:"Choices"` + Created int64 `json:"Created"` + Id string `json:"Id"` + Usage hunyuanTextGenUsage `json:"Usage"` +} + +type hunyuanTextGenChoice struct { + FinishReason string `json:"FinishReason"` + Message hunyuanChatMessage `json:"Message,omitempty"` // 当非流式返回时存储大模型生成文字 + Delta hunyuanChatMessage `json:"Delta,omitempty"` // 流式返回时存储大模型生成文字 +} + +type hunyuanTextGenUsage struct { + PromptTokens int `json:"PromptTokens"` + CompletionTokens int `json:"CompletionTokens"` + TotalTokens int 
`json:"TotalTokens"` +} + +type hunyuanChatMessage struct { + Role string `json:"Role,omitempty"` + Content string `json:"Content,omitempty"` +} + +func (m *hunyuanProviderInitializer) ValidateConfig(config ProviderConfig) error { + // 校验hunyuan id 和 key的合法性 + if len(config.hunyuanAuthId) != hunyuanAuthIdLen || len(config.hunyuanAuthKey) != hunyuanAuthKeyLen { + return errors.New("hunyuanAuthId / hunyuanAuthKey is illegal in config file") + } + return nil +} + +func (m *hunyuanProviderInitializer) CreateProvider(config ProviderConfig) (Provider, error) { + return &hunyuanProvider{ + config: config, + client: wrapper.NewClusterClient(wrapper.RouteCluster{ + Host: hunyuanDomain, + }), + contextCache: createContextCache(&config), + }, nil +} + +type hunyuanProvider struct { + config ProviderConfig + + client wrapper.HttpClient + contextCache *contextCache +} + +func (m *hunyuanProvider) GetProviderType() string { + return providerTypeHunyuan +} + +func (m *hunyuanProvider) OnRequestHeaders(ctx wrapper.HttpContext, apiName ApiName, log wrapper.Log) (types.Action, error) { + // log.Debugf("hunyuanProvider.OnRequestHeaders called! 
hunyunSecretKey/id is: %s/%s", m.config.hunyuanAuthKey, m.config.hunyuanAuthId) + if apiName != ApiNameChatCompletion { + return types.ActionContinue, errUnsupportedApiName + } + + _ = util.OverwriteRequestHost(hunyuanDomain) + _ = util.OverwriteRequestPath(hunyuanRequestPath) + + // 添加hunyuan需要的自定义字段 + _ = proxywasm.ReplaceHttpRequestHeader(actionKey, hunyuanChatCompletionTCAction) + _ = proxywasm.ReplaceHttpRequestHeader(versionKey, versionValue) + + // 删除一些字段 + _ = proxywasm.RemoveHttpRequestHeader("Accept-Encoding") + _ = proxywasm.RemoveHttpRequestHeader("Content-Length") + + // Delay the header processing to allow changing streaming mode in OnRequestBody + return types.HeaderStopIteration, nil +} + +func (m *hunyuanProvider) OnRequestBody(ctx wrapper.HttpContext, apiName ApiName, body []byte, log wrapper.Log) (types.Action, error) { + if apiName != ApiNameChatCompletion { + return types.ActionContinue, errUnsupportedApiName + } + + // 为header添加时间戳字段 (因为需要根据body进行签名时依赖时间戳,故于body处理部分创建时间戳) + var timestamp int64 = time.Now().Unix() + _ = proxywasm.ReplaceHttpRequestHeader(timestampKey, fmt.Sprintf("%d", timestamp)) + // log.Debugf("#debug nash5# OnRequestBody set timestamp header: ", timestamp) + + // 使用混元本身接口的协议 + if m.config.protocol == protocolOriginal { + request := &hunyuanTextGenRequest{} + + if err := json.Unmarshal(body, request); err != nil { + return types.ActionContinue, fmt.Errorf("unable to unmarshal request: %v", err) + } + + // 根据确定好的payload进行签名 + hunyuanBody, _ := json.Marshal(request) + authorizedValueNew := GetTC3Authorizationcode(m.config.hunyuanAuthId, m.config.hunyuanAuthKey, timestamp, hunyuanDomain, hunyuanChatCompletionTCAction, string(hunyuanBody)) + _ = proxywasm.ReplaceHttpRequestHeader(authorizationKey, authorizedValueNew) + _ = proxywasm.ReplaceHttpRequestHeader("Accept", "*/*") + // log.Debugf("#debug nash5# OnRequestBody call hunyuan api using original api! 
signature computation done!") + + // 若无配置文件,直接返回 + if m.config.context == nil { + return types.ActionContinue, replaceJsonRequestBody(request, log) + } + err := m.contextCache.GetContent(func(content string, err error) { + log.Debugf("#debug nash5# ctx file loaded! callback start, content is: %s", content) + defer func() { + _ = proxywasm.ResumeHttpRequest() + }() + + if err != nil { + log.Errorf("failed to load context file: %v", err) + _ = util.SendResponse(500, util.MimeTypeTextPlain, fmt.Sprintf("failed to load context file: %v", err)) + } + m.insertContextMessageIntoHunyuanRequest(request, content) + + // 因为手动插入了context内容,这里需要重新计算签名 + hunyuanBody, _ := json.Marshal(request) + authorizedValueNew := GetTC3Authorizationcode(m.config.hunyuanAuthId, m.config.hunyuanAuthKey, timestamp, hunyuanDomain, hunyuanChatCompletionTCAction, string(hunyuanBody)) + _ = proxywasm.ReplaceHttpRequestHeader(authorizationKey, authorizedValueNew) + + if err := replaceJsonRequestBody(request, log); err != nil { + _ = util.SendResponse(500, util.MimeTypeTextPlain, fmt.Sprintf("failed to replace request body: %v", err)) + } + }, log) + if err == nil { + log.Debugf("#debug nash5# ctx file load success!") + return types.ActionPause, nil + } + + log.Debugf("#debug nash5# ctx file load failed!") + return types.ActionContinue, replaceJsonRequestBody(request, log) + } + + // 使用open ai接口协议 + request := &chatCompletionRequest{} + if err := decodeChatCompletionRequest(body, request); err != nil { + return types.ActionContinue, err + } + // log.Debugf("#debug nash5# OnRequestBody call hunyuan api using openai's api!") + + model := request.Model + if model == "" { + return types.ActionContinue, errors.New("missing model in chat completion request") + } + ctx.SetContext(ctxKeyOriginalRequestModel, model) // 设置原始请求的model,以便返回值使用 + mappedModel := getMappedModel(model, m.config.modelMapping, log) + if mappedModel == "" { + return types.ActionContinue, errors.New("model becomes empty after applying the 
configured mapping")
+	}
+	request.Model = mappedModel
+	ctx.SetContext(ctxKeyFinalRequestModel, request.Model) // 设置真实请求的模型,以便返回值使用
+
+	// 看请求中的stream的设置,相应的我们更改http头
+	streaming := request.Stream
+	if streaming {
+		_ = proxywasm.ReplaceHttpRequestHeader("Accept", "text/event-stream")
+	} else {
+		_ = proxywasm.ReplaceHttpRequestHeader("Accept", "*/*")
+	}
+
+	// 若没有配置上下文,直接开始请求
+	if m.config.context == nil {
+		hunyuanRequest := m.buildHunyuanTextGenerationRequest(request)
+
+		// 根据确定好的payload进行签名:
+		body, _ := json.Marshal(hunyuanRequest)
+		authorizedValueNew := GetTC3Authorizationcode(
+			m.config.hunyuanAuthId,
+			m.config.hunyuanAuthKey,
+			timestamp,
+			hunyuanDomain,
+			hunyuanChatCompletionTCAction,
+			string(body),
+		)
+		_ = proxywasm.ReplaceHttpRequestHeader(authorizationKey, authorizedValueNew)
+		// log.Debugf("#debug nash5# OnRequestBody done, body is: ", string(body))
+
+		// // 打印所有的headers
+		// headers, err2 := proxywasm.GetHttpRequestHeaders()
+		// if err2 != nil {
+		// 	log.Errorf("failed to get request headers: %v", err2)
+		// } else {
+		// 	// 迭代并打印所有请求头
+		// 	for _, header := range headers {
+		// 		log.Infof("#debug nash5# inB Request header - %s: %s", header[0], header[1])
+		// 	}
+		// }
+		return types.ActionContinue, replaceJsonRequestBody(hunyuanRequest, log)
+	}
+
+	err := m.contextCache.GetContent(func(content string, err error) {
+		defer func() {
+			_ = proxywasm.ResumeHttpRequest()
+		}()
+		if err != nil {
+			log.Errorf("failed to load context file: %v", err)
+			_ = util.SendResponse(500, util.MimeTypeTextPlain, fmt.Sprintf("failed to load context file: %v", err))
+			return
+		}
+		insertContextMessage(request, content)
+		hunyuanRequest := m.buildHunyuanTextGenerationRequest(request)
+
+		// 因为手动插入了context内容,这里需要重新计算签名
+		hunyuanBody, _ := json.Marshal(hunyuanRequest)
+		authorizedValueNew := GetTC3Authorizationcode(m.config.hunyuanAuthId, m.config.hunyuanAuthKey, timestamp, hunyuanDomain, hunyuanChatCompletionTCAction, string(hunyuanBody))
+		_ = 
proxywasm.ReplaceHttpRequestHeader(authorizationKey, authorizedValueNew) + + if err := replaceJsonRequestBody(hunyuanRequest, log); err != nil { + _ = util.SendResponse(500, util.MimeTypeTextPlain, fmt.Sprintf("failed to replace request body: %v", err)) + } + }, log) + if err == nil { + return types.ActionPause, nil + } + return types.ActionContinue, err +} + +func (m *hunyuanProvider) OnResponseHeaders(ctx wrapper.HttpContext, apiName ApiName, log wrapper.Log) (types.Action, error) { + _ = proxywasm.RemoveHttpResponseHeader("Content-Length") + return types.ActionContinue, nil +} + +func (m *hunyuanProvider) OnStreamingResponseBody(ctx wrapper.HttpContext, name ApiName, chunk []byte, isLastChunk bool, log wrapper.Log) ([]byte, error) { + if m.config.protocol == protocolOriginal { + return chunk, nil + } + + // hunyuan的流式返回: + //data: {"Note":"以上内容为AI生成,不代表开发者立场,请勿删除或修改本标记","Choices":[{"Delta":{"Role":"assistant","Content":"有助于"},"FinishReason":""}],"Created":1716359713,"Id":"086b6b19-8b2c-4def-a65c-db6a7bc86acd","Usage":{"PromptTokens":7,"CompletionTokens":145,"TotalTokens":152}} + + // openai的流式返回 + // data: {"id": "chatcmpl-7QyqpwdfhqwajicIEznoc6Q47XAyW", "object": "chat.completion.chunk", "created": 1677664795, "model": "gpt-3.5-turbo-0613", "choices": [{"delta": {"content": "The "}, "index": 0, "finish_reason": null}]} + + // log.Debugf("#debug nash5# [OnStreamingResponseBody] chunk is: %s", string(chunk)) + + // 从上下文获取现有缓冲区数据 + newBufferedBody := chunk + if bufferedBody, has := ctx.GetContext(ctxKeyStreamingBody).([]byte); has { + newBufferedBody = append(bufferedBody, chunk...) 
+ } + + // 初始化处理下标,以及将要返回的处理过的chunks + var newEventPivot = -1 + var outputBuffer []byte + + // 从buffer区取出若干完整的chunk,将其转为openAI格式后返回 + // 处理可能包含多个事件的缓冲区 + for { + eventStartIndex := bytes.Index(newBufferedBody, []byte(ssePrefix)) + if eventStartIndex == -1 { + break // 没有找到新事件,跳出循环 + } + + // 移除缓冲区前面非事件部分 + newBufferedBody = newBufferedBody[eventStartIndex+len(ssePrefix):] + + // 查找事件结束的位置(即下一个事件的开始) + newEventPivot = bytes.Index(newBufferedBody, []byte("\n\n")) + if newEventPivot == -1 && !isLastChunk { + // 未找到事件结束标识,跳出循环等待更多数据,若是最后一个chunk,不一定有2个换行符 + break + } + + // 提取并处理一个完整的事件 + eventData := newBufferedBody[:newEventPivot] + // log.Debugf("@@@ <<< ori chun is: %s", string(newBufferedBody[:newEventPivot])) + newBufferedBody = newBufferedBody[newEventPivot+2:] // 跳过结束标识 + + // 转换并追加到输出缓冲区 + convertedData, _ := m.convertChunkFromHunyuanToOpenAI(ctx, eventData, log) + // log.Debugf("@@@ >>> converted one chunk: %s", string(convertedData)) + outputBuffer = append(outputBuffer, convertedData...) 
+ } + + // 刷新剩余的不完整事件回到上下文缓冲区以便下次继续处理 + ctx.SetContext(ctxKeyStreamingBody, newBufferedBody) + + log.Debugf("=== modified response chunk: %s", string(outputBuffer)) + return outputBuffer, nil +} + +func (m *hunyuanProvider) convertChunkFromHunyuanToOpenAI(ctx wrapper.HttpContext, hunyuanChunk []byte, log wrapper.Log) ([]byte, error) { + // 将hunyuan的chunk转为openai的chunk + hunyuanFormattedChunk := &hunyuanTextGenDetailedResponseNonStreaming{} + if err := json.Unmarshal(hunyuanChunk, hunyuanFormattedChunk); err != nil { + return []byte(""), nil + } + + openAIFormattedChunk := &chatCompletionResponse{ + Id: hunyuanFormattedChunk.Id, + Created: time.Now().UnixMilli() / 1000, + Model: ctx.GetContext(ctxKeyFinalRequestModel).(string), + SystemFingerprint: "", + Object: objectChatCompletionChunk, + Usage: chatCompletionUsage{ + PromptTokens: hunyuanFormattedChunk.Usage.PromptTokens, + CompletionTokens: hunyuanFormattedChunk.Usage.CompletionTokens, + TotalTokens: hunyuanFormattedChunk.Usage.TotalTokens, + }, + } + // tmpStr3, _ := json.Marshal(hunyuanFormattedChunk) + // log.Debugf("@@@ --- 源数据是:: %s", tmpStr3) + + // 是否为最后一个chunk? 
+ if hunyuanFormattedChunk.Choices[0].FinishReason == hunyuanStreamEndMark { + // log.Debugf("@@@ --- 最后chunk: ") + openAIFormattedChunk.Choices = append(openAIFormattedChunk.Choices, chatCompletionChoice{ + FinishReason: hunyuanFormattedChunk.Choices[0].FinishReason, + }) + } else { + deltaMsg := chatMessage{ + Name: "", + Role: hunyuanFormattedChunk.Choices[0].Delta.Role, + Content: hunyuanFormattedChunk.Choices[0].Delta.Content, + ToolCalls: []toolCall{}, + } + + // tmpStr2, _ := json.Marshal(deltaMsg) + // log.Debugf("@@@ --- 中间chunk: choices.chatMsg 是: %s", tmpStr2) + + openAIFormattedChunk.Choices = append( + openAIFormattedChunk.Choices, + chatCompletionChoice{Delta: &deltaMsg}, + ) + // tmpStr, _ := json.Marshal(openAIFormattedChunk.Choices) + // log.Debugf("@@@ --- 中间chunk: choices 是: %s", tmpStr) + } + + // 返回的格式 + openAIFormattedChunkBytes, _ := json.Marshal(openAIFormattedChunk) + var openAIChunk strings.Builder + openAIChunk.WriteString(ssePrefix) + openAIChunk.WriteString(string(openAIFormattedChunkBytes)) + openAIChunk.WriteString("\n\n") + + return []byte(openAIChunk.String()), nil +} + +func (m *hunyuanProvider) OnResponseBody(ctx wrapper.HttpContext, apiName ApiName, body []byte, log wrapper.Log) (types.Action, error) { + + log.Debugf("#debug nash5# onRespBody's resp is: %s", string(body)) + hunyuanResponse := &hunyuanTextGenResponseNonStreaming{} + if err := json.Unmarshal(body, hunyuanResponse); err != nil { + return types.ActionContinue, fmt.Errorf("unable to unmarshal hunyuan response: %v", err) + } + + if m.config.protocol == protocolOriginal { + return types.ActionContinue, replaceJsonResponseBody(hunyuanResponse, log) + } + + response := m.buildChatCompletionResponse(ctx, hunyuanResponse) + + return types.ActionContinue, replaceJsonResponseBody(response, log) +} + +func (m *hunyuanProvider) insertContextMessageIntoHunyuanRequest(request *hunyuanTextGenRequest, content string) { + + fileMessage := hunyuanChatMessage{ + Role: roleSystem, + 
Content: content, + } + messages := request.Messages + request.Messages = append([]hunyuanChatMessage{}, + append([]hunyuanChatMessage{fileMessage}, messages...)..., + ) +} + +func (m *hunyuanProvider) buildHunyuanTextGenerationRequest(request *chatCompletionRequest) *hunyuanTextGenRequest { + hunyuanRequest := &hunyuanTextGenRequest{ + Model: request.Model, + Messages: convertMessagesFromOpenAIToHunyuan(request.Messages), + Stream: request.Stream, + StreamModeration: false, + TopP: float32(request.TopP), + Temperature: float32(request.Temperature), + EnableEnhancement: false, + } + + return hunyuanRequest +} + +func convertMessagesFromOpenAIToHunyuan(openAIMessages []chatMessage) []hunyuanChatMessage { + // 将chatgpt的messages转换为hunyuan的messages + hunyuanChatMessages := make([]hunyuanChatMessage, 0, len(openAIMessages)) + for _, msg := range openAIMessages { + hunyuanChatMessages = append(hunyuanChatMessages, hunyuanChatMessage{ + Role: msg.Role, + Content: msg.Content, + }) + } + + return hunyuanChatMessages +} + +func (m *hunyuanProvider) buildChatCompletionResponse(ctx wrapper.HttpContext, hunyuanResponse *hunyuanTextGenResponseNonStreaming) *chatCompletionResponse { + choices := make([]chatCompletionChoice, 0, len(hunyuanResponse.Response.Choices)) + for _, choice := range hunyuanResponse.Response.Choices { + choices = append(choices, chatCompletionChoice{ + Message: &chatMessage{ + Name: "", + Role: choice.Message.Role, + Content: choice.Message.Content, + ToolCalls: nil, + }, + FinishReason: choice.FinishReason, + }) + } + return &chatCompletionResponse{ + Id: hunyuanResponse.Response.Id, + Created: time.Now().UnixMilli() / 1000, + Model: ctx.GetContext(ctxKeyFinalRequestModel).(string), + SystemFingerprint: "", + Object: objectChatCompletion, + Choices: choices, + Usage: chatCompletionUsage{ + PromptTokens: hunyuanResponse.Response.Usage.PromptTokens, + CompletionTokens: hunyuanResponse.Response.Usage.CompletionTokens, + TotalTokens: 
hunyuanResponse.Response.Usage.TotalTokens, + }, + } +} + +func Sha256hex(s string) string { + b := sha256.Sum256([]byte(s)) + return hex.EncodeToString(b[:]) +} + +func Hmacsha256(s, key string) string { + hashed := hmac.New(sha256.New, []byte(key)) + hashed.Write([]byte(s)) + return string(hashed.Sum(nil)) +} + +/** + * @param secretId 秘钥id + * @param secretKey 秘钥 + * @param timestamp 时间戳 + * @param host 目标域名 + * @param action 请求动作 + * @param payload 请求体 + * @return 签名 + */ +func GetTC3Authorizationcode(secretId string, secretKey string, timestamp int64, host string, action string, payload string) string { + algorithm := "TC3-HMAC-SHA256" + service := "hunyuan" // 注意,必须和域名中的产品名保持一致 + + // step 1: build canonical request string + httpRequestMethod := "POST" + canonicalURI := "/" + canonicalQueryString := "" + canonicalHeaders := fmt.Sprintf("content-type:%s\nhost:%s\nx-tc-action:%s\n", + "application/json", host, strings.ToLower(action)) + signedHeaders := "content-type;host;x-tc-action" + + // fmt.Println("payload is: %s", payload) + hashedRequestPayload := Sha256hex(payload) + canonicalRequest := fmt.Sprintf("%s\n%s\n%s\n%s\n%s\n%s", + httpRequestMethod, + canonicalURI, + canonicalQueryString, + canonicalHeaders, + signedHeaders, + hashedRequestPayload) + // fmt.Println(canonicalRequest) + + // step 2: build string to sign + date := time.Unix(timestamp, 0).UTC().Format("2006-01-02") + credentialScope := fmt.Sprintf("%s/%s/tc3_request", date, service) + hashedCanonicalRequest := Sha256hex(canonicalRequest) + string2sign := fmt.Sprintf("%s\n%d\n%s\n%s", + algorithm, + timestamp, + credentialScope, + hashedCanonicalRequest) + // fmt.Println(string2sign) + + // step 3: sign string + secretDate := Hmacsha256(date, "TC3"+secretKey) + secretService := Hmacsha256(service, secretDate) + secretSigning := Hmacsha256("tc3_request", secretService) + signature := hex.EncodeToString([]byte(Hmacsha256(string2sign, secretSigning))) + // fmt.Println(signature) + + // step 4: 
build authorization + authorization := fmt.Sprintf("%s Credential=%s/%s, SignedHeaders=%s, Signature=%s", + algorithm, + secretId, + credentialScope, + signedHeaders, + signature) + + // curl := fmt.Sprintf(`curl -X POST https://%s \ + // -H "Authorization: %s" \ + // -H "Content-Type: application/json" \ + // -H "Host: %s" -H "X-TC-Action: %s" \ + // -H "X-TC-Timestamp: %d" \ + // -H "X-TC-Version: 2023-09-01" \ + // -d '%s'`, host, authorization, host, action, timestamp, payload) + // fmt.Println(curl) + return authorization +} diff --git a/plugins/wasm-go/extensions/ai-proxy/provider/provider.go b/plugins/wasm-go/extensions/ai-proxy/provider/provider.go index cd0a0aba4..5ac17fee0 100644 --- a/plugins/wasm-go/extensions/ai-proxy/provider/provider.go +++ b/plugins/wasm-go/extensions/ai-proxy/provider/provider.go @@ -25,13 +25,17 @@ const ( providerTypeDeepSeek = "deepseek" providerTypeZhipuAi = "zhipuai" providerTypeOllama = "ollama" + providerTypeHunyuan = "hunyuan" protocolOpenAI = "openai" protocolOriginal = "original" - roleSystem = "system" + roleSystem = "system" + roleUser = "user" + roleAssistant = "assistant" ctxKeyIncrementalStreaming = "incrementalStreaming" + ctxKeyApiName = "apiKey" ctxKeyStreamingBody = "streamingBody" ctxKeyOriginalRequestModel = "originalRequestModel" ctxKeyFinalRequestModel = "finalRequestModel" @@ -64,6 +68,7 @@ var ( providerTypeDeepSeek: &deepseekProviderInitializer{}, providerTypeZhipuAi: &zhipuAiProviderInitializer{}, providerTypeOllama: &ollamaProviderInitializer{}, + providerTypeHunyuan: &hunyuanProviderInitializer{}, } ) @@ -119,6 +124,12 @@ type ProviderConfig struct { // @Title zh-CN Ollama Server Port // @Description zh-CN 仅适用于 Ollama 服务。Ollama 服务器的端口号。 ollamaServerPort uint32 `required:"false" yaml:"ollamaServerPort" json:"ollamaServerPort"` + // @Title zh-CN hunyuan api key for authorization + // @Description zh-CN 仅适用于Hun Yuan AI服务鉴权,API key/id 参考:https://cloud.tencent.com/document/api/1729/101843#Golang + 
hunyuanAuthKey string `required:"false" yaml:"hunyuanAuthKey" json:"hunyuanAuthKey"` + // @Title zh-CN hunyuan api id for authorization + // @Description zh-CN 仅适用于Hun Yuan AI服务鉴权 + hunyuanAuthId string `required:"false" yaml:"hunyuanAuthId" json:"hunyuanAuthId"` // @Title zh-CN 模型名称映射表 // @Description zh-CN 用于将请求中的模型名称映射为目标AI服务商支持的模型名称。支持通过“*”来配置全局映射 modelMapping map[string]string `required:"false" yaml:"modelMapping" json:"modelMapping"` @@ -162,6 +173,9 @@ func (c *ProviderConfig) FromJson(json gjson.Result) { c.context = &ContextConfig{} c.context.FromJson(contextJson) } + + c.hunyuanAuthId = json.Get("hunyuanAuthId").String() + c.hunyuanAuthKey = json.Get("hunyuanAuthKey").String() } func (c *ProviderConfig) Validate() error { @@ -182,7 +196,6 @@ func (c *ProviderConfig) Validate() error { if c.typ == "" { return errors.New("missing type in provider config") - } initializer, has := providerInitializers[c.typ] if !has {