# Mirror of https://github.com/alibaba/higress.git
# Synced 2026-03-16 16:30:47 +08:00
# 206 lines, 5.3 KiB, YAML
# Copyright (c) 2025 Alibaba Group Holding Ltd.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# Ingress for the Baidu provider case: every path (Prefix "/") on host
# "qianfan.baidubce.com" is sent to llm-mock-service on port 3000.
apiVersion: networking.k8s.io/v1
kind: Ingress
metadata:
  name: wasmplugin-ai-proxy-baidu
  namespace: higress-conformance-ai-backend
spec:
  ingressClassName: higress
  rules:
    - host: "qianfan.baidubce.com"
      http:
        paths:
          - pathType: Prefix
            path: "/"
            backend:
              service:
                name: llm-mock-service
                port:
                  number: 3000
---
# Ingress for the Doubao provider case: every path (Prefix "/") on host
# "ark.cn-beijing.volces.com" is sent to llm-mock-service on port 3000.
apiVersion: networking.k8s.io/v1
kind: Ingress
metadata:
  name: wasmplugin-ai-proxy-doubao
  namespace: higress-conformance-ai-backend
spec:
  ingressClassName: higress
  rules:
    - host: "ark.cn-beijing.volces.com"
      http:
        paths:
          - pathType: Prefix
            path: "/"
            backend:
              service:
                name: llm-mock-service
                port:
                  number: 3000
---
# Ingress for the MiniMax "v2-api" case: every path (Prefix "/") on host
# "api.minimax.chat-v2-api" is sent to llm-mock-service on port 3000.
# The "-v2-api" host suffix mirrors the Ingress name and keeps this host
# distinct from the "-pro-api" Ingress in this file.
apiVersion: networking.k8s.io/v1
kind: Ingress
metadata:
  name: wasmplugin-ai-proxy-minimax-v2-api
  namespace: higress-conformance-ai-backend
spec:
  ingressClassName: higress
  rules:
    - host: "api.minimax.chat-v2-api"
      http:
        paths:
          - pathType: Prefix
            path: "/"
            backend:
              service:
                name: llm-mock-service
                port:
                  number: 3000
---
# Ingress for the MiniMax "pro-api" case: every path (Prefix "/") on host
# "api.minimax.chat-pro-api" is sent to llm-mock-service on port 3000.
# The "-pro-api" host suffix mirrors the Ingress name and keeps this host
# distinct from the "-v2-api" Ingress in this file.
apiVersion: networking.k8s.io/v1
kind: Ingress
metadata:
  name: wasmplugin-ai-proxy-minimax-pro-api
  namespace: higress-conformance-ai-backend
spec:
  ingressClassName: higress
  rules:
    - host: "api.minimax.chat-pro-api"
      http:
        paths:
          - pathType: Prefix
            path: "/"
            backend:
              service:
                name: llm-mock-service
                port:
                  number: 3000
---
# Ingress for the Qwen compatible-mode case: every path (Prefix "/") on host
# "dashscope.aliyuncs.com-compatible-mode" is sent to llm-mock-service on
# port 3000. The "-compatible-mode" host suffix mirrors the Ingress name and
# keeps this host distinct from the plain "dashscope.aliyuncs.com" Ingress.
apiVersion: networking.k8s.io/v1
kind: Ingress
metadata:
  name: wasmplugin-ai-proxy-qwen-compatible-mode
  namespace: higress-conformance-ai-backend
spec:
  ingressClassName: higress
  rules:
    - host: "dashscope.aliyuncs.com-compatible-mode"
      http:
        paths:
          - pathType: Prefix
            path: "/"
            backend:
              service:
                name: llm-mock-service
                port:
                  number: 3000
---
# Ingress for the Qwen case: every path (Prefix "/") on host
# "dashscope.aliyuncs.com" is sent to llm-mock-service on port 3000.
apiVersion: networking.k8s.io/v1
kind: Ingress
metadata:
  name: wasmplugin-ai-proxy-qwen
  namespace: higress-conformance-ai-backend
spec:
  ingressClassName: higress
  rules:
    - host: "dashscope.aliyuncs.com"
      http:
        paths:
          - pathType: Prefix
            path: "/"
            backend:
              service:
                name: llm-mock-service
                port:
                  number: 3000
---
# WasmPlugin "ai-proxy" (namespace higress-system), loaded from the OCI image
# given in spec.url. Each matchRules entry pairs one provider config with one
# Ingress, referenced as "<namespace>/<ingress-name>". All entries use the
# placeholder token "fake_token".
apiVersion: extensions.higress.io/v1alpha1
kind: WasmPlugin
metadata:
  name: ai-proxy
  namespace: higress-system
spec:
  defaultConfigDisable: true
  phase: UNSPECIFIED_PHASE
  priority: 100
  matchRules:
    # Baidu: both listed model keys map to ernie-3.5-8k.
    - config:
        provider:
          apiTokens:
            - fake_token
          modelMapping:
            'gpt-3': ernie-3.5-8k
            '*': ernie-3.5-8k
          type: baidu
      ingress:
        - higress-conformance-ai-backend/wasmplugin-ai-proxy-baidu
    # Doubao: only a '*' entry is configured.
    - config:
        provider:
          apiTokens:
            - fake_token
          modelMapping:
            '*': fake_doubao_endpoint
          type: doubao
      ingress:
        - higress-conformance-ai-backend/wasmplugin-ai-proxy-doubao
    # MiniMax without minimaxApiType/minimaxGroupId, bound to the v2-api
    # Ingress.
    - config:
        provider:
          apiTokens:
            - fake_token
          modelMapping:
            'gpt-3': abab6.5s-chat
            'gpt-4': abab6.5g-chat
            '*': abab6.5t-chat
          type: minimax
      ingress:
        - higress-conformance-ai-backend/wasmplugin-ai-proxy-minimax-v2-api
    # MiniMax with minimaxApiType "pro", bound to the pro-api Ingress.
    - config:
        provider:
          apiTokens:
            - fake_token
          modelMapping:
            'gpt-3': abab6.5s-chat
            'gpt-4': abab6.5g-chat
            '*': abab6.5t-chat
          type: minimax
          minimaxApiType: pro
          # NOTE(review): unquoted, so this is emitted as an integer; confirm
          # whether the plugin expects a string ID before quoting it.
          minimaxGroupId: 1
      ingress:
        - higress-conformance-ai-backend/wasmplugin-ai-proxy-minimax-pro-api
    # Qwen with qwenEnableCompatible set, bound to the compatible-mode
    # Ingress.
    - config:
        provider:
          apiTokens:
            - fake_token
          modelMapping:
            'gpt-3': qwen-turbo
            'gpt-35-turbo': qwen-plus
            'gpt-4-*': qwen-max
            '*': qwen-turbo
          type: qwen
          qwenEnableCompatible: true
      ingress:
        - higress-conformance-ai-backend/wasmplugin-ai-proxy-qwen-compatible-mode
    # Qwen without qwenEnableCompatible, bound to the plain qwen Ingress.
    - config:
        provider:
          apiTokens:
            - fake_token
          modelMapping:
            'gpt-3': qwen-turbo
            'gpt-35-turbo': qwen-plus
            'gpt-4-*': qwen-max
            '*': qwen-turbo
          type: qwen
      ingress:
        - higress-conformance-ai-backend/wasmplugin-ai-proxy-qwen
  url: oci://higress-registry.cn-hangzhou.cr.aliyuncs.com/plugins/ai-proxy:1.0.0