# File: higress/test/e2e/conformance/tests/go-wasm-ai-cache.yaml
# (104 lines, 2.9 KiB, YAML)

# Copyright (c) 2022 Alibaba Group Holding Ltd.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# Ingress for host "dashscope.aliyuncs.com": every path (Prefix "/") is routed
# to the infra-backend-v1 service on port 8080. The WasmPlugin match rules in
# this file refer to it as
# higress-conformance-infra/wasmplugin-ai-cache-openai.
apiVersion: networking.k8s.io/v1
kind: Ingress
metadata:
  # No annotations are set; written as an explicit empty map instead of a
  # bare key.
  annotations: {}
  name: wasmplugin-ai-cache-openai
  namespace: higress-conformance-infra
spec:
  ingressClassName: higress
  rules:
    - host: "dashscope.aliyuncs.com"
      http:
        paths:
          - pathType: Prefix
            path: "/"
            backend:
              service:
                name: infra-backend-v1
                port:
                  number: 8080
---
# Ingress for host "qwen.ai.com": every path (Prefix "/") is routed to the
# infra-backend-v1 service on port 8080. The WasmPlugin match rules in this
# file refer to it as higress-conformance-infra/wasmplugin-ai-cache-qwen.
apiVersion: networking.k8s.io/v1
kind: Ingress
metadata:
  # No annotations are set; written as an explicit empty map instead of a
  # bare key.
  annotations: {}
  name: wasmplugin-ai-cache-qwen
  namespace: higress-conformance-infra
spec:
  ingressClassName: higress
  rules:
    - host: "qwen.ai.com"
      http:
        paths:
          - pathType: Prefix
            path: "/"
            backend:
              service:
                name: infra-backend-v1
                port:
                  number: 8080
---
# WasmPlugin "ai-cache": applies the ai-cache plugin configuration below to
# the two conformance Ingresses listed under `ingress`.
# NOTE(review): the "{{secret.*}}" values are template placeholders and must be
# substituted with real values before this manifest is applied — confirm which
# tool performs the substitution.
apiVersion: extensions.higress.io/v1alpha1
kind: WasmPlugin
metadata:
  name: ai-cache
  namespace: higress-system
spec:
  # NOTE(review): ai-cache uses priority 400 while ai-proxy in this file uses
  # 201 — presumably so ai-cache runs first; confirm against the Higress
  # priority semantics.
  priority: 400
  matchRules:
    - config:
        embedding:
          type: "dashscope"
          serviceName: "qwen"
          apiKey: "{{secret.qwenApiKey}}"
          # NOTE(review): unit not stated here — presumably milliseconds;
          # confirm.
          timeout: 12000
        vector:
          type: "dashvector"
          serviceName: "dashvector"
          collectionID: "{{secret.collectionID}}"
          serviceDomain: "{{secret.serviceDomain}}"
          apiKey: "{{secret.apiKey}}"
          timeout: 12000
        # The cache section carries no settings; kept as an explicit null
        # (same parsed value as the bare key).
        # NOTE(review): confirm the plugin accepts a null cache section.
        cache: null
      # Ingresses (namespace/name) this rule's config applies to.
      ingress:
        - higress-conformance-infra/wasmplugin-ai-cache-openai
        - higress-conformance-infra/wasmplugin-ai-cache-qwen
  # Alternative plugin source, left disabled:
  # url: file:///opt/plugins/wasm-go/extensions/ai-cache/plugin.wasm
  url: oci://registry.cn-shanghai.aliyuncs.com/suchunsv/higress_ai:1.18
---
# WasmPlugin "ai-proxy": applies a "qwen" provider configuration to the same
# two conformance Ingresses that the ai-cache plugin targets.
# NOTE(review): "{{secret.qwenApiKey}}" is a template placeholder and must be
# substituted with a real token before this manifest is applied.
apiVersion: extensions.higress.io/v1alpha1
kind: WasmPlugin
metadata:
  name: ai-proxy
  namespace: higress-system
spec:
  priority: 201
  matchRules:
    - config:
        provider:
          type: "qwen"
          qwenEnableCompatible: true
          apiTokens:
            - "{{secret.qwenApiKey}}"
          # NOTE(review): unit not stated here — presumably milliseconds;
          # confirm.
          timeout: 1200000
          # Wildcard entry: any requested model name maps to "qwen-long".
          # The "*" key must stay quoted; unquoted it would be read as a YAML
          # alias.
          modelMapping:
            "*": "qwen-long"
      # Ingresses (namespace/name) this rule's config applies to.
      ingress:
        - higress-conformance-infra/wasmplugin-ai-cache-openai
        - higress-conformance-infra/wasmplugin-ai-cache-qwen
  url: oci://higress-registry.cn-hangzhou.cr.aliyuncs.com/plugins/ai-proxy:1.0.0