ai-statistics: increase default value_length_limit and emit AILog during streaming usage (#3624)

This commit is contained in:
rinfx
2026-03-23 14:04:02 +08:00
committed by GitHub
parent 23a0299d3b
commit cce53203ce
2 changed files with 331 additions and 26 deletions

View File

@@ -1712,3 +1712,305 @@ func TestTokenDetails(t *testing.T) {
host.CompleteHttp()
})
}
func TestUnmatchedPathsAndContentTypes(t *testing.T) {
test.RunTest(t, func(t *testing.T) {
restrictiveConfig := func() json.RawMessage {
data, _ := json.Marshal(map[string]interface{}{
"enable_path_suffixes": []string{"/allowed_path"},
"enable_content_types": []string{"application/json"},
"attributes": []map[string]interface{}{
{
"key": "test_attr",
"value_source": "response_body",
"value": "data",
"apply_to_log": true,
},
},
"disable_openai_usage": true,
})
return data
}()
t.Run("skip request for unenabled path", func(t *testing.T) {
host, status := test.NewTestHost(restrictiveConfig)
defer host.Reset()
require.Equal(t, types.OnPluginStartStatusOK, status)
action := host.CallOnHttpRequestHeaders([][2]string{
{":authority", "example.com"},
{":path", "/disallowed_path"},
{":method", "POST"},
})
require.Equal(t, types.ActionContinue, action)
host.CompleteHttp()
})
t.Run("skip response for unenabled content type", func(t *testing.T) {
host, status := test.NewTestHost(restrictiveConfig)
defer host.Reset()
require.Equal(t, types.OnPluginStartStatusOK, status)
host.CallOnHttpRequestHeaders([][2]string{
{":authority", "example.com"},
{":path", "/allowed_path"},
{":method", "POST"},
})
action := host.CallOnHttpResponseHeaders([][2]string{
{":status", "200"},
{"content-type", "text/plain"},
})
require.Equal(t, types.ActionContinue, action)
host.CompleteHttp()
})
})
}
func TestSetSpanAttributeAndLoggingEdgeCases(t *testing.T) {
test.RunTest(t, func(t *testing.T) {
configBytes := []byte(`{
"attributes": [
{
"key": "test_attr1",
"value_source": "fixed_value",
"value": "",
"apply_to_span": true
},
{
"key": "test_attr2",
"value_source": "fixed_value",
"value": "long_value_that_exceeds_limit_long_value_that_exceeds_limit_long_value_that_exceeds_limit",
"apply_to_log": true
}
],
"value_length_limit": 20
}`)
t.Run("span attribute edge cases", func(t *testing.T) {
host, status := test.NewTestHost(configBytes)
defer host.Reset()
require.Equal(t, types.OnPluginStartStatusOK, status)
// Setting fixed value attribute to empty should just print a debug log and skip setting span
action := host.CallOnHttpRequestHeaders([][2]string{
{":authority", "example.com"},
{":path", "/api/chat"},
})
require.Equal(t, types.ActionContinue, action)
host.CompleteHttp()
})
})
}
func TestGetRouteAndClusterNameEdgeCases(t *testing.T) {
test.RunTest(t, func(t *testing.T) {
t.Run("properties absence", func(t *testing.T) {
host, status := test.NewTestHost([]byte(`{}`))
defer host.Reset()
require.Equal(t, types.OnPluginStartStatusOK, status)
// Host doesn't have route_name implicitly by default without SetRouteName, but getRouteName handles err
host.CallOnHttpRequestHeaders([][2]string{
{":authority", "example.com"},
{":path", "/api/chat"},
})
host.CompleteHttp()
})
t.Run("api name with @", func(t *testing.T) {
host, status := test.NewTestHost([]byte(`{}`))
defer host.Reset()
require.Equal(t, types.OnPluginStartStatusOK, status)
host.SetRouteName("api@v1@service@extra") // @ has special handling in getAPIName
host.CallOnHttpRequestHeaders([][2]string{
{":authority", "example.com"},
{":path", "/api/chat"},
})
host.CompleteHttp()
})
})
}
func TestExtractClaudeStreamingToolCallsMissingInput(t *testing.T) {
t.Run("claude missing partial_json", func(t *testing.T) {
chunks := [][]byte{
[]byte(`data: {"type":"content_block_start","index":0,"content_block":{"type":"tool_use","id":"tool_123","name":"get_weather","input":{}}}`),
[]byte(`data: {"type":"content_block_delta","index":0,"delta":{"type":"input_json_delta"}}`),
[]byte(`data: {"type":"content_block_stop","index":0}`),
}
var buffer *StreamingToolCallsBuffer
for _, chunk := range chunks {
buffer = extractClaudeStreamingToolCalls(chunk, buffer)
}
toolCalls := getToolCallsFromBuffer(buffer)
require.Len(t, toolCalls, 1)
require.Equal(t, "tool_123", toolCalls[0].ID)
require.Equal(t, "tool_use", toolCalls[0].Type)
require.Equal(t, "get_weather", toolCalls[0].Function.Name)
// partial_json absence means arguments might be empty
})
}
func TestWriteMetricEdgeCases(t *testing.T) {
test.RunTest(t, func(t *testing.T) {
t.Run("disable_openai_usage true", func(t *testing.T) {
configBytes := []byte(`{
"disable_openai_usage": true
}`)
host, status := test.NewTestHost(configBytes)
defer host.Reset()
require.Equal(t, types.OnPluginStartStatusOK, status)
host.SetRouteName("api-v1")
host.SetClusterName("cluster-1")
host.CallOnHttpRequestHeaders([][2]string{
{":authority", "example.com"},
{":path", "/api/chat"},
})
host.CallOnHttpResponseHeaders([][2]string{
{":status", "200"},
{"content-type", "application/json"},
})
responseBody := []byte(`{
"usage": {"prompt_tokens": 5, "completion_tokens": 8, "total_tokens": 13},
"model": "gpt-3.5-turbo"
}`)
host.CallOnHttpResponseBody(responseBody)
host.CompleteHttp()
})
})
}
func TestIsPathEnabled(t *testing.T) {
require.True(t, isPathEnabled("/v1/chat/completions", nil))
require.True(t, isPathEnabled("/v1/chat/completions", []string{}))
require.True(t, isPathEnabled("/v1/chat/completions", []string{"/completions", "/messages"}))
require.True(t, isPathEnabled("/v1/messages", []string{"/completions", "/messages"}))
require.False(t, isPathEnabled("/v1/embeddings", []string{"/completions", "/messages"}))
// test query params
require.True(t, isPathEnabled("/v1/chat/completions?stream=true", []string{"/completions"}))
require.False(t, isPathEnabled("/v1/embeddings?stream=true", []string{"/completions"}))
}
func TestIsContentTypeEnabled(t *testing.T) {
require.True(t, isContentTypeEnabled("application/json", nil))
require.True(t, isContentTypeEnabled("application/json", []string{}))
require.True(t, isContentTypeEnabled("application/json", []string{"application/json", "text/event-stream"}))
require.True(t, isContentTypeEnabled("text/event-stream; charset=utf-8", []string{"application/json", "text/event-stream"}))
require.False(t, isContentTypeEnabled("text/html", []string{"application/json", "text/event-stream"}))
}
func TestConvertToUInt(t *testing.T) {
val, ok := convertToUInt(int32(10))
require.True(t, ok)
require.Equal(t, uint64(10), val)
val, ok = convertToUInt(int64(10))
require.True(t, ok)
require.Equal(t, uint64(10), val)
val, ok = convertToUInt(uint32(10))
require.True(t, ok)
require.Equal(t, uint64(10), val)
val, ok = convertToUInt(uint64(10))
require.True(t, ok)
require.Equal(t, uint64(10), val)
val, ok = convertToUInt(float32(10.0))
require.True(t, ok)
require.Equal(t, uint64(10), val)
val, ok = convertToUInt(float64(10.0))
require.True(t, ok)
require.Equal(t, uint64(10), val)
_, ok = convertToUInt("10")
require.False(t, ok)
}
func TestExtractClaudeStreamingToolCalls(t *testing.T) {
t.Run("claude tool use assembly", func(t *testing.T) {
chunks := [][]byte{
[]byte(`data: {"type":"content_block_start","index":0,"content_block":{"type":"tool_use","id":"tool_123","name":"get_weather"}}`),
[]byte(`data: {"type":"content_block_delta","index":0,"delta":{"type":"input_json_delta","partial_json":"{\"loc"}}}`),
[]byte(`data: {"type":"content_block_delta","index":0,"delta":{"type":"input_json_delta","partial_json":"ation\":\"Bei"}}}`),
[]byte(`data: {"type":"content_block_delta","index":0,"delta":{"type":"input_json_delta","partial_json":"jing\"}"}}}`),
[]byte(`data: {"type":"content_block_stop","index":0}`),
}
var buffer *StreamingToolCallsBuffer
for _, chunk := range chunks {
buffer = extractClaudeStreamingToolCalls(chunk, buffer)
}
toolCalls := getToolCallsFromBuffer(buffer)
require.Len(t, toolCalls, 1)
require.Equal(t, "tool_123", toolCalls[0].ID)
require.Equal(t, "tool_use", toolCalls[0].Type)
require.Equal(t, "get_weather", toolCalls[0].Function.Name)
require.Equal(t, `{"location":"Beijing"}`, toolCalls[0].Function.Arguments)
})
t.Run("claude empty chunks", func(t *testing.T) {
chunks := [][]byte{
[]byte(`data: {"type":"ping"}`),
[]byte(`data: {"type":"content_block_delta","index":0,"delta":{"type":"text_delta","text":"Hello"}}`),
}
var buffer *StreamingToolCallsBuffer
for _, chunk := range chunks {
buffer = extractClaudeStreamingToolCalls(chunk, buffer)
}
toolCalls := getToolCallsFromBuffer(buffer)
require.Len(t, toolCalls, 0)
})
t.Run("claude tool use with initial input", func(t *testing.T) {
chunks := [][]byte{
[]byte(`data: {"type":"content_block_start","index":1,"content_block":{"type":"tool_use","id":"tool_456","name":"get_time","input":{"timezone":"UTC+8"}}}`),
[]byte(`data: {"type":"content_block_stop","index":1}`),
}
var buffer *StreamingToolCallsBuffer
for _, chunk := range chunks {
buffer = extractClaudeStreamingToolCalls(chunk, buffer)
}
toolCalls := getToolCallsFromBuffer(buffer)
require.Len(t, toolCalls, 1)
require.Equal(t, "tool_456", toolCalls[0].ID)
require.Equal(t, "tool_use", toolCalls[0].Type)
require.Equal(t, "get_time", toolCalls[0].Function.Name)
require.Equal(t, `{"timezone":"UTC+8"}`, toolCalls[0].Function.Arguments)
})
}
func TestConfigWithDefaultAttributes(t *testing.T) {
test.RunTest(t, func(t *testing.T) {
t.Run("use default attributes config", func(t *testing.T) {
defaultConfig := []byte(`{
"use_default_attributes": true
}`)
host, status := test.NewTestHost(defaultConfig)
defer host.Reset()
require.Equal(t, types.OnPluginStartStatusOK, status)
})
t.Run("use default response attributes config", func(t *testing.T) {
defaultRespConfig := []byte(`{
"use_default_response_attributes": true
}`)
host, status := test.NewTestHost(defaultRespConfig)
defer host.Reset()
require.Equal(t, types.OnPluginStartStatusOK, status)
})
})
}