|
| 1 | +package client |
| 2 | + |
import (
	"context"
	"strconv"
	"testing"
)
| 7 | + |
| 8 | +// ---------- buildRequestBase ---------- |
| 9 | + |
| 10 | +func BenchmarkBuildRequestBase_SimpleMessages(b *testing.B) { |
| 11 | + messages := []EyrieMessage{ |
| 12 | + {Role: "system", Content: "You are helpful."}, |
| 13 | + {Role: "user", Content: "Hello"}, |
| 14 | + {Role: "assistant", Content: "Hi there!"}, |
| 15 | + {Role: "user", Content: "How are you?"}, |
| 16 | + } |
| 17 | + opts := ChatOptions{ |
| 18 | + Model: "gpt-4", |
| 19 | + Temperature: floatPtr(0.7), |
| 20 | + MaxTokens: 4096, |
| 21 | + } |
| 22 | + b.ReportAllocs() |
| 23 | + b.ResetTimer() |
| 24 | + for i := 0; i < b.N; i++ { |
| 25 | + _ = buildRequestBase(messages, opts, false, nil) |
| 26 | + } |
| 27 | +} |
| 28 | + |
| 29 | +func BenchmarkBuildRequestBase_WithToolUse(b *testing.B) { |
| 30 | + messages := []EyrieMessage{ |
| 31 | + {Role: "system", Content: "You are helpful."}, |
| 32 | + {Role: "user", Content: "Search for files"}, |
| 33 | + {Role: "assistant", ToolUse: []ToolCall{ |
| 34 | + {ID: "tc-1", Name: "search", Arguments: map[string]interface{}{"query": "main.go"}}, |
| 35 | + {ID: "tc-2", Name: "read", Arguments: map[string]interface{}{"path": "main.go"}}, |
| 36 | + }}, |
| 37 | + {Role: "user", ToolResult: &ToolResult{ToolUseID: "tc-1", Content: "Found 1 file"}}, |
| 38 | + {Role: "user", ToolResult: &ToolResult{ToolUseID: "tc-2", Content: "package main\nfunc main() {}"}}, |
| 39 | + } |
| 40 | + opts := ChatOptions{ |
| 41 | + Model: "gpt-4", |
| 42 | + Tools: []EyrieTool{ |
| 43 | + {Name: "search", Description: "Search for files", Parameters: map[string]interface{}{"query": map[string]string{"type": "string"}}}, |
| 44 | + {Name: "read", Description: "Read a file", Parameters: map[string]interface{}{"path": map[string]string{"type": "string"}}}, |
| 45 | + }, |
| 46 | + MaxTokens: 4096, |
| 47 | + } |
| 48 | + b.ReportAllocs() |
| 49 | + b.ResetTimer() |
| 50 | + for i := 0; i < b.N; i++ { |
| 51 | + _ = buildRequestBase(messages, opts, false, nil) |
| 52 | + } |
| 53 | +} |
| 54 | + |
| 55 | +func BenchmarkBuildRequestBase_WithImages(b *testing.B) { |
| 56 | + messages := []EyrieMessage{ |
| 57 | + {Role: "user", Content: "What's in this image?", Images: []string{"data:image/png;base64,iVBORw0KGgo="}}, |
| 58 | + } |
| 59 | + opts := ChatOptions{Model: "gpt-4-vision", MaxTokens: 4096} |
| 60 | + b.ReportAllocs() |
| 61 | + b.ResetTimer() |
| 62 | + for i := 0; i < b.N; i++ { |
| 63 | + _ = buildRequestBase(messages, opts, false, nil) |
| 64 | + } |
| 65 | +} |
| 66 | + |
| 67 | +func BenchmarkBuildRequestBase_Streaming(b *testing.B) { |
| 68 | + messages := []EyrieMessage{ |
| 69 | + {Role: "user", Content: "Write a long essay"}, |
| 70 | + } |
| 71 | + opts := ChatOptions{Model: "gpt-4", MaxTokens: 4096} |
| 72 | + b.ReportAllocs() |
| 73 | + b.ResetTimer() |
| 74 | + for i := 0; i < b.N; i++ { |
| 75 | + _ = buildRequestBase(messages, opts, true, nil) |
| 76 | + } |
| 77 | +} |
| 78 | + |
| 79 | +// ---------- buildCacheKey ---------- |
| 80 | + |
| 81 | +func BenchmarkBuildCacheKey_Short(b *testing.B) { |
| 82 | + messages := []EyrieMessage{ |
| 83 | + {Role: "user", Content: "Hello"}, |
| 84 | + } |
| 85 | + opts := ChatOptions{Model: "gpt-4"} |
| 86 | + b.ReportAllocs() |
| 87 | + b.ResetTimer() |
| 88 | + for i := 0; i < b.N; i++ { |
| 89 | + _ = buildCacheKey(messages, opts) |
| 90 | + } |
| 91 | +} |
| 92 | + |
| 93 | +func BenchmarkBuildCacheKey_Long(b *testing.B) { |
| 94 | + longContent := make([]byte, 4000) |
| 95 | + for i := range longContent { |
| 96 | + longContent[i] = 'a' |
| 97 | + } |
| 98 | + messages := []EyrieMessage{ |
| 99 | + {Role: "system", Content: string(longContent)}, |
| 100 | + {Role: "user", Content: "Hello"}, |
| 101 | + {Role: "assistant", Content: string(longContent)}, |
| 102 | + {Role: "user", Content: "Continue"}, |
| 103 | + } |
| 104 | + opts := ChatOptions{Model: "gpt-4", System: "You are helpful"} |
| 105 | + b.ReportAllocs() |
| 106 | + b.ResetTimer() |
| 107 | + for i := 0; i < b.N; i++ { |
| 108 | + _ = buildCacheKey(messages, opts) |
| 109 | + } |
| 110 | +} |
| 111 | + |
| 112 | +func BenchmarkBuildCacheKey_WithToolCalls(b *testing.B) { |
| 113 | + messages := []EyrieMessage{ |
| 114 | + {Role: "assistant", ToolUse: []ToolCall{ |
| 115 | + {ID: "tc-1", Name: "search", Arguments: map[string]interface{}{"query": "test"}}, |
| 116 | + }}, |
| 117 | + {Role: "user", ToolResult: &ToolResult{ToolUseID: "tc-1", Content: "result"}}, |
| 118 | + } |
| 119 | + opts := ChatOptions{Model: "gpt-4"} |
| 120 | + b.ReportAllocs() |
| 121 | + b.ResetTimer() |
| 122 | + for i := 0; i < b.N; i++ { |
| 123 | + _ = buildCacheKey(messages, opts) |
| 124 | + } |
| 125 | +} |
| 126 | + |
| 127 | +// ---------- CachedProvider ---------- |
| 128 | + |
| 129 | +func BenchmarkCachedProvider_CacheHit(b *testing.B) { |
| 130 | + mock := NewMockProvider(MockModeFixed) |
| 131 | + mock.Response = "cached response" |
| 132 | + cp := NewCachedProvider(mock, DefaultCacheConfig()) |
| 133 | + messages := []EyrieMessage{{Role: "user", Content: "Hello"}} |
| 134 | + opts := ChatOptions{Model: "gpt-4"} |
| 135 | + |
| 136 | + // Prime the cache |
| 137 | + _, _ = cp.Chat(context.TODO(), messages, opts) |
| 138 | + |
| 139 | + b.ReportAllocs() |
| 140 | + b.ResetTimer() |
| 141 | + for i := 0; i < b.N; i++ { |
| 142 | + _, _ = cp.Chat(context.TODO(), messages, opts) |
| 143 | + } |
| 144 | +} |
| 145 | + |
| 146 | +func BenchmarkCachedProvider_CacheMiss(b *testing.B) { |
| 147 | + mock := NewMockProvider(MockModeFixed) |
| 148 | + mock.Response = "response" |
| 149 | + cp := NewCachedProvider(mock, DefaultCacheConfig()) |
| 150 | + opts := ChatOptions{Model: "gpt-4"} |
| 151 | + |
| 152 | + b.ReportAllocs() |
| 153 | + b.ResetTimer() |
| 154 | + for i := 0; i < b.N; i++ { |
| 155 | + messages := []EyrieMessage{{Role: "user", Content: "unique query"}} |
| 156 | + _, _ = cp.Chat(context.TODO(), messages, opts) |
| 157 | + } |
| 158 | +} |
| 159 | + |
| 160 | +// ---------- SanitizeMessages ---------- |
| 161 | + |
| 162 | +func BenchmarkSanitizeMessages_Clean(b *testing.B) { |
| 163 | + messages := []EyrieMessage{ |
| 164 | + {Role: "user", Content: "Hello"}, |
| 165 | + {Role: "assistant", Content: "Hi there!"}, |
| 166 | + {Role: "user", Content: "How are you?"}, |
| 167 | + {Role: "assistant", Content: "I'm good."}, |
| 168 | + } |
| 169 | + b.ReportAllocs() |
| 170 | + b.ResetTimer() |
| 171 | + for i := 0; i < b.N; i++ { |
| 172 | + _ = SanitizeMessages(messages) |
| 173 | + } |
| 174 | +} |
| 175 | + |
| 176 | +func BenchmarkSanitizeMessages_WithOrphans(b *testing.B) { |
| 177 | + messages := []EyrieMessage{ |
| 178 | + {Role: "user", Content: "Search for files"}, |
| 179 | + {Role: "assistant", ToolUse: []ToolCall{ |
| 180 | + {ID: "tc-1", Name: "search", Arguments: map[string]interface{}{"query": "test"}}, |
| 181 | + {ID: "tc-2", Name: "read", Arguments: map[string]interface{}{"path": "main.go"}}, |
| 182 | + }}, |
| 183 | + // tc-1 has result, tc-2 is orphaned |
| 184 | + {Role: "user", ToolResult: &ToolResult{ToolUseID: "tc-1", Content: "Found 1 file"}}, |
| 185 | + } |
| 186 | + b.ReportAllocs() |
| 187 | + b.ResetTimer() |
| 188 | + for i := 0; i < b.N; i++ { |
| 189 | + _ = SanitizeMessages(messages) |
| 190 | + } |
| 191 | +} |
| 192 | + |
| 193 | +func BenchmarkSanitizeMessages_Large(b *testing.B) { |
| 194 | + messages := make([]EyrieMessage, 50) |
| 195 | + for i := range messages { |
| 196 | + if i%3 == 0 { |
| 197 | + messages[i] = EyrieMessage{Role: "user", Content: "message"} |
| 198 | + } else { |
| 199 | + messages[i] = EyrieMessage{Role: "assistant", Content: "response"} |
| 200 | + } |
| 201 | + } |
| 202 | + b.ReportAllocs() |
| 203 | + b.ResetTimer() |
| 204 | + for i := 0; i < b.N; i++ { |
| 205 | + _ = SanitizeMessages(messages) |
| 206 | + } |
| 207 | +} |
| 208 | + |
| 209 | +// ---------- MergeConsecutiveRoles ---------- |
| 210 | + |
| 211 | +func BenchmarkMergeConsecutiveRoles_NoMerge(b *testing.B) { |
| 212 | + messages := []EyrieMessage{ |
| 213 | + {Role: "user", Content: "Hello"}, |
| 214 | + {Role: "assistant", Content: "Hi"}, |
| 215 | + {Role: "user", Content: "How are you?"}, |
| 216 | + {Role: "assistant", Content: "Good"}, |
| 217 | + } |
| 218 | + b.ReportAllocs() |
| 219 | + b.ResetTimer() |
| 220 | + for i := 0; i < b.N; i++ { |
| 221 | + _ = MergeConsecutiveRoles(messages) |
| 222 | + } |
| 223 | +} |
| 224 | + |
| 225 | +func BenchmarkMergeConsecutiveRoles_WithMerges(b *testing.B) { |
| 226 | + messages := []EyrieMessage{ |
| 227 | + {Role: "user", Content: "Hello"}, |
| 228 | + {Role: "user", Content: "World"}, |
| 229 | + {Role: "assistant", Content: "Hi"}, |
| 230 | + {Role: "assistant", Content: "There"}, |
| 231 | + {Role: "user", Content: "How are you?"}, |
| 232 | + } |
| 233 | + b.ReportAllocs() |
| 234 | + b.ResetTimer() |
| 235 | + for i := 0; i < b.N; i++ { |
| 236 | + _ = MergeConsecutiveRoles(messages) |
| 237 | + } |
| 238 | +} |
| 239 | + |
| 240 | +func BenchmarkMergeConsecutiveRoles_WithToolUse(b *testing.B) { |
| 241 | + messages := []EyrieMessage{ |
| 242 | + {Role: "assistant", ToolUse: []ToolCall{{ID: "tc-1", Name: "search"}}}, |
| 243 | + {Role: "assistant", Content: "Let me search"}, |
| 244 | + {Role: "user", ToolResult: &ToolResult{ToolUseID: "tc-1", Content: "result"}}, |
| 245 | + } |
| 246 | + b.ReportAllocs() |
| 247 | + b.ResetTimer() |
| 248 | + for i := 0; i < b.N; i++ { |
| 249 | + _ = MergeConsecutiveRoles(messages) |
| 250 | + } |
| 251 | +} |
| 252 | + |
| 253 | +// ---------- MetricsCollector ---------- |
| 254 | + |
| 255 | +func BenchmarkMetricsCollector_Record(b *testing.B) { |
| 256 | + mc := NewMetricsCollector() |
| 257 | + m := CallMetrics{Model: "gpt-4", Provider: "openai", InputTokens: 100, OutputTokens: 50, LatencyMs: 100} |
| 258 | + b.ReportAllocs() |
| 259 | + b.ResetTimer() |
| 260 | + for i := 0; i < b.N; i++ { |
| 261 | + mc.Record(m) |
| 262 | + } |
| 263 | +} |
| 264 | + |
| 265 | +func BenchmarkMetricsCollector_Recent(b *testing.B) { |
| 266 | + mc := NewMetricsCollector() |
| 267 | + m := CallMetrics{Model: "gpt-4", Provider: "openai", InputTokens: 100, OutputTokens: 50, LatencyMs: 100} |
| 268 | + for i := 0; i < 100; i++ { |
| 269 | + mc.Record(m) |
| 270 | + } |
| 271 | + b.ReportAllocs() |
| 272 | + b.ResetTimer() |
| 273 | + for i := 0; i < b.N; i++ { |
| 274 | + _ = mc.Recent(10) |
| 275 | + } |
| 276 | +} |
| 277 | + |
| 278 | +func BenchmarkMetricsCollector_TotalCost(b *testing.B) { |
| 279 | + mc := NewMetricsCollector() |
| 280 | + m := CallMetrics{Model: "gpt-4", Provider: "openai", InputTokens: 1000, OutputTokens: 500, CacheReadTokens: 200, CacheCreationTokens: 100} |
| 281 | + for i := 0; i < 100; i++ { |
| 282 | + mc.Record(m) |
| 283 | + } |
| 284 | + b.ReportAllocs() |
| 285 | + b.ResetTimer() |
| 286 | + for i := 0; i < b.N; i++ { |
| 287 | + _ = mc.TotalCost() |
| 288 | + } |
| 289 | +} |
| 290 | + |
| 291 | +// ---------- helpers ---------- |
| 292 | + |
// floatPtr returns a pointer to a fresh copy of f, for filling optional
// *float64 fields from a literal.
func floatPtr(f float64) *float64 {
	value := f
	return &value
}
0 commit comments