67 lines
2.0 KiB
Go
67 lines
2.0 KiB
Go
package runner
|
|
|
|
import (
|
|
"testing"
|
|
|
|
"github.com/easyai/easyai-ai-gateway/apps/api/internal/clients"
|
|
"github.com/easyai/easyai-ai-gateway/apps/api/internal/store"
|
|
)
|
|
|
|
func TestTokenUsageAmountsUsesActualUsageForTPM(t *testing.T) {
|
|
got := tokenUsageAmounts(clients.Usage{InputTokens: 12, OutputTokens: 8, TotalTokens: 21})
|
|
|
|
if got["tpm_input"] != 12 {
|
|
t.Fatalf("expected input token amount 12, got %v", got["tpm_input"])
|
|
}
|
|
if got["tpm_output"] != 8 {
|
|
t.Fatalf("expected output token amount 8, got %v", got["tpm_output"])
|
|
}
|
|
if got["tpm_total"] != 21 {
|
|
t.Fatalf("expected total token amount 21, got %v", got["tpm_total"])
|
|
}
|
|
}
|
|
|
|
func TestTokenUsageAmountsFallsBackToInputOutputTotal(t *testing.T) {
|
|
got := tokenUsageAmounts(clients.Usage{InputTokens: 3, OutputTokens: 5})
|
|
|
|
if got["tpm_total"] != 8 {
|
|
t.Fatalf("expected total token fallback 8, got %v", got["tpm_total"])
|
|
}
|
|
}
|
|
|
|
func TestEffectiveRateLimitPolicyTreatsEmptyRuntimePolicyAsUnlimited(t *testing.T) {
|
|
policy := effectiveRateLimitPolicy(store.RuntimeModelCandidate{
|
|
PlatformRateLimitPolicy: map[string]any{"rules": []any{
|
|
map[string]any{"metric": "rpm", "limit": 500},
|
|
}},
|
|
RuntimePolicySetID: "runtime-policy-1",
|
|
RuntimeRateLimitPolicy: map[string]any{"rules": []any{}},
|
|
})
|
|
|
|
if hasRules(policy) {
|
|
t.Fatalf("expected empty runtime policy to clear inherited limits, got %+v", policy)
|
|
}
|
|
}
|
|
|
|
func TestReservationsFromPolicySkipsNonPositiveLimits(t *testing.T) {
|
|
reservations := reservationsFromPolicy(
|
|
"platform_model",
|
|
"model-1",
|
|
"Model 1",
|
|
nil,
|
|
map[string]any{"rules": []any{
|
|
map[string]any{"metric": "rpm", "limit": -1},
|
|
map[string]any{"metric": "tpm_total", "limit": 0},
|
|
map[string]any{"metric": "concurrent", "limit": 2},
|
|
}},
|
|
map[string]any{"prompt": "hello"},
|
|
)
|
|
|
|
if len(reservations) != 1 {
|
|
t.Fatalf("expected only the positive concurrent rule to reserve, got %+v", reservations)
|
|
}
|
|
if reservations[0].Metric != "concurrent" || reservations[0].Limit != 2 {
|
|
t.Fatalf("expected concurrent reservation with limit 2, got %+v", reservations[0])
|
|
}
|
|
}
|