feat: implement tiered billing expression evaluation and related functionality

- Added support for tiered billing expressions in the billing system. - Introduced new types and functions for handling billing expressions, including caching and execution. - Updated existing billing logic to accommodate tiered billing scenarios. - Enhanced request handling to support incoming billing expression requests. - Added tests for tiered billing functionality to ensure correctness.
2026-03-16 16:00:22 +08:00
parent a4fd2246ba
commit 91ed4e196a
34 changed files with 4797 additions and 26 deletions
@@ -0,0 +1,933 @@
+package billingexpr_test
+
+import (
+	"math"
+	"math/rand"
+	"testing"
+
+	"github.com/QuantumNous/new-api/pkg/billingexpr"
+)
+
+// ---------------------------------------------------------------------------
+// Claude-style: fixed tiers, input > 200K changes both input & output price
+// ---------------------------------------------------------------------------
+
+const claudeExpr = `p <= 200000 ? tier("standard", p * 1.5 + c * 7.5) : tier("long_context", p * 3.0 + c * 11.25)`
+
+func TestClaude_StandardTier(t *testing.T) {
+	cost, trace, err := billingexpr.RunExpr(claudeExpr, billingexpr.TokenParams{P: 100000, C: 5000})
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := 100000*1.5 + 5000*7.5
+	if math.Abs(cost-want) > 1e-6 {
+		t.Errorf("cost = %f, want %f", cost, want)
+	}
+	if trace.MatchedTier != "standard" {
+		t.Errorf("tier = %q, want %q", trace.MatchedTier, "standard")
+	}
+}
+
+func TestClaude_LongContextTier(t *testing.T) {
+	cost, trace, err := billingexpr.RunExpr(claudeExpr, billingexpr.TokenParams{P: 300000, C: 10000})
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := 300000*3.0 + 10000*11.25
+	if math.Abs(cost-want) > 1e-6 {
+		t.Errorf("cost = %f, want %f", cost, want)
+	}
+	if trace.MatchedTier != "long_context" {
+		t.Errorf("tier = %q, want %q", trace.MatchedTier, "long_context")
+	}
+}
+
+func TestClaude_BoundaryExact(t *testing.T) {
+	cost, trace, err := billingexpr.RunExpr(claudeExpr, billingexpr.TokenParams{P: 200000, C: 1000})
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := 200000*1.5 + 1000*7.5
+	if math.Abs(cost-want) > 1e-6 {
+		t.Errorf("cost = %f, want %f", cost, want)
+	}
+	if trace.MatchedTier != "standard" {
+		t.Errorf("tier = %q, want %q", trace.MatchedTier, "standard")
+	}
+}
+
+// ---------------------------------------------------------------------------
+// GLM-style: multi-condition tiers with both input and output dimensions
+// ---------------------------------------------------------------------------
+
+const glmExpr = `
+(
+	p < 32000 && c < 200 ? tier("tier1_short", (p)*2 + c*8) :
+	p < 32000 && c >= 200 ? tier("tier2_long_output", (p)*3 + c*14) :
+	tier("tier3_long_input", (p)*4 + c*16)
+) / 1000000
+`
+
+func TestGLM_Tier1(t *testing.T) {
+	cost, trace, err := billingexpr.RunExpr(glmExpr, billingexpr.TokenParams{P: 15000, C: 100})
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := (15000.0*2 + 100.0*8) / 1000000
+	if math.Abs(cost-want) > 1e-10 {
+		t.Errorf("cost = %f, want %f", cost, want)
+	}
+	if trace.MatchedTier != "tier1_short" {
+		t.Errorf("tier = %q, want %q", trace.MatchedTier, "tier1_short")
+	}
+}
+
+func TestGLM_Tier2(t *testing.T) {
+	cost, trace, err := billingexpr.RunExpr(glmExpr, billingexpr.TokenParams{P: 15000, C: 500})
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := (15000.0*3 + 500.0*14) / 1000000
+	if math.Abs(cost-want) > 1e-10 {
+		t.Errorf("cost = %f, want %f", cost, want)
+	}
+	if trace.MatchedTier != "tier2_long_output" {
+		t.Errorf("tier = %q, want %q", trace.MatchedTier, "tier2_long_output")
+	}
+}
+
+func TestGLM_Tier3(t *testing.T) {
+	cost, trace, err := billingexpr.RunExpr(glmExpr, billingexpr.TokenParams{P: 50000, C: 100})
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := (50000.0*4 + 100.0*16) / 1000000
+	if math.Abs(cost-want) > 1e-10 {
+		t.Errorf("cost = %f, want %f", cost, want)
+	}
+	if trace.MatchedTier != "tier3_long_input" {
+		t.Errorf("tier = %q, want %q", trace.MatchedTier, "tier3_long_input")
+	}
+}
+
+// ---------------------------------------------------------------------------
+// Simple flat-rate (no tier() call)
+// ---------------------------------------------------------------------------
+
+func TestSimpleExpr_NoTier(t *testing.T) {
+	cost, trace, err := billingexpr.RunExpr("p * 0.5 + c * 1.0", billingexpr.TokenParams{P: 1000, C: 500})
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := 1000*0.5 + 500*1.0
+	if math.Abs(cost-want) > 1e-6 {
+		t.Errorf("cost = %f, want %f", cost, want)
+	}
+	if trace.MatchedTier != "" {
+		t.Errorf("tier should be empty, got %q", trace.MatchedTier)
+	}
+}
+
+// ---------------------------------------------------------------------------
+// Math helper functions
+// ---------------------------------------------------------------------------
+
+func TestMathHelpers(t *testing.T) {
+	cost, _, err := billingexpr.RunExpr("max(p, c) * 0.5 + min(p, c) * 0.1", billingexpr.TokenParams{P: 300, C: 500})
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := 500*0.5 + 300*0.1
+	if math.Abs(cost-want) > 1e-6 {
+		t.Errorf("cost = %f, want %f", cost, want)
+	}
+}
+
+func TestRequestProbeHelpers(t *testing.T) {
+	cost, _, err := billingexpr.RunExprWithRequest(
+		`prompt_tokens * 0.5 + completion_tokens * 1.0 * (param("service_tier") == "fast" ? 2 : 1)`,
+		billingexpr.TokenParams{P: 1000, C: 500},
+		billingexpr.RequestInput{
+			Body: []byte(`{"service_tier":"fast"}`),
+		},
+	)
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := 1000*0.5 + 500*1.0*2
+	if math.Abs(cost-want) > 1e-6 {
+		t.Errorf("cost = %f, want %f", cost, want)
+	}
+}
+
+func TestHeaderProbeHelper(t *testing.T) {
+	cost, _, err := billingexpr.RunExprWithRequest(
+		`p * 0.5 + c * 1.0 * (has(header("anthropic-beta"), "fast-mode") ? 2 : 1)`,
+		billingexpr.TokenParams{P: 1000, C: 500},
+		billingexpr.RequestInput{
+			Headers: map[string]string{
+				"Anthropic-Beta": "fast-mode-2026-02-01",
+			},
+		},
+	)
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := 1000*0.5 + 500*1.0*2
+	if math.Abs(cost-want) > 1e-6 {
+		t.Errorf("cost = %f, want %f", cost, want)
+	}
+}
+
+func TestParamProbeNestedBool(t *testing.T) {
+	cost, _, err := billingexpr.RunExprWithRequest(
+		`p * (param("stream_options.fast_mode") == true ? 1.5 : 1.0)`,
+		billingexpr.TokenParams{P: 100},
+		billingexpr.RequestInput{
+			Body: []byte(`{"stream_options":{"fast_mode":true}}`),
+		},
+	)
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := 150.0
+	if math.Abs(cost-want) > 1e-6 {
+		t.Errorf("cost = %f, want %f", cost, want)
+	}
+}
+
+func TestParamProbeArrayLength(t *testing.T) {
+	cost, _, err := billingexpr.RunExprWithRequest(
+		`p * (param("messages.#") > 20 ? 1.2 : 1.0)`,
+		billingexpr.TokenParams{P: 100},
+		billingexpr.RequestInput{
+			Body: []byte(`{"messages":[1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21]}`),
+		},
+	)
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := 120.0
+	if math.Abs(cost-want) > 1e-6 {
+		t.Errorf("cost = %f, want %f", cost, want)
+	}
+}
+
+func TestRequestProbeMissingFieldReturnsNil(t *testing.T) {
+	cost, _, err := billingexpr.RunExprWithRequest(
+		`param("missing.value") == nil ? 2 : 1`,
+		billingexpr.TokenParams{},
+		billingexpr.RequestInput{
+			Body: []byte(`{"service_tier":"standard"}`),
+		},
+	)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if cost != 2 {
+		t.Errorf("cost = %f, want 2", cost)
+	}
+}
+
+func TestRequestProbeMultipleRulesMultiply(t *testing.T) {
+	cost, _, err := billingexpr.RunExprWithRequest(
+		`(param("service_tier") == "fast" ? 2 : 1) * (has(header("anthropic-beta"), "fast-mode-2026-02-01") ? 2.5 : 1)`,
+		billingexpr.TokenParams{},
+		billingexpr.RequestInput{
+			Headers: map[string]string{
+				"Anthropic-Beta": "fast-mode-2026-02-01",
+			},
+			Body: []byte(`{"service_tier":"fast"}`),
+		},
+	)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if math.Abs(cost-5) > 1e-6 {
+		t.Errorf("cost = %f, want 5", cost)
+	}
+}
+
+func TestCeilFloor(t *testing.T) {
+	cost, _, err := billingexpr.RunExpr("ceil(p / 1000) * 0.5", billingexpr.TokenParams{P: 1500})
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := math.Ceil(1500.0/1000) * 0.5
+	if math.Abs(cost-want) > 1e-6 {
+		t.Errorf("cost = %f, want %f", cost, want)
+	}
+}
+
+// ---------------------------------------------------------------------------
+// Zero tokens
+// ---------------------------------------------------------------------------
+
+func TestZeroTokens(t *testing.T) {
+	cost, _, err := billingexpr.RunExpr(claudeExpr, billingexpr.TokenParams{})
+	if err != nil {
+		t.Fatal(err)
+	}
+	if cost != 0 {
+		t.Errorf("cost should be 0 for zero tokens, got %f", cost)
+	}
+}
+
+// ---------------------------------------------------------------------------
+// Rounding
+// ---------------------------------------------------------------------------
+
+func TestQuotaRound(t *testing.T) {
+	tests := []struct {
+		in   float64
+		want int
+	}{
+		{0, 0},
+		{0.4, 0},
+		{0.5, 1},
+		{0.6, 1},
+		{1.5, 2},
+		{-0.5, -1},
+		{-0.6, -1},
+		{999.4999, 999},
+		{999.5, 1000},
+		{1e9 + 0.5, 1e9 + 1},
+	}
+	for _, tt := range tests {
+		got := billingexpr.QuotaRound(tt.in)
+		if got != tt.want {
+			t.Errorf("QuotaRound(%f) = %d, want %d", tt.in, got, tt.want)
+		}
+	}
+}
+
+// ---------------------------------------------------------------------------
+// Settlement
+// ---------------------------------------------------------------------------
+
+func TestComputeTieredQuota_Basic(t *testing.T) {
+	snap := &billingexpr.BillingSnapshot{
+		BillingMode:               "tiered_expr",
+		ExprString:                claudeExpr,
+		ExprHash:                  billingexpr.ExprHashString(claudeExpr),
+		GroupRatio:                1.0,
+		EstimatedPromptTokens:     100000,
+		EstimatedCompletionTokens: 5000,
+		EstimatedQuotaBeforeGroup: 100000*1.5 + 5000*7.5,
+		EstimatedQuotaAfterGroup:  billingexpr.QuotaRound(100000*1.5 + 5000*7.5),
+		EstimatedTier:             "standard",
+	}
+
+	result, err := billingexpr.ComputeTieredQuota(snap, billingexpr.TokenParams{P: 300000, C: 10000})
+	if err != nil {
+		t.Fatal(err)
+	}
+
+	wantBefore := 300000*3.0 + 10000*11.25
+	if math.Abs(result.ActualQuotaBeforeGroup-wantBefore) > 1e-6 {
+		t.Errorf("before group: got %f, want %f", result.ActualQuotaBeforeGroup, wantBefore)
+	}
+	if result.MatchedTier != "long_context" {
+		t.Errorf("tier = %q, want %q", result.MatchedTier, "long_context")
+	}
+	if !result.CrossedTier {
+		t.Error("expected crossed_tier=true (estimated standard, actual long_context)")
+	}
+}
+
+func TestComputeTieredQuota_SameTier(t *testing.T) {
+	snap := &billingexpr.BillingSnapshot{
+		BillingMode:               "tiered_expr",
+		ExprString:                claudeExpr,
+		ExprHash:                  billingexpr.ExprHashString(claudeExpr),
+		GroupRatio:                1.5,
+		EstimatedPromptTokens:     50000,
+		EstimatedCompletionTokens: 1000,
+		EstimatedQuotaBeforeGroup: 50000*1.5 + 1000*7.5,
+		EstimatedQuotaAfterGroup:  billingexpr.QuotaRound((50000*1.5 + 1000*7.5) * 1.5),
+		EstimatedTier:             "standard",
+	}
+
+	result, err := billingexpr.ComputeTieredQuota(snap, billingexpr.TokenParams{P: 80000, C: 2000})
+	if err != nil {
+		t.Fatal(err)
+	}
+
+	wantBefore := 80000*1.5 + 2000*7.5
+	wantAfter := billingexpr.QuotaRound(wantBefore * 1.5)
+	if result.ActualQuotaAfterGroup != wantAfter {
+		t.Errorf("after group: got %d, want %d", result.ActualQuotaAfterGroup, wantAfter)
+	}
+	if result.CrossedTier {
+		t.Error("expected crossed_tier=false (both standard)")
+	}
+}
+
+// ---------------------------------------------------------------------------
+// Compile errors
+// ---------------------------------------------------------------------------
+
+func TestCompileError(t *testing.T) {
+	_, _, err := billingexpr.RunExpr("invalid +-+ syntax", billingexpr.TokenParams{})
+	if err == nil {
+		t.Error("expected compile error")
+	}
+}
+
+// ---------------------------------------------------------------------------
+// Compile Cache
+// ---------------------------------------------------------------------------
+
+func TestCompileCache_SameResult(t *testing.T) {
+	r1, _, err := billingexpr.RunExpr("p * 0.5", billingexpr.TokenParams{P: 100})
+	if err != nil {
+		t.Fatal(err)
+	}
+	r2, _, err := billingexpr.RunExpr("p * 0.5", billingexpr.TokenParams{P: 100})
+	if err != nil {
+		t.Fatal(err)
+	}
+	if r1 != r2 {
+		t.Errorf("cached and uncached results differ: %f != %f", r1, r2)
+	}
+}
+
+func TestInvalidateCache(t *testing.T) {
+	billingexpr.InvalidateCache()
+	r1, _, _ := billingexpr.RunExpr("p * 0.5", billingexpr.TokenParams{P: 100})
+	billingexpr.InvalidateCache()
+	r2, _, _ := billingexpr.RunExpr("p * 0.5", billingexpr.TokenParams{P: 100})
+	if r1 != r2 {
+		t.Errorf("post-invalidate results differ: %f != %f", r1, r2)
+	}
+}
+
+// ---------------------------------------------------------------------------
+// Hash
+// ---------------------------------------------------------------------------
+
+func TestExprHashString_Deterministic(t *testing.T) {
+	h1 := billingexpr.ExprHashString("p * 0.5")
+	h2 := billingexpr.ExprHashString("p * 0.5")
+	if h1 != h2 {
+		t.Error("hash should be deterministic")
+	}
+	h3 := billingexpr.ExprHashString("p * 0.6")
+	if h1 == h3 {
+		t.Error("different expressions should have different hashes")
+	}
+}
+
+// ---------------------------------------------------------------------------
+// Cache variables: present
+// ---------------------------------------------------------------------------
+
+const claudeWithCacheExpr = `p <= 200000 ? tier("standard", p * 1.5 + c * 7.5 + cr * 0.15 + cc * 1.875) : tier("long_context", p * 3.0 + c * 11.25 + cr * 0.3 + cc * 3.75)`
+
+func TestCachePresent_StandardTier(t *testing.T) {
+	params := billingexpr.TokenParams{P: 100000, C: 5000, CR: 50000, CC: 10000}
+	cost, trace, err := billingexpr.RunExpr(claudeWithCacheExpr, params)
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := 100000*1.5 + 5000*7.5 + 50000*0.15 + 10000*1.875
+	if math.Abs(cost-want) > 1e-6 {
+		t.Errorf("cost = %f, want %f", cost, want)
+	}
+	if trace.MatchedTier != "standard" {
+		t.Errorf("tier = %q, want %q", trace.MatchedTier, "standard")
+	}
+}
+
+func TestCachePresent_LongContextTier(t *testing.T) {
+	params := billingexpr.TokenParams{P: 300000, C: 10000, CR: 100000, CC: 20000}
+	cost, trace, err := billingexpr.RunExpr(claudeWithCacheExpr, params)
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := 300000*3.0 + 10000*11.25 + 100000*0.3 + 20000*3.75
+	if math.Abs(cost-want) > 1e-6 {
+		t.Errorf("cost = %f, want %f", cost, want)
+	}
+	if trace.MatchedTier != "long_context" {
+		t.Errorf("tier = %q, want %q", trace.MatchedTier, "long_context")
+	}
+}
+
+// ---------------------------------------------------------------------------
+// Cache variables: absent (all zero) — same expression still works
+// ---------------------------------------------------------------------------
+
+func TestCacheAbsent_ZeroCacheTokens(t *testing.T) {
+	params := billingexpr.TokenParams{P: 100000, C: 5000}
+	cost, trace, err := billingexpr.RunExpr(claudeWithCacheExpr, params)
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := 100000*1.5 + 5000*7.5
+	if math.Abs(cost-want) > 1e-6 {
+		t.Errorf("cost = %f, want %f (cache terms should be 0)", cost, want)
+	}
+	if trace.MatchedTier != "standard" {
+		t.Errorf("tier = %q, want %q", trace.MatchedTier, "standard")
+	}
+}
+
+// ---------------------------------------------------------------------------
+// Mixed cache fields: cc and cc1h non-zero
+// ---------------------------------------------------------------------------
+
+const claudeCacheSplitExpr = `tier("default", p * 1.5 + c * 7.5 + cr * 0.15 + cc * 2.0 + cc1h * 3.0)`
+
+func TestMixedCacheFields(t *testing.T) {
+	params := billingexpr.TokenParams{P: 100000, C: 5000, CR: 10000, CC: 5000, CC1h: 2000}
+	cost, _, err := billingexpr.RunExpr(claudeCacheSplitExpr, params)
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := 100000*1.5 + 5000*7.5 + 10000*0.15 + 5000*2.0 + 2000*3.0
+	if math.Abs(cost-want) > 1e-6 {
+		t.Errorf("cost = %f, want %f", cost, want)
+	}
+}
+
+func TestMixedCacheFields_AllCacheZero(t *testing.T) {
+	params := billingexpr.TokenParams{P: 100000, C: 5000}
+	cost, _, err := billingexpr.RunExpr(claudeCacheSplitExpr, params)
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := 100000*1.5 + 5000*7.5
+	if math.Abs(cost-want) > 1e-6 {
+		t.Errorf("cost = %f, want %f (all cache zero)", cost, want)
+	}
+}
+
+// ---------------------------------------------------------------------------
+// Backward compatibility: p+c only expressions still work with TokenParams
+// ---------------------------------------------------------------------------
+
+func TestBackwardCompat_OldExprWithTokenParams(t *testing.T) {
+	params := billingexpr.TokenParams{P: 100000, C: 5000, CR: 99999, CC: 88888}
+	cost, trace, err := billingexpr.RunExpr(claudeExpr, params)
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := 100000*1.5 + 5000*7.5
+	if math.Abs(cost-want) > 1e-6 {
+		t.Errorf("cost = %f, want %f (old expr ignores cache fields)", cost, want)
+	}
+	if trace.MatchedTier != "standard" {
+		t.Errorf("tier = %q, want %q", trace.MatchedTier, "standard")
+	}
+}
+
+// ---------------------------------------------------------------------------
+// Settlement with cache tokens
+// ---------------------------------------------------------------------------
+
+func TestComputeTieredQuota_WithCache(t *testing.T) {
+	snap := &billingexpr.BillingSnapshot{
+		BillingMode:               "tiered_expr",
+		ExprString:                claudeWithCacheExpr,
+		ExprHash:                  billingexpr.ExprHashString(claudeWithCacheExpr),
+		GroupRatio:                1.0,
+		EstimatedPromptTokens:     100000,
+		EstimatedCompletionTokens: 5000,
+		EstimatedQuotaBeforeGroup: 100000*1.5 + 5000*7.5,
+		EstimatedQuotaAfterGroup:  billingexpr.QuotaRound(100000*1.5 + 5000*7.5),
+		EstimatedTier:             "standard",
+	}
+
+	params := billingexpr.TokenParams{P: 100000, C: 5000, CR: 50000, CC: 10000}
+	result, err := billingexpr.ComputeTieredQuota(snap, params)
+	if err != nil {
+		t.Fatal(err)
+	}
+
+	wantBefore := 100000*1.5 + 5000*7.5 + 50000*0.15 + 10000*1.875
+	if math.Abs(result.ActualQuotaBeforeGroup-wantBefore) > 1e-6 {
+		t.Errorf("before group: got %f, want %f", result.ActualQuotaBeforeGroup, wantBefore)
+	}
+	if result.MatchedTier != "standard" {
+		t.Errorf("tier = %q, want %q", result.MatchedTier, "standard")
+	}
+	if result.CrossedTier {
+		t.Error("expected crossed_tier=false (same tier)")
+	}
+}
+
+func TestComputeTieredQuota_WithCacheCrossTier(t *testing.T) {
+	snap := &billingexpr.BillingSnapshot{
+		BillingMode:               "tiered_expr",
+		ExprString:                claudeWithCacheExpr,
+		ExprHash:                  billingexpr.ExprHashString(claudeWithCacheExpr),
+		GroupRatio:                2.0,
+		EstimatedPromptTokens:     100000,
+		EstimatedCompletionTokens: 5000,
+		EstimatedQuotaBeforeGroup: 100000*1.5 + 5000*7.5,
+		EstimatedQuotaAfterGroup:  billingexpr.QuotaRound((100000*1.5 + 5000*7.5) * 2.0),
+		EstimatedTier:             "standard",
+	}
+
+	params := billingexpr.TokenParams{P: 300000, C: 10000, CR: 50000, CC: 10000}
+	result, err := billingexpr.ComputeTieredQuota(snap, params)
+	if err != nil {
+		t.Fatal(err)
+	}
+
+	wantBefore := 300000*3.0 + 10000*11.25 + 50000*0.3 + 10000*3.75
+	wantAfter := billingexpr.QuotaRound(wantBefore * 2.0)
+	if math.Abs(result.ActualQuotaBeforeGroup-wantBefore) > 1e-6 {
+		t.Errorf("before group: got %f, want %f", result.ActualQuotaBeforeGroup, wantBefore)
+	}
+	if result.ActualQuotaAfterGroup != wantAfter {
+		t.Errorf("after group: got %d, want %d", result.ActualQuotaAfterGroup, wantAfter)
+	}
+	if !result.CrossedTier {
+		t.Error("expected crossed_tier=true (estimated standard, actual long_context)")
+	}
+}
+
+// ---------------------------------------------------------------------------
+// Fuzz: random p/c/cache, verify non-negative result
+// ---------------------------------------------------------------------------
+
+func TestFuzz_NonNegativeResults(t *testing.T) {
+	exprs := []string{
+		claudeExpr,
+		claudeWithCacheExpr,
+		glmExpr,
+		"p * 0.5 + c * 1.0",
+		"max(p, c) * 0.1",
+		"p * 0.5 + cr * 0.1 + cc * 0.2",
+	}
+
+	rng := rand.New(rand.NewSource(42))
+
+	for _, exprStr := range exprs {
+		for i := 0; i < 500; i++ {
+			params := billingexpr.TokenParams{
+				P:    math.Round(rng.Float64() * 1000000),
+				C:    math.Round(rng.Float64() * 500000),
+				CR:   math.Round(rng.Float64() * 200000),
+				CC:   math.Round(rng.Float64() * 50000),
+				CC1h: math.Round(rng.Float64() * 10000),
+			}
+
+			cost, _, err := billingexpr.RunExpr(exprStr, params)
+			if err != nil {
+				t.Fatalf("expr=%q params=%+v: %v", exprStr, params, err)
+			}
+			if cost < 0 {
+				t.Errorf("expr=%q params=%+v: negative cost %f", exprStr, params, cost)
+			}
+		}
+	}
+}
+
+func TestFuzz_SettlementConsistency(t *testing.T) {
+	rng := rand.New(rand.NewSource(99))
+
+	for i := 0; i < 200; i++ {
+		estParams := billingexpr.TokenParams{
+			P:  math.Round(rng.Float64() * 500000),
+			C:  math.Round(rng.Float64() * 100000),
+			CR: math.Round(rng.Float64() * 100000),
+			CC: math.Round(rng.Float64() * 30000),
+		}
+		actParams := billingexpr.TokenParams{
+			P:  math.Round(rng.Float64() * 500000),
+			C:  math.Round(rng.Float64() * 100000),
+			CR: math.Round(rng.Float64() * 100000),
+			CC: math.Round(rng.Float64() * 30000),
+		}
+		groupRatio := 0.5 + rng.Float64()*2.0
+
+		estCost, estTrace, _ := billingexpr.RunExpr(claudeWithCacheExpr, estParams)
+
+		snap := &billingexpr.BillingSnapshot{
+			BillingMode:               "tiered_expr",
+			ExprString:                claudeWithCacheExpr,
+			ExprHash:                  billingexpr.ExprHashString(claudeWithCacheExpr),
+			GroupRatio:                groupRatio,
+			EstimatedPromptTokens:     int(estParams.P),
+			EstimatedCompletionTokens: int(estParams.C),
+			EstimatedQuotaBeforeGroup: estCost,
+			EstimatedQuotaAfterGroup:  billingexpr.QuotaRound(estCost * groupRatio),
+			EstimatedTier:             estTrace.MatchedTier,
+		}
+
+		result, err := billingexpr.ComputeTieredQuota(snap, actParams)
+		if err != nil {
+			t.Fatalf("iter %d: %v", i, err)
+		}
+
+		directCost, _, _ := billingexpr.RunExpr(claudeWithCacheExpr, actParams)
+		directQuota := billingexpr.QuotaRound(directCost * groupRatio)
+
+		if result.ActualQuotaAfterGroup != directQuota {
+			t.Errorf("iter %d: settlement %d != direct %d", i, result.ActualQuotaAfterGroup, directQuota)
+		}
+	}
+}
+
+// ---------------------------------------------------------------------------
+// Settlement-level tests for ComputeTieredQuota
+// ---------------------------------------------------------------------------
+
+func TestComputeTieredQuota_BasicSettlement(t *testing.T) {
+	exprStr := `tier("default", p + c)`
+	snap := &billingexpr.BillingSnapshot{
+		BillingMode: "tiered_expr",
+		ExprString:  exprStr,
+		ExprHash:    billingexpr.ExprHashString(exprStr),
+		GroupRatio:  1.0,
+	}
+
+	result, err := billingexpr.ComputeTieredQuota(snap, billingexpr.TokenParams{P: 3000, C: 2000})
+	if err != nil {
+		t.Fatal(err)
+	}
+	if math.Abs(result.ActualQuotaBeforeGroup-5000) > 1e-6 {
+		t.Errorf("before group = %f, want 5000", result.ActualQuotaBeforeGroup)
+	}
+	if result.ActualQuotaAfterGroup != 5000 {
+		t.Errorf("after group = %d, want 5000", result.ActualQuotaAfterGroup)
+	}
+	if result.MatchedTier != "default" {
+		t.Errorf("tier = %q, want default", result.MatchedTier)
+	}
+}
+
+func TestComputeTieredQuota_WithGroupRatio(t *testing.T) {
+	exprStr := `tier("default", p + c)`
+	snap := &billingexpr.BillingSnapshot{
+		BillingMode: "tiered_expr",
+		ExprString:  exprStr,
+		ExprHash:    billingexpr.ExprHashString(exprStr),
+		GroupRatio:  2.0,
+	}
+
+	result, err := billingexpr.ComputeTieredQuota(snap, billingexpr.TokenParams{P: 1000, C: 500})
+	if err != nil {
+		t.Fatal(err)
+	}
+	// cost = 1500, after group = round(1500 * 2.0) = 3000
+	if result.ActualQuotaAfterGroup != 3000 {
+		t.Errorf("after group = %d, want 3000", result.ActualQuotaAfterGroup)
+	}
+}
+
+func TestComputeTieredQuota_ZeroTokens(t *testing.T) {
+	exprStr := `tier("default", p * 2 + c * 10)`
+	snap := &billingexpr.BillingSnapshot{
+		BillingMode: "tiered_expr",
+		ExprString:  exprStr,
+		ExprHash:    billingexpr.ExprHashString(exprStr),
+		GroupRatio:  1.0,
+	}
+
+	result, err := billingexpr.ComputeTieredQuota(snap, billingexpr.TokenParams{})
+	if err != nil {
+		t.Fatal(err)
+	}
+	if result.ActualQuotaAfterGroup != 0 {
+		t.Errorf("after group = %d, want 0", result.ActualQuotaAfterGroup)
+	}
+}
+
+func TestComputeTieredQuota_RoundingEdge(t *testing.T) {
+	exprStr := `tier("default", p * 0.5)` // 3 * 0.5 = 1.5 -> round to 2
+	snap := &billingexpr.BillingSnapshot{
+		BillingMode: "tiered_expr",
+		ExprString:  exprStr,
+		ExprHash:    billingexpr.ExprHashString(exprStr),
+		GroupRatio:  1.0,
+	}
+
+	result, err := billingexpr.ComputeTieredQuota(snap, billingexpr.TokenParams{P: 3})
+	if err != nil {
+		t.Fatal(err)
+	}
+	// 3 * 0.5 = 1.5, round(1.5) = 2
+	if result.ActualQuotaAfterGroup != 2 {
+		t.Errorf("after group = %d, want 2 (round 1.5 up)", result.ActualQuotaAfterGroup)
+	}
+}
+
+func TestComputeTieredQuota_RoundingEdgeDown(t *testing.T) {
+	exprStr := `tier("default", p * 0.4)` // 3 * 0.4 = 1.2 -> round to 1
+	snap := &billingexpr.BillingSnapshot{
+		BillingMode: "tiered_expr",
+		ExprString:  exprStr,
+		ExprHash:    billingexpr.ExprHashString(exprStr),
+		GroupRatio:  1.0,
+	}
+
+	result, err := billingexpr.ComputeTieredQuota(snap, billingexpr.TokenParams{P: 3})
+	if err != nil {
+		t.Fatal(err)
+	}
+	// 3 * 0.4 = 1.2, round(1.2) = 1
+	if result.ActualQuotaAfterGroup != 1 {
+		t.Errorf("after group = %d, want 1 (round 1.2 down)", result.ActualQuotaAfterGroup)
+	}
+}
+
+func TestComputeTieredQuotaWithRequest_ProbeAffectsQuota(t *testing.T) {
+	exprStr := `param("fast") == true ? tier("fast", p * 4) : tier("normal", p * 2)`
+	snap := &billingexpr.BillingSnapshot{
+		BillingMode:   "tiered_expr",
+		ExprString:    exprStr,
+		ExprHash:      billingexpr.ExprHashString(exprStr),
+		GroupRatio:    1.0,
+		EstimatedTier: "normal",
+	}
+
+	// Without request: normal tier
+	r1, err := billingexpr.ComputeTieredQuota(snap, billingexpr.TokenParams{P: 1000})
+	if err != nil {
+		t.Fatal(err)
+	}
+	if r1.ActualQuotaAfterGroup != 2000 {
+		t.Errorf("normal = %d, want 2000", r1.ActualQuotaAfterGroup)
+	}
+
+	// With request: fast tier
+	r2, err := billingexpr.ComputeTieredQuotaWithRequest(snap, billingexpr.TokenParams{P: 1000}, billingexpr.RequestInput{
+		Body: []byte(`{"fast":true}`),
+	})
+	if err != nil {
+		t.Fatal(err)
+	}
+	if r2.ActualQuotaAfterGroup != 4000 {
+		t.Errorf("fast = %d, want 4000", r2.ActualQuotaAfterGroup)
+	}
+	if !r2.CrossedTier {
+		t.Error("expected CrossedTier = true when probe changes tier")
+	}
+}
+
+func TestComputeTieredQuota_BoundaryTierCrossing(t *testing.T) {
+	exprStr := `p <= 100000 ? tier("small", p * 1) : tier("large", p * 2)`
+	snap := &billingexpr.BillingSnapshot{
+		BillingMode:   "tiered_expr",
+		ExprString:    exprStr,
+		ExprHash:      billingexpr.ExprHashString(exprStr),
+		GroupRatio:    1.0,
+		EstimatedTier: "small",
+	}
+
+	// At boundary
+	r1, err := billingexpr.ComputeTieredQuota(snap, billingexpr.TokenParams{P: 100000})
+	if err != nil {
+		t.Fatal(err)
+	}
+	if r1.MatchedTier != "small" {
+		t.Errorf("at boundary: tier = %s, want small", r1.MatchedTier)
+	}
+	if r1.ActualQuotaAfterGroup != 100000 {
+		t.Errorf("at boundary: quota = %d, want 100000", r1.ActualQuotaAfterGroup)
+	}
+
+	// Past boundary
+	r2, err := billingexpr.ComputeTieredQuota(snap, billingexpr.TokenParams{P: 100001})
+	if err != nil {
+		t.Fatal(err)
+	}
+	if r2.MatchedTier != "large" {
+		t.Errorf("past boundary: tier = %s, want large", r2.MatchedTier)
+	}
+	if r2.ActualQuotaAfterGroup != 200002 {
+		t.Errorf("past boundary: quota = %d, want 200002", r2.ActualQuotaAfterGroup)
+	}
+	if !r2.CrossedTier {
+		t.Error("expected CrossedTier = true")
+	}
+}
+
+// ---------------------------------------------------------------------------
+// Time function tests
+// ---------------------------------------------------------------------------
+
+func TestTimeFunctions_ValidTimezone(t *testing.T) {
+	exprStr := `tier("default", p) * (hour("UTC") >= 0 ? 1 : 1)`
+	cost, _, err := billingexpr.RunExpr(exprStr, billingexpr.TokenParams{P: 100})
+	if err != nil {
+		t.Fatal(err)
+	}
+	if cost != 100 {
+		t.Errorf("cost = %f, want 100", cost)
+	}
+}
+
+func TestTimeFunctions_AllFunctionsCompile(t *testing.T) {
+	exprStr := `tier("default", p) * (hour("Asia/Shanghai") >= 0 ? 1 : 1) * (minute("UTC") >= 0 ? 1 : 1) * (weekday("UTC") >= 0 ? 1 : 1) * (month("UTC") >= 1 ? 1 : 1) * (day("UTC") >= 1 ? 1 : 1)`
+	cost, _, err := billingexpr.RunExpr(exprStr, billingexpr.TokenParams{P: 500})
+	if err != nil {
+		t.Fatal(err)
+	}
+	if cost != 500 {
+		t.Errorf("cost = %f, want 500", cost)
+	}
+}
+
+func TestTimeFunctions_InvalidTimezone(t *testing.T) {
+	exprStr := `tier("default", p) * (hour("Invalid/Zone") >= 0 ? 1 : 2)`
+	cost, _, err := billingexpr.RunExpr(exprStr, billingexpr.TokenParams{P: 100})
+	if err != nil {
+		t.Fatal(err)
+	}
+	// Invalid timezone falls back to UTC; hour is 0-23, so condition is always true
+	if cost != 100 {
+		t.Errorf("cost = %f, want 100 (fallback to UTC)", cost)
+	}
+}
+
+func TestTimeFunctions_EmptyTimezone(t *testing.T) {
+	exprStr := `tier("default", p) * (hour("") >= 0 ? 1 : 2)`
+	cost, _, err := billingexpr.RunExpr(exprStr, billingexpr.TokenParams{P: 100})
+	if err != nil {
+		t.Fatal(err)
+	}
+	if cost != 100 {
+		t.Errorf("cost = %f, want 100 (empty tz -> UTC)", cost)
+	}
+}
+
+func TestTimeFunctions_NightDiscountPattern(t *testing.T) {
+	exprStr := `tier("default", p * 2 + c * 10) * (hour("UTC") >= 21 || hour("UTC") < 6 ? 0.5 : 1)`
+	cost, _, err := billingexpr.RunExpr(exprStr, billingexpr.TokenParams{P: 1000, C: 500})
+	if err != nil {
+		t.Fatal(err)
+	}
+	// Base = 1000*2 + 500*10 = 7000; multiplier is either 0.5 or 1 depending on current UTC hour
+	if cost != 7000 && cost != 3500 {
+		t.Errorf("cost = %f, want 7000 or 3500", cost)
+	}
+}
+
+func TestTimeFunctions_WeekdayRange(t *testing.T) {
+	exprStr := `tier("default", p) * (weekday("UTC") >= 0 && weekday("UTC") <= 6 ? 1 : 999)`
+	cost, _, err := billingexpr.RunExpr(exprStr, billingexpr.TokenParams{P: 100})
+	if err != nil {
+		t.Fatal(err)
+	}
+	// weekday is always 0-6, so multiplier is always 1
+	if cost != 100 {
+		t.Errorf("cost = %f, want 100", cost)
+	}
+}
+
+func TestTimeFunctions_MonthDayPattern(t *testing.T) {
+	exprStr := `tier("default", p) * (month("Asia/Shanghai") == 1 && day("Asia/Shanghai") == 1 ? 0.5 : 1)`
+	cost, _, err := billingexpr.RunExpr(exprStr, billingexpr.TokenParams{P: 1000})
+	if err != nil {
+		t.Fatal(err)
+	}
+	// Either 1000 (not Jan 1) or 500 (Jan 1) — both are valid
+	if cost != 1000 && cost != 500 {
+		t.Errorf("cost = %f, want 1000 or 500", cost)
+	}
+}
@@ -0,0 +1,91 @@
+package billingexpr
+
+import (
+	"fmt"
+	"math"
+	"sync"
+
+	"github.com/expr-lang/expr"
+	"github.com/expr-lang/expr/vm"
+)
+
+const maxCacheSize = 256
+
+var (
+	cacheMu sync.RWMutex
+	cache   = make(map[string]*vm.Program, 64)
+)
+
+// compileEnvPrototype is the type-checking prototype used at compile time.
+// It declares the shape of the environment that RunExpr will provide.
+// The tier() function is a no-op placeholder here; the real one with
+// side-channel tracing is injected at runtime.
+var compileEnvPrototype = map[string]interface{}{
+	"p":                      float64(0),
+	"c":                      float64(0),
+	"cr":                     float64(0),
+	"cc":                     float64(0),
+	"cc1h":                   float64(0),
+	"prompt_tokens":          float64(0),
+	"completion_tokens":      float64(0),
+	"cache_read_tokens":      float64(0),
+	"cache_create_tokens":    float64(0),
+	"cache_create_1h_tokens": float64(0),
+	"tier":                   func(string, float64) float64 { return 0 },
+	"header":                 func(string) string { return "" },
+	"param":                  func(string) interface{} { return nil },
+	"has":                    func(interface{}, string) bool { return false },
+	"hour":                   func(string) int { return 0 },
+	"minute":                 func(string) int { return 0 },
+	"weekday":                func(string) int { return 0 },
+	"month":                  func(string) int { return 0 },
+	"day":                    func(string) int { return 0 },
+	"max":                    math.Max,
+	"min":                    math.Min,
+	"abs":                    math.Abs,
+	"ceil":                   math.Ceil,
+	"floor":                  math.Floor,
+}
+
+// CompileFromCache compiles an expression string, using a cached program when
+// available. The cache is keyed by the SHA-256 hex digest of the expression.
+func CompileFromCache(exprStr string) (*vm.Program, error) {
+	return compileFromCacheByHash(exprStr, ExprHashString(exprStr))
+}
+
+// CompileFromCacheByHash is like CompileFromCache but accepts a pre-computed
+// hash, useful when the caller already has the BillingSnapshot.ExprHash.
+func CompileFromCacheByHash(exprStr, hash string) (*vm.Program, error) {
+	return compileFromCacheByHash(exprStr, hash)
+}
+
+func compileFromCacheByHash(exprStr, hash string) (*vm.Program, error) {
+	cacheMu.RLock()
+	if prog, ok := cache[hash]; ok {
+		cacheMu.RUnlock()
+		return prog, nil
+	}
+	cacheMu.RUnlock()
+
+	prog, err := expr.Compile(exprStr, expr.Env(compileEnvPrototype), expr.AsFloat64())
+	if err != nil {
+		return nil, fmt.Errorf("expr compile error: %w", err)
+	}
+
+	cacheMu.Lock()
+	if len(cache) >= maxCacheSize {
+		cache = make(map[string]*vm.Program, 64)
+	}
+	cache[hash] = prog
+	cacheMu.Unlock()
+
+	return prog, nil
+}
+
+// InvalidateCache clears the compiled-expression cache.
+// Called when billing rules are updated.
+func InvalidateCache() {
+	cacheMu.Lock()
+	cache = make(map[string]*vm.Program, 64)
+	cacheMu.Unlock()
+}
@@ -0,0 +1,10 @@
+package billingexpr
+
+import "math"
+
+// QuotaRound converts a float64 quota value to int using half-away-from-zero
+// rounding. Every tiered billing path (pre-consume, settlement, breakdown
+// validation, log fields) MUST use this function to avoid +-1 discrepancies.
+func QuotaRound(f float64) int {
+	return int(math.Round(f))
+}
@@ -0,0 +1,139 @@
+package billingexpr
+
+import (
+	"fmt"
+	"math"
+	"strings"
+	"time"
+
+	"github.com/expr-lang/expr"
+	"github.com/expr-lang/expr/vm"
+	"github.com/tidwall/gjson"
+)
+
+// RunExpr compiles (with cache) and executes an expression string.
+// The environment exposes:
+//   - p, c             — prompt / completion tokens
+//   - cr, cc, cc1h     — cache read / creation / creation-1h tokens
+//   - tier(name, value) — trace callback that records which tier matched
+//   - max, min, abs, ceil, floor — standard math helpers
+//
+// Returns the resulting float64 quota (before group ratio) and a TraceResult
+// with side-channel info captured by tier() during execution.
+func RunExpr(exprStr string, params TokenParams) (float64, TraceResult, error) {
+	return RunExprWithRequest(exprStr, params, RequestInput{})
+}
+
+func RunExprWithRequest(exprStr string, params TokenParams, request RequestInput) (float64, TraceResult, error) {
+	prog, err := CompileFromCache(exprStr)
+	if err != nil {
+		return 0, TraceResult{}, err
+	}
+	return runProgram(prog, params, request)
+}
+
+// RunExprByHash is like RunExpr but accepts a pre-computed hash for the cache
+// lookup, avoiding a redundant SHA-256 computation when the caller already
+// holds BillingSnapshot.ExprHash.
+func RunExprByHash(exprStr, hash string, params TokenParams) (float64, TraceResult, error) {
+	return RunExprByHashWithRequest(exprStr, hash, params, RequestInput{})
+}
+
+func RunExprByHashWithRequest(exprStr, hash string, params TokenParams, request RequestInput) (float64, TraceResult, error) {
+	prog, err := CompileFromCacheByHash(exprStr, hash)
+	if err != nil {
+		return 0, TraceResult{}, err
+	}
+	return runProgram(prog, params, request)
+}
+
+func runProgram(prog *vm.Program, params TokenParams, request RequestInput) (float64, TraceResult, error) {
+	trace := TraceResult{}
+	headers := normalizeHeaders(request.Headers)
+
+	env := map[string]interface{}{
+		"p":                      params.P,
+		"c":                      params.C,
+		"cr":                     params.CR,
+		"cc":                     params.CC,
+		"cc1h":                   params.CC1h,
+		"prompt_tokens":          params.P,
+		"completion_tokens":      params.C,
+		"cache_read_tokens":      params.CR,
+		"cache_create_tokens":    params.CC,
+		"cache_create_1h_tokens": params.CC1h,
+		"tier": func(name string, value float64) float64 {
+			trace.MatchedTier = name
+			trace.Cost = value
+			return value
+		},
+		"header": func(key string) string {
+			return headers[strings.ToLower(strings.TrimSpace(key))]
+		},
+		"param": func(path string) interface{} {
+			path = strings.TrimSpace(path)
+			if path == "" || len(request.Body) == 0 {
+				return nil
+			}
+			result := gjson.GetBytes(request.Body, path)
+			if !result.Exists() {
+				return nil
+			}
+			return result.Value()
+		},
+		"has": func(source interface{}, substr string) bool {
+			if source == nil || substr == "" {
+				return false
+			}
+			return strings.Contains(fmt.Sprint(source), substr)
+		},
+		"hour":    func(tz string) int { return timeInZone(tz).Hour() },
+		"minute":  func(tz string) int { return timeInZone(tz).Minute() },
+		"weekday": func(tz string) int { return int(timeInZone(tz).Weekday()) },
+		"month":   func(tz string) int { return int(timeInZone(tz).Month()) },
+		"day":     func(tz string) int { return timeInZone(tz).Day() },
+		"max":     math.Max,
+		"min":   math.Min,
+		"abs":   math.Abs,
+		"ceil":  math.Ceil,
+		"floor": math.Floor,
+	}
+
+	out, err := expr.Run(prog, env)
+	if err != nil {
+		return 0, trace, fmt.Errorf("expr run error: %w", err)
+	}
+	f, ok := out.(float64)
+	if !ok {
+		return 0, trace, fmt.Errorf("expr result is %T, want float64", out)
+	}
+	return f, trace, nil
+}
+
+func timeInZone(tz string) time.Time {
+	tz = strings.TrimSpace(tz)
+	if tz == "" {
+		return time.Now().UTC()
+	}
+	loc, err := time.LoadLocation(tz)
+	if err != nil {
+		return time.Now().UTC()
+	}
+	return time.Now().In(loc)
+}
+
+func normalizeHeaders(headers map[string]string) map[string]string {
+	if len(headers) == 0 {
+		return map[string]string{}
+	}
+	normalized := make(map[string]string, len(headers))
+	for key, value := range headers {
+		k := strings.ToLower(strings.TrimSpace(key))
+		v := strings.TrimSpace(value)
+		if k == "" || v == "" {
+			continue
+		}
+		normalized[k] = v
+	}
+	return normalized
+}
@@ -0,0 +1,24 @@
+package billingexpr
+
+// ComputeTieredQuota runs the Expr from a frozen BillingSnapshot against
+// actual token counts and returns the settlement result.
+func ComputeTieredQuota(snap *BillingSnapshot, params TokenParams) (TieredResult, error) {
+	return ComputeTieredQuotaWithRequest(snap, params, RequestInput{})
+}
+
+func ComputeTieredQuotaWithRequest(snap *BillingSnapshot, params TokenParams, request RequestInput) (TieredResult, error) {
+	cost, trace, err := RunExprByHashWithRequest(snap.ExprString, snap.ExprHash, params, request)
+	if err != nil {
+		return TieredResult{}, err
+	}
+
+	afterGroup := QuotaRound(cost * snap.GroupRatio)
+	crossed := trace.MatchedTier != snap.EstimatedTier
+
+	return TieredResult{
+		ActualQuotaBeforeGroup: cost,
+		ActualQuotaAfterGroup:  afterGroup,
+		MatchedTier:            trace.MatchedTier,
+		CrossedTier:            crossed,
+	}, nil
+}
@@ -0,0 +1,59 @@
+package billingexpr
+
+import (
+	"crypto/sha256"
+	"fmt"
+)
+
+type RequestInput struct {
+	Headers map[string]string
+	Body    []byte
+}
+
+// TokenParams holds all token dimensions passed into an Expr evaluation.
+// Fields beyond P and C are optional — when absent they default to 0,
+// which means cache-unaware expressions keep working unchanged.
+type TokenParams struct {
+	P    float64 // prompt tokens
+	C    float64 // completion tokens
+	CR   float64 // cache read (hit) tokens
+	CC   float64 // cache creation tokens (5-min TTL for Claude, generic for others)
+	CC1h float64 // cache creation tokens — 1-hour TTL (Claude only)
+}
+
+// TraceResult holds side-channel info captured by the tier() function
+// during Expr execution. This replaces the old Breakdown mechanism —
+// the Expr itself is the single source of truth for billing logic.
+type TraceResult struct {
+	MatchedTier string  `json:"matched_tier"`
+	Cost        float64 `json:"cost"`
+}
+
+// BillingSnapshot captures the billing rule state frozen at pre-consume time.
+// It is fully serializable and contains no compiled program pointers.
+type BillingSnapshot struct {
+	BillingMode               string  `json:"billing_mode"`
+	ModelName                 string  `json:"model_name"`
+	ExprString                string  `json:"expr_string"`
+	ExprHash                  string  `json:"expr_hash"`
+	GroupRatio                float64 `json:"group_ratio"`
+	EstimatedPromptTokens     int     `json:"estimated_prompt_tokens"`
+	EstimatedCompletionTokens int     `json:"estimated_completion_tokens"`
+	EstimatedQuotaBeforeGroup float64 `json:"estimated_quota_before_group"`
+	EstimatedQuotaAfterGroup  int     `json:"estimated_quota_after_group"`
+	EstimatedTier             string  `json:"estimated_tier"`
+}
+
+// TieredResult holds everything needed after running tiered settlement.
+type TieredResult struct {
+	ActualQuotaBeforeGroup float64 `json:"actual_quota_before_group"`
+	ActualQuotaAfterGroup  int     `json:"actual_quota_after_group"`
+	MatchedTier            string  `json:"matched_tier"`
+	CrossedTier            bool    `json:"crossed_tier"`
+}
+
+// ExprHashString returns the SHA-256 hex digest of an expression string.
+func ExprHashString(expr string) string {
+	h := sha256.Sum256([]byte(expr))
+	return fmt.Sprintf("%x", h)
+}