15 changes: 13 additions & 2 deletions src/app/v1/_lib/proxy/billing-header-rectifier.ts
Original file line number Diff line number Diff line change
@@ -17,6 +17,15 @@ export type BillingHeaderRectifierResult = {
};

const BILLING_HEADER_PATTERN = /^\s*x-anthropic-billing-header\s*:/i;
const REDACTED_BILLING_HEADER_VALUE = "x-anthropic-billing-header: [REDACTED]";

function redactBillingHeaderAuditValue(value: string): string {
if (!BILLING_HEADER_PATTERN.test(value)) {
return value.trim();
}

return REDACTED_BILLING_HEADER_VALUE;
}
Comment on lines +22 to +28
P2 Dead-code branch in redactBillingHeaderAuditValue

Every call site already guards with BILLING_HEADER_PATTERN.test(...) before invoking this function, so the if (!BILLING_HEADER_PATTERN.test(value)) branch can never be reached in practice. The return value.trim() path is unreachable dead code. The function could be simplified to:

Suggested change:

```diff
-function redactBillingHeaderAuditValue(value: string): string {
-  if (!BILLING_HEADER_PATTERN.test(value)) {
-    return value.trim();
-  }
-
-  return REDACTED_BILLING_HEADER_VALUE;
-}
+function redactBillingHeaderAuditValue(): string {
+  return REDACTED_BILLING_HEADER_VALUE;
+}
```

Or, alternatively, inline REDACTED_BILLING_HEADER_VALUE directly at the two call sites and remove the helper altogether. As-is, the function gives the misleading impression that it might return the original value, which could cause confusion during future refactors.


/**
* Remove x-anthropic-billing-header text blocks from the request system prompt.
@@ -35,7 +44,7 @@ export function rectifyBillingHeader(
// Case 2: system is a plain string
if (typeof system === "string") {
if (BILLING_HEADER_PATTERN.test(system)) {
const extractedValues = [system.trim()];
const extractedValues = [redactBillingHeaderAuditValue(system)];
delete message.system;
return { applied: true, removedCount: 1, extractedValues };
}
@@ -55,7 +64,9 @@
typeof (block as Record<string, unknown>).text === "string" &&
BILLING_HEADER_PATTERN.test((block as Record<string, unknown>).text as string)
) {
extractedValues.push(((block as Record<string, unknown>).text as string).trim());
extractedValues.push(
redactBillingHeaderAuditValue((block as Record<string, unknown>).text as string)
);
} else {
filtered.push(block);
}
9 changes: 9 additions & 0 deletions src/app/v1/_lib/proxy/circuit-breaker-accounting.ts
@@ -0,0 +1,9 @@
const PROVIDER_FAILURE_STATUSES = new Set([401, 402, 403, 408, 429, 451]);

export function shouldRecordProviderCircuitFailure(statusCode: number): boolean {
if (statusCode >= 500) {
return true;
}

return PROVIDER_FAILURE_STATUSES.has(statusCode);
}
Comment on lines +1 to +9
P2 HTTP 403 classification as a provider-side failure

403 Forbidden is included in PROVIDER_FAILURE_STATUSES, but 403 is ambiguous in a proxy context: it is often client-driven (e.g., a client API key that lacks permission for the requested resource / model), not a signal that the upstream provider itself is unhealthy. Treating every 403 as a provider circuit failure could trigger unnecessary failovers when many clients send permission-constrained requests.

The PR already correctly excludes clear client-error codes (400, 404, 409, 413, 415, 422), and the same reasoning applies to 403. If the intent is specifically to trip the circuit on upstream key-revocation responses, consider adding a comment explaining the reasoning, or narrow the check to only treat 403 as a provider failure when there is additional context (e.g., an upstream error body) indicating a key-level access denial rather than a scope/permission mismatch.
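A minimal sketch of the narrowed check this comment suggests — the status set mirrors the PR's, but the optional `upstreamBody` parameter and the denial-marker strings are illustrative assumptions, not the repository's actual upstream contract:

```typescript
// Sketch: count 403 as a provider-side failure only when the upstream error
// body suggests a key-level access denial. Marker strings are hypothetical.
const PROVIDER_FAILURE_STATUSES = new Set([401, 402, 408, 429, 451]);
const KEY_DENIAL_MARKERS = ["invalid api key", "api key revoked", "account disabled"];

function shouldRecordProviderCircuitFailure(statusCode: number, upstreamBody?: string): boolean {
  if (statusCode >= 500) {
    return true;
  }
  if (statusCode === 403) {
    // 403 is ambiguous in a proxy: only count it when the body indicates
    // the upstream key itself is dead, not a scope/permission mismatch.
    const body = (upstreamBody ?? "").toLowerCase();
    return KEY_DENIAL_MARKERS.some((marker) => body.includes(marker));
  }
  return PROVIDER_FAILURE_STATUSES.has(statusCode);
}
```

With this shape, a bare 403 no longer trips the circuit, while a body-confirmed key revocation still does.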

2 changes: 1 addition & 1 deletion src/app/v1/_lib/proxy/endpoint-family-catalog.ts
@@ -97,7 +97,7 @@ const KNOWN_ENDPOINT_FAMILIES: readonly EndpointFamily[] = Object.freeze([
{
id: "response-compact",
surface: "response",
accountingTier: "none",
accountingTier: "required_usage",
modelRequired: false,
rawPassthrough: true,
match: (pathname) => pathname === "/v1/responses/compact",
26 changes: 21 additions & 5 deletions src/app/v1/_lib/proxy/endpoint-policy.ts
@@ -5,7 +5,7 @@ export type EndpointGuardPreset = "chat" | "raw_passthrough";
export type EndpointPoolStrictness = "inherit" | "strict";

export interface EndpointPolicy {
readonly kind: "default" | "raw_passthrough";
readonly kind: "default" | "raw_passthrough" | "guarded_passthrough";
readonly guardPreset: EndpointGuardPreset;
readonly allowRetry: boolean;
readonly allowProviderSwitch: boolean;
@@ -46,10 +46,22 @@ const RAW_PASSTHROUGH_ENDPOINT_POLICY: EndpointPolicy = Object.freeze({
endpointPoolStrictness: "strict",
});

const rawPassthroughEndpointPathSet = new Set<string>([
V1_ENDPOINT_PATHS.MESSAGES_COUNT_TOKENS,
V1_ENDPOINT_PATHS.RESPONSES_COMPACT,
]);
const GUARDED_PASSTHROUGH_ENDPOINT_POLICY: EndpointPolicy = Object.freeze({
kind: "guarded_passthrough",
guardPreset: "chat",
allowRetry: false,
allowProviderSwitch: false,
allowCircuitBreakerAccounting: true,
Comment on lines +52 to +54
P2 Count guarded passthrough failures before aborting in forwarder

For /v1/responses/compact, this policy now says allowCircuitBreakerAccounting=true while keeping allowRetry=false. In ProxyForwarder.send(), every !allowRetry endpoint takes the raw-passthrough fast path and throws before any recordFailure() call, and doForward() turns non-2xx upstream responses into ProxyErrors before ProxyResponseHandler can make up the difference. In practice, repeated 401/429/500s on responses/compact will never open the provider circuit, so this endpoint keeps hammering a bad provider even though the new policy claims to restore breaker accounting.


trackConcurrentRequests: true,
bypassRequestFilters: false,
bypassForwarderPreprocessing: true,
bypassSpecialSettings: true,
bypassResponseRectifier: true,
endpointPoolStrictness: "strict",
});

const rawPassthroughEndpointPathSet = new Set<string>([V1_ENDPOINT_PATHS.MESSAGES_COUNT_TOKENS]);
const guardedPassthroughEndpointPathSet = new Set<string>([V1_ENDPOINT_PATHS.RESPONSES_COMPACT]);

export function isRawPassthroughEndpointPath(pathname: string): boolean {
return rawPassthroughEndpointPathSet.has(normalizeEndpointPath(pathname));
@@ -64,5 +76,9 @@ export function resolveEndpointPolicy(pathname: string): EndpointPolicy {
return RAW_PASSTHROUGH_ENDPOINT_POLICY;
}

if (guardedPassthroughEndpointPathSet.has(normalizeEndpointPath(pathname))) {
return GUARDED_PASSTHROUGH_ENDPOINT_POLICY;
}

return DEFAULT_ENDPOINT_POLICY;
}
34 changes: 23 additions & 11 deletions src/app/v1/_lib/proxy/response-handler.ts
@@ -39,6 +39,7 @@ import type { SessionUsageUpdate } from "@/types/session";
import type { LongContextPricingSpecialSetting } from "@/types/special-settings";
import { GeminiAdapter } from "../gemini/adapter";
import type { GeminiResponse } from "../gemini/types";
import { shouldRecordProviderCircuitFailure } from "./circuit-breaker-accounting";
import { isClientAbortError, isTransportError } from "./errors";
import type { ProxySession } from "./session";
import { consumeDeferredStreamingFinalization } from "./stream-finalization";
@@ -507,10 +508,12 @@ async function finalizeDeferredStreamingFinalizationIfNeeded(

const chainReason = effectiveStatusCode === 404 ? "resource_not_found" : "retry_failed";

// Record in the circuit breaker: lets subsequent requests correctly trigger failover / circuit breaking.
//
// Note: in the forwarder, 404 maps to RESOURCE_NOT_FOUND and is not counted toward the circuit breaker (to avoid treating "resource/model not found" as a provider failure).
if (effectiveStatusCode !== 404 && session.getEndpointPolicy().allowCircuitBreakerAccounting) {
// Record in the circuit breaker: count only provider/key-side failures;
// client-induced 4xx (400/404/409/413/415/422) must not trip the global provider circuit breaker.
if (
shouldRecordProviderCircuitFailure(effectiveStatusCode) &&
session.getEndpointPolicy().allowCircuitBreakerAccounting
) {
try {
// Dynamic import: avoids a potential circular dependency between the proxy and circuit-breaker modules.
const { recordFailure } = await import("@/lib/circuit-breaker");
@@ -559,9 +562,12 @@

const chainReason = effectiveStatusCode === 404 ? "resource_not_found" : "retry_failed";

// Record in the circuit breaker: lets subsequent requests correctly trigger failover / circuit breaking.
// Note: keep consistent with the forwarder's convention: 404 is not counted (a missing resource is not a provider failure).
if (effectiveStatusCode !== 404 && session.getEndpointPolicy().allowCircuitBreakerAccounting) {
// Record in the circuit breaker: count only provider/key-side failures;
// client-induced 4xx (400/404/409/413/415/422) must not trip the global provider circuit breaker.
if (
shouldRecordProviderCircuitFailure(effectiveStatusCode) &&
session.getEndpointPolicy().allowCircuitBreakerAccounting
) {
try {
const { recordFailure } = await import("@/lib/circuit-breaker");
await recordFailure(meta.providerId, new Error(errorMessage));
@@ -780,8 +786,11 @@ export class ProxyResponseHandler {
const detected = detectUpstreamErrorFromSseOrJsonText(responseText);
errorMessageForFinalize = detected.isError ? detected.code : `HTTP ${statusCode}`;

// Record in the circuit breaker
if (session.getEndpointPolicy().allowCircuitBreakerAccounting) {
// Record in the circuit breaker: count only provider/key-side failures.
if (
shouldRecordProviderCircuitFailure(statusCode) &&
session.getEndpointPolicy().allowCircuitBreakerAccounting
) {
try {
const { recordFailure } = await import("@/lib/circuit-breaker");
await recordFailure(provider.id, new Error(errorMessageForFinalize));
@@ -1106,8 +1115,11 @@
const detected = detectUpstreamErrorFromSseOrJsonText(responseText);
const errorMessageForDb = detected.isError ? detected.code : `HTTP ${statusCode}`;

// Record in the circuit breaker
if (session.getEndpointPolicy().allowCircuitBreakerAccounting) {
// Record in the circuit breaker: count only provider/key-side failures.
if (
shouldRecordProviderCircuitFailure(statusCode) &&
session.getEndpointPolicy().allowCircuitBreakerAccounting
) {
try {
const { recordFailure } = await import("@/lib/circuit-breaker");
await recordFailure(provider.id, new Error(errorMessageForDb));
93 changes: 6 additions & 87 deletions src/lib/session-manager.ts
@@ -391,96 +391,15 @@ export class SessionManager {
return clientSessionId;
}

// 2. Fallback: compute a content hash of messages (TC-047 warning: unreliable)
logger.warn(
"SessionManager: No client session ID, falling back to content hash (unreliable for compressed dialogs)",
{
keyId,
messagesLength: Array.isArray(messages) ? messages.length : 0,
}
);
const contentHash = SessionManager.calculateMessagesHash(messages);
if (!contentHash) {
// Fallback: hash cannot be computed, generate a new session
const newId = SessionManager.generateSessionId();
logger.warn("SessionManager: Cannot calculate hash, generating new session", {
sessionId: newId,
});
return newId;
}

// 3. Try to find an existing session in Redis
if (redis && redis.status === "ready") {
try {
const hashKey = `hash:${contentHash}:session`;
const existingSessionId = await redis.get(hashKey);

if (existingSessionId) {
// Found an existing session, refresh its TTL
await SessionManager.refreshSessionTTL(existingSessionId);
logger.trace("SessionManager: Reusing session via hash", {
sessionId: existingSessionId,
hash: contentHash,
});
return existingSessionId;
}

// Not found: create a new session
const newSessionId = SessionManager.generateSessionId();

// Store the mapping (async, non-blocking)
void SessionManager.storeSessionMapping(contentHash, newSessionId, keyId);

logger.trace("SessionManager: Created new session with hash", {
sessionId: newSessionId,
hash: contentHash,
});
return newSessionId;
} catch (error) {
logger.error("SessionManager: Redis error", { error });
// Fallback: Redis error, generate a new session
return SessionManager.generateSessionId();
}
}

// 4. Redis unavailable: fall back to generating a new session
// 2. Safe fallback: when the client provides no session_id, always generate a fresh opaque session.
// The old content-hash reuse would wrongly merge structurally identical requests from different keys/users into the same session.
logger.warn("SessionManager: No client session ID, generating fresh opaque session", {
keyId,
messagesLength,
});
return SessionManager.generateSessionId();
Comment on lines +394 to 400
P2 Preserve a reusable fallback session for clients without session_id

When clientSessionId is missing, this now always generates a brand-new opaque session. Successful responses only attach x-cch-session-id on >=400 responses (error-session-id.ts), and only Claude requests get any best-effort metadata completion, so OpenAI/Codex/Gemini clients that do not already send a session token can never learn or reuse the generated ID. For those callers, every 2xx turn becomes a fresh session, which breaks provider stickiness, request sequencing, and session grouping that previously worked via the fallback path.
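If the fallback must stay opaque, one way to restore reuse is to echo the generated ID back on successful responses as well, so session-less clients can resend it on the next turn. A minimal sketch, assuming the `x-cch-session-id` header name mentioned above and a simplified header map rather than the real response pipeline:

```typescript
// Sketch: expose the generated session ID on 2xx responses too, so
// OpenAI/Codex/Gemini clients that send no session token can learn it.
const SESSION_HEADER = "x-cch-session-id";

function attachSessionId(headers: Map<string, string>, sessionId: string | null): Map<string, string> {
  // Never overwrite an ID the client or an earlier layer already set.
  if (sessionId && !headers.has(SESSION_HEADER)) {
    headers.set(SESSION_HEADER, sessionId);
  }
  return headers;
}
```

A client that stores this header and replays it as its session token would land back on the `clientSessionId` fast path, preserving provider stickiness.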


}

/**
* Store the hash → session mapping
*/
private static async storeSessionMapping(
contentHash: string,
sessionId: string,
keyId: number
): Promise<void> {
const redis = getRedisClient();
if (!redis || redis.status !== "ready") return;

try {
const pipeline = redis.pipeline();
const hashKey = `hash:${contentHash}:session`;

// Store the mapping
pipeline.setex(hashKey, SessionManager.SESSION_TTL, sessionId);

// Initialize session metadata
pipeline.setex(`session:${sessionId}:key`, SessionManager.SESSION_TTL, keyId.toString());
pipeline.setex(
`session:${sessionId}:last_seen`,
SessionManager.SESSION_TTL,
Date.now().toString()
);

await pipeline.exec();
} catch (error) {
logger.error("SessionManager: Failed to store session mapping", {
error,
});
}
}

/**
* Refresh the session TTL (sliding window)
*/
3 changes: 2 additions & 1 deletion src/lib/utils/sse.ts
@@ -70,6 +70,7 @@ export function parseSSEData(sseText: string): ParsedSSEEvent[] {
* Only treat line-initial `event:` / `data:` (or a leading comment line `:`) as SSE, to avoid false positives when a JSON body contains "data:".
*/
export function isSSEText(text: string): boolean {
const sseFieldPrefixes = ["event:", "data:", "id:", "retry:"];
let start = 0;

for (let i = 0; i <= text.length; i += 1) {
@@ -81,7 +82,7 @@
if (!line) continue;
if (line.startsWith(":")) continue;

return line.startsWith("event:") || line.startsWith("data:");
return sseFieldPrefixes.some((prefix) => line.startsWith(prefix));
Comment on lines 73 to +85
P2 parseSSEData silently drops id: and retry: fields

isSSEText now correctly recognises responses whose first meaningful line starts with id: or retry:, which is good. However, parseSSEData does not handle these two fields — they fall through the if-else chain and are silently dropped. This matches the HTML SSE spec (these fields affect the connection-level reconnection state, not the event payload), but it is worth a comment to make the intent clear and to prevent a future contributor from treating the omission as a bug:

Suggested change:

```diff
   const sseFieldPrefixes = ["event:", "data:", "id:", "retry:"];
+  // Note: `id:` and `retry:` are valid SSE field prefixes and must be
+  // recognised here so isSSEText returns true for responses that begin
+  // with them. parseSSEData intentionally does NOT process these fields
+  // because they control SSE reconnection state, not event data.
   let start = 0;
```

}

return false;
Expand Down
63 changes: 63 additions & 0 deletions tests/unit/lib/session-manager-session-id-fallback.test.ts
@@ -0,0 +1,63 @@
import { beforeEach, describe, expect, test, vi } from "vitest";

vi.mock("server-only", () => ({}));

vi.mock("@/lib/logger", () => ({
logger: {
warn: vi.fn(),
trace: vi.fn(),
info: vi.fn(),
error: vi.fn(),
},
}));

const getRedisClientMock = vi.fn();

vi.mock("@/lib/redis", () => ({
getRedisClient: getRedisClientMock,
}));

vi.mock("@/app/v1/_lib/proxy/errors", () => ({
sanitizeHeaders: vi.fn(() => "(empty)"),
sanitizeUrl: vi.fn((value: string) => value),
}));

vi.mock("@/lib/session-tracker", () => ({
SessionTracker: {
getActiveSessions: vi.fn(async () => []),
},
}));

describe("SessionManager.getOrCreateSessionId fallback", () => {
beforeEach(() => {
vi.clearAllMocks();
});

test("without client session id, identical messages should not reuse the same derived session id even when Redis is ready", async () => {
const { SessionManager } = await import("@/lib/session-manager");
const messages = [{ role: "user", content: "hello" }];
const hashMapping = new Map<string, string>();

const pipeline = {
setex: vi.fn((key: string, _ttl: number, value: string) => {
hashMapping.set(key, value);
return pipeline;
}),
exec: vi.fn(async () => []),
};

getRedisClientMock.mockReturnValue({
status: "ready",
get: vi.fn(async (key: string) => hashMapping.get(key) ?? null),
pipeline: vi.fn(() => pipeline),
});

const first = await SessionManager.getOrCreateSessionId(11, messages, null);
await new Promise((resolve) => setTimeout(resolve, 0));
const second = await SessionManager.getOrCreateSessionId(22, messages, null);

expect(first).toMatch(/^sess_/);
expect(second).toMatch(/^sess_/);
expect(first).not.toBe(second);
});
});