We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 7b8712c, commit 7915980 (Copy full SHA for 7915980)
web/src/server/free-session/fireworks-health.ts
@@ -18,7 +18,7 @@ export type FireworksHealth = 'healthy' | 'degraded' | 'unhealthy'
18
/** Degrade once median prefill-queue latency crosses this bound. Strict by
19
* design — a 1s queue on top of ~1s prefill already means users feel 2s+
20
* before first token. */
21
-export const PREFILL_QUEUE_DEGRADED_MS = 1_000
+export const PREFILL_QUEUE_DEGRADED_MS = 600
22
23
/** Leading indicator of load — responds instantly to memory pressure, while
24
* prefill-queue p50 is a lagging window statistic. Degrading here lets us
0 commit comments