/// Metric name string `cache/first_token_latency_us`.
///
/// NOTE(review): the `_us` suffix suggests the recorded value is a
/// first-token latency in microseconds; where this name is registered and
/// which metric type it uses is not visible here — confirm at the call site.
pub const CACHE_FIRST_TOKEN_LATENCY_US: &str = "cache/first_token_latency_us";
// Histogram: time to first token in microseconds.