// NOTE(review): presumably timestamps taken at the start of each phase (unit not
// visible in this excerpt). Unlike the double fields below, these two have no
// default initializer here — confirm they are always assigned before being read.
int64_t t_start_process_prompt;
int64_t t_start_generation;
// Durations in milliseconds; default-initialized to 0.0.
- double t_prompt_processing; // ms
- double t_token_generation; // ms
+ double t_prompt_processing = 0.0; // ms
+ double t_token_generation = 0.0; // ms
// Callback taking a single int argument (labelled id_slot).
// NOTE(review): presumably invoked when the slot is released — confirm at the call site.
std::function<void(int /* id_slot */)> callback_on_release;
// These int32_t fields default to -1.
// NOTE(review): -1 looks like a "not set" sentinel — confirm against the code that fills them in.
int32_t cache_n = -1;
int32_t prompt_n = -1;
// Prompt-side figures; default-initialized to 0.0.
// NOTE(review): units presumably follow the name suffixes (ms, ms per token, tokens per second) — confirm.
- double prompt_ms;
- double prompt_per_token_ms;
- double prompt_per_second;
+ double prompt_ms = 0.0;
+ double prompt_per_token_ms = 0.0;
+ double prompt_per_second = 0.0;
// Same layout as the prompt_* group above: an int32_t defaulting to -1
// followed by three doubles defaulting to 0.0.
int32_t predicted_n = -1;
- double predicted_ms;
- double predicted_per_token_ms;
- double predicted_per_second;
+ double predicted_ms = 0.0;
+ double predicted_per_token_ms = 0.0;
+ double predicted_per_second = 0.0;
// Optional speculative metrics - only included when > 0
int32_t draft_n = 0;