diff --git a/evals/benchmark/stresscli/commands/config.ini b/evals/benchmark/stresscli/commands/config.ini index fd195d5e..f5d144d1 100644 --- a/evals/benchmark/stresscli/commands/config.ini +++ b/evals/benchmark/stresscli/commands/config.ini @@ -11,14 +11,14 @@ End_to_End_latency_P50 = End to End latency\(ms\),\s+P50:\s+([\d.]+) End_to_End_latency_P90 = End to End latency\(ms\),\s+P50:[\s\d.,]+P90:\s+([\d.]+) End_to_End_latency_P99 = End to End latency\(ms\),\s+P50:[\s\d.,]+P90:\s+[\s\d.,]+P99:\s+([\d.]+) End_to_End_latency_Avg = End to End latency\(ms\),\s+P50:[\s\d.,]+P90:\s+[\s\d.,]+P99:\s+[\s\d.,]+Avg:\s+([\d.]+) -First_token_latency_P50 = First token latency\(ms\),\s+P50:\s+([\d.]+) -First_token_latency_P90 = First token latency\(ms\),\s+P50:[\s\d.,]+P90:\s+([\d.]+) -First_token_latency_P99 = First token latency\(ms\),\s+P50:[\s\d.,]+P90:\s+[\s\d.,]+P99:\s+([\d.]+) -First_token_latency_Avg = First token latency\(ms\),\s+P50:[\s\d.,]+P90:\s+[\s\d.,]+P99:\s+[\s\d.,]+Avg:\s+([\d.]+) -Next_token_latency_P50 = Next token latency\(ms\),\s+P50:\s+([\d.]+) -Next_token_latency_P90 = Next token latency\(ms\),\s+P50:[\s\d.,]+P90:\s+([\d.]+) -Next_token_latency_P99 = Next token latency\(ms\),\s+P50:[\s\d.,]+P90:\s+[\s\d.,]+P99:\s+([\d.]+) -Next_token_latency_Avg = Next token latency\(ms\),\s+P50:[\s\d.,]+P90:\s+[\s\d.,]+P99:\s+[\s\d.,]+Avg:\s+([\d.]+) +Time_to_First_Token-TTFT_P50 = Time to First Token-TTFT\(ms\),\s+P50:\s+([\d.]+) +Time_to_First_Token-TTFT_P90 = Time to First Token-TTFT\(ms\),\s+P50:[\s\d.,]+P90:\s+([\d.]+) +Time_to_First_Token-TTFT_P99 = Time to First Token-TTFT\(ms\),\s+P50:[\s\d.,]+P90:\s+[\s\d.,]+P99:\s+([\d.]+) +Time_to_First_Token-TTFT_Avg = Time to First Token-TTFT\(ms\),\s+P50:[\s\d.,]+P90:\s+[\s\d.,]+P99:\s+[\s\d.,]+Avg:\s+([\d.]+) +Time_Per_Output_Token-TPOT_P50 = Time Per Output Token-TPOT\(ms\),\s+P50:\s+([\d.]+) +Time_Per_Output_Token-TPOT_P90 = Time Per Output Token-TPOT\(ms\),\s+P50:[\s\d.,]+P90:\s+([\d.]+) +Time_Per_Output_Token-TPOT_P99 = Time Per Output Token-TPOT\(ms\),\s+P50:[\s\d.,]+P90:\s+[\s\d.,]+P99:\s+([\d.]+) +Time_Per_Output_Token-TPOT_Avg = Time Per Output Token-TPOT\(ms\),\s+P50:[\s\d.,]+P90:\s+[\s\d.,]+P99:\s+[\s\d.,]+Avg:\s+([\d.]+) Average_token_latency = Average token latency\(ms\)\s+:\s+([\d.]+) locust_num_requests = \"num_requests\":\s+(\d+) locust_num_failures = \"num_failures\":\s+(\d+)