Skip to content

Commit 7483853

Browse files
committed
[benchmark] add max-concurrency in result table
Signed-off-by: Peter Pan <Peter.Pan@daocloud.io>
1 parent 8a4e5c5 commit 7483853

File tree

2 files changed

+4
-0
lines changed

2 files changed

+4
-0
lines changed

benchmarks/benchmark_serving.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -520,6 +520,8 @@ async def limited_request_func(request_func_input, pbar):
520 | 520 |
521 | 521 |   print("{s:{c}^{n}}".format(s=" Serving Benchmark Result ", n=50, c="="))
522 | 522 |   print("{:<40} {:<10}".format("Successful requests:", metrics.completed))
    | 523 | + if max_concurrency is not None:
    | 524 | +     print("{:<40} {:<10}".format("Maximum request concurrency:", max_concurrency))
523 | 525 |   print("{:<40} {:<10.2f}".format("Benchmark duration (s):", benchmark_duration))
524 | 526 |   print("{:<40} {:<10}".format("Total input tokens:", metrics.total_input))
525 | 527 |   print("{:<40} {:<10}".format("Total generated tokens:", metrics.total_output))

benchmarks/benchmark_serving_structured_output.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -569,6 +569,8 @@ async def limited_request_func(request_func_input, pbar):
569 | 569 |
570 | 570 |   print("{s:{c}^{n}}".format(s=" Serving Benchmark Result ", n=50, c="="))
571 | 571 |   print("{:<40} {:<10}".format("Successful requests:", metrics.completed))
    | 572 | + if max_concurrency is not None:
    | 573 | +     print("{:<40} {:<10}".format("Maximum request concurrency:", max_concurrency))
572 | 574 |   print("{:<40} {:<10.2f}".format("Benchmark duration (s):", benchmark_duration))
573 | 575 |   print("{:<40} {:<10}".format("Total input tokens:", metrics.total_input))
574 | 576 |   print("{:<40} {:<10}".format("Total generated tokens:", metrics.total_output))

0 commit comments

Comments
 (0)