We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent c6e8f26 commit c2a264e (Copy full SHA for c2a264e)
benchmarks/benchmark_throughput.py
@@ -272,8 +272,10 @@ def main(args: argparse.Namespace):
272
raise ValueError(f"Unknown backend: {args.backend}")
273
total_num_tokens = sum(prompt_len + output_len
274
for _, prompt_len, output_len in requests)
275
+ total_output_tokens = sum(output_len for _, _, output_len in requests)
276
print(f"Throughput: {len(requests) / elapsed_time:.2f} requests/s, "
- f"{total_num_tokens / elapsed_time:.2f} tokens/s")
277
+ f"{total_num_tokens / elapsed_time:.2f} total tokens/s, "
278
+ f"{total_output_tokens / elapsed_time:.2f} output tokens/s")
279
280
# Output JSON results if specified
281
if args.output_json:
0 commit comments