Skip to content

Commit e194eab

Browse files
committed
benchmark_serving with short fixed_output_len
1 parent 71d21c7 commit e194eab

File tree

1 file changed

+4
-3
lines changed

1 file changed

+4
-3
lines changed

benchmarks/benchmark_serving.py

Lines changed: 4 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -117,7 +117,7 @@ def sample_sharegpt_requests(
117 117
prompt_len = len(prompt_token_ids)
118 118
output_len = len(completion_token_ids
119 119
) if fixed_output_len is None else fixed_output_len
120-
if prompt_len < 4 or output_len < 4:
120+
if prompt_len < 4 or (fixed_output_len is not None and output_len < 4):
121 121
# Prune too short sequences.
122 122
continue
123 123
if prompt_len > 1024 or prompt_len + output_len > 2048:
@@ -228,10 +228,11 @@ def sample_hf_requests(
228 228
prompt_len = len(prompt_token_ids)
229 229
output_len = len(completion_token_ids
230 230
) if fixed_output_len is None else fixed_output_len
231-
if prompt_len < 4 or output_len < 4:
231+
if fixed_output_len is None and (prompt_len < 4 or output_len < 4):
232 232
# Prune too short sequences.
233 233
continue
234-
if prompt_len > 1024 or prompt_len + output_len > 2048:
234+
if fixed_output_len is None and \
235+
(prompt_len > 1024 or prompt_len + output_len > 2048):
235 236
# Prune too long sequences.
236 237
continue
237 238

0 commit comments

Comments
 (0)