Skip to content

Commit 8f20fc0

Browse files
UranusSeven and Zhong Wang authored
[Misc] fix docstrings (#4191)
Co-authored-by: Zhong Wang <wangzhong@infini-ai.com>
1 parent 221d93e commit 8f20fc0

File tree

1 file changed

+3
-6
lines changed

1 file changed

+3
-6
lines changed

vllm/sequence.py

Lines changed: 3 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -160,7 +160,7 @@ def reset_state_for_recompute(self) -> None:
160160
self._stage = SequenceStage.PREFILL
161161

162162
def get_num_uncomputed_tokens(self) -> int:
163-
"""Return the number of prefil tokens that are not computed."""
163+
"""Return the number of prefill tokens that are not computed."""
164164
# we use `get_len()` which includes prompt_len + output_len instead
165165
# of prompt_len here. This is because during recompute we need to
166166
# prefill for both prompt and output.
@@ -345,12 +345,9 @@ def fork(self, new_seq_id: int) -> "Sequence":
345345
def get_num_new_tokens(self) -> int:
346346
"""Get the number of new tokens to be computed.
347347
348-
Args:
349-
remainig_token_budget: The remaining token budgets.
350348
Returns:
351-
The new number of tokens to be computed. I.e., 1 for decode, prompt
352-
size for prefill. If there's not enough remainig_token_budget, it
353-
can return the chunked number of new tokens.
349+
The new number of tokens to be computed. I.e., 1 for decode, or
350+
the remaining prompt size for prefill.
354351
"""
355352
if self.data.stage == SequenceStage.DECODE:
356353
return 1

0 commit comments

Comments
 (0)