File tree 1 file changed +3
-6
lines changed
1 file changed +3
-6
lines changed
Original file line number | Diff line number | Diff line change
@@ -160,7 +160,7 @@ def reset_state_for_recompute(self) -> None:
160
160
self ._stage = SequenceStage .PREFILL
161
161
162
162
def get_num_uncomputed_tokens (self ) -> int :
163
- """Return the number of prefil tokens that are not computed."""
163
+ """Return the number of prefill tokens that are not computed."""
164
164
# we use `get_len()` which includes prompt_len + output_len instead
165
165
# of prompt_len here. This is because during recompute we need to
166
166
# prefill for both prompt and output.
@@ -345,12 +345,9 @@ def fork(self, new_seq_id: int) -> "Sequence":
345
345
def get_num_new_tokens (self ) -> int :
346
346
"""Get the number of new tokens to be computed.
347
347
348
- Args:
349
- remainig_token_budget: The remaining token budgets.
350
348
Returns:
351
- The new number of tokens to be computed. I.e., 1 for decode, prompt
352
- size for prefill. If there's not enough remainig_token_budget, it
353
- can return the chunked number of new tokens.
349
+ The new number of tokens to be computed. I.e., 1 for decode, or
350
+ the remaining prompt size for prefill.
354
351
"""
355
352
if self .data .stage == SequenceStage .DECODE :
356
353
return 1
You can’t perform that action at this time.
0 commit comments