Skip to content

Commit b016daf

Browse files
authored
typo--
1 parent b65e2e2 commit b016daf

File tree

1 file changed

+3
-3
lines changed

1 file changed

+3
-3
lines changed

llama_cpp/llama.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -940,9 +940,9 @@ def _create_completion(
940940

941941
completion_id: str = f"cmpl-{str(uuid.uuid4())}"
942942
created: int = int(time.time())
943-
prefix_token_id: int = int(self.metadata.get("tokenizer.ggml.prefix_token_id", self.token_prefix()))
944-
middle_token_id: int = int(self.metadata.get("tokenizer.ggml.middle_token_id", self.token_middle()))
945-
suffix_token_id: int = int(self.metadata.get("tokenizer.ggml.suffix_token_id", self.token_suffix()))
943+
prefix_token_id: int = int(self.metadata.get("tokenizer.ggml.prefix_token_id", self._model.token_prefix()))
944+
middle_token_id: int = int(self.metadata.get("tokenizer.ggml.middle_token_id", self._model.token_middle()))
945+
suffix_token_id: int = int(self.metadata.get("tokenizer.ggml.suffix_token_id", self._model.token_suffix()))
946946
# If prompt is empty, initialize completion with BOS token to avoid
947947
# detokenization including a space at the beginning of the completion
948948
completion_tokens: List[int] = [] if len(prompt) > 0 else [self.token_bos()]

0 commit comments

Comments
 (0)