Skip to content

Commit b58ce7c

Browse files
authored
Merge pull request #121 from ggerganov/master
b2894
2 parents e4c0d67 + e1b40ac commit b58ce7c

File tree

2 files changed

+238
-145
lines changed

2 files changed

+238
-145
lines changed

ggml-cuda.cu

+1 -1
Original file line number | Diff line number | Diff line change
@@ -2558,7 +2558,7 @@ GGML_CALL static enum ggml_status ggml_backend_cuda_graph_compute(ggml_backend_t
2558 2558   }
2559 2559
2560 2560   // Disable CUDA graphs (from the next token) if the use-case is demanding too many consecutive graph updates.
2561      - if (cuda_graph_update_required) {
     2561 + if (use_cuda_graph && cuda_graph_update_required) {
2562 2562   cuda_ctx->cuda_graph->number_consecutive_updates++;
2563 2563   } else {
2564 2564   cuda_ctx->cuda_graph->number_consecutive_updates = 0;

0 commit comments

Comments
 (0)