ggml-cuda: fixes for concurrent streams (#18496)

This commit is contained in:
Aman Gupta
2026-01-03 23:15:01 +08:00
committed by GitHub
parent a554a1ecc7
commit e57f52334b
2 changed files with 42 additions and 15 deletions
+1
View File
@@ -1063,6 +1063,7 @@ struct ggml_cuda_graph {
bool disable_due_to_too_many_updates = false;
bool disable_due_to_failed_graph_capture = false;
int number_consecutive_updates = 0;
bool cuda_graphs_enabled = false;
std::vector<ggml_graph_node_properties> ggml_graph_properties;
#endif
};