Mirror of https://github.com/ggerganov/llama.cpp.git, synced 2024-11-11 21:39:52 +00:00
metal : disable graph concurrency optimization due to bug (#2413)
This commit is contained in:
parent b5472ea0ad
commit 1a941869cb
@@ -1722,9 +1722,10 @@ static bool llama_eval_internal(
 
 #ifdef GGML_USE_METAL
     if (lctx.ctx_metal && N == 1) {
-        if (!ggml_metal_if_optimized(lctx.ctx_metal)) {
-            ggml_metal_graph_find_concurrency(lctx.ctx_metal, gf);
-        }
+        // TODO: disabled until #2413 is resolved
+        //if (!ggml_metal_if_optimized(lctx.ctx_metal)) {
+        //    ggml_metal_graph_find_concurrency(lctx.ctx_metal, gf);
+        //}
         ggml_metal_set_n_cb     (lctx.ctx_metal, n_threads);
         ggml_metal_graph_compute(lctx.ctx_metal, gf);
         ggml_metal_get_tensor   (lctx.ctx_metal, cur);
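
For context: the commented-out calls implement a one-time concurrency analysis for the Metal backend. In ggml-metal.h of this era, ggml_metal_graph_find_concurrency scans the compute graph for operations that can be dispatched concurrently, and ggml_metal_if_optimized reports whether that analysis has already been run for the context, so the pass is only done once per graph topology. Below is a minimal sketch of that usage pattern, assuming a valid ggml_metal_context (ctx_metal), ggml_cgraph (gf), and output tensor (cur) set up elsewhere; it is an illustration, not code from this commit:

    // Run the concurrency analysis once per graph topology.
    // This is the step disabled by this commit; see #2413.
    if (!ggml_metal_if_optimized(ctx_metal)) {
        ggml_metal_graph_find_concurrency(ctx_metal, gf);
    }

    // The rest of the Metal path is unchanged by this commit:
    ggml_metal_set_n_cb     (ctx_metal, n_threads); // number of Metal command buffers
    ggml_metal_graph_compute(ctx_metal, gf);        // execute the graph on the GPU
    ggml_metal_get_tensor   (ctx_metal, cur);       // copy the result tensor back to host memory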