metal : disable graph concurrency optimization due to bug (#2413)

This commit is contained in:
Georgi Gerganov 2023-07-27 11:00:54 +03:00
parent b5472ea0ad
commit 1a941869cb
No known key found for this signature in database
GPG key ID: 449E073F9DC10735

View file

@@ -1722,9 +1722,10 @@ static bool llama_eval_internal(
#ifdef GGML_USE_METAL
if (lctx.ctx_metal && N == 1) {
if (!ggml_metal_if_optimized(lctx.ctx_metal)) {
ggml_metal_graph_find_concurrency(lctx.ctx_metal, gf);
}
// TODO: disabled until #2413 is resolved
//if (!ggml_metal_if_optimized(lctx.ctx_metal)) {
// ggml_metal_graph_find_concurrency(lctx.ctx_metal, gf);
//}
ggml_metal_set_n_cb (lctx.ctx_metal, n_threads);
ggml_metal_graph_compute(lctx.ctx_metal, gf);
ggml_metal_get_tensor (lctx.ctx_metal, cur);