mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-01-10 18:51:45 +00:00
Release the existing encode block, if any, when re-setting the encoding buffer count
This commit is contained in:
parent
5e6358398c
commit
4af03de2a6
@@ -3428,6 +3428,10 @@ static void ggml_backend_metal_set_n_cb(ggml_backend_t backend, int n_cb) {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if(ctx->encode_async) {
|
||||||
|
Block_release(ctx->encode_async);
|
||||||
|
}
|
||||||
|
|
||||||
ctx->encode_async = Block_copy(^(size_t iter) {
|
ctx->encode_async = Block_copy(^(size_t iter) {
|
||||||
const int cb_idx = iter;
|
const int cb_idx = iter;
|
||||||
const int n_cb_l = ctx->n_cb;
|
const int n_cb_l = ctx->n_cb;
|
||||||
|
Loading…
Reference in New Issue
Block a user