mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2024-12-28 12:24:35 +00:00
metal : fix NSG1 > 1
This commit is contained in:
parent
845876d012
commit
e8b00e2941
@ -4980,7 +4980,7 @@ void kernel_mul_mm2_impl(
|
|||||||
|
|
||||||
for (int is = 0; is < NSG1; is++) {
|
for (int is = 0; is < NSG1; is++) {
|
||||||
const int i1 = i11 + is*8;
|
const int i1 = i11 + is*8;
|
||||||
const int nstore = MIN(8*NSG1, ne1 - i1) * (8*NSG0);
|
const int nstore = MIN(8, ne1 - i1) * (8*NSG0);
|
||||||
|
|
||||||
for (int i = tiisg; i < nstore; i += NW) {
|
for (int i = tiisg; i < nstore; i += NW) {
|
||||||
const int ic = i%(8*NSG0);
|
const int ic = i%(8*NSG0);
|
||||||
|
Loading…
Reference in New Issue
Block a user