mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2026-07-04 10:10:19 +00:00
metal : fix mat-vec Q8_0 kernel for BS > 1
This commit is contained in:
@@ -1071,8 +1071,15 @@ kernel void kernel_mul_mv_q8_0_f32(
|
||||
constant int64_t & ne00,
|
||||
constant int64_t & ne01,
|
||||
constant int64_t & ne02,
|
||||
constant uint64_t & nb00,
|
||||
constant uint64_t & nb01,
|
||||
constant uint64_t & nb02,
|
||||
constant int64_t & ne10,
|
||||
constant int64_t & ne11,
|
||||
constant int64_t & ne12,
|
||||
constant uint64_t & nb10,
|
||||
constant uint64_t & nb11,
|
||||
constant uint64_t & nb12,
|
||||
constant int64_t & ne0,
|
||||
constant int64_t & ne1,
|
||||
constant uint & r2 [[buffer(17)]],
|
||||
|
||||
Reference in New Issue
Block a user