File tree 1 file changed +4
-4
lines changed
1 file changed +4
-4
lines changed Original file line number Diff line number Diff line change @@ -3018,8 +3018,8 @@ void kernel_mul_mv_q4_K_f32_impl(
3018
3018
constant uint & r2,
3019
3019
constant uint & r3,
3020
3020
uint3 tgpig[[threadgroup_position_in_grid]],
3021
- uint tiisg[[thread_index_in_simdgroup]],
3022
- uint sgitg[[simdgroup_index_in_threadgroup]]) {
3021
+ uint tiisg[[thread_index_in_simdgroup]],
3022
+ uint sgitg[[simdgroup_index_in_threadgroup]]) {
3023
3023
3024
3024
const int ix = tiisg/4 ; // 0...7
3025
3025
const int it = tiisg%4 ; // 0...3
@@ -3028,7 +3028,7 @@ void kernel_mul_mv_q4_K_f32_impl(
3028
3028
const int r0 = tgpig.x ;
3029
3029
const int r1 = tgpig.y ;
3030
3030
const int im = tgpig.z ;
3031
- const int first_row = (r0 * N_SIMDGROUP + sgitg) * N_DST;
3031
+ const int first_row = r0 * N_DST;
3032
3032
const int ib_row = first_row * nb;
3033
3033
3034
3034
const uint i12 = im%ne12;
@@ -3094,7 +3094,7 @@ void kernel_mul_mv_q4_K_f32_impl(
3094
3094
for (int row = 0 ; row < N_DST; ++row) {
3095
3095
all_sum = simd_sum (sumf[row]);
3096
3096
if (tiisg == 0 ) {
3097
- dst[r1*ne0+ im*ne0*ne1 + first_row + row] = all_sum;
3097
+ dst[r1*ne0 + im*ne0*ne1 + first_row + row] = all_sum;
3098
3098
}
3099
3099
}
3100
3100
}
You can’t perform that action at this time.
0 commit comments