Skip to content

Commit ebbf544

Browse files
authored
sycl : fix for untransposed GDA recurrent state (ggml-org#20583)
1 parent b91d7df commit ebbf544

1 file changed

Lines changed: 2 additions & 2 deletions

File tree

ggml/src/ggml-sycl/gated_delta_net.cpp

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -55,7 +55,7 @@ void gated_delta_net_sycl(const float * q,
 55  55   #pragma unroll
 56  56   for (int r = 0; r < rows_per_lane; r++) {
 57  57       const int i = r * warp_size + lane;
 58     -     s_shard[r] = curr_state[i * S_v + col];
     58 +     s_shard[r] = curr_state[col * S_v + i];
 59  59   }
 60  60
 61  61   for (int t = 0; t < n_tokens; t++) {
@@ -137,7 +137,7 @@ void gated_delta_net_sycl(const float * q,
137 137       #pragma unroll
138 138       for (int r = 0; r < rows_per_lane; r++) {
139 139           const int i = r * warp_size + lane;
140     -         state[i * S_v + col] = s_shard[r];
    140 +         state[col * S_v + i] = s_shard[r];
141 141       }
142 142   }
143 143
0 commit comments

Comments
 (0)