You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
// Store the output when doing grouped query attention.
109
29
// Rows index by Q's dimension 2, and the first N rows are valid.
@@ -114,27 +34,6 @@ D_TYPE perElemOpGqaStore(const in uint32_t r, const in uint32_t c, const in D_TY
114
34
return elem;
115
35
}
116
36
117
-
// Store column zero. This is used to save per-row m and L values for split_k.
118
-
ACC_TYPE perElemOpStoreCol0(const in uint32_t r, const in uint32_t c, const in ACC_TYPE elem, const in uint32_t o_offset, const in uint32_t iq2, const in uint32_t N)
119
-
{
120
-
if (r < N && c == 0) {
121
-
uint32_t offset = iq2 + r;
122
-
data_o[o_offset + offset] = D_TYPE(elem);
123
-
}
124
-
return elem;
125
-
}
126
-
127
-
// Load the slope matrix, indexed by Q's dimension 2.
128
-
ACC_TYPE perElemOpComputeSlope(const in uint32_t r, const in uint32_t c, const in ACC_TYPE elem, const in uint32_t iq2)
// Per-element operation that stores column zero of the matrix.
// This is used to save the per-row m and L values for split_k.
//
// When the element sits in column 0 and its row index r is below N, the
// value is converted to D_TYPE and written to data_o[o_offset + iq2 + r].
// No store happens for any other element. The incoming element is always
// returned unchanged.
ACC_TYPE perElemOpStoreCol0(const in uint32_t r, const in uint32_t c, const in ACC_TYPE elem, const in uint32_t o_offset, const in uint32_t iq2, const in uint32_t N)
{
    const bool is_valid_row = r < N;
    const bool is_first_col = c == 0;

    if (is_valid_row && is_first_col) {
        // Destination index: caller-supplied base offset plus (iq2 + row).
        data_o[o_offset + (iq2 + r)] = D_TYPE(elem);
    }

    return elem;
}
97
+
98
+
// Load the slope matrix, indexed by Q's dimension 2.
99
+
ACC_TYPE perElemOpComputeSlope(const in uint32_t r, const in uint32_t c, const in ACC_TYPE elem, const in uint32_t iq2)
0 commit comments