Skip to content

Commit 75d3df1

Browse files
author
ilmarkov
committed
Fix CodecQ4
Signed-off-by: ilmarkov <imarkov@redhat.com>
1 parent 247348e commit 75d3df1

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

csrc/quickreduce/quick_reduce_impl.cuh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -182,7 +182,7 @@ struct CodecQ4 : public CodecBase {
182 182   for (int i = 0; i < 4; i++) {
183 183   if constexpr (std::is_same<T, half>::value) {
184 184   int32_t q4 = ((qw >> (i * 4)) & kMask000F) | kHalf2_1024;
185     - packed_add<half>(w[i], kHalf2_1032);
    185 + w[i] = packed_add<half>(w[i], kHalf2_1032);
186 186   } else {
187 187   int32_t int16_2 = (qw >> (i * 4)) & kMask000F;
188 188   int16_t low = static_cast<int16_t>(int16_2 & 0xFFFF);

0 commit comments

Comments
 (0)