Skip to content

Commit 7e26967

Browse files
henrylhtsang authored and facebook-github-bot committed
Make vllm compatible with cutlass 4.0 (#20460)
Summary: Rollback Plan: Differential Revision: D77771042
1 parent 8d1096e commit 7e26967

File tree

4 files changed

+2
-4
lines changed

4 files changed

+2
-4
lines changed

csrc/cutlass_extensions/gemm/collective/sm90_mma_tma_gmma_ss_warpspecialized_fp8_blockwise_scaling.hpp

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -45,7 +45,6 @@
4545
#include "cute/algorithm/functional.hpp"
4646
#include "cute/atom/mma_atom.hpp"
4747
#include "cute/algorithm/gemm.hpp"
48-
#include "cute/tensor_predicate.hpp"
4948
#include "cute/numeric/arithmetic_tuple.hpp"
5049

5150
#include "cutlass_extensions/gemm/dispatch_policy.hpp"

csrc/quantization/cutlass_w8a8/c3x/scaled_mm.cuh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -51,7 +51,7 @@ struct cutlass_3x_gemm {
5151
// These are the minimum alignments needed for the kernels to compile
5252
static constexpr int AlignmentAB =
5353
128 / cutlass::sizeof_bits<ElementAB>::value;
54-
static constexpr int AlignmentCD = 4;
54+
static constexpr int AlignmentCD = 8;
5555

5656
using CollectiveEpilogue =
5757
typename cutlass::epilogue::collective::CollectiveBuilder<

csrc/quantization/machete/machete_mainloop.cuh

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -38,7 +38,6 @@
3838
#include "cute/atom/mma_atom.hpp"
3939
#include "cute/atom/copy_traits_sm90_tma.hpp"
4040
#include "cute/algorithm/gemm.hpp"
41-
#include "cute/tensor_predicate.hpp"
4241
#include "cute/numeric/arithmetic_tuple.hpp"
4342
#include "cutlass/pipeline/pipeline.hpp"
4443
#include "cutlass/transform/collective/sm90_wgmma_transpose.hpp"

csrc/sparse/cutlass/sparse_scaled_mm_c3x.cuh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -79,7 +79,7 @@ struct cutlass_sparse_3x_gemm {
7979
// These are the minimum alignments needed for the kernels to compile
8080
static constexpr int AlignmentAB =
8181
128 / cutlass::sizeof_bits<ElementAB>::value;
82-
static constexpr int AlignmentCD = 4;
82+
static constexpr int AlignmentCD = 8;
8383

8484
using CollectiveEpilogue =
8585
typename cutlass::epilogue::collective::CollectiveBuilder<

0 commit comments

Comments
 (0)