You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
Copy file name to clipboard. Expand all lines: examples/67_hopper_fp8_warp_specialized_gemm_with_blockwise_scaling/67_hopper_fp8_warp_specialized_gemm_with_blockwise_scaling.cu
+1 -1 Lines changed: 1 addition & 1 deletion
Original file line number
Diff line number
Diff line change
@@ -123,7 +123,7 @@ using ArchTag = cutlass::arch::Sm90; // T
123
123
using OperatorClass = cutlass::arch::OpClassTensorOp; // Operator class tag
124
124
using TileShape = Shape<_128,_128,_128>; // Threadblock-level tile size
125
125
using ClusterShape = Shape<_1,_2,_1>; // Shape of the threadblocks in a cluster
126
-
using KernelSchedule = cutlass::gemm::KernelTmaWarpSpecializedCooperativeFP8BlockScaledAccum;
126
+
using KernelSchedule = cutlass::gemm::KernelTmaWarpSpecializedCooperativeFP8BlockScaledAccum<>;
127
127
using EpilogueSchedule = cutlass::epilogue::TmaWarpSpecializedCooperative;
128
128
129
129
using EpilogueTileType = cutlass::epilogue::collective::EpilogueTileAuto;
Copy file name to clipboard. Expand all lines: examples/67_hopper_fp8_warp_specialized_gemm_with_blockwise_scaling/67_hopper_fp8_warp_specialized_gemm_with_groupwise_scaling.cu
Copy file name to clipboard. Expand all lines: examples/67_hopper_fp8_warp_specialized_gemm_with_blockwise_scaling/reference/host/gemm_with_groupwise_scaling.h
// Returns the maximum number of smem tiles that can be used with a given smem capacity in gemm of blockwise/groupwise scale.
88
+
template<int capacity_bytes_, class ElementA, class ElementB, class ElementBlockScale, class TileShapeMNK, int ScaleMsPerTile, int carveout_bytes_, int alignment = 128>
// Returns the maximum number of smem tiles that can be used with a given smem capacity (with an optional scale matrix), or overrides with manual count.
88
110
template<int capacity_bytes, class ElementA, class ElementB, class ElementScale, class ElementZero, class TileShapeMNK, int stages, int alignment = 128>
0 commit comments