Skip to content

Instantly share code, notes, and snippets.

@mlazos
Created May 12, 2025 21:34
Show Gist options
  • Save mlazos/f99205fdcf4c76116078210d3972acc6 to your computer and use it in GitHub Desktop.
Save mlazos/f99205fdcf4c76116078210d3972acc6 to your computer and use it in GitHub Desktop.
using Accum = cutlass::epilogue::fusion::Sm90AccFetch;
using ElementD = cutlass::half_t;
using StrideD = cute::Stride<int64_t, cute::Int<1>, cute::Int<0>>;
using Bias = cutlass::epilogue::fusion::Sm90ColBroadcast<
0 /*Stages*/, typename EpilogueDescriptor::TileShape, cutlass::half_t, cutlass::half_t,
cute::Stride<cute::Int<1>, cute::Int<0>, cute::Int<0>>
>;
using Compute0 = cutlass::epilogue::fusion::Sm90Compute<
cutlass::plus, float, float,
cutlass::FloatRoundStyle::round_to_nearest
>;
using EVTCompute0 = cutlass::epilogue::fusion::Sm90EVT<
Compute0,
EVTD,
Bias>;
using EDescriptor = cutlass::epilogue::collective::detail::AuxStoreDescriptor<
EpilogueDescriptor, cute::Stride<int64_t, cute::Int<1>, cute::Int<0>>, cutlass::half_t
>;
using E = cutlass::epilogue::fusion::Sm90AuxStore<
EDescriptor::Stages, typename EDescriptor::EpilogueTile, cutlass::half_t,
cutlass::FloatRoundStyle::round_to_nearest, cute::Stride<int64_t, cute::Int<1>, cute::Int<0>>, typename EDescriptor::SmemLayoutAtom,
typename EDescriptor::CopyOpR2S
>;
using EVTE = cutlass::epilogue::fusion::Sm90EVT<
E,
EVTCompute0>;
using ElementC = void;
using StrideC = StrideD;
Accum
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment