warp_gemm.hpp Source File
warp_gemm.hpp
Go to the documentation of this file.
67 using WarpGemmMfmaF16F16F32M32N32K8SwizzleA = WarpGemmImpl<WarpGemmAttributeMfmaIterateK_SwizzleA<
71 using WarpGemmMfmaF16F16F32M32N32K16SwizzleA = WarpGemmImpl<WarpGemmAttributeMfmaIterateK_SwizzleA<
188 using WarpGemmMfmaBf16Bf16F32M32N32K8SwizzleA = WarpGemmImpl<WarpGemmAttributeMfmaIterateK_SwizzleA<
261 WarpGemmAttributeMfma<WarpGemmAttributeMfmaImpl_f32_32x32x16_fp8_fp8<WGAttrCtlEnum::Default_>>>;
264 WarpGemmAttributeMfma<WarpGemmAttributeMfmaImpl_f32_32x32x16_fp8_bf8<WGAttrCtlEnum::Default_>>>;
267 WarpGemmAttributeMfma<WarpGemmAttributeMfmaImpl_f32_16x16x32_fp8_bf8<WGAttrCtlEnum::Default_>>>;
270 WarpGemmAttributeMfma<WarpGemmAttributeMfmaImpl_f32_32x32x16_bf8_fp8<WGAttrCtlEnum::Default_>>>;
273 WarpGemmAttributeMfma<WarpGemmAttributeMfmaImpl_f32_32x32x16_bf8_bf8<WGAttrCtlEnum::Default_>>>;
288 WarpGemmAttributeMfma<WarpGemmAttributeMfmaImpl_f32_16x16x32_fp8_fp8<WGAttrCtlEnum::Default_>>>;
295 WarpGemmAttributeMfma<WarpGemmAttributeMfmaImpl_f32_16x16x32_bf8_bf8<WGAttrCtlEnum::Default_>>>;
311 WarpGemmAttributeMfma<WarpGemmAttributeMfmaScaleImpl_f32_16x16x128_fp4<WGAttrCtlEnum::Default_>,
Definition tile/core/algorithm/cluster_descriptor.hpp:13
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImpl_f32_16x16x128_bf8_fp8< WGAttrCtlEnum::Default_ >, AttrNumAccess > > WarpGemmMfma_f32_16x16x128_bf8_fp8
Definition warp_gemm.hpp:324
WarpGemmImpl< WarpGemmAttributeMfmaTransposedCDistribution< WarpGemmAttributeMfmaImpl_f32_32x32x16_bf8_bf8< WGAttrCtlEnum::Default_ > > > WarpGemmMfma_f32_32x32x16_bf8_bf8_CTransposed
Definition warp_gemm.hpp:389
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImpl_f32_16x16x32_bf8_bf8< WGAttrCtlEnum::Default_ > > > WarpGemmMfma_f32_16x16x32_bf8_bf8
Definition warp_gemm.hpp:294
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImpl_f32_32x32x16_fp8_fp8< WGAttrCtlEnum::Default_ > > > WarpGemmMfma_f32_32x32x16_fp8_fp8
Definition warp_gemm.hpp:260
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImplBf16Bf16F32M16N16K16< WGAttrCtlEnum::Default_ > > > WarpGemmMfmaBf16Bf16F32M16N16K16
Definition warp_gemm.hpp:159
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImpl_f32_16x16x128_fp8_fp8< WGAttrCtlEnum::Default_ >, AttrNumAccess > > WarpGemmMfma_f32_16x16x128_fp8_fp8
Definition warp_gemm.hpp:314
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImpl_f32_32x32x64_fp8_bf8< WGAttrCtlEnum::Default_ >, AttrNumAccess > > WarpGemmMfma_f32_32x32x64_fp8_bf8
Definition warp_gemm.hpp:363
WarpGemmImpl< WarpGemmAttributeMfmaIterateK< WarpGemmAttributeMfmaImpl_f32_32x32x16_fp8_fp8< WGAttrCtlEnum::Default_ >, 2 > > WarpGemmMfma_f32_32x32x32_fp8_fp8
Definition warp_gemm.hpp:275
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImpl_i32_16x16x32_i8< WGAttrCtlEnum::Default_ > > > WarpGemmMfma_i32_16x16x32_i8_i8
Definition warp_gemm.hpp:408
WarpGemmImpl< WarpGemmAttributeMfmaIterateK< WarpGemmAttributeMfmaImplBf16Bf16F32M16N16K16< WGAttrCtlEnum::Default_ >, 2, AttrNumAccess > > WarpGemmMfmaBf16Bf16F32M16N16K32
Definition warp_gemm.hpp:182
WarpGemmSmfmacImpl< WarpGemmAttributeSmfmac< WarpGemmAttributeSmfmacImplF16F16F32M16N16K32< WGAttrCtlEnum::Default_ > > > WarpGemmSmfmacF16F16F32M16N16K32
Definition warp_gemm.hpp:152
WarpGemmImpl< WarpGemmAttributeMfmaIterateK< WarpGemmAttributeMfmaImplF16F16F32M4N64K4< WGAttrCtlEnum::Default_ >, 4 > > WarpGemmMfmaF16F16F32M4N64K16
Definition warp_gemm.hpp:140
WarpGemmImpl< WarpGemmAttributeMfmaTransposedCDistribution< WarpGemmAttributeMfmaImpl_i32_16x16x32_i8< WGAttrCtlEnum::Default_ > > > WarpGemmMfma_i32_16x16x32_i8_i8_CTransposed
Definition warp_gemm.hpp:411
WarpGemmImpl< WarpGemmAttributeMfmaTransposedCDistribution< WarpGemmAttributeMfmaImpl_i32_32x32x16_i8< WGAttrCtlEnum::Default_ > > > WarpGemmMfma_i32_32x32x16_i8_i8_CTransposed
Definition warp_gemm.hpp:404
WarpGemmImpl< WarpGemmAttributeMfmaTransposedCDistribution< WarpGemmAttributeMfmaImpl_f32_16x16x32_fp8_fp8< WGAttrCtlEnum::Default_ > > > WarpGemmMfma_f32_16x16x32_fp8_fp8_CTransposed
Definition warp_gemm.hpp:290
WarpGemmImpl< WarpGemmAttributeMfmaTransposedCDistribution< WarpGemmAttributeMfmaImplBf16Bf16F32M32N32K8< WGAttrCtlEnum::Default_ > > > WarpGemmMfmaBf16Bf16F32M32N32K8TransposedCDistribution
Definition warp_gemm.hpp:197
WarpGemmAttributeMfmaImpl_f32_32x32x16_f8_base< fp8_t, bf8_t, Ctrl_ > WarpGemmAttributeMfmaImpl_f32_32x32x16_fp8_bf8
Definition warp_gemm_attribute_mfma_impl.hpp:1511
WarpGemmImpl< WarpGemmAttributeMfmaIterateK< WarpGemmAttributeMfmaImplBf16Bf16F32M4N64K4< WGAttrCtlEnum::Default_ >, 4 > > WarpGemmMfmaBf16Bf16F32M4N64K16
Definition warp_gemm.hpp:250
WarpGemmAttributeMfmaImpl_f32_32x32x16_f8_base< bf8_t, bf8_t, Ctrl_ > WarpGemmAttributeMfmaImpl_f32_32x32x16_bf8_bf8
Definition warp_gemm_attribute_mfma_impl.hpp:1526
WarpGemmAttributeMfmaImpl_f32_32x32x16_f8_base< fp8_t, fp8_t, Ctrl_ > WarpGemmAttributeMfmaImpl_f32_32x32x16_fp8_fp8
Definition warp_gemm_attribute_mfma_impl.hpp:1505
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaScaleImpl_f32_16x16x128_fp4< WGAttrCtlEnum::Default_ >, AttrNumAccess > > WarpGemmMfma_f32_16x16x128_fp4
Definition warp_gemm.hpp:310
WarpGemmImpl< WarpGemmAttributeMfmaTransposedCDistribution< WarpGemmAttributeMfmaImpl_f32_16x16x32_bf8_bf8< WGAttrCtlEnum::Default_ > > > WarpGemmMfma_f32_16x16x32_bf8_bf8_CTransposed
Definition warp_gemm.hpp:297
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImplF16F16F32M16N16K16< WGAttrCtlEnum::Default_ > > > WarpGemmMfmaF16F16F32M16N16K16
Definition warp_gemm.hpp:38
WarpGemmImpl< WarpGemmAttributeMfmaTransposedCDistribution_SwizzleB< WarpGemmAttributeMfmaImplBf16Bf16F32M32N32K8< WGAttrCtlEnum::Default_ > > > WarpGemmMfmaBf16Bf16F32M32N32K8SwizzleBTransposedCDistribution
Definition warp_gemm.hpp:235
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImpl_f32_32x32x64_fp8_fp8< WGAttrCtlEnum::Default_ >, AttrNumAccess > > WarpGemmMfma_f32_32x32x64_fp8_fp8
Definition warp_gemm.hpp:358
WarpGemmImpl< WarpGemmAttributeMfmaTransposedCDistribution< WarpGemmAttributeMfmaImpl_f32_32x32x16_fp8_fp8< WGAttrCtlEnum::Default_ > > > WarpGemmMfma_f32_32x32x16_fp8_fp8_CTransposed
Definition warp_gemm.hpp:377
WarpGemmImpl< WarpGemmAttributeMfmaIterateK< WarpGemmAttributeMfmaImpl_f32_32x32x16_fp8_bf8< WGAttrCtlEnum::Default_ >, 2 > > WarpGemmMfma_f32_32x32x32_fp8_bf8
Definition warp_gemm.hpp:283
WarpGemmImpl< WarpGemmAttributeMfmaIterateK< WarpGemmAttributeMfmaImplF16F16F32M64N4K4< WGAttrCtlEnum::Default_ >, 4 > > WarpGemmMfmaF16F16F32M64N4K16
Definition warp_gemm.hpp:144
WarpGemmAttributeMfmaImpl_f32_16x16x32_f8_base< fp8_t, fp8_t, Ctrl_ > WarpGemmAttributeMfmaImpl_f32_16x16x32_fp8_fp8
Definition warp_gemm_attribute_mfma_impl.hpp:1508
WarpGemmImpl< WarpGemmAttributeMfmaIterateK< WarpGemmAttributeMfmaImplBf16Bf16F32M64N4K4< WGAttrCtlEnum::Default_ >, 4 > > WarpGemmMfmaBf16Bf16F32M64N4K16
Definition warp_gemm.hpp:254
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImpl_f32_16x16x32_fp8_fp8< WGAttrCtlEnum::Default_ > > > WarpGemmMfma_f32_16x16x32_fp8_fp8
Definition warp_gemm.hpp:287
WarpGemmImpl< WarpGemmAttributeMfmaIterateK< WarpGemmAttributeMfmaImplF16F16F32M32N32K8< WGAttrCtlEnum::Default_ >, 2, AttrNumAccess > > WarpGemmMfmaF16F16F32M32N32K16
Definition warp_gemm.hpp:48
WarpGemmImpl< WarpGemmAttributeMfmaIterateK< WarpGemmAttributeMfmaImplF16F16F32M16N16K16< WGAttrCtlEnum::Default_ >, 2, AttrNumAccess > > WarpGemmMfmaF16F16F32M16N16K32
Definition warp_gemm.hpp:61
WarpGemmImpl< WarpGemmAttributeMfmaIterateK< WarpGemmAttributeMfmaImplBf16Bf16F32M32N32K8< WGAttrCtlEnum::Default_ >, 2, AttrNumAccess > > WarpGemmMfmaBf16Bf16F32M32N32K16
Definition warp_gemm.hpp:169
WarpGemmImpl< WarpGemmAttributeMfmaIterateKAndTransposedCDistribution_SwizzleB< WarpGemmAttributeMfmaImplF16F16F32M32N32K8< WGAttrCtlEnum::Default_ >, 2 > > WarpGemmMfmaF16F16F32M32N32K16SwizzleBTransposedCDistribution
Definition warp_gemm.hpp:134
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImpl_f32_16x16x128_bf8_bf8< WGAttrCtlEnum::Default_ >, AttrNumAccess > > WarpGemmMfma_f32_16x16x128_bf8_bf8
Definition warp_gemm.hpp:329
WarpGemmImpl< WarpGemmAttributeMfmaTransposedCDistribution< WarpGemmAttributeMfmaImplBf16Bf16F32M16N16K16< WGAttrCtlEnum::Default_ > > > WarpGemmMfmaBf16Bf16F32M16N16K16TransposedCDistribution
Definition warp_gemm.hpp:201
WarpGemmImpl< WarpGemmAttributeMfmaIterateK_SwizzleA< WarpGemmAttributeMfmaImplBf16Bf16F32M32N32K8< WGAttrCtlEnum::Default_ >, 2 > > WarpGemmMfmaBf16Bf16F32M32N32K16SwizzleA
Definition warp_gemm.hpp:192
WarpGemmImpl< WarpGemmAttributeMfmaTransposedCDistribution< WarpGemmAttributeMfmaImpl_f32_16x16x128_fp8_fp8< WGAttrCtlEnum::Default_ >, AttrNumAccess > > WarpGemmMfma_f32_16x16x128_fp8_fp8_CTransposed
Definition warp_gemm.hpp:334
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImpl_f32_32x32x64_bf8_fp8< WGAttrCtlEnum::Default_ >, AttrNumAccess > > WarpGemmMfma_f32_32x32x64_bf8_fp8
Definition warp_gemm.hpp:368
WarpGemmImpl< WarpGemmAttributeMfmaTransposedCDistribution< WarpGemmAttributeMfmaImplF16F16F32M16N16K16< WGAttrCtlEnum::Default_ > > > WarpGemmMfmaF16F16F32M16N16K16TransposedCDistribution
Definition warp_gemm.hpp:79
WarpGemmImpl< WarpGemmAttributeMfmaIterateKAndTransposedCDistribution< WarpGemmAttributeMfmaImplF16F16F32M32N32K8< WGAttrCtlEnum::Default_ >, 2, AttrNumAccess > > WarpGemmMfmaF16F16F32M32N32K16TransposedCDistribution
Definition warp_gemm.hpp:91
WarpGemmAttributeMfmaImpl_f32_16x16x128_f8_bf8_base< fp8_t, bf8_t, Ctrl_ > WarpGemmAttributeMfmaImpl_f32_16x16x128_fp8_bf8
Definition warp_gemm_attribute_mfma_impl.hpp:1616
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImplBf16Bf16F32M32N32K8< WGAttrCtlEnum::Default_ > > > WarpGemmMfmaBf16Bf16F32M32N32K8
Definition warp_gemm.hpp:156
WarpGemmImpl< WarpGemmAttributeMfmaIterateK_SwizzleA< WarpGemmAttributeMfmaImplF16F16F32M32N32K8< WGAttrCtlEnum::Default_ >, 2 > > WarpGemmMfmaF16F16F32M32N32K16SwizzleA
Definition warp_gemm.hpp:71
WarpGemmImpl< WarpGemmAttributeMfmaIterateK< WarpGemmAttributeMfmaImpl_f32_32x32x16_bf8_bf8< WGAttrCtlEnum::Default_ >, 2 > > WarpGemmMfma_f32_32x32x32_bf8_bf8
Definition warp_gemm.hpp:279
WarpGemmImpl< WarpGemmAttributeMfmaIterateK< WarpGemmAttributeMfmaImpl_f32_16x16x32_bf8_bf8< WGAttrCtlEnum::Default_ >, 2 > > WarpGemmMfma_f32_16x16x64_bf8_bf8
Definition warp_gemm.hpp:305
WarpGemmImpl< WarpGemmAttributeMfmaIterateKAndTransposedCDistribution_SwizzleB< WarpGemmAttributeMfmaImplBf16Bf16F32M32N32K8< WGAttrCtlEnum::Default_ >, 2 > > WarpGemmMfmaBf16Bf16F32M32N32K16SwizzleBTransposedCDistribution
Definition warp_gemm.hpp:244
WarpGemmAttributeMfmaImpl_f32_16x16x128_f8_bf8_base< bf8_t, bf8_t, Ctrl_ > WarpGemmAttributeMfmaImpl_f32_16x16x128_bf8_bf8
Definition warp_gemm_attribute_mfma_impl.hpp:1624
WarpGemmImpl< WarpGemmAttributeMfmaIterateK_SwizzleA< WarpGemmAttributeMfmaImplF16F16F32M32N32K8< WGAttrCtlEnum::Default_ >, 1 > > WarpGemmMfmaF16F16F32M32N32K8SwizzleA
Definition warp_gemm.hpp:67
WarpGemmImpl< WarpGemmAttributeMfmaIterateKAndTransposedCDistribution< WarpGemmAttributeMfmaImplBf16Bf16F32M16N16K16< WGAttrCtlEnum::Default_ >, 2, AttrNumAccess > > WarpGemmMfmaBf16Bf16F32M16N16K32TransposedCDistribution
Definition warp_gemm.hpp:228
WarpGemmSmfmacImpl< WarpGemmAttributeSmfmac< WarpGemmAttributeSmfmacImplF16F16F32M32N32K16< WGAttrCtlEnum::Default_ > > > WarpGemmSmfmacF16F16F32M32N32K16
Definition warp_gemm.hpp:149
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImpl_f32_32x32x64_bf8_bf8< WGAttrCtlEnum::Default_ >, AttrNumAccess > > WarpGemmMfma_f32_32x32x64_bf8_bf8
Definition warp_gemm.hpp:373
WarpGemmAttributeMfmaImpl_f32_32x32x16_f8_base< bf8_t, fp8_t, Ctrl_ > WarpGemmAttributeMfmaImpl_f32_32x32x16_bf8_fp8
Definition warp_gemm_attribute_mfma_impl.hpp:1522
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImpl_f32_16x16x32_fp8_bf8< WGAttrCtlEnum::Default_ > > > WarpGemmMfma_f32_16x16x32_fp8_bf8
Definition warp_gemm.hpp:266
WarpGemmImpl< WarpGemmAttributeMfmaIterateKAndTransposedCDistribution< WarpGemmAttributeMfmaImplF32F32F32M16N16K4< WGAttrCtlEnum::Default_ >, 4, AttrNumAccess > > WarpGemmMfmaF32F32F32M16N16K16TransposedCDistribution
Definition warp_gemm.hpp:27
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImplF16F16F32M32N32K8< WGAttrCtlEnum::Default_ > > > WarpGemmMfmaF16F16F32M32N32K8
Definition warp_gemm.hpp:35
WarpGemmImpl< WarpGemmAttributeMfmaIterateKAndTransposedCDistribution< WarpGemmAttributeMfmaImplBf16Bf16F32M32N32K8< WGAttrCtlEnum::Default_ >, 2, AttrNumAccess > > WarpGemmMfmaBf16Bf16F32M32N32K16TransposedCDistribution
Definition warp_gemm.hpp:213
WarpGemmImpl< WarpGemmAttributeMfmaTransposedCDistribution_SwizzleB< WarpGemmAttributeMfmaImplF16F16F32M32N32K8< WGAttrCtlEnum::Default_ > > > WarpGemmMfmaF16F16F32M32N32K8SwizzleBTransposedCDistribution
Definition warp_gemm.hpp:125
WarpGemmAttributeMfmaImpl_f32_16x16x128_f8_bf8_base< fp8_t, fp8_t, Ctrl_ > WarpGemmAttributeMfmaImpl_f32_16x16x128_fp8_fp8
Definition warp_gemm_attribute_mfma_impl.hpp:1612
WarpGemmImpl< WarpGemmAttributeMfmaIterateKAndTransposedCDistribution< WarpGemmAttributeMfmaImplF16F16F32M16N16K16< WGAttrCtlEnum::Default_ >, 2, AttrNumAccess > > WarpGemmMfmaF16F16F32M16N16K32TransposedCDistribution
Definition warp_gemm.hpp:106
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImplF32F32F32M16N16K4< WGAttrCtlEnum::Default_ > > > WarpGemmMfmaF32F32F32M16N16K4
Definition warp_gemm.hpp:17
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImpl_f32_16x16x128_fp8_bf8< WGAttrCtlEnum::Default_ >, AttrNumAccess > > WarpGemmMfma_f32_16x16x128_fp8_bf8
Definition warp_gemm.hpp:319
WarpGemmImpl< WarpGemmAttributeMfmaTransposedCDistribution< WarpGemmAttributeMfmaImpl_f32_16x16x128_bf8_fp8< WGAttrCtlEnum::Default_ >, AttrNumAccess > > WarpGemmMfma_f32_16x16x128_bf8_fp8_CTransposed
Definition warp_gemm.hpp:346
WarpGemmAttributeMfmaImpl_f32_16x16x128_f8_bf8_base< bf8_t, fp8_t, Ctrl_ > WarpGemmAttributeMfmaImpl_f32_16x16x128_bf8_fp8
Definition warp_gemm_attribute_mfma_impl.hpp:1620
WarpGemmImpl< WarpGemmAttributeMfmaTransposedCDistribution< WarpGemmAttributeMfmaImpl_f32_16x16x128_fp8_bf8< WGAttrCtlEnum::Default_ >, AttrNumAccess > > WarpGemmMfma_f32_16x16x128_fp8_bf8_CTransposed
Definition warp_gemm.hpp:340
WarpGemmImpl< WarpGemmAttributeMfmaTransposedCDistribution< WarpGemmAttributeMfmaImpl_f32_32x32x16_fp8_bf8< WGAttrCtlEnum::Default_ > > > WarpGemmMfma_f32_32x32x16_fp8_bf8_CTransposed
Definition warp_gemm.hpp:381
WarpGemmImpl< WarpGemmAttributeMfmaIterateK_SwizzleA< WarpGemmAttributeMfmaImplBf16Bf16F32M32N32K8< WGAttrCtlEnum::Default_ >, 1 > > WarpGemmMfmaBf16Bf16F32M32N32K8SwizzleA
Definition warp_gemm.hpp:188
WarpGemmImpl< WarpGemmAttributeMfmaTransposedCDistribution< WarpGemmAttributeMfmaImplF16F16F32M32N32K8< WGAttrCtlEnum::Default_ > > > WarpGemmMfmaF16F16F32M32N32K8TransposedCDistribution
Definition warp_gemm.hpp:75
WarpGemmImpl< WarpGemmAttributeMfmaIterateK< WarpGemmAttributeMfmaImplF32F32F32M16N16K4< WGAttrCtlEnum::Default_ >, 4, AttrNumAccess > > WarpGemmMfmaF32F32F32M16N16K16
Definition warp_gemm.hpp:21
WarpGemmImpl< WarpGemmAttributeMfmaTransposedCDistribution< WarpGemmAttributeMfmaImpl_f32_32x32x16_bf8_fp8< WGAttrCtlEnum::Default_ > > > WarpGemmMfma_f32_32x32x16_bf8_fp8_CTransposed
Definition warp_gemm.hpp:385
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImpl_i32_32x32x16_i8< WGAttrCtlEnum::Default_ > > > WarpGemmMfma_i32_32x32x16_i8_i8
Definition warp_gemm.hpp:401
WarpGemmAttributeMfmaImpl_f32_16x16x32_f8_base< bf8_t, bf8_t, Ctrl_ > WarpGemmAttributeMfmaImpl_f32_16x16x32_bf8_bf8
Definition warp_gemm_attribute_mfma_impl.hpp:1518
WarpGemmImpl< WarpGemmAttributeMfmaIterateK< WarpGemmAttributeMfmaImpl_f32_16x16x32_fp8_fp8< WGAttrCtlEnum::Default_ >, 2 > > WarpGemmMfma_f32_16x16x64_fp8_fp8
Definition warp_gemm.hpp:301
WarpGemmImpl< WarpGemmAttributeMfmaTransposedCDistribution< WarpGemmAttributeMfmaImpl_f32_16x16x128_bf8_bf8< WGAttrCtlEnum::Default_ >, AttrNumAccess > > WarpGemmMfma_f32_16x16x128_bf8_bf8_CTransposed
Definition warp_gemm.hpp:352
WarpGemmImpl< WarpGemmAttributeMfmaIterateKAndTransposedCDistribution_SwizzleB< WarpGemmAttributeMfmaImpl_f32_32x32x16_fp8_fp8< WGAttrCtlEnum::Default_ >, 2, swizzle_factor > > WarpGemmMfmaFp8Fp8F32M32N32K32SwizzleBTransposedCDistribution
Definition warp_gemm.hpp:394
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImpl_f32_32x32x16_fp8_bf8< WGAttrCtlEnum::Default_ > > > WarpGemmMfma_f32_32x32x16_fp8_bf8
Definition warp_gemm.hpp:263
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImpl_f32_32x32x16_bf8_bf8< WGAttrCtlEnum::Default_ > > > WarpGemmMfma_f32_32x32x16_bf8_bf8
Definition warp_gemm.hpp:272
WarpGemmImpl< WarpGemmAttributeMfma< WarpGemmAttributeMfmaImpl_f32_32x32x16_bf8_fp8< WGAttrCtlEnum::Default_ > > > WarpGemmMfma_f32_32x32x16_bf8_fp8
Definition warp_gemm.hpp:269
Definition warp_gemm_attribute_mfma.hpp:23
Definition warp_gemm_attribute_mfma_impl.hpp:1890
Definition warp_gemm_attribute_mfma_impl.hpp:1820
Definition warp_gemm_attribute_mfma_impl.hpp:666
Definition warp_gemm_attribute_mfma_impl.hpp:196
Definition warp_gemm_attribute_mfma_impl.hpp:1049
Definition warp_gemm_attribute_mfma_impl.hpp:577
Definition warp_gemm_attribute_mfma_impl.hpp:754
Definition warp_gemm_attribute_mfma_impl.hpp:844
Definition warp_gemm_attribute_mfma_impl.hpp:322
Definition warp_gemm_attribute_mfma_impl.hpp:385
Definition warp_gemm_attribute_mfma_impl.hpp:935
Definition warp_gemm_attribute_mfma_impl.hpp:259
Definition warp_gemm_attribute_mfma_impl.hpp:448
Definition warp_gemm_attribute_mfma_impl.hpp:512
Definition warp_gemm_attribute_mfma_impl.hpp:67
Definition warp_gemm_attribute_mfma.hpp:869
Definition warp_gemm_attribute_mfma.hpp:725
Definition warp_gemm_attribute_mfma.hpp:575
Definition warp_gemm_attribute_mfma.hpp:130
Definition warp_gemm_attribute_mfma.hpp:479
Definition warp_gemm_attribute_mfma.hpp:395
Class describing structured sparsity mfma instructions.
Definition warp_gemm_attribute_smfmac.hpp:26
Definition warp_gemm_attribute_smfmac_impl.hpp:65
Definition warp_gemm_attribute_smfmac_impl.hpp:14
Definition warp_gemm_impl.hpp:11
Definition warp_gemm_smfmac_impl.hpp:11