Mojo struct
MMAConfig
struct MMAConfig[InType: DType, OutType: DType, mma_shape: IndexList[3], transpose_b: Bool = True]
Implemented traits
AnyType,
Copyable,
ImplicitlyCopyable,
ImplicitlyDestructible,
Movable,
RegisterPassable,
TrivialRegisterPassable
comptime members
k_group_size_a
comptime k_group_size_a = (MMAConfig[InType, OutType, mma_shape, transpose_b].simd_width // MMAConfig[InType, OutType, mma_shape, transpose_b].registers_per_thread_a)
k_group_size_b
comptime k_group_size_b = (MMAConfig[InType, OutType, mma_shape, transpose_b].simd_width // MMAConfig[InType, OutType, mma_shape, transpose_b].registers_per_thread_b)
mma
comptime mma = TensorCore()
registers_per_thread_a
comptime registers_per_thread_a = num_matrix_reg[mma_shape[0], mma_shape[2]]()
registers_per_thread_b
comptime registers_per_thread_b = num_matrix_reg[mma_shape[1], mma_shape[2]]()
simd_width
comptime simd_width = simd_width_of[InType]()
Methods
adjusted_mma_k_shape_a
adjusted_mma_k_shape_b
Was this page helpful?
Thank you! We'll create more content like this.
Thank you for helping us improve!