Mojo struct
DecodeSM100TensorAccumulatorSS
@register_passable("trivial")
struct DecodeSM100TensorAccumulatorSS[operand_type: DType, accum_type: DType, *, config: MLA_SM100_Decode_Config]
Implemented traits
AnyType,
Copyable,
ImplicitlyCopyable,
ImplicitlyDestructible,
Movable
comptime members
__copyinit__is_trivial
comptime __copyinit__is_trivial = True
__del__is_trivial
comptime __del__is_trivial = True
__moveinit__is_trivial
comptime __moveinit__is_trivial = True
a_swizzle
comptime a_swizzle = config.swizzle_mode
b_swizzle
comptime b_swizzle = config.kv_swizzle_mode
BK
comptime BK = config.BN
BM
comptime BM = config.BM
BN
comptime BN = config.BN
MMA_K
comptime MMA_K = MLA_SM100_Decode_Config.MMA_K
MMA_M
comptime MMA_M = config.BM
MMA_N
comptime MMA_N = config.BN
num_k_mmas
comptime num_k_mmas = (DecodeSM100TensorAccumulatorSS[operand_type, accum_type, config=config].BK // 16)
O_M
comptime O_M = (config * 2)
O_N
comptime O_N = (config // 2)
operand_size
comptime operand_size = size_of[operand_type]()
S_M
comptime S_M = (config * 2)
S_N
comptime S_N = (config // 2)
Was this page helpful?
Thank you! We'll create more content like this.
Thank you for helping us improve!