Mojo struct
AMDStructuredConfig
struct AMDStructuredConfig[config: MHAConfig[config.dtype], group: Int, token_gen: Bool = False, mla_mode: Bool = False]
Implemented traits
AnyType,
Copyable,
ImplicitlyCopyable,
ImplicitlyDestructible,
Movable
comptime members
depth_padded
comptime depth_padded = False
double_buffer
comptime double_buffer = not token_gen
double_buffer_k_only
comptime double_buffer_k_only = token_gen and (config.block_n() <= 64)
full_kv
comptime full_kv = True
shared_kv
comptime shared_kv = token_gen and (config > 256)
Methods
q_head_idx
q_tile_idx
kv_head_idx
get_mma_shape
get_q_offset
get_output_offset
Was this page helpful?
Thank you! We'll create more content like this.
Thank you for helping us improve!