Mojo struct
AMDStructuredConfig
struct AMDStructuredConfig[config: MHAConfig[config.dtype], group: Int, token_gen: Bool = False, mla_mode: Bool = False]
Implemented traits
AnyType,
Copyable,
ImplicitlyCopyable,
ImplicitlyDestructible,
Movable
comptime members
depth_padded
comptime depth_padded = False
double_buffer
comptime double_buffer = not token_gen
double_buffer_k_only
comptime double_buffer_k_only = token_gen and (config.block_n() <= 64)
full_kv
comptime full_kv = True
shared_kv
comptime shared_kv = token_gen and (config > 256)
Methods
q_head_idx
q_tile_idx
kv_head_idx
get_mma_shape
get_q_offset
get_output_offset
Was this page helpful?
Thank you! We'll create more content like this.
Thank you for helping us improve!