Mojo struct
MHAAttentionConfig
struct MHAAttentionConfig[token_gen: Bool, config: MHAConfig[config.dtype], group: Int]
Implemented traits
AnyType,
AttentionConfig,
Copyable,
ImplicitlyCopyable,
ImplicitlyDestructible,
Movable
comptime members
depth_padded
comptime depth_padded = False
double_buffer
comptime double_buffer = not token_gen
double_buffer_k_only
comptime double_buffer_k_only = token_gen and (config.block_n() <= 64)
full_kv
comptime full_kv = True
shared_kv
comptime shared_kv = token_gen and (config.depth > 256)
Methods
q_head_idx
q_tile_idx
kv_head_idx
get_mma_shape
get_q_offset
get_output_offset
Was this page helpful?
Thank you! We'll create more content like this.
Thank you for helping us improve!