Mojo trait
AsyncTensorAccumulator
Implemented traits
AnyType, UnknownDestructibility
Aliases
a_t
alias a_t
ab_t
alias ab_t
accum_t
alias accum_t
b_t
alias b_t
c_t
alias c_t
operand_t
alias operand_t
Methods
__init__
__init__(smem: UnsafePointer[SharedMemBarrier, address_space=AddressSpace(3), alignment=8]) -> _Self
mma_descriptors
static mma_descriptors[dtype_a: DType, dtype_b: DType](p_a: UnsafePointer[SIMD[dtype_a, 1], address_space=AddressSpace(3)], p_b: UnsafePointer[SIMD[dtype_b, 1], address_space=AddressSpace(3)]) -> _Self.ab_t
mma
mma(self: _Self, a: _Self.a_t, b: _Self.b_t, c: _Self.c_t, c_scale: SIMD[uint32, 1], wg_idx: SIMD[uint32, 1] = 0)
wait_group
wait_group[wgmma_left_in_flight: Int = 0](mut self: _Self)
Was this page helpful?
Thank you! We'll create more content like this.
Thank you for helping us improve!