For the complete documentation index, see llms.txt. Markdown versions of all pages are available by appending .md to any URL (e.g. /max/get-started.md).

Mojo function

promote_accumulators

def promote_accumulators[pipeline_stages: Int, num_accum_pipeline_stages: Int, accum_type: DType, accum_layout: TensorLayout, a_scales_type: DType, b_scales_type: DType, b_scales_layout: TensorLayout, /, *, block_tile_shape: IndexList[Int(3)], mma_shape: IndexList[Int(3)], cta_group: Int, CLUSTER_SIZE: Int32, is_lower_frag_required: Bool, num_output_warps: Int](b_scales: TileTensor[b_scales_type, b_scales_layout, Storage=b_scales.Storage, address_space=b_scales.address_space, linear_idx_type=b_scales.linear_idx_type, element_size=b_scales.element_size], a_scales_smem_tiles: SMemTileArray2DRowMajor[a_scales_type], c_upper_main_tile: TileTensor[accum_type, accum_layout, Storage=c_upper_main_tile.Storage, address_space=AddressSpace.LOCAL, linear_idx_type=c_upper_main_tile.linear_idx_type, element_size=c_upper_main_tile.element_size], c_lower_main_tile: TileTensor[accum_type, accum_layout, Storage=c_lower_main_tile.Storage, address_space=AddressSpace.LOCAL, linear_idx_type=c_lower_main_tile.linear_idx_type, element_size=c_lower_main_tile.element_size], mma_output_pipeline: ProducerConsumerPipeline[num_accum_pipeline_stages], tmem_addr: UInt32, load_mma_pipeline: ProducerConsumerPipeline[pipeline_stages], work_tile_coord: Tuple[Int, Int], elect_one_warp: Bool, stage_stride_cols: Int, k_iter: Int, problem_shape: StaticTuple[Int32, Int(3)])