Mojo function

grouped_matmul_amd_kernel_launcher

grouped_matmul_amd_kernel_launcher[c_type: DType, a_type: DType, b_type: DType, LayoutC: TensorLayout, LayoutA: TensorLayout, LayoutB: TensorLayout, AOffsetsLayout: TensorLayout, ExpertIdsLayout: TensorLayout, transpose_b: Bool, config: MatmulConfig[a_type, b_type, c_type, transpose_b], elementwise_lambda_fn: Optional[elementwise_epilogue_type] = None](c_tensor: TileTensor[c_type, LayoutC, MutAnyOrigin], a_tensor: TileTensor[a_type, LayoutA, MutAnyOrigin], b_tensor: TileTensor[b_type, LayoutB, MutAnyOrigin], a_offsets: TileTensor[DType.uint32, AOffsetsLayout, ImmutAnyOrigin], expert_ids: TileTensor[DType.int32, ExpertIdsLayout, ImmutAnyOrigin], num_active_experts: Int)