For the complete documentation index, see llms.txt. Markdown versions of all pages are available by appending .md to any URL (e.g. /max/get-started.md).

Mojo function

print_kv_cache_paged_generic_gpu

```mojo
def print_kv_cache_paged_generic_gpu[
    target: StringSlice[StaticConstantOrigin],
    dtype: DType,
    kv_params: KVCacheStaticParams,
    page_size: Int,
](
    valid_lengths: LayoutTensor[
        DType.uint32,
        element_layout=valid_lengths.element_layout,
        layout_int_type=valid_lengths.layout_int_type,
        linear_idx_type=valid_lengths.linear_idx_type,
        masked=valid_lengths.masked,
        alignment=valid_lengths.alignment,
    ],
    kv_collection: PagedKVCacheCollection[
        dtype,
        kv_params,
        page_size,
        scale_dtype_=kv_collection.scale_dtype_,
        quantization_granularity_=kv_collection.quantization_granularity_,
    ],
    layer_idx: UInt32,
    is_print_compact: Bool,
    context: DeviceContext,
)
```