from dequantize_utils import torch_convert_bit_twiddling, torch_convert def _tir_u8_to_f4_to_bf16(nbit: int, val: tirx.PrimExpr, pos: tirx.PrimExpr, scale: tirx.PrimExpr, dtype: str): Convert a 4-bit ...