Skip to content
Merged
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Previous commit
Next commit
update int4 usage
Signed-off-by: Kaihui-intel <[email protected]>
  • Loading branch information
Kaihui-intel committed Jul 22, 2024
commit e538a63110b71c303bcceef265b7acaeed9df5f2
9 changes: 7 additions & 2 deletions neural_compressor/torch/quantization/algorithm_entry.py
Original file line number Diff line number Diff line change
Expand Up @@ -567,9 +567,14 @@ def autoround_quantize_entry(
 if quant_config.name != AUTOROUND or quant_config.dtype == "fp32":
 continue
 else:
+dtype = quant_config.dtype
+bits = quant_config.bits
+if dtype != "int" and "int" in dtype:
+bits = int(dtype.lstrip("int"))
+dtype = "int"
 weight_config[op_name] = {
-"data_type": quant_config.dtype,
-"bits": quant_config.bits,
+"data_type": dtype,
+"bits": bits,
 "sym": quant_config.use_sym,
 "group_size": quant_config.group_size,
 "act_bits": quant_config.act_bits,
Expand Down