diff --git a/examples/language-modeling/main.py b/examples/language-modeling/main.py index 8af4bbdc..588aa68a 100644 --- a/examples/language-modeling/main.py +++ b/examples/language-modeling/main.py @@ -329,7 +329,7 @@ def get_library_version(library_name): compression_dtype=torch.int8, compression_dim=0, use_optimum_format=False, device="xpu") if "cpu" in deployment_device: - autoround.save_quantized(output_dir=f'{export_dir}-cpu', format='itrex', inplace=inplace) + autoround.save_quantized(output_dir=f'{export_dir}-cpu', format='auto_round', inplace=inplace) if "fake" in deployment_device: model = model.to("cpu") model.save_pretrained(output_dir)