From 4b748716fff3426d572f7864ed6bed630bebfdb8 Mon Sep 17 00:00:00 2001 From: shanjiaz Date: Tue, 15 Apr 2025 14:47:03 -0400 Subject: [PATCH 1/2] update default observer to be mse --- src/compressed_tensors/quantization/quant_args.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/compressed_tensors/quantization/quant_args.py b/src/compressed_tensors/quantization/quant_args.py index 69c289d2..46f41af6 100644 --- a/src/compressed_tensors/quantization/quant_args.py +++ b/src/compressed_tensors/quantization/quant_args.py @@ -225,7 +225,7 @@ def validate_model_after(model: "QuantizationArgs") -> Dict[str, Any]: elif observer is None: # default to minmax for non-dynamic cases - observer = "minmax" + observer = "mse" # write back modified values model.strategy = strategy From 9aed941b0dd8bbf04c18a5704b864dc4f64abced Mon Sep 17 00:00:00 2001 From: shanjiaz <43143795+shanjiaz@users.noreply.github.com> Date: Tue, 15 Apr 2025 16:14:19 -0400 Subject: [PATCH 2/2] Update src/compressed_tensors/quantization/quant_args.py Co-authored-by: Brian Dellabetta --- src/compressed_tensors/quantization/quant_args.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/compressed_tensors/quantization/quant_args.py b/src/compressed_tensors/quantization/quant_args.py index 46f41af6..211e3e92 100644 --- a/src/compressed_tensors/quantization/quant_args.py +++ b/src/compressed_tensors/quantization/quant_args.py @@ -224,7 +224,7 @@ def validate_model_after(model: "QuantizationArgs") -> Dict[str, Any]: observer = None elif observer is None: - # default to minmax for non-dynamic cases + # default to mse for non-dynamic cases observer = "mse" # write back modified values