From eff649762eb19fa22b1144ec5dae19f99319ad0e Mon Sep 17 00:00:00 2001
From: Uri Livne
Date: Thu, 26 Dec 2024 14:46:42 +0200
Subject: [PATCH] [SW-214428] Added quant config files for Naver scenarios (#92)

---
 .../text-generation/quantization_config/pow2_quant.json | 7 +++++++
 .../quantization_config/weight_opt_quant.json           | 7 +++++++
 2 files changed, 14 insertions(+)
 create mode 100644 examples/text-generation/quantization_config/pow2_quant.json
 create mode 100644 examples/text-generation/quantization_config/weight_opt_quant.json

diff --git a/examples/text-generation/quantization_config/pow2_quant.json b/examples/text-generation/quantization_config/pow2_quant.json
new file mode 100644
index 0000000000..e1f2eb1c6e
--- /dev/null
+++ b/examples/text-generation/quantization_config/pow2_quant.json
@@ -0,0 +1,7 @@
+{
+    "method": "HOOKS",
+    "mode": "QUANTIZE",
+    "observer": "maxabs",
+    "scale_method": "maxabs_pow2",
+    "dump_stats_path": "./hqt_output/measure"
+}
diff --git a/examples/text-generation/quantization_config/weight_opt_quant.json b/examples/text-generation/quantization_config/weight_opt_quant.json
new file mode 100644
index 0000000000..1ec2dc6b6a
--- /dev/null
+++ b/examples/text-generation/quantization_config/weight_opt_quant.json
@@ -0,0 +1,7 @@
+{
+    "method": "HOOKS",
+    "mode": "QUANTIZE",
+    "observer": "maxabs",
+    "scale_method": "maxabs_hw_opt_weight",
+    "dump_stats_path": "./hqt_output/measure"
+}