OPEA
/

DeepSeek-V2.5-1210-int4-sym-inc

4-bit precision

intel/auto-round

Model card · Files and versions · Community

wenhuach committed on Dec 30, 2024

Commit

2a9d75b

·

1 Parent(s): 16af7a2

autoround format

Signed-off-by: wenhuach <[email protected]>

Files changed (1) hide show

config.json +4 -5

config.json CHANGED Viewed

@@ -39,11 +39,11 @@
   "quantization_config": {
     "amp": true,
     "autoround_version": "0.4.3",
     "batch_size": 2,
     "bits": 4,
-    "damp_percent": 0.01,
     "data_type": "int",
-    "desc_act": false,
     "enable_minmax_tuning": true,
     "enable_norm_bias_tuning": false,
     "enable_quanted_input": true,
@@ -54,12 +54,11 @@
     "lr": 0.005,
     "minmax_lr": 0.005,
     "nsamples": 128,
-    "quant_method": "gptq",
     "scale_dtype": "torch.float16",
     "seqlen": 2048,
     "sym": true,
-    "to_quant_block_names": null,
-    "true_sequential": false
   },
   "rms_norm_eps": 1e-06,
   "rope_scaling": {

   "quantization_config": {
     "amp": true,
     "autoround_version": "0.4.3",
+    "backend": "auto_round:gptq:exllamav2",
     "batch_size": 2,
     "bits": 4,
     "data_type": "int",
+    "dataset": "NeelNanda/pile-10k",
     "enable_minmax_tuning": true,
     "enable_norm_bias_tuning": false,
     "enable_quanted_input": true,
     "lr": 0.005,
     "minmax_lr": 0.005,
     "nsamples": 128,
+    "quant_method": "intel/auto-round",
     "scale_dtype": "torch.float16",
     "seqlen": 2048,
     "sym": true,
+    "to_quant_block_names": null
   },
   "rms_norm_eps": 1e-06,
   "rope_scaling": {