Shubhra Pandit committed on
Commit
5f68add
·
1 Parent(s): dafe403

Update model files

Browse files
config.json CHANGED
@@ -26,7 +26,7 @@
26
  "Linear"
27
  ],
28
  "weights": {
29
- "actorder": null,
30
  "block_structure": null,
31
  "dynamic": false,
32
  "group_size": 128,
 
26
  "Linear"
27
  ],
28
  "weights": {
29
+ "actorder": "weight",
30
  "block_structure": null,
31
  "dynamic": false,
32
  "group_size": 128,
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ce6ddbca2d055a42ad5a803f9e18ee8ffdff756d74d01253b2e0a988087fac81
3
  size 4982297672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17264c775027afaa54bf0681021d8c1738169e794cc8b2d427028684fb7637d1
3
  size 4982297672
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c4cb75c5ceb476d930251e12c8b5a6d1066e59774f2ccb90c2b31be2ceda9d5
3
  size 1916188912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1e26c007d7c105f5950e5203707079d17e3e954b29c51d508e48d7369ac937f
3
  size 1916188912
recipe.yaml CHANGED
@@ -3,6 +3,10 @@ DEFAULT_stage:
3
  GPTQModifier:
4
  sequential_targets: [Qwen2_5_VLDecoderLayer]
5
  dampening_frac: 0.03
6
- scheme: W4A16
 
 
 
 
7
  targets: Linear
8
  ignore: [lm_head, 're:visual.*']
 
3
  GPTQModifier:
4
  sequential_targets: [Qwen2_5_VLDecoderLayer]
5
  dampening_frac: 0.03
6
+ config_groups:
7
+ config_group:
8
+ targets: [Linear]
9
+ weights: {num_bits: 4, type: int, symmetric: true, group_size: 128, strategy: group,
10
+ dynamic: false, actorder: weight, observer: minmax}
11
  targets: Linear
12
  ignore: [lm_head, 're:visual.*']