Shubhra Pandit committed on
Commit
2156d9e
·
1 Parent(s): 589ba0a

Update model files

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
config.json CHANGED
@@ -26,7 +26,7 @@
26
  "Linear"
27
  ],
28
  "weights": {
29
- "actorder": null,
30
  "block_structure": null,
31
  "dynamic": false,
32
  "group_size": 128,
@@ -211,7 +211,7 @@
211
  "quantization_status": "compressed",
212
  "sparsity_config": {
213
  "format": "dense",
214
- "global_sparsity": 0.15522512352032172,
215
  "ignore": [
216
  "visual.blocks.0.attn.qkv",
217
  "visual.blocks.0.attn.proj",
@@ -974,4 +974,4 @@
974
  "vision_start_token_id": 151652,
975
  "vision_token_id": 151654,
976
  "vocab_size": 152064
977
- }
 
26
  "Linear"
27
  ],
28
  "weights": {
29
+ "actorder": "weight",
30
  "block_structure": null,
31
  "dynamic": false,
32
  "group_size": 128,
 
211
  "quantization_status": "compressed",
212
  "sparsity_config": {
213
  "format": "dense",
214
+ "global_sparsity": 0.15507475599525683,
215
  "ignore": [
216
  "visual.blocks.0.attn.qkv",
217
  "visual.blocks.0.attn.proj",
 
974
  "vision_start_token_id": 151652,
975
  "vision_token_id": 151654,
976
  "vocab_size": 152064
977
+ }
model-00001-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:65ae6205182adb03619a5a259938f7ccc7e0de841d692c9ff43ed0b25d056e4d
3
  size 4883683112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c34f07cf41be4d5842aeeb5b67d0768cd2ba9bbcb917531336ea100e2ed80e72
3
  size 4883683112
model-00002-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c59e382470f47fa6f49e97fffda25ef8d4030e509222e9b45dc46db976820fba
3
  size 4978586528
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c265f1ab71a9fa5c342790aaa75bb39fe37c11f0e395e3c779b7c806bcb2045e
3
  size 4978586528
model-00003-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9fffadac0b79d5fcbda277a65228d1f3a8477d0e64d598aa81779520c7d8b6f0
3
  size 4978586728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4edd3cb757f4ced8b7b18d3c2181056a2b369ea584343edb15b164d629888a0
3
  size 4978586728
model-00004-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4347cc3cd726cc58348ffa4219936f57f4ef41e2ac032d7aa287a48f54295785
3
  size 4978586728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8cb8859e839ca8aa7d8d5d624f96e1d6a3dea642293779ed6215f9e6737f3602
3
  size 4978586728
model-00005-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c6237c2d3dab8dc5231e1753cb48e524371cb16465fe16b50d0e2eedb35f9c7
3
  size 4978586728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:194ebf83b82f23955344ad5fb661552ff9276b43e08ad86442195502e41dcf53
3
  size 4978586728
model-00006-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e4a9d890927c5c4dae6a19f3b759dc98a8543d58aafaf50021d29c0f6d7377f
3
  size 4978586728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c57dd01ca5923863ca29ebc51f5c0334dc0528918a80ea9a658350f169b19a75
3
  size 4978586728
model-00007-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7498e9424272f765a649fde0e937779b232bddafc41ee3677930460d083896ae
3
  size 4978586728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8883dbacb084499cc9c67b78ace5c822aafd2eb2e0cd806ed5915bd79389471
3
  size 4978586728
model-00008-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:687fcd6bf5a296efe10c8eab1d9141724aa2c71f567abe1967e1f022e8f37eb9
3
  size 4978586728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:780cadf70c5d6dbd24dc2fb38d1f5708d005434b4e3c6edd2e92f70cf20b46e9
3
  size 4978586728
model-00009-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:79becbef2f38683dc0340ed4da922bf41b76ef1171204d191613469b6e52386e
3
  size 2866152816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6111bf4938b9555988d2b736115f615c951de748562f5456e1ca31dddbd8f3ac
3
  size 2866152816
recipe.yaml CHANGED
@@ -3,6 +3,10 @@ DEFAULT_stage:
3
  GPTQModifier:
4
  sequential_targets: [Qwen2_5_VLDecoderLayer]
5
  dampening_frac: 0.03
6
- scheme: W4A16
 
 
 
 
7
  targets: Linear
8
  ignore: [lm_head, 're:visual.*']
 
3
  GPTQModifier:
4
  sequential_targets: [Qwen2_5_VLDecoderLayer]
5
  dampening_frac: 0.03
6
+ config_groups:
7
+ config_group:
8
+ targets: [Linear]
9
+ weights: {num_bits: 4, type: int, symmetric: true, group_size: 128, strategy: group,
10
+ dynamic: false, actorder: weight, observer: minmax}
11
  targets: Linear
12
  ignore: [lm_head, 're:visual.*']
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:913950e4971737031da511cdd1b410daae4566f62eb845b3975bca5a102323d8
3
- size 11421995
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa
3
+ size 11421896