chheplo committed on
Commit
dd79b5e
·
verified ·
1 Parent(s): bc6eff3

Upload 2 files

Browse files

added SpinQuant files

Files changed (3) hide show
  1. .gitattributes +1 -0
  2. llama3_2.pte +3 -0
  3. params.json +17 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ llama3_2.pte filter=lfs diff=lfs merge=lfs -text
llama3_2.pte ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fdc4a794d03f15ad91e8009cf39316c36a19fbc7948cb0875c1bbe4bf60dd5f
3
+ size 1137008912
params.json ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dim": 2048,
3
+ "n_layers": 16,
4
+ "n_heads": 32,
5
+ "n_kv_heads": 8,
6
+ "vocab_size": 128256,
7
+ "ffn_dim_multiplier": 1.5,
8
+ "multiple_of": 256,
9
+ "norm_eps": 1e-05,
10
+ "rope_theta": 500000.0,
11
+ "use_scaled_rope": true,
12
+ "quantization_args": {
13
+ "group_size": 32,
14
+ "scheme": "int4_weight_int8_dynamic_activation",
15
+ "spinquant": true
16
+ }
17
+ }