03bd1b46b9832627f141196723a144e7aaa9245d308f4e7fd3907b68d02232ec
Browse files- .gitattributes +12 -0
- checkpoint/pytorch_model.bin/p97.model.layers.10.mlp.down_proj.weight +3 -0
- checkpoint/pytorch_model.bin/p98.model.layers.10.input_layernorm.weight +3 -0
- checkpoint/pytorch_model.bin/p99.model.layers.10.post_attention_layernorm.weight +3 -0
- compiled/1744545db8406da6398e.neff +3 -0
- compiled/1bb198a13076d1853641.neff +3 -0
- compiled/2e107447c6e0a7f19573.neff +3 -0
- compiled/51f8a515591560780d48.neff +3 -0
- compiled/6cab3b785bfcdd58ee6a.neff +3 -0
- compiled/a37ede77a746b866b69d.neff +3 -0
- compiled/b938f58ffd873c7146a7.neff +3 -0
- compiled/c3741198db69eb019273.neff +3 -0
- compiled/d632e5ec42990d4ee01b.neff +3 -0
- compiled/d95062416ef36beb6494.neff +3 -0
- compiled/dfcd5ec203680dc9542c.neff +3 -0
- compiled/e65e10acdd5186bd49cc.neff +3 -0
- config.json +39 -0
- generation_config.json +10 -0
.gitattributes
CHANGED
@@ -33,3 +33,15 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
compiled/1744545db8406da6398e.neff filter=lfs diff=lfs merge=lfs -text
|
37 |
+
compiled/1bb198a13076d1853641.neff filter=lfs diff=lfs merge=lfs -text
|
38 |
+
compiled/2e107447c6e0a7f19573.neff filter=lfs diff=lfs merge=lfs -text
|
39 |
+
compiled/51f8a515591560780d48.neff filter=lfs diff=lfs merge=lfs -text
|
40 |
+
compiled/6cab3b785bfcdd58ee6a.neff filter=lfs diff=lfs merge=lfs -text
|
41 |
+
compiled/a37ede77a746b866b69d.neff filter=lfs diff=lfs merge=lfs -text
|
42 |
+
compiled/b938f58ffd873c7146a7.neff filter=lfs diff=lfs merge=lfs -text
|
43 |
+
compiled/c3741198db69eb019273.neff filter=lfs diff=lfs merge=lfs -text
|
44 |
+
compiled/d632e5ec42990d4ee01b.neff filter=lfs diff=lfs merge=lfs -text
|
45 |
+
compiled/d95062416ef36beb6494.neff filter=lfs diff=lfs merge=lfs -text
|
46 |
+
compiled/dfcd5ec203680dc9542c.neff filter=lfs diff=lfs merge=lfs -text
|
47 |
+
compiled/e65e10acdd5186bd49cc.neff filter=lfs diff=lfs merge=lfs -text
|
checkpoint/pytorch_model.bin/p97.model.layers.10.mlp.down_proj.weight
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f31785ebc10913a12d01b17d3451891c027e0ffd1fc0be8f89056ba45b625e09
|
3 |
+
size 180355961
|
checkpoint/pytorch_model.bin/p98.model.layers.10.input_layernorm.weight
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ea3540d2d759589d994e0bef604803dd9b625d224dbf25d6d8bc4344e9fd15f
|
3 |
+
size 17279
|
checkpoint/pytorch_model.bin/p99.model.layers.10.post_attention_layernorm.weight
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:479c1a72ac29ed1048bf0f865f8f4056edfb6717591b75e1d47f1d28c2e7e51d
|
3 |
+
size 17306
|
compiled/1744545db8406da6398e.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db39f3197b1e1d81f7311a77a9880a7cb12cc953b2ca744ae18f2e64eefcd4b2
|
3 |
+
size 7906304
|
compiled/1bb198a13076d1853641.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25f6911913ea26aebfc424db47991712b61cfa26e7a8d95fb59ad7de56f36556
|
3 |
+
size 12770304
|
compiled/2e107447c6e0a7f19573.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f81d1225bac88c9bfe8fe32769f9ca456611cd2ebc3bb1f8769b9257d0406be7
|
3 |
+
size 7875584
|
compiled/51f8a515591560780d48.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea629fe1a08447276532c5049ffec9b62f4b4775fe99990cd4a15910d99f52af
|
3 |
+
size 10036224
|
compiled/6cab3b785bfcdd58ee6a.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c1e53bc6a227ad6ca8dc9dd5bc3029e85b5de3d5444eeae3dd0f659cca3c519
|
3 |
+
size 8551424
|
compiled/a37ede77a746b866b69d.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a8262fa30782e5bcf46811cf3a5411bf3f1a3356986e8f711fcb893212c2b86
|
3 |
+
size 7998464
|
compiled/b938f58ffd873c7146a7.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ad1e997ab8eb40c27977d5ffeca7e0e2590eb75984d5e673a40c7e8267212a2
|
3 |
+
size 23307264
|
compiled/c3741198db69eb019273.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:456bd364c91fcfc9a255138e0869098708f2414ed9df16cd0fca9ae619438d71
|
3 |
+
size 8162304
|
compiled/d632e5ec42990d4ee01b.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e4b9ce4d8f1b2e9bb8ec344f890cc95573f6524a0692b8cda9c6182c1ccd40a
|
3 |
+
size 8479744
|
compiled/d95062416ef36beb6494.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94754b229abb0c3b0af8adb6bed0bf4c0fa646eb070caefdc396dbc10cd64284
|
3 |
+
size 8899584
|
compiled/dfcd5ec203680dc9542c.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6821744725d584b72d3b5419efe49a1471c329e73d1909789e6d76ae5059d7af
|
3 |
+
size 9186304
|
compiled/e65e10acdd5186bd49cc.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34bbf0325dcea2421ba7270bf30e7922a433ae8ae0aa2a21e146c92cd240177c
|
3 |
+
size 47197184
|
config.json
ADDED
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "meta-llama/Llama-2-7b-hf",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 4096,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 11008,
|
14 |
+
"max_position_embeddings": 4096,
|
15 |
+
"model_type": "llama",
|
16 |
+
"neuron": {
|
17 |
+
"auto_cast_type": "fp16",
|
18 |
+
"batch_size": 1,
|
19 |
+
"checkpoint_id": "meta-llama/Llama-2-7b-hf",
|
20 |
+
"checkpoint_revision": "8cca527612d856d7d32bd94f8103728d614eb852",
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.12.68.0+4480452af",
|
23 |
+
"num_cores": 2,
|
24 |
+
"sequence_length": 4096,
|
25 |
+
"task": "text-generation"
|
26 |
+
},
|
27 |
+
"num_attention_heads": 32,
|
28 |
+
"num_hidden_layers": 32,
|
29 |
+
"num_key_value_heads": 32,
|
30 |
+
"pretraining_tp": 1,
|
31 |
+
"rms_norm_eps": 1e-05,
|
32 |
+
"rope_scaling": null,
|
33 |
+
"rope_theta": 10000.0,
|
34 |
+
"tie_word_embeddings": false,
|
35 |
+
"torch_dtype": "float16",
|
36 |
+
"transformers_version": "4.36.2",
|
37 |
+
"use_cache": true,
|
38 |
+
"vocab_size": 32000
|
39 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 1,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"max_length": 4096,
|
6 |
+
"pad_token_id": 0,
|
7 |
+
"temperature": 0.6,
|
8 |
+
"top_p": 0.9,
|
9 |
+
"transformers_version": "4.36.2"
|
10 |
+
}
|