migtissera
committed on
Commit
•
c70bd3a
1
Parent(s):
f56affb
first commit
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +35 -0
- generation_config.json +9 -0
- pytorch_model-00001-of-00191.bin +3 -0
- pytorch_model-00002-of-00191.bin +3 -0
- pytorch_model-00003-of-00191.bin +3 -0
- pytorch_model-00004-of-00191.bin +3 -0
- pytorch_model-00005-of-00191.bin +3 -0
- pytorch_model-00006-of-00191.bin +3 -0
- pytorch_model-00007-of-00191.bin +3 -0
- pytorch_model-00008-of-00191.bin +3 -0
- pytorch_model-00009-of-00191.bin +3 -0
- pytorch_model-00010-of-00191.bin +3 -0
- pytorch_model-00011-of-00191.bin +3 -0
- pytorch_model-00012-of-00191.bin +3 -0
- pytorch_model-00013-of-00191.bin +3 -0
- pytorch_model-00014-of-00191.bin +3 -0
- pytorch_model-00015-of-00191.bin +3 -0
- pytorch_model-00016-of-00191.bin +3 -0
- pytorch_model-00017-of-00191.bin +3 -0
- pytorch_model-00018-of-00191.bin +3 -0
- pytorch_model-00019-of-00191.bin +3 -0
- pytorch_model-00020-of-00191.bin +3 -0
- pytorch_model-00021-of-00191.bin +3 -0
- pytorch_model-00022-of-00191.bin +3 -0
- pytorch_model-00023-of-00191.bin +3 -0
- pytorch_model-00024-of-00191.bin +3 -0
- pytorch_model-00025-of-00191.bin +3 -0
- pytorch_model-00026-of-00191.bin +3 -0
- pytorch_model-00027-of-00191.bin +3 -0
- pytorch_model-00028-of-00191.bin +3 -0
- pytorch_model-00029-of-00191.bin +3 -0
- pytorch_model-00030-of-00191.bin +3 -0
- pytorch_model-00031-of-00191.bin +3 -0
- pytorch_model-00032-of-00191.bin +3 -0
- pytorch_model-00033-of-00191.bin +3 -0
- pytorch_model-00034-of-00191.bin +3 -0
- pytorch_model-00035-of-00191.bin +3 -0
- pytorch_model-00036-of-00191.bin +3 -0
- pytorch_model-00037-of-00191.bin +3 -0
- pytorch_model-00038-of-00191.bin +3 -0
- pytorch_model-00039-of-00191.bin +3 -0
- pytorch_model-00040-of-00191.bin +3 -0
- pytorch_model-00041-of-00191.bin +3 -0
- pytorch_model-00042-of-00191.bin +3 -0
- pytorch_model-00043-of-00191.bin +3 -0
- pytorch_model-00044-of-00191.bin +3 -0
- pytorch_model-00045-of-00191.bin +3 -0
- pytorch_model-00046-of-00191.bin +3 -0
- pytorch_model-00047-of-00191.bin +3 -0
- pytorch_model-00048-of-00191.bin +3 -0
config.json
ADDED
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "migtissera/Meta-Llama-3.1-405B",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128000,
|
9 |
+
"eos_token_id": 128001,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 16384,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 53248,
|
14 |
+
"max_position_embeddings": 131072,
|
15 |
+
"mlp_bias": false,
|
16 |
+
"model_type": "llama",
|
17 |
+
"num_attention_heads": 128,
|
18 |
+
"num_hidden_layers": 126,
|
19 |
+
"num_key_value_heads": 16,
|
20 |
+
"pretraining_tp": 1,
|
21 |
+
"rms_norm_eps": 1e-05,
|
22 |
+
"rope_scaling": {
|
23 |
+
"factor": 8.0,
|
24 |
+
"high_freq_factor": 4.0,
|
25 |
+
"low_freq_factor": 1.0,
|
26 |
+
"original_max_position_embeddings": 8192,
|
27 |
+
"rope_type": "llama3"
|
28 |
+
},
|
29 |
+
"rope_theta": 500000.0,
|
30 |
+
"tie_word_embeddings": false,
|
31 |
+
"torch_dtype": "bfloat16",
|
32 |
+
"transformers_version": "4.43.3",
|
33 |
+
"use_cache": false,
|
34 |
+
"vocab_size": 128256
|
35 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 128000,
|
4 |
+
"do_sample": true,
|
5 |
+
"eos_token_id": 128001,
|
6 |
+
"temperature": 0.6,
|
7 |
+
"top_p": 0.9,
|
8 |
+
"transformers_version": "4.43.3"
|
9 |
+
}
|
pytorch_model-00001-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:660ea50b72b38a10ad74daac55c2c7bd84d0de99e9b192cd7d84a9ff7a8350d5
|
3 |
+
size 4873783664
|
pytorch_model-00002-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ee34a5e8cda43727a4ac4d253553f7f78d9e3e3ec7b567fb44f154538cbc327
|
3 |
+
size 4026533863
|
pytorch_model-00003-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42ec79830ecfb07688c9328ac9211742f720038c985232d50639961d29ffdbc3
|
3 |
+
size 4697689628
|
pytorch_model-00004-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7cb5a001f14fe28d937b7bf050b3a814b7da5a98b986b79c6752736d7901e549
|
3 |
+
size 4697689628
|
pytorch_model-00005-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31362c09086d5199645b665f2f06e58b3cdc24280d280d4de5161eac38bb849c
|
3 |
+
size 3489662678
|
pytorch_model-00006-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f66128c2e9cf354a1fb487191c6eda20b65c332ca5583690f418fb40cd9d29e
|
3 |
+
size 4697689628
|
pytorch_model-00007-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ee945918cc0b65190a32e0c424da50c0dceb7752755cc7b68cbd2762eb036fb
|
3 |
+
size 4697689628
|
pytorch_model-00008-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85921bf3048ff4e81ee7a7406b0b80dc2766d36f2b4c8a03e1fefee3197cb2d3
|
3 |
+
size 3489662678
|
pytorch_model-00009-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8018cc70ec97b2ff4944ca6f5a7f63e013a4ea43281bb46707ebdfc457f008a
|
3 |
+
size 4697689628
|
pytorch_model-00010-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c5fa1631a5b8d642ec0ff55d9b3f9ccd2bcaa4cedc83d64ba33daad23727ca6
|
3 |
+
size 4697689628
|
pytorch_model-00011-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68eea86da733de000023934567247a5da459dc10083d817ba68ad451dba81104
|
3 |
+
size 3489662678
|
pytorch_model-00012-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed2b83eb245895032d19eb14e7863fc43448f107ccfd0f20e36cbb1cb2c462a0
|
3 |
+
size 4697689628
|
pytorch_model-00013-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b38e4732aab490d3416fd89c2584576438d107103ff6e5081929f26654b4dec
|
3 |
+
size 4697689628
|
pytorch_model-00014-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e01e117f0bb2eb6e7350f009969d009ee4c79e28c04569c84b2be9a4422b909b
|
3 |
+
size 3489662678
|
pytorch_model-00015-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:832b4d56b241a868c8061c132958b73a968275ebf7dc72e1dd4227bc24f7f756
|
3 |
+
size 4697689628
|
pytorch_model-00016-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2bf5def9ae13af900b66505a323c28228d0730588281b5a7428754249a18eeef
|
3 |
+
size 4697689628
|
pytorch_model-00017-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f28eed2d84b458a27074ef2903885b31bf8e73a31b770202dbe75303c1a0023b
|
3 |
+
size 3489662678
|
pytorch_model-00018-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6dcb33538a64e90e86e34b8f3b66168169be18c9f512c969854d79a769654b1f
|
3 |
+
size 4697689628
|
pytorch_model-00019-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59e3742f045d3df9c99a4172ce7df0fee6f8d60b833c967d6ffd5f4dde848a30
|
3 |
+
size 4697689628
|
pytorch_model-00020-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb1b7a94a1edad5b50001d9632822e96298a73df6485ddf75c3c67ce0bb6569f
|
3 |
+
size 3489662678
|
pytorch_model-00021-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1423e2b3a1e4c7096266d051ee653a2465edfe8627eb78dfb1ddb9f961fce85
|
3 |
+
size 4697689628
|
pytorch_model-00022-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f886b76f45bbab56e4deb98304994a3587407b54df4632b3aa47608db52f610d
|
3 |
+
size 4697689628
|
pytorch_model-00023-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b98308684a63d23876febb4c9fe1252027c7fe838f8b7a1c45752ad55e843d7
|
3 |
+
size 3489662678
|
pytorch_model-00024-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac04c9c287bad2279590308020528c7785161096a7cc9c13504d88218d42665a
|
3 |
+
size 4697689628
|
pytorch_model-00025-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a343a95a43326e0d914dc2af420e167155fa8daaefd41138b13baabc3f68925f
|
3 |
+
size 4697689628
|
pytorch_model-00026-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d49adb4f3c9de13d654127fa5db30e4ce28205ed3a0a9fcd48c9c98bfad6327b
|
3 |
+
size 3489662678
|
pytorch_model-00027-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1a4d35ce8211ecafe60b4b6c34610c2cbd75b66b10bdb7ee84d414c044f7f91
|
3 |
+
size 4697689628
|
pytorch_model-00028-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40ef1c43d0c2356e0b268646af7c3c567f4b5f054ca73931b2dbc5e2a6e1dc02
|
3 |
+
size 4697689628
|
pytorch_model-00029-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4b44bd7f80d6c355e88053f9dea0b96ebd87c763ead83c5a2f19a2e25327d8f
|
3 |
+
size 3489662678
|
pytorch_model-00030-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:211f1f69d6f8c871a5ca0eba8ddf02afbf512d1658b792c6dd4e8b1be5c76b03
|
3 |
+
size 4697689628
|
pytorch_model-00031-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ae6b3fe55fba08bf8fad3a03400fabcdc1e7cdac656e82b2b71e44c2205aff9
|
3 |
+
size 4697689628
|
pytorch_model-00032-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62db8364d1f84d1d13758a72682ccb884d49afaea2f579f1450dc6d7db418474
|
3 |
+
size 3489662678
|
pytorch_model-00033-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01903f44513039293db445ea72830468799e148e248ed2be70d967c7dfbe1764
|
3 |
+
size 4697689628
|
pytorch_model-00034-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe6293f0a5fe7b2abd4f159aaa0f2d1c07dfb3b0101392b4a602d89a71a28564
|
3 |
+
size 4697689628
|
pytorch_model-00035-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1c4157c7bde1c720149a5bc87c6b560f43efdee936285f127b5ab5abcc3c6c3
|
3 |
+
size 3489662678
|
pytorch_model-00036-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c1bb423be02bef93189d30b52be0a86b04fbf59ec9c7894ccef7947bdc0cab1
|
3 |
+
size 4697689628
|
pytorch_model-00037-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:178a3faf3897b847f3c7c8f1dfde0785d2753e606ac3da4525065b931d972981
|
3 |
+
size 4697689628
|
pytorch_model-00038-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f71c930c352721a86335b81fbb531ab57d1bba178c72c166e9ebd9cf3d9f96f
|
3 |
+
size 3489662678
|
pytorch_model-00039-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83cdafa79478dc6539d3b1aa0004a2fcbbf5186f253d6fabf7466749a000dbcc
|
3 |
+
size 4697689628
|
pytorch_model-00040-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:655c8ca39557a76bb5273e623f78607239a1301557e1604e1959bae5ec357ba0
|
3 |
+
size 4697689628
|
pytorch_model-00041-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b18ff9c38405bed339499ff4271efc281d64dd2c2c67b50b164b3ec3e0b9d42d
|
3 |
+
size 3489662678
|
pytorch_model-00042-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e97b66314b0a9edb92022a483b0088f5da240974158a819b60a2bc3bf3ac7842
|
3 |
+
size 4697689628
|
pytorch_model-00043-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8002b1ce7ec790503569c72939f23a2fd8f70b3a5b7fdfde40a8e7e735e78af
|
3 |
+
size 4697689628
|
pytorch_model-00044-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:122ba8fd4e9f196e5455c4fd86d8ca1ece875fc3acfeae37d3ebbe487e1a67b1
|
3 |
+
size 3489662678
|
pytorch_model-00045-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e481dd054ef7ef70cb28a2e9001fd447d96ef589f296583efe62d20d31bfa3f
|
3 |
+
size 4697689628
|
pytorch_model-00046-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2c8c2cd8b4ce116ef943462b309a16b2026822b12dedd071e45c90a648e93b6
|
3 |
+
size 4697689628
|
pytorch_model-00047-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3562ff0102a458cede51f66bb73af0dbeed6e12c309c72d907f52c791176330f
|
3 |
+
size 3489662678
|
pytorch_model-00048-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6caff9a50ba28797b32b0a2ba9c3efcc4d4149958b8cc3d01846b84ab74ec5cc
|
3 |
+
size 4697689628
|