migtissera committed on
Commit
c70bd3a
1 Parent(s): f56affb

first commit

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. config.json +35 -0
  2. generation_config.json +9 -0
  3. pytorch_model-00001-of-00191.bin +3 -0
  4. pytorch_model-00002-of-00191.bin +3 -0
  5. pytorch_model-00003-of-00191.bin +3 -0
  6. pytorch_model-00004-of-00191.bin +3 -0
  7. pytorch_model-00005-of-00191.bin +3 -0
  8. pytorch_model-00006-of-00191.bin +3 -0
  9. pytorch_model-00007-of-00191.bin +3 -0
  10. pytorch_model-00008-of-00191.bin +3 -0
  11. pytorch_model-00009-of-00191.bin +3 -0
  12. pytorch_model-00010-of-00191.bin +3 -0
  13. pytorch_model-00011-of-00191.bin +3 -0
  14. pytorch_model-00012-of-00191.bin +3 -0
  15. pytorch_model-00013-of-00191.bin +3 -0
  16. pytorch_model-00014-of-00191.bin +3 -0
  17. pytorch_model-00015-of-00191.bin +3 -0
  18. pytorch_model-00016-of-00191.bin +3 -0
  19. pytorch_model-00017-of-00191.bin +3 -0
  20. pytorch_model-00018-of-00191.bin +3 -0
  21. pytorch_model-00019-of-00191.bin +3 -0
  22. pytorch_model-00020-of-00191.bin +3 -0
  23. pytorch_model-00021-of-00191.bin +3 -0
  24. pytorch_model-00022-of-00191.bin +3 -0
  25. pytorch_model-00023-of-00191.bin +3 -0
  26. pytorch_model-00024-of-00191.bin +3 -0
  27. pytorch_model-00025-of-00191.bin +3 -0
  28. pytorch_model-00026-of-00191.bin +3 -0
  29. pytorch_model-00027-of-00191.bin +3 -0
  30. pytorch_model-00028-of-00191.bin +3 -0
  31. pytorch_model-00029-of-00191.bin +3 -0
  32. pytorch_model-00030-of-00191.bin +3 -0
  33. pytorch_model-00031-of-00191.bin +3 -0
  34. pytorch_model-00032-of-00191.bin +3 -0
  35. pytorch_model-00033-of-00191.bin +3 -0
  36. pytorch_model-00034-of-00191.bin +3 -0
  37. pytorch_model-00035-of-00191.bin +3 -0
  38. pytorch_model-00036-of-00191.bin +3 -0
  39. pytorch_model-00037-of-00191.bin +3 -0
  40. pytorch_model-00038-of-00191.bin +3 -0
  41. pytorch_model-00039-of-00191.bin +3 -0
  42. pytorch_model-00040-of-00191.bin +3 -0
  43. pytorch_model-00041-of-00191.bin +3 -0
  44. pytorch_model-00042-of-00191.bin +3 -0
  45. pytorch_model-00043-of-00191.bin +3 -0
  46. pytorch_model-00044-of-00191.bin +3 -0
  47. pytorch_model-00045-of-00191.bin +3 -0
  48. pytorch_model-00046-of-00191.bin +3 -0
  49. pytorch_model-00047-of-00191.bin +3 -0
  50. pytorch_model-00048-of-00191.bin +3 -0
config.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "migtissera/Meta-Llama-3.1-405B",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 128000,
9
+ "eos_token_id": 128001,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 16384,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 53248,
14
+ "max_position_embeddings": 131072,
15
+ "mlp_bias": false,
16
+ "model_type": "llama",
17
+ "num_attention_heads": 128,
18
+ "num_hidden_layers": 126,
19
+ "num_key_value_heads": 16,
20
+ "pretraining_tp": 1,
21
+ "rms_norm_eps": 1e-05,
22
+ "rope_scaling": {
23
+ "factor": 8.0,
24
+ "high_freq_factor": 4.0,
25
+ "low_freq_factor": 1.0,
26
+ "original_max_position_embeddings": 8192,
27
+ "rope_type": "llama3"
28
+ },
29
+ "rope_theta": 500000.0,
30
+ "tie_word_embeddings": false,
31
+ "torch_dtype": "bfloat16",
32
+ "transformers_version": "4.43.3",
33
+ "use_cache": false,
34
+ "vocab_size": 128256
35
+ }
generation_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 128000,
4
+ "do_sample": true,
5
+ "eos_token_id": 128001,
6
+ "temperature": 0.6,
7
+ "top_p": 0.9,
8
+ "transformers_version": "4.43.3"
9
+ }
pytorch_model-00001-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:660ea50b72b38a10ad74daac55c2c7bd84d0de99e9b192cd7d84a9ff7a8350d5
3
+ size 4873783664
pytorch_model-00002-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ee34a5e8cda43727a4ac4d253553f7f78d9e3e3ec7b567fb44f154538cbc327
3
+ size 4026533863
pytorch_model-00003-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42ec79830ecfb07688c9328ac9211742f720038c985232d50639961d29ffdbc3
3
+ size 4697689628
pytorch_model-00004-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cb5a001f14fe28d937b7bf050b3a814b7da5a98b986b79c6752736d7901e549
3
+ size 4697689628
pytorch_model-00005-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31362c09086d5199645b665f2f06e58b3cdc24280d280d4de5161eac38bb849c
3
+ size 3489662678
pytorch_model-00006-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f66128c2e9cf354a1fb487191c6eda20b65c332ca5583690f418fb40cd9d29e
3
+ size 4697689628
pytorch_model-00007-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ee945918cc0b65190a32e0c424da50c0dceb7752755cc7b68cbd2762eb036fb
3
+ size 4697689628
pytorch_model-00008-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85921bf3048ff4e81ee7a7406b0b80dc2766d36f2b4c8a03e1fefee3197cb2d3
3
+ size 3489662678
pytorch_model-00009-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8018cc70ec97b2ff4944ca6f5a7f63e013a4ea43281bb46707ebdfc457f008a
3
+ size 4697689628
pytorch_model-00010-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c5fa1631a5b8d642ec0ff55d9b3f9ccd2bcaa4cedc83d64ba33daad23727ca6
3
+ size 4697689628
pytorch_model-00011-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68eea86da733de000023934567247a5da459dc10083d817ba68ad451dba81104
3
+ size 3489662678
pytorch_model-00012-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed2b83eb245895032d19eb14e7863fc43448f107ccfd0f20e36cbb1cb2c462a0
3
+ size 4697689628
pytorch_model-00013-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b38e4732aab490d3416fd89c2584576438d107103ff6e5081929f26654b4dec
3
+ size 4697689628
pytorch_model-00014-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e01e117f0bb2eb6e7350f009969d009ee4c79e28c04569c84b2be9a4422b909b
3
+ size 3489662678
pytorch_model-00015-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:832b4d56b241a868c8061c132958b73a968275ebf7dc72e1dd4227bc24f7f756
3
+ size 4697689628
pytorch_model-00016-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bf5def9ae13af900b66505a323c28228d0730588281b5a7428754249a18eeef
3
+ size 4697689628
pytorch_model-00017-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f28eed2d84b458a27074ef2903885b31bf8e73a31b770202dbe75303c1a0023b
3
+ size 3489662678
pytorch_model-00018-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6dcb33538a64e90e86e34b8f3b66168169be18c9f512c969854d79a769654b1f
3
+ size 4697689628
pytorch_model-00019-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59e3742f045d3df9c99a4172ce7df0fee6f8d60b833c967d6ffd5f4dde848a30
3
+ size 4697689628
pytorch_model-00020-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb1b7a94a1edad5b50001d9632822e96298a73df6485ddf75c3c67ce0bb6569f
3
+ size 3489662678
pytorch_model-00021-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1423e2b3a1e4c7096266d051ee653a2465edfe8627eb78dfb1ddb9f961fce85
3
+ size 4697689628
pytorch_model-00022-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f886b76f45bbab56e4deb98304994a3587407b54df4632b3aa47608db52f610d
3
+ size 4697689628
pytorch_model-00023-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b98308684a63d23876febb4c9fe1252027c7fe838f8b7a1c45752ad55e843d7
3
+ size 3489662678
pytorch_model-00024-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac04c9c287bad2279590308020528c7785161096a7cc9c13504d88218d42665a
3
+ size 4697689628
pytorch_model-00025-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a343a95a43326e0d914dc2af420e167155fa8daaefd41138b13baabc3f68925f
3
+ size 4697689628
pytorch_model-00026-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d49adb4f3c9de13d654127fa5db30e4ce28205ed3a0a9fcd48c9c98bfad6327b
3
+ size 3489662678
pytorch_model-00027-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1a4d35ce8211ecafe60b4b6c34610c2cbd75b66b10bdb7ee84d414c044f7f91
3
+ size 4697689628
pytorch_model-00028-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40ef1c43d0c2356e0b268646af7c3c567f4b5f054ca73931b2dbc5e2a6e1dc02
3
+ size 4697689628
pytorch_model-00029-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4b44bd7f80d6c355e88053f9dea0b96ebd87c763ead83c5a2f19a2e25327d8f
3
+ size 3489662678
pytorch_model-00030-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:211f1f69d6f8c871a5ca0eba8ddf02afbf512d1658b792c6dd4e8b1be5c76b03
3
+ size 4697689628
pytorch_model-00031-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ae6b3fe55fba08bf8fad3a03400fabcdc1e7cdac656e82b2b71e44c2205aff9
3
+ size 4697689628
pytorch_model-00032-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62db8364d1f84d1d13758a72682ccb884d49afaea2f579f1450dc6d7db418474
3
+ size 3489662678
pytorch_model-00033-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01903f44513039293db445ea72830468799e148e248ed2be70d967c7dfbe1764
3
+ size 4697689628
pytorch_model-00034-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe6293f0a5fe7b2abd4f159aaa0f2d1c07dfb3b0101392b4a602d89a71a28564
3
+ size 4697689628
pytorch_model-00035-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1c4157c7bde1c720149a5bc87c6b560f43efdee936285f127b5ab5abcc3c6c3
3
+ size 3489662678
pytorch_model-00036-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c1bb423be02bef93189d30b52be0a86b04fbf59ec9c7894ccef7947bdc0cab1
3
+ size 4697689628
pytorch_model-00037-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:178a3faf3897b847f3c7c8f1dfde0785d2753e606ac3da4525065b931d972981
3
+ size 4697689628
pytorch_model-00038-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f71c930c352721a86335b81fbb531ab57d1bba178c72c166e9ebd9cf3d9f96f
3
+ size 3489662678
pytorch_model-00039-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83cdafa79478dc6539d3b1aa0004a2fcbbf5186f253d6fabf7466749a000dbcc
3
+ size 4697689628
pytorch_model-00040-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:655c8ca39557a76bb5273e623f78607239a1301557e1604e1959bae5ec357ba0
3
+ size 4697689628
pytorch_model-00041-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b18ff9c38405bed339499ff4271efc281d64dd2c2c67b50b164b3ec3e0b9d42d
3
+ size 3489662678
pytorch_model-00042-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e97b66314b0a9edb92022a483b0088f5da240974158a819b60a2bc3bf3ac7842
3
+ size 4697689628
pytorch_model-00043-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8002b1ce7ec790503569c72939f23a2fd8f70b3a5b7fdfde40a8e7e735e78af
3
+ size 4697689628
pytorch_model-00044-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:122ba8fd4e9f196e5455c4fd86d8ca1ece875fc3acfeae37d3ebbe487e1a67b1
3
+ size 3489662678
pytorch_model-00045-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e481dd054ef7ef70cb28a2e9001fd447d96ef589f296583efe62d20d31bfa3f
3
+ size 4697689628
pytorch_model-00046-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2c8c2cd8b4ce116ef943462b309a16b2026822b12dedd071e45c90a648e93b6
3
+ size 4697689628
pytorch_model-00047-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3562ff0102a458cede51f66bb73af0dbeed6e12c309c72d907f52c791176330f
3
+ size 3489662678
pytorch_model-00048-of-00191.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6caff9a50ba28797b32b0a2ba9c3efcc4d4149958b8cc3d01846b84ab74ec5cc
3
+ size 4697689628