Upload 11 files
Browse files- config.json +16 -0
- generation_config.json +4 -0
- model.safetensors +3 -0
- optimizer.pt +3 -0
- rng_state_0.pth +3 -0
- rng_state_1.pth +3 -0
- rng_state_2.pth +3 -0
- rng_state_3.pth +3 -0
- scheduler.pt +3 -0
- trainer_state.json +0 -0
- training_args.bin +3 -0
config.json
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"LumensparkModel"
|
4 |
+
],
|
5 |
+
"depth": 8,
|
6 |
+
"dropout": 0.058823529411764705,
|
7 |
+
"embed_dim": 768,
|
8 |
+
"heads": 12,
|
9 |
+
"k": 384,
|
10 |
+
"model_type": "lumenspark",
|
11 |
+
"rank": 256,
|
12 |
+
"seq_length": 768,
|
13 |
+
"torch_dtype": "float32",
|
14 |
+
"transformers_version": "4.45.2",
|
15 |
+
"vocab_size": 50257
|
16 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"transformers_version": "4.45.2"
|
4 |
+
}
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ddd93a3f44030d6029a41e5163f5dc2b101e133013d6bdfffb2b9afce71c38f1
|
3 |
+
size 450017780
|
optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bdb36dc6763541549a11e53193dcd79edc5882e02487a49e328742ce9c29f79
|
3 |
+
size 900132282
|
rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9a659ea42d4507bbe0c13020a189a34f500a72c3df9aace25e184f73ebfed90
|
3 |
+
size 15024
|
rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78ba3656f5eaf650efe2971462d998b1b5682a40fa41e6a1071feb5bf8982b06
|
3 |
+
size 15024
|
rng_state_2.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d52affa74bdbc66c5a02358a1e515663c8cf3ff7393c48f7854269b0364b23e8
|
3 |
+
size 15024
|
rng_state_3.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae320a6d3df28e053729564eda3d7c031a794097dacab5616b5e3cb34ef95be4
|
3 |
+
size 15024
|
scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f635691e188822b5431a13200046b0fb034c0fb13ffeb3dfe4530f591c3f6be
|
3 |
+
size 1064
|
trainer_state.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9cbcde9022319038a994fa46a7bc160123338ad3fb289996676abaa83b413c97
|
3 |
+
size 5176
|