fracapuano committed on
Commit
5d3b3e8
·
verified ·
1 Parent(s): e50354a

Training in progress, epoch 10

Browse files
Files changed (3) hide show
  1. config.json +5 -5
  2. model.safetensors +2 -2
  3. training_args.bin +1 -1
config.json CHANGED
@@ -4,18 +4,18 @@
4
  ],
5
  "batch_size": 4,
6
  "bos_token_id": 1,
7
- "d_ff": 1024,
8
  "d_model": 1024,
9
- "dropout": 0.13129617833969415,
10
  "eos_token_id": 2,
11
- "model_size": 81697026,
12
  "model_type": "custom_code",
13
  "n_heads": 16,
14
- "n_layers": 2,
15
  "num_train_epochs": 20,
16
  "pad_token_id": 0,
17
  "router_dim": 10,
18
- "sequence_length": 128,
19
  "source_sequence_dimension": 70,
20
  "target_sequence_dimension": 306,
21
  "torch_dtype": "float32",
 
4
  ],
5
  "batch_size": 4,
6
  "bos_token_id": 1,
7
+ "d_ff": 512,
8
  "d_model": 1024,
9
+ "dropout": 0.13619667425956658,
10
  "eos_token_id": 2,
11
+ "model_size": 105627906,
12
  "model_type": "custom_code",
13
  "n_heads": 16,
14
+ "n_layers": 3,
15
  "num_train_epochs": 20,
16
  "pad_token_id": 0,
17
  "router_dim": 10,
18
+ "sequence_length": 64,
19
  "source_sequence_dimension": 70,
20
  "target_sequence_dimension": 306,
21
  "torch_dtype": "float32",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5cdcd2e137e1b5fdf92d760c2be873e2b3f1aa7f37bde4b653a562dd8d2ef0b0
3
- size 326804928
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c401adcd171ceaac8bd9e0845b7661d85538d010a74c55ed814bc2d0873bf641
3
+ size 422536616
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b59d643fb47105b5f85b598a0cb6beda4cd27a5bded38d9410678baf60529918
3
  size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:159967394442ef4416aa90ecbee137ab3ec1bd4be825e4d6cb189ca9244b56f9
3
  size 5304