Anish13 committed on
Commit
8d6f5b5
·
verified ·
1 Parent(s): 33828aa

Training in progress, step 10000

Browse files
Files changed (2) hide show
  1. config.json +3 -3
  2. model.safetensors +2 -2
config.json CHANGED
@@ -3,15 +3,15 @@
3
  "TransformerModel"
4
  ],
5
  "d_model": 512,
6
- "dim_feedforward": 2048,
7
  "dropout": 0.1,
8
- "input_dim": 307985,
9
  "max_seq_len": 1024,
10
  "model_type": "transformer",
11
  "nhead": 8,
12
  "num_decoder_layers": 6,
13
  "num_encoder_layers": 6,
14
- "output_dim": 307985,
15
  "torch_dtype": "float32",
16
  "transformers_version": "4.40.2"
17
  }
 
3
  "TransformerModel"
4
  ],
5
  "d_model": 512,
6
+ "dim_feedforward": 1024,
7
  "dropout": 0.1,
8
+ "input_dim": 30000,
9
  "max_seq_len": 1024,
10
  "model_type": "transformer",
11
  "nhead": 8,
12
  "num_decoder_layers": 6,
13
  "num_encoder_layers": 6,
14
+ "output_dim": 30000,
15
  "torch_dtype": "float32",
16
  "transformers_version": "4.40.2"
17
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:46b28b367ce5bd9e108bd301b82b111c1c7fb3a1bf87b2c8c1c4d12a44fb4972
3
- size 1441420244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e7b2fc832897759de1e1b28285a97aa8b49baee85c039379339fd9e34332d5c
3
+ size 251300560