results_model5 / config.json
Anish13's picture
Training in progress, step 10000
8d6f5b5 verified
raw
history blame contribute delete
346 Bytes
{
  "architectures": [
    "TransformerModel"
  ],
  "d_model": 512,
  "dim_feedforward": 1024,
  "dropout": 0.1,
  "input_dim": 30000,
  "max_seq_len": 1024,
  "model_type": "transformer",
  "nhead": 8,
  "num_decoder_layers": 6,
  "num_encoder_layers": 6,
  "output_dim": 30000,
  "torch_dtype": "float32",
  "transformers_version": "4.40.2"
}