results_model6_2 / config.json
Anish13's picture
Training in progress, step 1000
3ab02e1 verified
raw
history blame contribute delete
345 Bytes
{
"architectures": [
"TransformerModel"
],
"d_model": 512,
"dim_feedforward": 1024,
"dropout": 0.1,
"input_dim": 30000,
"max_seq_len": 512,
"model_type": "transformer",
"nhead": 8,
"num_decoder_layers": 6,
"num_encoder_layers": 6,
"output_dim": 30000,
"torch_dtype": "float32",
"transformers_version": "4.41.0"
}