pearl-11m-translate / config.json
kambale's picture
Update model: Epochs 50, Val Loss 1.1906, Test BLEU 27.90
3c973e2 verified
{
"model_type": "seq2seq_transformer_from_scratch",
"architecture": "Encoder-Decoder Transformer",
"framework": "pytorch",
"source_language": "english",
"target_language": "luganda",
"pytorch_model_path": "pytorch_model.bin",
"src_tokenizer_file": "english_tokenizer.json",
"trg_tokenizer_file": "luganda_tokenizer.json",
"model_parameters": {
"input_dim_vocab_size_src": 10000,
"output_dim_vocab_size_trg": 10000,
"hidden_dim": 256,
"encoder_layers": 3,
"decoder_layers": 3,
"encoder_heads": 8,
"decoder_heads": 8,
"encoder_pf_dim": 512,
"decoder_pf_dim": 512,
"encoder_dropout": 0.1,
"decoder_dropout": 0.1,
"max_seq_length": 128
},
"special_token_ids": {
"pad_token_id": 0,
"sos_token_id": 1,
"eos_token_id": 2,
"unk_token_id": 3
},
"dataset_used_for_training": "kambale/luganda-english-parallel-corpus",
"training_epochs": 50,
"batch_size": 128,
"learning_rate": 0.0005,
"best_validation_loss": 1.1906119108200073,
"bleu_on_test_set": 27.901593935858266
}