thouficatranslator / configuration
thaslimthoufica's picture
Create configuration
acbd1ad verified
{
  "model_name": "thaslimthoufica/english-tamil-translator",
  "base_model": "unsloth/Meta-Llama-3.1-8B-bnb-4bit",
  "dataset_name": "thaslimthoufica/English_tamil_dataset",
  "max_seq_length": 512,
  "dtype": "bfloat16",
  "load_in_4bit": true,
  "use_cache": false,
  "train_test_split": 0.2,
  "training_args": {
    "per_device_train_batch_size": 4,
    "per_device_eval_batch_size": 4,
    "num_train_epochs": 5,
    "learning_rate": 2e-5,
    "weight_decay": 0.01,
    "logging_steps": 50,
    "save_steps": 500,
    "evaluation_strategy": "epoch",
    "save_total_limit": 2,
    "push_to_hub": true
  },
  "trainer_settings": {
    "report_to": "wandb",
    "save_model_every_epoch": true
  }
}