{
  "model_name": "thaslimthoufica/english-tamil-translator",
  "base_model": "unsloth/Meta-Llama-3.1-8B-bnb-4bit",
  "dataset_name": "thaslimthoufica/English_tamil_dataset",
  "max_seq_length": 512,
  "dtype": "bfloat16",
  "load_in_4bit": true,
  "use_cache": false,
  "train_test_split": 0.2,
  "training_args": {
    "per_device_train_batch_size": 4,
    "per_device_eval_batch_size": 4,
    "num_train_epochs": 5,
    "learning_rate": 2e-5,
    "weight_decay": 0.01,
    "logging_steps": 50,
    "save_steps": 500,
    "evaluation_strategy": "epoch",
    "save_total_limit": 2,
    "push_to_hub": true
  },
  "trainer_settings": {
    "report_to": "wandb",
    "save_model_every_epoch": true
  }
}