thaslimthoufica
/

thouficatranslator

Model card Files and versions Community

thaslimthoufica committed on Feb 19

Commit

acbd1ad

·

verified ·

1 Parent(s): fc95c0a

Create configuration

Files changed (1) hide show

configuration +26 -0

configuration ADDED Viewed

	@@ -0,0 +1,26 @@

+{
+  "model_name": "thaslimthoufica/english-tamil-translator",
+  "base_model": "unsloth/Meta-Llama-3.1-8B-bnb-4bit",
+  "dataset_name": "thaslimthoufica/English_tamil_dataset",
+  "max_seq_length": 512,
+  "dtype": "bfloat16",
+  "load_in_4bit": true,
+  "use_cache": false,
+  "train_test_split": 0.2,
+  "training_args": {
+    "per_device_train_batch_size": 4,
+    "per_device_eval_batch_size": 4,
+    "num_train_epochs": 5,
+    "learning_rate": 2e-5,
+    "weight_decay": 0.01,
+    "logging_steps": 50,
+    "save_steps": 500,
+    "evaluation_strategy": "epoch",
+    "save_total_limit": 2,
+    "push_to_hub": true
+  },
+  "trainer_settings": {
+    "report_to": "wandb",
+    "save_model_every_epoch": true
+  }
+}