iyashnayi
/

SocioLens-llama-3.2-3B

Text Generation

Generated from Trainer

text-generation-inference

4-bit precision

Model card Files Files and versions Community

iyashnayi committed 23 days ago

Commit

e9a2a08

·

verified ·

1 Parent(s): 4e29401

iyashnayi/SocioLens-llama-3.2-3B

Files changed (4) hide show

README.md +1 -1
adapter_config.json +20 -7
adapter_model.safetensors +2 -2
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -27,7 +27,7 @@ print(output["generated_text"])
 ## Training procedure
-[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/yashnayi00-university-of-new-haven/huggingface/runs/r1mh79zm)
 This model was trained with SFT.

 ## Training procedure
+[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/yashnayi00-university-of-new-haven/huggingface/runs/2qg27orl)
 This model was trained with SFT.

adapter_config.json CHANGED Viewed

@@ -1,23 +1,36 @@
 {
   "auto_mapping": null,
   "base_model_name_or_path": "meta-llama/Llama-3.2-3B",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": true,
   "layers_pattern": null,
   "layers_to_transform": null,
-  "lora_alpha": 32,
-  "lora_dropout": 0.05,
   "modules_to_save": null,
   "peft_type": "LORA",
-  "r": 16,
   "revision": null,
   "target_modules": [
-    "q_proj",
     "k_proj",
-    "v_proj",
-    "o_proj"
   ],
-  "task_type": "CAUSAL_LM"
 }

 {
+  "alpha_pattern": {},
   "auto_mapping": null,
   "base_model_name_or_path": "meta-llama/Llama-3.2-3B",
   "bias": "none",
+  "corda_config": null,
+  "eva_config": null,
+  "exclude_modules": null,
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": true,
+  "layer_replication": null,
   "layers_pattern": null,
   "layers_to_transform": null,
+  "loftq_config": {},
+  "lora_alpha": 16,
+  "lora_bias": false,
+  "lora_dropout": 0.15,
+  "megatron_config": null,
+  "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
+  "r": 8,
+  "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "k_proj",
+    "o_proj",
+    "q_proj",
+    "v_proj"
   ],
+  "task_type": "CAUSAL_LM",
+  "trainable_token_indices": null,
+  "use_dora": false,
+  "use_rslora": false
 }

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:58628071bf6251f15c43ab108a9dfcc619577e514e8a4009144d6e1305d5537e
-size 36730224

 version https://git-lfs.github.com/spec/v1
+oid sha256:4c3be50ee8fbeaeb3e67984c730e276a795074a7c46176ffa70c37f34e226b8d
+size 18379784

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:67f5db76b3df48d7826532eb3fd17580a466d67b16ae396b9bdcd8afc3c629b2
 size 5624

 version https://git-lfs.github.com/spec/v1
+oid sha256:7dd2014c21bd34ab1494eee9ca8bccc38c94b5a65cb51c6169b0081d798ff27f
 size 5624