End of training

Files changed (6) hide show

README.md CHANGED Viewed

@@ -28,7 +28,7 @@ print(output["generated_text"])
 ## Training procedure
-[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/romain_fnc-xventures/Gradients-On-Demand/runs/cx014uko)
 This model was trained with DPO, a method introduced in [Direct Preference Optimization: Your Language Model is Secretly a Reward Model](https://huggingface.co/papers/2305.18290).

 ## Training procedure
+[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/romain_fnc-xventures/Gradients-On-Demand/runs/b1pe3qef)
 This model was trained with DPO, a method introduced in [Direct Preference Optimization: Your Language Model is Secretly a Reward Model](https://huggingface.co/papers/2305.18290).

adapter_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ca8bc6b9c40dbee3cbe94d2e96d13382a54c668c52be8a8936201a7579286ff5
 size 671250634

 version https://git-lfs.github.com/spec/v1
+oid sha256:079085281394f6c8f684d345baf657566ba7cdf0378dcc96b554d1fe41473087
 size 671250634

config.json CHANGED Viewed

@@ -1,5 +1,4 @@
 {
-  "_attn_implementation_autoset": true,
   "_name_or_path": "Intel/neural-chat-7b-v3-3",
   "architectures": [
     "MistralForCausalLM"
@@ -21,7 +20,7 @@
   "rope_theta": 10000.0,
   "sliding_window": 4096,
   "tie_word_embeddings": false,
-  "torch_dtype": "float16",
   "transformers_version": "4.46.0",
   "use_cache": false,
   "vocab_size": 32000

 {
   "_name_or_path": "Intel/neural-chat-7b-v3-3",
   "architectures": [
     "MistralForCausalLM"
   "rope_theta": 10000.0,
   "sliding_window": 4096,
   "tie_word_embeddings": false,
+  "torch_dtype": "bfloat16",
   "transformers_version": "4.46.0",
   "use_cache": false,
   "vocab_size": 32000

pytorch_model-00001-of-00004.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:87b1be796accf9c1d5c1d8e61a38e19815df6b4a8498d9902a9c7dd9fc950c30
 size 4924890283

 version https://git-lfs.github.com/spec/v1
+oid sha256:d9ee5fd5003382acc32bd7aa2e800c7785d6b28445e3473155e9d208e53364cd
 size 4924890283

pytorch_model-00002-of-00004.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:81f8b004977369a194b567c72f53fa619a75100b00faa509c470df040e844589
 size 4993591120

 version https://git-lfs.github.com/spec/v1
+oid sha256:6a8e8c82b33c9a733d59c7538fd6c1b407009993cf5fb2a9fa251a8300450cd8
 size 4993591120

pytorch_model-00003-of-00004.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cee96edb8f65dc813341d8c2d46a3b9c55e3356749b6235184aef0ee838d77bd
 size 4974198733

 version https://git-lfs.github.com/spec/v1
+oid sha256:86aeb528daf86754a53010f0b2a7df413b88323b312f4db64116b18228e0184f
 size 4974198733