Model save

Files changed (9) hide show

README.md CHANGED Viewed

@@ -1,11 +1,9 @@
 ---
 base_model: Qwen/Qwen2-VL-2B-Instruct
-datasets: MMInstruction/Clevr_CoGenT_TrainA_R1
 library_name: transformers
 model_name: Qwen2-VL-2B-Instruct-SFT
 tags:
 - generated_from_trainer
-- R1-V
 - trl
 - sft
 licence: license
@@ -13,7 +11,7 @@ licence: license
 # Model Card for Qwen2-VL-2B-Instruct-SFT
-This model is a fine-tuned version of [Qwen/Qwen2-VL-2B-Instruct](https://huggingface.co/Qwen/Qwen2-VL-2B-Instruct) on the [MMInstruction/Clevr_CoGenT_TrainA_R1](https://huggingface.co/datasets/MMInstruction/Clevr_CoGenT_TrainA_R1) dataset.
 It has been trained using [TRL](https://github.com/huggingface/trl).
 ## Quick start
@@ -29,7 +27,7 @@ print(output["generated_text"])
 ## Training procedure
-[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/2741919970-hustvl/huggingface/runs/hxbtcd5t)
 This model was trained with SFT.

 ---
 base_model: Qwen/Qwen2-VL-2B-Instruct
 library_name: transformers
 model_name: Qwen2-VL-2B-Instruct-SFT
 tags:
 - generated_from_trainer
 - trl
 - sft
 licence: license
 # Model Card for Qwen2-VL-2B-Instruct-SFT
+This model is a fine-tuned version of [Qwen/Qwen2-VL-2B-Instruct](https://huggingface.co/Qwen/Qwen2-VL-2B-Instruct).
 It has been trained using [TRL](https://github.com/huggingface/trl).
 ## Quick start
 ## Training procedure
+[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/2741919970-hustvl/huggingface/runs/kd2rv0e6)
 This model was trained with SFT.

all_results.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
-    "epoch": 0.9990182603573532,
-    "total_flos": 3801667199303680.0,
-    "train_loss": 0.13866351419509207,
-    "train_runtime": 19174.2073,
     "train_samples": 40742,
-    "train_samples_per_second": 2.125,
-    "train_steps_per_second": 0.033
 }

 {
+    "epoch": 0.9998919736415686,
+    "total_flos": 2.0789981999005696e+16,
+    "train_loss": 0.0,
+    "train_runtime": 2.6266,
     "train_samples": 40742,
+    "train_samples_per_second": 15511.09,
+    "train_steps_per_second": 242.135
 }

config.json CHANGED Viewed

@@ -31,7 +31,7 @@
   "tie_word_embeddings": true,
   "torch_dtype": "bfloat16",
   "transformers_version": "4.51.1",
-  "use_cache": true,
   "use_sliding_window": false,
   "video_token_id": 151656,
   "vision_config": {

   "tie_word_embeddings": true,
   "torch_dtype": "bfloat16",
   "transformers_version": "4.51.1",
+  "use_cache": false,
   "use_sliding_window": false,
   "video_token_id": 151656,
   "vision_config": {

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b273740cd5cd9da749e890d55f3aa7359dab6251a6b6efc9401e1679cac1fe73
 size 4418050848

 version https://git-lfs.github.com/spec/v1
+oid sha256:a93d511a98455c9d5009dcd7ea903d76fcb4303705b60a2d3a9362d1f716da4d
 size 4418050848

tokenizer.json CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:88a3a6fcb80132f76da8aa40cdc3fccd7e5d8468ef15421f5b0c2715e85217d2
-size 11420538

 version https://git-lfs.github.com/spec/v1
+oid sha256:091aa7594dc2fcfbfa06b9e3c22a5f0562ac14f30375c13af7309407a0e67b8a
+size 11420371

tokenizer_config.json CHANGED Viewed

@@ -138,7 +138,6 @@
   "model_max_length": 32768,
   "pad_token": "<|endoftext|>",
   "padding_side": "left",
-  "processor_class": "Qwen2VLProcessor",
   "split_special_tokens": false,
   "tokenizer_class": "Qwen2Tokenizer",
   "unk_token": null

   "model_max_length": 32768,
   "pad_token": "<|endoftext|>",
   "padding_side": "left",
   "split_special_tokens": false,
   "tokenizer_class": "Qwen2Tokenizer",
   "unk_token": null

train_results.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
-    "epoch": 0.9990182603573532,
-    "total_flos": 3801667199303680.0,
-    "train_loss": 0.13866351419509207,
-    "train_runtime": 19174.2073,
     "train_samples": 40742,
-    "train_samples_per_second": 2.125,
-    "train_steps_per_second": 0.033
 }

 {
+    "epoch": 0.9998919736415686,
+    "total_flos": 2.0789981999005696e+16,
+    "train_loss": 0.0,
+    "train_runtime": 2.6266,
     "train_samples": 40742,
+    "train_samples_per_second": 15511.09,
+    "train_steps_per_second": 242.135
 }

trainer_state.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e0ad5fbd3e0469121f3468c0072223705b7b01e3a9485a29ea073465504a8a2e
 size 7096

 version https://git-lfs.github.com/spec/v1
+oid sha256:5400234002a39681ded90e6b855bb91540f369831054877899b9164742860350
 size 7096