English
mjjung commited on
Commit
0f255ef
·
1 Parent(s): d1d0080
Files changed (2) hide show
  1. TimeChat-7B-ActivityNet-VTune.pth +3 -0
  2. log.txt +113 -0
TimeChat-7B-ActivityNet-VTune.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1bf7dfc879b35a0afad7f54bd39a415323a78a9c0cba52f77369df64ca5e7cf
3
+ size 2897697291
log.txt ADDED
@@ -0,0 +1,113 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "run": {
3
+ "task": "video_text_pretrain",
4
+ "lr_sched": "linear_warmup_cosine_lr",
5
+ "init_lr": 3e-05,
6
+ "min_lr": 1e-05,
7
+ "warmup_lr": 1e-06,
8
+ "weight_decay": 0.05,
9
+ "max_epoch": 3,
10
+ "iters_per_epoch": 51377,
11
+ "batch_size_train": 2,
12
+ "batch_size_eval": 4,
13
+ "num_workers": 4,
14
+ "warmup_steps": 25688,
15
+ "accum_grad_iters": 8,
16
+ "seed": 42,
17
+ "output_dir": "/data/mjjung/timechat/activitynet_vtune",
18
+ "amp": true,
19
+ "resume_ckpt_path": null,
20
+ "evaluate": false,
21
+ "train_splits": [
22
+ "train"
23
+ ],
24
+ "device": "cuda",
25
+ "world_size": 4,
26
+ "dist_url": "env://",
27
+ "distributed": true,
28
+ "rank": 0,
29
+ "gpu": 0,
30
+ "dist_backend": "nccl"
31
+ },
32
+ "model": {
33
+ "arch": "timechat",
34
+ "image_size": 224,
35
+ "drop_path_rate": 0,
36
+ "use_grad_checkpoint": true,
37
+ "vit_precision": "fp16",
38
+ "freeze_vit": true,
39
+ "freeze_qformer": false,
40
+ "num_query_token": 32,
41
+ "llama_model": "/data/mjjung/Video-LLaMA/Video-LLaMA-2-7B-Finetuned/llama-2-7b-chat-hf/",
42
+ "prompt": "",
43
+ "model_type": "pretrain_llama_v2",
44
+ "vit_model": "/data/mjjung/timechat/eva_vit_g.pth",
45
+ "q_former_model": "/data/mjjung/timechat/instruct_blip_vicuna7b_trimmed.pth",
46
+ "ckpt": "/data/mjjung/timechat/timechat_7b.pth",
47
+ "frozen_llama_proj": false,
48
+ "frozen_video_Qformer": false,
49
+ "fusion_head_layers": 2,
50
+ "max_frame_pos": 96,
51
+ "fusion_header_type": "seqTransf",
52
+ "max_txt_len": 2048,
53
+ "end_sym": "</s>",
54
+ "prompt_path": "",
55
+ "prompt_template": "[INST] <<SYS>>\\n \\n<</SYS>>\\n\\n{} [/INST] ",
56
+ "lora": true,
57
+ "lora_inference_mode": false,
58
+ "qformer_text_input": true,
59
+ "window_size": 32,
60
+ "stride": 32
61
+ },
62
+ "preprocess": {
63
+ "vis_processor": {
64
+ "train": {
65
+ "name": "alpro_video_train",
66
+ "image_size": 224,
67
+ "n_frms": 8
68
+ },
69
+ "eval": {
70
+ "name": "alpro_video_eval",
71
+ "image_size": 224,
72
+ "n_frms": 8
73
+ }
74
+ },
75
+ "text_processor": {
76
+ "train": {
77
+ "name": "blip_caption"
78
+ },
79
+ "eval": {
80
+ "name": "blip_caption"
81
+ }
82
+ }
83
+ },
84
+ "datasets": {
85
+ "charades_instruct": {
86
+ "data_type": "video",
87
+ "build_info": {
88
+ "anno_dir": "data/activitynet_filtered_qa_grounding.json",
89
+ "videos_dir": "/data/video_datasets/"
90
+ },
91
+ "vis_processor": {
92
+ "train": {
93
+ "name": "alpro_video_train",
94
+ "n_frms": 96,
95
+ "image_size": 224
96
+ }
97
+ },
98
+ "text_processor": {
99
+ "train": {
100
+ "name": "blip_caption"
101
+ }
102
+ },
103
+ "num_video_query_token": 32,
104
+ "tokenizer_name": "/data/mjjung/Video-LLaMA/Video-LLaMA-2-7B-Finetuned/llama-2-7b-chat-hf/",
105
+ "model_type": "llama_v2",
106
+ "num_frm": 96,
107
+ "sample_type": "rand",
108
+ "max_txt_len": 2048,
109
+ "stride": 32
110
+ }
111
+ }
112
+ }
113
+ {"train_lr": "0.000", "train_loss": "0.162"}