EnriqueSolarte committed on
Commit
c8bfb70
·
verified ·
1 Parent(s): c427317

Training in progress, epoch 1

Browse files
README.md CHANGED
@@ -1,5 +1,5 @@
1
  ---
2
- base_model: Qwen/Qwen2.5-VL-7B-Instruct
3
  library_name: transformers
4
  model_name: qwen2.5-VL-7B-instruct-00004-VqCaAuuoeWk_0
5
  tags:
@@ -11,7 +11,7 @@ licence: license
11
 
12
  # Model Card for qwen2.5-VL-7B-instruct-00004-VqCaAuuoeWk_0
13
 
14
- This model is a fine-tuned version of [Qwen/Qwen2.5-VL-7B-Instruct](https://huggingface.co/Qwen/Qwen2.5-VL-7B-Instruct).
15
  It has been trained using [TRL](https://github.com/huggingface/trl).
16
 
17
  ## Quick start
 
1
  ---
2
+ base_model: UCSC-VLAA/VLAA-Thinker-Qwen2.5VL-3B
3
  library_name: transformers
4
  model_name: qwen2.5-VL-7B-instruct-00004-VqCaAuuoeWk_0
5
  tags:
 
11
 
12
  # Model Card for qwen2.5-VL-7B-instruct-00004-VqCaAuuoeWk_0
13
 
14
+ This model is a fine-tuned version of [UCSC-VLAA/VLAA-Thinker-Qwen2.5VL-3B](https://huggingface.co/UCSC-VLAA/VLAA-Thinker-Qwen2.5VL-3B).
15
  It has been trained using [TRL](https://github.com/huggingface/trl).
16
 
17
  ## Quick start
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "Qwen/Qwen2.5-VL-7B-Instruct",
5
  "bias": "none",
6
  "corda_config": null,
7
  "eva_config": null,
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "UCSC-VLAA/VLAA-Thinker-Qwen2.5VL-3B",
5
  "bias": "none",
6
  "corda_config": null,
7
  "eva_config": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:832421a1bed0ec02e349d8746f3b9b345e38ead2c05a3641b850acc29b629963
3
- size 10108960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60c39a0b2982363789261b33e20a51e2158f3f232d8ab89530a449a4a0b5e67a
3
+ size 7393888
preprocessor_config.json CHANGED
@@ -21,7 +21,7 @@
21
  0.27577711
22
  ],
23
  "input_data_format": null,
24
- "max_pixels": 12845056,
25
  "merge_size": 2,
26
  "min_pixels": 3136,
27
  "patch_size": 14,
@@ -30,7 +30,7 @@
30
  "rescale_factor": 0.00392156862745098,
31
  "return_tensors": null,
32
  "size": {
33
- "longest_edge": 12845056,
34
  "shortest_edge": 3136
35
  },
36
  "temporal_patch_size": 2
 
21
  0.27577711
22
  ],
23
  "input_data_format": null,
24
+ "max_pixels": 501760,
25
  "merge_size": 2,
26
  "min_pixels": 3136,
27
  "patch_size": 14,
 
30
  "rescale_factor": 0.00392156862745098,
31
  "return_tensors": null,
32
  "size": {
33
+ "longest_edge": 501760,
34
  "shortest_edge": 3136
35
  },
36
  "temporal_patch_size": 2
runs/Sep09_15-32-32_workstation-one/events.out.tfevents.1757431963.workstation-one.1228196.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:252cfbd48232339693b25f34e04b45cd539ce56267d4ee69b1452246dd2752f0
3
+ size 10747
tokenizer_config.json CHANGED
@@ -199,10 +199,13 @@
199
  "eos_token": "<|im_end|>",
200
  "errors": "replace",
201
  "extra_special_tokens": {},
 
 
202
  "model_max_length": 131072,
203
  "pad_token": "<|endoftext|>",
204
  "processor_class": "Qwen2_5_VLProcessor",
205
  "split_special_tokens": false,
206
  "tokenizer_class": "Qwen2Tokenizer",
207
- "unk_token": null
 
208
  }
 
199
  "eos_token": "<|im_end|>",
200
  "errors": "replace",
201
  "extra_special_tokens": {},
202
+ "max_pixels": 501760,
203
+ "min_pixels": 3136,
204
  "model_max_length": 131072,
205
  "pad_token": "<|endoftext|>",
206
  "processor_class": "Qwen2_5_VLProcessor",
207
  "split_special_tokens": false,
208
  "tokenizer_class": "Qwen2Tokenizer",
209
+ "unk_token": null,
210
+ "use_fast": true
211
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3dd1341587efc15903605ae5e5e373891d4c6b006a9ae24f855c03d1e1373dcc
3
- size 6353
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f4a607f106199b8cada31e14d82dc5dffda3c28c9eca97ec41c741f684d2366
3
+ size 6417
video_preprocessor_config.json CHANGED
@@ -16,6 +16,7 @@
16
  0.4578275,
17
  0.40821073
18
  ],
 
19
  "image_std": [
20
  0.26862954,
21
  0.26130258,
@@ -23,7 +24,7 @@
23
  ],
24
  "input_data_format": null,
25
  "max_frames": 768,
26
- "max_pixels": 12845056,
27
  "merge_size": 2,
28
  "min_frames": 4,
29
  "min_pixels": 3136,
@@ -34,7 +35,7 @@
34
  "rescale_factor": 0.00392156862745098,
35
  "return_metadata": false,
36
  "size": {
37
- "longest_edge": 12845056,
38
  "shortest_edge": 3136
39
  },
40
  "size_divisor": null,
 
16
  0.4578275,
17
  0.40821073
18
  ],
19
+ "image_processor_type": "Qwen2VLImageProcessorFast",
20
  "image_std": [
21
  0.26862954,
22
  0.26130258,
 
24
  ],
25
  "input_data_format": null,
26
  "max_frames": 768,
27
+ "max_pixels": 501760,
28
  "merge_size": 2,
29
  "min_frames": 4,
30
  "min_pixels": 3136,
 
35
  "rescale_factor": 0.00392156862745098,
36
  "return_metadata": false,
37
  "size": {
38
+ "longest_edge": 501760,
39
  "shortest_edge": 3136
40
  },
41
  "size_divisor": null,