Training in progress, step 10
Browse files
README.md
CHANGED
@@ -1,6 +1,5 @@
|
|
1 |
---
|
2 |
base_model: Qwen/Qwen2.5-VL-3B-Instruct
|
3 |
-
datasets: lmms-lab/multimodal-open-r1-8k-verified
|
4 |
library_name: transformers
|
5 |
model_name: Qwen2.5-VL-3B-Instruct-Thinking
|
6 |
tags:
|
@@ -12,7 +11,7 @@ licence: license
|
|
12 |
|
13 |
# Model Card for Qwen2.5-VL-3B-Instruct-Thinking
|
14 |
|
15 |
-
This model is a fine-tuned version of [Qwen/Qwen2.5-VL-3B-Instruct](https://huggingface.co/Qwen/Qwen2.5-VL-3B-Instruct)
|
16 |
It has been trained using [TRL](https://github.com/huggingface/trl).
|
17 |
|
18 |
## Quick start
|
|
|
1 |
---
|
2 |
base_model: Qwen/Qwen2.5-VL-3B-Instruct
|
|
|
3 |
library_name: transformers
|
4 |
model_name: Qwen2.5-VL-3B-Instruct-Thinking
|
5 |
tags:
|
|
|
11 |
|
12 |
# Model Card for Qwen2.5-VL-3B-Instruct-Thinking
|
13 |
|
14 |
+
This model is a fine-tuned version of [Qwen/Qwen2.5-VL-3B-Instruct](https://huggingface.co/Qwen/Qwen2.5-VL-3B-Instruct).
|
15 |
It has been trained using [TRL](https://github.com/huggingface/trl).
|
16 |
|
17 |
## Quick start
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 7393888
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16ad78ab6fa8ca02ae2d84afa2379bdc31da86eeab1529ca3f0f23c7d64a4120
|
3 |
size 7393888
|
preprocessor_config.json
CHANGED
@@ -1,4 +1,10 @@
|
|
1 |
{
|
|
|
|
|
|
|
|
|
|
|
|
|
2 |
"do_convert_rgb": true,
|
3 |
"do_normalize": true,
|
4 |
"do_rescale": true,
|
@@ -8,12 +14,13 @@
|
|
8 |
0.4578275,
|
9 |
0.40821073
|
10 |
],
|
11 |
-
"image_processor_type": "
|
12 |
"image_std": [
|
13 |
0.26862954,
|
14 |
0.26130258,
|
15 |
0.27577711
|
16 |
],
|
|
|
17 |
"max_pixels": 12845056,
|
18 |
"merge_size": 2,
|
19 |
"min_pixels": 3136,
|
@@ -21,6 +28,7 @@
|
|
21 |
"processor_class": "Qwen2_5_VLProcessor",
|
22 |
"resample": 3,
|
23 |
"rescale_factor": 0.00392156862745098,
|
|
|
24 |
"size": {
|
25 |
"longest_edge": 12845056,
|
26 |
"shortest_edge": 3136
|
|
|
1 |
{
|
2 |
+
"crop_size": null,
|
3 |
+
"data_format": "channels_first",
|
4 |
+
"default_to_square": true,
|
5 |
+
"device": null,
|
6 |
+
"disable_grouping": null,
|
7 |
+
"do_center_crop": null,
|
8 |
"do_convert_rgb": true,
|
9 |
"do_normalize": true,
|
10 |
"do_rescale": true,
|
|
|
14 |
0.4578275,
|
15 |
0.40821073
|
16 |
],
|
17 |
+
"image_processor_type": "Qwen2VLImageProcessorFast",
|
18 |
"image_std": [
|
19 |
0.26862954,
|
20 |
0.26130258,
|
21 |
0.27577711
|
22 |
],
|
23 |
+
"input_data_format": null,
|
24 |
"max_pixels": 12845056,
|
25 |
"merge_size": 2,
|
26 |
"min_pixels": 3136,
|
|
|
28 |
"processor_class": "Qwen2_5_VLProcessor",
|
29 |
"resample": 3,
|
30 |
"rescale_factor": 0.00392156862745098,
|
31 |
+
"return_tensors": null,
|
32 |
"size": {
|
33 |
"longest_edge": 12845056,
|
34 |
"shortest_edge": 3136
|
runs/Jul28_13-21-17_f76ea2c310ec/events.out.tfevents.1753708949.f76ea2c310ec.36632.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b99b1cc8d7053ed056eab6a48c538db5e4c33edf5eb40fa7c1ff940cee741c4f
|
3 |
+
size 10601
|
tokenizer_config.json
CHANGED
@@ -205,5 +205,6 @@
|
|
205 |
"processor_class": "Qwen2_5_VLProcessor",
|
206 |
"split_special_tokens": false,
|
207 |
"tokenizer_class": "Qwen2Tokenizer",
|
208 |
-
"unk_token": null
|
|
|
209 |
}
|
|
|
205 |
"processor_class": "Qwen2_5_VLProcessor",
|
206 |
"split_special_tokens": false,
|
207 |
"tokenizer_class": "Qwen2Tokenizer",
|
208 |
+
"unk_token": null,
|
209 |
+
"use_fast": true
|
210 |
}
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43028820679d4f6ee87f1f232ec6907e43bcdaa245be62b39aec0f5de9c20c4e
|
3 |
+
size 6584
|