Update README.md
Browse files
README.md
CHANGED
@@ -42,7 +42,7 @@ https://huggingface.co/Qwen/Qwen2.5-VL-3B-Instruct
|
|
42 |
**Image Process**
|
43 |
|Chips| input size | image num | image encoder | ttft(320 tokens) | w8a16 | DDR | Flash |
|
44 |
|--|--|--|--|--|--|--|--|
|
45 |
-
|AX650| 448*448 | 1 | 780 ms |
|
46 |
|
47 |
**Video Process**
|
48 |
|Chips| input size | image num | image encoder |ttft(512 tokens) | w8a16 | DDR | Flash |
|
@@ -104,15 +104,25 @@ root@ax650:/mnt/qtang/llm-test/qwen2.5-vl-3b# tree -L 2
|
|
104 |
|
105 |
```
|
106 |
|
|
|
|
|
107 |
#### Install transformers
|
108 |
|
109 |
```
|
110 |
pip install transformers==4.41.1
|
111 |
```
|
112 |
|
113 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
114 |
|
115 |
-
|
116 |
|
117 |
- input text
|
118 |
|
@@ -156,10 +166,18 @@ image >> image/ssd_car.jpg
|
|
156 |
[N][ Run][ 779]: hit eos,avg 5.96 token/s
|
157 |
```
|
158 |
|
159 |
-
|
160 |
|
161 |
Please pre-process the images of the video file into 308x308 pictures
|
162 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
163 |
```
|
164 |
root@ax650:/mnt/qtang/llm-test/qwen2.5-vl-3b# ./run_qwen2_5_vl_video.sh
|
165 |
[I][ Init][ 129]: LLM init start
|
|
|
42 |
**Image Process**
|
43 |
|Chips| input size | image num | image encoder | ttft(320 tokens) | w8a16 | DDR | Flash |
|
44 |
|--|--|--|--|--|--|--|--|
|
45 |
+
|AX650| 448*448 | 1 | 780 ms | 2857 ms | 6.2 tokens/sec| 4.3 GiB | 4.6 GiB |
|
46 |
|
47 |
**Video Process**
|
48 |
|Chips| input size | image num | image encoder |ttft(512 tokens) | w8a16 | DDR | Flash |
|
|
|
104 |
|
105 |
```
|
106 |
|
107 |
+
### Prepare tokenizer server
|
108 |
+
|
109 |
#### Install transformers
|
110 |
|
111 |
```
|
112 |
pip install transformers==4.41.1
|
113 |
```
|
114 |
|
115 |
+
### Demo Run
|
116 |
+
|
117 |
+
#### Image understanding demo
|
118 |
+
|
119 |
+
##### start tokenizer server for image understanding demo
|
120 |
+
|
121 |
+
```
|
122 |
+
python3 qwen2_tokenizer_image_448.py --port 12345
|
123 |
+
```
|
124 |
|
125 |
+
##### run image understanding demo
|
126 |
|
127 |
- input text
|
128 |
|
|
|
166 |
[N][ Run][ 779]: hit eos,avg 5.96 token/s
|
167 |
```
|
168 |
|
169 |
+
#### Video understanding demo
|
170 |
|
171 |
Please pre-process the images of the video file into 308x308 pictures
|
172 |
|
173 |
+
##### start tokenizer server for video understanding demo
|
174 |
+
|
175 |
+
```
|
176 |
+
python qwen2_tokenizer_video_308.py --port 12345
|
177 |
+
```
|
178 |
+
|
179 |
+
##### run video understanding demo
|
180 |
+
|
181 |
```
|
182 |
root@ax650:/mnt/qtang/llm-test/qwen2.5-vl-3b# ./run_qwen2_5_vl_video.sh
|
183 |
[I][ Init][ 129]: LLM init start
|