Update README.md
Browse files
README.md
CHANGED
@@ -1,5 +1,6 @@
|
|
1 |
-
A Large Multimodal Reasoning Model.
|
2 |
|
|
|
3 |
```
|
4 |
from transformers import Qwen2_5_VLForConditionalGeneration, AutoTokenizer, AutoProcessor
|
5 |
from qwen_vl_utils import process_vision_info
|
@@ -87,4 +88,23 @@ output_text = processor.batch_decode(
|
|
87 |
generated_ids_trimmed, skip_special_tokens=True, clean_up_tokenization_spaces=False
|
88 |
)
|
89 |
print(output_text)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
90 |
```
|
|
|
1 |
+
# A Large Multimodal Reasoning Model
|
2 |
|
3 |
+
## Usage
|
4 |
```
|
5 |
from transformers import Qwen2_5_VLForConditionalGeneration, AutoTokenizer, AutoProcessor
|
6 |
from qwen_vl_utils import process_vision_info
|
|
|
88 |
generated_ids_trimmed, skip_special_tokens=True, clean_up_tokenization_spaces=False
|
89 |
)
|
90 |
print(output_text)
|
91 |
+
```
|
92 |
+
|
93 |
+
## Citations
|
94 |
+
```bibtex
|
95 |
+
@misc {di_zhang_2025,
|
96 |
+
author = { {Di Zhang} },
|
97 |
+
title = { Qwen2.5-VL-7B-R1-Distillation (Revision 6cc3c46) },
|
98 |
+
year = 2025,
|
99 |
+
url = { https://huggingface.co/di-zhang-fdu/Qwen2.5-VL-7B-R1-Distillation },
|
100 |
+
doi = { 10.57967/hf/4710 },
|
101 |
+
publisher = { Hugging Face }
|
102 |
+
}
|
103 |
+
|
104 |
+
@article{zhang2024critic,
|
105 |
+
title={Critic-V: VLM Critics Help Catch VLM Errors in Multimodal Reasoning},
|
106 |
+
author={Zhang, Di and Lei, Jingdi and Li, Junxian and Wang, Xunzhi and Liu, Yujie and Yang, Zonglin and Li, Jiatong and Wang, Weida and Yang, Suorong and Wu, Jianbo and others},
|
107 |
+
journal={arXiv preprint arXiv:2411.18203},
|
108 |
+
year={2024}
|
109 |
+
}
|
110 |
```
|