Update README.md
Browse files
README.md
CHANGED
|
@@ -34,6 +34,14 @@ The primary intended users of the model are researchers in computer vision, natu
|
|
| 34 |
Please cite our paper if you find our resources useful:
|
| 35 |
|
| 36 |
```
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 37 |
@misc{lu2023vim,
|
| 38 |
title={VIM: Probing Multimodal Large Language Models for Visual Embedded Instruction Following},
|
| 39 |
author={Yujie Lu and Xiujun Li and William Yang Wang and Yejin Choi},
|
|
|
|
| 34 |
Please cite our paper if you find our resources useful:
|
| 35 |
|
| 36 |
```
|
| 37 |
+
@misc{li2024text,
|
| 38 |
+
title={Text as Images: Can Multimodal Large Language Models Follow Printed Instructions in Pixels?},
|
| 39 |
+
author={Xiujun Li and Yujie Lu and Zhe Gan and Jianfeng Gao and William Yang Wang and Yejin Choi},
|
| 40 |
+
year={2024},
|
| 41 |
+
eprint={2311.17647},
|
| 42 |
+
archivePrefix={arXiv},
|
| 43 |
+
primaryClass={cs.CV}
|
| 44 |
+
}
|
| 45 |
@misc{lu2023vim,
|
| 46 |
title={VIM: Probing Multimodal Large Language Models for Visual Embedded Instruction Following},
|
| 47 |
author={Yujie Lu and Xiujun Li and William Yang Wang and Yejin Choi},
|