Update README.md
Browse files
README.md
CHANGED
@@ -34,6 +34,14 @@ The primary intended users of the model are researchers in computer vision, natu
|
|
34 |
Please kindly cite our paper if you find our resources useful:
|
35 |
|
36 |
```
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
37 |
@misc{lu2023vim,
|
38 |
title={VIM: Probing Multimodal Large Language Models for Visual Embedded Instruction Following},
|
39 |
author={Yujie Lu and Xiujun Li and William Yang Wang and Yejin Choi},
|
|
|
34 |
Please kindly cite our paper if you find our resources useful:
|
35 |
|
36 |
```
|
37 |
+
@misc{li2024text,
|
38 |
+
title={Text as Images: Can Multimodal Large Language Models Follow Printed Instructions in Pixels?},
|
39 |
+
author={Xiujun Li and Yujie Lu and Zhe Gan and Jianfeng Gao and William Yang Wang and Yejin Choi},
|
40 |
+
year={2024},
|
41 |
+
eprint={2311.17647},
|
42 |
+
archivePrefix={arXiv},
|
43 |
+
primaryClass={cs.CV}
|
44 |
+
}
|
45 |
@misc{lu2023vim,
|
46 |
title={VIM: Probing Multimodal Large Language Models for Visual Embedded Instruction Following},
|
47 |
author={Yujie Lu and Xiujun Li and William Yang Wang and Yejin Choi},
|