Update README.md
Browse files
README.md
CHANGED
@@ -57,3 +57,29 @@ print(res)
|
|
57 |
|
58 |
```
|
59 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
57 |
|
58 |
```
|
59 |
|
60 |
+
|
61 |
+
|
62 |
+
## More Multimodal Projects
|
63 |
+
|
64 |
+
👏 You are welcome to explore more multimodal projects from our team:
|
65 |
+
|
66 |
+
[Vary](https://github.com/Ucas-HaoranWei/Vary) | [Fox](https://github.com/ucaslcl/Fox) | [OneChart](https://github.com/LingyvKong/OneChart)
|
67 |
+
|
68 |
+
## Citation
|
69 |
+
|
70 |
+
If you find our work helpful, please consider citing our papers 📝 and liking this project ❤️!
|
71 |
+
|
72 |
+
```bib
|
73 |
+
@article{wei2024general,
|
74 |
+
title={General OCR Theory: Towards OCR-2.0 via a Unified End-to-end Model},
|
75 |
+
author={Wei, Haoran and Liu, Chenglong and Chen, Jinyue and Wang, Jia and Kong, Lingyu and Xu, Yanming and Ge, Zheng and Zhao, Liang and Sun, Jianjian and Peng, Yuang and others},
|
76 |
+
journal={arXiv preprint arXiv:2409.01704},
|
77 |
+
year={2024}
|
78 |
+
}
|
79 |
+
@article{wei2023vary,
|
80 |
+
title={Vary: Scaling up the Vision Vocabulary for Large Vision-Language Models},
|
81 |
+
author={Wei, Haoran and Kong, Lingyu and Chen, Jinyue and Zhao, Liang and Ge, Zheng and Yang, Jinrong and Sun, Jianjian and Han, Chunrui and Zhang, Xiangyu},
|
82 |
+
journal={arXiv preprint arXiv:2312.06109},
|
83 |
+
year={2023}
|
84 |
+
}
|
85 |
+
```
|