% IJCAI-24 main-track paper (see the note field below).
% Braced words in title/booktitle are protected from style-driven recasing;
% month uses the standard three-letter macro so each style can render it.
@inproceedings{ijcai2024p0193,
  author    = {Zhao, Liang and Yu, En and Ge, Zheng and Yang, Jinrong and Wei, Haoran and Zhou, Hongyu and Sun, Jianjian and Peng, Yuang and Dong, Runpei and Han, Chunrui and Zhang, Xiangyu},
  title     = {{ChatSpot}: Bootstrapping Multimodal {LLMs} via Precise Referring Instruction Tuning},
  booktitle = {Proceedings of the Thirty-Third International Joint Conference on Artificial Intelligence, {IJCAI-24}},
  editor    = {Larson, Kate},
  publisher = {International Joint Conferences on Artificial Intelligence Organization},
  pages     = {1743--1752},
  year      = {2024},
  month     = aug,
  note      = {Main Track},
  doi       = {10.24963/ijcai.2024/193},
  url       = {https://doi.org/10.24963/ijcai.2024/193},
}