% ECCV 2024 conference paper. The eprint identifier below is the arXiv ID
% taken from the url field; the edition year lives only in the year field.
@inproceedings{xiao2024grounding,
  author        = {Xiao, Zilin and Gong, Ming and Cascante-Bonilla, Paola and Zhang, Xingyao and Wu, Jie and Ordonez, Vicente},
  title         = {Grounding Language Models for Visual Entity Recognition},
  booktitle     = {European Conference on Computer Vision ({ECCV})},
  year          = {2024},
  eprint        = {2402.18695},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2402.18695},
}