Toward a Scalable and Grounded Data Engine for Video LLMs
@article{zhou2025strefer,
title={Strefer: Empowering Video LLMs with Space-Time Referring and Reasoning via Synthetic Instruction Data},
author={Zhou, Honglu and Peng, Xiangyu and Kendre, Shrikant and Ryoo, Michael S. and Savarese, Silvio and Xong, Caiming and Niebles, Juan Carlos},
journal={arXiv preprint arXiv:2509.03501},
year={2025}
}
}