% OW-VISCap arXiv preprint (arXiv identifier 2404.03657).
% The identifier is stored in the eprint/archiveprefix fields rather than in a
% journal field, so eprint-aware styles can format and hyperlink it themselves.
% The citation key is unchanged, so existing cite commands keep working.
@misc{choudhuri2024ow,
  author        = {Choudhuri, Anwesa and Chowdhary, Girish and Schwing, Alexander G.},
  title         = {{OW-VISCap}: Open-World Video Instance Segmentation and Captioning},
  year          = {2024},
  eprint        = {2404.03657},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2404.03657},
}