Dr.V: A Hierarchical Perception-Temporal-Cognition Framework to Diagnose Video Hallucination by Fine-grained Spatial-Temporal Grounding
BibTeX
Copy
% arXiv preprint 2509.11866 (primary class cs.CV).
% "Dr.V" is braced in the title so that sentence-casing styles keep its capitalisation.
@misc{luo2025drvhierarchicalperceptiontemporalcognition,
  author        = {Luo, Meng and Wu, Shengqiong and Jing, Liqiang and Ju, Tianjie and Zheng, Li and Lai, Jinxiang and Wu, Tianlong and Du, Xinya and Li, Jian and Yan, Siyuan and Luo, Jiebo and Wang, William Yang and Fei, Hao and Lee, Mong-Li and Hsu, Wynne},
  title         = {{Dr.V}: A Hierarchical Perception-Temporal-Cognition Framework to Diagnose Video Hallucination by Fine-grained Spatial-Temporal Grounding},
  year          = {2025},
  eprint        = {2509.11866},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CV},
  url           = {https://arxiv.org/abs/2509.11866},
}