% Journal article: IEEE Transactions on Circuits and Systems for Video Technology, vol. 35, no. 5 (2025).
% The citation key is kept unchanged so existing citations still resolve.
% The page range uses a double hyphen so styles typeset it as an en dash.
@article{10789221,
  author   = {You, Zeng and Wen, Zhiquan and Chen, Yaofo and Li, Xin and Zeng, Runhao and Wang, Yaowei and Tan, Mingkui},
  title    = {Toward Long Video Understanding via Fine-Detailed Video Story Generation},
  journal  = {IEEE Transactions on Circuits and Systems for Video Technology},
  year     = {2025},
  volume   = {35},
  number   = {5},
  pages    = {4592--4607},
  doi      = {10.1109/TCSVT.2024.3514820},
  keywords = {Visualization;Termination of employment;Semantics;Circuits and systems;Large language models;Feature extraction;Training;Streaming media;Redundancy;Interference;Foundation models;video understanding;large language models},
}