🌐 Homepage | 🔬 Paper | 👩‍💻 Code | 📊 Dataset | 🤗 Model
conda create -n v2xumllm python=3.9 -y
conda activate v2xumllm
python -m v2xumllm.inference
@article{hua2024v2xum,
title={V2xum-llm: Cross-modal video summarization with temporal prompt instruction tuning},
author={Hua, Hang and Tang, Yunlong and Xu, Chenliang and Luo, Jiebo},
journal={arXiv preprint arXiv:2404.12353},
year={2024}
}