This repo holds the code for the paper "Vision Enhanced Generative Pre-trained Language Model for Multimodal Sentence Summarization", published in the journal Machine Intelligence Research (Mach. Intell. Res.).
If you find it helpful, feel free to cite the following publication:
@article{DBLP:journals/ijautcomp/JingLXYSS23,
  author  = {Jing, Liqiang and
             Li, Yiren and
             Xu, Junhao and
             Yu, Yongcan and
             Shen, Pei and
             Song, Xuemeng},
  title   = {Vision Enhanced Generative Pre-trained Language Model for Multimodal Sentence Summarization},
  journal = {Machine Intelligence Research},
  volume  = {20},
  number  = {2},
  pages   = {289--298},
  year    = {2023},
  doi     = {10.1007/s11633-022-1372-x},
}