% Conference paper entry (two pages, 195--196) with an English title and
% Japanese author names and proceedings title.
% The booktitle translates roughly to "Proceedings of the 85th National Convention".
% Author names are stored in "Family, Given" form and joined with " and ".
% month uses the predefined BibTeX macro (unquoted) so that each style can
% render and localize the month name itself.
% NOTE(review): the Japanese fields are raw UTF-8; this presumably needs a
% Unicode-aware toolchain (e.g. Biber, upBibTeX) -- confirm for your build.
% NOTE(review): volume equals the year here; kept as exported -- confirm
% against the publisher record.
@inproceedings{weko_229896_1,
  author    = {鮑, 飛 and 石川, 孝明 and 渡辺, 裕},
  title     = {Research on Video Captioning with a Late Fusion Based Multimodal Transformer Network},
  booktitle = {第85回全国大会講演論文集},
  year      = {2023},
  volume    = {2023},
  number    = {1},
  pages     = {195--196},
  month     = feb,
}