@article{bb244100,
        AUTHOR = "Tapaswi, M. and Bauml, M. and Stiefelhagen, R.",
        TITLE = "Aligning plot synopses to videos for story-based retrieval",
        JOURNAL = MultInfoRetr,
        VOLUME = "4",
        YEAR = "2015",
        NUMBER = "1",
        MONTH = "March",
        PAGES = "3-16",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT238992"}

@inproceedings{bb244101,
        AUTHOR = "Tapaswi, M. and Bauml, M. and Stiefelhagen, R.",
        TITLE = "Book2Movie: Aligning video scenes with book chapters",
        BOOKTITLE = CVPR15,
        YEAR = "2015",
        PAGES = "1827-1835",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT238993"}

@article{bb244102,
        AUTHOR = "Ahmadzade, A.M. and Farsi, H.",
        TITLE = "Video Summarization by an Innovative Method in Shot Detection",
        JOURNAL = ELCVIA,
        VOLUME = "14",
        YEAR = "2015",
        NUMBER = "1",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT238994"}

@article{bb244103,
        AUTHOR = "Li, K. and Wang, J. and Wang, H. and Dai, Q.H.",
        TITLE = "Structuring Lecture Videos by Automatic Projection Screen
Localization and Analysis",
        JOURNAL = PAMI,
        VOLUME = "37",
        YEAR = "2015",
        NUMBER = "6",
        MONTH = "June",
        PAGES = "1233-1246",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT238995"}

@article{bb244104,
        AUTHOR = "Chu, W.T. and Yu, C.H. and Wang, H.H.",
        TITLE = "Optimized Comics-Based Storytelling for Temporal Image Sequences",
        JOURNAL = MultMed,
        VOLUME = "17",
        YEAR = "2015",
        NUMBER = "2",
        MONTH = "February",
        PAGES = "201-215",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT238996"}

@article{bb244105,
        AUTHOR = "Mademlis, I. and Tefas, A. and Nikolaidis, N. and Pitas, I.",
        TITLE = "Multimodal Stereoscopic Movie Summarization Conforming to Narrative
Characteristics",
        JOURNAL = IP,
        VOLUME = "25",
        YEAR = "2016",
        NUMBER = "12",
        MONTH = "December",
        PAGES = "5828-5840",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT238997"}

@article{bb244106,
        AUTHOR = "Aparicio, M. and Figueiredo, P. and Raposo, F. and de Matos, D.M. and Ribeiro, R. and Marujo, L.",
        TITLE = "Summarization of films and documentaries based on subtitles and
scripts",
        JOURNAL = PRL,
        VOLUME = "73",
        YEAR = "2016",
        NUMBER = "1",
        PAGES = "7-12",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT238998"}

@article{bb244107,
        AUTHOR = "Baraldi, L. and Grana, C. and Cucchiara, R.",
        TITLE = "Recognizing and Presenting the Storytelling Video Structure With Deep
Multimodal Networks",
        JOURNAL = MultMed,
        VOLUME = "19",
        YEAR = "2017",
        NUMBER = "5",
        MONTH = "May",
        PAGES = "955-968",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT238999"}

@article{bb244108,
        AUTHOR = "Lu, Q. and Chai, B.J. and Zhang, H.B.",
        TITLE = "Storytelling by the StoryCake visualization",
        JOURNAL = VC,
        VOLUME = "33",
        YEAR = "2017",
        NUMBER = "10",
        MONTH = "October",
        PAGES = "1241-1252",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239000"}

@article{bb244109,
        AUTHOR = "Somandepalli, K. and Kumar, N. and Guha, T. and Narayanan, S.S.",
        TITLE = "Unsupervised Discovery of Character Dictionaries in Animation Movies",
        JOURNAL = MultMed,
        VOLUME = "20",
        YEAR = "2018",
        NUMBER = "3",
        MONTH = "March",
        PAGES = "539-551",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239001"}

@article{bb244110,
        AUTHOR = "Berendsen, M.E. and Hamerlinck, J.D. and Webster, G.R.",
        TITLE = "Digital Story Mapping to Advance Educational Atlas Design and Enable
Student Engagement",
        JOURNAL = IJGI,
        VOLUME = "7",
        YEAR = "2018",
        NUMBER = "3",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239002"}

@article{bb244111,
        AUTHOR = "Yang, X.S. and Zhang, T.Z. and Xu, C.S.",
        TITLE = "Text2Video:
An End-to-end Learning Framework for Expressing Text With Videos",
        JOURNAL = MultMed,
        VOLUME = "20",
        YEAR = "2018",
        NUMBER = "9",
        MONTH = "September",
        PAGES = "2360-2370",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239003"}

@inproceedings{bb244112,
        AUTHOR = "Sun, K. and Lei, Z. and Zhu, J.S. and Hou, X.X. and Liu, B. and Qiu, G.P.",
        TITLE = "Character Prediction in TV Series via a Semantic Projection Network",
        BOOKTITLE = "MMMod19",
        YEAR = "2019",
        PAGES = "I:300-311",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239004"}

@article{bb244113,
        AUTHOR = "Nabati, M. and Behrad, A.",
        TITLE = "Video captioning using boosted and parallel Long Short-Term Memory
networks",
        JOURNAL = CVIU,
        VOLUME = "190",
        YEAR = "2020",
        PAGES = "102840",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239005"}

@article{bb244114,
        AUTHOR = "Xiao, H.H. and Xu, J.W. and Shi, J.L.",
        TITLE = "Exploring diverse and fine-grained caption for video by incorporating
convolutional architecture into LSTM-based model",
        JOURNAL = PRL,
        VOLUME = "129",
        YEAR = "2020",
        PAGES = "173-180",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239006"}

@article{bb244115,
        AUTHOR = "Han, Y. and Wang, B. and Hong, R. and Wu, F.",
        TITLE = "Movie Question Answering via Textual Memory and Plot Graph",
        JOURNAL = CirSysVideo,
        VOLUME = "30",
        YEAR = "2020",
        NUMBER = "3",
        MONTH = "March",
        PAGES = "875-887",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239007"}

@article{bb244116,
        AUTHOR = "Zhou, P. and Xu, T. and Yin, Z. and Liu, D. and Chen, E. and Lv, G. and Li, C.",
        TITLE = "Character-Oriented Video Summarization With Visual and Textual Cues",
        JOURNAL = MultMed,
        VOLUME = "22",
        YEAR = "2020",
        NUMBER = "10",
        MONTH = "October",
        PAGES = "2684-2697",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239008"}

@inproceedings{bb244117,
        AUTHOR = "Fujita, S. and Hirao, T. and Kamigaito, H. and Okumura, M. and Nagata, M.",
        TITLE = "Soda: Story Oriented Dense Video Captioning Evaluation Framework",
        BOOKTITLE = ECCV20,
        YEAR = "2020",
        PAGES = "VI:517-531",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239009"}

@article{bb244118,
        AUTHOR = "Ghose, S. and Prevost, J.J.",
        TITLE = "AutoFoley: Artificial Synthesis of Synchronized Sound Tracks for
Silent Videos With Deep Learning",
        JOURNAL = MultMed,
        VOLUME = "23",
        YEAR = "2021",
        PAGES = "1895-1907",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239010"}

@article{bb244119,
        AUTHOR = "Apostolidis, E. and Adamantidou, E. and Metsai, A.I. and Mezaris, V. and Patras, I.",
        TITLE = "AC-SUM-GAN: Connecting Actor-Critic and Generative Adversarial
Networks for Unsupervised Video Summarization",
        JOURNAL = CirSysVideo,
        VOLUME = "31",
        YEAR = "2021",
        NUMBER = "8",
        MONTH = "August",
        PAGES = "3278-3292",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239011"}

@article{bb244120,
        AUTHOR = "Liu, D. and Kamath, N. and Bhattacharya, S. and Puri, R.",
        TITLE = "Adaptive Context Reading Network for Movie Scene Detection",
        JOURNAL = CirSysVideo,
        VOLUME = "31",
        YEAR = "2021",
        NUMBER = "9",
        MONTH = "September",
        PAGES = "3559-3574",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239012"}

@article{bb244121,
        AUTHOR = "Wang, J.Y. and Xu, M. and Jiang, L. and Song, Y.H.",
        TITLE = "Attention-Based Deep Reinforcement Learning for Virtual
Cinematography of 360{$^\circ$} Videos",
        JOURNAL = MultMed,
        VOLUME = "23",
        YEAR = "2021",
        PAGES = "3227-3238",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239013"}

@article{bb244122,
        AUTHOR = "Wu, A. and Han, Y.H. and Zhao, Z. and Yang, Y.",
        TITLE = "Hierarchical Memory Decoder for Visual Narrating",
        JOURNAL = CirSysVideo,
        VOLUME = "31",
        YEAR = "2021",
        NUMBER = "6",
        MONTH = "June",
        PAGES = "2438-2449",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239014"}

@article{bb244123,
        AUTHOR = "Xie, J.H. and Chen, X.B. and Zhang, T.Y. and Zhang, Y.X. and Lu, S.P. and Cesar, P. and Yang, Y.",
        TITLE = "Multimodal-Based and Aesthetic-Guided Narrative Video Summarization",
        JOURNAL = MultMed,
        VOLUME = "25",
        YEAR = "2023",
        PAGES = "4894-4908",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239015"}

@article{bb244124,
        AUTHOR = "Papalampidi, P. and Keller, F. and Lapata, M.",
        TITLE = "Finding the Right Moment: Human-Assisted Trailer Creation via Task
Composition",
        JOURNAL = PAMI,
        VOLUME = "46",
        YEAR = "2024",
        NUMBER = "1",
        MONTH = "January",
        PAGES = "292-304",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239016"}

@article{bb244125,
        AUTHOR = "Lu, Y. and Ni, F.Y. and Wang, H. and Guo, X.F. and Zhu, L.C. and Yang, Z.X. and Song, R.H. and Cheng, L. and Yang, Y.",
        TITLE = "Show Me a Video: A Large-Scale Narrated Video Dataset for Coherent
Story Illustration",
        JOURNAL = MultMed,
        VOLUME = "26",
        YEAR = "2024",
        PAGES = "2456-2466",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239017"}

@article{bb244126,
        AUTHOR = "Yuan, M.Q. and Jia, G. and Bao, B.K.",
        TITLE = "GPT-Based Knowledge Guiding Network for Commonsense Video Captioning",
        JOURNAL = MultMed,
        VOLUME = "26",
        YEAR = "2024",
        PAGES = "5147-5158",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239018"}

@article{bb244127,
        AUTHOR = "Wang, Y.Z. and Hu, W.B. and Hong, R.C.",
        TITLE = "Iterative Adversarial Attack on Image-Guided Story Ending Generation",
        JOURNAL = MultMed,
        VOLUME = "26",
        YEAR = "2024",
        PAGES = "6117-6130",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239019"}

@article{bb244128,
        AUTHOR = "Chen, Z. and Zhang, K. and Cai, H. and Ding, X.Y. and Jiang, C.X. and Chen, Z.Z.",
        TITLE = "Audio-visual saliency prediction for movie viewing in immersive
environments: Dataset and benchmarks",
        JOURNAL = JVCIR,
        VOLUME = "100",
        YEAR = "2024",
        PAGES = "104095",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239020"}

@article{bb244129,
        AUTHOR = "Kaur, P.C. and Ragha, L.",
        TITLE = "Optimized deep learning enabled lecture audio video summarization",
        JOURNAL = JVCIR,
        VOLUME = "104",
        YEAR = "2024",
        PAGES = "104309",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239021"}

@inproceedings{bb244130,
        AUTHOR = "Tao, M. and Bao, B.K. and Tang, H. and Wang, Y.W. and Xu, C.S.",
        TITLE = "Storyimager: A Unified and Efficient Framework for Coherent Story
Visualization and Completion",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "LVI: 479-495",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239022"}

@article{bb244131,
        AUTHOR = "Guo, J.H. and Lu, A. and Wu, Z.Q. and Wang, Z.Y. and Liang, C.",
        TITLE = "Who, What, and Where: Composite-Semantics Instance Search for Story
Videos",
        JOURNAL = IP,
        VOLUME = "34",
        YEAR = "2025",
        PAGES = "1412-1426",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239023"}

@article{bb244132,
        AUTHOR = "Qin, P.G. and Xu, T. and Zhang, C. and Wang, H. and Hu, Y. and Chen, E.",
        TITLE = "Scenario-Aware Multimodal Chain-of-Thought Prompting for Rationales
of Video Social Relations",
        JOURNAL = CirSysVideo,
        VOLUME = "35",
        YEAR = "2025",
        NUMBER = "11",
        MONTH = "November",
        PAGES = "11598-11612",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239024"}

@inproceedings{bb244133,
        AUTHOR = "Wang, H.L. and Tong, Z. and Zheng, K. and Shen, Y.J. and Wang, L.M.",
        TITLE = "Contextual AD Narration with Interleaved Multimodal Sequence",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "8372-8383",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239025"}

@inproceedings{bb244134,
        AUTHOR = "Kim, S. and Do, S. and Park, J.",
        TITLE = "ShowMak3r: Compositional TV Show Reconstruction",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "864-874",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239026"}

@inproceedings{bb244135,
        AUTHOR = "Wu, W.J. and Liu, M.Y. and Zhu, Z. and Xia, X. and Feng, H. and Wang, W. and Lin, K.Q. and Shen, C.H. and Shou, M.Z.",
        TITLE = "MovieBench: A Hierarchical Movie Level Dataset for Long Video
Generation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "28984-28994",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239027"}

@inproceedings{bb244136,
        AUTHOR = "Park, J. and Ye, J. and Lee, S. and Ka, H.W. and Han, D.",
        TITLE = "NarrAD: Automatic Generation of Audio Descriptions for Movies with
Rich Narrative Context",
        BOOKTITLE = WACV25,
        YEAR = "2025",
        PAGES = "409-419",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239028"}

@inproceedings{bb244137,
        AUTHOR = "Zhang, C. and Lei, Y.M. and Liu, Z. and Leng, H.T. and Liu, S. and Gao, T.T. and Liu, Q.J. and Wang, Y.H.",
        TITLE = "SeriesBench: A Benchmark for Narrative-Driven Drama Series
Understanding",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "28995-29004",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239029"}

@inproceedings{bb244138,
        AUTHOR = "Lin, K.Q. and Zhang, P. and Gao, D.F. and Xia, X. and Chen, J. and Gao, Z.T. and Xie, J.H. and Xiao, X.H. and Shou, M.Z.",
        TITLE = "Learning Video Context as Interleaved Multimodal Sequences",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "XLIX: 375-396",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239030"}

@inproceedings{bb244139,
        AUTHOR = "Avetisyan, A. and Xie, C. and Howard Jenkins, H. and Yang, T.Y. and Aroudj, S. and Patra, S. and Zhang, F. and Frost, D. and Holland, L. and Orme, C. and Engel, J. and Miller, E. and Newcombe, R. and Balntas, V.",
        TITLE = "Scenescript: Reconstructing Scenes with an Autoregressive Structured
Language Model",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "LXI: 247-263",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239031"}

@inproceedings{bb244140,
        AUTHOR = "Shvetsova, N. and Kukleva, A. and Hong, X.D. and Rupprecht, C. and Schiele, B. and Kuehne, H.",
        TITLE = "Howtocaption: Prompting LLMs to Transform Video Annotations at Scale",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "LVI: 1-18",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239032"}

@inproceedings{bb244141,
        AUTHOR = "Tan, J.W. and Wang, H.X. and Li, J.X. and Ou, Z.L. and Qian, Z.",
        TITLE = "Neighbor Relations Matter in Video Scene Detection",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "18473-18482",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239033"}

@inproceedings{bb244142,
        AUTHOR = "Raajesh, H. and Desanur, N.R. and Khan, Z. and Tapaswi, M.",
        TITLE = "MICap: A Unified Model for Identity-Aware Movie Descriptions",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "14011-14021",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239034"}

@inproceedings{bb244143,
        AUTHOR = "Argaw, D.M. and Soldan, M. and Pardo, A. and Zhao, C. and Heilbron, F.C. and Chung, J.S. and Ghanem, B.",
        TITLE = "Towards Automated Movie Trailer Generation",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "7445-7454",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239035"}

@inproceedings{bb244144,
        AUTHOR = "Singh, A.K. and Srivastava, D. and Tapaswi, M.",
        TITLE = "'Previously on...' from Recaps to Story Summarization",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "13635-13646",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239036"}

@inproceedings{bb244145,
        AUTHOR = "Pan, X.C. and Qin, P. and Li, Y.H. and Xue, H. and Chen, W.",
        TITLE = "Synthesizing Coherent Story with Auto-Regressive Latent Diffusion
Models",
        BOOKTITLE = WACV24,
        YEAR = "2024",
        PAGES = "2908-2918",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239037"}

@inproceedings{bb244146,
        AUTHOR = "Zhang, Z.P. and Gu, Y.W. and Plummer, B.A. and Miao, X. and Liu, J.Y. and Wang, H.",
        TITLE = "Movie Genre Classification by Language Augmentation and Shot Sampling",
        BOOKTITLE = WACV24,
        YEAR = "2024",
        PAGES = "7260-7270",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239038"}

@inproceedings{bb244147,
        AUTHOR = "Ahn, D.C. and Kim, D. and Song, G. and Kim, S.H. and Lee, H.L. and Kang, D. and Choi, J.H.",
        TITLE = "Story Visualization by Online Text Augmentation with Context Memory",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "3102-3112",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239039"}

@inproceedings{bb244148,
        AUTHOR = "Vacchetti, B. and Argaw, D.M. and Cerquitelli, T.",
        TITLE = "LEMMS: Label Estimation of Multi-feature Movie Segments",
        BOOKTITLE = CVEU23,
        YEAR = "2023",
        PAGES = "3019-3027",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239040"}

@inproceedings{bb244149,
        AUTHOR = "Han, T.D. and Bain, M. and Nagrani, A. and Varol, G. and Xie, W. and Zisserman, A.",
        TITLE = "AutoAD II: The Sequel - Who, When, and What in Movie Audio
Description",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "13599-13609",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239041"}

@inproceedings{bb244150,
        AUTHOR = "Argaw, D.M. and Lee, J.Y. and Woodson, M. and Kweon, I.S. and Heilbron, F.C.",
        TITLE = "Long-range Multimodal Pretraining for Movie Understanding",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "13346-13357",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239042"}

@inproceedings{bb244151,
        AUTHOR = "Sadoughi, N. and Li, X.Y. and Vajpayee, A. and Fan, D. and Shuai, B. and Santos Villalobos, H. and Bhat, V. and Mv, R.",
        TITLE = "MEGA: Multimodal Alignment Aggregation and Distillation For Cinematic
Video Segmentation",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "23274-23283",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239043"}

@inproceedings{bb244152,
        AUTHOR = "Han, T. and Bain, M. and Nagrani, A. and Varol, G. and Xie, W. and Zisserman, A.",
        TITLE = "AutoAD: Movie Description in Context",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "18930-18940",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239044"}

@inproceedings{bb244153,
        AUTHOR = "Rahman, T. and Lee, H.Y. and Ren, J. and Tulyakov, S. and Mahajan, S. and Sigal, L.",
        TITLE = "Make-A-Story: Visual Memory Conditioned Consistent Story Generation",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "2493-2502",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239045"}

@inproceedings{bb244154,
        AUTHOR = "Malakan, Z.M. and Hassan, G.M. and Jalwana, M.A.A.K. and Aafaq, N. and Mian, A.",
        TITLE = "Semantic Attribute Enriched Storytelling from a Sequence of Images",
        BOOKTITLE = DICTA21,
        YEAR = "2021",
        PAGES = "1-8",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239046"}

@inproceedings{bb244155,
        AUTHOR = "Huang, Y.Z. and Bai, X. and Wang, O. and Caba, F. and Agarwala, A.",
        TITLE = "Learning Where to Cut from Edited Videos",
        BOOKTITLE = CVEU21,
        YEAR = "2021",
        PAGES = "3208-3216",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239047"}

@inproceedings{bb244156,
        AUTHOR = "Gaikwad, B. and Sontakke, A. and Patwardhan, M. and Pedanekar, N. and Karande, S.",
        TITLE = "Plots to Previews: Towards Automatic Movie Preview Retrieval using
Publicly Available Meta-data",
        BOOKTITLE = CVEU21,
        YEAR = "2021",
        PAGES = "3198-3207",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239048"}

@inproceedings{bb244157,
        AUTHOR = "Yu, Y.J. and Chung, J. and Yun, H.S. and Kim, J.S. and Kim, G.",
        TITLE = "Transitional Adaptation of Pretrained Models for Visual Storytelling",
        BOOKTITLE = CVPR21,
        YEAR = "2021",
        PAGES = "12653-12663",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239049"}

@inproceedings{bb244158,
        AUTHOR = "Reboud, A. and Troncy, R.",
        TITLE = "What You Say Is Not What You Do: Studying Visio-Linguistic Models for
TV Series Summarization",
        BOOKTITLE = CLVL21,
        YEAR = "2021",
        PAGES = "3142-3146",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239050"}

@inproceedings{bb244159,
        AUTHOR = "Hao, X. and Chettiar, K. and Cheung, B. and Germano, V. and Hamid, R.",
        TITLE = "Intro and Recap Detection for Movies and TV Series",
        BOOKTITLE = WACV21,
        YEAR = "2021",
        PAGES = "167-176",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239051"}

@inproceedings{bb244160,
        AUTHOR = "Bain, M. and Nagrani, A. and Brown, A. and Zisserman, A.",
        TITLE = "Condensed Movies: Story Based Retrieval with Contextual Embeddings",
        BOOKTITLE = ACCV20,
        YEAR = "2020",
        PAGES = "V:460-479",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239052"}

@inproceedings{bb244161,
        AUTHOR = "Wang, L. and Liu, D. and Puri, R. and Metaxas, D.N.",
        TITLE = "Learning Trailer Moments in Full-length Movies with Co-contrastive
Attention",
        BOOKTITLE = ECCV20,
        YEAR = "2020",
        PAGES = "XVIII:300-316",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239053"}

@inproceedings{bb244162,
        AUTHOR = "Huang, Q.Q. and Xiong, Y. and Rao, A. and Wang, J.Z. and Lin, D.H.",
        TITLE = "Movienet: A Holistic Dataset for Movie Understanding",
        BOOKTITLE = ECCV20,
        YEAR = "2020",
        PAGES = "IV:709-727",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239054"}

@inproceedings{bb244163,
        AUTHOR = "Li, K. and Fang, C. and Wang, Z. and Kim, S. and Jin, H. and Fu, Y.",
        TITLE = "Screencast Tutorial Video Understanding",
        BOOKTITLE = CVPR20,
        YEAR = "2020",
        PAGES = "12523-12532",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239055"}

@inproceedings{bb244164,
        AUTHOR = "Nagrani, A. and Sun, C. and Ross, D. and Sukthankar, R. and Schmid, C. and Zisserman, A.",
        TITLE = "Speech2Action: Cross-Modal Supervision for Action Recognition",
        BOOKTITLE = CVPR20,
        YEAR = "2020",
        PAGES = "10314-10323",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239056"}

@inproceedings{bb244165,
        AUTHOR = "Rao, A. and Xu, L. and Xiong, Y. and Xu, G. and Huang, Q. and Zhou, B. and Lin, D.",
        TITLE = "A Local-to-Global Approach to Multi-Modal Movie Scene Segmentation",
        BOOKTITLE = CVPR20,
        YEAR = "2020",
        PAGES = "10143-10152",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239057"}

@inproceedings{bb244166,
        AUTHOR = "Zhang, M. and Ye, K. and Hwa, R. and Kovashka, A.",
        TITLE = "Story Completion with Explicit Modeling of Commonsense Knowledge",
        BOOKTITLE = MVM20,
        YEAR = "2020",
        PAGES = "1543-1546",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239058"}

@inproceedings{bb244167,
        AUTHOR = "Li, W.X. and Pan, G. and Wang, C. and Xing, Z. and Zhou, X.Z. and Dong, X.X. and Zhang, J.W.",
        TITLE = "From Coarse to Fine: Hierarchical Structure-aware Video Summarization",
        BOOKTITLE = MLCSA20,
        YEAR = "2020",
        PAGES = "75-87",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239059"}

@inproceedings{bb244168,
        AUTHOR = "Liu, Y. and Li, Y. and Yang, F. and Chen, S. and Wang, Y.F.",
        TITLE = "Learning Hierarchical Self-Attention for Video Summarization",
        BOOKTITLE = ICIP19,
        YEAR = "2019",
        PAGES = "3377-3381",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239060"}

@inproceedings{bb244169,
        AUTHOR = "Lee, S. and Sung, J. and Yu, Y. and Kim, G.",
        TITLE = "A Memory Network Approach for Story-Based Temporal Summarization of
360{$^\circ$} Videos",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "1410-1419",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239061"}

@inproceedings{bb244170,
        AUTHOR = "Mo, L.B. and Zhang, C.H. and Ji, Y. and Hu, Z.",
        TITLE = "Adversarial Learning for Visual Storytelling with Sense Group Partition",
        BOOKTITLE = ACCV18,
        YEAR = "2018",
        PAGES = "IV:175-190",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239062"}

@inproceedings{bb244171,
        AUTHOR = "Ueno, M.",
        TITLE = "Structure Analysis on Common Plot in Four-Scene Comic Story Dataset",
        BOOKTITLE = MANPU19,
        YEAR = "2019",
        PAGES = "625-636",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239063"}

@inproceedings{bb244172,
        AUTHOR = "Zhang, J.C. and Peng, Y.X.",
        TITLE = "Hierarchical Vision-Language Alignment for Video Captioning",
        BOOKTITLE = "MMMod19",
        YEAR = "2019",
        PAGES = "I:42-54",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239064"}

@inproceedings{bb244173,
        AUTHOR = "Smeaton, A.F. and Graham, Y. and McGuinness, K. and O'Connor, N.E. and Quinn, S. and Sanchez, E.A.",
        TITLE = "Exploring the Impact of Training Data Bias on Automatic Generation of
Video Captions",
        BOOKTITLE = "MMMod19",
        YEAR = "2019",
        PAGES = "I:178-190",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239065"}

@inproceedings{bb244174,
        AUTHOR = "Guyot, P. and Malon, T. and Roman Jimenez, G. and Chambon, S. and Charvillat, V. and Crouzil, A. and Peninou, A. and Pinquier, J. and Sedes, F. and Senac, C.",
        TITLE = "Audiovisual Annotation Procedure for Multi-view Field Recordings",
        BOOKTITLE = "MMMod19",
        YEAR = "2019",
        PAGES = "I:399-410",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239066"}

@inproceedings{bb244175,
        AUTHOR = "Gupta, T. and Schwenk, D. and Farhadi, A. and Hoiem, D. and Kembhavi, A.",
        TITLE = "Imagine This! Scripts to Compositions to Videos",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "VIII: 610-626",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239067"}

@inproceedings{bb244176,
        AUTHOR = "Chen, Y.Y. and Wang, S.H. and Zhang, W.G. and Huang, Q.M.",
        TITLE = "Less Is More: Picking Informative Frames for Video Captioning",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "XIII: 367-384",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239068"}

@inproceedings{bb244177,
        AUTHOR = "Iyyer, M. and Manjunatha, V. and Guha, A. and Vyas, Y. and Boyd Graber, J. and Daume, H. and Davis, L.S.",
        TITLE = "The Amazing Mysteries of the Gutter:
Drawing Inferences Between Panels in Comic Book Narratives",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "6478-6487",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239069"}

@inproceedings{bb244178,
        AUTHOR = "Khan, U.A. and Ejaz, N. and Martinez del Amor, M.A. and Sparenberg, H.",
        TITLE = "Movies tags extraction using deep learning",
        BOOKTITLE = AVSS17,
        YEAR = "2017",
        PAGES = "1-6",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239070"}

@inproceedings{bb244179,
        AUTHOR = "Zhong, G. and Tsai, Y.H. and Liu, S. and Su, Z. and Yang, M.H.",
        TITLE = "Learning Video-Story Composition via Recurrent Neural Network",
        BOOKTITLE = WACV18,
        YEAR = "2018",
        PAGES = "1727-1735",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239071"}

@inproceedings{bb244180,
        AUTHOR = "Na, S. and Lee, S.H. and Kim, J.S. and Kim, G.",
        TITLE = "A Read-Write Memory Network for Movie Story Understanding",
        BOOKTITLE = ICCV17,
        YEAR = "2017",
        PAGES = "677-685",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239072"}

@inproceedings{bb244181,
        AUTHOR = "Naim, I. and Al Mamun, A. and Song, Y.C. and Luo, J. and Kautz, H. and Gildea, D.",
        TITLE = "Aligning movies with scripts by exploiting temporal ordering
constraints",
        BOOKTITLE = ICPR16,
        YEAR = "2016",
        PAGES = "1786-1791",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239073"}

@inproceedings{bb244182,
        AUTHOR = "Tapaswi, M. and Zhu, Y. and Stiefelhagen, R. and Torralba, A.B. and Urtasun, R. and Fidler, S.",
        TITLE = "{MovieQA}: Understanding Stories in Movies through Question-Answering",
        BOOKTITLE = CVPR16,
        YEAR = "2016",
        PAGES = "4631--4640",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239074"}

@inproceedings{bb244183,
        AUTHOR = "Suchan, J. and Bhatt, M.",
        TITLE = "The geometry of a scene:
On deep semantics for visual perception driven cognitive film, studies",
        BOOKTITLE = WACV16,
        YEAR = "2016",
        PAGES = "1--9",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239075"}

@inproceedings{bb244184,
        AUTHOR = "Qu, B.Q. and Vallet, F. and Carrive, J. and Gravier, G.",
        TITLE = "Content-Based Discovery of Multiple Structures from Episodes of
Recurrent {TV} Programs Based on Grammatical Inference",
        BOOKTITLE = MMMod15,
        YEAR = "2015",
        PAGES = "I: 140--154",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239076"}

@inproceedings{bb244185,
        AUTHOR = "Song, Y. and Vallmitjana, J. and Stent, A. and Jaimes, A.",
        TITLE = "{TVSum}: Summarizing web videos using titles",
        BOOKTITLE = CVPR15,
        YEAR = "2015",
        PAGES = "5179--5187",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239077"}

@inproceedings{bb244186,
        AUTHOR = "Koutras, P. and Zlatintsi, A. and Iosif, E. and Katsamanis, A. and Maragos, P. and Potamianos, A.",
        TITLE = "Predicting audio-visual salient events based on visual, audio and
text modalities for movie summarization",
        BOOKTITLE = ICIP15,
        YEAR = "2015",
        PAGES = "4361--4365",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239078"}

@inproceedings{bb244187,
        AUTHOR = "Eberts, M. and Ulges, A. and Schwanecke, U.",
        TITLE = "{AMIGO} - automatic indexing of lecture footage",
        BOOKTITLE = ICDAR15,
        YEAR = "2015",
        PAGES = "1206--1210",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239079"}

@inproceedings{bb244188,
        AUTHOR = "Xu, P. and Tax, D.M.J. and Hanjalic, A.",
        TITLE = "A structure-based video representation for web video categorization",
        BOOKTITLE = ICPR12,
        YEAR = "2012",
        PAGES = "433--436",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239080"}

@inproceedings{bb244189,
        author    = {Hanjalic, A. and Xu, L.Q.},
        title     = {User-Oriented Affective Video Content Analysis},
        booktitle = CBAIVL01,
        year      = {2001},
        pages     = {50},
        bibsource = {http://www.visionbib.com/bibliography/applicat825mo1.html#TT239081}
}

@inproceedings{bb244190,
        AUTHOR = "Shrestha, A. and Zhu, Y. and Miller, B. and Zhao, Y.",
        TITLE = "Storygraph: Telling Stories from Spatio-temporal Data",
        BOOKTITLE = ISVC13,
        YEAR = "2013",
        PAGES = "II: 693--702",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239082"}

@inproceedings{bb244191,
        AUTHOR = "Lu, Z. and Grauman, K.",
        TITLE = "Story-Driven Summarization for Egocentric Video",
        BOOKTITLE = CVPR13,
        YEAR = "2013",
        PAGES = "2714--2721",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239083"}

@inproceedings{bb244192,
        AUTHOR = "Chowdhury, A.S. and Kuanar, S.K. and Panda, R. and Das, M.N.",
        TITLE = "Video storyboard design using {Delaunay} graphs",
        BOOKTITLE = ICPR12,
        YEAR = "2012",
        PAGES = "3108--3111",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239084"}

@inproceedings{bb244193,
        AUTHOR = "Fu, W. and Wang, J.Q. and Zhu, X.B. and Lu, H.Q. and Ma, S.D.",
        TITLE = "Video Reshuffling with Narratives toward Effective Video Browsing",
        BOOKTITLE = ICIG11,
        YEAR = "2011",
        PAGES = "821--826",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239085"}

@inproceedings{bb244194,
        AUTHOR = "Jain, M. and Jawahar, C.V.",
        TITLE = "Characteristic pattern discovery in videos",
        BOOKTITLE = ICCVGIP10,
        YEAR = "2010",
        PAGES = "306--313",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239086"}

@inproceedings{bb244195,
        AUTHOR = "Ding, L. and Yilmaz, A.",
        TITLE = "Learning Relations among Movie Characters: A Social Network Perspective",
        BOOKTITLE = ECCV10,
        YEAR = "2010",
        PAGES = "IV: 410--423",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239087"}

@inproceedings{bb244196,
        AUTHOR = "Rodriguez, M.",
        TITLE = "{CRAM}: Compact representation of actions in movies",
        BOOKTITLE = CVPR10,
        YEAR = "2010",
        PAGES = "3328--3335",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239088"}

@inproceedings{bb244197,
        AUTHOR = "Zhao, Z.C. and Ge, X.J.",
        TITLE = "A computable structure model for {Hollywood} film",
        BOOKTITLE = ICIP10,
        YEAR = "2010",
        PAGES = "877--880",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239089"}

@inproceedings{bb244198,
        AUTHOR = "Zhang, S.L. and Tian, Q. and Huang, Q.M. and Gao, W. and Li, S.P.",
        TITLE = "Utilizing affective analysis for efficient movie browsing",
        BOOKTITLE = ICIP09,
        YEAR = "2009",
        PAGES = "1853--1856",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239090"}

@inproceedings{bb244199,
        AUTHOR = "Gupta, A. and Srinivasan, P. and Shi, J.B. and Davis, L.S.",
        TITLE = "Understanding videos, constructing plots learning a visually grounded
storyline model from annotated videos",
        BOOKTITLE = CVPR09,
        YEAR = "2009",
        PAGES = "2012--2019",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mo1.html#TT239091"}

Last update: Nov 26, 2025 at 20:24:09