% Video annotation, captioning and genre classification references.
% Each entry records its origin in the BIBSOURCE field (visionbib.com).
%
% Conventions used in this block:
%   - JOURNAL and BOOKTITLE values are bare string-macro names (CirSysVideo,
%     CVPR21, ...). Their definitions are not part of this block and must be
%     loaded before it.
%   - MONTH uses the predefined month macros (jan ... dec).
%   - Page ranges use a double hyphen. A leading roman numeral followed by a
%     colon ("IV: 525--528") is the proceedings volume as given by the source.
%   - Initials are separated by a space so that each initial is parsed as a
%     separate given-name token.
%   - Acronyms and proper nouns in titles are brace-protected against
%     style-driven recasing.
%
% NOTE(review): several compound surnames appear without hyphens or
% diacritics (for example "Maier Hein", "Muller Budack", "Wollmer"). They
% are kept as exported; confirm against the publications before changing.

@inproceedings{bb235700,
  AUTHOR    = "Anjulan, A. and Canagarajah, C. N.",
  TITLE     = "Video Object Mining with Local Region Tracking",
  BOOKTITLE = MCAM07,
  YEAR      = "2007",
  PAGES     = "172--183",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230617",
}

@inproceedings{bb235701,
  AUTHOR    = "Anjulan, A. and Canagarajah, C. N.",
  TITLE     = "Video Scene Retrieval Based on Local Region Features",
  BOOKTITLE = ICIP06,
  YEAR      = "2006",
  PAGES     = "3177--3180",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230618",
}

@inproceedings{bb235702,
  AUTHOR    = "Anjulan, A. and Canagarajah, C. N.",
  TITLE     = "A Novel Framework for Robust Annotation and Retrieval in Video Sequences",
  BOOKTITLE = CIVR06,
  YEAR      = "2006",
  PAGES     = "183--192",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230619",
}

% NOTE(review): the export carried the placeholder page range "xx-yy" for
% this entry; it was dropped so that it is not printed. Add real pages or an
% article number once known.
@article{bb235703,
  AUTHOR    = "Ionescu, B. and Coquin, D. and Lambert, P. and Buzuloiu, V.",
  TITLE     = "A Fuzzy Color-Based Approach for Understanding Animated Movies Content in the Indexing Task",
  JOURNAL   = JIVP,
  VOLUME    = "2008",
  YEAR      = "2008",
  NUMBER    = "2008",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230620",
}

@inproceedings{bb235704,
  AUTHOR    = "Ionescu, B. and Seyerlehner, K. and Rasche, C. and Vertan, C. and Lambert, P.",
  TITLE     = "Content-Based Video Description for Automatic Video Genre Categorization",
  BOOKTITLE = MMMod12,
  YEAR      = "2012",
  PAGES     = "51--62",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230621",
}

@article{bb235705,
  AUTHOR    = "Anjulan, A. and Canagarajah, C. N.",
  TITLE     = "A Unified Framework for Object Retrieval and Mining",
  JOURNAL   = CirSysVideo,
  VOLUME    = "19",
  YEAR      = "2009",
  NUMBER    = "1",
  MONTH     = jan,
  PAGES     = "63--76",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230622",
}

% NOTE(review): placeholder page range "xx-yy" dropped; add real pages once
% known.
@article{bb235706,
  AUTHOR    = "Campanella, M. and Leonardi, R. and Migliorati, P.",
  TITLE     = "Interactive visualization of video content and associated description for semantic annotation",
  JOURNAL   = SIViP,
  VOLUME    = "3",
  YEAR      = "2009",
  NUMBER    = "2",
  MONTH     = jun,
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230623",
}

@inproceedings{bb235707,
  AUTHOR    = "Campanella, M. and Leonardi, R. and Migliorati, P.",
  TITLE     = "The {Future-Viewer} Visual Environment for Semantic Characterization of Video Sequences",
  BOOKTITLE = ICIP05,
  YEAR      = "2005",
  PAGES     = "I: 1209--1212",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230624",
}

@article{bb235708,
  AUTHOR    = "Wang, M. and Hua, X. S. and Hong, R. and Tang, J. and Qi, G. J. and Song, Y.",
  TITLE     = "Unified Video Annotation via Multigraph Learning",
  JOURNAL   = CirSysVideo,
  VOLUME    = "19",
  YEAR      = "2009",
  NUMBER    = "5",
  MONTH     = may,
  PAGES     = "733--746",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230625",
}

@inproceedings{bb235709,
  AUTHOR    = "Qi, G. J. and Song, Y. and Hua, X. S. and Zhang, H. J. and Dai, L. R.",
  TITLE     = "Video Annotation by Active Learning and Cluster Tuning",
  BOOKTITLE = SLAM06,
  YEAR      = "2006",
  PAGES     = "114",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230626",
}

% The export had "April 2010, 287-302" in PAGES; the month and year are
% already held by MONTH and YEAR, so only the page range is kept.
@article{bb235710,
  AUTHOR    = "You, J. Y. and Liu, G. Z. and Perkis, A.",
  TITLE     = "A semantic framework for video genre classification and event analysis",
  JOURNAL   = SP:IC,
  VOLUME    = "25",
  YEAR      = "2010",
  NUMBER    = "4",
  MONTH     = apr,
  PAGES     = "287--302",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230627",
}

@article{bb235711,
  AUTHOR    = "Moxley, E. and Mei, T. and Manjunath, B. S.",
  TITLE     = "Video Annotation Through Search and Graph Reinforcement Mining",
  JOURNAL   = MultMed,
  VOLUME    = "12",
  YEAR      = "2010",
  NUMBER    = "3",
  MONTH     = mar,
  PAGES     = "184--193",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230628",
}

@article{bb235712,
  AUTHOR    = "Torralba, A. B. and Russell, B. C. and Yuen, J.",
  TITLE     = "{LabelMe}: Online Image Annotation and Applications",
  JOURNAL   = PIEEE,
  VOLUME    = "98",
  YEAR      = "2010",
  NUMBER    = "8",
  MONTH     = aug,
  PAGES     = "1467--1484",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230629",
}

@inproceedings{bb235713,
  AUTHOR    = "Yuen, J. and Russell, B. C. and Liu, C. and Torralba, A. B.",
  TITLE     = "{LabelMe} video: Building a video database with human annotations",
  BOOKTITLE = ICCV09,
  YEAR      = "2009",
  PAGES     = "1451--1458",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230630",
}

@article{bb235714,
  AUTHOR    = "Li, Y. and Tian, Y. and Duan, L. Y. and Yang, Y. and Huang, T. and Gao, W.",
  TITLE     = "Sequence Multi-Labeling: A Unified Video Annotation Scheme With Spatial and Temporal Context",
  JOURNAL   = MultMed,
  VOLUME    = "12",
  YEAR      = "2010",
  NUMBER    = "8",
  PAGES     = "814--828",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230631",
}

@article{bb235715,
  AUTHOR    = "Lee, S. Y. and de Neve, W. and Ro, Y. M.",
  TITLE     = "Tag refinement in an image folksonomy using visual similarity and tag co-occurrence statistics",
  JOURNAL   = SP:IC,
  VOLUME    = "25",
  YEAR      = "2010",
  NUMBER    = "10",
  MONTH     = nov,
  PAGES     = "761--773",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230632",
}

@inproceedings{bb235716,
  AUTHOR    = "Min, H. S. and Choi, J. Y. and de Neve, W. and Ro, Y. M. and Plataniotis, K. N.",
  TITLE     = "Semantic annotation of personal video content using an image folksonomy",
  BOOKTITLE = ICIP09,
  YEAR      = "2009",
  PAGES     = "257--260",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230633",
}

@article{bb235717,
  AUTHOR    = "Diou, C. and Stephanopoulos, G. and Panagiotopoulos, P. and Papachristou, C. and Dimitriou, N. and Delopoulos, A.",
  TITLE     = "Large-Scale Concept Detection in Multimedia Data Using Small Training Sets and Cross-Domain Concept Fusion",
  JOURNAL   = CirSysVideo,
  VOLUME    = "20",
  YEAR      = "2010",
  NUMBER    = "12",
  MONTH     = dec,
  PAGES     = "1808--1821",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230634",
}

@inproceedings{bb235718,
  AUTHOR    = "Tang, J. H. and Hua, X. S. and Mei, T. and Qi, G. J. and Li, S. P. and Wu, X. Q.",
  TITLE     = "Temporally Consistent {Gaussian} Random Field for Video Semantic Analysis",
  BOOKTITLE = ICIP07,
  YEAR      = "2007",
  PAGES     = "IV: 525--528",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230635",
}

@inproceedings{bb235719,
  AUTHOR    = "Yuan, X. and Lai, W. and Mei, T. and Hua, X. S. and Wu, X. Q. and Li, S. P.",
  TITLE     = "Automatic Video Genre Categorization using Hierarchical {SVM}",
  BOOKTITLE = ICIP06,
  YEAR      = "2006",
  PAGES     = "2905--2908",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230636",
}

@article{bb235720,
  AUTHOR    = "Paniagua Martin, F. and Garcia Crespo, A. and Colomo Palacios, R. and Ruiz Mezcua, B.",
  TITLE     = "Semantic Annotation Architecture for Accessible Multimedia Resources",
  JOURNAL   = MultMedMag,
  VOLUME    = "18",
  YEAR      = "2011",
  NUMBER    = "2",
  MONTH     = apr,
  PAGES     = "16--25",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230637",
}

@article{bb235721,
  AUTHOR    = "Cao, J. and Ngo, C. W. and Zhang, Y. D. and Li, J. T.",
  TITLE     = "Tracking Web Video Topics: Discovery, Visualization, and Monitoring",
  JOURNAL   = CirSysVideo,
  VOLUME    = "21",
  YEAR      = "2011",
  NUMBER    = "12",
  MONTH     = dec,
  PAGES     = "1835--1846",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230638",
}

@article{bb235722,
  AUTHOR    = "Lin, L. and Chen, C. and Shyu, M. L. and Chen, S. C.",
  TITLE     = "Weighted Subspace Filtering and Ranking Algorithms for Video Concept Retrieval",
  JOURNAL   = MultMedMag,
  VOLUME    = "18",
  YEAR      = "2011",
  NUMBER    = "3",
  PAGES     = "32--43",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230639",
}

@article{bb235723,
  AUTHOR    = "Shao, J. and Ma, S. and Lu, W. M. and Zhuang, Y. T.",
  TITLE     = "A unified framework for web video topic discovery and visualization",
  JOURNAL   = PRL,
  VOLUME    = "33",
  YEAR      = "2012",
  NUMBER    = "4",
  MONTH     = mar,
  PAGES     = "410--419",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230640",
}

@article{bb235724,
  AUTHOR    = "Wollmer, M. and Weninger, F. and Knaup, T. and Schuller, B. and Sun, C. and Sagae, K. and Morency, L. P.",
  TITLE     = "{YouTube} Movie Reviews: Sentiment Analysis in an Audio-Visual Context",
  JOURNAL   = IEEE_Int_Sys,
  VOLUME    = "28",
  YEAR      = "2013",
  NUMBER    = "3",
  PAGES     = "46--53",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230641",
}

@article{bb235725,
  AUTHOR    = "Moran, S. and Lavrenko, V.",
  TITLE     = "A sparse kernel relevance model for automatic image annotation",
  JOURNAL   = MultInfoRetr,
  VOLUME    = "3",
  YEAR      = "2014",
  NUMBER    = "4",
  MONTH     = nov,
  PAGES     = "209--229",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230642",
}

% NOTE(review): placeholder page range "xx-yy" dropped; add real pages once
% known.
@inproceedings{bb235726,
  AUTHOR    = "Moran, S. and Lavrenko, V.",
  TITLE     = "Optimal Tag Sets for Automatic Image Annotation",
  BOOKTITLE = BMVC11,
  YEAR      = "2011",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230643",
}

@inproceedings{bb235727,
  AUTHOR    = "Feng, S. L. and Manmatha, R. and Lavrenko, V.",
  TITLE     = "Multiple {Bernoulli} relevance models for image and video annotation",
  BOOKTITLE = CVPR04,
  YEAR      = "2004",
  PAGES     = "II: 1002--1009",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230644",
}

@article{bb235728,
  AUTHOR    = "Tarvainen, J. and Sjoberg, M. and Westman, S. and Laaksonen, J. and Oittinen, P.",
  TITLE     = "Content-Based Prediction of Movie Style, Aesthetics, and Affect: Data Set and Baseline Experiments",
  JOURNAL   = MultMed,
  VOLUME    = "16",
  YEAR      = "2014",
  NUMBER    = "8",
  MONTH     = dec,
  PAGES     = "2085--2098",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230645",
}

@article{bb235729,
  AUTHOR    = "Constantin, M. G. and Stefan, L. D. and Ionescu, B. and Duong, N. Q. K. and Demarty, C. H. and Sjoberg, M.",
  TITLE     = "Visual Interestingness Prediction: A Benchmark Framework and Literature Review",
  JOURNAL   = IJCV,
  VOLUME    = "129",
  YEAR      = "2021",
  NUMBER    = "5",
  MONTH     = may,
  PAGES     = "1526--1550",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230646",
}

@article{bb235730,
  AUTHOR    = "Lew, M. S.",
  TITLE     = "Special issue on video retrieval",
  JOURNAL   = MultInfoRetr,
  VOLUME    = "4",
  YEAR      = "2015",
  NUMBER    = "1",
  MONTH     = mar,
  PAGES     = "1--2",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230647",
}

@article{bb235731,
  AUTHOR    = "Lew, M. S.",
  TITLE     = "Special issue on visual information retrieval",
  JOURNAL   = MultInfoRetr,
  VOLUME    = "5",
  YEAR      = "2016",
  NUMBER    = "1",
  MONTH     = mar,
  PAGES     = "1--2",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230648",
}

@article{bb235732,
  AUTHOR    = "Lew, M. S.",
  TITLE     = "Editorial for the {ICMR} 2017 special issue",
  JOURNAL   = MultInfoRetr,
  VOLUME    = "8",
  YEAR      = "2018",
  NUMBER    = "1",
  MONTH     = mar,
  PAGES     = "1--2",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230649",
}

@article{bb235733,
  AUTHOR    = "Lin, T. and Yang, M. and Tsai, C. and Wang, Y. F.",
  TITLE     = "Query-Adaptive Multiple Instance Learning for Video Instance Retrieval",
  JOURNAL   = IP,
  VOLUME    = "24",
  YEAR      = "2015",
  NUMBER    = "4",
  MONTH     = apr,
  PAGES     = "1330--1340",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230650",
}

@article{bb235734,
  AUTHOR    = "Duan, L. J. and Xi, T. and Cui, S. and Qi, H. G. and Bovik, A. C.",
  TITLE     = "A spatiotemporal weighted dissimilarity-based method for video saliency detection",
  JOURNAL   = SP:IC,
  VOLUME    = "38",
  YEAR      = "2015",
  NUMBER    = "1",
  PAGES     = "45--56",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230651",
}

@article{bb235735,
  AUTHOR    = "Tu, Q. and Men, A. and Jiang, Z. Q. and Ye, F. and Xu, J.",
  TITLE     = "Video saliency detection incorporating temporal information in compressed domain",
  JOURNAL   = SP:IC,
  VOLUME    = "38",
  YEAR      = "2015",
  NUMBER    = "1",
  PAGES     = "32--44",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230652",
}

@inproceedings{bb235736,
  AUTHOR    = "Li, C. and Tu, Q. and Xu, J. and Gao, R. and Wang, Q. and Chang, Y.",
  TITLE     = "Ant colony optimization inspired saliency detection using compressed video information",
  BOOKTITLE = VCIP15,
  YEAR      = "2015",
  PAGES     = "1--4",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230653",
}

@inproceedings{bb235737,
  AUTHOR    = "Gao, R. and Tu, Q. and Xu, J. and Lu, Y. and Xie, W. and Men, A.",
  TITLE     = "Visual saliency detection based on mutual information in compressed domain",
  BOOKTITLE = VCIP15,
  YEAR      = "2015",
  PAGES     = "1--4",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230654",
}

@article{bb235738,
  AUTHOR    = "Qian, X. M. and Liu, X. X. and Ma, X. and Lu, D. and Xu, C. Y.",
  TITLE     = "What Is Happening in the Video? Annotate Video by Sentence",
  JOURNAL   = CirSysVideo,
  VOLUME    = "26",
  YEAR      = "2016",
  NUMBER    = "9",
  MONTH     = sep,
  PAGES     = "1746--1757",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230655",
}

@article{bb235739,
  AUTHOR    = "Liao, H. S. and Chen, L. and Song, Y. and Ming, H.",
  TITLE     = "Visualization-Based Active Learning for Video Annotation",
  JOURNAL   = MultMed,
  VOLUME    = "18",
  YEAR      = "2016",
  NUMBER    = "11",
  MONTH     = nov,
  PAGES     = "2196--2205",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230656",
}

@article{bb235740,
  AUTHOR    = "Chou, C. L. and Chen, H. T. and Lee, S. Y.",
  TITLE     = "Multimodal Video-to-Near-Scene Annotation",
  JOURNAL   = MultMed,
  VOLUME    = "19",
  YEAR      = "2017",
  NUMBER    = "2",
  MONTH     = feb,
  PAGES     = "354--366",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230657",
}

@article{bb235741,
  AUTHOR    = "Wang, H. and Wu, X. X. and Jia, Y. D.",
  TITLE     = "Heterogeneous domain adaptation method for video annotation",
  JOURNAL   = IET-CV,
  VOLUME    = "11",
  YEAR      = "2017",
  NUMBER    = "2",
  MONTH     = mar,
  PAGES     = "181--187",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230658",
}

@article{bb235742,
  AUTHOR    = "Li, W. and Guo, D. and Fang, X. Z.",
  TITLE     = "Multimodal architecture for video captioning with memory networks and an attention mechanism",
  JOURNAL   = PRL,
  VOLUME    = "105",
  YEAR      = "2018",
  PAGES     = "23--29",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230659",
}

@article{bb235743,
  AUTHOR    = "Protasov, S. and Khan, A. M. and Sozykin, K. and Ahmad, M.",
  TITLE     = "Using deep features for video scene detection and annotation",
  JOURNAL   = SIViP,
  VOLUME    = "12",
  YEAR      = "2018",
  NUMBER    = "5",
  MONTH     = jul,
  PAGES     = "991--999",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230660",
}

@article{bb235744,
  AUTHOR    = "Shetty, R. and Tavakoli, H. R. and Laaksonen, J.",
  TITLE     = "Image and Video Captioning with Augmented Neural Architectures",
  JOURNAL   = MultMedMag,
  VOLUME    = "25",
  YEAR      = "2018",
  NUMBER    = "2",
  MONTH     = apr,
  PAGES     = "34--46",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230661",
}

@article{bb235745,
  AUTHOR    = "Yang, Y. and Zhou, J. and Ai, J. and Bin, Y. and Hanjalic, A. and Shen, H. T. and Ji, Y.",
  TITLE     = "Video Captioning by Adversarial {LSTM}",
  JOURNAL   = IP,
  VOLUME    = "27",
  YEAR      = "2018",
  NUMBER    = "11",
  MONTH     = nov,
  PAGES     = "5600--5611",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230662",
}

@article{bb235746,
  AUTHOR    = "Gao, L. L. and Li, X. P. and Song, J. K. and Shen, H. T.",
  TITLE     = "Hierarchical {LSTMs} with Adaptive Attention for Visual Captioning",
  JOURNAL   = PAMI,
  VOLUME    = "42",
  YEAR      = "2020",
  NUMBER    = "5",
  MONTH     = may,
  PAGES     = "1112--1131",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230663",
}

@article{bb235747,
  AUTHOR    = "Zhang, X. X. and Zhu, Z. F. and Zhao, Y. and Chang, D. X.",
  TITLE     = "Learning a General Assignment Model for Video Analytics",
  JOURNAL   = CirSysVideo,
  VOLUME    = "28",
  YEAR      = "2018",
  NUMBER    = "10",
  MONTH     = oct,
  PAGES     = "3066--3076",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230664",
}

@article{bb235748,
  AUTHOR    = "Daskalakis, E. and Tzelepi, M. and Tefas, A.",
  TITLE     = "Learning deep spatiotemporal features for video captioning",
  JOURNAL   = PRL,
  VOLUME    = "116",
  YEAR      = "2018",
  PAGES     = "143--149",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230665",
}

@article{bb235749,
  AUTHOR    = "Xu, N. and Liu, A. and Wong, Y. and Zhang, Y. and Nie, W. and Su, Y. and Kankanhalli, M.",
  TITLE     = "Dual-Stream Recurrent Neural Network for Video Captioning",
  JOURNAL   = CirSysVideo,
  VOLUME    = "29",
  YEAR      = "2019",
  NUMBER    = "8",
  MONTH     = aug,
  PAGES     = "2482--2493",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230666",
}

@article{bb235750,
  AUTHOR    = "Ren, J. H. and Zhang, W. S.",
  TITLE     = "{CLOSE}: Coupled content-semantic embedding",
  JOURNAL   = SIViP,
  VOLUME    = "13",
  YEAR      = "2019",
  NUMBER    = "6",
  MONTH     = sep,
  PAGES     = "1087--1095",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230667",
}

@article{bb235751,
  AUTHOR    = "Lee, J. and Kim, J.",
  TITLE     = "Exploring the effects of non-local blocks on video captioning networks",
  JOURNAL   = IJCVR,
  VOLUME    = "9",
  YEAR      = "2019",
  NUMBER    = "5",
  PAGES     = "502--514",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230668",
}

@inproceedings{bb235752,
  AUTHOR    = "Mun, J. and Yang, L. J. and Ren, Z. and Xu, N. and Han, B. H.",
  TITLE     = "Streamlined Dense Video Captioning",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "6581--6590",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230669",
}

@article{bb235753,
  AUTHOR    = "Wang, H. Y. and Gao, C. Y. and Han, Y. H.",
  TITLE     = "Sequence in sequence for video captioning",
  JOURNAL   = PRL,
  VOLUME    = "130",
  YEAR      = "2020",
  PAGES     = "327--334",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230670",
}

@article{bb235754,
  AUTHOR    = "Harwath, D. and Recasens, A. and Suris, D. and Chuang, G. and Torralba, A. B. and Glass, J.",
  TITLE     = "Jointly Discovering Visual Objects and Spoken Words from Raw Sensory Input",
  JOURNAL   = IJCV,
  VOLUME    = "128",
  YEAR      = "2020",
  NUMBER    = "3",
  MONTH     = mar,
  PAGES     = "620--641",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230671",
}

% Conference version of bb235754; it shares that entry's BIBSOURCE anchor.
% The export listed the authors in exactly reversed order; the order below
% follows bb235754. NOTE(review): confirm against the proceedings.
@inproceedings{bb235755,
  AUTHOR    = "Harwath, D. and Recasens, A. and Suris, D. and Chuang, G. and Torralba, A. B. and Glass, J.",
  TITLE     = "Jointly Discovering Visual Objects and Spoken Words from Raw Sensory Input",
  BOOKTITLE = ECCV18,
  YEAR      = "2018",
  PAGES     = "VI: 659--677",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230671",
}

@article{bb235756,
  AUTHOR    = "Wei, R. and Mi, L. and Hu, Y. S. and Chen, Z. Z.",
  TITLE     = "Exploiting the local temporal information for video captioning",
  JOURNAL   = JVCIR,
  VOLUME    = "67",
  YEAR      = "2020",
  PAGES     = "102751",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230672",
}

@article{bb235757,
  AUTHOR    = "Zhang, J. C. and Peng, Y. X.",
  TITLE     = "Video Captioning With Object-Aware Spatio-Temporal Correlation and Aggregation",
  JOURNAL   = IP,
  VOLUME    = "29",
  YEAR      = "2020",
  PAGES     = "6209--6222",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230673",
}

@inproceedings{bb235758,
  AUTHOR    = "Zhang, J. C. and Peng, Y. X.",
  TITLE     = "Object-Aware Aggregation With Bidirectional Temporal Graph for Video Captioning",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "8319--8328",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230674",
}

@article{bb235759,
  AUTHOR    = "Xiao, H. H. and Shi, J. L.",
  TITLE     = "Video captioning with text-based dynamic attention and step-by-step learning",
  JOURNAL   = PRL,
  VOLUME    = "133",
  YEAR      = "2020",
  PAGES     = "305--312",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230675",
}

@article{bb235760,
  AUTHOR    = "Ning, K. and Cai, M. and Xie, D. and Wu, F.",
  TITLE     = "An Attentive Sequence to Sequence Translator for Localizing Video Clips by Natural Language",
  JOURNAL   = MultMed,
  VOLUME    = "22",
  YEAR      = "2020",
  NUMBER    = "9",
  MONTH     = sep,
  PAGES     = "2434--2443",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230676",
}

@article{bb235761,
  AUTHOR    = "Wu, A. and Han, Y. and Yang, Y. and Hu, Q. and Wu, F.",
  TITLE     = "Convolutional Reconstruction-to-Sequence for Video Captioning",
  JOURNAL   = CirSysVideo,
  VOLUME    = "30",
  YEAR      = "2020",
  NUMBER    = "11",
  MONTH     = nov,
  PAGES     = "4299--4308",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230677",
}

@article{bb235762,
  AUTHOR    = "Tu, Y. B. and Zhou, C. and Guo, J. J. and Gao, S. X. and Yu, Z. T.",
  TITLE     = "Enhancing the alignment between target words and corresponding frames for video captioning",
  JOURNAL   = PR,
  VOLUME    = "111",
  YEAR      = "2021",
  PAGES     = "107702",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230678",
}

@article{bb235763,
  AUTHOR    = "Boran, E. and Erdem, A. and Ikizler Cinbis, N. and Erdem, E. and Madhyastha, P. and Specia, L.",
  TITLE     = "Leveraging auxiliary image descriptions for dense video captioning",
  JOURNAL   = PRL,
  VOLUME    = "146",
  YEAR      = "2021",
  PAGES     = "70--76",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230679",
}

@article{bb235764,
  AUTHOR    = "Wang, T. and Zheng, H. and Yu, M. J. and Tian, Q. and Hu, H. F.",
  TITLE     = "Event-Centric Hierarchical Representation for Dense Video Captioning",
  JOURNAL   = CirSysVideo,
  VOLUME    = "31",
  YEAR      = "2021",
  NUMBER    = "5",
  PAGES     = "1890--1900",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230680",
}

@article{bb235765,
  AUTHOR    = "Xu, W. and Yu, J. and Miao, Z. J. and Wan, L. and Tian, Y. and Ji, Q.",
  TITLE     = "Deep Reinforcement Polishing Network for Video Captioning",
  JOURNAL   = MultMed,
  VOLUME    = "23",
  YEAR      = "2021",
  PAGES     = "1772--1784",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230681",
}

@article{bb235766,
  AUTHOR    = "Zhang, Z. W. and Xu, D. and Ouyang, W. L. and Zhou, L. P.",
  TITLE     = "Dense Video Captioning Using Graph-Based Sentence Summarization",
  JOURNAL   = MultMed,
  VOLUME    = "23",
  YEAR      = "2021",
  PAGES     = "1799--1810",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230682",
}

@article{bb235767,
  AUTHOR    = "Liu, S. and Ren, Z. and Yuan, J. S.",
  TITLE     = "{SibNet}: Sibling Convolutional Encoder for Video Captioning",
  JOURNAL   = PAMI,
  VOLUME    = "43",
  YEAR      = "2021",
  NUMBER    = "9",
  MONTH     = sep,
  PAGES     = "3259--3272",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230683",
}

@article{bb235768,
  AUTHOR    = "Yan, Y. C. and Zhuang, N. and Ni, B. B. and Zhang, J. and Xu, M. H. and Zhang, Q. and Zhang, Z. and Cheng, S. and Tian, Q. and Xu, Y. and Yang, X. K. and Zhang, W. J.",
  TITLE     = "Fine-Grained Video Captioning via Graph-based Multi-Granularity Interaction Learning",
  JOURNAL   = PAMI,
  VOLUME    = "44",
  YEAR      = "2022",
  NUMBER    = "2",
  MONTH     = feb,
  PAGES     = "666--683",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230684",
}

@article{bb235769,
  AUTHOR    = "Deng, J. and Li, L. and Zhang, B. and Wang, S. H. and Zha, Z. J. and Huang, Q. M.",
  TITLE     = "Syntax-Guided Hierarchical Attention Network for Video Captioning",
  JOURNAL   = CirSysVideo,
  VOLUME    = "32",
  YEAR      = "2022",
  NUMBER    = "2",
  MONTH     = feb,
  PAGES     = "880--892",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230685",
}

@article{bb235770,
  AUTHOR    = "Hua, X. and Wang, X. Q. and Rui, T. and Shao, F. and Wang, D.",
  TITLE     = "Adversarial Reinforcement Learning With Object-Scene Relational Graph for Video Captioning",
  JOURNAL   = IP,
  VOLUME    = "31",
  YEAR      = "2022",
  PAGES     = "2004--2016",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230686",
}

@article{bb235771,
  AUTHOR    = "Wang, L. X. and Li, H. L. and Qiu, H. Q. and Wu, Q. B. and Meng, F. M. and Ngan, K. N.",
  TITLE     = "{POS-Trends} Dynamic-Aware Model for Video Caption",
  JOURNAL   = CirSysVideo,
  VOLUME    = "32",
  YEAR      = "2022",
  NUMBER    = "7",
  MONTH     = jul,
  PAGES     = "4751--4764",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230687",
}

@article{bb235772,
  AUTHOR    = "Xue, P. and Zhou, B.",
  TITLE     = "Exploring the Spatio-Temporal Aware Graph for video captioning",
  JOURNAL   = IET-CV,
  VOLUME    = "16",
  YEAR      = "2022",
  NUMBER    = "5",
  PAGES     = "456--467",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230688",
}

@article{bb235773,
  AUTHOR    = "Niu, T. Z. and Dong, S. S. and Chen, Z. D. and Luo, X. and Huang, Z. and Guo, S. and Xu, X. S.",
  TITLE     = "A multi-layer memory sharing network for video captioning",
  JOURNAL   = PR,
  VOLUME    = "136",
  YEAR      = "2023",
  PAGES     = "109202",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230689",
}

@article{bb235774,
  AUTHOR    = "Tu, Y. and Zhou, C. and Guo, J. J. and Li, H. F. and Gao, S. X. and Yu, Z. T.",
  TITLE     = "Relation-aware attention for video captioning via graph learning",
  JOURNAL   = PR,
  VOLUME    = "136",
  YEAR      = "2023",
  PAGES     = "109204",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230690",
}

@article{bb235775,
  AUTHOR    = "Li, P. and Wang, T. and Zhao, X. and Xu, X. H. and Song, M. L.",
  TITLE     = "Pseudo-labeling with keyword refining for few-supervised video captioning",
  JOURNAL   = PR,
  VOLUME    = "159",
  YEAR      = "2025",
  PAGES     = "111176",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230691",
}

@inproceedings{bb235776,
  AUTHOR    = "Radsch, T. and Reinke, A. and Weru, V. and Tizabi, M. D. and Heller, N. and Isensee, F. and Kopp Schneider, A. and Maier Hein, L.",
  TITLE     = "Quality Assured: Rethinking Annotation Strategies in Imaging {AI}",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "LXXVIII: 52--69",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230692",
}

@inproceedings{bb235777,
  AUTHOR    = "Islam, M. M. and Ho, N. and Yang, X. T. and Nagarajan, T. and Torresani, L. and Bertasius, G.",
  TITLE     = "Video {ReCap}: Recursive Captioning of Hour-Long Videos",
  BOOKTITLE = CVPR24,
  YEAR      = "2024",
  PAGES     = "18198--18208",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230693",
}

@inproceedings{bb235778,
  AUTHOR    = "Chen, T. S. and Siarohin, A. and Menapace, W. and Deyneka, E. and Chao, H. W. and Jeon, B. E. and Fang, Y. W. and Lee, H. Y. and Ren, J. and Yang, M. H. and Tulyakov, S.",
  TITLE     = "{Panda-70M}: Captioning {70M} Videos with Multiple Cross-Modality Teachers",
  BOOKTITLE = CVPR24,
  YEAR      = "2024",
  PAGES     = "13320--13331",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230694",
}

% NOTE(review): BOOKTITLE here and in bb235780 is the quoted string "ICPR22",
% while every other venue in this block is a bare macro (ICPR21, ICIP22).
% Left unchanged because the macro definitions are not visible from here;
% switch to the bare macro once an ICPR22 string definition is confirmed.
@inproceedings{bb235779,
  AUTHOR    = "Shao, H. L. and Fang, Z. Y. and Yang, Y. Z.",
  TITLE     = "{CAVAN}: Commonsense Knowledge Anchored Video Captioning",
  BOOKTITLE = "ICPR22",
  YEAR      = "2022",
  PAGES     = "4095--4102",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230695",
}

@inproceedings{bb235780,
  AUTHOR    = "Guo, Z. X. and Wang, T. J. J. and Laaksonen, J.",
  TITLE     = "Post-Attention Modulator for Dense Video Captioning",
  BOOKTITLE = "ICPR22",
  YEAR      = "2022",
  PAGES     = "1536--1542",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230696",
}

@inproceedings{bb235781,
  AUTHOR    = "Yamazaki, K. and Truong, S. and Vo, K. and Kidd, M. and Rainwater, C. and Luu, K. and Le, N.",
  TITLE     = "{VLCAP}: Vision-Language with Contrastive Learning for Coherent Video Paragraph Captioning",
  BOOKTITLE = ICIP22,
  YEAR      = "2022",
  PAGES     = "3656--3661",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230697",
}

@inproceedings{bb235782,
  AUTHOR    = "Lebron, L. and Graham, Y. and O'Connor, N. E. and McGuinness, K.",
  TITLE     = "Evaluation of Automatically Generated Video Captions Using Vision and Language Models",
  BOOKTITLE = ICIP22,
  YEAR      = "2022",
  PAGES     = "2416--2420",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230698",
}

@inproceedings{bb235783,
  AUTHOR    = "Chatzikonstantinou, C. and Valasidis, G. G. and Stavridis, K. and Malogiannis, G. and Axenopoulos, A. and Daras, P.",
  TITLE     = "{UCF-CAP}, Video Captioning in the Wild",
  BOOKTITLE = ICIP22,
  YEAR      = "2022",
  PAGES     = "1386--1390",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230699",
}

@inproceedings{bb235784,
  AUTHOR    = "Zhang, Q. and Song, Y. Q. and Jin, Q.",
  TITLE     = "Unifying Event Detection and Captioning as Sequence Generation via Pre-training",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXXVI: 363--379",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230700",
}

@inproceedings{bb235785,
  AUTHOR    = "Bi, T. Y. and Jarnikov, D. and Lukkien, J.",
  TITLE     = "Shot-Based Hybrid Fusion for Movie Genre Classification",
  BOOKTITLE = CIAP22,
  YEAR      = "2022",
  PAGES     = "I: 257--269",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230701",
}

@inproceedings{bb235786,
  AUTHOR    = "Fish, E. and Weinbren, J. and Gilbert, A.",
  TITLE     = "Rethinking Genre Classification With Fine Grained Semantic Clustering",
  BOOKTITLE = ICIP21,
  YEAR      = "2021",
  PAGES     = "1274--1278",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230702",
}

@inproceedings{bb235787,
  AUTHOR    = "Zhu, M. J.",
  TITLE     = "Video Captioning in Compressed Video",
  BOOKTITLE = ICIVC21,
  YEAR      = "2021",
  PAGES     = "336--341",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230703",
}

@inproceedings{bb235788,
  AUTHOR    = "Lin, X. D. and Bertasius, G. and Wang, J. and Chang, S. F. and Parikh, D. and Torresani, L.",
  TITLE     = "{VX2TEXT}: End-to-End Learning of Video-Based Text Generation From Multimodal Inputs",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "7001--7011",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230704",
}

@inproceedings{bb235789,
  AUTHOR    = "Liao, Y. H. and Kar, A. and Fidler, S.",
  TITLE     = "Towards Good Practices for Efficiently Annotating Large-Scale Image Classification Datasets",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "4348--4357",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230705",
}

@inproceedings{bb235790,
  AUTHOR    = "Song, Y. Q. and Chen, S. Z. and Jin, Q.",
  TITLE     = "Towards Diverse Paragraph Captioning for Untrimmed Videos",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "11240--11249",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230706",
}

@inproceedings{bb235791,
  AUTHOR    = "Chen, S. and Jiang, Y. G.",
  TITLE     = "Towards Bridging Event Captioner and Sentence Localizer for Weakly Supervised Dense Event Captioning",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "8421--8431",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230707",
}

@inproceedings{bb235792,
  AUTHOR    = "Deng, C. R. and Chen, S. Z. and Chen, D. and He, Y. and Wu, Q.",
  TITLE     = "Sketch, Ground, and Refine: Top-Down Dense Video Captioning",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "234--243",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230708",
}

@inproceedings{bb235793,
  AUTHOR    = "Zhang, Z. and Qi, Z. A. and Yuan, C. F. and Shan, Y. and Li, B. and Deng, Y. and Hu, W. M.",
  TITLE     = "Open-book Video Captioning with Retrieve-Copy-Generate Network",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "9832--9841",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230709",
}

% The exported title ended in a stray footnote marker ("*"); removed.
@inproceedings{bb235794,
  AUTHOR    = "Perez Martin, J. and Bustos, B. and Perez, J.",
  TITLE     = "Improving Video Captioning with Temporal Composition of a Visual-Syntactic Embedding",
  BOOKTITLE = WACV21,
  YEAR      = "2021",
  PAGES     = "3038--3048",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230710",
}

@inproceedings{bb235795,
  AUTHOR    = "Muller Budack, E. and Springstein, M. and Hakimov, S. and Mrutzek, K. and Ewerth, R.",
  TITLE     = "Ontology-driven Event Type Classification in Images",
  BOOKTITLE = WACV21,
  YEAR      = "2021",
  PAGES     = "2927--2937",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230711",
}

@inproceedings{bb235796,
  AUTHOR    = "Hosseinzadeh, M. and Wang, Y.",
  TITLE     = "Video Captioning of Future Frames",
  BOOKTITLE = WACV21,
  YEAR      = "2021",
  PAGES     = "979--988",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230712",
}

@inproceedings{bb235797,
  AUTHOR    = "Knights, J. and Harwood, B. and Ward, D. and Vanderkop, A. and Mackenzie Ross, O. and Moghadam, P.",
  TITLE     = "Temporally Coherent Embeddings for Self-Supervised Video Representation Learning",
  BOOKTITLE = ICPR21,
  YEAR      = "2021",
  PAGES     = "8914--8921",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230713",
}

@inproceedings{bb235798,
  AUTHOR    = "Rimle, P. and Dogan Schonberger, P. and Gross, M.",
  TITLE     = "Enriching Video Captions With Contextual Text",
  BOOKTITLE = ICPR21,
  YEAR      = "2021",
  PAGES     = "5474--5481",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230714",
}

@inproceedings{bb235799,
  AUTHOR    = "Bi, T. Y. and Jarnikov, D. and Lukkien, J.",
  TITLE     = "Video Representation Fusion Network For Multi-Label Movie Genre Classification",
  BOOKTITLE = ICPR21,
  YEAR      = "2021",
  PAGES     = "9386--9391",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825an1.html#TT230715",
}