% Bibliography entries bb206200 through bb206299 (video captioning, video
% summarization and multimedia description references taken from visionbib).
%
% Conventions used in this section:
%   - one field per line, fields in the order AUTHOR, TITLE, venue, VOLUME,
%     YEAR, NUMBER, MONTH, PAGES, BIBSOURCE;
%   - page ranges use a double hyphen;
%   - MONTH uses the standard three-letter macros (jan ... dec);
%   - author initials are separated by spaces so each one is seen as its own token;
%   - acronyms and proper nouns in TITLE are brace-protected against recasing.
%
% NOTE(review): the venue macros (ICCV17, CVPR19, IP, PAMI, MultMed, ...) are
% not defined in this section; presumably they are declared elsewhere with
% string definitions. Confirm before using this section on its own.

@inproceedings{bb206200,
  AUTHOR = "Qiu, Z. F. and Yao, T. and Mei, T.",
  TITLE = "Learning Spatio-Temporal Representation with {Pseudo-3D} Residual Networks",
  BOOKTITLE = ICCV17,
  YEAR = "2017",
  PAGES = "5534--5542",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201303"
}

@inproceedings{bb206201,
  AUTHOR = "Qiu, Z. F. and Yao, T. and Ngo, C. W. and Tian, X. M. and Mei, T.",
  TITLE = "Learning Spatio-Temporal Representation With Local and Global Diffusion",
  BOOKTITLE = CVPR19,
  YEAR = "2019",
  PAGES = "12048--12057",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201304"
}

@inproceedings{bb206202,
  AUTHOR = "Yao, T. and Pan, Y. and Li, Y. and Qiu, Z. and Mei, T.",
  TITLE = "Boosting Image Captioning with Attributes",
  BOOKTITLE = ICCV17,
  YEAR = "2017",
  PAGES = "4904--4912",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201305"
}

@inproceedings{bb206203,
  AUTHOR = "Pan, Y. and Yao, T. and Li, Y. and Mei, T.",
  TITLE = "Video Captioning with Transferred Semantic Attributes",
  BOOKTITLE = CVPR17,
  YEAR = "2017",
  PAGES = "984--992",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201306"
}

@article{bb206204,
  AUTHOR = "Zhao, B. and Li, X. and Lu, X.",
  TITLE = "{CAM-RNN}: Co-Attention Model Based {RNN} for Video Captioning",
  JOURNAL = IP,
  VOLUME = "28",
  YEAR = "2019",
  NUMBER = "11",
  MONTH = nov,
  PAGES = "5552--5565",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201307"
}

@article{bb206205,
  AUTHOR = "Yan, C. and Tu, Y. and Wang, X. and Zhang, Y. and Hao, X. and Zhang, Y. and Dai, Q.",
  TITLE = "{STAT}: Spatial-Temporal Attention Mechanism for Video Captioning",
  JOURNAL = MultMed,
  VOLUME = "22",
  YEAR = "2020",
  NUMBER = "1",
  MONTH = jan,
  PAGES = "229--241",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201308"
}

% NOTE(review): same title and BIBSOURCE anchor as bb206205, single page and
% reversed author order; presumably a correction notice for that paper. Confirm.
@article{bb206206,
  AUTHOR = "Dai, Q. and Zhang, Y. and Hao, X. and Zhang, Y. and Wang, X. and Tu, Y. and Yan, C.",
  TITLE = "{STAT}: Spatial-Temporal Attention Mechanism for Video Captioning",
  JOURNAL = MultMed,
  VOLUME = "22",
  YEAR = "2020",
  NUMBER = "3",
  MONTH = mar,
  PAGES = "830",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201308"
}

% NOTE(review): PAGES is an upstream placeholder, not a real page range.
% Replace it with the article number or pages from the publisher record.
@article{bb206207,
  AUTHOR = "Aafaq, N. and Mian, A. and Liu, W. and Gilani, S. Z. and Shah, M.",
  TITLE = "Video Description: A Survey of Methods, Datasets, and Evaluation Metrics",
  JOURNAL = Surveys,
  VOLUME = "52",
  YEAR = "2019",
  NUMBER = "6",
  MONTH = oct,
  PAGES = "xx-yy",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201309"
}

@article{bb206208,
  AUTHOR = "Zhang, Z. and Xu, D. and Ouyang, W. and Tan, C.",
  TITLE = "Show, Tell and Summarize: Dense Video Captioning Using Visual Cue Aided Sentence Summarization",
  JOURNAL = CirSysVideo,
  VOLUME = "30",
  YEAR = "2020",
  NUMBER = "9",
  MONTH = sep,
  PAGES = "3130--3139",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201310"
}

@article{bb206209,
  AUTHOR = "Zhang, W. and Wang, B. R. and Ma, L. and Liu, W.",
  TITLE = "Reconstruct and Represent Video Contents for Captioning via Reinforcement Learning",
  JOURNAL = PAMI,
  VOLUME = "42",
  YEAR = "2020",
  NUMBER = "12",
  MONTH = dec,
  PAGES = "3088--3101",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201311"
}

@article{bb206210,
  AUTHOR = "Lee, S. and Kim, I.",
  TITLE = "{DVC-Net}: A deep neural network model for dense video captioning",
  JOURNAL = IET-CV,
  VOLUME = "15",
  YEAR = "2021",
  NUMBER = "1",
  PAGES = "12--23",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201312"
}

@article{bb206211,
  AUTHOR = "Qi, S. S. and Yang, L. X.",
  TITLE = "Video captioning via a symmetric bidirectional decoder",
  JOURNAL = IET-CV,
  VOLUME = "15",
  YEAR = "2021",
  NUMBER = "4",
  PAGES = "283--296",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201313"
}

@article{bb206212,
  AUTHOR = "Li, L. and Zhang, Y. D. and Tang, S. and Xie, L. X. and Li, X. Y. and Tian, Q.",
  TITLE = "Adaptive Spatial Location With Balanced Loss for Video Captioning",
  JOURNAL = CirSysVideo,
  VOLUME = "32",
  YEAR = "2022",
  NUMBER = "1",
  MONTH = jan,
  PAGES = "17--30",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201314"
}

@article{bb206213,
  AUTHOR = "Zheng, Y. and Zhang, Y. and Feng, R. and Zhang, T. and Fan, W. G.",
  TITLE = "Stacked Multimodal Attention Network for Context-Aware Video Captioning",
  JOURNAL = CirSysVideo,
  VOLUME = "32",
  YEAR = "2022",
  NUMBER = "1",
  MONTH = jan,
  PAGES = "31--42",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201315"
}

@article{bb206214,
  AUTHOR = "Li, L. and Gao, X. Y. and Deng, J. and Tu, Y. and Zha, Z. J. and Huang, Q. M.",
  TITLE = "Long Short-Term Relation Transformer With Global Gating for Video Captioning",
  JOURNAL = IP,
  VOLUME = "31",
  YEAR = "2022",
  PAGES = "2726--2738",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201316"
}

@article{bb206215,
  AUTHOR = "Munusamy, H. and Sekhar, C. C.",
  TITLE = "Video captioning using Semantically Contextual Generative Adversarial Network",
  JOURNAL = CVIU,
  VOLUME = "221",
  YEAR = "2022",
  PAGES = "103453",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201317"
}

@article{bb206216,
  AUTHOR = "Wang, H. and Lin, G. S. and Hoi, S. C. H. and Miao, C. Y.",
  TITLE = "Cross-Modal Graph With Meta Concepts for Video Captioning",
  JOURNAL = IP,
  VOLUME = "31",
  YEAR = "2022",
  PAGES = "5150--5162",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201318"
}

@article{bb206217,
  AUTHOR = "Xiao, H. and Shi, J. L.",
  TITLE = "Diverse video captioning through latent variable expansion",
  JOURNAL = PRL,
  VOLUME = "160",
  YEAR = "2022",
  PAGES = "19--25",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201319"
}

@article{bb206218,
  AUTHOR = "Prudviraj, J. and Reddy, M. I. and Vishnu, C. and Mohan, C. K.",
  TITLE = "{AAP-MIT}: Attentive Atrous Pyramid Network and Memory Incorporated Transformer for Multisentence Video Description",
  JOURNAL = IP,
  VOLUME = "31",
  YEAR = "2022",
  PAGES = "5559--5569",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201320"
}

@article{bb206219,
  AUTHOR = "Xu, W. and Miao, Z. J. and Yu, J. and Tian, Y. and Wan, L. and Ji, Q.",
  TITLE = "Bridging Video and Text: A Two-Step Polishing Transformer for Video Captioning",
  JOURNAL = CirSysVideo,
  VOLUME = "32",
  YEAR = "2022",
  NUMBER = "9",
  MONTH = sep,
  PAGES = "6293--6307",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201321"
}

@article{bb206220,
  AUTHOR = "Wu, B. F. and Niu, G. C. and Yu, J. and Xiao, X. Y. and Zhang, J. and Wu, H.",
  TITLE = "Towards Knowledge-Aware Video Captioning via Transitive Visual Relationship Detection",
  JOURNAL = CirSysVideo,
  VOLUME = "32",
  YEAR = "2022",
  NUMBER = "10",
  MONTH = oct,
  PAGES = "6753--6765",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201322"
}

@article{bb206221,
  AUTHOR = "Yan, L. Q. and Ma, S. Q. and Wang, Q. F. and Chen, Y. J. and Zhang, X. Y. and Savakis, A. and Liu, D. F.",
  TITLE = "Video Captioning Using Global-Local Representation",
  JOURNAL = CirSysVideo,
  VOLUME = "32",
  YEAR = "2022",
  NUMBER = "10",
  MONTH = oct,
  PAGES = "6642--6656",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201323"
}

@article{bb206222,
  AUTHOR = "Subramaniam, A. and Vaidya, J. and Ameen, M. A. M. and Nambiar, A. and Mittal, A.",
  TITLE = "Co-segmentation inspired attention module for video-based computer vision tasks",
  JOURNAL = CVIU,
  VOLUME = "223",
  YEAR = "2022",
  PAGES = "103532",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201324"
}

@article{bb206223,
  AUTHOR = "Liu, F. L. and Wu, X. and You, C. and Ge, S. and Zou, Y. X. and Sun, X.",
  TITLE = "Aligning Source Visual and Target Language Domains for Unpaired Video Captioning",
  JOURNAL = PAMI,
  VOLUME = "44",
  YEAR = "2022",
  NUMBER = "12",
  MONTH = dec,
  PAGES = "9255--9268",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201325"
}

@article{bb206224,
  AUTHOR = "Yuan, Y. T. and Ma, L. and Zhu, W.",
  TITLE = "Syntax Customized Video Captioning by Imitating Exemplar Sentences",
  JOURNAL = PAMI,
  VOLUME = "44",
  YEAR = "2022",
  NUMBER = "12",
  MONTH = dec,
  PAGES = "10209--10221",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201326"
}

@article{bb206225,
  AUTHOR = "Chen, H. R. and Li, J. and Frintrop, S. and Hu, X. L.",
  TITLE = "The {MSR-Video} to {Text} dataset with clean annotations",
  JOURNAL = CVIU,
  VOLUME = "225",
  YEAR = "2022",
  PAGES = "103581",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201327"
}

@article{bb206226,
  AUTHOR = "Moctezuma, D. and Ramirez delReal, T. and Ruiz, G. and Gonzalez Chavez, O.",
  TITLE = "Video captioning: A comparative review of where we are and which could be the route",
  JOURNAL = CVIU,
  VOLUME = "231",
  YEAR = "2023",
  PAGES = "103671",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201328"
}

@inproceedings{bb206227,
  AUTHOR = "Seo, P. H. and Nagrani, A. and Arnab, A. and Schmid, C.",
  TITLE = "End-to-end Generative Pretraining for Multimodal Video Captioning",
  BOOKTITLE = CVPR22,
  YEAR = "2022",
  PAGES = "17938--17947",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201329"
}

@inproceedings{bb206228,
  AUTHOR = "Ye, H. H. and Li, G. R. and Qi, Y. and Wang, S. H. and Huang, Q. M. and Yang, M. H.",
  TITLE = "Hierarchical Modular Network for Video Captioning",
  BOOKTITLE = CVPR22,
  YEAR = "2022",
  PAGES = "17918--17927",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201330"
}

@inproceedings{bb206229,
  AUTHOR = "Lin, K. and Li, L. J. and Lin, C. C. and Ahmed, F. and Gan, Z. and Liu, Z. C. and Lu, Y. and Wang, L. J.",
  TITLE = "{SwinBERT}: End-to-End Transformers with Sparse Attention for Video Captioning",
  BOOKTITLE = CVPR22,
  YEAR = "2022",
  PAGES = "17928--17937",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201331"
}

@inproceedings{bb206230,
  AUTHOR = "Shi, Y. and Yang, X. and Xu, H. Y. and Yuan, C. F. and Li, B. and Hu, W. M. and Zha, Z. J.",
  TITLE = "{EMScore}: Evaluating Video Captioning via Coarse-Grained and Fine-Grained Embedding Matching",
  BOOKTITLE = CVPR22,
  YEAR = "2022",
  PAGES = "17908--17917",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201332"
}

@inproceedings{bb206231,
  AUTHOR = "Chen, S. X. and Jiang, Y. G.",
  TITLE = "Motion Guided Region Message Passing for Video Captioning",
  BOOKTITLE = ICCV21,
  YEAR = "2021",
  PAGES = "1523--1532",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201333"
}

@inproceedings{bb206232,
  AUTHOR = "Joshi, P. and Saharia, C. and Singh, V. and Gautam, D. and Ramakrishnan, G. and Jyothi, P.",
  TITLE = "A Tale of Two Modalities for Video Captioning",
  BOOKTITLE = MMVAMTC19,
  YEAR = "2019",
  PAGES = "3708--3712",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201334"
}

@inproceedings{bb206233,
  AUTHOR = "Wang, T. and Zhang, R. and Lu, Z. C. and Zheng, F. and Cheng, R. and Luo, P.",
  TITLE = "End-to-End Dense Video Captioning with Parallel Decoding",
  BOOKTITLE = ICCV21,
  YEAR = "2021",
  PAGES = "6827--6837",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201335"
}

@inproceedings{bb206234,
  AUTHOR = "Yang, B. and Zou, Y. X.",
  TITLE = "Visual Oriented Encoder: Integrating Multimodal and Multi-Scale Contexts for Video Captioning",
  BOOKTITLE = ICPR21,
  YEAR = "2021",
  PAGES = "188--195",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201336"
}

@inproceedings{bb206235,
  AUTHOR = "Perez Martin, J. and Bustos, B. and Perez, J.",
  TITLE = "Attentive Visual Semantic Specialized Network for Video Captioning",
  BOOKTITLE = ICPR21,
  YEAR = "2021",
  PAGES = "5767--5774",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201337"
}

@inproceedings{bb206236,
  AUTHOR = "Lu, M. and Li, X. and Liu, C.",
  TITLE = "Context Visual Information-based Deliberation Network for Video Captioning",
  BOOKTITLE = ICPR21,
  YEAR = "2021",
  PAGES = "9812--9818",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201338"
}

@inproceedings{bb206237,
  AUTHOR = "Olivastri, S. and Singh, G. and Cuzzolin, F.",
  TITLE = "End-to-End Video Captioning",
  BOOKTITLE = HVU19,
  YEAR = "2019",
  PAGES = "1474--1482",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201339"
}

@inproceedings{bb206238,
  AUTHOR = "Li, L. and Gong, B.",
  TITLE = "End-to-End Video Captioning With Multitask Reinforcement Learning",
  BOOKTITLE = WACV19,
  YEAR = "2019",
  PAGES = "339--348",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201340"
}

@inproceedings{bb206239,
  AUTHOR = "Wang, B. and Ma, L. and Zhang, W. and Liu, W.",
  TITLE = "Reconstruction Network for Video Captioning",
  BOOKTITLE = CVPR18,
  YEAR = "2018",
  PAGES = "7622--7631",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201341"
}

@inproceedings{bb206240,
  AUTHOR = "Li, Y. and Yao, T. and Pan, Y. and Chao, H. and Mei, T.",
  TITLE = "Jointly Localizing and Describing Events for Dense Video Captioning",
  BOOKTITLE = CVPR18,
  YEAR = "2018",
  PAGES = "7492--7500",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201342"
}

@inproceedings{bb206241,
  AUTHOR = "Wang, J. and Jiang, W. and Ma, L. and Liu, W. and Xu, Y.",
  TITLE = "Bidirectional Attentive Fusion with Context Gating for Dense Video Captioning",
  BOOKTITLE = CVPR18,
  YEAR = "2018",
  PAGES = "7190--7198",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201343"
}

@inproceedings{bb206242,
  AUTHOR = "Wu, X. and Li, G. and Cao, Q. and Ji, Q. and Lin, L.",
  TITLE = "Interpretable Video Captioning via Trajectory Structured Localization",
  BOOKTITLE = CVPR18,
  YEAR = "2018",
  PAGES = "6829--6837",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201344"
}

@inproceedings{bb206243,
  AUTHOR = "Wang, X. and Chen, W. and Wu, J. and Wang, Y. and Wang, W. Y.",
  TITLE = "Video Captioning via Hierarchical Reinforcement Learning",
  BOOKTITLE = CVPR18,
  YEAR = "2018",
  PAGES = "4213--4222",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201345"
}

@inproceedings{bb206244,
  AUTHOR = "Zhou, L. and Zhou, Y. and Corso, J. J. and Socher, R. and Xiong, C.",
  TITLE = "End-to-End Dense Video Captioning with Masked Transformer",
  BOOKTITLE = CVPR18,
  YEAR = "2018",
  PAGES = "8739--8748",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201346"
}

@inproceedings{bb206245,
  AUTHOR = "Yang, D. and Yuan, C.",
  TITLE = "Hierarchical Context Encoding for Events Captioning in Videos",
  BOOKTITLE = ICIP18,
  YEAR = "2018",
  PAGES = "1288--1292",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201347"
}

@inproceedings{bb206246,
  AUTHOR = "Shen, Z. Q. and Li, J. G. and Su, Z. and Li, M. J. and Chen, Y. R. and Jiang, Y. G. and Xue, X. Y.",
  TITLE = "Weakly Supervised Dense Video Captioning",
  BOOKTITLE = CVPR17,
  YEAR = "2017",
  PAGES = "5159--5167",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201348"
}

@inproceedings{bb206247,
  AUTHOR = "Baraldi, L. and Grana, C. and Cucchiara, R.",
  TITLE = "Hierarchical Boundary-Aware Neural Encoder for Video Captioning",
  BOOKTITLE = CVPR17,
  YEAR = "2017",
  PAGES = "3185--3194",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201349"
}

@inproceedings{bb206248,
  AUTHOR = "Pan, P. B. and Xu, Z. W. and Yang, Y. and Wu, F. and Zhuang, Y. T.",
  TITLE = "Hierarchical Recurrent Neural Encoder for Video Representation with Application to Captioning",
  BOOKTITLE = CVPR16,
  YEAR = "2016",
  PAGES = "1029--1038",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201350"
}

@inproceedings{bb206249,
  AUTHOR = "Yu, H. N. and Wang, J. and Huang, Z. H. and Yang, Y. and Xu, W.",
  TITLE = "Video Paragraph Captioning Using Hierarchical Recurrent Neural Networks",
  BOOKTITLE = CVPR16,
  YEAR = "2016",
  PAGES = "4584--4593",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201351"
}

@inproceedings{bb206250,
  AUTHOR = "Shin, A. and Ohnishi, K. and Harada, T.",
  TITLE = "Beyond caption to narrative: Video captioning with multiple sentences",
  BOOKTITLE = ICIP16,
  YEAR = "2016",
  PAGES = "3364--3368",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT201352"
}

@article{bb206251,
  AUTHOR = "Vakali, A. and Hacid, M. S. and Elmagarmid, A.",
  TITLE = "{MPEG-7} based description schemes for multi-level video content classification",
  JOURNAL = IVC,
  VOLUME = "22",
  YEAR = "2004",
  NUMBER = "5",
  MONTH = may,
  PAGES = "367--378",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201353"
}

@article{bb206252,
  AUTHOR = "Fonseca, P. M. and Pereira, F.",
  TITLE = "Automatic video summarization based on {MPEG-7} descriptions",
  JOURNAL = SP:IC,
  VOLUME = "19",
  YEAR = "2004",
  NUMBER = "8",
  MONTH = sep,
  PAGES = "685--699",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201354"
}

@article{bb206253,
  AUTHOR = "Mrak, M. and Calic, J. and Kondoz, A. M.",
  TITLE = "Fast analysis of scalable video for adaptive browsing interfaces",
  JOURNAL = CVIU,
  VOLUME = "113",
  YEAR = "2009",
  NUMBER = "3",
  MONTH = mar,
  PAGES = "425--434",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201355"
}

@inproceedings{bb206254,
  AUTHOR = "Calic, J. and Mrak, M. and Kondoz, A. M.",
  TITLE = "Flexible generation of video summaries from layered video bit-streams",
  BOOKTITLE = ICIP08,
  YEAR = "2008",
  PAGES = "2516--2519",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201356"
}

@article{bb206255,
  AUTHOR = "Herranz, L. and Martinez, J. M.",
  TITLE = "An integrated approach to summarization and adaptation using {H.264/MPEG-4} {SVC}",
  JOURNAL = SP:IC,
  VOLUME = "24",
  YEAR = "2009",
  NUMBER = "6",
  MONTH = jul,
  PAGES = "499--509",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201357"
}

@article{bb206256,
  AUTHOR = "Herranz, L. and Martinez, J. M.",
  TITLE = "On the use of hierarchical prediction structures for efficient summary generation of {H.264/AVC} bitstreams",
  JOURNAL = SP:IC,
  VOLUME = "24",
  YEAR = "2009",
  NUMBER = "8",
  MONTH = sep,
  PAGES = "615--629",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201358"
}

@article{bb206257,
  AUTHOR = "Matos, N. and Pereira, F.",
  TITLE = "Automatic creation and evaluation of {MPEG-7} compliant summary descriptions for generic audiovisual content",
  JOURNAL = SP:IC,
  VOLUME = "23",
  YEAR = "2008",
  NUMBER = "8",
  MONTH = sep,
  PAGES = "581--598",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201359"
}

@article{bb206258,
  AUTHOR = "Ren, J. C. and Jiang, J. M. and Feng, Y.",
  TITLE = "Activity-driven content adaptation for effective video summarization",
  JOURNAL = JVCIR,
  VOLUME = "21",
  YEAR = "2010",
  NUMBER = "8",
  MONTH = nov,
  PAGES = "930--938",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201360"
}

@article{bb206259,
  AUTHOR = "Almeida, J. and Leite, N. J. and da Silva Torres, R.",
  TITLE = "{VISON}: {VIdeo} Summarization for {ONline} applications",
  JOURNAL = PRL,
  VOLUME = "33",
  YEAR = "2012",
  NUMBER = "4",
  MONTH = mar,
  PAGES = "397--409",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201361"
}

@inproceedings{bb206260,
  AUTHOR = "Almeida, J. and Leite, N. J. and da Silva Torres, R.",
  TITLE = "Comparison of video sequences with histograms of motion patterns",
  BOOKTITLE = ICIP11,
  YEAR = "2011",
  PAGES = "3673--3676",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201362"
}

@inproceedings{bb206261,
  AUTHOR = "Almeida, J. and Leite, N. J. and da Silva Torres, R.",
  TITLE = "Rapid Cut Detection on Compressed Video",
  BOOKTITLE = CIARP11,
  YEAR = "2011",
  PAGES = "71--78",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201363"
}

% NOTE(review): PAGES is an upstream placeholder, not a real page range.
% Replace it with the article number or pages from the publisher record.
@article{bb206262,
  AUTHOR = "Basavarajaiah, M. and Sharma, P.",
  TITLE = "Survey of Compressed Domain Video Summarization Techniques",
  JOURNAL = Surveys,
  VOLUME = "52",
  YEAR = "2019",
  NUMBER = "6",
  MONTH = oct,
  PAGES = "xx-yy",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201364"
}

@inproceedings{bb206263,
  AUTHOR = "Lee, J. H. and Kim, W. Y.",
  TITLE = "Video Summarization and Retrieval System Using Face Recognition and {MPEG-7} Descriptors",
  BOOKTITLE = CIVR04,
  YEAR = "2004",
  PAGES = "170--178",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201365"
}

@inproceedings{bb206264,
  AUTHOR = "Soysal, M. and Alatan, A. A.",
  TITLE = "Combining {MPEG-7} Based Visual Experts for Reaching Semantics",
  BOOKTITLE = VLBV03,
  YEAR = "2003",
  PAGES = "66--75",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201366"
}

@inproceedings{bb206265,
  AUTHOR = "Divakaran, A. and Peker, K. A. and Radhakrishnan, R. and Xiong, Z. Y. and Cabasson, R.",
  TITLE = "Video Summarization using {MPEG-7} Motion Activity and Audio Descriptors",
  BOOKTITLE = VideoMining03,
  YEAR = "2003",
  PAGES = "Chapter 4",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201367"
}

@inproceedings{bb206266,
  AUTHOR = "Sugano, M. and Nakajima, Y. and Yanagihara, H.",
  TITLE = "Automated {MPEG} audio-video summarization and description",
  BOOKTITLE = ICIP02,
  YEAR = "2002",
  PAGES = "I: 956--959",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201368"
}

@inproceedings{bb206267,
  AUTHOR = "Jaimes, A. and Echigo, T. and Teraguchi, M. and Satoh, F.",
  TITLE = "Learning personalized video highlights from detailed {MPEG-7} metadata",
  BOOKTITLE = ICIP02,
  YEAR = "2002",
  PAGES = "I: 133--136",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201369"
}

@inproceedings{bb206268,
  AUTHOR = "Lin, C. Y. and Tseng, B. L. and Naphade, M. R. and Natsev, A. P. and Smith, J. R.",
  TITLE = "{VideoAL}: A novel end-to-end {MPEG-7} video automatic labeling system",
  BOOKTITLE = ICIP03,
  YEAR = "2003",
  PAGES = "III: 53--56",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201370"
}

@inproceedings{bb206269,
  AUTHOR = "Kim, J. G. and Chang, H. S. and Kim, J. W. and Kim, H. M.",
  TITLE = "Efficient Camera Motion Characterization for {MPEG} Video Indexing",
  BOOKTITLE = ICME00,
  YEAR = "2000",
  PAGES = "TP11",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201371"
}

% NOTE(review): bb206270 through bb206273 use BOOKTITLE = UMD and carry no
% pages; presumably these are institutional technical reports rather than
% conference papers. Confirm before changing the entry type.
@inproceedings{bb206270,
  AUTHOR = "DeMenthon, D. F. and Megret, R.",
  TITLE = "Spatio-temporal Segmentation of Video by Hierarchical Mean Shift Analysis",
  BOOKTITLE = UMD,
  YEAR = "2002",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201372"
}

@inproceedings{bb206271,
  AUTHOR = "Megret, R. and DeMenthon, D. F.",
  TITLE = "A Survey of Spatio-temporal Grouping Techniques",
  BOOKTITLE = UMD,
  YEAR = "2002",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201373"
}

@inproceedings{bb206272,
  AUTHOR = "DeMenthon, D. F. and Latecki, L. J. and Rosenfeld, A. and Stueckelberg, M. V.",
  TITLE = "Relevance Ranking of Video Data using Hidden {Markov} Model Distances and Polygon Simplification",
  BOOKTITLE = UMD,
  YEAR = "2001",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201374"
}

@inproceedings{bb206273,
  AUTHOR = "DeMenthon, D. F. and Kobla, V. and Doermann, D.",
  TITLE = "Video Summarization by Curve Simplification",
  BOOKTITLE = UMD,
  YEAR = "1998",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201375"
}

@inproceedings{bb206274,
  AUTHOR = "Yoon, K. and DeMenthon, D. F. and Doermann, D.",
  TITLE = "Event Detection from {MPEG} Video in the Compressed Domain",
  BOOKTITLE = ICPR00,
  YEAR = "2000",
  PAGES = "Vol I: 819--822",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT201376"
}

@article{bb206275,
  AUTHOR = "Doulamis, A. D. and Doulamis, N. D. and Kollias, S. D.",
  TITLE = "A fuzzy video content representation for video summarization and content-based retrieval",
  JOURNAL = SP,
  VOLUME = "80",
  YEAR = "2000",
  NUMBER = "6",
  MONTH = jun,
  PAGES = "1049--1067",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201377"
}

% NOTE(review): same title and BIBSOURCE anchor as bb206275, single page and
% reversed author order; presumably a correction notice for that paper. Confirm.
@article{bb206276,
  AUTHOR = "Kollias, S. D. and Doulamis, N. D. and Doulamis, A. D.",
  TITLE = "A fuzzy video content representation for video summarization and content-based retrieval",
  JOURNAL = SP,
  VOLUME = "82",
  YEAR = "2002",
  NUMBER = "4",
  MONTH = apr,
  PAGES = "545",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201377"
}

% PAGES corrected from 501-157, whose end page was lower than its start page.
% NOTE(review): 517 is the end page as recalled from the published issue;
% verify against the publisher record.
@article{bb206277,
  AUTHOR = "Doulamis, N. D. and Doulamis, A. D. and Avrithis, Y. S. and Ntalianis, K. S. and Kollias, S. D.",
  TITLE = "Efficient Summarization of Stereoscopic Video Sequences",
  JOURNAL = CirSysVideo,
  VOLUME = "10",
  YEAR = "2000",
  NUMBER = "4",
  MONTH = jun,
  PAGES = "501--517",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201378"
}

@inproceedings{bb206278,
  AUTHOR = "Ntalianis, K. S. and Doulamis, A. D. and Tsapatsoulis, N.",
  TITLE = "Implicit visual concept modeling in image/video annotation",
  BOOKTITLE = ARTEMIS10,
  YEAR = "2010",
  PAGES = "33--38",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201379"
}

@inproceedings{bb206279,
  AUTHOR = "Doulamis, A. D. and Ntalianis, K. S.",
  TITLE = "On the Fly Semantic Annotation and Modelling of Multimedia",
  BOOKTITLE = WSSIP09,
  YEAR = "2009",
  PAGES = "1--4",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201380"
}

@inproceedings{bb206280,
  AUTHOR = "Doulamis, N. D. and Doulamis, A. D. and Avrithis, Y. S. and Kollias, S. D.",
  TITLE = "Video content representation using optimal extraction of frames and scenes",
  BOOKTITLE = ICIP98,
  YEAR = "1998",
  PAGES = "I: 875--879",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201381"
}

@article{bb206281,
  AUTHOR = "Amir, A. and Ashour, G. and Srinivasan, S.",
  TITLE = "Automatic generation of conference video proceedings",
  JOURNAL = JVCIR,
  VOLUME = "15",
  YEAR = "2004",
  NUMBER = "3",
  MONTH = sep,
  PAGES = "467--488",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201382"
}

@article{bb206282,
  AUTHOR = "Metze, F. and Ding, D. and Younessian, E. and Hauptmann, A. G.",
  TITLE = "Beyond audio and video retrieval: Topic-oriented multimedia summarization",
  JOURNAL = MultInfoRetr,
  VOLUME = "2",
  YEAR = "2013",
  NUMBER = "2",
  MONTH = jun,
  PAGES = "131--144",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201383"
}

@inproceedings{bb206283,
  AUTHOR = "Ding, D. and Metze, F. and Rawat, S. and Schulam, P. F. and Burger, S. and Younessian, E. and Bao, L. and Christel, M. G. and Hauptmann, A. G.",
  TITLE = "Beyond audio and video retrieval: Towards multimedia summarization",
  BOOKTITLE = ICMR12,
  YEAR = "2012",
  PAGES = "2",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201384"
}

@article{bb206284,
  AUTHOR = "Bian, J. W. and Yang, Y. and Zhang, H. and Chua, T. S.",
  TITLE = "Multimedia Summarization for Social Events in Microblog Stream",
  JOURNAL = MultMed,
  VOLUME = "17",
  YEAR = "2015",
  NUMBER = "2",
  MONTH = feb,
  PAGES = "216--228",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201385"
}

@article{bb206285,
  AUTHOR = "Kuanar, S. K. and Ranga, K. B. and Chowdhury, A. S.",
  TITLE = "Multi-View Video Summarization Using Bipartite Matching Constrained Optimum-Path Forest Clustering",
  JOURNAL = MultMed,
  VOLUME = "17",
  YEAR = "2015",
  NUMBER = "8",
  MONTH = aug,
  PAGES = "1166--1173",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201386"
}

@article{bb206286,
  AUTHOR = "Tan, C. C. and Ngo, C. W.",
  TITLE = "On the use of commonsense ontology for multimedia event recounting",
  JOURNAL = MultInfoRetr,
  VOLUME = "5",
  YEAR = "2016",
  NUMBER = "2",
  MONTH = jun,
  PAGES = "73--88",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201387"
}

@article{bb206287,
  AUTHOR = "Wu, F. and Fang, H. and Li, X. and Tang, S. and Lu, W. and Yang, Y. and Zhu, W. and Zhuang, Y.",
  TITLE = "Aspect Learning for Multimedia Summarization via Nonparametric {Bayesian}",
  JOURNAL = CirSysVideo,
  VOLUME = "26",
  YEAR = "2016",
  NUMBER = "10",
  MONTH = oct,
  PAGES = "1931--1942",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201388"
}

@article{bb206288,
  AUTHOR = "Jiang, Y. G. and Wu, Z. X. and Tang, J. H. and Li, Z. C. and Xue, X. Y. and Chang, S. F.",
  TITLE = "Modeling Multimodal Clues in a Hybrid Deep Learning Framework for Video Classification",
  JOURNAL = MultMed,
  VOLUME = "20",
  YEAR = "2018",
  NUMBER = "11",
  MONTH = nov,
  PAGES = "3137--3147",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201389"
}

@article{bb206289,
  AUTHOR = "Wu, Z. X. and Li, H. D. and Zheng, Y. B. and Xiong, C. M. and Jiang, Y. G. and Davis, L. S.",
  TITLE = "A Coarse-to-Fine Framework for Resource Efficient Video Recognition",
  JOURNAL = IJCV,
  VOLUME = "129",
  YEAR = "2021",
  NUMBER = "11",
  MONTH = nov,
  PAGES = "2965--2977",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201390"
}

@article{bb206290,
  AUTHOR = "Tian, F. and Wang, Q. and Li, X. and Sun, N.",
  TITLE = "Heterogeneous multimedia cooperative annotation based on multimodal correlation learning",
  JOURNAL = JVCIR,
  VOLUME = "58",
  YEAR = "2019",
  PAGES = "544--553",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201391"
}

% NOTE(review): YEAR 2018 with VOLUME 35 may be an online-first date rather
% than the issue year; check against the publisher record.
@article{bb206291,
  AUTHOR = "Du, X. T. and Yuan, J. and Hu, L. and Dai, Y.",
  TITLE = "Description generation of open-domain videos incorporating multimodal features and bidirectional encoder",
  JOURNAL = VC,
  VOLUME = "35",
  YEAR = "2018",
  NUMBER = "12",
  MONTH = dec,
  PAGES = "1703--1712",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201392"
}

@article{bb206292,
  AUTHOR = "Li, J. and Wong, Y. and Zhao, Q. and Kankanhalli, M. S.",
  TITLE = "Video Storytelling: Textual Summaries for Events",
  JOURNAL = MultMed,
  VOLUME = "22",
  YEAR = "2020",
  NUMBER = "2",
  MONTH = feb,
  PAGES = "554--565",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201393"
}

@article{bb206293,
  AUTHOR = "Cascianelli, S. and Costante, G. and Devo, A. and Ciarfuglia, T. A. and Valigi, P. and Fravolini, M. L.",
  TITLE = "The Role of the Input in Natural Language Video Description",
  JOURNAL = MultMed,
  VOLUME = "22",
  YEAR = "2020",
  NUMBER = "1",
  MONTH = jan,
  PAGES = "271--283",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201394"
}

@inproceedings{bb206294,
  AUTHOR = "Bouritsas, G. and Koutras, P. and Zlatintsi, A. and Maragos, P.",
  TITLE = "Multimodal Visual Concept Learning with Weakly Supervised Techniques",
  BOOKTITLE = CVPR18,
  YEAR = "2018",
  PAGES = "4914--4923",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201395"
}

@inproceedings{bb206295,
  AUTHOR = "Wang, J. and Wang, W. and Huang, Y. and Wang, L. and Tan, T.",
  TITLE = "{M3}: Multimodal Memory Modelling for Video Captioning",
  BOOKTITLE = CVPR18,
  YEAR = "2018",
  PAGES = "7512--7520",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201396"
}

@inproceedings{bb206296,
  AUTHOR = "Kang, S. H. and Kim, J. Y. and Choi, H. and Kim, S. J. and Yoo, C. D.",
  TITLE = "Pivot Correlational Neural Network for Multimodal Video Categorization",
  BOOKTITLE = ECCV18,
  YEAR = "2018",
  PAGES = "XIV: 402--417",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201397"
}

@inproceedings{bb206297,
  AUTHOR = "Mazaheri, A. and Shah, M.",
  TITLE = "Visual Text Correction",
  BOOKTITLE = ECCV18,
  YEAR = "2018",
  PAGES = "XIII: 159--175",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201398"
}

@inproceedings{bb206298,
  AUTHOR = "Rudinac, S. and Chua, T. S. and Diaz Ferreyra, N. and Friedland, G. and Gornostaja, T. and Huet, B. and Kaptein, R. and Linden, K. and Moens, M. F. and Peltonen, J. and Redi, M. and Schedl, M. and Shamma, D. A. and Smeaton, A. and Xie, L. X.",
  TITLE = "Rethinking Summarization and Storytelling for Modern Social Multimedia",
  BOOKTITLE = MMMod18,
  YEAR = "2018",
  PAGES = "I: 632--644",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201399"
}

@inproceedings{bb206299,
  AUTHOR = "Hori, C. and Hori, T. and Lee, T. Y. and Zhang, Z. M. and Harsham, B. and Hershey, J. R. and Marks, T. K. and Sumi, K.",
  TITLE = "Attention-Based Multimodal Fusion for Video Description",
  BOOKTITLE = ICCV17,
  YEAR = "2017",
  PAGES = "4203--4212",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT201400"
}