% Conference-paper (inproceedings) records bb184000 through bb184099, one field per line.
%
% Field conventions used by these records:
%   AUTHOR     "Last, Initials" form, names separated by " and ".
%   TITLE      coined method names and acronyms are brace-protected so that
%              sentence-casing styles keep their capitalisation.
%   BOOKTITLE  bare macro names (CVPR23, ICCV23, ECCV22, ...). No string
%              definitions are visible in this part of the file, so they are
%              presumably declared elsewhere -- TODO confirm; an undefined
%              macro produces a warning and empty text.
%   PAGES      ranges use the double hyphen. A leading roman numeral followed
%              by a colon (e.g. "XXVI:38--56") is kept from the original data
%              and presumably names the proceedings part -- TODO confirm.
%   BIBSOURCE  non-standard field holding the URL the record was taken from;
%              standard styles ignore unknown fields.

@inproceedings{bb184000,
  AUTHOR    = "Warchocki, J. and Oprescu, T. and Wang, Y.H. and Damacus, A. and Misterka, P. and Bruintjes, R.J. and Lengyel, A. and Strafforello, O. and van Gemert, J.C.",
  TITLE     = "Benchmarking Data Efficiency and Computational Efficiency of Temporal Action Localization Models",
  BOOKTITLE = CVEU23,
  YEAR      = "2023",
  PAGES     = "3000--3008",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179471"
}

@inproceedings{bb184001,
  AUTHOR    = "Heigold, G. and Keysers, D. and Minderer, M. and Lucic, M. and Gritsenko, A. and Yu, F. and Bewley, A. and Kipf, T.",
  TITLE     = "Video {OWL-ViT}: Temporally-consistent open-world localization in video",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "13756--13765",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179472"
}

@inproceedings{bb184002,
  AUTHOR    = "Shao, J.Y. and Wang, X.H. and Quan, R.J. and Zheng, J.J. and Yang, J. and Yang, Y.",
  TITLE     = "Action Sensitivity Learning for Temporal Action Localization",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "13411--13423",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179473"
}

@inproceedings{bb184003,
  AUTHOR    = "Barrios, W. and Soldan, M. and Ceballos Arroyo, A.M. and Heilbron, F.C. and Ghanem, B.",
  TITLE     = "Localizing Moments in Long Video Via Multimodal Guidance",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "13621--13632",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179474"
}

@inproceedings{bb184004,
  AUTHOR    = "Wang, G.Q. and Zhao, P. and Zhao, C. and Yang, S. and Cheng, J. and Leng, L. and Liao, J.X. and Guo, Q.H.",
  TITLE     = "Weakly-Supervised Action Localization by Hierarchically-structured Latent Attention Modeling",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "10169--10179",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179475"
}

@inproceedings{bb184005,
  AUTHOR    = "Shah, A. and Lundell, B. and Sawhney, H. and Chellappa, R.",
  TITLE     = "{STEPs}: Self-Supervised Key Step Extraction and Localization from Unlabeled Procedural Videos",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "10341--10353",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179476"
}

@inproceedings{bb184006,
  AUTHOR    = "Liu, Q. and Wang, Z. and Rong, S. and Li, J.J. and Zhang, Y.X.",
  TITLE     = "Revisiting Foreground and Background Separation in Weakly-supervised Temporal Action Localization: A Clustering-based Approach",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "10399--10409",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179477"
}

@inproceedings{bb184007,
  AUTHOR    = "Tang, X.J. and Fan, J.S. and Luo, C.C. and Zhang, Z.X. and Zhang, M. and Yang, Z.Y.",
  TITLE     = "{DDG-Net}: Discriminability-Driven Graph Network for Weakly-supervised Temporal Action Localization",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "6599--6609",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179478"
}

@inproceedings{bb184008,
  AUTHOR    = "Croitoru, I. and Bogolin, S.V. and Albanie, S. and Liu, Y. and Wang, Z.W. and Yoon, S.H. and Dernoncourt, F. and Jin, H.L. and Bui, T.",
  TITLE     = "Moment Detection in Long Tutorial Videos",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "2594--2604",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179479"
}

@inproceedings{bb184009,
  AUTHOR    = "Xia, K. and Wang, L. and Zhou, S.P. and Hua, G. and Tang, W.",
  TITLE     = "Learning from Noisy Pseudo Labels for Semi-Supervised Temporal Action Localization",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "10126--10135",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179480"
}

@inproceedings{bb184010,
  AUTHOR    = "Geng, T.T. and Wang, T. and Duan, J.M. and Cong, R. and Zheng, F.",
  TITLE     = "Dense-Localizing Audio-Visual Events in Untrimmed Videos: A Large-Scale Benchmark and Baseline",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "22942--22951",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179481"
}

@inproceedings{bb184011,
  AUTHOR    = "Zheng, W.R. and Yoshihashi, R. and Kawakami, R. and Sato, I. and Kanezaki, A.",
  TITLE     = "Multi Event Localization by Audio-Visual Fusion with Omnidirectional Camera and Microphone Array",
  BOOKTITLE = MULA23,
  YEAR      = "2023",
  PAGES     = "2566--2574",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179482"
}

% bb184012: title compound restored to "Query-Dependent" (the record read
% "Query: Dependent"). NOTE(review): confirm against the published paper.
@inproceedings{bb184012,
  AUTHOR    = "Moon, W.J. and Hyun, S. and Park, S.U. and Park, D. and Heo, J.P.",
  TITLE     = "Query-Dependent Video Representation for Moment Retrieval and Highlight Detection",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "23023--23033",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179483"
}

@inproceedings{bb184013,
  AUTHOR    = "Luo, D. and Huang, J. and Gong, S.G. and Jin, H.L. and Liu, Y.",
  TITLE     = "Towards Generalisable Video Moment Retrieval: Visual-Dynamic Injection to Image-Text Pre-Training",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "23045--23055",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179484"
}

@inproceedings{bb184014,
  AUTHOR    = "Cao, S.Q. and Luo, W.X. and Wang, B. and Zhang, W. and Ma, L.",
  TITLE     = "{E2E-LOAD}: End-to-End Long-form Online Action Detection",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "10388--10398",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179485"
}

% bb184015: fifth author corrected from "Lit, J." to "Li, J.".
% NOTE(review): confirm against the published author list.
@inproceedings{bb184015,
  AUTHOR    = "Shi, D.F. and Zhong, Y.J. and Cao, Q. and Ma, L. and Li, J. and Tao, D.C.",
  TITLE     = "{TriDet}: Temporal Action Detection with Relative Boundary Modeling",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "18857--18866",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179486"
}

@inproceedings{bb184016,
  AUTHOR    = "Wang, Y. and Li, Y.D. and Wang, H.B.",
  TITLE     = "Two-Stream Networks for Weakly-Supervised Temporal Action Localization with Semantic-Aware Mechanisms",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "18878--18887",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179487"
}

@inproceedings{bb184017,
  AUTHOR    = "Zala, A. and Cho, J. and Kottur, S. and Chen, X. and Oguz, B. and Mehdad, Y. and Bansal, M.",
  TITLE     = "Hierarchical Video-Moment Retrieval and Step-Captioning",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "23056--23065",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179488"
}

@inproceedings{bb184018,
  AUTHOR    = "Ju, C. and Zheng, K. and Liu, J.X. and Zhao, P. and Zhang, Y. and Chang, J.L. and Tian, Q. and Wang, Y.F.",
  TITLE     = "Distilling Vision-Language Pre-Training to Collaborate with Weakly-Supervised Temporal Action Localization",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "14751--14762",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179489"
}

@inproceedings{bb184019,
  AUTHOR    = "Chi, H.G. and Lee, K. and Agarwal, N. and Xu, Y. and Ramani, K. and Choi, C.",
  TITLE     = "{AdamsFormer} for Spatial Action Localization in the Future",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "17885--17895",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179490"
}

@inproceedings{bb184020,
  AUTHOR    = "Rizve, M.N. and Mittal, G. and Yu, Y. and Hall, M. and Sajeev, S. and Shah, M. and Chen, M.",
  TITLE     = "{PivoTAL}: Prior-Driven Supervision for Weakly-Supervised Temporal Action Localization",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "22992--23002",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179491"
}

@inproceedings{bb184021,
  AUTHOR    = "Zhou, J.Q. and Huang, L. and Wang, L. and Liu, S. and Li, H.S.",
  TITLE     = "Improving Weakly Supervised Temporal Action Localization by Bridging Train-Test Gap in Pseudo Labels",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "23003--23012",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179492"
}

@inproceedings{bb184022,
  AUTHOR    = "Zhao, C. and Liu, S.M. and Mangalam, K. and Ghanem, B.",
  TITLE     = "{Re2TAL}: Rewiring Pretrained Video Backbones for Reversible Temporal Action Localization",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "10637--10647",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179493"
}

@inproceedings{bb184023,
  AUTHOR    = "Kang, H. and Kim, H. and An, J. and Cho, M. and Kim, S.J.",
  TITLE     = "Soft-Landing Strategy for Alleviating the Task Discrepancy Problem in Temporal Action Localization Tasks",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "6514--6523",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179494"
}

@inproceedings{bb184024,
  AUTHOR    = "Seol, M. and Kim, J. and Moon, J.",
  TITLE     = "{BMRN}: Boundary Matching and Refinement Network for Temporal Moment Localization with Natural Language",
  BOOKTITLE = ODRUM23,
  YEAR      = "2023",
  PAGES     = "5571--5579",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179495"
}

@inproceedings{bb184025,
  AUTHOR    = "Ren, H. and Yang, W.F. and Zhang, T.Z. and Zhang, Y.D.",
  TITLE     = "Proposal-Based Multiple Instance Learning for Weakly-Supervised Temporal Action Localization",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "2394--2404",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179496"
}

@inproceedings{bb184026,
  AUTHOR    = "Ren, H.R. and Ren, H. and Lu, H. and Jin, C.",
  TITLE     = "Weakly-Supervised Temporal Action Localization with Regional Similarity Consistency",
  BOOKTITLE = MMMod23,
  YEAR      = "2023",
  PAGES     = "I:69--81",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179497"
}

@inproceedings{bb184027,
  AUTHOR    = "Niu, Y. and Yang, J.Y. and Liang, C. and Huang, B. and Wang, Z.Y.",
  TITLE     = "A Spatio-Temporal Identity Verification Method for Person-Action Instance Search in Movies",
  BOOKTITLE = MMMod23,
  YEAR      = "2023",
  PAGES     = "I:82--94",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179498"
}

@inproceedings{bb184028,
  AUTHOR    = "Rai, A.K. and Krishna, T. and Dietlmeier, J. and McGuinness, K. and Smeaton, A.F. and O'Connor, N.E.",
  TITLE     = "Motion Aware Self-Supervision for Generic Event Boundary Detection",
  BOOKTITLE = WACV23,
  YEAR      = "2023",
  PAGES     = "2727--2738",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179499"
}

@inproceedings{bb184029,
  AUTHOR    = "Mahmud, T. and Marculescu, D.",
  TITLE     = "{AVE-CLIP}: {AudioCLIP}-based Multi-window Temporal Transformer for Audio Visual Event Localization",
  BOOKTITLE = WACV23,
  YEAR      = "2023",
  PAGES     = "5147--5156",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179500"
}

@inproceedings{bb184030,
  AUTHOR    = "Zhou, J.X. and Wu, Y.",
  TITLE     = "Temporal Feature Enhancement Dilated Convolution Network for Weakly-supervised Temporal Action Localization",
  BOOKTITLE = WACV23,
  YEAR      = "2023",
  PAGES     = "6017--6026",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179501"
}

@inproceedings{bb184031,
  AUTHOR    = "Kang, T.K. and Lee, G.H. and Jin, K.M. and Lee, S.W.",
  TITLE     = "Action-aware Masking Network with Group-based Attention for Temporal Action Localization",
  BOOKTITLE = WACV23,
  YEAR      = "2023",
  PAGES     = "6047--6056",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179502"
}

@inproceedings{bb184032,
  AUTHOR    = "Cao, M. and Yang, T.Y. and Weng, J.W. and Zhang, C. and Wang, J. and Zou, Y.X.",
  TITLE     = "{LocVTP}: Video-Text Pre-training for Temporal Localization",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXVI:38--56",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179503"
}

@inproceedings{bb184033,
  AUTHOR    = "Cheng, F. and Bertasius, G.",
  TITLE     = "{TallFormer}: Temporal Action Localization with a Long-Memory Transformer",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXXIV:503--521",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179504"
}

@inproceedings{bb184034,
  AUTHOR    = "Kim, Y.H. and Kang, H. and Kim, S.J.",
  TITLE     = "A Sliding Window Scheme for Online Temporal Action Localization",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXXIV:653--669",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179505"
}

@inproceedings{bb184035,
  AUTHOR    = "Rao, V. and Khalil, M.I. and Li, H. and Dai, P. and Lu, J.W.",
  TITLE     = "Dual Perspective Network for Audio-Visual Event Localization",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXXIV:689--704",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179506"
}

@inproceedings{bb184036,
  AUTHOR    = "Huang, J. and Jin, H.L. and Gong, S.G. and Liu, Y.",
  TITLE     = "Video Activity Localisation with Uncertainties in Temporal Boundary",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXXIV:724--740",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179507"
}

@inproceedings{bb184037,
  AUTHOR    = "Aakur, S. and Sarkar, S.",
  TITLE     = "Actor-Centered Representations for Action Localization in Streaming Videos",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXXVIII:70--87",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179508"
}

@inproceedings{bb184038,
  AUTHOR    = "Paul, S. and Mithun, N.C. and Roy Chowdhury, A.K.",
  TITLE     = "Text-Based Temporal Localization of Novel Events",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XIV:567--587",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179509"
}

@inproceedings{bb184039,
  AUTHOR    = "Zhang, C.L. and Wu, J.X. and Li, Y.",
  TITLE     = "{ActionFormer}: Localizing Moments of Actions with Transformers",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "IV:492--510",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179510"
}

@inproceedings{bb184040,
  AUTHOR    = "Togashi, R. and Otani, M. and Nakashima, Y. and Rahtu, E. and Heikkila, J. and Sakai, T.",
  TITLE     = "{AxIoU}: An Axiomatically Justified Measure for Video Moment Retrieval",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "21044--21053",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179511"
}

@inproceedings{bb184041,
  AUTHOR    = "Zhang, Y.H. and Doughty, H. and Shao, L. and Snoek, C.G.M.",
  TITLE     = "Audio-Adaptive Activity Recognition Across Video Domains",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "13781--13790",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179512"
}

@inproceedings{bb184042,
  AUTHOR    = "Liu, W.Z. and Tekin, B. and Coskun, H. and Vineet, V. and Fua, P. and Pollefeys, M.",
  TITLE     = "Learning to Align Sequential Actions in the Wild",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "2171--2181",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179513"
}

% bb184043: NOTE(review): "Mulit-view" looks like a misspelling of
% "Multi-view" but may match the title as published; left unchanged -- verify.
@inproceedings{bb184043,
  AUTHOR    = "Li, W. and Chen, S. and Gu, J.Y. and Wang, N. and Chen, C. and Guo, Y.D.",
  TITLE     = "{MV-TAL}: Mulit-view Temporal Action Localization in Naturalistic Driving",
  BOOKTITLE = AICity22,
  YEAR      = "2022",
  PAGES     = "3241--3247",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179514"
}

@inproceedings{bb184044,
  AUTHOR    = "Zhang, C. and Yang, T.Y. and Weng, J. and Cao, M. and Wang, J. and Zou, Y.X.",
  TITLE     = "Unsupervised Pre-training for Temporal Action Localization Tasks",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "14011--14021",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179515"
}

@inproceedings{bb184045,
  AUTHOR    = "Li, J.J. and Yang, T.Y. and Ji, W. and Wang, J. and Cheng, L.",
  TITLE     = "Exploring Denoised Cross-video Contrast for Weakly-supervised Temporal Action Localization",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "19882--19892",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179516"
}

@inproceedings{bb184046,
  AUTHOR    = "He, B. and Yang, X. and Kang, L. and Cheng, Z. and Zhou, X. and Shrivastava, A.",
  TITLE     = "{ASM-Loc}: Action-aware Segment Modeling for Weakly-Supervised Temporal Action Localization",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "13915--13925",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179517"
}

@inproceedings{bb184047,
  AUTHOR    = "Xia, K. and Wang, L. and Zhou, S.P. and Zheng, N.N. and Tang, W.",
  TITLE     = "Learning to Refactor Action and Co-occurrence Features for Temporal Action Localization",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "13874--13883",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179518"
}

@inproceedings{bb184048,
  AUTHOR    = "Bao, W.T. and Yu, Q. and Kong, Y.",
  TITLE     = "{OpenTAL}: Towards Open Set Temporal Action Localization",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "2969--2979",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179519"
}

@inproceedings{bb184049,
  AUTHOR    = "Sridhar, D. and Quader, N. and Muralidharan, S. and Li, Y.X. and Dai, P. and Lu, J.W.",
  TITLE     = "Class Semantics-based Attention for Action Detection",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "13719--13728",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179520"
}

@inproceedings{bb184050,
  AUTHOR    = "Huang, J. and Liu, Y. and Gong, S.G. and Jin, H.L.",
  TITLE     = "Cross-Sentence Temporal and Semantic Relations in Video Activity Localisation",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "7179--7188",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179521"
}

@inproceedings{bb184051,
  AUTHOR    = "Xu, M.M. and Perez Rua, J.M. and Escorcia, V. and Martinez, B. and Zhu, X.T. and Zhang, L. and Ghanem, B. and Xiang, T.",
  TITLE     = "Boundary-sensitive Pre-training for Temporal Localization in Videos",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "7200--7210",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179522"
}

@inproceedings{bb184052,
  AUTHOR    = "Nam, J. and Ahn, D.C. and Kang, D.Y. and Ha, S.J. and Choi, J.H.",
  TITLE     = "Zero-shot Natural Language Video Localization",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "1450--1459",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179523"
}

@inproceedings{bb184053,
  AUTHOR    = "Wang, Y.X. and Gao, D.F. and Yu, L.C. and Lei, W.X. and Feiszli, M. and Shou, M.Z.",
  TITLE     = "{GEB+}: A Benchmark for Generic Event Boundary Captioning, Grounding and Retrieval",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXXV:709--725",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179524"
}

@inproceedings{bb184054,
  AUTHOR    = "Shou, M.Z. and Lei, S.W.X. and Wang, W.Y. and Ghadiyaram, D. and Feiszli, M.",
  TITLE     = "Generic Event Boundary Detection: A Benchmark for Event Segmentation",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "8055--8064",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179525"
}

@inproceedings{bb184055,
  AUTHOR    = "Ju, C. and Zhao, P. and Chen, S. and Zhang, Y. and Wang, Y.F. and Tian, Q.",
  TITLE     = "Divide and Conquer for Single-frame Temporal Action Localization",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "13435--13444",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179526"
}

@inproceedings{bb184056,
  AUTHOR    = "Narayan, S. and Cholakkal, H. and Hayat, M. and Khan, F.S. and Yang, M.H. and Shao, L.",
  TITLE     = "{D2-Net}: Weakly-Supervised Action Localization via Discriminative Embeddings and Denoised Activations",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "13588--13597",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179527"
}

@inproceedings{bb184057,
  AUTHOR    = "Lee, P. and Byun, H.R.",
  TITLE     = "Learning Action Completeness from Points for Weakly-supervised Temporal Action Localization",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "13628--13637",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179528"
}

@inproceedings{bb184058,
  AUTHOR    = "Zhao, C. and Thabet, A. and Ghanem, B.",
  TITLE     = "Video Self-Stitching Graph Network for Temporal Action Localization",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "13638--13647",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179529"
}

@inproceedings{bb184059,
  AUTHOR    = "Kang, H. and Kim, K. and Ko, Y. and Kim, S.J.",
  TITLE     = "{CAG-QIL}: Context-Aware Actionness Grouping via {Q} Imitation Learning for Online Temporal Action Localization",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "13709--13718",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179530"
}

@inproceedings{bb184060,
  AUTHOR    = "Zhang, L.Y. and Radke, R.J.",
  TITLE     = "Natural Language Video Moment Localization Through Query-Controlled Temporal Convolution",
  BOOKTITLE = WACV22,
  YEAR      = "2022",
  PAGES     = "2524--2532",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179531"
}

@inproceedings{bb184061,
  AUTHOR    = "Trehan, S. and Aakur, S.N.",
  TITLE     = "Towards Active Vision for Action Localization with Reactive Control and Predictive Learning",
  BOOKTITLE = WACV22,
  YEAR      = "2022",
  PAGES     = "3391--3400",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179532"
}

@inproceedings{bb184062,
  AUTHOR    = "Lee, J.T. and Jain, M. and Yun, S.",
  TITLE     = "Few-Shot Common Action Localization via Cross-Attentional Fusion of Context and Temporal Dynamics",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "10180--10189",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179533"
}

@inproceedings{bb184063,
  AUTHOR    = "Lee, J.T. and Yun, S.",
  TITLE     = "Multi-Scale Temporal Feature Fusion for Few-Shot Action Recognition",
  BOOKTITLE = ICIP23,
  YEAR      = "2023",
  PAGES     = "1785--1789",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179534"
}

@inproceedings{bb184064,
  AUTHOR    = "Kim, H. and Jain, M. and Lee, J.T. and Yun, S. and Porikli, F.M.",
  TITLE     = "Efficient Action Recognition via Dynamic Knowledge Propagation",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "13699--13708",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179535"
}

@inproceedings{bb184065,
  AUTHOR    = "Lee, J.T. and Yun, S. and Jain, M.",
  TITLE     = "Leaky Gated Cross-Attention for Weakly Supervised Multi-Modal Temporal Action Localization",
  BOOKTITLE = WACV22,
  YEAR      = "2022",
  PAGES     = "817--826",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179536"
}

@inproceedings{bb184066,
  AUTHOR    = "Hsieh, H.Y. and Chen, D.J. and Liu, T.L.",
  TITLE     = "Contextual Proposal Network for Action Localization",
  BOOKTITLE = WACV22,
  YEAR      = "2022",
  PAGES     = "766--775",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179537"
}

@inproceedings{bb184067,
  AUTHOR    = "Cheng, Y. and Sun, Y. and Lin, D.Y. and Lim, J.H.",
  TITLE     = "Action Relational Graph for Weakly-Supervised Temporal Action Localization",
  BOOKTITLE = ICIP21,
  YEAR      = "2021",
  PAGES     = "2563--2567",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179538"
}

@inproceedings{bb184068,
  AUTHOR    = "Biswas, S. and Gall, J.",
  TITLE     = "Multiple Instance Triplet Loss for Weakly Supervised Multi-Label Action Localisation of Interacting Persons",
  BOOKTITLE = DYAD21,
  YEAR      = "2021",
  PAGES     = "2159--2167",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179539"
}

@inproceedings{bb184069,
  AUTHOR    = "Li, Z. and Abu Farha, Y. and Gall, J.",
  TITLE     = "Temporal Action Segmentation from Timestamp Supervision",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "8361--8370",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179540"
}

@inproceedings{bb184070,
  AUTHOR    = "Ma, J.W. and Gorti, S.K. and Volkovs, M. and Yu, G.",
  TITLE     = "Weakly Supervised Action Selection Learning in Video",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "7583--7592",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179541"
}

@inproceedings{bb184071,
  AUTHOR    = "Liu, Y. and Chen, J.Y. and Chen, Z.F. and Deng, B. and Huang, J.Q. and Zhang, H.W.",
  TITLE     = "The Blessings of Unlabeled Background in Untrimmed Videos",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "6172--6181",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179542"
}

@inproceedings{bb184072,
  AUTHOR    = "Li, Z.H. and Yao, L.",
  TITLE     = "Three Birds with One Stone: Multi-Task Temporal Action Detection via Recycling Temporal Annotations",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "4749--4758",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179543"
}

@inproceedings{bb184073,
  AUTHOR    = "Gao, S.H. and Han, Q. and Li, Z.Y. and Peng, P. and Wang, L. and Cheng, M.M.",
  TITLE     = "{Global2Local}: Efficient Structure Search for Video Action Segmentation",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "16800--16809",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179544"
}

@inproceedings{bb184074,
  AUTHOR    = "Liu, X.L. and Hu, Y. and Bai, S. and Ding, F. and Bai, X. and Torr, P.H.S.",
  TITLE     = "Multi-shot Temporal Event Localization: a Benchmark",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "12591--12601",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179545"
}

@inproceedings{bb184075,
  AUTHOR    = "Wang, H. and Zha, Z.J. and Li, L. and Liu, D. and Luo, J.B.",
  TITLE     = "Structured Multi-Level Interaction Network for Video Moment Localization via Language Query",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "7022--7031",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179546"
}

@inproceedings{bb184076,
  AUTHOR    = "Lin, C.M. and Xu, C.M. and Luo, D.H. and Wang, Y.B. and Tai, Y. and Wang, C.J. and Li, J.L. and Huang, F.Y. and Fu, Y.W.",
  TITLE     = "Learning Salient Boundary Feature for Anchor-free Temporal Action Localization",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "3319--3328",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179547"
}

@inproceedings{bb184077,
  AUTHOR    = "Tirupattur, P. and Duarte, K. and Rawat, Y.S. and Shah, M.",
  TITLE     = "Modeling Multi-Label Action Dependencies for Temporal Action Localization",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "1460--1470",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179548"
}

% bb184078: two garbled author names repaired. The record read
% "Lopcz Sastrc, R.J." (now "Lopez Sastre, R.J.") and "Rodriguez, F.J. .A."
% (now "Acevedo Rodriguez, F.J."; the stray " .A." token was not a valid
% initial). NOTE(review): confirm both against the published author list.
@inproceedings{bb184078,
  AUTHOR    = "Lopez Sastre, R.J. and Baptista Rios, M. and Acevedo Rodriguez, F.J. and Martin Martin, P. and Maldonado Bascon, S.",
  TITLE     = "Live Video Action Recognition from Unsupervised Action Proposals",
  BOOKTITLE = MVA21,
  YEAR      = "2021",
  PAGES     = "1--6",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179549"
}

@inproceedings{bb184079,
  AUTHOR    = "Tan, R. and Xu, H.J. and Saenko, K. and Plummer, B.A.",
  TITLE     = "{LoGAN}: Latent Graph Co-Attention Network for Weakly-Supervised Video Moment Retrieval",
  BOOKTITLE = WACV21,
  YEAR      = "2021",
  PAGES     = "2082--2091",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179550"
}

@inproceedings{bb184080,
  AUTHOR    = "Rodriguez Opazo, C. and Marrese Taylor, E. and Fernando, B. and Li, H.D. and Gould, S.",
  TITLE     = "{DORi}: Discovering Object Relationships for Moment Localization of a Natural Language Query in a Video",
  BOOKTITLE = WACV21,
  YEAR      = "2021",
  PAGES     = "1078--1087",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179551"
}

@inproceedings{bb184081,
  AUTHOR    = "Pardo, A. and Alwassel, H. and Heilbron, F.C. and Thabet, A. and Ghanem, B.",
  TITLE     = "{RefineLoc}: Iterative Refinement for Weakly-Supervised Action Localization",
  BOOKTITLE = WACV21,
  YEAR      = "2021",
  PAGES     = "3318--3327",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179552"
}

@inproceedings{bb184082,
  AUTHOR    = "Rotsidis, A. and Lutteroth, C. and Hall, P. and Richardt, C.",
  TITLE     = "{ExMaps}: Long-Term Localization in Dynamic Scenes using Exponential Decay",
  BOOKTITLE = WACV21,
  YEAR      = "2021",
  PAGES     = "2866--2875",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179553"
}

@inproceedings{bb184083,
  AUTHOR    = "Vaudaux Ruth, G. and Tong, A.C.H. and Achard, C.",
  TITLE     = "{SALAD}: Self-Assessment Learning for Action Detection",
  BOOKTITLE = WACV21,
  YEAR      = "2021",
  PAGES     = "1268--1277",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179554"
}

@inproceedings{bb184084,
  AUTHOR    = "Vaudaux Ruth, G. and Tong, A.C.H. and Achard, C.",
  TITLE     = "{ActionSpotter}: Deep Reinforcement Learning Framework for Temporal Action Spotting in Videos",
  BOOKTITLE = ICPR21,
  YEAR      = "2021",
  PAGES     = "631--638",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179555"
}

@inproceedings{bb184085,
  AUTHOR    = "Lu, C.K. and Li, R. and Fu, H. and Fu, B. and Wang, Y.H. and Lo, W.L. and Chi, Z.",
  TITLE     = "Precise Temporal Localization for Complete Actions with Quantified Temporal Structure",
  BOOKTITLE = ICPR21,
  YEAR      = "2021",
  PAGES     = "4781--4788",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179556"
}

% bb184086: NOTE(review): the second author's initials "Y.C.A.F." look
% unusual; left unchanged -- verify against the published author list.
@inproceedings{bb184086,
  AUTHOR    = "Lin, Y.B. and Wang, Y.C.A.F.",
  TITLE     = "Audiovisual Transformer with Instance Attention for Audio-visual Event Localization",
  BOOKTITLE = ACCV20,
  YEAR      = "2020",
  PAGES     = "VI:274--290",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179557"
}

@inproceedings{bb184087,
  AUTHOR    = "Long, F. and Yao, T. and Qiu, Z.F. and Tian, X.M. and Luo, J.B. and Mei, T.",
  TITLE     = "Learning to Localize Actions from Moments",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "III:137--154",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179558"
}

@inproceedings{bb184088,
  AUTHOR    = "Min, K. and Corso, J.J.",
  TITLE     = "Adversarial Background-aware Loss for Weakly-supervised Temporal Activity Localization",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "XIV:283--299",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179559"
}

@inproceedings{bb184089,
  AUTHOR    = "Aakur, S. and Sarkar, S.",
  TITLE     = "Action Localization Through Continual Predictive Learning",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "XIV:300--317",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179560"
}

@inproceedings{bb184090,
  AUTHOR    = "Chen, S.X. and Jiang, Y.G.",
  TITLE     = "Hierarchical Visual-textual Graph for Temporal Activity Localization via Language",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "XX:601--618",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179561"
}

@inproceedings{bb184091,
  AUTHOR    = "Yang, P.W. and Hu, V.T. and Mettes, P.S. and Snoek, C.G.M.",
  TITLE     = "Localizing the Common Action Among a Few Videos",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "VII:505--521",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179562"
}

@inproceedings{bb184092,
  AUTHOR    = "Toering, M. and Gatopoulos, I. and Stol, M. and Hu, V.T.",
  TITLE     = "Self-supervised Video Representation Learning with Cross-Stream Prototypical Contrasting",
  BOOKTITLE = WACV22,
  YEAR      = "2022",
  PAGES     = "846--856",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179563"
}

@inproceedings{bb184093,
  AUTHOR    = "Yoon, S. and Hong, J.W. and Yoon, E. and Kim, D. and Kim, J.Y. and Yoon, H.S. and Yoo, C.D.",
  TITLE     = "Selective Query-Guided Debiasing for Video Corpus Moment Retrieval",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXXVI:185--200",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179564"
}

@inproceedings{bb184094,
  AUTHOR    = "Yoon, S. and Koo, G. and Kim, D. and Yoo, C.D.",
  TITLE     = "{SCANet}: Scene Complexity Aware Network for Weakly-Supervised Video Moment Retrieval",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "13530--13540",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179565"
}

@inproceedings{bb184095,
  AUTHOR    = "Yoon, S. and Kim, D. and Hong, J.W. and Kim, J.Y. and Kim, K. and Yoo, C.D.",
  TITLE     = "Weakly-Supervised Moment Retrieval Network for Video Corpus Moment Retrieval",
  BOOKTITLE = ICIP21,
  YEAR      = "2021",
  PAGES     = "534--538",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179566"
}

@inproceedings{bb184096,
  AUTHOR    = "Ma, M. and Yoon, S. and Kim, J.Y. and Lee, Y.J. and Kang, S.H. and Yoo, C.D.",
  TITLE     = "{VLANet}: Video-language Alignment Network for Weakly-supervised Video Moment Retrieval",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "XXVIII:156--171",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179567"
}

@inproceedings{bb184097,
  AUTHOR    = "Luo, Z.K. and Guillory, D. and Shi, B.F. and Ke, W. and Wan, F. and Darrell, T.J. and Xu, H.J.",
  TITLE     = "Weakly-supervised Action Localization with Expectation-maximization Multi-instance Learning",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "XXIX:729--745",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179568"
}

@inproceedings{bb184098,
  AUTHOR    = "Kanth, R.K. and Ramaswamy, A. and Kumar, A.A. and Gubbi, J. and Balamuralidhar, P.",
  TITLE     = "{STP-Net}: Spatio-Temporal Polarization Network for action recognition using polarimetric videos",
  BOOKTITLE = ComputationalApp22,
  YEAR      = "2022",
  PAGES     = "767--776",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179569"
}

@inproceedings{bb184099,
  AUTHOR    = "Ramaswamy, A. and Seemakurthy, K. and Gubbi, J. and Balamuralidhar, P.",
  TITLE     = "Video action re-localization using spatio-temporal correlation",
  BOOKTITLE = Activity22,
  YEAR      = "2022",
  PAGES     = "192--201",
  BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT179570"
}