Keith Price Bibliography Bibtex Entry (ANCHOR 209100 URL http://dx.doi.org/10.1016/j.patcog.2025.111421 PAGES 111421 YEAR 2025 MONTH NIL BIBSOURCE http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204417 VOLUME 162 JOURNAL PR AUTHOR Liu, Y.Y. and Zhou, N. and Huang, Y.X. and Liu, S.Y. and Liu, L.Y. and Zhou, W. and Tang, C. and Wang, K. TITLE Beyond boundaries: Hierarchical-contrast unsupervised temporal action localization with high-coupling feature learning)


@article{bb209100,
        AUTHOR = "Liu, Y. Y. and Zhou, N. and Huang, Y. X. and Liu, S. Y. and Liu, L. Y. and Zhou, W. and Tang, C. and Wang, K.",
        TITLE = "Beyond boundaries: Hierarchical-contrast unsupervised temporal action
localization with high-coupling feature learning",
        JOURNAL = PR,
        VOLUME = "162",
        YEAR = "2025",
        PAGES = "111421",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204417"}

@article{bb209101,
        AUTHOR = "Sheng, J. R. and Li, A. and Ge, Y. X.",
        TITLE = "Summarized knowledge guidance for single-frame temporal action
localization",
        JOURNAL = PRL,
        VOLUME = "191",
        YEAR = "2025",
        PAGES = "31--36",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204418"}

@article{bb209102,
        AUTHOR = "Sun, C. and Chen, M. and Zhu, C. B. and Zhang, S. and Lu, P. and Chen, J. C.",
        TITLE = "Listen With Seeing: Cross-Modal Contrastive Learning for Audio-Visual
Event Localization",
        JOURNAL = MultMed,
        VOLUME = "27",
        YEAR = "2025",
        PAGES = "2650--2665",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204419"}

@article{bb209103,
        AUTHOR = "Liu, Y. and Wu, Q. and Zeng, M. and Liu, Y. and Pan, Y. Y.",
        TITLE = "{FASTEN}: Video Event Localization Based on Audio-Visual Feature
Alignment and Multi-Scale Temporal Enhancement",
        JOURNAL = SPLetters,
        VOLUME = "32",
        YEAR = "2025",
        PAGES = "2010--2014",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204420"}

@article{bb209104,
        AUTHOR = "Zhang, L. and Song, P. P. and Duan, Z. L. and Wang, S. and Chang, X. J. and Yang, X.",
        TITLE = "Video Corpus Moment Retrieval With Query-Specific Context Learning
and Progressive Localization",
        JOURNAL = CirSysVideo,
        VOLUME = "35",
        YEAR = "2025",
        NUMBER = "6",
        MONTH = jun,
        PAGES = "5659--5670",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204421"}

@article{bb209105,
        AUTHOR = "Zhou, W. and Lin, K. and Hu, W. P. and Xie, C. and Su, T. and Hu, H. F. and Tan, Y. P.",
        TITLE = "Snippet-Inter Difference Attention Network for Weakly-Supervised
Temporal Action Localization",
        JOURNAL = MultMed,
        VOLUME = "27",
        YEAR = "2025",
        PAGES = "3610--3624",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204422"}

@article{bb209106,
        AUTHOR = "Li, J. X. and Ma, T. C. and Yang, X. H. and Yang, L. J. and Zheng, C.",
        TITLE = "Video Complicated-Information Extraction and Filtering Network for
Weakly-Supervised Temporal Action Localization",
        JOURNAL = SPLetters,
        VOLUME = "32",
        YEAR = "2025",
        PAGES = "2334--2338",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204423"}

% The superscripts in the model name are set in math mode: a bare caret in
% text mode makes LaTeX stop with "Missing $ inserted".
@article{bb209107,
        AUTHOR = "Gao, Z. L. and Wang, Q. L. and Zhang, B. B. and Hu, Q. H. and Li, P. H.",
        TITLE = "{A$^2$M$^2$-Net}: Adaptively Aligned Multi-Scale Moment for Few-Shot Action
Recognition",
        JOURNAL = IJCV,
        VOLUME = "133",
        YEAR = "2025",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "5363--5378",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204424"}

@article{bb209108,
        AUTHOR = "Liu, H. M. and Li, X. and Fan, B. and Xu, J. L.",
        TITLE = "{BRTAL}: Boundary Refinement Temporal Action Localization via
Offset-Driven Diffusion Models",
        JOURNAL = CirSysVideo,
        VOLUME = "35",
        YEAR = "2025",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "8174--8186",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204425"}

@article{bb209109,
        AUTHOR = "Zhang, P. and Shi, P. and He, X.",
        TITLE = "Audio-Visual Event Localization With Cross Co-Attention and Dynamic
Audio-Object Semantic Alignment",
        JOURNAL = SPLetters,
        VOLUME = "32",
        YEAR = "2025",
        PAGES = "3152--3156",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204426"}

@article{bb209110,
        AUTHOR = "Zhang, J. and Yu, Y. and Mao, Y. and Ren, Y. G.",
        TITLE = "Event-level multimodal feature fusion for audio-visual event
localization",
        JOURNAL = IVC,
        VOLUME = "161",
        YEAR = "2025",
        PAGES = "105610",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204427"}

@article{bb209111,
        AUTHOR = "Geng, T. T. and Wang, T. and Duan, J. M. and Zhang, Y. and Guan, W. and Zheng, F. and Shao, L.",
        TITLE = "{UniAV}: Unified Audio-Visual Perception for Multi-Task Video Event
Localization",
        JOURNAL = PAMI,
        VOLUME = "47",
        YEAR = "2025",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "10280--10294",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204428"}

@article{bb209112,
        AUTHOR = "Feng, Q. and Li, W. and Lin, T. and Chen, X. H.",
        TITLE = "Full-Stage Pseudo Label Quality Enhancement for Weakly-Supervised
Temporal Action Localization",
        JOURNAL = CirSysVideo,
        VOLUME = "35",
        YEAR = "2025",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "11144--11157",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204429"}

@article{bb209113,
        AUTHOR = "Gao, J. and Zhou, S. P. and Yu, H. and Li, C. Y. and Hu, X. X.",
        TITLE = "{SCESS-Net}: Semantic consistency enhancement and segment selection
network for audio-visual event localization",
        JOURNAL = CVIU,
        VOLUME = "262",
        YEAR = "2025",
        PAGES = "104551",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204430"}

@article{bb209114,
        AUTHOR = "Xu, J. L. and Zhang, Y. Q. and Zhou, W. H. and Liu, H. M.",
        TITLE = "{BFSTAL}: Bidirectional Feature Splitting With Cross-Layer Fusion for
Temporal Action Localization",
        JOURNAL = CirSysVideo,
        VOLUME = "35",
        YEAR = "2025",
        NUMBER = "12",
        MONTH = dec,
        PAGES = "12707--12718",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204431"}

@article{bb209115,
        AUTHOR = "Li, J. H. and Wei, K. and Xu, Z. and Wang, L. and Deng, C.",
        TITLE = "Robust Temporal Action Localization With Meta Boundary Refinement",
        JOURNAL = MultMed,
        VOLUME = "27",
        YEAR = "2025",
        PAGES = "9240--9251",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204432"}

@article{bb209116,
        AUTHOR = "Liu, L. and Li, S. Y. and Zhu, Y. Q. and Dai, Z. X.",
        TITLE = "Modality-Aware Gated Attention Network for Audio-Visual Event
Localization",
        JOURNAL = MultMed,
        VOLUME = "28",
        YEAR = "2026",
        PAGES = "1601--1612",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204433"}

@inproceedings{bb209117,
        AUTHOR = "Liu, L. and Li, S. Y. and Zhu, Y. Q.",
        TITLE = "Audio-Visual Semantic Graph Network for Audio-Visual Event
Localization",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "23957--23966",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204434"}

@article{bb209118,
        AUTHOR = "Yu, Y. and Wang, C. and Shi, Y. X.",
        TITLE = "Enhancing temporal action localization through cross-modal and
cross-structural knowledge distillation",
        JOURNAL = JVCIR,
        VOLUME = "116",
        YEAR = "2026",
        PAGES = "104734",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204435"}

@article{bb209119,
        AUTHOR = "Kim, J. and Choi, J. and Jeon, Y. and Heo, J. P.",
        TITLE = "Boundary-recovering network for temporal action detection",
        JOURNAL = PR,
        VOLUME = "176",
        YEAR = "2026",
        PAGES = "113141",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204436"}

@inproceedings{bb209120,
        AUTHOR = "Lee, S. B. and Moon, W. J. and Seong, H. S. and Heo, J. P.",
        TITLE = "Temporal Alignment-Free Video Matching for Few-Shot Action
Recognition",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "5412--5421",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204437"}

% NOTE(review): title changed from "Query: Dependent ..." to "Query-Dependent ...";
% the colon looks like a mangled hyphen. Confirm against the CVPR23 proceedings.
@inproceedings{bb209121,
        AUTHOR = "Moon, W. J. and Hyun, S. and Park, S. U. and Park, D. and Heo, J. P.",
        TITLE = "Query-Dependent Video Representation for Moment Retrieval and
Highlight Detection",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "23023--23033",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204438"}

@inproceedings{bb209122,
        AUTHOR = "Bunn, C. and Li, W. Q. and Yang, J.",
        TITLE = "Re-Purposing {Segment Anything} For Skeleton Action Localization",
        BOOKTITLE = ICIP25,
        YEAR = "2025",
        PAGES = "1678--1683",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204439"}

@inproceedings{bb209123,
        AUTHOR = "Chen, X. Y. and Guo, Y. and Liang, J. M. and Zhuang, S. T. and Zeng, R. and Hu, X. P.",
        TITLE = "Temporal Action Detection Model Compression by Progressive Block Drop",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "29225--29236",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204440"}

@inproceedings{bb209124,
        AUTHOR = "Khosla, S. and V, S. T. and Schwing, A. and Hoiem, D.",
        TITLE = "Relocate: A Simple Training-Free Baseline for Visual Query
Localization Using Region-Based Representations",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "3697--3706",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204441"}

@inproceedings{bb209125,
        AUTHOR = "Xia, R. and Jiang, D. and Zhang, Q. and Zhang, K. and Yuan, C.",
        TITLE = "{CLIP-AE}: Clip-Assisted Cross-View Audio-Visual Enhancement for
Unsupervised Temporal Action Localization",
        BOOKTITLE = ICIP25,
        YEAR = "2025",
        PAGES = "2014--2018",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204442"}

@inproceedings{bb209126,
        AUTHOR = "Zhang, Q. and Fang, J. and Yuan, R. and Tang, X. and Qi, Y. X. and Zhang, K. and Yuan, C.",
        TITLE = "Weakly Supervised Temporal Action Localization via Dual-Prior
Collaborative Learning Guided by Multimodal Large Language Models",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "24139--24148",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204443"}

@inproceedings{bb209127,
        AUTHOR = "Liu, M. and Wang, L. and Zhou, S. P. and Xia, K. and Sun, X. L. and Hua, G.",
        TITLE = "Boosting Point-Supervised Temporal Action Localization through
Integrating Query Reformation and Optimal Transport",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "13865--13875",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204444"}

@inproceedings{bb209128,
        AUTHOR = "Zhang, G. and Fok, M. L. A. and Ma, J. and Xia, Y. and Cremers, D. and Torr, P. and Tresp, V. and Gu, J. D.",
        TITLE = "Localizing Events in Videos with Multimodal Queries",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "3339--3351",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204445"}

@inproceedings{bb209129,
        AUTHOR = "Zhou, J. X. and Guo, D. and Guo, R. and Mao, Y. X. and Hu, J. J. and Zhong, Y. R. and Chang, X. J. and Wang, M.",
        TITLE = "Towards Open-Vocabulary Audio-Visual Event Localization",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "8362--8371",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204446"}

@inproceedings{bb209130,
        AUTHOR = "Liu, Z. and Liu, Y.",
        TITLE = "Bridge the Gap: From Weak to Full Supervision for Temporal Action
Localization with {PseudoFormer}",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "8711--8720",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204447"}

@inproceedings{bb209131,
        AUTHOR = "Diko, A. and Wang, T. and Swaileh, W. and Sun, S. Y. and Patras, I.",
        TITLE = "{ReWind}: Understanding Long Videos with Instructed Learnable Memory",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "13734--13743",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204448"}

@inproceedings{bb209132,
        AUTHOR = "Hyun, J. and Han, S. H. and Kang, H. and Lee, J. Y. and Kim, S. J.",
        TITLE = "Exploring Scalability of Self-Training for Open-Vocabulary Temporal
Action Localization",
        BOOKTITLE = WACV25,
        YEAR = "2025",
        PAGES = "9406--9415",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204449"}

@inproceedings{bb209133,
        AUTHOR = "Bao, W. T. and Li, K. and Chen, Y. X. and Patel, D. and Min, M. R. Q. and Kong, Y.",
        TITLE = "Exploiting {VLM} Localizability and Semantics for Open Vocabulary
Action Detection",
        BOOKTITLE = WACV25,
        YEAR = "2025",
        PAGES = "8291--8301",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204450"}

@inproceedings{bb209134,
        AUTHOR = "Gupta, A. and Mittal, G. and Magooda, A. and Yu, Y. and Taylor, G. W. and Chen, M.",
        TITLE = "{LoSA}: Long-Short-Range Adapter for Scaling End-to-End Temporal Action
Localization",
        BOOKTITLE = WACV25,
        YEAR = "2025",
        PAGES = "2092--2102",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204451"}

@inproceedings{bb209135,
        AUTHOR = "Pujol Perich, D. and Clapes, A. and Escalera, S.",
        TITLE = "{SADA}: Semantic Adversarial Unsupervised Domain Adaptation for
Temporal Action Localization",
        BOOKTITLE = WACV25,
        YEAR = "2025",
        PAGES = "9237--9247",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204452"}

@inproceedings{bb209136,
        AUTHOR = "Abdullah, H. M. and Liu, T. and Wei, K. and Kong, S. and Huang, R.",
        TITLE = "{UAL-Bench}: The First Comprehensive Unusual Activity Localization
Benchmark",
        BOOKTITLE = WACV25,
        YEAR = "2025",
        PAGES = "5801--5811",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204453"}

% NOTE(review): model name re-cased from "Dyfadet" to "DyFADet" and brace-protected;
% confirm the casing against the ECCV24 proceedings.
@inproceedings{bb209137,
        AUTHOR = "Yang, L. and Zheng, Z. W. and Han, Y. Z. and Cheng, H. and Song, S. and Huang, G. and Li, F.",
        TITLE = "{DyFADet}: Dynamic Feature Aggregation for Temporal Action Detection",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "XLVI: 305--322",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204454"}

% NOTE(review): model name re-cased from "Unimd" to "UniMD" and brace-protected;
% confirm the casing against the ECCV24 proceedings.
@inproceedings{bb209138,
        AUTHOR = "Zeng, Y. S. and Zhong, Y. J. and Feng, C. J. and Ma, L.",
        TITLE = "{UniMD}: Towards Unifying Moment Retrieval and Temporal Action Detection",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "XLVI: 286--304",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204455"}

@inproceedings{bb209139,
        AUTHOR = "Liu, M. N. and Wang, L. and Zhou, S. P. and Xia, K. and Wu, Q. and Zhang, Q. and Hua, G.",
        TITLE = "Stepwise Multi-grained Boundary Detector for Point-supervised Temporal
Action Localization",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "VII: 333--349",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204456"}

@inproceedings{bb209140,
        AUTHOR = "Kwon, D. and Kim, I. H. and Kwak, S.",
        TITLE = "Boosting Semi-Supervised Video Action Detection with Temporal Context",
        BOOKTITLE = WACV25,
        YEAR = "2025",
        PAGES = "847--858",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204457"}

@inproceedings{bb209141,
        AUTHOR = "Lee, J. and Kim, T. and Lee, I. and Shim, M. H. and Wee, D. Y. and Cho, M. and Kwak, S.",
        TITLE = "Classification Matters: Improving Video Action Detection with
Class-specific Attention",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "XX: 450--467",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204458"}

@inproceedings{bb209142,
        AUTHOR = "Song, Y. K. and Kim, D. K. and Cho, M. and Kwak, S.",
        TITLE = "Online Temporal Action Localization with Memory-augmented Transformer",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "XIX: 74--91",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204459"}

% NOTE(review): acronym re-cased from "Hat" to "HAT" and brace-protected;
% confirm the casing against the ECCV24 proceedings.
@inproceedings{bb209143,
        AUTHOR = "Reza, S. and Zhang, Y. X. and Moghaddam, M. and Camps, O.",
        TITLE = "{HAT}: History-augmented Anchor Transformer for Online Temporal Action
Localization",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "XXI: 205--222",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204460"}

@inproceedings{bb209144,
        AUTHOR = "Zhou, F. X. and Williams, B. and Rahmani, H.",
        TITLE = "Towards Adaptive Pseudo-label Learning for Semi-supervised Temporal
Action Localization",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "LXII: 320--338",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204461"}

% NOTE(review): acronym re-cased from "Lita" to "LITA" and brace-protected;
% confirm the casing against the ECCV24 proceedings.
@inproceedings{bb209145,
        AUTHOR = "Huang, D. A. and Liao, S. and Radhakrishnan, S. and Yin, H. X. and Molchanov, P. and Yu, Z. and Kautz, J.",
        TITLE = "{LITA}: Language Instructed Temporal-localization Assistant",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "LXIV: 202--218",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204462"}

@inproceedings{bb209146,
        AUTHOR = "Rahman, M. S. and Shihab, I. F. and Chu, L. and Sharma, A.",
        TITLE = "{DeepLocalization}: Using change point detection for Temporal Action
Localization",
        BOOKTITLE = AICity24,
        YEAR = "2024",
        PAGES = "7252--7260",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204463"}

@inproceedings{bb209147,
        AUTHOR = "Liberatori, B. and Conti, A. and Rota, P. and Wang, Y. M. and Ricci, E.",
        TITLE = "Test-Time Zero-Shot Temporal Action Localization",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "18720--18729",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204464"}

% NOTE(review): first author changed from "Ntinoutl" to "Ntinou"; the trailing
% "tl" looks like a footnote marker absorbed during extraction. Confirm against
% the CVPR24 proceedings.
@inproceedings{bb209148,
        AUTHOR = "Ntinou, I. and Sanchez, E. and Tzimiropoulos, G.",
        TITLE = "Multiscale Vision Transformers Meet Bipartite Matching for Efficient
Single-Stage Action Localization",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "18827--18836",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204465"}

@inproceedings{bb209149,
        AUTHOR = "Gritsenko, A. A. and Xiong, X. and Djolonga, J. and Dehghani, M. and Sun, C. and Lucic, M. and Schmid, C. and Arnab, A.",
        TITLE = "End-to-End Spatio-Temporal Action Localisation with Video
Transformers",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "18373--18383",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204466"}

@inproceedings{bb209150,
        AUTHOR = "Yang, A. and Miech, A. and Sivic, J. and Laptev, I. and Schmid, C.",
        TITLE = "{TubeDETR}: Spatio-Temporal Video Grounding with Transformers",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "16421--16432",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204467"}

@inproceedings{bb209151,
        AUTHOR = "Zhang, Z. J. and Palmero, C. and Escalera, S.",
        TITLE = "{DualH}: A Dual Hierarchical Model for Temporal Action Localization",
        BOOKTITLE = FG24,
        YEAR = "2024",
        PAGES = "1--10",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204468"}

@inproceedings{bb209152,
        AUTHOR = "Denize, J. and Liashuha, M. and Rabarisoa, J. and Orcesi, A. and Herault, R.",
        TITLE = "{COMEDIAN}: Self-Supervised Learning and Knowledge Distillation for
Action Spotting Using Transformers",
        BOOKTITLE = Pretrain24,
        YEAR = "2024",
        PAGES = "518--528",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204469"}

@inproceedings{bb209153,
        AUTHOR = "Rahman, M. A. and Laganiere, R.",
        TITLE = "Spatio-Temporal Activity Detection via Joint Optimization of Spatial
and Temporal Localization",
        BOOKTITLE = RWSurvil24,
        YEAR = "2024",
        PAGES = "242--250",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204470"}

@inproceedings{bb209154,
        AUTHOR = "Mondal, A. and Nag, S. and Prada, J. M. and Zhu, X. T. and Dutta, A.",
        TITLE = "Actor-agnostic Multi-label Action Recognition with Multi-modal Query",
        BOOKTITLE = NIVT23,
        YEAR = "2023",
        PAGES = "784--794",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204471"}

@inproceedings{bb209155,
        AUTHOR = "Warchocki, J. and Oprescu, T. and Wang, Y. H. and Damacus, A. and Misterka, P. and Bruintjes, R. J. and Lengyel, A. and Strafforello, O. and van Gemert, J. C.",
        TITLE = "Benchmarking Data Efficiency and Computational Efficiency of Temporal
Action Localization Models",
        BOOKTITLE = CVEU23,
        YEAR = "2023",
        PAGES = "3000--3008",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204472"}

@inproceedings{bb209156,
        AUTHOR = "Heigold, G. and Keysers, D. and Minderer, M. and Lucic, M. and Gritsenko, A. and Yu, F. and Bewley, A. and Kipf, T.",
        TITLE = "Video {OWL-ViT}: Temporally-consistent open-world localization in video",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "13756--13765",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204473"}

@inproceedings{bb209157,
        AUTHOR = "Shao, J. Y. and Wang, X. H. and Quan, R. J. and Zheng, J. J. and Yang, J. and Yang, Y.",
        TITLE = "Action Sensitivity Learning for Temporal Action Localization",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "13411--13423",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204474"}

@inproceedings{bb209158,
        AUTHOR = "Barrios, W. and Soldan, M. and Ceballos Arroyo, A. M. and Heilbron, F. C. and Ghanem, B.",
        TITLE = "Localizing Moments in Long Video Via Multimodal Guidance",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "13621--13632",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204475"}

@inproceedings{bb209159,
        AUTHOR = "Shah, A. and Lundell, B. and Sawhney, H. and Chellappa, R.",
        TITLE = "{STEPs}: Self-Supervised Key Step Extraction and Localization from
Unlabeled Procedural Videos",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "10341--10353",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204476"}

@inproceedings{bb209160,
        AUTHOR = "Croitoru, I. and Bogolin, S. V. and Albanie, S. and Liu, Y. and Wang, Z. W. and Yoon, S. H. and Dernoncourt, F. and Jin, H. L. and Bui, T.",
        TITLE = "Moment Detection in Long Tutorial Videos",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "2594--2604",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204477"}

@inproceedings{bb209161,
        AUTHOR = "Xia, K. and Wang, L. and Zhou, S. P. and Hua, G. and Tang, W.",
        TITLE = "Learning from Noisy Pseudo Labels for Semi-Supervised Temporal Action
Localization",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "10126--10135",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204478"}

@inproceedings{bb209162,
        AUTHOR = "Geng, T. T. and Wang, T. and Duan, J. M. and Cong, R. M. and Zheng, F.",
        TITLE = "Dense-Localizing Audio-Visual Events in Untrimmed Videos:
A Large-Scale Benchmark and Baseline",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "22942--22951",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204479"}

@inproceedings{bb209163,
        AUTHOR = "Zheng, W. R. and Yoshihashi, R. and Kawakami, R. and Sato, I. and Kanezaki, A.",
        TITLE = "Multi Event Localization by Audio-Visual Fusion with Omnidirectional
Camera and Microphone Array",
        BOOKTITLE = MULA23,
        YEAR = "2023",
        PAGES = "2566--2574",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204480"}

@inproceedings{bb209164,
        AUTHOR = "Cao, S. Q. and Luo, W. X. and Wang, B. and Zhang, W. and Ma, L.",
        TITLE = "{E2E-LOAD}: End-to-End Long-form Online Action Detection",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "10388--10398",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204481"}

% NOTE(review): fifth author changed from "Lit, J." to "Li, J."; the trailing "t"
% looks like a footnote marker absorbed during extraction. Confirm against the
% CVPR23 proceedings.
@inproceedings{bb209165,
        AUTHOR = "Shi, D. F. and Zhong, Y. J. and Cao, Q. and Ma, L. and Li, J. and Tao, D. C.",
        TITLE = "{TriDet}: Temporal Action Detection with Relative Boundary Modeling",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "18857--18866",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204482"}

@inproceedings{bb209166,
        AUTHOR = "Zala, A. and Cho, J. and Kottur, S. and Chen, X. and Oguz, B. and Mehdad, Y. and Bansal, M.",
        TITLE = "Hierarchical Video-Moment Retrieval and Step-Captioning",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "23056--23065",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204483"}

@inproceedings{bb209167,
        AUTHOR = "Chi, H. G. and Lee, K. and Agarwal, N. and Xu, Y. and Ramani, K. and Choi, C.",
        TITLE = "{AdamsFormer} for Spatial Action Localization in the Future",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "17885--17895",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204484"}

@inproceedings{bb209168,
        AUTHOR = "Zhao, C. and Liu, S. M. and Mangalam, K. and Ghanem, B.",
        TITLE = "{Re2TAL}: Rewiring Pretrained Video Backbones for Reversible Temporal
Action Localization",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "10637--10647",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204485"}

@inproceedings{bb209169,
        AUTHOR = "Kang, H. and Kim, H. and An, J. B. and Cho, M. and Kim, S. J.",
        TITLE = "Soft-Landing Strategy for Alleviating the Task Discrepancy Problem in
Temporal Action Localization Tasks",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "6514--6523",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204486"}

@inproceedings{bb209170,
        AUTHOR = "Seol, M. and Kim, J. and Moon, J.",
        TITLE = "{BMRN}: Boundary Matching and Refinement Network for Temporal Moment
Localization with Natural Language",
        BOOKTITLE = ODRUM23,
        YEAR = "2023",
        PAGES = "5571--5579",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204487"}

@inproceedings{bb209171,
        AUTHOR = "Niu, Y. R. and Yang, J. Y. and Liang, C. and Huang, B. and Wang, Z. Y.",
        TITLE = "A Spatio-Temporal Identity Verification Method for Person-Action
Instance Search in Movies",
        BOOKTITLE = MMMod23,
        YEAR = "2023",
        PAGES = "I: 82--94",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204488"}

@inproceedings{bb209172,
        AUTHOR = "Rai, A. K. and Krishna, T. and Dietlmeier, J. and McGuinness, K. and Smeaton, A. F. and O'Connor, N. E.",
        TITLE = "Motion Aware Self-Supervision for Generic Event Boundary Detection",
        BOOKTITLE = WACV23,
        YEAR = "2023",
        PAGES = "2727--2738",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204489"}

@inproceedings{bb209173,
        AUTHOR = "Mahmud, T. and Marculescu, D.",
        TITLE = "{AVE-CLIP}: {AudioCLIP}-based Multi-window Temporal Transformer for Audio
Visual Event Localization",
        BOOKTITLE = WACV23,
        YEAR = "2023",
        PAGES = "5147--5156",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204490"}

@inproceedings{bb209174,
        AUTHOR = "Kim, H. J. and Lee, Y. and Hong, J. H. and Lee, S. W.",
        TITLE = "{DiGIT}: Multi-Dilated Gated Encoder and Central-Adjacent Region
Integrated Decoder for Temporal Action Detection Transformer",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "24286--24296",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204491"}

@inproceedings{bb209175,
        AUTHOR = "Kang, T. K. and Lee, G. H. and Jin, K. M. and Lee, S. W.",
        TITLE = "Action-aware Masking Network with Group-based Attention for Temporal
Action Localization",
        BOOKTITLE = WACV23,
        YEAR = "2023",
        PAGES = "6047--6056",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204492"}

@inproceedings{bb209176,
        AUTHOR = "Cao, M. and Yang, T. Y. and Weng, J. W. and Zhang, C. and Wang, J. and Zou, Y. X.",
        TITLE = "{LocVTP}: Video-Text Pre-training for Temporal Localization",
        BOOKTITLE = ECCV22,
        YEAR = "2022",
        PAGES = "XXVI:38--56",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204493"}

@inproceedings{bb209177,
        AUTHOR = "Cheng, F. and Bertasius, G.",
        TITLE = "{TallFormer}: Temporal Action Localization with a Long-Memory Transformer",
        BOOKTITLE = ECCV22,
        YEAR = "2022",
        PAGES = "XXXIV:503--521",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204494"}

@inproceedings{bb209178,
        AUTHOR = "Kim, Y. H. and Kang, H. and Kim, S. J.",
        TITLE = "A Sliding Window Scheme for Online Temporal Action Localization",
        BOOKTITLE = ECCV22,
        YEAR = "2022",
        PAGES = "XXXIV:653--669",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204495"}

@inproceedings{bb209179,
        AUTHOR = "Rao, V. and Khalil, M. I. and Li, H. and Dai, P. and Lu, J. W.",
        TITLE = "Dual Perspective Network for Audio-Visual Event Localization",
        BOOKTITLE = ECCV22,
        YEAR = "2022",
        PAGES = "XXXIV:689--704",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204496"}

@inproceedings{bb209180,
  author    = {Huang, J. and Jin, H.L. and Gong, S.G. and Liu, Y.},
  title     = {Video Activity Localisation with Uncertainties in Temporal Boundary},
  booktitle = ECCV22,
  year      = {2022},
  pages     = {XXXIV:724-740},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204497}
}

@inproceedings{bb209181,
  author    = {Aakur, S. and Sarkar, S.},
  title     = {Actor-Centered Representations for Action Localization in Streaming Videos},
  booktitle = ECCV22,
  year      = {2022},
  pages     = {XXXVIII:70-87},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204498}
}

@inproceedings{bb209182,
  author    = {Paul, S. and Mithun, N.C. and Roy Chowdhury, A.K.},
  title     = {Text-Based Temporal Localization of Novel Events},
  booktitle = ECCV22,
  year      = {2022},
  pages     = {XIV:567-587},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204499}
}

% Braces keep the coined name "ActionFormer" from being lowercased by styles
% that sentence-case titles.
@inproceedings{bb209183,
        AUTHOR = "Zhang, C.L. and Wu, J.X. and Li, Y.",
        TITLE = "{ActionFormer}: Localizing Moments of Actions with Transformers",
        BOOKTITLE = ECCV22,
        YEAR = "2022",
        PAGES = "IV:492-510",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204500"}

@inproceedings{bb209184,
  author    = {Zhang, Y.H. and Doughty, H. and Shao, L. and Snoek, C.G.M.},
  title     = {Audio-Adaptive Activity Recognition Across Video Domains},
  booktitle = CVPR22,
  year      = {2022},
  pages     = {13781-13790},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204501}
}

@inproceedings{bb209185,
  author    = {Liu, W.Z. and Tekin, B. and Coskun, H. and Vineet, V. and Fua, P. and Pollefeys, M.},
  title     = {Learning to Align Sequential Actions in the Wild},
  booktitle = CVPR22,
  year      = {2022},
  pages     = {2171-2181},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204502}
}

% Braces keep the acronym "MV-TAL" from being lowercased by styles that
% sentence-case titles.
% NOTE(review): "Mulit-view" is left exactly as recorded; it looks like a typo
% for "Multi-view" but may be the spelling of the published title -- confirm
% against the proceedings before changing it.
@inproceedings{bb209186,
        AUTHOR = "Li, W. and Chen, S. and Gu, J.Y. and Wang, N. and Chen, C. and Guo, Y.D.",
        TITLE = "{MV-TAL}: Mulit-view Temporal Action Localization in Naturalistic
Driving",
        BOOKTITLE = AICity22,
        YEAR = "2022",
        PAGES = "3241-3247",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204503"}

@inproceedings{bb209187,
  author    = {Zhang, C. and Yang, T.Y. and Weng, J. and Cao, M. and Wang, J. and Zou, Y.X.},
  title     = {Unsupervised Pre-training for Temporal Action Localization Tasks},
  booktitle = CVPR22,
  year      = {2022},
  pages     = {14011-14021},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204504}
}

@inproceedings{bb209188,
  author    = {Xia, K. and Wang, L. and Zhou, S.P. and Zheng, N.N. and Tang, W.},
  title     = {Learning to Refactor Action and Co-occurrence Features for Temporal Action Localization},
  booktitle = CVPR22,
  year      = {2022},
  pages     = {13874-13883},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204505}
}

% Braces keep the coined name "OpenTAL" from being lowercased by styles that
% sentence-case titles.
@inproceedings{bb209189,
        AUTHOR = "Bao, W.T. and Yu, Q. and Kong, Y.",
        TITLE = "{OpenTAL}: Towards Open Set Temporal Action Localization",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "2969-2979",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204506"}

@inproceedings{bb209190,
  author    = {Sridhar, D. and Quader, N. and Muralidharan, S. and Li, Y.X. and Dai, P. and Lu, J.W.},
  title     = {Class Semantics-based Attention for Action Detection},
  booktitle = ICCV21,
  year      = {2021},
  pages     = {13719-13728},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204507}
}

@inproceedings{bb209191,
  author    = {Huang, J. and Liu, Y. and Gong, S.G. and Jin, H.L.},
  title     = {Cross-Sentence Temporal and Semantic Relations in Video Activity Localisation},
  booktitle = ICCV21,
  year      = {2021},
  pages     = {7179-7188},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204508}
}

@inproceedings{bb209192,
  author    = {Xu, M.M. and Perez Rua, J.M. and Escorcia, V. and Martinez, B. and Zhu, X.T. and Zhang, L. and Ghanem, B. and Xiang, T.},
  title     = {Boundary-sensitive Pre-training for Temporal Localization in Videos},
  booktitle = ICCV21,
  year      = {2021},
  pages     = {7200-7210},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204509}
}

@inproceedings{bb209193,
  author    = {Nam, J. and Ahn, D.C. and Kang, D.Y. and Ha, S.J. and Choi, J.H.},
  title     = {Zero-shot Natural Language Video Localization},
  booktitle = ICCV21,
  year      = {2021},
  pages     = {1450-1459},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204510}
}

% Braces keep the acronym "GEB+" from being lowercased by styles that
% sentence-case titles.
@inproceedings{bb209194,
        AUTHOR = "Wang, Y.X. and Gao, D.F. and Yu, L.C. and Lei, W.X. and Feiszli, M. and Shou, M.Z.",
        TITLE = "{GEB+}: A Benchmark for Generic Event Boundary Captioning, Grounding and
Retrieval",
        BOOKTITLE = ECCV22,
        YEAR = "2022",
        PAGES = "XXXV:709-725",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204511"}

@inproceedings{bb209195,
  author    = {Shou, M.Z. and Lei, S.W.X. and Wang, W.Y. and Ghadiyaram, D. and Feiszli, M.},
  title     = {Generic Event Boundary Detection: A Benchmark for Event Segmentation},
  booktitle = ICCV21,
  year      = {2021},
  pages     = {8055-8064},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204512}
}

@inproceedings{bb209196,
  author    = {Ju, C. and Zhao, P. and Chen, S. and Zhang, Y. and Wang, Y.F. and Tian, Q.},
  title     = {Divide and Conquer for Single-frame Temporal Action Localization},
  booktitle = ICCV21,
  year      = {2021},
  pages     = {13435-13444},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204513}
}

@inproceedings{bb209197,
  author    = {Zhao, C. and Thabet, A. and Ghanem, B.},
  title     = {Video Self-Stitching Graph Network for Temporal Action Localization},
  booktitle = ICCV21,
  year      = {2021},
  pages     = {13638-13647},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204514}
}

% Braces keep the acronym "CAG-QIL" and the standalone "Q" from being
% lowercased by styles that sentence-case titles.
@inproceedings{bb209198,
        AUTHOR = "Kang, H. and Kim, K. and Ko, Y. and Kim, S.J.",
        TITLE = "{CAG-QIL}: Context-Aware Actionness Grouping via {Q} Imitation Learning
for Online Temporal Action Localization",
        BOOKTITLE = ICCV21,
        YEAR = "2021",
        PAGES = "13709-13718",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204515"}

@inproceedings{bb209199,
  author    = {Trehan, S. and Aakur, S.N.},
  title     = {Towards Active Vision for Action Localization with Reactive Control and Predictive Learning},
  booktitle = WACV22,
  year      = {2022},
  pages     = {3391-3400},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742aloct1.html#TT204516}
}
Last update: Mar 28, 2026 at 17:09:41