@inproceedings{bb209500,
        AUTHOR = "Wang, W. and Wu, Y. and Liu, H. and Wang, S. and Cheng, J.",
        TITLE = "Temporal Action Detection by Joint Identification-Verification",
        BOOKTITLE = ICPR18,
        YEAR = "2018",
        PAGES = "2026--2031",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742ase2.html#TT204816"}

@inproceedings{bb209501,
        AUTHOR = "Chauhan, J. S. and Wang, Y.",
        TITLE = "Context-Aware Action Detection in Untrimmed Videos Using Bidirectional {LSTM}",
        BOOKTITLE = CRV18,
        YEAR = "2018",
        PAGES = "222--229",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742ase2.html#TT204817"}

@inproceedings{bb209502,
        AUTHOR = "Ali, A. and Taylor, G. W.",
        TITLE = "Real-Time End-to-End Action Detection with Two-Stream Networks",
        BOOKTITLE = CRV18,
        YEAR = "2018",
        PAGES = "31--38",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742ase2.html#TT204818"}

@inproceedings{bb209503,
        AUTHOR = "Shou, Z. and Pan, J. T. and Chan, J. and Miyazawa, K. and Mansour, H. and Vetro, A. and Giro i Nieto, X. and Chang, S. F.",
        TITLE = "Online Detection of Action Start in Untrimmed, Streaming Videos",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "III: 551--568",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742ase2.html#TT204819"}

@inproceedings{bb209504,
        AUTHOR = "Kuehne, H. and Gall, J. and Serre, T.",
        TITLE = "An end-to-end generative framework for video segmentation and recognition",
        BOOKTITLE = WACV16,
        YEAR = "2016",
        PAGES = "1--8",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742ase2.html#TT204820"}

@inproceedings{bb209505,
        AUTHOR = "Ni, B. B. and Yang, X. K. and Gao, S. H.",
        TITLE = "Progressively Parsing Interactional Objects for Fine Grained Action Detection",
        BOOKTITLE = CVPR16,
        YEAR = "2016",
        PAGES = "1020--1028",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742ase2.html#TT204821"}

@inproceedings{bb209506,
        AUTHOR = "Garcia Hernando, G. B. and Kim, T. K.",
        TITLE = "Transition Forests: Learning Discriminative Temporal Transitions for Action Recognition and Detection",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "407--415",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742ase2.html#TT204822"}

@inproceedings{bb209507,
        AUTHOR = "Li, S. and Li, K. and Fu, Y.",
        TITLE = "Temporal Subspace Clustering for Human Motion Segmentation",
        BOOKTITLE = ICCV15,
        YEAR = "2015",
        PAGES = "4453--4461",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742ase2.html#TT204823"}

@inproceedings{bb209508,
        AUTHOR = "Lu, J. and Xu, R. and Corso, J. J.",
        TITLE = "Human action segmentation with hierarchical supervoxel consistency",
        BOOKTITLE = CVPR15,
        YEAR = "2015",
        PAGES = "3762--3771",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742ase2.html#TT204824"}

@inproceedings{bb209509,
        AUTHOR = "Kim, Y. and Chen, J. X. and Chang, M. C. and Wang, X. and Provost, E. M. and Lyu, S. W.",
        TITLE = "Modeling transition patterns between events for temporal human action segmentation and classification",
        BOOKTITLE = FG15,
        YEAR = "2015",
        PAGES = "1--8",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742ase2.html#TT204825"}

@inproceedings{bb209510,
        AUTHOR = "Ghodrati, A. and Pedersoli, M. and Tuytelaars, T.",
        TITLE = "Coupling video segmentation and action recognition",
        BOOKTITLE = WACV14,
        YEAR = "2014",
        PAGES = "618--625",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742ase2.html#TT204826"}

@inproceedings{bb209511,
        AUTHOR = "Shu, Z. X. and Yun, K. and Samaras, D.",
        TITLE = "Action Detection with Improved Dense Trajectories and Sliding Window",
        BOOKTITLE = ChaLearn14,
        YEAR = "2014",
        PAGES = "541--551",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742ase2.html#TT204827"}

@inproceedings{bb209512,
        AUTHOR = "Natarajan, P. and Wu, S. and Vitaladevuni, S. and Zhuang, X. D. and Tsakalidis, S. and Park, U. S. and Prasad, R. and Natarajan, P.",
        TITLE = "Multimodal feature fusion for robust event detection in web videos",
        BOOKTITLE = CVPR12,
        YEAR = "2012",
        PAGES = "1298--1305",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742ase2.html#TT204828"}

@inproceedings{bb209513,
        AUTHOR = "Sorschag, R. and Horhan, M.",
        TITLE = "Action scene detection from motion and events",
        BOOKTITLE = ICIP11,
        YEAR = "2011",
        PAGES = "3641--3644",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742ase2.html#TT204829"}

@article{bb209514,
        AUTHOR = "Hu, Y. P. and Liu, M. and Su, X. O. and Gao, Z. and Nie, L. Q.",
        TITLE = "Video Moment Localization via Deep Cross-Modal Hashing",
        JOURNAL = IP,
        VOLUME = "30",
        YEAR = "2021",
        PAGES = "4667--4677",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204830"}

@article{bb209515,
        AUTHOR = "Gao, J. Y. and Xu, C. S.",
        TITLE = "Learning Video Moment Retrieval Without a Single Annotated Video",
        JOURNAL = CirSysVideo,
        VOLUME = "32",
        YEAR = "2022",
        NUMBER = "3",
        MONTH = mar,
        PAGES = "1646--1657",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204831"}

% NOTE(review): PAGES below ("xx-yy") looks like an exporter placeholder rather
% than a real page range -- replace it once the actual pages are confirmed.
@article{bb209516,
        AUTHOR = "Liu, M. and Nie, L. Q. and Wang, Y. X. and Wang, M. and Rui, Y.",
        TITLE = "A Survey on Video Moment Localization",
        JOURNAL = Surveys,
        VOLUME = "55",
        YEAR = "2023",
        NUMBER = "9",
        MONTH = jan,
        PAGES = "xx-yy",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204832"}

@article{bb209517,
        AUTHOR = "Sun, X. and Gao, J. L. and Zhu, Y. Z. and Wang, X. and Zhou, X.",
        TITLE = "Video Moment Retrieval via Comprehensive Relation-Aware Network",
        JOURNAL = CirSysVideo,
        VOLUME = "33",
        YEAR = "2023",
        NUMBER = "9",
        MONTH = sep,
        PAGES = "5281--5295",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204833"}

@article{bb209518,
        AUTHOR = "Fang, X. and Liu, D. Z. and Zhou, P. and Hu, Y. C.",
        TITLE = "Multi-Modal Cross-Domain Alignment Network for Video Moment Retrieval",
        JOURNAL = MultMed,
        VOLUME = "25",
        YEAR = "2023",
        PAGES = "7517--7532",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204834"}

@article{bb209519,
        AUTHOR = "Yang, X. and Wang, S. S. and Dong, J. and Dong, J. F. and Wang, M. and Chua, T. S.",
        TITLE = "Video Moment Retrieval With Cross-Modal Neural Architecture Search",
        JOURNAL = IP,
        VOLUME = "31",
        YEAR = "2022",
        PAGES = "1204--1216",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204835"}

@article{bb209520,
        AUTHOR = "Han, N. and Yang, X. and Lim, E. P. and Chen, H. and Sun, Q.",
        TITLE = "Efficient Cross-Modal Video Retrieval With Meta-Optimized Frames",
        JOURNAL = MultMed,
        VOLUME = "26",
        YEAR = "2024",
        PAGES = "10924--10936",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204836"}

@article{bb209521,
        AUTHOR = "Teng, J. and Lu, X. K. and Gong, Y. S. and Liu, X. F. and Nie, X. S. and Yin, Y. L.",
        TITLE = "Regularized Two Granularity Loss Function for Weakly Supervised Video Moment Retrieval",
        JOURNAL = MultMed,
        VOLUME = "24",
        YEAR = "2022",
        PAGES = "1141--1151",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204837"}

@article{bb209522,
        AUTHOR = "Wang, G. M. and Xu, X. and Shen, F. M. and Lu, H. M. and Ji, Y. L. and Shen, H. T.",
        TITLE = "Cross-Modal Dynamic Networks for Video Moment Retrieval With Text Query",
        JOURNAL = MultMed,
        VOLUME = "24",
        YEAR = "2022",
        PAGES = "1221--1232",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204838"}

@article{bb209523,
        AUTHOR = "Huo, S. W. and Zhou, Y. and Wang, R. L. and Xiang, W. and Kung, S. Y.",
        TITLE = "Semantic Relevance Learning for Video-Query Based Video Moment Retrieval",
        JOURNAL = MultMed,
        VOLUME = "25",
        YEAR = "2023",
        PAGES = "9290--9301",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204839"}

@article{bb209524,
        AUTHOR = "Wang, Y. X. and Liu, M. and Wei, Y. W. and Cheng, Z. Y. and Wang, Y. L. and Nie, L. Q.",
        TITLE = "{Siamese} Alignment Network for Weakly Supervised Video Moment Retrieval",
        JOURNAL = MultMed,
        VOLUME = "25",
        YEAR = "2023",
        PAGES = "3921--3933",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204840"}

@article{bb209525,
        AUTHOR = "Wang, R. M. and Feng, J. W. and Zhang, F. and Luo, X. N. and Luo, Y. M.",
        TITLE = "Modality-Aware Heterogeneous Graph for Joint Video Moment Retrieval and Highlight Detection",
        JOURNAL = CirSysVideo,
        VOLUME = "34",
        YEAR = "2024",
        NUMBER = "9",
        MONTH = sep,
        PAGES = "8896--8911",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204841"}

@article{bb209526,
        AUTHOR = "Wang, D. and Lu, X. T. and Wang, Q. and Tian, Y. M. and Wan, B. and He, L.",
        TITLE = "Gist, Content, Target-Oriented: A 3-Level Human-Like Framework for Video Moment Retrieval",
        JOURNAL = MultMed,
        VOLUME = "26",
        YEAR = "2024",
        PAGES = "11044--11056",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204842"}

@article{bb209527,
        AUTHOR = "Huang, Z. H. and Ji, Y. and Li, Y. and Liu, C. P.",
        TITLE = "Gazing After Glancing: Edge Information Guided Perception Network for Video Moment Retrieval",
        JOURNAL = SPLetters,
        VOLUME = "31",
        YEAR = "2024",
        PAGES = "1535--1539",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204843"}

@article{bb209528,
        AUTHOR = "Han, D. and Cheng, X. and Guo, N. and Ye, X. C. and Rainer, B. and Priller, P.",
        TITLE = "Momentum Cross-Modal Contrastive Learning for Video Moment Retrieval",
        JOURNAL = CirSysVideo,
        VOLUME = "34",
        YEAR = "2024",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "5977--5994",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204844"}

@article{bb209529,
        AUTHOR = "Jiang, X. and Xu, X. and Zhou, Z. L. and Yang, Y. and Shen, F. M. and Shen, H. T.",
        TITLE = "Zero-Shot Video Moment Retrieval With Angular Reconstructive Text Embeddings",
        JOURNAL = MultMed,
        VOLUME = "26",
        YEAR = "2024",
        PAGES = "9657--9670",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204845"}

@article{bb209530,
        AUTHOR = "Zhou, S. and Zhang, F. and Wang, R. M. and Zhou, F. and Su, Z.",
        TITLE = "Subtask Prior-Driven Optimized Mechanism on Joint Video Moment Retrieval and Highlight Detection",
        JOURNAL = CirSysVideo,
        VOLUME = "34",
        YEAR = "2024",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "11271--11285",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204846"}

@article{bb209531,
        AUTHOR = "Ge, H. L. and Liu, X. L. and Guo, Z. H. and Qiu, Z. W.",
        TITLE = "Learning to Diversify for Robust Video Moment Retrieval",
        JOURNAL = CirSysVideo,
        VOLUME = "35",
        YEAR = "2025",
        NUMBER = "3",
        MONTH = mar,
        PAGES = "2894--2904",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204847"}

@article{bb209532,
        AUTHOR = "Zhao, Y. and Gao, Z. and Ma, C. J. and Guan, W. and Wang, R. and Chen, S. Y.",
        TITLE = "Fine-Grained Modality Relation-Aware Network for Video Moment Retrieval",
        JOURNAL = CirSysVideo,
        VOLUME = "35",
        YEAR = "2025",
        NUMBER = "4",
        MONTH = apr,
        PAGES = "3315--3327",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204848"}

@article{bb209533,
        AUTHOR = "Jiang, X. and Zhu, L. Q. and Xu, X. and Shen, F. M. and Yang, Y. and Shen, H. T.",
        TITLE = "Query as Supervision: Toward Low-Cost and Robust Video Moment and Highlight Retrieval",
        JOURNAL = CirSysVideo,
        VOLUME = "35",
        YEAR = "2025",
        NUMBER = "5",
        MONTH = may,
        PAGES = "3955--3968",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204849"}

@article{bb209534,
        AUTHOR = "Zeng, R. H. and Zhuo, Y. and Li, J. L. and Yang, Y. J. and Wu, H. and Chen, Q. and Hu, X. P. and Leung, V. C. M.",
        TITLE = "Improving Video Moment Retrieval by Auxiliary Moment-Query Pairs With Hyper-Interaction",
        JOURNAL = CirSysVideo,
        VOLUME = "35",
        YEAR = "2025",
        NUMBER = "5",
        MONTH = may,
        PAGES = "3940--3954",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204850"}

@article{bb209535,
        AUTHOR = "Liu, J. and Zhang, Z. B. and Su, Y. T. and Yang, B. and Min, X. K. and Zhai, G. T.",
        TITLE = "Aggregate and Discriminate: Pseudo Clips-Guided Boundary Perception for Video Moment Retrieval",
        JOURNAL = MultMed,
        VOLUME = "27",
        YEAR = "2025",
        PAGES = "4819--4830",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204851"}

@article{bb209536,
        AUTHOR = "Cai, W. T. and Huang, J. and Gong, S. G. and Jin, H. L. and Liu, Y.",
        TITLE = "{MLLM} as video narrator: Mitigating modality imbalance in video moment retrieval",
        JOURNAL = PR,
        VOLUME = "166",
        YEAR = "2025",
        PAGES = "111670",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204852"}

@article{bb209537,
        AUTHOR = "Liu, W. J. and Miao, B. and Cao, J. X. and Zhu, X. L. and Ge, J. W. and Liu, B. and Nasim, M. and Mian, A.",
        TITLE = "Context-Enhanced Video Moment Retrieval With Large Language Models",
        JOURNAL = MultMed,
        VOLUME = "27",
        YEAR = "2025",
        PAGES = "6296--6306",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204853"}

@article{bb209538,
        AUTHOR = "Wang, D. and Yu, Y. S. and Li, S. F. and Zhong, H. and Liang, X. and Zhao, L.",
        TITLE = "Scene-enhanced multi-scale temporal aware network for video moment retrieval",
        JOURNAL = PR,
        VOLUME = "165",
        YEAR = "2025",
        PAGES = "111642",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204854"}

@article{bb209539,
        AUTHOR = "Liu, J. and He, Z. and Nie, W. Z. and Zhang, Z. B. and Su, Y. T.",
        TITLE = "What and Where: Semantic Grasping and Contextual Scanning for Moment Retrieval and Highlight Detection",
        JOURNAL = CirSysVideo,
        VOLUME = "35",
        YEAR = "2025",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "7155--7166",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204855"}

@article{bb209540,
        AUTHOR = "Xie, P. Y. and Li, J. X. and Lu, G. M. and Xu, Y. and Zhang, D.",
        TITLE = "Caption Assisted Multimodal Large Language Model for Video Moment Retrieval",
        JOURNAL = IP,
        VOLUME = "34",
        YEAR = "2025",
        PAGES = "6755--6766",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204856"}

@inproceedings{bb209541,
        AUTHOR = "Kwon, S. and Lee, J. H. and Kang, J. W.",
        TITLE = "Lightweight Temporal Contextual Fine-Tuning Method of Large Multimodal Model for Video Moment Retrieval",
        BOOKTITLE = ICIP25,
        YEAR = "2025",
        PAGES = "2880--2885",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204857"}

@inproceedings{bb209542,
        AUTHOR = "Nguyen Nhu, T. A. and Tran, H. L. and Le, N. K. and Nguyen, M. N. and Nguyen, T. H. and Nguyen Huu, H. L. and Phan Nguyen, H. P. and Pham, H. T. and Nguyen, Q. and Le, H. M. and Dinh, Q. V.",
        TITLE = "A Lightweight Moment Retrieval System with Global Re-Ranking and Robust Adaptive Bidirectional Temporal Search",
        BOOKTITLE = IntVidSea25,
        YEAR = "2025",
        PAGES = "3708--3718",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204858"}

@inproceedings{bb209543,
        AUTHOR = "Tran, H. L. and Nguyen Nhu, T. A. and Phan Nguyen, H. P. and Nguyen, T. H. and Nguyen Dich, N. M. and Dao, A. and Do, H. D. and Nguyen, Q. and Le, H. M. and Dinh, Q. V.",
        TITLE = "Towards Efficient and Robust Moment Retrieval System: A Unified Framework for Multi-Granularity Models and Temporal Reranking",
        BOOKTITLE = IntVidSea25,
        YEAR = "2025",
        PAGES = "3719--3729",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204859"}

@inproceedings{bb209544,
        AUTHOR = "Tan, J. W. and Wang, H. X. and Weng, J. and Li, J. X. and Ou, Z. L. and Dang, K.",
        TITLE = "Anchor-Aware Similarity Cohesion in Target Frames Enables Predicting Temporal Moment Boundaries in {2D}",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "24180--24189",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204860"}

@inproceedings{bb209545,
        AUTHOR = "Jung, M. and Jang, Y. and Choi, S. and Kim, J. and Kim, J. H. and Zhang, B. T.",
        TITLE = "Background-Aware Moment Detection for Video Moment Retrieval",
        BOOKTITLE = WACV25,
        YEAR = "2025",
        PAGES = "8586--8596",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204861"}

@inproceedings{bb209546,
        AUTHOR = "Flanagan, K. and Damen, D. and Wray, M.",
        TITLE = "Moment of Untruth: Dealing with Negative Queries in Video Moment Retrieval",
        BOOKTITLE = WACV25,
        YEAR = "2025",
        PAGES = "5336--5345",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204862"}

@inproceedings{bb209547,
        AUTHOR = "Panta, L. and Shrestha, P. and Sapkota, B. and Bhattarai, A. and Manandhar, S. and Sah, A. K.",
        TITLE = "Cross-modal Contrastive Learning with Asymmetric Co-attention Network for Video Moment Retrieval",
        BOOKTITLE = Pretrain24,
        YEAR = "2024",
        PAGES = "617--624",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204863"}

@inproceedings{bb209548,
        AUTHOR = "Luo, D. Z. and Huang, J. and Gong, S. G. and Jin, H. L. and Liu, Y.",
        TITLE = "Zero-Shot Video Moment Retrieval from Frozen Vision-Language Models",
        BOOKTITLE = WACV24,
        YEAR = "2024",
        PAGES = "5452--5461",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204864"}

@inproceedings{bb209549,
        AUTHOR = "Huang, C. and Wu, Y. L. and Shuai, H. H. and Huang, C. C.",
        TITLE = "Semantic Fusion Augmentation and Semantic Boundary Detection: A Novel Approach to Multi-Target Video Moment Retrieval",
        BOOKTITLE = WACV24,
        YEAR = "2024",
        PAGES = "6769--6778",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204865"}

@inproceedings{bb209550,
        AUTHOR = "Xiao, Y. C. and Luo, Z. Y. and Liu, Y. and Ma, Y. and Bian, H. W. and Ji, Y. and Yang, Y. J. and Li, X.",
        TITLE = "Bridging the Gap: A Unified Video Comprehension Framework for Moment Retrieval and Highlight Detection",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "18709--18719",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204866"}

@inproceedings{bb209551,
        AUTHOR = "Huang, B. and Wang, X. and Chen, H. and Song, Z. and Zhu, W. W.",
        TITLE = "{VTimeLLM}: Empower {LLM} to Grasp Video Moments",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "14271--14280",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204867"}

@inproceedings{bb209552,
        AUTHOR = "Luo, D. Z. and Huang, J. and Gong, S. G. and Jin, H. L. and Liu, Y.",
        TITLE = "Towards Generalisable Video Moment Retrieval: Visual-Dynamic Injection to Image-Text Pre-Training",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "23045--23055",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204868"}

@inproceedings{bb209553,
        AUTHOR = "Ma, K. J. and Zang, X. H. and Feng, Z. and Fang, H. and Ban, C. and Wei, Y. H. and He, Z. J. and Li, Y. X. and Sun, H.",
        TITLE = "{LLaViLo}: Boosting Video Moment Retrieval via Adapter-Based Multimodal Modeling",
        BOOKTITLE = CLVL23,
        YEAR = "2023",
        PAGES = "2790--2795",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204869"}

@inproceedings{bb209554,
        AUTHOR = "Togashi, R. and Otani, M. and Nakashima, Y. and Rahtu, E. and Heikkila, J. and Sakai, T.",
        TITLE = "{AxIoU}: An Axiomatically Justified Measure for Video Moment Retrieval",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "21044--21053",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204870"}

@inproceedings{bb209555,
        AUTHOR = "Zhang, L. Y. and Radke, R. J.",
        TITLE = "Natural Language Video Moment Localization Through Query-Controlled Temporal Convolution",
        BOOKTITLE = WACV22,
        YEAR = "2022",
        PAGES = "2524--2532",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204871"}

@inproceedings{bb209556,
        AUTHOR = "Liu, Y. and Li, S. Y. and Wu, Y. and Chen, C. W. and Shan, Y. and Qie, X. H.",
        TITLE = "{UMT}: Unified Multi-modal Transformers for Joint Video Moment Retrieval and Highlight Detection",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "3032--3041",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204872"}

@inproceedings{bb209557,
        AUTHOR = "Gao, J. Y. and Xu, C. S.",
        TITLE = "Fast Video Moment Retrieval",
        BOOKTITLE = ICCV21,
        YEAR = "2021",
        PAGES = "1503--1512",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204873"}

@inproceedings{bb209558,
        AUTHOR = "Wang, H. and Zha, Z. J. and Li, L. and Liu, D. and Luo, J. B.",
        TITLE = "Structured Multi-Level Interaction Network for Video Moment Localization via Language Query",
        BOOKTITLE = CVPR21,
        YEAR = "2021",
        PAGES = "7022--7031",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204874"}

@inproceedings{bb209559,
        AUTHOR = "Mithun, N. C. and Paul, S. and Roy Chowdhury, A. K.",
        TITLE = "Weakly Supervised Video Moment Retrieval From Text Queries",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "11584--11593",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742vidmo3.html#TT204875"}

% NOTE(review): PAGES below ("xx-yy") looks like an exporter placeholder rather
% than a real page range -- replace it once the actual pages are confirmed.
@article{bb209560,
        AUTHOR = "Luo, Q. S. and Kong, X. D. and Zeng, G. H. and Fan, J. P.",
        TITLE = "Human action detection via boosted local motion histograms",
        JOURNAL = MVA,
        VOLUME = "21",
        YEAR = "2010",
        NUMBER = "3",
        MONTH = apr,
        PAGES = "xx-yy",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204876"}

@article{bb209561,
        AUTHOR = "Chan Hon Tong, A. and Achard, C. and Lucat, L.",
        TITLE = "Simultaneous segmentation and classification of human actions in video streams using deeply optimized {Hough} transform",
        JOURNAL = PR,
        VOLUME = "47",
        YEAR = "2014",
        NUMBER = "12",
        PAGES = "3807--3818",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204877"}

@article{bb209562,
        AUTHOR = "Vaquette, G. and Achard, C. and Lucat, L.",
        TITLE = "Robust information fusion in the {DOHT} paradigm for real-time action detection",
        JOURNAL = RealTimeIP,
        VOLUME = "16",
        YEAR = "2019",
        NUMBER = "5",
        MONTH = oct,
        PAGES = "1511--1524",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204878"}

@article{bb209563,
        AUTHOR = "Hara, K. and Hirayama, T. and Mase, K.",
        TITLE = "Vote Distribution Model for {Hough}-Based Action Detection",
        JOURNAL = IEICE,
        VOLUME = "E99-D",
        YEAR = "2016",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "2796--2808",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204879"}

@article{bb209564,
        AUTHOR = "Zhang, B. and Yang, Y. and Chen, C. and Yang, L. and Han, J. and Shao, L.",
        TITLE = "Action Recognition Using {3D} Histograms of Texture and A Multi-Class Boosting Classifier",
        JOURNAL = IP,
        VOLUME = "26",
        YEAR = "2017",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "4648--4660",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204880"}

@article{bb209565,
        AUTHOR = "Chen, Q. Q. and Zhang, Y. J.",
        TITLE = "Sequential Segment Networks for Action Recognition",
        JOURNAL = SPLetters,
        VOLUME = "24",
        YEAR = "2017",
        NUMBER = "5",
        MONTH = may,
        PAGES = "712--716",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204881"}

@article{bb209566,
        AUTHOR = "Du, W. B. and Wang, Y. and Qiao, Y.",
        TITLE = "Recurrent Spatial-Temporal Attention Network for Action Recognition in Videos",
        JOURNAL = IP,
        VOLUME = "27",
        YEAR = "2018",
        NUMBER = "3",
        MONTH = mar,
        PAGES = "1347--1360",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204882"}

@inproceedings{bb209567,
        AUTHOR = "Du, W. B. and Wang, Y. and Qiao, Y.",
        TITLE = "{RPAN}: An End-to-End Recurrent Pose-Attention Network for Action Recognition in Videos",
        BOOKTITLE = ICCV17,
        YEAR = "2017",
        PAGES = "3745--3754",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204883"}

@article{bb209568,
        AUTHOR = "Wang, J. and Peng, X. J. and Qiao, Y.",
        TITLE = "Cascade multi-head attention networks for action recognition",
        JOURNAL = CVIU,
        VOLUME = "192",
        YEAR = "2020",
        PAGES = "102898",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204884"}

@inproceedings{bb209569,
        AUTHOR = "Yuan, Z. and Stroud, J. C. and Lu, T. and Deng, J.",
        TITLE = "Temporal Action Localization by Structured Maximal Sums",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "3215--3223",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204885"}

@inproceedings{bb209570,
        AUTHOR = "Luo, C. and Yuille, A. L.",
        TITLE = "Grouped Spatial-Temporal Aggregation for Efficient Action Recognition",
        BOOKTITLE = ICCV19,
        YEAR = "2019",
        PAGES = "5511--5520",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204886"}

@inproceedings{bb209571,
        AUTHOR = "Hara, K. and Hirayama, T. and Mase, K.",
        TITLE = "Trend-sensitive {Hough} forests for action detection",
        BOOKTITLE = ICIP14,
        YEAR = "2014",
        PAGES = "1475--1479",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204887"}

@inproceedings{bb209572,
        AUTHOR = "Kobayashi, T.",
        TITLE = "Flip-Invariant Motion Representation",
        BOOKTITLE = ICCV17,
        YEAR = "2017",
        PAGES = "5629--5638",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204888"}

@inproceedings{bb209573,
        AUTHOR = "Monteleone, V. and lo Presti, L. and La Cascia, M.",
        TITLE = "{HoP}: Histogram of Patterns for Human Action Representation",
        BOOKTITLE = CIAP17,
        YEAR = "2017",
        PAGES = "I:457--468",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204889"}

@inproceedings{bb209574,
        AUTHOR = "Abdulmunem, A. and Lai, Y. K. and Sun, X.",
        TITLE = "{3D} {GLOH} features for human action recognition",
        BOOKTITLE = ICPR16,
        YEAR = "2016",
        PAGES = "805--810",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204890"}

@inproceedings{bb209575,
        AUTHOR = "Hilsenbeck, B. and Munch, D. and Kieritz, H. and Hubner, W. and Arens, M.",
        TITLE = "Hierarchical {Hough} forests for view-independent action recognition",
        BOOKTITLE = ICPR16,
        YEAR = "2016",
        PAGES = "1911--1916",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204891"}

@inproceedings{bb209576,
        AUTHOR = "Garcia Hernando, G. B. and Chang, H. J. and Serrano, I. and Deniz Suarez, O. and Kim, T. K.",
        TITLE = "Transition {Hough} forest for trajectory-based action recognition",
        BOOKTITLE = WACV16,
        YEAR = "2016",
        PAGES = "1--8",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204892"}

@inproceedings{bb209577,
        AUTHOR = "Tian, Q. and Arbel, T. and Clark, J. J.",
        TITLE = "{Shannon} information based adaptive sampling for action recognition",
        BOOKTITLE = ICPR16,
        YEAR = "2016",
        PAGES = "967--972",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204893"}

@inproceedings{bb209578,
        AUTHOR = "Miao, J. and Xu, X. M. and Mathew, R. and Huang, H. Y.",
        TITLE = "Residue boundary histograms for action recognition in the compressed domain",
        BOOKTITLE = ICIP15,
        YEAR = "2015",
        PAGES = "2825--2829",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204894"}

@inproceedings{bb209579,
        AUTHOR = "Ahsan, S. M. M. and Tan, J. K. and Kim, H. and Ishikawa, S.",
        TITLE = "Histogram of {DMHI} and {LBP} images to represent human actions",
        BOOKTITLE = ICIP14,
        YEAR = "2014",
        PAGES = "1440--1444",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204895"}

@inproceedings{bb209580,
        AUTHOR = "Ciptadi, A. and Goodwin, M. S. and Rehg, J. M.",
        TITLE = "Movement Pattern Histogram for Action Recognition and Retrieval",
        BOOKTITLE = ECCV14,
        YEAR = "2014",
        PAGES = "II: 695--710",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204896"}

@inproceedings{bb209581,
        AUTHOR = "Chua, T. W. and Leman, K.",
        TITLE = "A Novel Human Action Representation via Convolution of Shape-Motion Histograms",
        BOOKTITLE = MMMod14,
        YEAR = "2014",
        PAGES = "I: 98--108",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204897"}

@inproceedings{bb209582,
  author    = {Ren, H.M. and Moeslund, T.B.},
  title     = {Action recognition using salient neighboring histograms},
  booktitle = ICIP13,
  year      = {2013},
  pages     = {2807-2811},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204898},
}

% The proper noun in the title is braced so sentence-casing styles keep its capital.
@inproceedings{bb209583,
        AUTHOR = "Hara, K. and Hirayama, T. and Mase, K.",
        TITLE = "Simultaneous Action Recognition and Localization Based on Multi-view
{Hough} Voting",
        BOOKTITLE = ACPR13,
        YEAR = "2013",
        PAGES = "616-620",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204899"}

% The proper noun in the title is braced so sentence-casing styles keep its capital.
% PAGES uses the "volume: first-last" spacing, as in "I: 98-108".
@inproceedings{bb209584,
        AUTHOR = "Chan Hon Tong, A. and Achard, C.",
        TITLE = "Deeply Optimized {Hough} Transform: Application to Action Segmentation",
        BOOKTITLE = CIAP13,
        YEAR = "2013",
        PAGES = "I: 51-60",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204900"}

@inproceedings{bb209585,
  author    = {Fuad, Z. and Unel, M.},
  title     = {Human Action Recognition Using Fusion of Depth and Inertial Sensors},
  booktitle = ICIAR18,
  year      = {2018},
  pages     = {373-380},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204901},
}

@inproceedings{bb209586,
  author    = {Ustundag, B.C. and Unel, M.},
  title     = {Human Action Recognition Using Histograms of Oriented Optical Flows
from Depth},
  booktitle = ISVC14,
  year      = {2014},
  pages     = {I: 629-638},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204902},
}

@inproceedings{bb209587,
  author    = {Sultani, W. and Saleemi, I.},
  title     = {Human Action Recognition across Datasets by Foreground-Weighted
Histogram Decomposition},
  booktitle = CVPR14,
  year      = {2014},
  pages     = {764-771},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204903},
}

@inproceedings{bb209588,
  author    = {Tabia, H. and Gouiffes, M. and Lacassagne, L.},
  title     = {Motion histogram quantification for human action recognition},
  booktitle = ICPR12,
  year      = {2012},
  pages     = {2404-2407},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204904},
}

@inproceedings{bb209589,
  author    = {Perez, E.A. and Mota, V.F. and Maciel, L.M. and Sad, D. and Vieira, M.B.},
  title     = {Combining gradient histograms using orientation tensors for human
action recognition},
  booktitle = ICPR12,
  year      = {2012},
  pages     = {3460-3463},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204905},
}

% The proper noun in the title is braced so sentence-casing styles keep its capital.
@inproceedings{bb209590,
        AUTHOR = "Lo, Y.C. and Lee, P.Y. and Cheng, S.C.",
        TITLE = "Space-time template matching for human action detection using
volume-based Generalized {Hough} transform",
        BOOKTITLE = ICIP11,
        YEAR = "2011",
        PAGES = "2097-2100",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204906"}

% The acronym in the title is braced so sentence-casing styles keep it uppercase.
@inproceedings{bb209591,
        AUTHOR = "Hsu, F.S. and Lin, C.H. and Lin, W.Y.",
        TITLE = "Recognizing human actions using curvature estimation and {NWFE}-based
histogram vectors",
        BOOKTITLE = VCIP11,
        YEAR = "2011",
        PAGES = "1-4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204907"}

@inproceedings{bb209592,
  author    = {Ziaeefard, M. and Ebrahimnezhad, H.},
  title     = {Hierarchical Human Action Recognition by Normalized-Polar Histogram},
  booktitle = ICPR10,
  year      = {2010},
  pages     = {3720-3723},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204908},
}

% The acronym in the title is braced so sentence-casing styles keep it uppercase.
@inproceedings{bb209593,
        AUTHOR = "Lai, K.T. and Chen, M.S. and Hsieh, C.H. and Lai, M.F.",
        TITLE = "Orientation histogram of {SIFT} displacement for recognizing actions in
broadcast videos",
        BOOKTITLE = EUVIP11,
        YEAR = "2011",
        PAGES = "286-291",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204909"}

@inproceedings{bb209594,
  author    = {Lai, K.T. and Hsieh, C.H. and Lai, M.F. and Chen, M.S.},
  title     = {Human Action Recognition Using Key Points Displacement},
  booktitle = ICISP10,
  year      = {2010},
  pages     = {439-447},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204910},
}

% The leading acronym is braced; sentence-casing styles would otherwise print "Hmm".
@inproceedings{bb209595,
        AUTHOR = "Vezzani, R. and Baltieri, D. and Cucchiara, R.",
        TITLE = "{HMM} Based Action Recognition with Projection Histogram Features",
        BOOKTITLE = "ICPR-Contests10",
        YEAR = "2010",
        PAGES = "286-293",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742hist1.html#TT204911"}

% MONTH uses the predefined three-letter macro so each style can format the month itself.
@article{bb209596,
        AUTHOR = "Bobick, A.F. and Davis, J.W.",
        TITLE = "The Recognition of Human Movement Using Temporal Templates",
        JOURNAL = PAMI,
        VOLUME = "23",
        YEAR = "2001",
        NUMBER = "3",
        MONTH = mar,
        PAGES = "257-267",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742fl2.html#TT204912"}

% "Chapter 6" is a chapter reference, not a page range, so it is carried in NOTE;
% in PAGES the standard styles would print it behind a "page" label.
@inproceedings{bb209597,
        AUTHOR = "Bobick, A.F. and Davis, J.W.",
        TITLE = "Action Recognition Using Temporal Templates",
        BOOKTITLE = MBR97,
        YEAR = "1997",
        NOTE = "Chapter 6",
        BIBSOURCE = "http://www.visionbib.com/bibliography/motion-f742fl2.html#TT204913"}

@inproceedings{bb209598,
  author    = {Bobick, A.F. and Davis, J.W.},
  title     = {Real-Time Recognition of Activity Using Temporal Templates},
  booktitle = WACV96,
  year      = {1996},
  pages     = {39-42},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742fl2.html#TT204914},
}

@inproceedings{bb209599,
  author    = {Davis, J.W. and Bobick, A.F.},
  title     = {Real-Time Recognition of Activity Using Temporal Templates},
  booktitle = Vismod,
  year      = {1997},
  bibsource = {http://www.visionbib.com/bibliography/motion-f742fl2.html#TT204914},
}

Last update: Apr 6, 2026 at 11:28:57