% Bibliography entries bb235200 through bb235299.
% Layout: one entry per record, one field per line. Field names, quoting,
% page-range punctuation and month spelling follow the form already used by
% these records. Bare values such as ICIP18, CVPR17, SP:IC or MultMed are
% string macros; their definitions are not part of this span and are
% presumably supplied elsewhere (TODO confirm before compiling stand-alone).
% BIBSOURCE records the web page each entry was taken from; the records
% below are grouped by that page.

% ---- Source page: applicat825vc4.html ----

@inproceedings{bb235200,
  AUTHOR = "Yang, D. and Yuan, C.",
  TITLE = "Hierarchical Context Encoding for Events Captioning in Videos",
  BOOKTITLE = ICIP18,
  YEAR = "2018",
  PAGES = "1288-1292",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT230119"
}

@inproceedings{bb235201,
  AUTHOR = "Shen, Z.Q. and Li, J.G. and Su, Z. and Li, M.J. and Chen, Y.R. and Jiang, Y.G. and Xue, X.Y.",
  TITLE = "Weakly Supervised Dense Video Captioning",
  BOOKTITLE = CVPR17,
  YEAR = "2017",
  PAGES = "5159-5167",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT230120"
}

@inproceedings{bb235202,
  AUTHOR = "Baraldi, L. and Grana, C. and Cucchiara, R.",
  TITLE = "Hierarchical Boundary-Aware Neural Encoder for Video Captioning",
  BOOKTITLE = CVPR17,
  YEAR = "2017",
  PAGES = "3185-3194",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT230121"
}

@inproceedings{bb235203,
  AUTHOR = "Pan, P.B. and Xu, Z.W. and Yang, Y. and Wu, F. and Zhuang, Y.T.",
  TITLE = "Hierarchical Recurrent Neural Encoder for Video Representation with Application to Captioning",
  BOOKTITLE = CVPR16,
  YEAR = "2016",
  PAGES = "1029-1038",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT230122"
}

@inproceedings{bb235204,
  AUTHOR = "Yu, H.N. and Wang, J. and Huang, Z.H. and Yang, Y. and Xu, W.",
  TITLE = "Video Paragraph Captioning Using Hierarchical Recurrent Neural Networks",
  BOOKTITLE = CVPR16,
  YEAR = "2016",
  PAGES = "4584-4593",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT230123"
}

@inproceedings{bb235205,
  AUTHOR = "Shin, A. and Ohnishi, K. and Harada, T.",
  TITLE = "Beyond caption to narrative: Video captioning with multiple sentences",
  BOOKTITLE = ICIP16,
  YEAR = "2016",
  PAGES = "3364-3368",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vc4.html#TT230124"
}

% ---- Source page: applicat825vm3.html ----

@article{bb235206,
  AUTHOR = "Vakali, A. and Hacid, M.S. and Elmagarmid, A.",
  TITLE = "MPEG-7 based description schemes for multi-level video content classification",
  JOURNAL = IVC,
  VOLUME = "22",
  YEAR = "2004",
  NUMBER = "5",
  MONTH = "May",
  PAGES = "367-378",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230125"
}

@article{bb235207,
  AUTHOR = "Fonseca, P.M. and Pereira, F.",
  TITLE = "Automatic video summarization based on MPEG-7 descriptions",
  JOURNAL = SP:IC,
  VOLUME = "19",
  YEAR = "2004",
  NUMBER = "8",
  MONTH = "September",
  PAGES = "685-699",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230126"
}

@article{bb235208,
  AUTHOR = "Mrak, M. and Calic, J. and Kondoz, A.M.",
  TITLE = "Fast analysis of scalable video for adaptive browsing interfaces",
  JOURNAL = CVIU,
  VOLUME = "113",
  YEAR = "2009",
  NUMBER = "3",
  MONTH = "March",
  PAGES = "425-434",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230127"
}

@inproceedings{bb235209,
  AUTHOR = "Calic, J. and Mrak, M. and Kondoz, A.M.",
  TITLE = "Flexible generation of video summaries from layered video bit-streams",
  BOOKTITLE = ICIP08,
  YEAR = "2008",
  PAGES = "2516-2519",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230128"
}

@article{bb235210,
  AUTHOR = "Herranz, L. and Martinez, J.M.",
  TITLE = "An integrated approach to summarization and adaptation using H.264/MPEG-4 SVC",
  JOURNAL = SP:IC,
  VOLUME = "24",
  YEAR = "2009",
  NUMBER = "6",
  MONTH = "July",
  PAGES = "499-509",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230129"
}

@article{bb235211,
  AUTHOR = "Herranz, L. and Martinez, J.M.",
  TITLE = "On the use of hierarchical prediction structures for efficient summary generation of H.264/AVC bitstreams",
  JOURNAL = SP:IC,
  VOLUME = "24",
  YEAR = "2009",
  NUMBER = "8",
  MONTH = "September",
  PAGES = "615-629",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230130"
}

@article{bb235212,
  AUTHOR = "Matos, N. and Pereira, F.",
  TITLE = "Automatic creation and evaluation of MPEG-7 compliant summary descriptions for generic audiovisual content",
  JOURNAL = SP:IC,
  VOLUME = "23",
  YEAR = "2008",
  NUMBER = "8",
  MONTH = "September",
  PAGES = "581-598",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230131"
}

@article{bb235213,
  AUTHOR = "Ren, J.C. and Jiang, J.M. and Feng, Y.",
  TITLE = "Activity-driven content adaptation for effective video summarization",
  JOURNAL = JVCIR,
  VOLUME = "21",
  YEAR = "2010",
  NUMBER = "8",
  MONTH = "November",
  PAGES = "930-938",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230132"
}

@article{bb235214,
  AUTHOR = "Almeida, J. and Leite, N.J. and da Silva Torres, R.",
  TITLE = "VISON: VIdeo Summarization for ONline applications",
  JOURNAL = PRL,
  VOLUME = "33",
  YEAR = "2012",
  NUMBER = "4",
  MONTH = "March",
  PAGES = "397-409",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230133"
}

@inproceedings{bb235215,
  AUTHOR = "Almeida, J. and Leite, N.J. and da Silva Torres, R.",
  TITLE = "Comparison of video sequences with histograms of motion patterns",
  BOOKTITLE = ICIP11,
  YEAR = "2011",
  PAGES = "3673-3676",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230134"
}

@inproceedings{bb235216,
  AUTHOR = "Almeida, J. and Leite, N.J. and da Silva Torres, R.",
  TITLE = "Rapid Cut Detection on Compressed Video",
  BOOKTITLE = CIARP11,
  YEAR = "2011",
  PAGES = "71-78",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230135"
}

% NOTE(review): PAGES previously held the unfilled placeholder xx-yy. It now
% carries the article number in the same form as bb235265; confirm the number
% against the publisher record.
@article{bb235217,
  AUTHOR = "Basavarajaiah, M. and Sharma, P.",
  TITLE = "Survey of Compressed Domain Video Summarization Techniques",
  JOURNAL = Surveys,
  VOLUME = "52",
  YEAR = "2019",
  NUMBER = "6",
  MONTH = "October",
  PAGES = "Article No 116",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230136"
}

@inproceedings{bb235218,
  AUTHOR = "Lee, J.H. and Kim, W.Y.",
  TITLE = "Video Summarization and Retrieval System Using Face Recognition and MPEG-7 Descriptors",
  BOOKTITLE = CIVR04,
  YEAR = "2004",
  PAGES = "170-178",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230137"
}

@inproceedings{bb235219,
  AUTHOR = "Soysal, M. and Alatan, A.A.",
  TITLE = "Combining MPEG-7 Based Visual Experts for Reaching Semantics",
  BOOKTITLE = VLBV03,
  YEAR = "2003",
  PAGES = "66-75",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230138"
}

@inproceedings{bb235220,
  AUTHOR = "Divakaran, A. and Peker, K.A. and Radhakrishnan, R. and Xiong, Z.Y. and Cabasson, R.",
  TITLE = "Video Summarization using MPEG-7 Motion Activity and Audio Descriptors",
  BOOKTITLE = VideoMining03,
  YEAR = "2003",
  PAGES = "Chapter 4",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230139"
}

@inproceedings{bb235221,
  AUTHOR = "Sugano, M. and Nakajima, Y. and Yanagihara, H.",
  TITLE = "Automated MPEG audio-video summarization and description",
  BOOKTITLE = ICIP02,
  YEAR = "2002",
  PAGES = "I: 956-959",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230140"
}

@inproceedings{bb235222,
  AUTHOR = "Jaimes, A. and Echigo, T. and Teraguchi, M. and Satoh, F.",
  TITLE = "Learning personalized video highlights from detailed MPEG-7 metadata",
  BOOKTITLE = ICIP02,
  YEAR = "2002",
  PAGES = "I: 133-136",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230141"
}

@inproceedings{bb235223,
  AUTHOR = "Lin, C.Y. and Tseng, B.L. and Naphade, M.R. and Natsev, A.P. and Smith, J.R.",
  TITLE = "VideoAL: A novel end-to-end MPEG-7 video automatic labeling system",
  BOOKTITLE = ICIP03,
  YEAR = "2003",
  PAGES = "III: 53-56",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230142"
}

@inproceedings{bb235224,
  AUTHOR = "Kim, J.G. and Chang, H.S. and Kim, J.W. and Kim, H.M.",
  TITLE = "Efficient Camera Motion Characterization for MPEG Video Indexing",
  BOOKTITLE = ICME00,
  YEAR = "2000",
  PAGES = "TP11",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230143"
}

@inproceedings{bb235225,
  AUTHOR = "DeMenthon, D.F. and Megret, R.",
  TITLE = "Spatio-temporal Segmentation of Video by Hierarchical Mean Shift Analysis",
  BOOKTITLE = UMD,
  YEAR = "2002",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230144"
}

@inproceedings{bb235226,
  AUTHOR = "Megret, R. and DeMenthon, D.F.",
  TITLE = "A Survey of Spatio-temporal Grouping Techniques",
  BOOKTITLE = UMD,
  YEAR = "2002",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230145"
}

@inproceedings{bb235227,
  AUTHOR = "DeMenthon, D.F. and Latecki, L.J. and Rosenfeld, A. and Stueckelberg, M.V.",
  TITLE = "Relevance Ranking of Video Data using Hidden Markov Model Distances and Polygon Simplification",
  BOOKTITLE = UMD,
  YEAR = "2001",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230146"
}

@inproceedings{bb235228,
  AUTHOR = "DeMenthon, D.F. and Kobla, V. and Doermann, D.",
  TITLE = "Video Summarization by Curve Simplification",
  BOOKTITLE = UMD,
  YEAR = "1998",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230147"
}

@inproceedings{bb235229,
  AUTHOR = "Yoon, K. and DeMenthon, D.F. and Doermann, D.",
  TITLE = "Event Detection from MPEG Video in the Compressed Domain",
  BOOKTITLE = ICPR00,
  YEAR = "2000",
  PAGES = "Vol I: 819-822",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vm3.html#TT230148"
}

% ---- Source page: applicat825mms4.html ----

@article{bb235230,
  AUTHOR = "Doulamis, A.D. and Doulamis, N.D. and Kollias, S.D.",
  TITLE = "A fuzzy video content representation for video summarization and content-based retrieval",
  JOURNAL = SP,
  VOLUME = "80",
  YEAR = "2000",
  NUMBER = "6",
  MONTH = "June",
  PAGES = "1049-1067",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230149"
}

% Same title and BIBSOURCE anchor as bb235230, but a different volume, year
% and single page; kept as a separate record.
@article{bb235231,
  AUTHOR = "Kollias, S.D. and Doulamis, N.D. and Doulamis, A.D.",
  TITLE = "A fuzzy video content representation for video summarization and content-based retrieval",
  JOURNAL = SP,
  VOLUME = "82",
  YEAR = "2002",
  NUMBER = "4",
  MONTH = "April",
  PAGES = "545",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230149"
}

% PAGES corrected from the reversed range 501-157 (digit transposition).
@article{bb235232,
  AUTHOR = "Doulamis, N.D. and Doulamis, A.D. and Avrithis, Y.S. and Ntalianis, K.S. and Kollias, S.D.",
  TITLE = "Efficient Summarization of Stereoscopic Video Sequences",
  JOURNAL = CirSysVideo,
  VOLUME = "10",
  YEAR = "2000",
  NUMBER = "4",
  MONTH = "June",
  PAGES = "501-517",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230150"
}

@inproceedings{bb235233,
  AUTHOR = "Ntalianis, K.S. and Doulamis, A.D. and Tsapatsoulis, N.",
  TITLE = "Implicit visual concept modeling in image/video annotation",
  BOOKTITLE = ARTEMIS10,
  YEAR = "2010",
  PAGES = "33-38",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230151"
}

@inproceedings{bb235234,
  AUTHOR = "Doulamis, A.D. and Ntalianis, K.S.",
  TITLE = "On the Fly Semantic Annotation and Modelling of Multimedia",
  BOOKTITLE = WSSIP09,
  YEAR = "2009",
  PAGES = "1-4",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230152"
}

@inproceedings{bb235235,
  AUTHOR = "Doulamis, N.D. and Doulamis, A.D. and Avrithis, Y.S. and Kollias, S.D.",
  TITLE = "Video content representation using optimal extraction of frames and scenes",
  BOOKTITLE = ICIP98,
  YEAR = "1998",
  PAGES = "I: 875-879",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230153"
}

@article{bb235236,
  AUTHOR = "Amir, A. and Ashour, G. and Srinivasan, S.",
  TITLE = "Automatic generation of conference video proceedings",
  JOURNAL = JVCIR,
  VOLUME = "15",
  YEAR = "2004",
  NUMBER = "3",
  MONTH = "September",
  PAGES = "467-488",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230154"
}

@article{bb235237,
  AUTHOR = "Metze, F. and Ding, D. and Younessian, E. and Hauptmann, A.G.",
  TITLE = "Beyond audio and video retrieval: Topic-oriented multimedia summarization",
  JOURNAL = MultInfoRetr,
  VOLUME = "2",
  YEAR = "2013",
  NUMBER = "2",
  MONTH = "June",
  PAGES = "131-144",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230155"
}

@inproceedings{bb235238,
  AUTHOR = "Ding, D. and Metze, F. and Rawat, S. and Schulam, P.F. and Burger, S. and Younessian, E. and Bao, L. and Christel, M.G. and Hauptmann, A.G.",
  TITLE = "Beyond audio and video retrieval: Towards multimedia summarization",
  BOOKTITLE = ICMR12,
  YEAR = "2012",
  PAGES = "2",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230156"
}

@article{bb235239,
  AUTHOR = "Bian, J.W. and Yang, Y. and Zhang, H.W. and Chua, T.S.",
  TITLE = "Multimedia Summarization for Social Events in Microblog Stream",
  JOURNAL = MultMed,
  VOLUME = "17",
  YEAR = "2015",
  NUMBER = "2",
  MONTH = "February",
  PAGES = "216-228",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230157"
}

@article{bb235240,
  AUTHOR = "Kuanar, S.K. and Ranga, K.B. and Chowdhury, A.S.",
  TITLE = "Multi-View Video Summarization Using Bipartite Matching Constrained Optimum-Path Forest Clustering",
  JOURNAL = MultMed,
  VOLUME = "17",
  YEAR = "2015",
  NUMBER = "8",
  MONTH = "August",
  PAGES = "1166-1173",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230158"
}

@article{bb235241,
  AUTHOR = "Tan, C.C. and Ngo, C.W.",
  TITLE = "On the use of commonsense ontology for multimedia event recounting",
  JOURNAL = MultInfoRetr,
  VOLUME = "5",
  YEAR = "2016",
  NUMBER = "2",
  MONTH = "June",
  PAGES = "73-88",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230159"
}

@article{bb235242,
  AUTHOR = "Wu, F. and Fang, H. and Li, X. and Tang, S. and Lu, W. and Yang, Y. and Zhu, W. and Zhuang, Y.",
  TITLE = "Aspect Learning for Multimedia Summarization via Nonparametric Bayesian",
  JOURNAL = CirSysVideo,
  VOLUME = "26",
  YEAR = "2016",
  NUMBER = "10",
  MONTH = "October",
  PAGES = "1931-1942",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230160"
}

@article{bb235243,
  AUTHOR = "Jiang, Y.G. and Wu, Z.X. and Tang, J.H. and Li, Z.C. and Xue, X.Y. and Chang, S.F.",
  TITLE = "Modeling Multimodal Clues in a Hybrid Deep Learning Framework for Video Classification",
  JOURNAL = MultMed,
  VOLUME = "20",
  YEAR = "2018",
  NUMBER = "11",
  MONTH = "November",
  PAGES = "3137-3147",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230161"
}

@article{bb235244,
  AUTHOR = "Wu, Z.X. and Li, H.D. and Zheng, Y.B. and Xiong, C.M. and Jiang, Y.G. and Davis, L.S.",
  TITLE = "A Coarse-to-Fine Framework for Resource Efficient Video Recognition",
  JOURNAL = IJCV,
  VOLUME = "129",
  YEAR = "2021",
  NUMBER = "11",
  MONTH = "November",
  PAGES = "2965-2977",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230162"
}

@article{bb235245,
  AUTHOR = "Tian, F. and Wang, Q. and Li, X. and Sun, N.",
  TITLE = "Heterogeneous multimedia cooperative annotation based on multimodal correlation learning",
  JOURNAL = JVCIR,
  VOLUME = "58",
  YEAR = "2019",
  PAGES = "544-553",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230163"
}

% YEAR corrected from 2018: volume 35, number 12 (December) of this journal
% is the 2019 volume. NOTE(review): confirm against the publisher record.
@article{bb235246,
  AUTHOR = "Du, X.T. and Yuan, J. and Hu, L. and Dai, Y.",
  TITLE = "Description generation of open-domain videos incorporating multimodal features and bidirectional encoder",
  JOURNAL = VC,
  VOLUME = "35",
  YEAR = "2019",
  NUMBER = "12",
  MONTH = "December",
  PAGES = "1703-1712",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230164"
}

@article{bb235247,
  AUTHOR = "Li, J. and Wong, Y. and Zhao, Q. and Kankanhalli, M.S.",
  TITLE = "Video Storytelling: Textual Summaries for Events",
  JOURNAL = MultMed,
  VOLUME = "22",
  YEAR = "2020",
  NUMBER = "2",
  MONTH = "February",
  PAGES = "554-565",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230165"
}

@article{bb235248,
  AUTHOR = "Cascianelli, S. and Costante, G. and Devo, A. and Ciarfuglia, T.A. and Valigi, P. and Fravolini, M.L.",
  TITLE = "The Role of the Input in Natural Language Video Description",
  JOURNAL = MultMed,
  VOLUME = "22",
  YEAR = "2020",
  NUMBER = "1",
  MONTH = "January",
  PAGES = "271-283",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230166"
}

@article{bb235249,
  AUTHOR = "Zhang, Y.Z. and Liu, Y. and Kang, W. and Zheng, Y.X.",
  TITLE = "MAR-Net: Motion-Assisted Reconstruction Network for Unsupervised Video Summarization",
  JOURNAL = SPLetters,
  VOLUME = "30",
  YEAR = "2023",
  PAGES = "1282-1286",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230167"
}

@article{bb235250,
  AUTHOR = "Yu, L.J. and Zhao, X. and Xie, L. and Liang, H.R. and Liang, R.H.",
  TITLE = "Hierarchical multi-modal video summarization with dynamic sampling",
  JOURNAL = IET-IPR,
  VOLUME = "18",
  YEAR = "2024",
  NUMBER = "14",
  PAGES = "4577-4588",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230168"
}

@article{bb235251,
  AUTHOR = "Sartinas, E.G. and Psarakis, E.Z. and Kosmopoulos, D.I.",
  TITLE = "A 3D wrist motion-based sign language video summarization technique",
  JOURNAL = PRL,
  VOLUME = "189",
  YEAR = "2025",
  PAGES = "23-30",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230169"
}

@inproceedings{bb235252,
  AUTHOR = "Bouritsas, G. and Koutras, P. and Zlatintsi, A. and Maragos, P.",
  TITLE = "Multimodal Visual Concept Learning with Weakly Supervised Techniques",
  BOOKTITLE = CVPR18,
  YEAR = "2018",
  PAGES = "4914-4923",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230170"
}

@inproceedings{bb235253,
  AUTHOR = "Wang, J. and Wang, W. and Huang, Y. and Wang, L. and Tan, T.",
  TITLE = "M3: Multimodal Memory Modelling for Video Captioning",
  BOOKTITLE = CVPR18,
  YEAR = "2018",
  PAGES = "7512-7520",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230171"
}

@inproceedings{bb235254,
  AUTHOR = "Kang, S.H. and Kim, J.Y. and Choi, H. and Kim, S.J. and Yoo, C.D.",
  TITLE = "Pivot Correlational Neural Network for Multimodal Video Categorization",
  BOOKTITLE = ECCV18,
  YEAR = "2018",
  PAGES = "XIV: 402-417",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230172"
}

@inproceedings{bb235255,
  AUTHOR = "Mazaheri, A. and Shah, M.",
  TITLE = "Visual Text Correction",
  BOOKTITLE = ECCV18,
  YEAR = "2018",
  PAGES = "XIII: 159-175",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230173"
}

% PAGES spacing normalised to the volume-prefix form used by the other
% records (a space after the colon).
@inproceedings{bb235256,
  AUTHOR = "Rudinac, S. and Chua, T.S. and Diaz Ferreyra, N. and Friedland, G. and Gornostaja, T. and Huet, B. and Kaptein, R. and Linden, K. and Moens, M.F. and Peltonen, J. and Redi, M. and Schedl, M. and Shamma, D.A. and Smeaton, A. and Xie, L.X.",
  TITLE = "Rethinking Summarization and Storytelling for Modern Social Multimedia",
  BOOKTITLE = MMMod18,
  YEAR = "2018",
  PAGES = "I: 632-644",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230174"
}

@inproceedings{bb235257,
  AUTHOR = "Hori, C. and Hori, T. and Lee, T.Y. and Zhang, Z.M. and Harsham, B. and Hershey, J.R. and Marks, T.K. and Sumi, K.",
  TITLE = "Attention-Based Multimodal Fusion for Video Description",
  BOOKTITLE = ICCV17,
  YEAR = "2017",
  PAGES = "4203-4212",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230175"
}

@inproceedings{bb235258,
  AUTHOR = "Gupta, R.K. and Yang, Y.P.",
  TITLE = "Leveraging Multi-modal Analyses and Online Knowledge Base for Video Aboutness Generation",
  BOOKTITLE = ISVC16,
  YEAR = "2016",
  PAGES = "II: 55-64",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230176"
}

@inproceedings{bb235259,
  AUTHOR = "Vallet, F. and Essid, S. and Carrive, J. and Richard, G.",
  TITLE = "Robust visual features for the multimodal identification of unregistered speakers in TV talk-shows",
  BOOKTITLE = ICIP10,
  YEAR = "2010",
  PAGES = "1469-1472",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230177"
}

@inproceedings{bb235260,
  AUTHOR = "Bailer, W. and Thallinger, G.",
  TITLE = "A framework for multimedia content abstraction and its application to rushes exploration",
  BOOKTITLE = CIVR07,
  YEAR = "2007",
  PAGES = "146-153",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230178"
}

@inproceedings{bb235261,
  AUTHOR = "Tesic, J. and Smith, J.R.",
  TITLE = "Efficient Summarizing of Multimedia Archives Using Cluster Labeling",
  BOOKTITLE = CIVR06,
  YEAR = "2006",
  PAGES = "518-520",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825mms4.html#TT230179"
}

% ---- Source page: applicat825vsk1.html ----

@inproceedings{bb235262,
  AUTHOR = "Mauldin, M.L. and Smith, M.A. and Stevens, S.M. and Wactlar, H.D. and Christel, M.G. and Reddy, D.R.",
  TITLE = "System and method for skimming digital audio/video data",
  BOOKTITLE = US_Patent,
  YEAR = "1997",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230180"
}

@article{bb235263,
  AUTHOR = "Almeida, J. and Leite, N.J. and da Silva Torres, R.",
  TITLE = "Online video summarization on compressed domain",
  JOURNAL = JVCIR,
  VOLUME = "24",
  YEAR = "2013",
  NUMBER = "6",
  MONTH = "August",
  PAGES = "729-738",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230181"
}

@article{bb235264,
  AUTHOR = "Sreeja, M.U. and Kovoor, B.C.",
  TITLE = "Towards genre-specific frameworks for video summarisation: A survey",
  JOURNAL = JVCIR,
  VOLUME = "62",
  YEAR = "2019",
  PAGES = "340-358",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230182"
}

@article{bb235265,
  AUTHOR = "Vivekraj, V.K. and Sen, D. and Raman, B.",
  TITLE = "Video Skimming: Taxonomy and Comprehensive Survey",
  JOURNAL = Surveys,
  VOLUME = "52",
  YEAR = "2019",
  NUMBER = "5",
  MONTH = "October",
  PAGES = "Article No 106",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230183"
}

@article{bb235266,
  AUTHOR = "Kumar, K.",
  TITLE = "EVS-DK: Event video skimming using deep keyframe",
  JOURNAL = JVCIR,
  VOLUME = "58",
  YEAR = "2019",
  PAGES = "345-352",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230184"
}

@article{bb235267,
  AUTHOR = "Silva, M.M. and Ramos, W.L.S. and Campos, M.F.M. and Nascimento, E.R.",
  TITLE = "A Sparse Sampling-Based Framework for Semantic Fast-Forward of First-Person Videos",
  JOURNAL = PAMI,
  VOLUME = "43",
  YEAR = "2021",
  NUMBER = "4",
  MONTH = "April",
  PAGES = "1438-1444",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230185"
}

@inproceedings{bb235268,
  AUTHOR = "Silva, M.M. and Ramos, W.L.S. and Ferreira, J.P.K. and Chamone, F. and Campos, M.F.M. and Nascimento, E.R.",
  TITLE = "A Weighted Sparse Sampling and Smoothing Frame Transition Approach for Semantic Fast-Forward First-Person Videos",
  BOOKTITLE = CVPR18,
  YEAR = "2018",
  PAGES = "2383-2392",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230186"
}

@inproceedings{bb235269,
  AUTHOR = "Silva, M.M. and Ramos, W.L.S. and Ferreira, J.P.K. and Campos, M.F.M. and Nascimento, E.R.",
  TITLE = "Towards Semantic Fast-Forward and Stabilized Egocentric Videos",
  BOOKTITLE = Egocentric16,
  YEAR = "2016",
  PAGES = "I: 557-571",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230187"
}

@inproceedings{bb235270,
  AUTHOR = "Ramos, W.L.S. and Silva, M.M. and Campos, M.F.M. and Nascimento, E.R.",
  TITLE = "Fast-forward video based on semantic extraction",
  BOOKTITLE = ICIP16,
  YEAR = "2016",
  PAGES = "3334-3338",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230188"
}

@inproceedings{bb235271,
  AUTHOR = "Ramos, W.L.S. and Silva, M.M. and Araujo, E. and Marcolino, L.S. and Nascimento, E.R.",
  TITLE = "Straight to the Point: Fast-Forwarding Videos via Reinforcement Learning Using Textual Data",
  BOOKTITLE = CVPR20,
  YEAR = "2020",
  PAGES = "10928-10937",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230189"
}

@article{bb235272,
  AUTHOR = "Sun, X.Y. and Wang, H.L. and He, B.",
  TITLE = "MABAN: Multi-Agent Boundary-Aware Network for Natural Language Moment Retrieval",
  JOURNAL = IP,
  VOLUME = "30",
  YEAR = "2021",
  PAGES = "5589-5599",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230190"
}

@article{bb235273,
  AUTHOR = "Lan, S. and Wang, Z. and Wei, E. and Roy Chowdhury, A.K. and Zhu, Q.",
  TITLE = "Collaborative Multi-Agent Video Fast-Forwarding",
  JOURNAL = MultMed,
  VOLUME = "26",
  YEAR = "2024",
  PAGES = "1041-1054",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230191"
}

@inproceedings{bb235274,
  AUTHOR = "Lan, S. and Panda, R. and Zhu, Q. and Roy Chowdhury, A.K.",
  TITLE = "FFNet: Video Fast-Forwarding via Reinforcement Learning",
  BOOKTITLE = CVPR18,
  YEAR = "2018",
  PAGES = "6771-6780",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230192"
}

@inproceedings{bb235275,
  AUTHOR = "Vivekraj, V.K. and Balasubramanian, R. and Sen, D.",
  TITLE = "Vector R-ordering based selection of segments for video skimming",
  BOOKTITLE = ICPR16,
  YEAR = "2016",
  PAGES = "871-876",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230193"
}

@inproceedings{bb235276,
  AUTHOR = "Christel, M.G. and Lin, W.H. and Maher, B.",
  TITLE = "Evaluating audio skimming and frame rate acceleration for summarizing BBC rushes",
  BOOKTITLE = CIVR08,
  YEAR = "2008",
  PAGES = "407-416",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230194"
}

@inproceedings{bb235277,
  AUTHOR = "Sundaram, H. and Chang, S.F.",
  TITLE = "Video skims: taxonomies and an optimal generation framework",
  BOOKTITLE = ICIP02,
  YEAR = "2002",
  PAGES = "II: 21-24",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230195"
}

@inproceedings{bb235278,
  AUTHOR = "Sundaram, H. and Chang, S.F.",
  TITLE = "Constrained Utility Maximizations for Generating Visual Skims",
  BOOKTITLE = CBAIVL01,
  YEAR = "2001",
  PAGES = "124",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230196"
}

% Second author's surname corrected from the misspelling Zbang.
@inproceedings{bb235279,
  AUTHOR = "Ma, Y.F. and Zhang, H.J.",
  TITLE = "A model of motion attention for video skimming",
  BOOKTITLE = ICIP02,
  YEAR = "2002",
  PAGES = "I: 129-132",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230197"
}

@inproceedings{bb235280,
  AUTHOR = "di Lecce, V. and Dimauro, G. and Guerriero, A. and Impedovo, S. and Pirlo, G. and Salzo, A.",
  TITLE = "Image basic features indexing techniques for video skimming",
  BOOKTITLE = CIAP99,
  YEAR = "1999",
  PAGES = "715-720",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230198"
}

% bb235281, bb235282 and bb235283 share one title and one BIBSOURCE anchor
% but name different venues; they are kept as separate records.
@inproceedings{bb235281,
  AUTHOR = "Smith, M.A. and Kanade, T.",
  TITLE = "Video Skimming and Characterization through the Combination of Image and Language Understanding Techniques",
  BOOKTITLE = CVPR97,
  YEAR = "1997",
  PAGES = "775-781",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230199"
}

@inproceedings{bb235282,
  AUTHOR = "Kanade, T. and Smith, M.A.",
  TITLE = "Video Skimming and Characterization through the Combination of Image and Language Understanding Techniques",
  BOOKTITLE = DARPA97,
  YEAR = "1997",
  PAGES = "357-366",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230199"
}

@inproceedings{bb235283,
  AUTHOR = "Kanade, T. and Smith, M.A.",
  TITLE = "Video Skimming and Characterization through the Combination of Image and Language Understanding Techniques",
  BOOKTITLE = CMU-CS-TR,
  YEAR = "1997",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230199"
}

@inproceedings{bb235284,
  AUTHOR = "Smith, M.A. and Kanade, T.",
  TITLE = "Video Skimming for Quick Browsing based on Audio and Image Characterization",
  BOOKTITLE = CMU-CS-TR,
  YEAR = "1995",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vsk1.html#TT230200"
}

% ---- Source page: applicat825vu1.html ----

@article{bb235285,
  AUTHOR = "Brostow, G.J. and Fauqueur, J. and Cipolla, R.",
  TITLE = "Semantic object classes in video: A high-definition ground truth database",
  JOURNAL = PRL,
  VOLUME = "30",
  YEAR = "2009",
  NUMBER = "2",
  MONTH = "January",
  PAGES = "88-97",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vu1.html#TT230202"
}

% First author's compound surname restored; the record previously folded
% the Mac of Mac Aodha into a trailing initial.
@inproceedings{bb235286,
  AUTHOR = "Mac Aodha, O. and Brostow, G.J. and Pollefeys, M.",
  TITLE = "Segmenting video into classes of algorithm-suitability",
  BOOKTITLE = CVPR10,
  YEAR = "2010",
  PAGES = "1054-1061",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vu1.html#TT230203"
}

@article{bb235287,
  AUTHOR = "Suresha, M. and Kuppa, S. and Raghukumar, D.S.",
  TITLE = "A study on deep learning spatiotemporal models and feature extraction techniques for video understanding",
  JOURNAL = MultInfoRetr,
  VOLUME = "9",
  YEAR = "2020",
  NUMBER = "2",
  MONTH = "June",
  PAGES = "81-101",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vu1.html#TT230204"
}

@article{bb235288,
  AUTHOR = "Kavoosifar, M.R. and Apiletti, D. and Baralis, E. and Garza, P. and Huet, B.",
  TITLE = "Effective video hyperlinking by means of enriched feature sets and monomodal query combinations",
  JOURNAL = MultInfoRetr,
  VOLUME = "9",
  YEAR = "2020",
  NUMBER = "3",
  MONTH = "September",
  PAGES = "215-227",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vu1.html#TT230205"
}

@article{bb235289,
  AUTHOR = "Tang, P.J. and Tan, Y.L. and Li, J.Z. and Tan, B.",
  TITLE = "Translating video into language by enhancing visual and language representations",
  JOURNAL = JVCIR,
  VOLUME = "72",
  YEAR = "2020",
  PAGES = "102875",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vu1.html#TT230206"
}

@article{bb235290,
  AUTHOR = "Yu, J. and Jiang, X. and Qin, Z. and Zhang, W. and Hu, Y. and Wu, Q.",
  TITLE = "Learning Dual Encoding Model for Adaptive Visual Understanding in Visual Dialogue",
  JOURNAL = IP,
  VOLUME = "30",
  YEAR = "2021",
  PAGES = "220-233",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vu1.html#TT230207"
}

@article{bb235291,
  AUTHOR = "Duan, J.H. and Xu, H. and Lin, X.Z. and Zhu, S.C. and Du, Y.Z.",
  TITLE = "Multi-semantic long-range dependencies capturing for efficient video representation learning",
  JOURNAL = IVC,
  VOLUME = "104",
  YEAR = "2020",
  PAGES = "103988",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vu1.html#TT230208"
}

@article{bb235292,
  AUTHOR = "Tan, H.L. and Zhu, H.Y. and Lim, J.H. and Tan, C.",
  TITLE = "A comprehensive survey of procedural video datasets",
  JOURNAL = CVIU,
  VOLUME = "202",
  YEAR = "2021",
  PAGES = "103107",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vu1.html#TT230209"
}

@article{bb235293,
  AUTHOR = "Lin, J. and Gan, C. and Wang, K. and Han, S.",
  TITLE = "TSM: Temporal Shift Module for Efficient and Scalable Video Understanding on Edge Devices",
  JOURNAL = PAMI,
  VOLUME = "44",
  YEAR = "2022",
  NUMBER = "5",
  MONTH = "May",
  PAGES = "2760-2774",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vu1.html#TT230210"
}

@inproceedings{bb235294,
  AUTHOR = "Lin, J. and Gan, C. and Han, S.",
  TITLE = "TSM: Temporal Shift Module for Efficient Video Understanding",
  BOOKTITLE = ICCV19,
  YEAR = "2019",
  PAGES = "7082-7092",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vu1.html#TT230211"
}

@article{bb235295,
  AUTHOR = "Zhou, W. and Hou, Y. and Ouyang, K.W. and Zhou, S.L.",
  TITLE = "Exploring complementary information of self-supervised pretext tasks for unsupervised video pre-training",
  JOURNAL = IET-CV,
  VOLUME = "16",
  YEAR = "2022",
  NUMBER = "3",
  PAGES = "255-265",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vu1.html#TT230212"
}

@article{bb235296,
  AUTHOR = "Li, Z.Q. and Wang, W.M. and Li, Z.Y. and Huang, Y.F. and Sato, Y.",
  TITLE = "Spatio-Temporal Perturbations for Video Attribution",
  JOURNAL = CirSysVideo,
  VOLUME = "32",
  YEAR = "2022",
  NUMBER = "4",
  MONTH = "April",
  PAGES = "2043-2056",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vu1.html#TT230213"
}

@article{bb235297,
  AUTHOR = "Tao, L. and Wang, X.T. and Yamasaki, T.",
  TITLE = "An Improved Inter-Intra Contrastive Learning Framework on Self-Supervised Video Representation",
  JOURNAL = CirSysVideo,
  VOLUME = "32",
  YEAR = "2022",
  NUMBER = "8",
  MONTH = "August",
  PAGES = "5266-5280",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vu1.html#TT230214"
}

@article{bb235298,
  AUTHOR = "Huang, L. and Zhang, C. and Zhang, H.Y.",
  TITLE = "Self-Adaptive Training: Bridging Supervised and Self-Supervised Learning",
  JOURNAL = PAMI,
  VOLUME = "46",
  YEAR = "2024",
  NUMBER = "3",
  MONTH = "March",
  PAGES = "1362-1377",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vu1.html#TT230215"
}

@inproceedings{bb235299,
  AUTHOR = "Huang, L. and You, S. and Zheng, M.K. and Wang, F. and Qian, C. and Yamasaki, T.",
  TITLE = "Learning Where to Learn in Cross-View Self-Supervised Learning",
  BOOKTITLE = CVPR22,
  YEAR = "2022",
  PAGES = "14431-14440",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat825vu1.html#TT230216"
}