% RepViT is a single-token model name; the stray space inside it was removed.
@inproceedings{bb158100,
  author    = {Wang, A. and Chen, H. and Lin, Z.J. and Han, J.G. and Ding, G.G.},
  title     = {RepViT: Revisiting Mobile CNN From ViT Perspective},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {15909-15920},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153971}
}

@article{bb158101,
  author    = {Liu, Z. and Zhu, J.C. and Li, N.N. and Huang, G.},
  title     = {Multiple-Exit Tuning: Towards Inference-Efficient Adaptation for Vision Transformer},
  journal   = CirSysVideo,
  volume    = {36},
  year      = {2026},
  number    = {2},
  month     = {February},
  pages     = {2123-2136},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153972}
}

@article{bb158102,
  author    = {Chen, X.Y. and Wang, X.T. and Zhang, W.L. and Kong, X.T. and Qiao, Y. and Zhou, J.T. and Dong, C.},
  title     = {HAT: Hybrid Attention Transformer for Image Restoration},
  journal   = PAMI,
  volume    = {48},
  year      = {2026},
  number    = {3},
  month     = {March},
  pages     = {2676-2694},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153973}
}

@article{bb158103,
  author    = {Li, C. and Su, J. and Gao, J.S.},
  title     = {BiPAZSL: A bidirectional progressive attention method for zero-shot learning domain shift mitigation},
  journal   = PR,
  volume    = {174},
  year      = {2026},
  pages     = {112959},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153974}
}

@article{bb158104,
  author    = {Zhang, T.F. and Li, L. and Zhou, Y. and Liu, W.T. and Qian, C. and Hwang, J.N. and Ji, X.Y.},
  title     = {CAS-ViT: Convolutional Additive Self-Attention Vision Transformers for Efficient Mobile Applications},
  journal   = IP,
  volume    = {35},
  year      = {2026},
  pages     = {1899-1909},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153975}
}

@article{bb158105,
  author    = {Xiao, W.J. and Li, X.Z. and Hu, L. and Hao, Y.X. and Chen, M.},
  title     = {DTSNet: Dynamic Transformer Slimming for Efficient Vision Recognition},
  journal   = MultMed,
  volume    = {28},
  year      = {2026},
  pages     = {1589-1600},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153976}
}

@article{bb158106,
  author    = {Xu, G. and Hao, J.W. and Luo, Y. and Shen, L. and Hu, H. and Zeng, D.},
  title     = {EEformer: Early Exiting for Transformer With Global-Local Exits and Progressive Fine-Tuning},
  journal   = MultMed,
  volume    = {28},
  year      = {2026},
  pages     = {1352-1364},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153977}
}

@article{bb158107,
  author    = {Zhang, Z.W. and Lin, P.X. and Wang, Z.W. and Zhang, Y.Y. and Xu, Z.Q.J.},
  title     = {Complexity Control Facilitates Reasoning-Based Compositional Generalization in Transformers},
  journal   = PAMI,
  volume    = {48},
  year      = {2026},
  number    = {4},
  month     = {April},
  pages     = {4336-4349},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153978}
}

@article{bb158108,
  author    = {Zhou, W.W. and Zhao, S.J. and Liu, Y.Z. and Li, Y.P.},
  title     = {CCTformer: Calibrated Context-Aware Transformer for Correspondence Pruning},
  journal   = SPLetters,
  volume    = {33},
  year      = {2026},
  pages     = {1461-1465},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153979}
}

@inproceedings{bb158109,
  author    = {Nozawa, Y. and Lin, Y.C. and Nakamura, K. and Ng, Y.},
  title     = {Prompt-Guided Attention Head Selection for Focus-Oriented Image Retrieval},
  booktitle = PixFM25,
  year      = {2025},
  pages     = {4131-4141},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153980}
}

@inproceedings{bb158110,
  author    = {Abraham, S.J. and Hauenstein, J.D. and Scheirer, W.J.},
  title     = {Wavelet-Based Mechanistic Interpretability of Vision Transformers via Frequency-Aware Ablations},
  booktitle = InterpVis25,
  year      = {2025},
  pages     = {4830-4834},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153981}
}

@inproceedings{bb158111,
  author    = {Augustin, M. and Sarwar, S.S. and Elhoushi, M. and Li, Y.C. and Zhang, S.Q. and de Salvo, B.},
  title     = {PETAH: Parameter Efficient Task Adaptation for Hybrid Transformers},
  booktitle = MobileAI25,
  year      = {2025},
  pages     = {1858-1868},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153982}
}

% NOTE(review): booktitle here is a literal string, whereas the sibling workshop
% entry bb158156 uses the bare abbreviation FaDE-TCV24 as a macro. Confirm which
% form the shared strings file expects; the literal is kept unchanged.
@inproceedings{bb158112,
  author    = {Ali, M. and Raza, H. and Gan, J.Q. and Haris, M.},
  title     = {Optimising Vision Transformer Performance on Limited Datasets: A Multi-Gradient Approach},
  booktitle = {FaDE-TCV25},
  year      = {2025},
  pages     = {693-702},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153983}
}

@inproceedings{bb158113,
  author    = {Echevarrieta Catalan, N. and Ribas Rodriguez, A. and Cedron, F. and Schwartz, O. and Aguiar Pulido, V.},
  title     = {Enhancing Vision Transformer Explainability using Artificial Astrocytes},
  booktitle = LXCV25,
  year      = {2025},
  pages     = {58-64},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153984}
}

@inproceedings{bb158114,
  author    = {Takatsuki, R. and Joseph, S. and Fujisawa, I. and Kanai, R.},
  title     = {Decoding Vision Transformers: The Diffusion Steering Lens},
  booktitle = InterpVis25,
  year      = {2025},
  pages     = {4819-4824},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153985}
}

@inproceedings{bb158115,
  author    = {He, X. and Quan, Y.H. and Xu, R. and Ji, H.},
  title     = {A Universal Scale-Adaptive Deformable Transformer for Image Restoration across Diverse Artifacts},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {12731-12741},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153986}
}

@inproceedings{bb158116,
  author    = {Fixelle, J.},
  title     = {Hypergraph Vision Transformers: Images are More than Nodes, More than Edges},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {9751-9761},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153987}
}

@inproceedings{bb158117,
  author    = {Ahmed, S. and Arafat, A.A. and Najafi, D. and Mahmood, A. and Rizve, M.N. and Nahian, M.A. and Zhou, R.Y. and Angizi, S. and Rakin, A.S.},
  title     = {DeepCompress-ViT: Rethinking Model Compression to Enhance Efficiency of Vision Transformers at the Edge},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {30147-30156},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153988}
}

@inproceedings{bb158118,
  author    = {Bouniot, Q. and Redko, I. and Mallasto, A. and Laclau, C. and Struckmeier, O. and Arndt, K. and Heinonen, M. and Kyrki, V. and Kaski, S.},
  title     = {From Alexnet to Transformers: Measuring the Non-linearity of Deep Neural Networks with Affine Optimal Transport},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {25250-25260},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153989}
}

@inproceedings{bb158119,
  author    = {Wang, Z.Q. and Xia, X.B. and Chen, R. and Yu, D.D. and Wang, C.H. and Gong, M.M. and Liu, T.L.},
  title     = {LaVin-DiT: Large Vision Diffusion Transformer},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {20060-20070},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153990}
}

@inproceedings{bb158120,
  author    = {Zhou, Y. and Xu, Q.S. and Cui, J. and Zhou, J. and Zhang, J. and Hong, R.C. and Zhang, H.W.},
  title     = {CARE Transformer: Mobile-Friendly Linear Visual Transformer via Decoupled Dual Interaction},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {20135-20145},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153991}
}

@inproceedings{bb158121,
  author    = {Yu, H. and Jiang, T. and Jia, S. and Yan, S.N. and Liu, S.N. and Qian, H.L. and Li, G.H. and Dong, S.T. and Yuan, C.},
  title     = {ComRoPE: Scalable and Robust Rotary Position Embedding Parameterized by Trainable Commuting Angle Matrices},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {4508-4517},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153992}
}

@inproceedings{bb158122,
  author    = {Chen, G.L. and Fu, T.W. and Chen, H.W. and Teng, W.B. and Xiao, H.Y. and Zhao, Y.J.},
  title     = {RDD: Robust Feature Detector and Descriptor using Deformable Transformer},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {6394-6403},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153993}
}

@inproceedings{bb158123,
  author    = {Pardyl, A. and Kurzejamski, G. and Olszewski, J. and Trzcinski, T. and Zielinski, B.},
  title     = {Beyond Grids: Exploring Elastic Input Sampling for Vision Transformers},
  booktitle = WACV25,
  year      = {2025},
  pages     = {8536-8545},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153994}
}

@inproceedings{bb158124,
  author    = {Zhong, Y. and Zhou, Y.},
  title     = {Rethinking Low-Rank Adaptation in Vision: Exploring Head-Level Responsiveness across Diverse Tasks},
  booktitle = WACV25,
  year      = {2025},
  pages     = {7787-7796},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153995}
}

@inproceedings{bb158125,
  author    = {Pipoli, V. and Bolelli, F. and Sarto, S. and Cornia, M. and Baraldi, L. and Grana, C. and Cucchiara, R. and Ficarra, E.},
  title     = {Semantically Conditioned Prompts for Visual Recognition Under Missing Modality Scenarios},
  booktitle = WACV25,
  year      = {2025},
  pages     = {4968-4977},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153996}
}

@inproceedings{bb158126,
  author    = {Go, J. and Ryu, J.B.},
  title     = {Channel Propagation Networks for Refreshable Vision Transformer},
  booktitle = WACV25,
  year      = {2025},
  pages     = {1353-1362},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153997}
}

@inproceedings{bb158127,
  author    = {Nauen, T.C. and Palacio, S. and Raue, F. and Dengel, A.},
  title     = {Which Transformer to Favor: A Comparative Analysis of Efficiency in Vision Transformers},
  booktitle = WACV25,
  year      = {2025},
  pages     = {6955-6966},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153998}
}

@inproceedings{bb158128,
  author    = {Tai, Y.S. and Wu, A.Y.A.},
  title     = {AMP-ViT: Optimizing Vision Transformer Efficiency with Adaptive Mixed-Precision Post-Training Quantization},
  booktitle = WACV25,
  year      = {2025},
  pages     = {6828-6837},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT153999}
}

% Method name casing restored (EcoMatcher); the export had flattened it to title case.
% NOTE(review): confirm the exact casing against the ECCV 2024 proceedings.
@inproceedings{bb158129,
  author    = {Chen, P.Q. and Yu, L. and Wan, Y. and Zhang, Y.J. and Wang, J. and Zhong, L.H. and Chen, J.D. and Yang, M.},
  title     = {EcoMatcher: Efficient Clustering Oriented Matcher for Detector-free Image Matching},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {LXVIII: 344-360},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154000}
}

% Acronym casing restored (SINDER, DINOv2); the export had flattened both to title case.
@inproceedings{bb158130,
  author    = {Wang, H.Q. and Zhang, T. and Salzmann, M.},
  title     = {SINDER: Repairing the Singular Defects of DINOv2},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {VII: 20-35},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154001}
}

% Acronym casing restored (LiFT, ViT); the export had flattened both to title case.
@inproceedings{bb158131,
  author    = {Suri, S. and Walmer, M. and Gupta, K. and Shrivastava, A.},
  title     = {LiFT: A Surprisingly Simple Lightweight Feature Transform for Dense ViT Descriptors},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {VII: 110-128},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154002}
}

% Plural of ViT is written ViTs, consistent with the ViT spelling used elsewhere in this file.
@inproceedings{bb158132,
  author    = {Pan, Z.Z. and Liu, J. and He, H.Y. and Cai, J.F. and Zhuang, B.},
  title     = {Stitched ViTs are Flexible Vision Backbones},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {XLI: 258-274},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154003}
}

% Architecture names restored to their conventional casing (DenseNets, ResNets, ViTs).
@inproceedings{bb158133,
  author    = {Kim, D.H. and Heo, B. and Han, D.Y.},
  title     = {DenseNets Reloaded: Paradigm Shift Beyond ResNets and ViTs},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {III: 395-415},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154004}
}

% Acronym casing restored (LoRA), matching the MTLoRA spelling used elsewhere in this file.
@inproceedings{bb158134,
  author    = {Zhang, C. and Cheng, J. and Li, Q.X.},
  title     = {An Optimal Control View of LoRA and Binary Controller Design for Vision Transformers},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {LIII: 144-160},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154005}
}

@inproceedings{bb158135,
  author    = {Zhang, T. and Bai, J. and Lu, Z. and Lian, D.Z. and Wang, G. and Wang, X.C. and Xia, S.T.},
  title     = {Parameter-efficient and Memory-efficient Tuning for Vision Transformer: A Disentangled Approach},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {XLV: 346-363},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154006}
}

% Model name casing restored (GiT); the export had flattened it to title case.
@inproceedings{bb158136,
  author    = {Wang, H.Y. and Tang, H. and Jiang, L. and Shi, S.S. and Naeem, M.F. and Li, H.S. and Schiele, B. and Wang, L.W.},
  title     = {GiT: Towards Generalist Vision Transformer Through Universal Language Interface},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {XXIX: 55-73},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154007}
}

% Method name casing restored (AdaLog); the export had flattened it to title case.
@inproceedings{bb158137,
  author    = {Wu, Z.G.Y. and Chen, J.X. and Zhong, H. and Huang, D. and Wang, Y.H.},
  title     = {AdaLog: Post-training Quantization for Vision Transformers with Adaptive Logarithm Quantizer},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {XXVII: 411-427},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154008}
}

% Model name casing restored (SpatialFormer); the export had flattened it to title case.
% NOTE(review): confirm the exact casing against the ECCV 2024 proceedings.
@inproceedings{bb158138,
  author    = {Xiao, H. and Zheng, W.Z. and Zuo, S.C. and Gao, P. and Zhou, J. and Lu, J.W.},
  title     = {SpatialFormer: Towards Generalizable Vision Transformers with Explicit Spatial Understanding},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {XIII: 37-54},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154009}
}

@inproceedings{bb158139,
  author    = {Heo, B. and Park, S. and Han, D.Y. and Yun, S.},
  title     = {Rotary Position Embedding for Vision Transformer},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {X: 289-305},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154010}
}

@inproceedings{bb158140,
  author    = {Bellitto, G. and Sortino, R. and Spadaro, P. and Palazzo, S. and Salanitri, F.P. and Fiameni, G. and Gavves, E. and Spampinato, C.},
  title     = {Vito: Vision Transformer Optimization Via Knowledge Distillation On Decoders},
  booktitle = ICIP24,
  year      = {2024},
  pages     = {493-499},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154011}
}

@inproceedings{bb158141,
  author    = {Gani, H. and Saadi, N. and Hussein, N. and Nandakumar, K.},
  title     = {Multi-Attribute Vision Transformers are Efficient and Robust Learners},
  booktitle = ICIP24,
  year      = {2024},
  pages     = {766-772},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154012}
}

@inproceedings{bb158142,
  author    = {Cho, J.H. and Krahenbuhl, P.},
  title     = {Language-Conditioned Detection Transformer},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {16593-16603},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154013}
}

@inproceedings{bb158143,
  author    = {Lin, S. and Lyu, P. and Liu, D.R. and Tang, T. and Liang, X.D. and Song, A. and Chang, X.J.},
  title     = {MLP Can Be a Good Transformer Learner},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {19489-19498},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154014}
}

@inproceedings{bb158144,
  author    = {Weng, H.H. and Huang, D. and Qiao, Y. and Hu, Z. and Lin, C.Y. and Zhang, T. and Chen, C.L.P.},
  title     = {Desigen: A Pipeline for Controllable Design Template Generation},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {12721-12732},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154015}
}

@inproceedings{bb158145,
  author    = {Park, S. and Byun, H.R.},
  title     = {Fair-VPT: Fair Visual Prompt Tuning for Image Classification},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {12268-12278},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154016}
}

@inproceedings{bb158146,
  author    = {Xu, H.Y. and Xiang, L. and Ye, H.Y. and Yao, D. and Chu, P.Z. and Li, B.C.},
  title     = {Permutation Equivariance of Transformers and its Applications},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {5987-5996},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154017}
}

@inproceedings{bb158147,
  author    = {Zhang, Y.Y. and Ding, X.H. and Gong, K.X. and Ge, Y.X. and Shan, Y. and Yue, X.Y.},
  title     = {Multimodal Pathway: Improve Transformers with Irrelevant Data from Other Modalities},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {6108-6117},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154018}
}

@inproceedings{bb158148,
  author    = {Kobayashi, T.},
  title     = {Mean-Shift Feature Transformer},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {6047-6056},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154019}
}

@inproceedings{bb158149,
  author    = {Shi, X.Y. and Hao, Z.C. and Yu, Z.F.},
  title     = {SpikingResformer: Bridging ResNet and Vision Transformer in Spiking Neural Networks},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {5610-5619},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154020}
}

@inproceedings{bb158150,
  author    = {Ye, H.C. and Yu, C. and Ye, P. and Xia, R. and Tang, Y.S. and Lu, J.W. and Chen, T. and Zhang, B.},
  title     = {Once for Both: Single Stage of Importance and Sparsity Search for Vision Transformer Compression},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {5578-5588},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154021}
}

@inproceedings{bb158151,
  author    = {Zhang, J. and Herrmann, C. and Hur, J. and Chen, E. and Jampani, V. and Sun, D.Q. and Yang, M.H.},
  title     = {Telling Left from Right: Identifying Geometry-Aware Semantic Correspondence},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {3076-3085},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154022}
}

@inproceedings{bb158152,
  author    = {Huang, N.C. and Chang, C.C. and Lin, W.C. and Taka, E. and Marculescu, D. and Wu, K.C.A.},
  title     = {ELSA: Exploiting Layer-wise N:M Sparsity for Vision Transformer Acceleration},
  booktitle = ECV24,
  year      = {2024},
  pages     = {8006-8015},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154023}
}

@inproceedings{bb158153,
  author    = {Devulapally, A. and Khan, M.F.F. and Advani, S. and Narayanan, V.},
  title     = {Multi-Modal Fusion of Event and RGB for Monocular Depth Estimation Using a Unified Transformer-based Architecture},
  booktitle = MULA24,
  year      = {2024},
  pages     = {2081-2089},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154024}
}

@inproceedings{bb158154,
  author    = {Yang, Z.D. and Li, Z. and Zeng, A.L. and Li, Z.X. and Yuan, C. and Li, Y.},
  title     = {ViTKD: Feature-based Knowledge Distillation for Vision Transformers},
  booktitle = PBDL24,
  year      = {2024},
  pages     = {1379-1388},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154025}
}

@inproceedings{bb158155,
  author    = {Mehri, F. and Baghshah, M.S. and Pilehvar, M.T.},
  title     = {LibraGrad: Balancing Gradient Flow for Universally Better Vision Transformer Attributions},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {67-78},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154026}
}

@inproceedings{bb158156,
  author    = {Mehri, F. and Fayyaz, M. and Baghshah, M.S. and Pilehvar, M.T.},
  title     = {SkipPLUS: Skip the First Few Layers to Better Explain Vision Transformers},
  booktitle = FaDE-TCV24,
  year      = {2024},
  pages     = {204-215},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154027}
}

@inproceedings{bb158157,
  author    = {Jain, S. and Dutta, T.},
  title     = {Towards Understanding and Improving Adversarial Robustness of Vision Transformers},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {24736-24745},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154028}
}

% Spelling corrected in the title: Transfomers -> Transformers.
% NOTE(review): the proceedings record may itself carry the misspelling; revert
% if this database must match the publisher metadata character for character.
@inproceedings{bb158158,
  author    = {Yang, S. and Bai, J. and Gao, K. and Yang, Y. and Li, Y.M. and Xia, S.T.},
  title     = {Not All Prompts Are Secure: A Switchable Backdoor Attack Against Pre-trained Vision Transformers},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {24431-24441},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154029}
}

@inproceedings{bb158159,
  author    = {Steitz, J.M.O. and Roth, S.},
  title     = {Adapters Strike Back},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {23449-23459},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154030}
}

% The author list previously named Mondal, P. twice in a row; the repeated
% name was removed so each author appears once.
@inproceedings{bb158160,
  author    = {Rangwani, H. and Mondal, P. and Mishra, M. and Asokan, A.R. and Babu, R.V.},
  title     = {DeiT-LT: Distillation Strikes Back for Vision Transformer Training on Long-Tailed Datasets},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {23396-23406},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154031}
}

@inproceedings{bb158161,
  author    = {Liu, J.Y. and Teshome, W. and Ghimire, S. and Sznaier, M. and Camps, O.},
  title     = {Solving Masked Jigsaw Puzzles with Diffusion Vision Transformers*},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {23009-23018},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154032}
}

@inproceedings{bb158162,
  author    = {Kim, M. and Seo, P.H. and Schmid, C. and Cho, M.},
  title     = {Learning Correlation Structures for Vision Transformers},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {18941-18951},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154033}
}

@inproceedings{bb158163,
  author    = {Shi, D.},
  title     = {TransNeXt: Robust Foveal Visual Perception for Vision Transformers},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {17773-17783},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154034}
}

@inproceedings{bb158164,
  author    = {Agiza, A. and Neseem, M. and Reda, S.},
  title     = {MTLoRA: A Low-Rank Adaptation Approach for Efficient Multi-Task Learning},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {16196-16205},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154035}
}

@inproceedings{bb158165,
  author    = {Dong, W. and Zhang, X. and Chen, B. and Yan, D.W. and Lin, Z.J. and Yan, Q. and Wang, P. and Yang, Y.},
  title     = {Low-Rank Rescaled Vision Transformer Fine-Tuning: A Residual Design Approach},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {16101-16110},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154036}
}

@inproceedings{bb158166,
  author    = {Wu, J. and Kang, W.T. and Tang, H. and Hong, Y. and Yan, Y.},
  title     = {On the Faithfulness of Vision Transformer Explanations},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {10936-10945},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154037}
}

@inproceedings{bb158167,
  author    = {Navaneet, K.L. and Koohpayegani, S.A. and Sleiman, E. and Pirsiavash, H.},
  title     = {SlowFormer: Adversarial Attack on Compute and Energy Consumption of Efficient Vision Transformers},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {24786-24797},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154038}
}

@inproceedings{bb158168,
  author    = {Koyun, O.C. and Toreyin, B.U.},
  title     = {HaLViT: Half of the Weights are Enough},
  booktitle = LargeVM24,
  year      = {2024},
  pages     = {3669-3678},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154039}
}

@inproceedings{bb158169,
  author    = {Bafghi, R.A. and Harilal, N. and Monteleoni, C. and Raissi, M.},
  title     = {Parameter Efficient Fine-tuning of Self-supervised ViTs without Catastrophic Forgetting},
  booktitle = LargeVM24,
  year      = {2024},
  pages     = {3679-3684},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154040}
}

% NOTE(review): this entry has the same title, venue macro and bibsource anchor
% as bb158169, with the author order reversed and a different page range.
% It may be a duplicate or an alternate listing of the same paper; verify
% before citing both. All values are kept unchanged.
@inproceedings{bb158170,
  author    = {Raissi, M. and Monteleoni, C. and Harilal, N. and Bafghi, R.A.},
  title     = {Parameter Efficient Fine-tuning of Self-supervised ViTs without Catastrophic Forgetting},
  booktitle = LargeVM24,
  year      = {2024},
  pages     = {7864-7869},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154040}
}

@inproceedings{bb158171,
  author    = {Edalati, A. and Hameed, M.G.A. and Mosleh, A.},
  title     = {Generalized Kronecker-based Adapters for Parameter-efficient Fine-tuning of Vision Transformers},
  booktitle = CRV23,
  year      = {2023},
  pages     = {97-104},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154041}
}

@inproceedings{bb158172,
  author    = {Marouf, I.E. and Tartaglione, E. and Lathuiliere, S.},
  title     = {Mini but Mighty: Finetuning ViTs with Mini Adapters},
  booktitle = WACV24,
  year      = {2024},
  pages     = {1721-1730},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154042}
}

@inproceedings{bb158173,
  author    = {Kim, G. and Kim, J. and Lee, J.S.},
  title     = {Exploring Adversarial Robustness of Vision Transformers in the Spectral Perspective},
  booktitle = WACV24,
  year      = {2024},
  pages     = {3964-3973},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154043}
}

@inproceedings{bb158174,
  author    = {Han, Q. and Zhang, G.J. and Huang, J.X. and Gao, P. and Wei, Z. and Lu, S.J.},
  title     = {Efficient MAE towards Large-Scale Vision Transformers},
  booktitle = WACV24,
  year      = {2024},
  pages     = {595-604},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154044}
}

@inproceedings{bb158175,
  author    = {Park, J.W. and Kahatapitiya, K. and Kim, D.H. and Sudalairaj, S. and Fan, Q.F. and Ryoo, M.S.},
  title     = {Grafting Vision Transformers},
  booktitle = WACV24,
  year      = {2024},
  pages     = {1134-1143},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154045}
}

@inproceedings{bb158176,
  author    = {Shimizu, S. and Tamaki, T.},
  title     = {Joint learning of images and videos with a single Vision Transformer},
  booktitle = MVA23,
  year      = {2023},
  pages     = {1-6},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154046}
}

@inproceedings{bb158177,
  author    = {Chen, M.Z. and Lin, M. and Lin, Z.H. and Zhang, Y.X. and Chao, F. and Ji, R.R.},
  title     = {SMMix: Self-Motivated Image Mixing for Vision Transformers},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {17214-17224},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154047}
}

@inproceedings{bb158178,
  author    = {Kim, D. and Angelova, A. and Kuo, W.C.},
  title     = {Contrastive Feature Masking Open-Vocabulary Vision Transformer},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {15556-15566},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154048}
}

@inproceedings{bb158179,
  author    = {Li, Z.K. and Gu, Q.Y.},
  title     = {I-ViT: Integer-only Quantization for Efficient Vision Transformer Inference},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {17019-17029},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154049}
}

@inproceedings{bb158180,
  author    = {Frumkin, N. and Gope, D. and Marculescu, D.},
  title     = {Jumping through Local Minima: Quantization in the Loss Landscape of Vision Transformers},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {16932-16942},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154050}
}

@inproceedings{bb158181,
  author    = {Li, Z.K. and Xiao, J.R. and Yang, L.W. and Gu, Q.Y.},
  title     = {RepQ-ViT: Scale Reparameterization for Post-Training Quantization of Vision Transformers},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {17181-17190},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154051}
}

@inproceedings{bb158182,
  author    = {Wang, X. and Chu, X.J. and Han, C. and Zhang, X.Y.},
  title     = {SCSC: Spatial Cross-scale Convolution Module to Strengthen both CNNs and Transformers},
  booktitle = NIVT23,
  year      = {2023},
  pages     = {731-741},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154052}
}

@inproceedings{bb158183,
  author    = {Chen, Y.H. and Weng, Y.C. and Kao, C.H. and Chien, C. and Chiu, W.C. and Peng, W.H.},
  title     = {TransTIC: Transferring Transformer-based Image Compression from Human Perception to Machine Perception},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {23240-23250},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154053}
}

@inproceedings{bb158184,
  author    = {Li, Y.Y. and Hu, J. and Wen, Y. and Evangelidis, G. and Salahi, K. and Wang, Y.Z. and Tulyakov, S. and Ren, J.},
  title     = {Rethinking Vision Transformers for {MobileNet} Size and Speed},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {16843-16854},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154054},
}

@inproceedings{bb158185,
  author    = {Nurgazin, M. and Tu, N.A.},
  title     = {A Comparative Study of Vision Transformer Encoders and Few-shot Learning for Medical Image Classification},
  booktitle = CVAMD23,
  year      = {2023},
  pages     = {2505-2513},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154055},
}

@inproceedings{bb158186,
  author    = {Vasu, P.K.A. and Gabriel, J. and Zhu, J. and Tuzel, O. and Ranjan, A.},
  title     = {{FastViT}: A Fast Hybrid Vision Transformer using Structural Reparameterization},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {5762-5772},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154056},
}

@inproceedings{bb158187,
  author    = {Tang, C. and Zhang, L.L. and Jiang, H.Q. and Xu, J.H. and Cao, T. and Zhang, Q. and Yang, Y.Q. and Wang, Z. and Yang, M.},
  title     = {{ElasticViT}: Conflict-aware Supernet Training for Deploying Fast Vision Transformer on Diverse Mobile Devices},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {5806-5817},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154057},
}

@inproceedings{bb158188,
  author    = {Lin, W.F. and Wu, Z.H. and Chen, J.Y. and Huang, J. and Jin, L.W.},
  title     = {Scale-Aware Modulation Meet Transformer},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {5992-6003},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154058},
}

@inproceedings{bb158189,
  author    = {He, Y.F. and Lou, Z.Y. and Zhang, L. and Liu, J. and Wu, W.J. and Zhou, H. and Zhuang, B.},
  title     = {{BiViT}: Extremely Compressed Binary Vision Transformers},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {5628-5640},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154059},
}

@inproceedings{bb158190,
  author    = {Dutson, M. and Li, Y. and Gupta, M.},
  title     = {Eventful Transformers: Leveraging Temporal Redundancy in Vision Transformers},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {16865-16877},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154060},
}

@inproceedings{bb158191,
  author    = {Wang, Z.Q. and Fang, Y.T. and Cao, J.H. and Zhang, Q. and Wang, Z. and Xu, R.},
  title     = {Masked Spiking Transformer},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {1761-1771},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154061},
}

@inproceedings{bb158192,
  author    = {Peebles, W. and Xie, S.},
  title     = {Scalable Diffusion Models with Transformers},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {4172-4182},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154062},
}

@inproceedings{bb158193,
  author    = {Mentzer, F. and Agustsson, E. and Tschannen, M.},
  title     = {{M2T}: Masking Transformers Twice for Faster Decoding},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {5317-5326},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154063},
}

@inproceedings{bb158194,
  author    = {Yu, R.Y. and Wang, Z.N. and Wang, Y.H. and Li, K. and Liu, C. and Duan, H.Y. and Ji, X.Y. and Chen, J.},
  title     = {{LaPE}: Layer-adaptive Position Embedding for Vision Transformers with Independent Layer Normalization},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {5863-5873},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154064},
}

@inproceedings{bb158195,
  author    = {Roy, A. and Verma, V.K. and Voonna, S. and Ghosh, K. and Ghosh, S. and Das, A.},
  title     = {Exemplar-Free Continual Transformer with Convolutions},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {5874-5884},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154065},
}

@inproceedings{bb158196,
  author    = {Xu, Y.X. and Li, C. and Li, D. and Sheng, X. and Jiang, F. and Tian, L. and Sirasao, A.},
  title     = {{FDViT}: Improve the Hierarchical Architecture of Vision Transformer},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {5927-5937},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154066},
}

@inproceedings{bb158197,
  author    = {Chen, Y.J. and Liu, H.M. and Yin, H.R. and Fan, B.},
  title     = {Building Vision Transformers with Hierarchy Aware Feature Aggregation},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {5885-5895},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154067},
}

@inproceedings{bb158198,
  author    = {Qu{\'e}tu, V. and Milovanovi{\'c}, M. and Tartaglione, E.},
  title     = {Sparse Double Descent in Vision Transformers: Real or Phantom Threat?},
  booktitle = CIAP23,
  year      = {2023},
  pages     = {II:490-502},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154068},
}

@inproceedings{bb158199,
  author    = {Ak, K.E. and Lee, G.G. and Xu, Y. and Shen, M.W.},
  title     = {Leveraging Efficient Training and Feature Fusion in Transformers for Multimodal Classification},
  booktitle = ICIP23,
  year      = {2023},
  pages     = {1420-1424},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154069},
}

Last update:May 24, 2026 at 14:46:09