@inproceedings{bb158800,
        AUTHOR = "Webb, A.R. and Shannon, S.",
        TITLE = "Adaptive Radial Basis Functions",
        BOOKTITLE = ICPR96,
        YEAR = "1996",
        PAGES = "IV: 630--634",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT154668"}

@inproceedings{bb158801,
        AUTHOR = "Webb, A.R.",
        TITLE = "Nonlinear Feature Extraction with Radial Basis Functions Using a Weighted Multidimensional Scaling Stress Measure",
        BOOKTITLE = ICPR96,
        YEAR = "1996",
        PAGES = "IV: 635--639",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT154669"}

@article{bb158802,
  author    = {Bazi, Y. and Bashmal, L. and Al Rahhal, M.M. and Al Dayil, R. and Al Ajlan, N.},
  title     = {Vision Transformers for Remote Sensing Image Classification},
  journal   = RS,
  year      = {2021},
  volume    = {13},
  number    = {3},
  pages     = {xx-yy},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154670},
}

@article{bb158803,
        AUTHOR = "Li, T. and Zhang, Z. and Pei, L. and Gan, Y.",
        TITLE = "{HashFormer}: Vision Transformer Based Deep Hashing for Image Retrieval",
        JOURNAL = SPLetters,
        VOLUME = "29",
        YEAR = "2022",
        PAGES = "827--831",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154671"}

@article{bb158804,
        AUTHOR = "Chen, Z.M. and Cui, Q. and Zhao, B. and Song, R.J. and Zhang, X.Q. and Yoshie, O.",
        TITLE = "{SST}: Spatial and Semantic Transformers for Multi-Label Image Recognition",
        JOURNAL = IP,
        VOLUME = "31",
        YEAR = "2022",
        PAGES = "2570--2583",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154672"}

@article{bb158805,
  author    = {Wang, G.H. and Li, B. and Zhang, T. and Zhang, S.},
  title     = {A Network Combining a Transformer and a Convolutional Neural Network for Remote Sensing Image Change Detection},
  journal   = RS,
  year      = {2022},
  volume    = {14},
  number    = {9},
  pages     = {xx-yy},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154673},
}

@article{bb158806,
        AUTHOR = "Luo, G. and Zhou, Y. and Sun, X.S. and Wang, Y. and Cao, L.J. and Wu, Y.J. and Huang, F.Y. and Ji, R.R.",
        TITLE = "Towards Lightweight Transformer Via Group-Wise Transformation for Vision-and-Language Tasks",
        JOURNAL = IP,
        VOLUME = "31",
        YEAR = "2022",
        PAGES = "3386--3398",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154674"}

@article{bb158807,
        AUTHOR = "Zhong, Y.S. and Hu, J.W. and Lin, M. and Chen, M.Z. and Ji, R.R.",
        TITLE = "{I\&S-ViT}: An Inclusive \& Stable Method for Post-Training {ViTs} Quantization",
        JOURNAL = PAMI,
        VOLUME = "48",
        YEAR = "2026",
        NUMBER = "2",
        MONTH = feb,
        PAGES = "1063--1080",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154675"}

@article{bb158808,
        AUTHOR = "Wang, J.Y. and Chakraborty, R. and Yu, S.X.",
        TITLE = "Transformer for {3D} Point Clouds",
        JOURNAL = PAMI,
        VOLUME = "44",
        YEAR = "2022",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "4419--4431",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154676"}

@article{bb158809,
  author    = {Wu, J.J. and Wei, Z.Q. and Zhang, J.P. and Zhang, Y.S. and Jia, D.N. and Yin, B. and Yu, Y.C.},
  title     = {Full-Coupled Convolutional Transformer for Surface-Based Duct Refractivity Inversion},
  journal   = RS,
  year      = {2022},
  volume    = {14},
  number    = {17},
  pages     = {xx-yy},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154677},
}

@article{bb158810,
  author    = {Jiang, K. and Peng, P. and Lian, Y.Z. and Xu, W.S.},
  title     = {The encoding method of position embeddings in vision transformer},
  journal   = JVCIR,
  year      = {2022},
  volume    = {89},
  pages     = {103664},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154678},
}

@article{bb158811,
        AUTHOR = "Han, K. and Wang, Y.H. and Chen, H.T. and Chen, X.H. and Guo, J.Y. and Liu, Z.H. and Tang, Y.H. and Xiao, A. and Xu, C.J. and Xu, Y.X. and Yang, Z.H. and Zhang, Y. and Tao, D.C.",
        TITLE = "A Survey on Vision Transformer",
        JOURNAL = PAMI,
        VOLUME = "45",
        YEAR = "2023",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "87--110",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154679"}

@article{bb158812,
        AUTHOR = "Hou, Q. and Jiang, Z.H. and Yuan, L. and Cheng, M.M. and Yan, S.C. and Feng, J.S.",
        TITLE = "Vision Permutator: A Permutable {MLP}-Like Architecture for Visual Recognition",
        JOURNAL = PAMI,
        VOLUME = "45",
        YEAR = "2023",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "1328--1334",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154680"}

@article{bb158813,
        AUTHOR = "Yu, W.H. and Si, C.Y. and Zhou, P. and Luo, M. and Zhou, Y.C. and Feng, J.S. and Yan, S.C. and Wang, X.C.",
        TITLE = "{MetaFormer} Baselines for Vision",
        JOURNAL = PAMI,
        VOLUME = "46",
        YEAR = "2024",
        NUMBER = "2",
        MONTH = feb,
        PAGES = "896--912",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154681"}

@inproceedings{bb158814,
        AUTHOR = "Yu, W.H. and Luo, M. and Zhou, P. and Si, C.Y. and Zhou, Y.C. and Wang, X.C. and Feng, J.S. and Yan, S.C.",
        TITLE = "{MetaFormer} is Actually What You Need for Vision",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "10809--10819",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154682"}

@article{bb158815,
        AUTHOR = "Yuan, L. and Hou, Q. and Jiang, Z.H. and Feng, J.S. and Yan, S.C.",
        TITLE = "{VOLO}: Vision Outlooker for Visual Recognition",
        JOURNAL = PAMI,
        VOLUME = "45",
        YEAR = "2023",
        NUMBER = "5",
        MONTH = may,
        PAGES = "6575--6586",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154683"}

@article{bb158816,
        AUTHOR = "Wu, Y.H. and Liu, Y. and Zhan, X. and Cheng, M.M.",
        TITLE = "{P2T}: Pyramid Pooling Transformer for Scene Understanding",
        JOURNAL = PAMI,
        VOLUME = "45",
        YEAR = "2023",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "12760--12771",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154684"}

@article{bb158817,
        AUTHOR = "Wang, H. and Du, Y.T. and Zhang, Y.B. and Li, S. and Zhang, L.",
        TITLE = "One-Stage Visual Relationship Referring With Transformers and Adaptive Message Passing",
        JOURNAL = IP,
        VOLUME = "32",
        YEAR = "2023",
        PAGES = "190--202",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154685"}

@article{bb158818,
        AUTHOR = "Kiya, H. and Iijima, R. and Maungmaung, A. and Kinoshita, Y.",
        TITLE = "Image and Model Transformation with Secret Key for Vision Transformer",
        JOURNAL = IEICE,
        VOLUME = "E106-D",
        YEAR = "2023",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "2--11",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154686"}

@article{bb158819,
        AUTHOR = "Li, Y. and Chen, K. and Sun, S.L. and He, C.",
        TITLE = "Multi-scale homography estimation based on dual feature aggregation transformer",
        JOURNAL = IET-IPR,
        VOLUME = "17",
        YEAR = "2023",
        NUMBER = "5",
        PAGES = "1403--1416",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154687"}

@article{bb158820,
        AUTHOR = "Wang, G.Q. and Chen, H. and Chen, L. and Zhuang, Y. and Zhang, S.H. and Zhang, T. and Dong, H. and Gao, P.",
        TITLE = "{P2FEViT}: Plug-and-Play {CNN} Feature Embedded Hybrid Vision Transformer for Remote Sensing Image Classification",
        JOURNAL = RS,
        VOLUME = "15",
        YEAR = "2023",
        NUMBER = "7",
        PAGES = "1773",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154688"}

@article{bb158821,
        AUTHOR = "Zhang, Q.M. and Xu, Y.F. and Zhang, J. and Tao, D.C.",
        TITLE = "{ViTAEv2}: Vision Transformer Advanced by Exploring Inductive Bias for Image Recognition and Beyond",
        JOURNAL = IJCV,
        VOLUME = "131",
        YEAR = "2023",
        NUMBER = "5",
        MONTH = may,
        PAGES = "1141--1162",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154689"}

@article{bb158822,
        AUTHOR = "Zhang, J.N. and Li, X.T. and Wang, Y.B. and Wang, C.J. and Yang, Y.B. and Liu, Y. and Tao, D.C.",
        TITLE = "{EATFormer}: Improving Vision Transformer Inspired by Evolutionary Algorithm",
        JOURNAL = IJCV,
        VOLUME = "132",
        YEAR = "2024",
        NUMBER = "9",
        MONTH = sep,
        PAGES = "3509--3536",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154690"}

@article{bb158823,
        AUTHOR = "Fan, X.Y. and Liu, H.J.",
        TITLE = "{FlexFormer}: Flexible Transformer for efficient visual recognition",
        JOURNAL = PRL,
        VOLUME = "169",
        YEAR = "2023",
        PAGES = "95--101",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154691"}

@article{bb158824,
        AUTHOR = "Cho, S. and Hong, S. and Kim, S.",
        TITLE = "{CATs++}: Boosting Cost Aggregation With Convolutions and Transformers",
        JOURNAL = PAMI,
        VOLUME = "45",
        YEAR = "2023",
        NUMBER = "6",
        MONTH = jun,
        PAGES = "7174--7194",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154692"}

@inproceedings{bb158825,
        AUTHOR = "Yue, X.Y. and Sun, S.Y. and Kuang, Z.H. and Wei, M. and Torr, P.H.S. and Zhang, W. and Lin, D.",
        TITLE = "Vision Transformer with Progressive Sampling",
        BOOKTITLE = ICCV21,
        YEAR = "2021",
        PAGES = "377--386",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154693"}

@article{bb158826,
  author    = {Huang, X.Y. and Liu, F. and Cui, Y.H. and Chen, P. and Li, L.L. and Li, P.F.},
  title     = {Faster and Better: A Lightweight Transformer Network for Remote Sensing Scene Classification},
  journal   = RS,
  year      = {2023},
  volume    = {15},
  number    = {14},
  pages     = {3645},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154694},
}

@article{bb158827,
        AUTHOR = "Zhao, J.X. and Jiao, L.C. and Wang, C. and Liu, X. and Liu, F. and Li, L.L. and Ma, M. and Yang, S.Y.",
        TITLE = "Knowledge Guided Evolutionary Transformer for Remote Sensing Scene Classification",
        JOURNAL = CirSysVideo,
        VOLUME = "34",
        YEAR = "2024",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "10368--10384",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154695"}

@article{bb158828,
  author    = {Zhang, D. and Ma, W.P. and Jiao, L.C. and Liu, X. and Yang, Y.T. and Liu, F.},
  title     = {Multiple Hierarchical Cross-Scale Transformer for Remote Sensing Scene Classification},
  journal   = RS,
  year      = {2025},
  volume    = {17},
  number    = {1},
  pages     = {42},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154696},
}

@article{bb158829,
        AUTHOR = "Yao, T. and Li, Y. and Pan, Y.W. and Wang, Y. and Zhang, X.P. and Mei, T.",
        TITLE = "Dual Vision Transformer",
        JOURNAL = PAMI,
        VOLUME = "45",
        YEAR = "2023",
        NUMBER = "9",
        MONTH = sep,
        PAGES = "10870--10882",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154697"}

@article{bb158830,
        AUTHOR = "Rao, Y.M. and Liu, Z. and Zhao, W.L. and Zhou, J. and Lu, J.W.",
        TITLE = "Dynamic Spatial Sparsification for Efficient Vision Transformers and Convolutional Neural Networks",
        JOURNAL = PAMI,
        VOLUME = "45",
        YEAR = "2023",
        NUMBER = "9",
        MONTH = sep,
        PAGES = "10883--10897",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154698"}

@article{bb158831,
        AUTHOR = "Li, J. and Liu, Z. and Li, L. and Lin, J.Q. and Yao, J. and Tu, J.",
        TITLE = "Multi-view convolutional vision transformer for {3D} object recognition",
        JOURNAL = JVCIR,
        VOLUME = "95",
        YEAR = "2023",
        PAGES = "103906",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154699"}

@article{bb158832,
        AUTHOR = "Shang, J.H. and Li, X. and Kahatapitiya, K. and Lee, Y.C. and Ryoo, M.S.",
        TITLE = "{StARformer}: Transformer With State-Action-Reward Representations for Robot Learning",
        JOURNAL = PAMI,
        VOLUME = "45",
        YEAR = "2023",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "12862--12877",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154700"}

@inproceedings{bb158833,
        AUTHOR = "Shang, J.H. and Kahatapitiya, K. and Li, X. and Ryoo, M.S.",
        TITLE = "{StARformer}: Transformer with State-Action-Reward Representations for Visual Reinforcement Learning",
        BOOKTITLE = ECCV22,
        YEAR = "2022",
        PAGES = "XXIX:462--479",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154701"}

@article{bb158834,
        AUTHOR = "Duan, H.R. and Long, Y. and Wang, S.D. and Zhang, H.F. and Willcocks, C.G. and Shao, L.",
        TITLE = "Dynamic Unary Convolution in Transformers",
        JOURNAL = PAMI,
        VOLUME = "45",
        YEAR = "2023",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "12747--12759",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154702"}

@article{bb158835,
        AUTHOR = "Sun, W.X. and Qin, Z. and Deng, H. and Wang, J.Y. and Zhang, Y. and Zhang, K. and Barnes, N. and Birchfield, S. and Kong, L.P. and Zhong, Y.R.",
        TITLE = "Vicinity Vision Transformer",
        JOURNAL = PAMI,
        VOLUME = "45",
        YEAR = "2023",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "12635--12649",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154703"}

@article{bb158836,
        AUTHOR = "Cao, C.J. and Dong, Q.L. and Fu, Y.W.",
        TITLE = "{ZITS++}: Image Inpainting by Improving the Incremental Transformer on Structural Priors",
        JOURNAL = PAMI,
        VOLUME = "45",
        YEAR = "2023",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "12667--12684",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154704"}

@article{bb158837,
        AUTHOR = "Fang, Y.X. and Wang, X.G. and Wu, R. and Liu, W.Y.",
        TITLE = "What Makes for Hierarchical Vision Transformer?",
        JOURNAL = PAMI,
        VOLUME = "45",
        YEAR = "2023",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "12714--12720",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154705"}

@article{bb158838,
  author    = {Liu, J. and Guo, H.R. and He, Y. and Li, H.L.},
  title     = {Vision Transformer-Based Ensemble Learning for Hyperspectral Image Classification},
  journal   = RS,
  year      = {2023},
  volume    = {15},
  number    = {21},
  pages     = {5208},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154706},
}

@article{bb158839,
        AUTHOR = "Lin, M.B. and Chen, M.Z. and Zhang, Y.X. and Shen, C.H. and Ji, R.R. and Cao, L.J.",
        TITLE = "Super Vision Transformer",
        JOURNAL = IJCV,
        VOLUME = "131",
        YEAR = "2023",
        NUMBER = "12",
        MONTH = dec,
        PAGES = "3136--3151",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154707"}

@article{bb158840,
        AUTHOR = "Li, Z.Y. and Gao, S.H. and Cheng, M.M.",
        TITLE = "{SERE}: Exploring Feature Self-Relation for Self-Supervised Transformer",
        JOURNAL = PAMI,
        VOLUME = "45",
        YEAR = "2023",
        NUMBER = "12",
        MONTH = dec,
        PAGES = "15619--15631",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154708"}

@article{bb158841,
        AUTHOR = "Yuan, Y.H. and Liang, W.C. and Ding, H.H. and Liang, Z.H. and Zhang, C. and Hu, H.",
        TITLE = "Expediting Large-Scale Vision Transformer for Dense Prediction Without Fine-Tuning",
        JOURNAL = PAMI,
        VOLUME = "46",
        YEAR = "2024",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "250--266",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154709"}

@article{bb158842,
        AUTHOR = "Jiao, J.Y. and Tang, Y.M. and Lin, K.Y. and Gao, Y.P. and Ma, A.J. and Wang, Y.W. and Zheng, W.S.",
        TITLE = "{DilateFormer}: Multi-Scale Dilated Transformer for Visual Recognition",
        JOURNAL = MultMed,
        VOLUME = "25",
        YEAR = "2023",
        PAGES = "8906--8919",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154710"}

@article{bb158843,
        AUTHOR = "Ghosal, S.S. and Li, Y.X.",
        TITLE = "Are Vision Transformers Robust to Spurious Correlations?",
        JOURNAL = IJCV,
        VOLUME = "132",
        YEAR = "2024",
        NUMBER = "3",
        MONTH = mar,
        PAGES = "689--709",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154711"}

@article{bb158844,
  author    = {Nguyen, H. and Kim, C. and Li, F.},
  title     = {Space-time recurrent memory network},
  journal   = CVIU,
  year      = {2024},
  volume    = {241},
  pages     = {103943},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154712},
}

@inproceedings{bb158845,
        AUTHOR = "Kheldouni, A. and Boumhidi, J.",
        TITLE = "A Study of Bidirectional Encoder Representations from Transformers for Sequential Recommendations",
        BOOKTITLE = ISCV22,
        YEAR = "2022",
        PAGES = "1--5",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154713"}

@article{bb158846,
        AUTHOR = "Xiao, Q. and Zhang, Y. and Yang, Q.",
        TITLE = "Selective Random Walk for Transfer Learning in Heterogeneous Label Spaces",
        JOURNAL = PAMI,
        VOLUME = "46",
        YEAR = "2024",
        NUMBER = "6",
        MONTH = jun,
        PAGES = "4476--4488",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154714"}

@article{bb158847,
  author    = {Akkaya, I.B. and Kathiresan, S.S. and Arani, E. and Zonooz, B.},
  title     = {Enhancing performance of vision transformers on small datasets through local inductive bias incorporation},
  journal   = PR,
  year      = {2024},
  volume    = {153},
  pages     = {110510},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154715},
}

@article{bb158848,
        AUTHOR = "Yao, T. and Li, Y. and Pan, Y.W. and Mei, T.",
        TITLE = "{HIRI-ViT}: Scaling Vision Transformer With High Resolution Inputs",
        JOURNAL = PAMI,
        VOLUME = "46",
        YEAR = "2024",
        NUMBER = "9",
        MONTH = sep,
        PAGES = "6431--6442",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154716"}

@article{bb158849,
        AUTHOR = "Xu, G.Y. and Ye, J.Y. and Liu, X.Y. and Wen, X.B. and Li, Y. and Wang, J.J.",
        TITLE = "{LV-Adapter}: Adapting Vision Transformers for Visual Classification with Linear-layers and Vectors",
        JOURNAL = CVIU,
        VOLUME = "246",
        YEAR = "2024",
        PAGES = "104049",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154717"}

@article{bb158850,
        AUTHOR = "Yan, L.Q. and Yan, R.X. and Chai, B. and Geng, G.H. and Zhou, P.B. and Gao, J.",
        TITLE = "{DM-GAN}: {CNN} hybrid vits for training {GANs} under limited data",
        JOURNAL = PR,
        VOLUME = "156",
        YEAR = "2024",
        PAGES = "110810",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154718"}

@article{bb158851,
        AUTHOR = "Feng, Q.H. and Li, P.Y. and Lu, Z.X. and Li, C.Z. and Wang, Z. and Liu, Z.Q. and Duan, C.H. and Huang, F. and Weng, J. and Yu, P.S.",
        TITLE = "{EViT}: Privacy-Preserving Image Retrieval via Encrypted Vision Transformer in Cloud Computing",
        JOURNAL = CirSysVideo,
        VOLUME = "34",
        YEAR = "2024",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "7467--7483",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154719"}

@article{bb158852,
        AUTHOR = "Wang, H.Y. and Ma, S.M. and Dong, L. and Huang, S. and Zhang, D.D. and Wei, F.",
        TITLE = "{DeepNet}: Scaling Transformers to 1,000 Layers",
        JOURNAL = PAMI,
        VOLUME = "46",
        YEAR = "2024",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "6761--6774",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154720"}

@article{bb158853,
        AUTHOR = "Papa, L. and Russo, P. and Amerini, I. and Zhou, L.P.",
        TITLE = "A Survey on Efficient Vision Transformers: Algorithms, Techniques, and Performance Benchmarking",
        JOURNAL = PAMI,
        VOLUME = "46",
        YEAR = "2024",
        NUMBER = "12",
        MONTH = dec,
        PAGES = "7682--7700",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154721"}

@article{bb158854,
        AUTHOR = "Hu, S.C. and Shen, L. and Zhang, Y. and Chen, Y.X. and Tao, D.C.",
        TITLE = "On Transforming Reinforcement Learning With Transformers: The Development Trajectory",
        JOURNAL = PAMI,
        VOLUME = "46",
        YEAR = "2024",
        NUMBER = "12",
        MONTH = dec,
        PAGES = "8580--8599",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154722"}

@article{bb158855,
        AUTHOR = "Xu, R.S. and Chen, C.J. and Tu, Z.Z. and Yang, M.H.",
        TITLE = "{V2X-ViTv2}: Improved Vision Transformers for Vehicle-to-Everything Cooperative Perception",
        JOURNAL = PAMI,
        VOLUME = "47",
        YEAR = "2025",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "650--662",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154723"}

@inproceedings{bb158856,
        AUTHOR = "Xu, R.S. and Xiang, H. and Tu, Z.Z. and Xia, X. and Yang, M.H. and Ma, J.Q.",
        TITLE = "{V2X-ViT}: Vehicle-to-Everything Cooperative Perception with Vision Transformer",
        BOOKTITLE = ECCV22,
        YEAR = "2022",
        PAGES = "XXIX:107--124",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154724"}

@inproceedings{bb158857,
        AUTHOR = "Xiang, H. and Zheng, Z.L. and Xia, X. and Xu, R.S. and Gao, L. and Zhou, Z.W. and Han, X. and Ji, X. and Li, M.X. and Meng, Z.L. and Jin, L. and Lei, M.Y. and Ma, Z.Y. and He, Z.H. and Ma, H.X. and Yuan, Y.S. and Zhao, Y.Q. and Ma, J.Q.",
        TITLE = "{V2X-Real}: A Large-scale Dataset for Vehicle-to-everything Cooperative Perception",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "LII: 455--470",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154725"}

@inproceedings{bb158858,
        AUTHOR = "Xiang, H. and Xu, R.S. and Ma, J.Q.",
        TITLE = "{HM-ViT}: Hetero-modal Vehicle-to-Vehicle Cooperative Perception with Vision Transformer",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "284--295",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154726"}

@article{bb158859,
        AUTHOR = "Ma, X. and Zhang, Z. and Yu, R. and Ji, Z. and Li, M.C. and Zhang, Y.H. and Chen, Q.",
        TITLE = "{SAVE}: Encoding spatial interactions for vision transformers",
        JOURNAL = IVC,
        VOLUME = "152",
        YEAR = "2024",
        PAGES = "105312",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154727"}

@article{bb158860,
        AUTHOR = "Xiao, J. and Li, Z.K. and Li, J.Q. and Yang, L.W. and Gu, Q.Y.",
        TITLE = "{BinaryViT}: Toward Efficient and Accurate Binary Vision Transformers",
        JOURNAL = CirSysVideo,
        VOLUME = "35",
        YEAR = "2025",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "195--206",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154728"}

@article{bb158861,
        AUTHOR = "Mao, C.X. and Li, J. and Hu, T. and Zhao, X.Y.",
        TITLE = "{CMVT}: {ConVit} Transformer Network Recombined with Convolutional Layer",
        JOURNAL = IJIG,
        VOLUME = "25",
        YEAR = "2025",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "2450060",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154729"}

@article{bb158862,
        AUTHOR = "Zhong, Y.S. and Huang, Y. and Hu, J.W. and Zhang, Y.X. and Ji, R.R.",
        TITLE = "Towards Accurate Post-Training Quantization of Vision Transformers via Error Reduction",
        JOURNAL = PAMI,
        VOLUME = "47",
        YEAR = "2025",
        NUMBER = "4",
        MONTH = apr,
        PAGES = "2676--2692",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154730"}

@article{bb158863,
        AUTHOR = "Tian, R. and Wu, Z.X. and Dai, Q. and Goldblum, M. and Hu, H. and Jiang, Y.G.",
        TITLE = "The Role of {ViT} Design and Training in Robustness to Common Corruptions",
        JOURNAL = MultMed,
        VOLUME = "27",
        YEAR = "2025",
        PAGES = "1374--1385",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154731"}

@article{bb158864,
        AUTHOR = "Li, X.T. and Jiao, L.C. and Liu, F. and Yang, S.Y. and Zhu, H. and Liu, X. and Li, L.L. and Ma, W.P.",
        TITLE = "Adaptive Complex Wavelet Informed Transformer Operator",
        JOURNAL = MultMed,
        VOLUME = "27",
        YEAR = "2025",
        PAGES = "3513--3526",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154732"}

@article{bb158865,
        AUTHOR = "Pan, Y.W. and Li, Y. and Yao, T. and Ngo, C.W. and Mei, T.",
        TITLE = "{Stream-ViT}: Learning Streamlined Convolutions in Vision Transformer",
        JOURNAL = MultMed,
        VOLUME = "27",
        YEAR = "2025",
        PAGES = "3755--3765",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154733"}

@article{bb158866,
  author    = {Wen, T. and Wang, H. and Wang, L.G.},
  title     = {Dual-Branch Spatial-Spectral Transformer with Similarity Propagation for Hyperspectral Image Classification},
  journal   = RS,
  year      = {2025},
  volume    = {17},
  number    = {14},
  pages     = {2386},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154734},
}

@article{bb158867,
        AUTHOR = "Yu, C. and Chen, T. and Gan, Z.X.",
        TITLE = "Taylor-Series-Expansion-Based Vision Transformer Models",
        JOURNAL = PAMI,
        VOLUME = "47",
        YEAR = "2025",
        NUMBER = "9",
        MONTH = sep,
        PAGES = "8213--8230",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154735"}

@article{bb158868,
        AUTHOR = "Kong, Z.L. and Xu, D.K. and Li, Z.G. and Dong, P.Y. and Tang, H. and Wang, Y.Z. and Mukherjee, S.",
        TITLE = "{AutoViT}: Achieving Real-Time Vision Transformers on Mobile via Latency-aware Coarse-to-Fine Search",
        JOURNAL = IJCV,
        VOLUME = "133",
        YEAR = "2025",
        NUMBER = "9",
        MONTH = sep,
        PAGES = "6170--6186",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154736"}

@article{bb158869,
        AUTHOR = "Tan, C. and Gao, Z.Y. and Li, S.Y. and Li, S.Z.",
        TITLE = "{SimVPv2}: Towards Simple Yet Powerful Spatiotemporal Predictive Learning",
        JOURNAL = MultMed,
        VOLUME = "27",
        YEAR = "2025",
        PAGES = "5170--5184",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154737"}

@inproceedings{bb158870,
        AUTHOR = "Tan, C. and Gao, Z.Y. and Wu, L.R. and Xu, Y.J. and Xia, J. and Li, S.Y. and Li, S.Z.",
        TITLE = "Temporal Attention Unit: Towards Efficient Spatiotemporal Predictive Learning",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "18770--18782",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154738"}

@article{bb158871,
        AUTHOR = "Yang, S. and Hu, C.Y. and Xie, L. and Lee, F.F. and Chen, Q.",
        TITLE = "{MG-SSAF}: An advanced vision Transformer",
        JOURNAL = JVCIR,
        VOLUME = "112",
        YEAR = "2025",
        PAGES = "104578",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154739"}

@article{bb158872,
  author    = {Sharma, A.K. and Verma, N.K.},
  title     = {A novel vision transformer with selective residual in multihead self-attention for pattern recognition},
  journal   = PR,
  year      = {2026},
  volume    = {172},
  pages     = {112497},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154740},
}

@article{bb158873,
        AUTHOR = "Huang, Y.Q. and Ye, P. and Tu, C.J. and Chen, T. and He, T. and Ouyang, W.L.",
        TITLE = "Sparse-to-Dense Training: A Novel Training Scheme to Enhance Vision Transformers",
        JOURNAL = CirSysVideo,
        VOLUME = "35",
        YEAR = "2025",
        NUMBER = "12",
        MONTH = dec,
        PAGES = "12329--12340",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154741"}

@article{bb158874,
        AUTHOR = "Xu, G. and Huang, W.F. and Jia, W.J. and Li, J. and Gao, G. and Qi, G.J.",
        TITLE = "{S2AFormer}: Strip Self-Attention for Efficient Vision Transformer",
        JOURNAL = IP,
        VOLUME = "34",
        YEAR = "2025",
        PAGES = "8243--8256",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154742"}

@article{bb158875,
        AUTHOR = "Luo, A. and Yuan, K.W.",
        TITLE = "Simple Self-Organizing Map With Vision Transformers",
        JOURNAL = SPLetters,
        VOLUME = "33",
        YEAR = "2026",
        PAGES = "331--335",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154743"}

@article{bb158876,
        AUTHOR = "Li, Q. and He, J. and Guo, T.C. and Gao, X.P. and Bhanu, B.",
        TITLE = "{PE-ViT}: Parameter-efficient vision transformer with dimension-adaptive experts and economical attention",
        JOURNAL = PRL,
        VOLUME = "200",
        YEAR = "2026",
        PAGES = "135--141",
        BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT154744"}

@article{bb158877,
  author    = {Wang, A. and Chen, H. and Lin, Z.J. and Zhao, S.C. and Han, J.G. and Ding, G.G.},
  title     = {CAIT: Triple-Win Compression Toward High Accuracy, Fast Inference, and Favorable Transferability for ViTs},
  journal   = PAMI,
  volume    = {48},
  year      = {2026},
  number    = {2},
  month     = {February},
  pages     = {1373-1389},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154745},
}

@inproceedings{bb158878,
  author    = {Wang, A. and Chen, H. and Lin, Z.J. and Han, J.G. and Ding, G.G.},
  title     = {RepViT: Revisiting Mobile CNN From ViT Perspective},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {15909-15920},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154746},
}

@article{bb158879,
  author    = {Liu, Z. and Zhu, J.C. and Li, N.N. and Huang, G.},
  title     = {Multiple-Exit Tuning: Towards Inference-Efficient Adaptation for Vision Transformer},
  journal   = CirSysVideo,
  volume    = {36},
  year      = {2026},
  number    = {2},
  month     = {February},
  pages     = {2123-2136},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154747},
}

@article{bb158880,
  author    = {Chen, X.Y. and Wang, X.T. and Zhang, W.L. and Kong, X.T. and Qiao, Y. and Zhou, J.T. and Dong, C.},
  title     = {HAT: Hybrid Attention Transformer for Image Restoration},
  journal   = PAMI,
  volume    = {48},
  year      = {2026},
  number    = {3},
  month     = {March},
  pages     = {2676-2694},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154748},
}

@article{bb158881,
  author    = {Li, C. and Su, J. and Gao, J.S.},
  title     = {BiPAZSL: A bidirectional progressive attention method for zero-shot learning domain shift mitigation},
  journal   = PR,
  volume    = {174},
  year      = {2026},
  pages     = {112959},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154749},
}

@article{bb158882,
  author    = {Zhang, T.F. and Li, L. and Zhou, Y. and Liu, W.T. and Qian, C. and Hwang, J.N. and Ji, X.Y.},
  title     = {CAS-ViT: Convolutional Additive Self-Attention Vision Transformers for Efficient Mobile Applications},
  journal   = IP,
  volume    = {35},
  year      = {2026},
  pages     = {1899-1909},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154750},
}

@article{bb158883,
  author    = {Xiao, W.J. and Li, X.Z. and Hu, L. and Hao, Y.X. and Chen, M.},
  title     = {DTSNet: Dynamic Transformer Slimming for Efficient Vision Recognition},
  journal   = MultMed,
  volume    = {28},
  year      = {2026},
  pages     = {1589-1600},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154751},
}

@article{bb158884,
  author    = {Xu, G. and Hao, J.W. and Luo, Y. and Shen, L. and Hu, H. and Zeng, D.},
  title     = {EEformer: Early Exiting for Transformer With Global-Local Exits and Progressive Fine-Tuning},
  journal   = MultMed,
  volume    = {28},
  year      = {2026},
  pages     = {1352-1364},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154752},
}

@article{bb158885,
  author    = {Zhang, Z.W. and Lin, P.X. and Wang, Z.W. and Zhang, Y.Y. and Xu, Z.Q.J.},
  title     = {Complexity Control Facilitates Reasoning-Based Compositional Generalization in Transformers},
  journal   = PAMI,
  volume    = {48},
  year      = {2026},
  number    = {4},
  month     = {April},
  pages     = {4336-4349},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154753},
}

@article{bb158886,
  author    = {Zhou, W.W. and Zhao, S.J. and Liu, Y.Z. and Li, Y.P.},
  title     = {CCTformer: Calibrated Context-Aware Transformer for Correspondence Pruning},
  journal   = SPLetters,
  volume    = {33},
  year      = {2026},
  pages     = {1461-1465},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154754},
}

@article{bb158887,
  author    = {Chen, P.T. and Shen, M.Z. and Ye, P. and Cao, J.J. and Tu, C.J. and Bouganis, C.S. and Ren, Y.},
  title     = {Delta-DiT: Accelerating Diffusion Transformers without Training via Denoising Property Alignment},
  journal   = IJCV,
  volume    = {134},
  year      = {2026},
  number    = {6},
  month     = {June},
  pages     = {276},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154755},
}

@article{bb158888,
  author    = {Liu, X.Y. and Shi, H. and Xu, Y. and Wang, Z.F.},
  title     = {TaQ-DiT: Time-Aware Quantization for Diffusion Transformers},
  journal   = CirSysVideo,
  volume    = {36},
  year      = {2026},
  number    = {5},
  month     = {May},
  pages     = {6225-6229},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154756},
}

@inproceedings{bb158889,
  author    = {Nozawa, Y. and Lin, Y.C. and Nakamura, K. and Ng, Y.},
  title     = {Prompt-Guided Attention Head Selection for Focus-Oriented Image Retrieval},
  booktitle = PixFM25,
  year      = {2025},
  pages     = {4131-4141},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154757},
}

@inproceedings{bb158890,
  author    = {Abraham, S.J. and Hauenstein, J.D. and Scheirer, W.J.},
  title     = {Wavelet-Based Mechanistic Interpretability of Vision Transformers via Frequency-Aware Ablations},
  booktitle = InterpVis25,
  year      = {2025},
  pages     = {4830-4834},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154758},
}

@inproceedings{bb158891,
  author    = {Augustin, M. and Sarwar, S.S. and Elhoushi, M. and Li, Y.C. and Zhang, S.Q. and de Salvo, B.},
  title     = {PETAH: Parameter Efficient Task Adaptation for Hybrid Transformers},
  booktitle = MobileAI25,
  year      = {2025},
  pages     = {1858-1868},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154759},
}

@inproceedings{bb158892,
  author    = {Ali, M. and Raza, H. and Gan, J.Q. and Haris, M.},
  title     = {Optimising Vision Transformer Performance on Limited Datasets: A Multi-Gradient Approach},
  booktitle = {FaDE-TCV25},
  year      = {2025},
  pages     = {693-702},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154760},
}

@inproceedings{bb158893,
  author    = {Echevarrieta Catalan, N. and Ribas Rodriguez, A. and Cedron, F. and Schwartz, O. and Aguiar Pulido, V.},
  title     = {Enhancing Vision Transformer Explainability using Artificial Astrocytes},
  booktitle = LXCV25,
  year      = {2025},
  pages     = {58-64},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154761},
}

@inproceedings{bb158894,
  author    = {Takatsuki, R. and Joseph, S. and Fujisawa, I. and Kanai, R.},
  title     = {Decoding Vision Transformers: The Diffusion Steering Lens},
  booktitle = InterpVis25,
  year      = {2025},
  pages     = {4819-4824},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154762},
}

@inproceedings{bb158895,
  author    = {He, X. and Quan, Y.H. and Xu, R. and Ji, H.},
  title     = {A Universal Scale-Adaptive Deformable Transformer for Image Restoration across Diverse Artifacts},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {12731-12741},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154763},
}

@inproceedings{bb158896,
  author    = {Fixelle, J.},
  title     = {Hypergraph Vision Transformers: Images are More than Nodes, More than Edges},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {9751-9761},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154764},
}

@inproceedings{bb158897,
  author    = {Ahmed, S. and Arafat, A.A. and Najafi, D. and Mahmood, A. and Rizve, M.N. and Nahian, M.A. and Zhou, R.Y. and Angizi, S. and Rakin, A.S.},
  title     = {DeepCompress-ViT: Rethinking Model Compression to Enhance Efficiency of Vision Transformers at the Edge},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {30147-30156},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154765},
}

@inproceedings{bb158898,
  author    = {Bouniot, Q. and Redko, I. and Mallasto, A. and Laclau, C. and Struckmeier, O. and Arndt, K. and Heinonen, M. and Kyrki, V. and Kaski, S.},
  title     = {From Alexnet to Transformers: Measuring the Non-linearity of Deep Neural Networks with Affine Optimal Transport},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {25250-25260},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154766},
}

@inproceedings{bb158899,
  author    = {Wang, Z.Q. and Xia, X.B. and Chen, R. and Yu, D.D. and Wang, C.H. and Gong, M.M. and Liu, T.L.},
  title     = {LaVin-DiT: Large Vision Diffusion Transformer},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {20060-20070},
  bibsource = {http://www.visionbib.com/bibliography/pattern651vit2.html#TT154767},
}

Last update: Jun 13, 2026 at 20:41:05