@article{bb140100,
  AUTHOR    = "Tang, X. and Habashy, K. and Huang, F.Z. and Li, C. and Ban, D.",
  TITLE     = "SCA-Net: Spatial and channel attention-based network for 3D point clouds",
  JOURNAL   = CVIU,
  VOLUME    = "232",
  YEAR      = "2023",
  PAGES     = "103690",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136105"
}

@article{bb140101,
  AUTHOR    = "Rivas Manzaneque, F. and Ribeiro, A. and Avila Garcia, O.",
  TITLE     = "ICE: Implicit Coordinate Encoder for Multiple Image Neural Representation",
  JOURNAL   = IP,
  VOLUME    = "32",
  YEAR      = "2023",
  PAGES     = "5209-5219",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136106"
}

@inproceedings{bb140102,
  AUTHOR    = "Gandikota, K.V. and Geiping, J. and Lahner, Z. and Czaplinski, A. and Moller, M.",
  TITLE     = "A Simple Strategy to Provable Invariance via Orbit Mapping",
  BOOKTITLE = ACCV22,
  YEAR      = "2022",
  PAGES     = "V:387-405",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136107"
}

@inproceedings{bb140103,
  AUTHOR    = "Saltori, C. and Roy, S. and Sebe, N. and Iacca, G.",
  TITLE     = "Regularized Evolutionary Algorithm for Dynamic Neural Topology Search",
  BOOKTITLE = CIAP19,
  YEAR      = "2019",
  PAGES     = "I:219-230",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136108"
}

@inproceedings{bb140104,
  AUTHOR    = "Chang, Y. and Wu, X. and Zhang, S.",
  TITLE     = "Piecewise Linear Units for Fast Self-Normalizing Neural Networks",
  BOOKTITLE = ICPR18,
  YEAR      = "2018",
  PAGES     = "429-434",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136109"
}

@inproceedings{bb140105,
  AUTHOR    = "Fan, L.",
  TITLE     = "Deep Epitome for Unravelling Generalized Hamming Network",
  BOOKTITLE = ICPR18,
  YEAR      = "2018",
  PAGES     = "409-416",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136110"
}

@inproceedings{bb140106,
  AUTHOR    = "Wang, X.L. and Girshick, R. and Gupta, A. and He, K.M.",
  TITLE     = "Non-local Neural Networks",
  BOOKTITLE = CVPR18,
  YEAR      = "2018",
  PAGES     = "7794-7803",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136111"
}

@inproceedings{bb140107,
  AUTHOR    = "Meng, Z.H. and Adluru, N. and Kim, H.W.J. and Fung, G. and Singh, V.",
  TITLE     = "Efficient Relative Attribute Learning Using Graph Neural Networks",
  BOOKTITLE = ECCV18,
  YEAR      = "2018",
  PAGES     = "XIV: 575-590",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136112"
}

@inproceedings{bb140108,
  AUTHOR    = "Haeusser, P. and Mordvintsev, A. and Cremers, D.",
  TITLE     = "Learning by Association: A Versatile Semi-Supervised Training Method for Neural Networks",
  BOOKTITLE = CVPR17,
  YEAR      = "2017",
  PAGES     = "626-635",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136113"
}

@inproceedings{bb140109,
  AUTHOR    = "Knobelreiter, P. and Reinbacher, C. and Shekhovtsov, A. and Pock, T.",
  TITLE     = "End-to-End Training of Hybrid CNN-CRF Models for Stereo",
  BOOKTITLE = CVPR17,
  YEAR      = "2017",
  PAGES     = "1456-1465",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136114"
}

@inproceedings{bb140110,
  AUTHOR    = "Jiang, Z. and Wang, Y. and Davis, L. and Andrews, W. and Rozgic, V.",
  TITLE     = "Learning Discriminative Features via Label Consistent Neural Network",
  BOOKTITLE = WACV17,
  YEAR      = "2017",
  PAGES     = "207-216",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136115"
}

@inproceedings{bb140111,
  AUTHOR    = "Hafiz, A.R. and Al Marzouqi, H.",
  TITLE     = "Efficient neural network training using curvelet features",
  BOOKTITLE = IVMSP16,
  YEAR      = "2016",
  PAGES     = "1-5",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136116"
}

@inproceedings{bb140112,
  AUTHOR    = "Movshovitz Attias, Y. and Yu, Q. and Stumpe, M.C. and Shet, V. and Arnoud, S. and Yatziv, L.",
  TITLE     = "Ontological supervision for fine grained classification of Street View storefronts",
  BOOKTITLE = CVPR15,
  YEAR      = "2015",
  PAGES     = "1693-1702",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136117"
}

@inproceedings{bb140113,
  AUTHOR    = "Kim, E. and Hannan, D. and Kenyon, G.T.",
  TITLE     = "Deep Sparse Coding for Invariant Multimodal Halle Berry Neurons",
  BOOKTITLE = CVPR18,
  YEAR      = "2018",
  PAGES     = "1111-1120",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136118"
}

@inproceedings{bb140114,
  AUTHOR    = "Schultz, P.F. and Bettencourt, L.M. and Kenyon, G.T.",
  TITLE     = "A symmetry-breaking generative model of a simple-cell/complex-cell hierarchy",
  BOOKTITLE = Southwest12,
  YEAR      = "2012",
  PAGES     = "89-92",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136119"
}

@inproceedings{bb140115,
  AUTHOR    = "Hornlein, T. and Jahne, B.",
  TITLE     = "Boosting Shift-Invariant Features",
  BOOKTITLE = DAGM09,
  YEAR      = "2009",
  PAGES     = "121-130",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136120"
}

@inproceedings{bb140116,
  AUTHOR    = "Szilagyi, S.M. and Szilagyi, L. and Frigy, A. and Gorog, L.K. and Benyo, Z.",
  TITLE     = "Unified Neural Network Based Pathologic Event Reconstruction Using Spatial Heart Model",
  BOOKTITLE = CIARP07,
  YEAR      = "2007",
  PAGES     = "851-860",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136121"
}

@comment{NOTE(review): PAGES is xx-yy in bb140117, bb140127, bb140131 and bb140136. This looks like a placeholder rather than a real page range; fill in the actual pages or article number when known.}

@inproceedings{bb140117,
  AUTHOR    = "Wersing, H. and Kirstein, S. and Schneiders, B. and Bauer Wersing, U. and Korner, E.",
  TITLE     = "Online Learning for Bootstrapping of Object Recognition and Localization in a Biologically Motivated Architecture",
  BOOKTITLE = CVS08,
  YEAR      = "2008",
  PAGES     = "xx-yy",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136122"
}

@inproceedings{bb140118,
  AUTHOR    = "Kirstein, S. and Wersing, H. and Korner, E.",
  TITLE     = "Rapid Online Learning of Objects in a Biologically Motivated Recognition Architecture",
  BOOKTITLE = DAGM05,
  YEAR      = "2005",
  PAGES     = "301",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136123"
}

@inproceedings{bb140119,
  AUTHOR    = "Doulamis, N.D. and Doulamis, A.D.",
  TITLE     = "Non-linear 3D rendering workload prediction based on a combined fuzzy-neural network architecture for grid computing applications",
  BOOKTITLE = ICIP03,
  YEAR      = "2003",
  PAGES     = "III: 1069-1072",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136124"
}

@inproceedings{bb140120,
  AUTHOR    = "Loh, A.W.K. and Robey, M.C. and West, G.A.W.",
  TITLE     = "IFOSART: a noise resistant neural network capable of incremental learning",
  BOOKTITLE = ICPR00,
  YEAR      = "2000",
  PAGES     = "Vol II: 985-988",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136125"
}

@inproceedings{bb140121,
  AUTHOR    = "Loh, A.W.K. and Robey, M.C. and West, G.A.W.",
  TITLE     = "Refining 3d models using a two-stage neural network-based iterative process",
  BOOKTITLE = ICPR02,
  YEAR      = "2002",
  PAGES     = "I: 172-175",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136126"
}

@inproceedings{bb140122,
  AUTHOR    = "Villela, P.R. and Sossa Azuela, J.H.",
  TITLE     = "Object Recognition by Indexing Using Neural Networks",
  BOOKTITLE = ICPR00,
  YEAR      = "2000",
  PAGES     = "Vol II: 1001-1004",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136127"
}

@comment{NOTE(review): bb140123 and bb140124 describe the same work (identical AUTHOR, TITLE, BOOKTITLE, YEAR and BIBSOURCE anchor TT136128) and differ only in PAGES. Both keys are kept because either may be cited elsewhere; verify the correct page range against the proceedings and merge the two entries.}

@inproceedings{bb140123,
  AUTHOR    = "Papamarkos, N.",
  TITLE     = "Using Local Features in a Neural Network Based Gray-level Reduction Technique",
  BOOKTITLE = ICPR00,
  YEAR      = "2000",
  PAGES     = "Vol III: 1025-1028",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136128"
}

@inproceedings{bb140124,
  AUTHOR    = "Papamarkos, N.",
  TITLE     = "Using Local Features in a Neural Network Based Gray-level Reduction Technique",
  BOOKTITLE = ICPR00,
  YEAR      = "2000",
  PAGES     = "Vol III: 1037-1040",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136128"
}

@inproceedings{bb140125,
  AUTHOR    = "Webb, A.R. and Shannon, S.",
  TITLE     = "Adaptive Radial Basis Functions",
  BOOKTITLE = ICPR96,
  YEAR      = "1996",
  PAGES     = "IV: 630-634",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136129"
}

@inproceedings{bb140126,
  AUTHOR    = "Webb, A.R.",
  TITLE     = "Nonlinear Feature Extraction with Radial Basis Functions Using a Weighted Multidimensional Scaling Stress Measure",
  BOOKTITLE = ICPR96,
  YEAR      = "1996",
  PAGES     = "IV: 635-639",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern650.html#TT136130"
}

@article{bb140127,
  AUTHOR    = "Bazi, Y. and Bashmal, L. and Al Rahhal, M.M. and Al Dayil, R. and Al Ajlan, N.",
  TITLE     = "Vision Transformers for Remote Sensing Image Classification",
  JOURNAL   = RS,
  VOLUME    = "13",
  YEAR      = "2021",
  NUMBER    = "3",
  PAGES     = "xx-yy",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136131"
}

@article{bb140128,
  AUTHOR    = "Li, T. and Zhang, Z. and Pei, L. and Gan, Y.",
  TITLE     = "HashFormer: Vision Transformer Based Deep Hashing for Image Retrieval",
  JOURNAL   = SPLetters,
  VOLUME    = "29",
  YEAR      = "2022",
  PAGES     = "827-831",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136132"
}

@article{bb140129,
  AUTHOR    = "Jiang, B. and Zhao, K.K. and Tang, J.",
  TITLE     = "RGTransformer: Region-Graph Transformer for Image Representation and Few-Shot Classification",
  JOURNAL   = SPLetters,
  VOLUME    = "29",
  YEAR      = "2022",
  PAGES     = "792-796",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136133"
}

@article{bb140130,
  AUTHOR    = "Chen, Z.M. and Cui, Q. and Zhao, B. and Song, R.J. and Zhang, X.Q. and Yoshie, O.",
  TITLE     = "SST: Spatial and Semantic Transformers for Multi-Label Image Recognition",
  JOURNAL   = IP,
  VOLUME    = "31",
  YEAR      = "2022",
  PAGES     = "2570-2583",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136134"
}

@article{bb140131,
  AUTHOR    = "Wang, G.H. and Li, B. and Zhang, T. and Zhang, S.",
  TITLE     = "A Network Combining a Transformer and a Convolutional Neural Network for Remote Sensing Image Change Detection",
  JOURNAL   = RS,
  VOLUME    = "14",
  YEAR      = "2022",
  NUMBER    = "9",
  PAGES     = "xx-yy",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136135"
}

@article{bb140132,
  AUTHOR    = "Luo, G. and Zhou, Y. and Sun, X.S. and Wang, Y. and Cao, L.J. and Wu, Y.J. and Huang, F.Y. and Ji, R.R.",
  TITLE     = "Towards Lightweight Transformer Via Group-Wise Transformation for Vision-and-Language Tasks",
  JOURNAL   = IP,
  VOLUME    = "31",
  YEAR      = "2022",
  PAGES     = "3386-3398",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136136"
}

@article{bb140133,
  AUTHOR    = "Tu, Y.B. and Li, L. and Su, L. and Gao, S.X. and Yan, C.G. and Zha, Z.J. and Yu, Z.T. and Huang, Q.M.",
  TITLE     = "I2-Transformer: Intra- and Inter-Relation Embedding Transformer for TV Show Captioning",
  JOURNAL   = IP,
  VOLUME    = "31",
  YEAR      = "2022",
  PAGES     = "3565-3577",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136137"
}

@article{bb140134,
  AUTHOR    = "Wang, J.Y. and Chakraborty, R. and Yu, S.X.",
  TITLE     = "Transformer for 3D Point Clouds",
  JOURNAL   = PAMI,
  VOLUME    = "44",
  YEAR      = "2022",
  NUMBER    = "8",
  MONTH     = "August",
  PAGES     = "4419-4431",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136138"
}

@article{bb140135,
  AUTHOR    = "Li, Z.K. and Liu, Y.F. and Li, B. and Feng, B.L. and Wu, K. and Peng, C.W. and Hu, W.M.",
  TITLE     = "SDTP: Semantic-Aware Decoupled Transformer Pyramid for Dense Image Prediction",
  JOURNAL   = CirSysVideo,
  VOLUME    = "32",
  YEAR      = "2022",
  NUMBER    = "9",
  MONTH     = "September",
  PAGES     = "6160-6173",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136139"
}

@article{bb140136,
  AUTHOR    = "Wu, J.J. and Wei, Z.Q. and Zhang, J.P. and Zhang, Y.S. and Jia, D.N. and Yin, B. and Yu, Y.C.",
  TITLE     = "Full-Coupled Convolutional Transformer for Surface-Based Duct Refractivity Inversion",
  JOURNAL   = RS,
  VOLUME    = "14",
  YEAR      = "2022",
  NUMBER    = "17",
  PAGES     = "xx-yy",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136140"
}

@article{bb140137,
  AUTHOR    = "Jiang, K. and Peng, P. and Lian, Y. and Xu, W.S.",
  TITLE     = "The encoding method of position embeddings in vision transformer",
  JOURNAL   = JVCIR,
  VOLUME    = "89",
  YEAR      = "2022",
  PAGES     = "103664",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136141"
}

@article{bb140138,
  AUTHOR    = "Han, K. and Wang, Y.H. and Chen, H.T. and Chen, X.H. and Guo, J.Y. and Liu, Z.H. and Tang, Y. and Xiao, A. and Xu, C.J. and Xu, Y.X. and Yang, Z.H. and Zhang, Y. and Tao, D.C.",
  TITLE     = "A Survey on Vision Transformer",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "1",
  MONTH     = "January",
  PAGES     = "87-110",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136142"
}

@article{bb140139,
  AUTHOR    = "Hou, Q. and Jiang, Z. and Yuan, L. and Cheng, M.M. and Yan, S.C. and Feng, J.S.",
  TITLE     = "Vision Permutator: A Permutable MLP-Like Architecture for Visual Recognition",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "1",
  MONTH     = "January",
  PAGES     = "1328-1334",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136143"
}

@article{bb140140,
  AUTHOR    = "Yu, W.H. and Si, C.Y. and Zhou, P. and Luo, M. and Zhou, Y.C. and Feng, J.S. and Yan, S.C. and Wang, X.C.",
  TITLE     = "MetaFormer Baselines for Vision",
  JOURNAL   = PAMI,
  VOLUME    = "46",
  YEAR      = "2024",
  NUMBER    = "2",
  MONTH     = "February",
  PAGES     = "896-912",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136144"
}

@inproceedings{bb140141,
  AUTHOR    = "Yu, W.H. and Luo, M. and Zhou, P. and Si, C.Y. and Zhou, Y.C. and Wang, X.C. and Feng, J.S. and Yan, S.C.",
  TITLE     = "MetaFormer is Actually What You Need for Vision",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "10809-10819",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136145"
}

@article{bb140142,
  AUTHOR    = "Zhou, D. and Hou, Q. and Yang, L.J. and Jin, X.J. and Feng, J.S.",
  TITLE     = "Token Selection is a Simple Booster for Vision Transformers",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "11",
  MONTH     = "November",
  PAGES     = "12738-12746",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136146"
}

@article{bb140143,
  AUTHOR    = "Yuan, L. and Hou, Q. and Jiang, Z. and Feng, J.S. and Yan, S.C.",
  TITLE     = "VOLO: Vision Outlooker for Visual Recognition",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "5",
  MONTH     = "May",
  PAGES     = "6575-6586",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136147"
}

@inproceedings{bb140144,
  AUTHOR    = "Ren, S. and Zhou, D. and He, S.F. and Feng, J.S. and Wang, X.C.",
  TITLE     = "Shunted Self-Attention via Multi-Scale Token Aggregation",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "10843-10852",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136148"
}

@article{bb140145,
  AUTHOR    = "Wu, Y.H. and Liu, Y. and Zhan, X. and Cheng, M.M.",
  TITLE     = "P2T: Pyramid Pooling Transformer for Scene Understanding",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "11",
  MONTH     = "November",
  PAGES     = "12760-12771",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136149"
}

@article{bb140146,
  AUTHOR    = "Li, Y. and Yao, T. and Pan, Y.W. and Mei, T.",
  TITLE     = "Contextual Transformer Networks for Visual Recognition",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "2",
  MONTH     = "February",
  PAGES     = "1489-1500",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136150"
}

@article{bb140147,
  AUTHOR    = "Wang, H. and Du, Y. and Zhang, Y. and Li, S. and Zhang, L.",
  TITLE     = "One-Stage Visual Relationship Referring With Transformers and Adaptive Message Passing",
  JOURNAL   = IP,
  VOLUME    = "32",
  YEAR      = "2023",
  PAGES     = "190-202",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136151"
}

@article{bb140148,
  AUTHOR    = "Kim, B. and Kim, J. and Ye, J.C.",
  TITLE     = "Task-Agnostic Vision Transformer for Distributed Learning of Image Processing",
  JOURNAL   = IP,
  VOLUME    = "32",
  YEAR      = "2023",
  PAGES     = "203-218",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136152"
}

@article{bb140149,
  AUTHOR    = "Park, S. and Ye, J.C.",
  TITLE     = "Multi-Task Distributed Learning Using Vision Transformer With Random Patch Permutation",
  JOURNAL   = MedImg,
  VOLUME    = "42",
  YEAR      = "2023",
  NUMBER    = "7",
  MONTH     = "July",
  PAGES     = "2091-2105",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136153"
}

@article{bb140150,
  AUTHOR    = "Kiya, H. and Iijima, R. and Maungmaung, A. and Kinoshita, Y.",
  TITLE     = "Image and Model Transformation with Secret Key for Vision Transformer",
  JOURNAL   = IEICE,
  VOLUME    = "E106-D",
  YEAR      = "2023",
  NUMBER    = "1",
  MONTH     = "January",
  PAGES     = "2-11",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136154"
}

@article{bb140151,
  AUTHOR    = "Zhang, H.F. and Mao, F. and Xue, M.Q. and Fang, G.F. and Feng, Z.L. and Song, J. and Song, M.L.",
  TITLE     = "Knowledge Amalgamation for Object Detection With Transformers",
  JOURNAL   = IP,
  VOLUME    = "32",
  YEAR      = "2023",
  PAGES     = "2093-2106",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136155"
}

@article{bb140152,
  AUTHOR    = "Li, Y. and Chen, K. and Sun, S.L. and He, C.",
  TITLE     = "Multi-scale homography estimation based on dual feature aggregation transformer",
  JOURNAL   = IET-IPR,
  VOLUME    = "17",
  YEAR      = "2023",
  NUMBER    = "5",
  PAGES     = "1403-1416",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136156"
}

@article{bb140153,
  AUTHOR    = "Wang, G.Q. and Chen, H. and Chen, L. and Zhuang, Y. and Zhang, S.H. and Zhang, T. and Dong, H. and Gao, P.",
  TITLE     = "P2FEViT: Plug-and-Play CNN Feature Embedded Hybrid Vision Transformer for Remote Sensing Image Classification",
  JOURNAL   = RS,
  VOLUME    = "15",
  YEAR      = "2023",
  NUMBER    = "7",
  PAGES     = "1773",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136157"
}

@article{bb140154,
  AUTHOR    = "Zhang, Q.M. and Xu, Y.F. and Zhang, J. and Tao, D.C.",
  TITLE     = "ViTAEv2: Vision Transformer Advanced by Exploring Inductive Bias for Image Recognition and Beyond",
  JOURNAL   = IJCV,
  VOLUME    = "131",
  YEAR      = "2023",
  NUMBER    = "5",
  MONTH     = "May",
  PAGES     = "1141-1162",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136158"
}

@article{bb140155,
  AUTHOR    = "Fan, X. and Liu, H.J.",
  TITLE     = "FlexFormer: Flexible Transformer for efficient visual recognition",
  JOURNAL   = PRL,
  VOLUME    = "169",
  YEAR      = "2023",
  PAGES     = "95-101",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136159"
}

@article{bb140156,
  AUTHOR    = "Cho, S. and Hong, S. and Kim, S.",
  TITLE     = "CATs++: Boosting Cost Aggregation With Convolutions and Transformers",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "6",
  MONTH     = "June",
  PAGES     = "7174-7194",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136160"
}

@article{bb140157,
  AUTHOR    = "Kim, B.J. and Choi, H. and Jang, H. and Lee, D.G. and Jeong, W. and Kim, S.W.",
  TITLE     = "Improved robustness of vision transformers via prelayernorm in patch embedding",
  JOURNAL   = PR,
  VOLUME    = "141",
  YEAR      = "2023",
  PAGES     = "109659",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136161"
}

@article{bb140158,
  AUTHOR    = "He, Q. and Sun, X. and Yan, Z.Y. and Wang, B. and Zhu, Z. and Diao, W.H. and Yang, M.Y.",
  TITLE     = "AST: Adaptive Self-supervised Transformer for optical remote sensing representation",
  JOURNAL   = PandRS,
  VOLUME    = "200",
  YEAR      = "2023",
  PAGES     = "41-54",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136162"
}

@article{bb140159,
  AUTHOR    = "Wang, Z.W. and Wang, C.Y. and Xu, X.W. and Zhou, J. and Lu, J.W.",
  TITLE     = "Quantformer: Learning Extremely Low-Precision Vision Transformers",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "7",
  MONTH     = "July",
  PAGES     = "8813-8826",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136163"
}

@article{bb140160,
  AUTHOR    = "Sun, S.Y. and Yue, X.Y. and Zhao, H.S. and Torr, P.H.S. and Bai, S.",
  TITLE     = "Patch-Based Separable Transformer for Visual Recognition",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "7",
  MONTH     = "July",
  PAGES     = "9241-9247",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136164"
}

@inproceedings{bb140161,
  AUTHOR    = "Yue, X.Y. and Sun, S.Y. and Kuang, Z.H. and Wei, M. and Torr, P.H.S. and Zhang, W. and Lin, D.",
  TITLE     = "Vision Transformer with Progressive Sampling",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "377-386",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136165"
}

@article{bb140162,
  AUTHOR    = "Peng, Z.L. and Guo, Z.H. and Huang, W. and Wang, Y.W. and Xie, L.X. and Jiao, J.B. and Tian, Q. and Ye, Q.X.",
  TITLE     = "Conformer: Local Features Coupling Global Representations for Recognition and Detection",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "8",
  MONTH     = "August",
  PAGES     = "9454-9468",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136166"
}

@inproceedings{bb140163,
  AUTHOR    = "Peng, Z.L. and Huang, W. and Gu, S.Z. and Xie, L.X. and Wang, Y. and Jiao, J.B. and Ye, Q.X.",
  TITLE     = "Conformer: Local Features Coupling Global Representations for Visual Recognition",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "357-366",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136167"
}

@article{bb140164,
  AUTHOR    = "Feng, Z.Z. and Zhang, S.L.",
  TITLE     = "Efficient Vision Transformer via Token Merger",
  JOURNAL   = IP,
  VOLUME    = "32",
  YEAR      = "2023",
  PAGES     = "4156-4169",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136168"
}

@article{bb140165,
  AUTHOR    = "Yang, J.H. and Li, X.Y. and Zheng, M. and Wang, Z. and Zhu, Y.Q. and Guo, X.Q. and Yuan, Y.C. and Chai, Z. and Jiang, S.Q.",
  TITLE     = "MemBridge: Video-Language Pre-Training With Memory-Augmented Inter-Modality Bridge",
  JOURNAL   = IP,
  VOLUME    = "32",
  YEAR      = "2023",
  PAGES     = "4073-4087",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136169"
}

@article{bb140166,
  AUTHOR    = "Wang, D.L. and Chen, Y. and Naz, B. and Sun, L. and Li, B.Z.",
  TITLE     = "Spatial-Aware Transformer (SAT): Enhancing Global Modeling in Transformer Segmentation for Remote Sensing Images",
  JOURNAL   = RS,
  VOLUME    = "15",
  YEAR      = "2023",
  NUMBER    = "14",
  PAGES     = "3607",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136170"
}

@article{bb140167,
  AUTHOR    = "Huang, X.Y. and Liu, F. and Cui, Y.H. and Chen, P. and Li, L.L. and Li, P.F.",
  TITLE     = "Faster and Better: A Lightweight Transformer Network for Remote Sensing Scene Classification",
  JOURNAL   = RS,
  VOLUME    = "15",
  YEAR      = "2023",
  NUMBER    = "14",
  PAGES     = "3645",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136171"
}

@article{bb140168,
  AUTHOR    = "Yao, T. and Li, Y. and Pan, Y.W. and Wang, Y. and Zhang, X.P. and Mei, T.",
  TITLE     = "Dual Vision Transformer",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "9",
  MONTH     = "September",
  PAGES     = "10870-10882",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136172"
}

@article{bb140169,
  AUTHOR    = "Rao, Y.M. and Liu, Z. and Zhao, W.L. and Zhou, J. and Lu, J.W.",
  TITLE     = "Dynamic Spatial Sparsification for Efficient Vision Transformers and Convolutional Neural Networks",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "9",
  MONTH     = "September",
  PAGES     = "10883-10897",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136173"
}

@article{bb140170,
  AUTHOR    = "Li, J. and Liu, Z. and Li, L. and Lin, J.Q. and Yao, J. and Tu, J.",
  TITLE     = "Multi-view convolutional vision transformer for 3D object recognition",
  JOURNAL   = JVCIR,
  VOLUME    = "95",
  YEAR      = "2023",
  PAGES     = "103906",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136174"
}

@article{bb140171,
  AUTHOR    = "Shang, J.H. and Li, X. and Kahatapitiya, K. and Lee, Y.C. and Ryoo, M.S.",
  TITLE     = "StARformer: Transformer With State-Action-Reward Representations for Robot Learning",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "11",
  MONTH     = "November",
  PAGES     = "12862-12877",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136175"
}

@inproceedings{bb140172,
  AUTHOR    = "Shang, J.H. and Kahatapitiya, K. and Li, X. and Ryoo, M.S.",
  TITLE     = "StARformer: Transformer with State-Action-Reward Representations for Visual Reinforcement Learning",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXIX:462-479",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136176"
}

@article{bb140173,
  AUTHOR    = "Duan, H.R. and Long, Y. and Wang, S.D. and Zhang, H.F. and Willcocks, C.G. and Shao, L.",
  TITLE     = "Dynamic Unary Convolution in Transformers",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "11",
  MONTH     = "November",
  PAGES     = "12747-12759",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136177"
}

@article{bb140174,
  AUTHOR    = "Chen, S.M. and Hong, Z.M. and Hou, W.J. and Xie, G.S. and Song, Y.B. and Zhao, J. and You, X.G. and Yan, S.C. and Shao, L.",
  TITLE     = "TransZero++: Cross Attribute-Guided Transformer for Zero-Shot Learning",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "11",
  MONTH     = "November",
  PAGES     = "12844-12861",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136178"
}

@article{bb140175,
  AUTHOR    = "Qian, S.J. and Zhu, Y. and Li, W.B. and Li, M. and Jia, J.Y.",
  TITLE     = "What Makes for Good Tokenizers in Vision Transformer?",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "11",
  MONTH     = "November",
  PAGES     = "13011-13023",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136179"
}

@article{bb140176,
  AUTHOR    = "Sun, W.X. and Qin, Z. and Deng, H. and Wang, J. and Zhang, Y. and Zhang, K. and Barnes, N. and Birchfield, S. and Kong, L.P. and Zhong, Y.",
  TITLE     = "Vicinity Vision Transformer",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "10",
  MONTH     = "October",
  PAGES     = "12635-12649",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136180"
}

@article{bb140177,
  AUTHOR    = "Cao, C.J. and Dong, Q. and Fu, Y.W.",
  TITLE     = "ZITS++: Image Inpainting by Improving the Incremental Transformer on Structural Priors",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "10",
  MONTH     = "October",
  PAGES     = "12667-12684",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136181"
}

@article{bb140178,
  AUTHOR    = "Fang, Y.X. and Wang, X.G. and Wu, R. and Liu, W.Y.",
  TITLE     = "What Makes for Hierarchical Vision Transformer?",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "10",
  MONTH     = "October",
  PAGES     = "12714-12720",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136182"
}

@article{bb140179,
  AUTHOR    = "Xu, P. and Zhu, X.T. and Clifton, D.A.",
  TITLE     = "Multimodal Learning With Transformers: A Survey",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "10",
  MONTH     = "October",
  PAGES     = "12113-12132",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136183"
}

@article{bb140180,
  AUTHOR    = "Liu, J. and Guo, H.R. and He, Y. and Li, H.L.",
  TITLE     = "Vision Transformer-Based Ensemble Learning for Hyperspectral Image Classification",
  JOURNAL   = RS,
  VOLUME    = "15",
  YEAR      = "2023",
  NUMBER    = "21",
  PAGES     = "5208",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136184"
}

@article{bb140181,
  AUTHOR    = "Lin, M.B. and Chen, M.Z. and Zhang, Y.X. and Shen, C.H. and Ji, R.R. and Cao, L.J.",
  TITLE     = "Super Vision Transformer",
  JOURNAL   = IJCV,
  VOLUME    = "131",
  YEAR      = "2023",
  NUMBER    = "12",
  MONTH     = "December",
  PAGES     = "3136-3151",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136185"
}

@article{bb140182,
  AUTHOR    = "Li, Z.Y. and Gao, S.H. and Cheng, M.M.",
  TITLE     = "SERE: Exploring Feature Self-Relation for Self-Supervised Transformer",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "12",
  MONTH     = "December",
  PAGES     = "15619-15631",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136186"
}

@article{bb140183,
  AUTHOR    = "Yuan, Y.H. and Liang, W.C. and Ding, H.H. and Liang, Z.H. and Zhang, C. and Hu, H.",
  TITLE     = "Expediting Large-Scale Vision Transformer for Dense Prediction Without Fine-Tuning",
  JOURNAL   = PAMI,
  VOLUME    = "46",
  YEAR      = "2024",
  NUMBER    = "1",
  MONTH     = "January",
  PAGES     = "250-266",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136187"
}

@article{bb140184,
  AUTHOR    = "Jiao, J. and Tang, Y.M. and Lin, K.Y. and Gao, Y.P. and Ma, A.J. and Wang, Y.W. and Zheng, W.S.",
  TITLE     = "DilateFormer: Multi-Scale Dilated Transformer for Visual Recognition",
  JOURNAL   = MultMed,
  VOLUME    = "25",
  YEAR      = "2023",
  PAGES     = "8906-8919",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136188"
}

@article{bb140185,
  AUTHOR    = "Li, Z. and Li, Y.X. and Li, Q.D. and Wang, P. and Guo, D. and Lu, L. and Jin, D. and Zhang, Y. and Hong, Q.Q.",
  TITLE     = "LViT: Language Meets Vision Transformer in Medical Image Segmentation",
  JOURNAL   = MedImg,
  VOLUME    = "43",
  YEAR      = "2024",
  NUMBER    = "1",
  MONTH     = "January",
  PAGES     = "96-107",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136189"
}

@article{bb140186,
  AUTHOR    = "Fu, K. and Yuan, M.Z. and Liu, S.L. and Wang, M.",
  TITLE     = "Boosting Point-BERT by Multi-Choice Tokens",
  JOURNAL   = CirSysVideo,
  VOLUME    = "34",
  YEAR      = "2024",
  NUMBER    = "1",
  MONTH     = "January",
  PAGES     = "438-447",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136190"
}

@article{bb140187,
  AUTHOR    = "Ghosal, S.S. and Li, Y.X.",
  TITLE     = "Are Vision Transformers Robust to Spurious Correlations?",
  JOURNAL   = IJCV,
  VOLUME    = "132",
  YEAR      = "2024",
  NUMBER    = "3",
  MONTH     = "March",
  PAGES     = "689-709",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136191"
}

@article{bb140188,
  AUTHOR    = "Yan, F.Y. and Yan, B. and Liang, W. and Pei, M.T.",
  TITLE     = "Token labeling-guided multi-scale medical image classification",
  JOURNAL   = PRL,
  VOLUME    = "178",
  YEAR      = "2024",
  PAGES     = "28-34",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136192"
}

@article{bb140189,
  AUTHOR    = "Li, Y.X. and Huang, Y.W. and He, N. and Ma, K. and Zheng, Y.F.",
  TITLE     = "Improving vision transformer for medical image classification via token-wise perturbation",
  JOURNAL   = JVCIR,
  VOLUME    = "98",
  YEAR      = "2024",
  PAGES     = "104022",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136193"
}

@article{bb140190,
  AUTHOR    = "Nguyen, H. and Kim, C. and Li, F.",
  TITLE     = "Space-time recurrent memory network",
  JOURNAL   = CVIU,
  VOLUME    = "241",
  YEAR      = "2024",
  PAGES     = "103943",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136194"
}

@inproceedings{bb140191,
  AUTHOR    = "Kheldouni, A. and Boumhidi, J.",
  TITLE     = "A Study of Bidirectional Encoder Representations from Transformers for Sequential Recommendations",
  BOOKTITLE = ISCV22,
  YEAR      = "2022",
  PAGES     = "1-5",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136195"
}

@article{bb140192,
  AUTHOR    = "Chen, Z. and Bai, C.Y. and Zhu, Y.L. and Lu, X.W.",
  TITLE     = "TUT: Template-Augmented U-Net Transformer for Unsupervised Anomaly Detection",
  JOURNAL   = SPLetters,
  VOLUME    = "31",
  YEAR      = "2024",
  PAGES     = "780-784",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136196"
}

@inproceedings{bb140193,
  AUTHOR    = "Shimizu, S. and Tamaki, T.",
  TITLE     = "Joint learning of images and videos with a single Vision Transformer",
  BOOKTITLE = MVA23,
  YEAR      = "2023",
  PAGES     = "1-6",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136197"
}

@inproceedings{bb140194,
  AUTHOR    = "Li, K.C. and Wang, Y. and Li, Y.Z. and Wang, Y. and He, Y. and Wang, L.M. and Qiao, Y.",
  TITLE     = "Unmasked Teacher: Towards Training-Efficient Video Foundation Models",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "19891-19903",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136198"
}

@inproceedings{bb140195,
  AUTHOR    = "Ding, S.R. and Zhao, P.S. and Zhang, X.P. and Qian, R. and Xiong, H.K. and Tian, Q.",
  TITLE     = "Prune Spatio-temporal Tokens by Semantic-aware Temporal Accumulation",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "16899-16910",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136199"
}

@inproceedings{bb140196,
  AUTHOR    = "Chen, M.Z. and Lin, M. and Lin, Z.H. and Zhang, Y.X. and Chao, F. and Ji, R.R.",
  TITLE     = "SMMix: Self-Motivated Image Mixing for Vision Transformers",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "17214-17224",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136200"
}

@inproceedings{bb140197,
  AUTHOR    = "Kim, D. and Angelova, A. and Kuo, W.C.",
  TITLE     = "Contrastive Feature Masking Open-Vocabulary Vision Transformer",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "15556-15566",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136201"
}

@inproceedings{bb140198,
  AUTHOR    = "Zhang, Y. and Chen, D. and Kundu, S. and Li, C.H. and Beerel, P.A.",
  TITLE     = "SAL-ViT: Towards Latency Efficient Private Inference on ViT using Selective Attention Search with a Learnable Softmax Approximation",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "5093-5102",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136202"
}

@inproceedings{bb140199,
  AUTHOR    = "Li, Z. and Gu, Q.Y.",
  TITLE     = "I-ViT: Integer-only Quantization for Efficient Vision Transformer Inference",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "17019-17029",
  BIBSOURCE = "http://www.visionbib.com/bibliography/pattern651vit2.html#TT136203"
}