@inproceedings{bb70400,
AUTHOR = "Wang, Z. Y. and Feng, T. L. and Lyu, F. and Shang, F. and Feng, W. and Wan, L.",
TITLE = "Dual Semantic Guidance for Open Vocabulary Semantic Segmentation",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "20212--20222",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68095"}
@inproceedings{bb70401,
AUTHOR = "Lee, M. and Cho, S. and Lee, J. and Yang, S. and Choi, H. and Kim, I. J. and Lee, S. Y.",
TITLE = "Effective {SAM} Combination for Open-Vocabulary Semantic Segmentation",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "26081--26090",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68096"}
@inproceedings{bb70402,
AUTHOR = "Li, K. Y. and Liu, R. X. and Cao, X. and Bai, X. and Zhou, F. and Meng, D. Y. and Wang, Z.",
TITLE = "{SegEarth-OV}: Towards Training-Free Open-Vocabulary Segmentation for
Remote Sensing Images",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "10545--10556",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68097"}
@inproceedings{bb70403,
AUTHOR = "Lai, Z. H.",
TITLE = "Exploring Simple Open-Vocabulary Semantic Segmentation",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "30221--30230",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68098"}
@inproceedings{bb70404,
AUTHOR = "Stojnic, V. and Kalantidis, Y. and Matas, J. and Tolias, G.",
TITLE = "{LPOSS}: Label Propagation Over Patches and Pixels for Open-vocabulary
Semantic Segmentation",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "9794--9803",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68099"}
@inproceedings{bb70405,
AUTHOR = "Qorbani, R. and Villani, G. and Panagiotakopoulos, T. and Colomer, M. B. and Harenstam Nielsen, L. and Segu, M. and Dovesi, P. L. and Karlgren, J. and Cremers, D. and Tombari, F. and Poggi, M.",
TITLE = "Semantic Library Adaptation: {LoRA} Retrieval and Fusion for
Open-Vocabulary Semantic Segmentation",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "9804--9815",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68100"}
@inproceedings{bb70406,
AUTHOR = "Choi, J. and Lee, S. and Lee, M. and Lee, S. and Shim, H. J.",
TITLE = "Fine-Grained Image-Text Correspondence with Cost Aggregation for
Open-Vocabulary Part Segmentation",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "9782--9793",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68101"}
@inproceedings{bb70407,
AUTHOR = "Kim, C. and Ju, D. and Han, W. and Yang, M. H. and Hwang, S. J.",
TITLE = "Distilling Spectral Graph for Object-Context Aware Open-Vocabulary
Semantic Segmentation",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "15033--15042",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68102"}
@inproceedings{bb70408,
AUTHOR = "Choi, J. and Ko, J. and Lee, D. J. and Kim, J.",
TITLE = "{AH-OCDA}: Amplitude-Based Curriculum Learning and {Hopfield}
Segmentation Model for Open Compound Domain Adaptation",
BOOKTITLE = WACV25,
YEAR = "2025",
PAGES = "8280--8290",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68103"}
@inproceedings{bb70409,
AUTHOR = "Zhuo, Y. X. and Bessinger, Z. and Wang, L. C. and Khosravan, N. and Li, B. X. and Kang, S. B.",
TITLE = "{TFM2}: Training-Free Mask Matching for Open-Vocabulary Semantic
Segmentation",
BOOKTITLE = WACV25,
YEAR = "2025",
PAGES = "4693--4703",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68104"}
@inproceedings{bb70410,
AUTHOR = "Wang, Y. M. and Czarnecki, K.",
TITLE = "{AiDe}: Improving {3D} Open-Vocabulary Semantic Segmentation by Aligned
Vision-Language Learning",
BOOKTITLE = WACV25,
YEAR = "2025",
PAGES = "2674--2685",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68105"}
@inproceedings{bb70411,
AUTHOR = "Kalluri, T. and Wang, W. Y. and Wang, H. and Chandraker, M. and Torresani, L. and Tran, D.",
TITLE = "Open-world Instance Segmentation: Top-down Learning with Bottom-up
Supervision",
BOOKTITLE = L3D-IVU24,
YEAR = "2024",
PAGES = "2693--2703",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68106"}
@inproceedings{bb70412,
AUTHOR = "Zheng, J. W. and Liu, R. P. and Chen, Y. F. and Peng, K. Y. and Wu, C. Z. and Yang, K. L. and Zhang, J. M. and Stiefelhagen, R.",
TITLE = "Open Panoramic Segmentation",
BOOKTITLE = ECCV24,
YEAR = "2024",
PAGES = "XXXIX: 164--182",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68107"}
@inproceedings{bb70413,
AUTHOR = "Karazija, L. and Laina, I. and Vedaldi, A. and Rupprecht, C.",
TITLE = "Diffusion Models for Open-vocabulary Segmentation",
BOOKTITLE = ECCV24,
YEAR = "2024",
PAGES = "V: 299--317",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68108"}
@inproceedings{bb70414,
AUTHOR = "Wilms, C. and Rolff, T. and Hillemann, M. and Johanson, R. and Frintrop, S.",
TITLE = "{SOS}: Segment Object System for Open-world Instance Segmentation with
Object Priors",
BOOKTITLE = ECCV24,
YEAR = "2024",
PAGES = "XXVII: 165--182",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68109"}
@inproceedings{bb70415,
AUTHOR = "Jiao, S. and Zhu, H. G. and Huang, J. N. and Zhao, Y. and Wei, Y. C. and Shi, H.",
TITLE = "Collaborative Vision-text Representation Optimizing for Open-vocabulary
Segmentation",
BOOKTITLE = ECCV24,
YEAR = "2024",
PAGES = "XXXIII: 399--416",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68110"}
@inproceedings{bb70416,
AUTHOR = "Wysoczanska, M. and Simeoni, O. and Ramamonjisoa, M. and Bursuc, A. and Trzcinski, T. and Perez, P.",
TITLE = "{CLIP-DINOiser}: Teaching {CLIP} a Few {DINO} Tricks for Open-vocabulary
Semantic Segmentation",
BOOKTITLE = ECCV24,
YEAR = "2024",
PAGES = "LXI: 320--337",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68111"}
@inproceedings{bb70417,
AUTHOR = "Shao, T. and Tian, Z. and Zhao, H. and Su, J.",
TITLE = "Explore the Potential of {CLIP} for Training-free Open Vocabulary
Semantic Segmentation",
BOOKTITLE = ECCV24,
YEAR = "2024",
PAGES = "LXXXVI: 139--156",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68112"}
@inproceedings{bb70418,
AUTHOR = "Lan, M. C. and Chen, C. F. and Ke, Y. P. and Wang, X. J. and Feng, L. and Zhang, W.",
TITLE = "{ProxyCLIP}: Proxy Attention Improves {CLIP} for Open-vocabulary
Segmentation",
BOOKTITLE = ECCV24,
YEAR = "2024",
PAGES = "LXVIII: 70--88",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68113"}
@inproceedings{bb70419,
AUTHOR = "Jiang, L. and Shi, S. S. and Schiele, B.",
TITLE = "Open-Vocabulary {3D} Semantic Segmentation with Foundation Models",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "21284--21294",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68114"}
@inproceedings{bb70420,
AUTHOR = "Zhao, W. J. and Li, J. and Dong, X. and Xiang, Y. and Guo, Y. H.",
TITLE = "Segment Every Out-of-Distribution Object",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "3910--3920",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68115"}
@inproceedings{bb70421,
AUTHOR = "Liu, Y. and Bai, S. and Li, G. B. and Wang, Y. T. and Tang, Y. S.",
TITLE = "Open-Vocabulary Segmentation with Semantic-Assisted Calibration",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "3491--3500",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68116"}
@inproceedings{bb70422,
AUTHOR = "Bousselham, W. and Petersen, F. and Ferrari, V. and Kuehne, H.",
TITLE = "Grounding Everything: Emerging Localization Properties in
Vision-Language Transformers",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "3828--3837",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68117"}
@inproceedings{bb70423,
AUTHOR = "Wang, Y. and Sun, R. and Luo, N. and Pan, Y. and Zhang, T. Z.",
TITLE = "Image-to-Image Matching via Foundation Models: A New Perspective for
Open-Vocabulary Semantic Segmentation",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "3952--3963",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68118"}
@inproceedings{bb70424,
AUTHOR = "Nguyen, P. and Ngo, T. D. and Kalogerakis, E. and Gan, C. and Tran, A. and Pham, C. and Nguyen, K.",
TITLE = "{Open3DIS}: Open-Vocabulary {3D} Instance Segmentation with {2D} Mask
Guidance",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "4018--4028",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68119"}
@inproceedings{bb70425,
AUTHOR = "Luo, J. Y. and Khandelwal, S. and Sigal, L. and Li, B. Y.",
TITLE = "Emergent Open-Vocabulary Semantic Segmentation from Off-the-Shelf
Vision-Language Models",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "4029--4040",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68120"}
@inproceedings{bb70426,
AUTHOR = "Bourouis, A. and Fan, J. E. and Gryaditskaya, Y.",
TITLE = "Open Vocabulary Semantic Scene Sketch Understanding",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "4176--4186",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68121"}
@inproceedings{bb70427,
AUTHOR = "Wang, X. Q. and He, W. B. and Xuan, X. and Sebastian, C. and Ono, J. P. and Li, X. and Behpour, S. and Doan, T. and Gou, L. and Shen, H. W. and Ren, L.",
TITLE = "{USE}: Universal Segment Embeddings for Open-Vocabulary Image
Segmentation",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "4187--4196",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68122"}
@inproceedings{bb70428,
AUTHOR = "Marcos Manchon, P. and Alcover Couso, R. and SanMiguel, J. C. and Martinez, J. M.",
TITLE = "Open-Vocabulary Attention Maps with Token Optimization for Semantic
Segmentation in Diffusion Models",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "9242--9252",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68123"}
@inproceedings{bb70429,
AUTHOR = "Sun, S. Y. and Li, R. and Torr, P. and Gu, X. and Li, S. Y.",
TITLE = "{CLIP} as {RNN}: Segment Countless Visual Concepts without Training
Endeavor",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "13171--13182",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68124"}
@inproceedings{bb70430,
AUTHOR = "Kong, L. D. and Liu, Y. Q. and Ng, L. X. and Cottereau, B. R. and Ooi, W. T.",
TITLE = "{OpenESS}: Event-Based Semantic Scene Understanding with Open
Vocabularies",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "15686--15698",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68125"}
@inproceedings{bb70431,
AUTHOR = "Xu, J. X. and Chen, W. Y. and Zhao, Y. and Wei, Y. C.",
TITLE = "Transferable and Principled Efficiency for Open-Vocabulary
Segmentation",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "15814--15824",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68126"}
@inproceedings{bb70432,
AUTHOR = "Barsellotti, L. and Amoroso, R. and Cornia, M. and Baraldi, L. and Cucchiara, R.",
TITLE = "Training-Free Open-Vocabulary Segmentation with Offline
Diffusion-Augmented Prototype Generation",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "3689--3698",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68127"}
@inproceedings{bb70433,
AUTHOR = "Choe, S. A. and Shin, A. H. and Park, K. H. and Choi, J. and Park, G. M.",
TITLE = "Open-Set Domain Adaptation for Semantic Segmentation",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "23943--23953",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68128"}
@inproceedings{bb70434,
AUTHOR = "Shan, X. H. and Wu, D. Y. and Zhu, G. L. and Shao, Y. J. and Sang, N. and Gao, C. X.",
TITLE = "Open-Vocabulary Semantic Segmentation with Image Embedding Balancing",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "28412--28421",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68129"}
@inproceedings{bb70435,
AUTHOR = "Li, Z. and Zhou, Q. and Zhang, X. Y. and Zhang, Y. and Wang, Y. F. and Xie, W.",
TITLE = "Open-vocabulary Object Segmentation with Diffusion Models",
BOOKTITLE = ICCV23,
YEAR = "2023",
PAGES = "7633--7642",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68130"}
@inproceedings{bb70436,
AUTHOR = "Zhu, M. and Li, H. T. and Chen, H. and Fan, C. X. and Mao, W. and Jing, C. C. and Liu, Y. F. and Shen, C. H.",
TITLE = "{SegPrompt}:
Boosting Open-world Segmentation via Category-level Prompt Learning",
BOOKTITLE = ICCV23,
YEAR = "2023",
PAGES = "999--1008",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68131"}
@inproceedings{bb70437,
AUTHOR = "Zhang, H. and Li, F. and Zou, X. and Liu, S. L. and Li, C. Y. and Yang, J. W. and Zhang, L.",
TITLE = "A Simple Framework for Open-Vocabulary Segmentation and Detection",
BOOKTITLE = ICCV23,
YEAR = "2023",
PAGES = "1020--1031",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68132"}
@inproceedings{bb70438,
AUTHOR = "Huang, K. and Wang, F. and Xi, Y. and Gao, Y. T.",
TITLE = "Prototypical Kernel Learning and Open-set Foreground Perception for
Generalized Few-shot Semantic Segmentation",
BOOKTITLE = ICCV23,
YEAR = "2023",
PAGES = "19199--19208",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68133"}
@inproceedings{bb70439,
AUTHOR = "Cai, K. X. and Ren, P. Z. and Zhu, Y. and Xu, H. and Liu, J. Z. and Li, C. L. and Wang, G. R. and Liang, X. D.",
TITLE = "{MixReorg}: Cross-Modal Mixed Patch Reorganization is a Good Mask
Learner for Open-World Semantic Segmentation",
BOOKTITLE = ICCV23,
YEAR = "2023",
PAGES = "1196--1205",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68134"}
@inproceedings{bb70440,
AUTHOR = "Chen, J. and Zhu, D. and Qian, G. C. and Ghanem, B. and Yan, Z. C. and Zhu, C. C. and Xiao, F. Y. and Culatana, S. C. and Elhoseiny, M.",
TITLE = "Exploring Open-Vocabulary Semantic Segmentation from {CLIP} Vision
Encoder Distillation Only",
BOOKTITLE = ICCV23,
YEAR = "2023",
PAGES = "699--710",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68135"}
@inproceedings{bb70441,
AUTHOR = "Han, K. Y. and Liu, Y. and Liew, J. H. and Ding, H. H. and Liu, J. J. and Wang, Y. T. and Tang, Y. S. and Yang, Y. and Feng, J. S. and Zhao, Y. and Wei, Y. C.",
TITLE = "Global Knowledge Calibration for Fast Open-Vocabulary Segmentation",
BOOKTITLE = ICCV23,
YEAR = "2023",
PAGES = "797--807",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68136"}
@inproceedings{bb70442,
AUTHOR = "Barsellotti, L. and Amoroso, R. and Baraldi, L. and Cucchiara, R.",
TITLE = "{FOSSIL}: Free Open-Vocabulary Semantic Segmentation through Synthetic
References Retrieval",
BOOKTITLE = WACV24,
YEAR = "2024",
PAGES = "1453--1462",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68137"}
@inproceedings{bb70443,
AUTHOR = "Barsellotti, L. and Amoroso, R. and Baraldi, L. and Cucchiara, R.",
TITLE = "Enhancing Open-vocabulary Semantic Segmentation with Prototype
Retrieval",
BOOKTITLE = CIAP23,
YEAR = "2023",
PAGES = "II:196--208",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68138"}
@inproceedings{bb70444,
AUTHOR = "Xu, J. and Hou, J. L. and Zhang, Y. J. and Feng, R. and Wang, Y. and Qiao, Y. and Xie, W.",
TITLE = "Learning Open-Vocabulary Semantic Segmentation Models From Natural
Language Supervision",
BOOKTITLE = CVPR23,
YEAR = "2023",
PAGES = "2935--2944",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68139"}
@inproceedings{bb70445,
AUTHOR = "Cha, J. and Mun, J. and Roh, B.",
TITLE = "Learning to Generate Text-Grounded Mask for Open-World Semantic
Segmentation from Only Image-Text Pairs",
BOOKTITLE = CVPR23,
YEAR = "2023",
PAGES = "11165--11174",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68140"}
@inproceedings{bb70446,
AUTHOR = "Mukhoti, J. and Lin, T. Y. and Poursaeed, O. and Wang, R. and Shah, A. and Torr, P. H. S. and Lim, S. N.",
TITLE = "Open Vocabulary Semantic Segmentation with Patch Aligned Contrastive
Learning",
BOOKTITLE = CVPR23,
YEAR = "2023",
PAGES = "19413--19423",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68141"}
@inproceedings{bb70447,
AUTHOR = "Liang, F. and Wu, B. and Dai, X. L. and Li, K. P. and Zhao, Y. and Zhang, H. and Zhang, P. Z. and Vajda, P. and Marculescu, D.",
TITLE = "Open-Vocabulary Semantic Segmentation with Mask-adapted {CLIP}",
BOOKTITLE = CVPR23,
YEAR = "2023",
PAGES = "7061--7070",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68142"}
@inproceedings{bb70448,
AUTHOR = "Zabari, N. and Hoshen, Y.",
TITLE = "Open-vocabulary Semantic Segmentation Using Test-time Distillation",
BOOKTITLE = LLID22,
YEAR = "2022",
PAGES = "56--72",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68143"}
@inproceedings{bb70449,
AUTHOR = "Nunes, I. and Pereira, M. B. and Oliveira, H. and dos Santos, J. A. and Poggi, M.",
TITLE = "Conditional Reconstruction for Open-Set Semantic Segmentation",
BOOKTITLE = ICIP22,
YEAR = "2022",
PAGES = "946--950",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68144"}
@inproceedings{bb70450,
AUTHOR = "Liu, Q. D. and Wen, Y. P. and Han, J. H. and Xu, C. J. and Xu, H. and Liang, X. D.",
TITLE = "Open-World Semantic Segmentation via Contrasting and Clustering
Vision-Language Embedding",
BOOKTITLE = ECCV22,
YEAR = "2022",
PAGES = "XX:275--292",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350opse6.html#TT68145"}
@article{bb70451,
AUTHOR = "Jin, Y. and Han, D. and Ko, H. S.",
TITLE = "{TrSeg}: Transformer for semantic segmentation",
JOURNAL = PRL,
VOLUME = "148",
YEAR = "2021",
PAGES = "29--35",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68146"}
@article{bb70452,
AUTHOR = "Wang, L. and Li, R. and Zhang, C. and Fang, S. H. and Duan, C. X. and Meng, X. L. and Atkinson, P. M.",
TITLE = "{UNetFormer}: A {UNet}-like transformer for efficient semantic
segmentation of remote sensing urban scene imagery",
JOURNAL = PandRS,
VOLUME = "190",
YEAR = "2022",
PAGES = "196--214",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68147"}
@article{bb70453,
AUTHOR = "Li, Z. K. and Liu, Y. F. and Li, B. and Feng, B. L. and Wu, K. and Peng, C. W. and Hu, W. M.",
TITLE = "{SDTP}: Semantic-Aware Decoupled Transformer Pyramid for Dense Image
Prediction",
JOURNAL = CirSysVideo,
VOLUME = "32",
YEAR = "2022",
NUMBER = "9",
MONTH = sep,
PAGES = "6160--6173",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68148"}
@article{bb70454,
AUTHOR = "Mou, C. and Zhang, J.",
TITLE = "{TransCL}: Transformer Makes Strong and Flexible Compressive Learning",
JOURNAL = PAMI,
VOLUME = "45",
YEAR = "2023",
NUMBER = "4",
MONTH = apr,
PAGES = "5236--5251",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68149"}
@article{bb70455,
AUTHOR = "Lin, X. and Sun, S. Z. and Huang, W. and Sheng, B. and Li, P. and Feng, D. D.",
TITLE = "{EAPT}: Efficient Attention Pyramid Transformer for Image Processing",
JOURNAL = MultMed,
VOLUME = "25",
YEAR = "2023",
PAGES = "50--61",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68150"}
@article{bb70456,
AUTHOR = "Yu, L. and Xiang, W. and Fang, J. and Chen, Y. P. P. and Chi, L.",
TITLE = "{eX-ViT}: A Novel explainable vision transformer for weakly supervised
semantic segmentation",
JOURNAL = PR,
VOLUME = "142",
YEAR = "2023",
PAGES = "109666",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68151"}
@article{bb70457,
AUTHOR = "Quan, Y. and Zhang, D. and Zhang, L. Y. and Tang, J. H.",
TITLE = "Centralized Feature Pyramid for Object Detection",
JOURNAL = IP,
VOLUME = "32",
YEAR = "2023",
PAGES = "4341--4354",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68152"}
@article{bb70458,
AUTHOR = "Jin, Z. C. and Yu, D. D. and Yuan, Z. H. and Yu, L. Q.",
TITLE = "{MCIBI++}: Soft Mining Contextual Information Beyond Image for Semantic
Segmentation",
JOURNAL = PAMI,
VOLUME = "45",
YEAR = "2023",
NUMBER = "5",
MONTH = may,
PAGES = "5988--6005",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68153"}
@inproceedings{bb70459,
AUTHOR = "Jin, Z. C. and Gong, T. and Yu, D. D. and Chu, Q. and Wang, J. and Wang, C. H. and Shao, J.",
TITLE = "Mining Contextual Information Beyond Image for Semantic Segmentation",
BOOKTITLE = ICCV21,
YEAR = "2021",
PAGES = "7211--7221",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68154"}
@article{bb70460,
AUTHOR = "Zhang, J. M. and Liu, H. and Yang, K. L. and Hu, X. X. and Liu, R. P. and Stiefelhagen, R.",
TITLE = "{CMX}: Cross-Modal Fusion for {RGB-X} Semantic Segmentation With
Transformers",
JOURNAL = ITS,
VOLUME = "24",
YEAR = "2023",
NUMBER = "12",
MONTH = dec,
PAGES = "14679--14694",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68155"}
@article{bb70461,
AUTHOR = "Wang, D. L. and Chen, Y. and Naz, B. and Sun, L. and Li, B. Z.",
TITLE = "Spatial-Aware Transformer ({SAT}): Enhancing Global Modeling in
Transformer Segmentation for Remote Sensing Images",
JOURNAL = RS,
VOLUME = "15",
YEAR = "2023",
NUMBER = "14",
PAGES = "3607",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68156"}
@article{bb70462,
AUTHOR = "Yuan, Z. and Wang, J. H. and Lv, Y. X. and Wang, D. and Fang, Y.",
TITLE = "Laformer: Vision Transformer for Panoramic Image Semantic
Segmentation",
JOURNAL = SPLetters,
VOLUME = "30",
YEAR = "2023",
PAGES = "1792--1796",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68157"}
@article{bb70463,
AUTHOR = "Zhang, B. and Liu, L. Y. and Phan, M. H. and Tian, Z. and Shen, C. H. and Liu, Y. F.",
TITLE = "{SegViT} v2: Exploring Efficient and Continual Semantic Segmentation with
Plain Vision Transformers",
JOURNAL = IJCV,
VOLUME = "132",
YEAR = "2024",
NUMBER = "4",
MONTH = apr,
PAGES = "1126--1147",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68158"}
@article{bb70464,
AUTHOR = "Ding, H. J. and Wang, B. and Kang, G. L. and Li, W. J. and He, C. H. and Zhao, Y. and Wei, Y. C.",
TITLE = "{DropQueries}: A Simple Way to Discover Comprehensive Segment
Representations",
JOURNAL = MultMed,
VOLUME = "26",
YEAR = "2024",
PAGES = "3481--3490",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68159"}
@article{bb70465,
AUTHOR = "Deng, J. H. and Zhang, X. Y. and Li, W. and Duan, L. X. and Xu, D.",
TITLE = "Cross-Domain Detection Transformer Based on Spatial-Aware and
Semantic-Aware Token Alignment",
JOURNAL = MultMed,
VOLUME = "26",
YEAR = "2024",
PAGES = "5234--5245",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68160"}
% Note: entry bb70467 carries the same title and the same BIBSOURCE anchor (TT68161).
@article{bb70466,
AUTHOR = "Hong, W. X. and Ren, W. and Lao, J. W. and Xie, L. and Zhong, L. H. and Wang, J. and Chen, J. D. and Liu, H. H. and Chu, W.",
TITLE = "Training Object Detectors from Scratch:
An Empirical Study in the Era of Vision Transformer",
JOURNAL = IJCV,
VOLUME = "132",
YEAR = "2024",
NUMBER = "8",
MONTH = aug,
PAGES = "2929--2942",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68161"}
% Note: same title and BIBSOURCE anchor (TT68161) as bb70466; presumably the
% earlier conference version of that article -- confirm before merging or de-duplicating.
@inproceedings{bb70467,
AUTHOR = "Hong, W. X. and Lao, J. W. and Ren, W. and Wang, J. and Chen, J. D. and Liu, H. H.",
TITLE = "Training Object Detectors from Scratch:
An Empirical Study in the Era of Vision Transformer",
BOOKTITLE = CVPR22,
YEAR = "2022",
PAGES = "4652--4661",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68161"}
@article{bb70468,
AUTHOR = "Cao, H. and Chen, G. and Zhao, H. S. and Jiang, D. S. and Zhang, X. P. and Tian, Q. and Knoll, A.",
TITLE = "{SDPT}: Semantic-Aware Dimension-Pooling Transformer for Image
Segmentation",
JOURNAL = ITS,
VOLUME = "25",
YEAR = "2024",
NUMBER = "11",
MONTH = nov,
PAGES = "15934--15946",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68162"}
@article{bb70469,
AUTHOR = "Zeng, W. and Jin, S. and Xu, L. and Liu, W. T. and Qian, C. and Ouyang, W. L. and Luo, P. and Wang, X. G.",
TITLE = "{TCFormer}: Visual Recognition via Token Clustering Transformer",
JOURNAL = PAMI,
VOLUME = "46",
YEAR = "2024",
NUMBER = "12",
MONTH = dec,
PAGES = "9521--9535",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68163"}
@inproceedings{bb70470,
AUTHOR = "Zeng, W. and Jin, S. and Liu, W. T. and Qian, C. and Luo, P. and Ouyang, W. L. and Wang, X. G.",
TITLE = "Not All Tokens Are Equal:
Human-centric Visual Analysis via Token Clustering Transformer",
BOOKTITLE = CVPR22,
YEAR = "2022",
PAGES = "11091--11101",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68164"}
@article{bb70471,
AUTHOR = "Li, Z. H. and Li, Y. X. and Li, Q. D. and Wang, P. and Guo, D. and Lu, L. and Jin, D. and Zhang, Y. and Hong, Q. Q.",
TITLE = "{LViT}: Language Meets Vision Transformer in Medical Image Segmentation",
JOURNAL = MedImg,
VOLUME = "43",
YEAR = "2024",
NUMBER = "1",
MONTH = jan,
PAGES = "96--107",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68165"}
@article{bb70472,
AUTHOR = "Ma, X. Y. and Lv, P. Y. and Gong, X. Q.",
TITLE = "{SSOD-QCTR}: Semi-Supervised Query Consistent Transformer for Optical
Remote Sensing Image Object Detection",
JOURNAL = RS,
VOLUME = "16",
YEAR = "2024",
NUMBER = "23",
PAGES = "4556",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68166"}
@article{bb70473,
AUTHOR = "Chen, S. and Han, T. and Zhang, C. S. and Su, J. and Wang, R. S. and Chen, Y. P. and Wang, Z. Y. and Cai, G. R.",
TITLE = "{HSPFormer}: Hierarchical Spatial Perception Transformer for Semantic
Segmentation",
JOURNAL = ITS,
VOLUME = "26",
YEAR = "2025",
NUMBER = "4",
MONTH = apr,
PAGES = "4975--4987",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68167"}
@article{bb70474,
AUTHOR = "Li, Y. and Jiao, L. C. and Liu, X. and Liu, F. and Li, L. L. and Chen, P.",
TITLE = "{LGSNet}: Local-Global Semantics Learning Object Detection",
JOURNAL = MultMed,
VOLUME = "27",
YEAR = "2025",
PAGES = "2281--2292",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68168"}
@article{bb70475,
AUTHOR = "Liu, Y. Z. and Yan, T. X.",
TITLE = "Vision transformer enhanced with convolutional attention and graph
convolution for semantic segmentation",
JOURNAL = IVC,
VOLUME = "161",
YEAR = "2025",
PAGES = "105633",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68169"}
@inproceedings{bb70476,
AUTHOR = "Zhou, Y. F. and Li, L. R. and Lu, L. and Xu, M. F.",
TITLE = "{nnWNet}: Rethinking the Use of Transformers in Biomedical Image
Segmentation and Calling for a Unified Evaluation Benchmark",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "20852--20862",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68170"}
@inproceedings{bb70477,
AUTHOR = "Arica, S. and Rubin, O. and Gershov, S. and Laufer, S.",
TITLE = "{CuVLER}: Enhanced Unsupervised Object Discoveries through Exhaustive
Self-Supervised Transformers",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "23105--23114",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68171"}
@inproceedings{bb70478,
AUTHOR = "Yu, H. W. and Cho, Y. and Kang, B. and Moon, S. and Kong, K. and Kang, S. J.",
TITLE = "Embedding-free Transformer with Inference Spatial Reduction for
Efficient Semantic Segmentation",
BOOKTITLE = ECCV24,
YEAR = "2024",
PAGES = "XLII: 92--110",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68172"}
@inproceedings{bb70479,
AUTHOR = "Zhang, D. Y. and Liang, D. K. and Tan, Z. C. and Ye, X. Q. and Zhang, C. and Wang, J. D. and Bai, X.",
TITLE = "Make Your {ViT}-based Multi-view {3D} Detectors Faster via Token
Compression",
BOOKTITLE = ECCV24,
YEAR = "2024",
PAGES = "XLVII: 56--72",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68173"}
@inproceedings{bb70480,
AUTHOR = "Rojas Gomez, R. A. and Lim, T. Y. F. and Do, M. N. and Yeh, R. A.",
TITLE = "Making Vision Transformers Truly Shift-Equivariant",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "5568--5577",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68174"}
@inproceedings{bb70481,
AUTHOR = "Wang, S. and Li, J. and Zhao, Z. and Lian, D. Z. and Huang, B. B. and Wang, X. M. and Li, Z. X. and Gao, S. H.",
TITLE = "{TSP-Transformer}: Task-Specific Prompts Boosted Transformer for
Holistic Scene Understanding",
BOOKTITLE = WACV24,
YEAR = "2024",
PAGES = "914--923",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68175"}
@inproceedings{bb70482,
AUTHOR = "Kang, B. and Moon, S. and Cho, Y. and Yu, H. W. and Kang, S. J.",
TITLE = "{MetaSeg}: {MetaFormer}-based Global Contexts-aware Network for Efficient
Semantic Segmentation",
BOOKTITLE = WACV24,
YEAR = "2024",
PAGES = "433--442",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68176"}
@inproceedings{bb70483,
AUTHOR = "Koohpayegani, S. A. and Pirsiavash, H.",
TITLE = "{SimA}: Simple Softmax-free Attention for Vision Transformers",
BOOKTITLE = WACV24,
YEAR = "2024",
PAGES = "2595--2605",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68177"}
@inproceedings{bb70484,
AUTHOR = "Kluska, P. and Castello, A. and Scheidegger, F. and Malossi, A. C. I. and Quintana Orti, E. S.",
TITLE = "{QAttn}: Efficient {GPU} Kernels for mixed-precision Vision Transformers",
BOOKTITLE = LargeVM24,
YEAR = "2024",
PAGES = "3648--3657",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68178"}
@inproceedings{bb70485,
AUTHOR = "Jain, J. and Singh, A. and Orlov, N. and Huang, Z. L. and Li, J. C. and Walton, S. and Shi, H.",
TITLE = "{SeMask}: Semantically Masked Transformers for Semantic Segmentation",
BOOKTITLE = NIVT23,
YEAR = "2023",
PAGES = "752--761",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68179"}
@inproceedings{bb70486,
AUTHOR = "Wang, K. and Kim, D. H. and Feris, R. S. and Betke, M.",
TITLE = "{CDAC}: Cross-domain Attention Consistency in Transformer for Domain
Adaptive Semantic Segmentation",
BOOKTITLE = ICCV23,
YEAR = "2023",
PAGES = "11485--11495",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68180"}
@inproceedings{bb70487,
AUTHOR = "Tang, Q. and Zhang, B. and Liu, J. J. and Liu, F. G. and Liu, Y. F.",
TITLE = "Dynamic Token Pruning in Plain Vision Transformers for Semantic
Segmentation",
BOOKTITLE = ICCV23,
YEAR = "2023",
PAGES = "777--786",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68181"}
@inproceedings{bb70488,
AUTHOR = "Shi, H. and Hayat, M. and Cai, J. F.",
TITLE = "Transformer Scale Gate for Semantic Segmentation",
BOOKTITLE = CVPR23,
YEAR = "2023",
PAGES = "3051--3060",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68182"}
@inproceedings{bb70489,
AUTHOR = "Mo, S. T. and Sun, Z. and Li, C.",
TITLE = "Multi-level Contrastive Learning for Self-Supervised Vision
Transformers",
BOOKTITLE = WACV23,
YEAR = "2023",
PAGES = "2777--2786",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68183"}
@inproceedings{bb70490,
AUTHOR = "Marin, D. and Chang, J. H. R. and Ranjan, A. and Prabhu, A. and Rastegari, M. and Tuzel, O.",
TITLE = "Token Pooling in Vision Transformers for Image Classification",
BOOKTITLE = WACV23,
YEAR = "2023",
PAGES = "12--21",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68184"}
@inproceedings{bb70491,
AUTHOR = "Chen, J. N. and Sun, S. Y. and He, J. and Torr, P. H. S. and Yuille, A. L. and Bai, S.",
TITLE = "{TransMix}: Attend to Mix for Vision Transformers",
BOOKTITLE = CVPR22,
YEAR = "2022",
PAGES = "12125--12134",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68185"}
@inproceedings{bb70492,
AUTHOR = "Liu, H. and Jiang, X. H. and Li, X. and Bao, Z. M. and Jiang, D. Q. and Ren, B.",
TITLE = "{NomMer}: Nominate Synergistic Context in Vision Transformer for Visual
Recognition",
BOOKTITLE = CVPR22,
YEAR = "2022",
PAGES = "12063--12072",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68186"}
@inproceedings{bb70493,
AUTHOR = "Guo, J. Y. and Tang, Y. H. and Han, K. and Chen, X. H. and Wu, H. and Xu, C. and Xu, C. and Wang, Y. H.",
TITLE = "{Hire-MLP}: Vision {MLP} via Hierarchical Rearrangement",
BOOKTITLE = CVPR22,
YEAR = "2022",
PAGES = "816--826",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68187"}
@inproceedings{bb70494,
AUTHOR = "Lee, Y. and Kim, J. and Willette, J. and Hwang, S. J.",
TITLE = "{MPViT}: Multi-Path Vision Transformer for Dense Prediction",
BOOKTITLE = CVPR22,
YEAR = "2022",
PAGES = "7277--7286",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68188"}
@inproceedings{bb70495,
AUTHOR = "Li, W. and Li, Z. X.",
TITLE = "{Causal-SETR}:
A {SEgmentation} {TRansformer} Variant Based on Causal Intervention",
BOOKTITLE = ACCV22,
YEAR = "2022",
PAGES = "VII:414--430",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68189"}
@inproceedings{bb70496,
AUTHOR = "Lin, F. J. and Wu, S. T. and Ma, Y. Z. and Tian, S. W.",
TITLE = "Full-scale Selective Transformer for Semantic Segmentation",
BOOKTITLE = ACCV22,
YEAR = "2022",
PAGES = "VII:310--326",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68190"}
@inproceedings{bb70497,
AUTHOR = "Rossetti, S. and Zappia, D. and Sanzari, M. and Schaerf, M. and Pirri, F.",
TITLE = "Max Pooling with Vision Transformers Reconciles Class and Shape in
Weakly Supervised Semantic Segmentation",
BOOKTITLE = ECCV22,
YEAR = "2022",
PAGES = "XXX:446--463",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68191"}
@inproceedings{bb70498,
AUTHOR = "Themyr, L. and Rambour, C. and Thome, N. and Collins, T. and Hostettler, A.",
TITLE = "Full Contextual Attention for Multi-resolution Transformers in
Semantic Segmentation",
BOOKTITLE = WACV23,
YEAR = "2023",
PAGES = "3223--3232",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68192"}
@inproceedings{bb70499,
AUTHOR = "Shi, B. and Jiang, D. S. and Zhang, X. P. and Li, H. and Dai, W. R. and Zou, J. and Xiong, H. K. and Tian, Q.",
TITLE = "A Transformer-Based Decoder for Semantic Segmentation with Multi-level
Context Mining",
BOOKTITLE = ECCV22,
YEAR = "2022",
PAGES = "XXVIII:624--639",
BIBSOURCE = "http://www.visionbib.com/bibliography/segment350trs5.html#TT68193"}
Last update: Jun 4, 2026 at 16:38:45