Keith Price Bibliography Bibtex Entry (ANCHOR 101400 URL http://dx.doi.org/10.1109/CVPR52729.2023.00821 TYPE CONFERENCE PAGES 8496-8506 YEAR 2023 MONTH NIL BIBSOURCE http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98157 VOLUME NIL JOURNAL CVPR23 AUTHOR Kim, S.W. and Brown, B. and Yin, K.X. and Kreis, K. and Schwarz, K. and Li, D. and Rombach, R. and Torralba, A. and Fidler, S. TITLE NeuralField-LDM: Scene Generation with Hierarchical Latent Diffusion Models)


@inproceedings{bb101400,
        AUTHOR = "Kim, S. W. and Brown, B. and Yin, K. X. and Kreis, K. and Schwarz, K. and Li, D. and Rombach, R. and Torralba, A. and Fidler, S.",
        TITLE = "{NeuralField-LDM}: Scene Generation with Hierarchical Latent Diffusion Models",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "8496--8506",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98157"}

@inproceedings{bb101401,
        AUTHOR = "Zhu, Y. Z. and Li, Z. H. and Wang, T. W. and He, M. C. and Yao, C.",
        TITLE = "Conditional Text Image Generation with Diffusion Models",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "14235--14244",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98158"}

@inproceedings{bb101402,
        AUTHOR = "Zhou, Y. F. and Liu, B. C. and Zhu, Y. Z. and Yang, X. and Chen, C. Y. and Xu, J. H.",
        TITLE = "Shifted Diffusion for Text-to-image Generation",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "10157--10166",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98159"}

@inproceedings{bb101403,
        AUTHOR = "Li, M. H. and Duan, Y. Q. and Zhou, J. and Lu, J. W.",
        TITLE = "{Diffusion-SDF}: Text-to-Shape via Voxelized Diffusion",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "12642--12651",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98160"}

@inproceedings{bb101404,
        AUTHOR = "Chai, S. and Zhuang, L. S. and Yan, F. Y.",
        TITLE = "{LayoutDM}: Transformer-based Diffusion Model for Layout Generation",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "18349--18358",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98161"}

@inproceedings{bb101405,
        AUTHOR = "Wu, Q. C. and Liu, Y. J. and Zhao, H. and Kale, A. and Bui, T. and Yu, T. and Lin, Z. and Zhang, Y. and Chang, S. Y.",
        TITLE = "Uncovering the Disentanglement Capability in Text-to-Image Diffusion Models",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "1900--1910",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98162"}

@inproceedings{bb101406,
        AUTHOR = "Jain, A. and Xie, A. and Abbeel, P.",
        TITLE = "{VectorFusion}: Text-to-{SVG} by Abstracting Pixel-Based Diffusion Models",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "1911--1920",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98163"}

@inproceedings{bb101407,
        AUTHOR = "Kumari, N. and Zhang, B. L. and Zhang, R. and Shechtman, E. and Zhu, J. Y.",
        TITLE = "Multi-Concept Customization of Text-to-Image Diffusion",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "1931--1941",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98164"}

@inproceedings{bb101408,
        AUTHOR = "Hui, M. and Zhang, Z. Z. and Zhang, X. Y. and Xie, W. X. and Wang, Y. W. and Lu, Y.",
        TITLE = "Unifying Layout Generation with a Decoupled Diffusion Model",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "1942--1951",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98165"}

@inproceedings{bb101409,
        AUTHOR = "Ruiz, N. and Li, Y. Z. and Jampani, V. and Pritch, Y. and Rubinstein, M. and Aberman, K.",
        TITLE = "{DreamBooth}: Fine Tuning Text-to-Image Diffusion Models for Subject-Driven Generation",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "22500--22510",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98166"}

@inproceedings{bb101410,
        AUTHOR = "Zheng, G. C. and Zhou, X. P. and Li, X. W. and Qi, Z. A. and Shan, Y. and Li, X.",
        TITLE = "{LayoutDiffusion}: Controllable Diffusion Model for Layout-to-Image Generation",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "22490--22499",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98167"}

@inproceedings{bb101411,
        AUTHOR = "Liu, X. H. and Park, D. H. and Azadi, S. and Zhang, G. and Chopikyan, A. and Hu, Y. X. and Shi, H. and Rohrbach, A. and Darrell, T. J.",
        TITLE = "More Control for Free! {Image} Synthesis with Semantic Diffusion Guidance",
        BOOKTITLE = WACV23,
        YEAR = "2023",
        PAGES = "289--299",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98168"}

@inproceedings{bb101412,
        AUTHOR = "Pan, Z. H. and Zhou, X. and Tian, H.",
        TITLE = "Arbitrary Style Guidance for Enhanced Diffusion-Based Text-to-Image Generation",
        BOOKTITLE = WACV23,
        YEAR = "2023",
        PAGES = "4450--4460",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98169"}

@inproceedings{bb101413,
        AUTHOR = "Gu, S. Y. and Chen, D. and Bao, J. M. and Wen, F. and Zhang, B. and Chen, D. D. and Yuan, L. and Guo, B. N.",
        TITLE = "Vector Quantized Diffusion Model for Text-to-Image Synthesis",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "10686--10696",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98170"}

@inproceedings{bb101414,
        AUTHOR = "Jing, B. and Corso, G. and Berlinghieri, R. and Jaakkola, T.",
        TITLE = "Subspace Diffusion Generative Models",
        BOOKTITLE = ECCV22,
        YEAR = "2022",
        PAGES = "XXIII:274--289",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98171"}

@inproceedings{bb101415,
        AUTHOR = "Han, L. G. and Li, Y. X. and Zhang, H. and Milanfar, P. and Metaxas, D. N. and Yang, F.",
        TITLE = "{SVDiff}: Compact Parameter Space for Diffusion Fine-Tuning",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "7289--7300",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98172"}

@inproceedings{bb101416,
        AUTHOR = "Nair, N. G. and Bandara, W. G. C. and Patel, V. M.",
        TITLE = "Unite and Conquer: Plug and Play Multi-Modal Synthesis Using Diffusion Models",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "6070--6079",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98173"}

@inproceedings{bb101417,
        AUTHOR = "Zheng, G. and Li, S. M. and Wang, H. and Yao, T. P. and Chen, Y. and Ding, S. H. and Li, X.",
        TITLE = "Entropy-Driven Sampling and Training Scheme for Conditional Diffusion Generation",
        BOOKTITLE = ECCV22,
        YEAR = "2022",
        PAGES = "XXII:754--769",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98174"}

@inproceedings{bb101418,
        AUTHOR = "Sehwag, V. and Hazirbas, C. and Gordo, A. and Ozgenel, F. and Ferrer, C. C.",
        TITLE = "Generating High Fidelity Data from Low-density Regions using Diffusion Models",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "11482--11491",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT98175"}

@article{bb101419,
        AUTHOR = "Lin, Z. H. and Lin, M. and Zhan, W. and Ji, R. R.",
        TITLE = "{AccDiffusion} v2: Toward More Accurate Higher-Resolution Diffusion Extrapolation",
        JOURNAL = PAMI,
        VOLUME = "47",
        YEAR = "2025",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "8351--8363",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98176"}

% NOTE(review): the "?" after "Infinity" in the exported title looks like a
% lost infinity symbol; restored here as math \infty -- confirm against the paper.
@inproceedings{bb101420,
        AUTHOR = "Han, J. and Liu, J. and Jiang, Y. and Yan, B. and Zhang, Y. Q. and Yuan, Z. H. and Peng, B. Y. and Liu, X. B.",
        TITLE = "Infinity{$\infty$}: Scaling Bitwise {AutoRegressive} Modeling for High-Resolution Image Synthesis",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "15733--15744",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98177"}

@inproceedings{bb101421,
        AUTHOR = "Jeong, J. H. and Han, S. and Kim, J. and Kim, S. J.",
        TITLE = "Latent Space Super-Resolution for Higher-Resolution Image Generation with Diffusion Models",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "2355--2365",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98178"}

@inproceedings{bb101422,
        AUTHOR = "Liu, Q. H. and Yin, X. and Yuille, A. L. and Brown, A. and Singh, M.",
        TITLE = "Flowing from Words to Pixels: A Noise-Free Framework for Cross-Modality Evolution",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "2755--2765",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98179"}

@inproceedings{bb101423,
        AUTHOR = "Choi, S. and Yun, J. and Park, J. and Choo, J.",
        TITLE = "Disentangling Subject-Irrelevant Elements in Personalized Text-to-Image Diffusion via Filtered Self-Distillation",
        BOOKTITLE = WACV25,
        YEAR = "2025",
        PAGES = "9073--9082",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98180"}

@inproceedings{bb101424,
        AUTHOR = "Wu, H. N. and Shen, S. C. and Hu, Q. and Zhang, X. Y. and Zhang, Y. and Wang, Y. F.",
        TITLE = "{MegaFusion}: Extend Diffusion Models towards Higher-resolution Image Generation without Further Tuning",
        BOOKTITLE = WACV25,
        YEAR = "2025",
        PAGES = "3944--3953",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98181"}

@inproceedings{bb101425,
        AUTHOR = "Zhang, S. and Chen, Z. W. and Zhao, Z. Y. and Chen, Y. H. and Tang, Y. and Liang, J. J.",
        TITLE = "{HiDiffusion}: Unlocking Higher-resolution Creativity and Efficiency in Pretrained Diffusion Models",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "LI: 145--161",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98182"}

@inproceedings{bb101426,
        AUTHOR = "Huang, L. J. and Fang, R. Y. and Zhang, A. P. and Song, G. L. and Liu, S. and Liu, Y. and Li, H. S.",
        TITLE = "{FouriScale}: A Frequency Perspective on Training-free High-resolution Image Synthesis",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "XII: 196--212",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98183"}

@inproceedings{bb101427,
        AUTHOR = "Kim, G. and Kim, H. and Seo, H. and Kang, D. U. and Chun, S. Y.",
        TITLE = "{BeyondScene}: Higher-resolution Human-centric Scene Generation with Pretrained Diffusion",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "LXIV: 126--142",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98184"}

@inproceedings{bb101428,
        AUTHOR = "Lin, Z. H. and Lin, M. B. and Zhao, M. and Ji, R. R.",
        TITLE = "{AccDiffusion}: An Accurate Method for Higher-resolution Image Generation",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "VI: 38--53",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98185"}

@inproceedings{bb101429,
        AUTHOR = "Li, M. Y. and Cai, T. and Cao, J. X. and Zhang, Q. S. and Cai, H. and Bai, J. J. and Jia, Y. Q. and Li, K. and Han, S.",
        TITLE = "{DistriFusion}: Distributed Parallel Inference for High-Resolution Diffusion Models",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "7183--7193",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98186"}

% NOTE(review): the dollar signs are escaped so LaTeX does not switch to math
% mode. The export carried two; the published title is believed to end in
% three -- confirm against the paper.
@inproceedings{bb101430,
        AUTHOR = "Du, R. and Chang, D. L. and Hospedales, T. and Song, Y. Z. and Ma, Z. Y.",
        TITLE = "{DemoFusion}: Democratising High-Resolution Image Generation With No \$\$\$",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "6159--6168",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98187"}

@inproceedings{bb101431,
        AUTHOR = "Zhou, J. X. and Ding, T. Y. and Chen, T. Y. and Jiang, J. C. and Zharkov, I. and Zhu, Z. H. and Liang, L.",
        TITLE = "{DREAM}: Diffusion Rectification and Estimation-Adaptive Models",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "8342--8351",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98188"}

@inproceedings{bb101432,
        AUTHOR = "Sun, H. and Li, W. B. and Liu, J. Z. and Chen, H. Y. and Pei, R. and Zou, X. and Yan, Y. and Yang, Y.",
        TITLE = "{CoSeR}: Bridging Image and Language for Cognitive Super-Resolution",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "25868--25878",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98189"}

@inproceedings{bb101433,
        AUTHOR = "Mei, K. and Delbracio, M. and Talebi, H. and Tu, Z. Z. and Patel, V. M. and Milanfar, P.",
        TITLE = "{CoDi}: Conditional Diffusion Distillation for Higher-Fidelity and Faster Image Generation",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "9048--9058",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98190"}

@inproceedings{bb101434,
        AUTHOR = "Gandikota, K. V. and Chandramouli, P.",
        TITLE = "Text-Guided Explorable Image Super-Resolution",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "25900--25911",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98191"}

@inproceedings{bb101435,
        AUTHOR = "Zhao, T. C. and Ning, X. F. and Fang, T. and Liu, E. and Huang, G. and Lin, Z. and Yan, S. and Dai, G. H. and Wang, Y.",
        TITLE = "{MixDQ}: Memory-efficient Few-step Text-to-image Diffusion Models with Metric-decoupled Mixed Precision Quantization",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "XIV: 285--302",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98192"}

@inproceedings{bb101436,
        AUTHOR = "Parihar, R. and Sachidanand, V. S. and Mani, S. and Karmali, T. and Babu, R. V.",
        TITLE = "{PreciseControl}: Enhancing Text-to-image Diffusion Models with Fine-grained Attribute Control",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "LXXXII: 469--487",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98193"}

@inproceedings{bb101437,
        AUTHOR = "Gandikota, R. and Materzynska, J. and Zhou, T. and Torralba, A. and Bau, D.",
        TITLE = "Concept Sliders: {LoRA} Adaptors for Precise Control in Diffusion Models",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "XL: 172--188",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489hresdift2i5.html#TT98194"}

@article{bb101438,
        AUTHOR = "Naveen, S. and Ram Kiran, M. S. and Indupriya, M. and Manikanta, T. V. and Sudeep, P. V.",
        TITLE = "Transformer models for enhancing {AttnGAN} based text to image generation",
        JOURNAL = IVC,
        VOLUME = "115",
        YEAR = "2021",
        PAGES = "104284",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98195"}

@article{bb101439,
        AUTHOR = "Dalmaz, O. and Yurt, M. and Cukur, T.",
        TITLE = "{ResViT}: Residual Vision Transformers for Multimodal Medical Image Synthesis",
        JOURNAL = MedImg,
        VOLUME = "41",
        YEAR = "2022",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "2598--2614",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98196"}

@article{bb101440,
        AUTHOR = "Zhang, X. and Jiao, W. T. and Wang, B. and Tian, X. D.",
        TITLE = "{CT-GAN}: A conditional Generative Adversarial Network of transformer architecture for text-to-image",
        JOURNAL = SP:IC,
        VOLUME = "115",
        YEAR = "2023",
        PAGES = "116959",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98197"}

@article{bb101441,
        author    = {Sortino, R. and Palazzo, S. and Rundo, F. and Spampinato, C.},
        title     = {Transformer-based image generation from scene graphs},
        journal   = CVIU,
        volume    = {233},
        year      = {2023},
        pages     = {103721},
        bibsource = {http://www.visionbib.com/bibliography/describe489synvit5.html#TT98198}
}

@inproceedings{bb101442,
        AUTHOR = "Sortino, R. and Palazzo, S. and Spampinato, C.",
        TITLE = "Transforming Image Generation from Scene Graphs",
        BOOKTITLE = "ICPR22",
        YEAR = "2022",
        PAGES = "4118--4124",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98199"}

@inproceedings{bb101443,
        AUTHOR = "Wang, Z. C. and Ren, Q. and Wang, J. L. and Yan, C. G. and Jiang, C. J.",
        TITLE = "{MUSH}: Multi-scale Hierarchical Feature Extraction for Semantic Image Synthesis",
        BOOKTITLE = ACCV22,
        YEAR = "2022",
        PAGES = "VII:185--201",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98200"}

@article{bb101444,
        AUTHOR = "Wei, Z. P. and Chen, J. J. and Goldblum, M. and Wu, Z. X. and Goldstein, T. and Jiang, Y. G. and Davis, L. S.",
        TITLE = "Towards Transferable Adversarial Attacks on Image and Video Transformers",
        JOURNAL = IP,
        VOLUME = "32",
        YEAR = "2023",
        PAGES = "6346--6358",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98201"}

@article{bb101445,
        AUTHOR = "Wei, Z. P. and Chen, J. J. and Wu, Z. X. and Jiang, Y. G.",
        TITLE = "Adaptive Cross-Modal Transferable Adversarial Attacks From Images to Videos",
        JOURNAL = PAMI,
        VOLUME = "46",
        YEAR = "2024",
        NUMBER = "5",
        MONTH = may,
        PAGES = "3772--3783",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98202"}

@inproceedings{bb101446,
        AUTHOR = "Wei, Z. P. and Chen, J. J. and Wu, Z. X. and Jiang, Y. G.",
        TITLE = "Cross-Modal Transferable Adversarial Attacks from Images to Videos",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "15044--15053",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98203"}

@article{bb101447,
        AUTHOR = "Bahani, M. and El Ouaazizi, A. and Maalmi, K.",
        TITLE = "The effectiveness of {T5}, {GPT-2}, and {BERT} on text-to-image generation task",
        JOURNAL = PRL,
        VOLUME = "173",
        YEAR = "2023",
        PAGES = "57--63",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98204"}

@article{bb101448,
        AUTHOR = "Su, S. and Zhu, J. C. and Gao, L. L. and Song, J. K.",
        TITLE = "Utilizing Greedy Nature for Multimodal Conditional Image Synthesis in Transformers",
        JOURNAL = MultMed,
        VOLUME = "26",
        YEAR = "2024",
        PAGES = "2354--2366",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98205"}

@article{bb101449,
        author    = {Li, Z. and Liu, F.},
        title     = {Scalable video transformer for full-frame video prediction},
        journal   = CVIU,
        volume    = {249},
        year      = {2024},
        pages     = {104166},
        bibsource = {http://www.visionbib.com/bibliography/describe489synvit5.html#TT98206}
}

@article{bb101450,
        AUTHOR = "Cao, B. and Qi, G. L. and Zhao, J. M. and Zhu, P. F. and Hu, Q. H. and Gao, X. B.",
        TITLE = "{RTF}: Recursive {TransFusion} for Multi-Modal Image Synthesis",
        JOURNAL = IP,
        VOLUME = "34",
        YEAR = "2025",
        PAGES = "1573--1587",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98207"}

% NOTE(review): pages 3537--3565 look inconsistent with NUMBER 1 / January;
% bb101482 lists pages 4456--4472 for number 10 of the same IJCV volume.
% Verify the issue number and month against the publisher record.
@article{bb101451,
        AUTHOR = "Zheng, J. B. and Liu, D. Q. and Wang, C. Y. and Hu, M. H. and Yang, Z. P. and Ding, C. X. and Tao, D. C.",
        TITLE = "{MMoT}: Mixture-of-Modality-Tokens Transformer for Composed Multimodal Conditional Image Synthesis",
        JOURNAL = IJCV,
        VOLUME = "132",
        YEAR = "2024",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "3537--3565",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98208"}

@inproceedings{bb101452,
        AUTHOR = "Wu, C. Y. and Chen, X. K. and Wu, Z. Y. and Ma, Y. Y. and Liu, X. C. and Pan, Z. Z. and Liu, W. and Xie, Z. and Yu, X. K. and Ruan, C. and Luo, P.",
        TITLE = "Janus: Decoupling Visual Encoding for Unified Multimodal Understanding and Generation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "12966--12977",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98209"}

@inproceedings{bb101453,
        AUTHOR = "Zha, K. W. and Yu, L. J. and Fathi, A. and Ross, D. A. and Schmid, C. and Katabi, D. and Gu, X.",
        TITLE = "Language-Guided Image Tokenization for Generation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "15713--15722",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98210"}

@inproceedings{bb101454,
        AUTHOR = "Tu, K. Y. and Huang, M. Q. and Chen, Z. and Mao, Z. D.",
        TITLE = "{A4A}: Adapter for Adapter Transfer via All-for-All Mapping for Cross-Architecture Models",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "18476--18485",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98211"}

@inproceedings{bb101455,
        AUTHOR = "Wang, H. J. and Byeon, W. and Xu, J. R. and Gu, J. and Cheung, K. C. and Wang, X. L. and Han, K. and Kautz, J. and Liu, S.",
        TITLE = "Parallel Sequence Modeling via Generalized Spatial Propagation Network",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "4473--4483",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98212"}

@inproceedings{bb101456,
        AUTHOR = "Deng, J. Y. and Wu, X. and Yang, Y. X. and Zhu, C. C. and Wang, S. and Wu, Z. Y.",
        TITLE = "Acquire and then Adapt: Squeezing out Text-to-Image Model for Image Restoration",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "23195--23206",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98213"}

@inproceedings{bb101457,
        AUTHOR = "Choudhury, Z. Z. and McCane, B. and Coffey, S.",
        TITLE = "Medical Image Synthesis Using Autoencoder with Vision Transformer",
        BOOKTITLE = IVCNZ24,
        YEAR = "2024",
        PAGES = "1--6",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98214"}

@inproceedings{bb101458,
        AUTHOR = "Tschannen, M. and Eastwood, C. and Mentzer, F.",
        TITLE = "{GIVT}: Generative Infinite-vocabulary Transformers",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "LVII: 292--309",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98215"}

% NOTE(review): first author normalised to "Ni, Z. L." to match bb101463,
% which shares most co-authors -- presumably the same person; confirm.
@inproceedings{bb101459,
        AUTHOR = "Ni, Z. L. and Wang, Y. L. and Zhou, R. P. and Lu, R. and Guo, J. Y. and Hu, J. Y. and Liu, Z. Y. and Yao, Y. and Huang, G.",
        TITLE = "{AdaNAT}: Exploring Adaptive Policy for Token-based Image Generation",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "XVI: 302--319",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98216"}

@inproceedings{bb101460,
        AUTHOR = "Xu, M. and Lin, M. Y. and Ren, Q. and Jia, S.",
        TITLE = "{SSTHyper}: Sparse Spectral Transformer for Hyperspectral Image Reconstruction",
        BOOKTITLE = ACCV24,
        YEAR = "2024",
        PAGES = "IV: 142--159",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98217"}

@inproceedings{bb101461,
        AUTHOR = "Hatamizadeh, A. and Song, J. M. and Liu, G. L. and Kautz, J. and Vahdat, A.",
        TITLE = "{DiffiT}: Diffusion Vision Transformers for Image Generation",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "VIII: 37--55",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98218"}

@inproceedings{bb101462,
        AUTHOR = "Gu, Y. C. and Wang, X. T. and Ge, Y. X. and Shan, Y. and Shou, M. Z.",
        TITLE = "Rethinking the Objectives of Vector-Quantized Tokenizers for Image Synthesis",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "7631--7640",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98219"}

@inproceedings{bb101463,
        AUTHOR = "Ni, Z. L. and Wang, Y. L. and Zhou, R. P. and Guo, J. Y. and Hu, J. Y. and Liu, Z. Y. and Song, S. and Yao, Y. and Huang, G.",
        TITLE = "Revisiting Non-Autoregressive Transformers for Efficient Image Synthesis",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "7007--7016",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98220"}

@inproceedings{bb101464,
        AUTHOR = "Zhao, Y. Q. and Zhao, Z. and Li, J. and Dong, S. and Gao, S. H.",
        TITLE = "{RoomDesigner}: Encoding Anchor-latents for Style-consistent and Shape-compatible Indoor Scene Generation",
        BOOKTITLE = "3DV24",
        YEAR = "2024",
        PAGES = "1413--1423",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98221"}

@inproceedings{bb101465,
        AUTHOR = "Cai, H. and Li, M. and Zhang, Q. S. and Liu, M. Y. and Han, S.",
        TITLE = "Condition-Aware Neural Network for Controlled Image Generation",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "7194--7203",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98222"}

@inproceedings{bb101466,
        AUTHOR = "Zheng, S. and Yuan, X.",
        TITLE = "Unfolding Framework with Prior of Convolution-Transformer Mixture and Uncertainty Estimation for Video Snapshot Compressive Imaging",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "12692--12703",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98223"}

@inproceedings{bb101467,
        AUTHOR = "Cao, S. Y. and Yin, Y. Q. and Huang, L. H. and Liu, Y. and Zhao, X. and Zhao, D. L. and Huang, K. Q.",
        TITLE = "{Efficient-VQGAN}: Towards High-Resolution Image Generation with Efficient Vision Transformers",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "7334--7343",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98224"}

@inproceedings{bb101468,
        AUTHOR = "Yun, J. and Lee, S. and Park, M. H. and Choo, J.",
        TITLE = "{iColoriT}: Towards Propagating Local Hints to the Right Region in Interactive Colorization by Leveraging Vision Transformer",
        BOOKTITLE = WACV23,
        YEAR = "2023",
        PAGES = "1787--1796",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98225"}

@inproceedings{bb101469,
        AUTHOR = "Lin, K. E. and Yen Chen, L. and Lai, W. S. and Lin, T. Y. and Shih, Y. C. and Ramamoorthi, R.",
        TITLE = "Vision Transformer for {NeRF}-Based View Synthesis from a Single Input Image",
        BOOKTITLE = WACV23,
        YEAR = "2023",
        PAGES = "806--815",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98226"}

@inproceedings{bb101470,
        AUTHOR = "Lezama, J. and Chang, H. and Jiang, L. and Essa, I.",
        TITLE = "Improved Masked Image Generation with Token-Critic",
        BOOKTITLE = ECCV22,
        YEAR = "2022",
        PAGES = "XXIII:70--86",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98227"}

@inproceedings{bb101471,
        AUTHOR = "Kong, X. and Jiang, L. and Chang, H. and Zhang, H. and Hao, Y. and Gong, H. F. and Essa, I.",
        TITLE = "{BLT}: Bidirectional Layout Transformer for Controllable Layout Generation",
        BOOKTITLE = ECCV22,
        YEAR = "2022",
        PAGES = "XVII:474--490",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98228"}

@inproceedings{bb101472,
        AUTHOR = "Kong, D. and Kong, K. and Kim, K. and Min, S. J. and Kang, S. J.",
        TITLE = "Image-Adaptive Hint Generation via Vision Transformer for Outpainting",
        BOOKTITLE = WACV22,
        YEAR = "2022",
        PAGES = "4029--4038",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98229"}

@inproceedings{bb101473,
        AUTHOR = "Maharana, A. and Hannan, D. and Bansal, M.",
        TITLE = "{StoryDALL-E}: Adapting Pretrained Text-to-Image Transformers for Story Continuation",
        BOOKTITLE = ECCV22,
        YEAR = "2022",
        PAGES = "XXXVII:70--87",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98230"}

@inproceedings{bb101474,
        AUTHOR = "Kim, T. and Song, G. and Lee, S. and Kim, S. and Seo, Y. and Lee, S. and Kim, S. H. and Lee, H. L. and Bae, K.",
        TITLE = "{L-Verse}: Bidirectional Generation Between Image and Text",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "16505--16515",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98231"}

@inproceedings{bb101475,
        AUTHOR = "Wang, J. A. and Lu, G. S. and Xu, H. and Li, Z. G. and Xu, C. J. and Fu, Y. W.",
        TITLE = "{ManiTrans}: Entity-Level Text-Guided Image Manipulation via Token-wise Semantic Alignment and Generation",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "10697--10707",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98232"}

@inproceedings{bb101476,
        AUTHOR = "Liu, Z. Z. and Wang, Y. and Qi, X. J. and Fu, C. W.",
        TITLE = "Towards Implicit Text-Guided {3D} Shape Generation",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "17875--17885",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98233"}

@inproceedings{bb101477,
        AUTHOR = "Wu, F. X. and Liu, L. and Hao, F. S. and He, F. X. and Cheng, J.",
        TITLE = "Text-to-Image Synthesis based on Object-Guided Joint-Decoding Transformer",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "18092--18101",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98234"}

@inproceedings{bb101478,
        AUTHOR = "Wang, X. P. and Yeshwanth, C. and Nie{\ss}ner, M.",
        TITLE = "{SceneFormer}: Indoor Scene Generation with Transformers",
        BOOKTITLE = "3DV21",
        YEAR = "2021",
        PAGES = "106--115",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98235"}

% NOTE(review): the export listed the second author as "Aodha, O.M.";
% presumably the surname is "Mac Aodha" with the particle folded into the
% initials -- confirm against the paper.
@inproceedings{bb101479,
        AUTHOR = "Mariotti, O. and Mac Aodha, O. and Bilen, H.",
        TITLE = "{ViewNet}: Unsupervised Viewpoint Estimation from Conditional Generation",
        BOOKTITLE = ICCV21,
        YEAR = "2021",
        PAGES = "10398--10408",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98236"}

@inproceedings{bb101480,
        AUTHOR = "Ribeiro, L. S. F. and Bui, T. and Collomosse, J. and Ponti, M.",
        TITLE = "Scene Designer: A Unified Model for Scene Search and Synthesis from Sketch",
        BOOKTITLE = SHE21,
        YEAR = "2021",
        PAGES = "2424--2433",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98237"}

% Conference paper. BOOKTITLE is the bare string macro CVPR21 (defined outside
% this entry). The page range is written with a double hyphen (en-dash).
@inproceedings{bb101481,
        AUTHOR = "Yang, C.F. and Fan, W.C. and Yang, F.E. and Wang, Y.C.A.F.",
        TITLE = "LayoutTransformer: Scene Layout Generation with Conceptual and
Spatial Diversity",
        BOOKTITLE = CVPR21,
        YEAR = "2021",
        PAGES = "3731--3740",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT98238"}

% Journal article. JOURNAL is the bare string macro IJCV (defined outside this
% entry). MONTH uses the standard three-letter macro so the style controls its
% rendering; the page range uses a double hyphen (en-dash).
@article{bb101482,
        AUTHOR = "Li, M. and Zhou, P. and Liu, J.W. and Keppo, J. and Lin, M. and Yan, S.C. and Xu, X.Y.",
        TITLE = "Instant3D: Instant Text-to-3D Generation",
        JOURNAL = IJCV,
        VOLUME = "132",
        YEAR = "2024",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "4456--4472",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT98239"}

% Journal article. JOURNAL is the bare string macro IJCV (defined outside this
% entry). MONTH uses the standard three-letter macro. The item occupies a single
% page, so PAGES is one number rather than a degenerate range.
% NOTE(review): same title and BIBSOURCE anchor as bb101482, with the author
% order reversed and a one-page extent -- presumably a published correction to
% that article; confirm, and consider recording that in a NOTE field.
@article{bb101483,
        AUTHOR = "Xu, X.Y. and Yan, S.C. and Lin, M. and Keppo, J. and Liu, J.W. and Zhou, P. and Li, M.",
        TITLE = "Instant3D: Instant Text-to-3D Generation",
        JOURNAL = IJCV,
        VOLUME = "133",
        YEAR = "2025",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "509",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT98239"}

% Journal article. JOURNAL is the bare string macro PAMI (defined outside this
% entry). MONTH uses the standard three-letter macro; the page range uses a
% double hyphen (en-dash).
@article{bb101484,
        AUTHOR = "Nie, W.Z. and Chen, R.D. and Wang, W.J. and Lepri, B. and Sebe, N.",
        TITLE = "T2TD: Text-3D Generation Model Based on Prior Knowledge Guidance",
        JOURNAL = PAMI,
        VOLUME = "47",
        YEAR = "2025",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "172--189",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT98240"}

% Journal article. JOURNAL is the bare string macro MultMed (defined outside
% this entry); no issue number or month is recorded. The page range uses a
% double hyphen (en-dash).
@article{bb101485,
        AUTHOR = "Ye, Z. and Liu, Y. and Peng, Y.X.",
        TITLE = "MAAN: Memory-Augmented Auto-Regressive Network for Text-Driven 3D
Indoor Scene Generation",
        JOURNAL = MultMed,
        VOLUME = "26",
        YEAR = "2024",
        PAGES = "11057--11069",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT98241"}

% Journal article. The journal field is the bare string macro RS, which has to
% be defined elsewhere. The pages field holds a single number, not a range
% (presumably an article number -- confirm against the publisher).
@article{bb101486,
  author    = {Luo, X.Z. and Zhao, H.T. and Liu, Y.P. and Liu, N.N. and Chen, J. and Yang, H. and Pan, J.},
  title     = {A High-Precision Virtual Central Projection Image Generation Method
for an Aerial Dual-Camera},
  journal   = RS,
  volume    = {17},
  number    = {4},
  year      = {2025},
  pages     = {683},
  bibsource = {http://www.visionbib.com/bibliography/describe489tx23d6.html#TT98242},
}

% Journal article. JOURNAL is the bare string macro IJCV (defined outside this
% entry). MONTH uses the standard three-letter macro; the page range uses a
% double hyphen (en-dash).
@article{bb101487,
        AUTHOR = "Di, D.L. and Yang, J.H. and Luo, C.F. and Xue, Z. and Chen, W. and Yang, X. and Gao, Y.",
        TITLE = "Hyper-3DG: Text-to-3D Gaussian Generation via Hypergraph",
        JOURNAL = IJCV,
        VOLUME = "133",
        YEAR = "2025",
        NUMBER = "5",
        MONTH = may,
        PAGES = "2886--2909",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT98243"}

% Journal article. JOURNAL is the bare string macro MultMed (defined outside
% this entry); no issue number or month is recorded. The page range uses a
% double hyphen (en-dash).
@article{bb101488,
        AUTHOR = "Huang, S.Y. and Huang, C.P. and Chang, K.P. and Chou, Z.T. and Liu, I.J. and Wang, Y.C.A.F.",
        TITLE = "Learning Shape-Color Diffusion Priors for Text-Guided 3D Object
Generation",
        JOURNAL = MultMed,
        VOLUME = "27",
        YEAR = "2025",
        PAGES = "3294--3306",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT98244"}

% Journal article. The journal field is the bare string macro IJGI, which has
% to be defined elsewhere. The pages field holds a single number, not a range
% (presumably an article number -- confirm against the publisher).
@article{bb101489,
  author    = {Yu, S.S. and Zhu, J.X. and Li, J.Q. and Li, X.C. and Wang, K. and Tu, J. and Guo, D.},
  title     = {SceneDiffusion: Scene Generation Model Embedded with Spatial
Constraints},
  journal   = IJGI,
  volume    = {14},
  number    = {7},
  year      = {2025},
  pages     = {250},
  bibsource = {http://www.visionbib.com/bibliography/describe489tx23d6.html#TT98245},
}

% Journal article. JOURNAL is the bare string macro MultMed (defined outside
% this entry); no issue number or month is recorded. The page range uses a
% double hyphen (en-dash).
@article{bb101490,
        AUTHOR = "Kim, J.Y. and Park, J. and Kong, K. and Kang, S.J.",
        TITLE = "Programmable-Room: Interactive Textured 3D Room Meshes Generation
Empowered by Large Language Models",
        JOURNAL = MultMed,
        VOLUME = "27",
        YEAR = "2025",
        PAGES = "6358--6368",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT98246"}

% Journal article. JOURNAL is the bare string macro MultMed (defined outside
% this entry); no issue number or month is recorded. The page range uses a
% double hyphen (en-dash).
@article{bb101491,
        AUTHOR = "Fu, K. and Duan, H.Y. and Zhang, Z.C. and Liu, X.H. and Min, X.K. and Wang, J. and Zhai, G.T.",
        TITLE = "Multi-Dimensional Quality Assessment for Text-to-3D Assets:
Dataset and Model",
        JOURNAL = MultMed,
        VOLUME = "27",
        YEAR = "2025",
        PAGES = "8145--8159",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT98247"}

% Conference paper. BOOKTITLE is the bare string macro CVPR25 (defined outside
% this entry). The page range is written with a double hyphen (en-dash).
@inproceedings{bb101492,
        AUTHOR = "Sinha, S. and Khan, M.S. and Usama, M. and Sam, S. and Stricker, D. and Ali, S.A. and Afzal, M.Z.",
        TITLE = "MARVEL-40M+: Multi-Level Visual Elaboration for High-Fidelity
Text-to-3D Content Creation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "8105--8116",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT98248"}

% Conference paper. BOOKTITLE is the bare string macro CVPR25 (defined outside
% this entry). The page range is written with a double hyphen (en-dash).
@inproceedings{bb101493,
        AUTHOR = "Xiang, J.F. and Lv, Z. and Xu, S.C. and Deng, Y. and Wang, R.C. and Zhang, B. and Chen, D. and Tong, X. and Yang, J.",
        TITLE = "Structured 3D Latents for Scalable and Versatile 3D Generation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "21469--21480",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT98249"}

% Conference paper. BOOKTITLE is the bare string macro CVPR25 (defined outside
% this entry). The page range is written with a double hyphen (en-dash).
@inproceedings{bb101494,
        AUTHOR = "Xu, Y.L. and Qu, H.X. and Liu, J. and Zhang, W.X. and Yang, X.",
        TITLE = "CMMLoc: Advancing Text-to-PointCloud Localization with
Cauchy-Mixture-Model Based Framework",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "6637--6647",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT98250"}

% Conference paper. BOOKTITLE is the bare string macro CVPR25 (defined outside
% this entry). Two authors have two-word surnames; the "Last, First" comma form
% keeps both words in the surname. The page range uses a double hyphen (en-dash).
@inproceedings{bb101495,
        AUTHOR = "Edelstein, Y. and Patashnik, O. and Cohen Bar, D. and Zelnik Manor, L.",
        TITLE = "Sharp-It: A Multi-view to Multi-view Diffusion Model for 3D Synthesis
and Manipulation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "21458--21468",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT98251"}

% Conference paper. BOOKTITLE is the bare string macro CVPR25 (defined outside
% this entry). The page range is written with a double hyphen (en-dash).
@inproceedings{bb101496,
        AUTHOR = "Hu, H.Z. and Yin, T.W. and Luan, F. and Hu, Y.W. and Tan, H. and Xu, Z.X. and Bi, S. and Tulsiani, S. and Zhang, K.",
        TITLE = "Turbo3D: Ultra-fast Text-to-3D Generation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "23668--23678",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT98252"}

% Conference paper. BOOKTITLE is the bare string macro CVPR25 (defined outside
% this entry). The page range is written with a double hyphen (en-dash).
@inproceedings{bb101497,
        AUTHOR = "Qin, Y.M. and Xu, Z. and Liu, Y.",
        TITLE = "Apply Hierarchical-Chain-of-Generation to Complex Attributes
Text-to-3D Generation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "18521--18530",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT98253"}

% Conference paper. BOOKTITLE is the bare string macro CVPR25 (defined outside
% this entry). The page range is written with a double hyphen (en-dash).
@inproceedings{bb101498,
        AUTHOR = "Chen, Y.W. and Lan, Y.S. and Zhou, S. and Wang, T.F. and Pan, X.G.",
        TITLE = "SAR3D: Autoregressive 3D Object Generation and Understanding via
Multi-scale 3D VQVAE",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "28371--28382",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT98254"}

% Conference paper. BOOKTITLE is the bare string macro CVPR25 (defined outside
% this entry). The page range is written with a double hyphen (en-dash).
@inproceedings{bb101499,
        AUTHOR = "Li, J.H. and Ma, W.J. and Li, X.Y. and Lou, Y.Z. and Zhou, G.C. and Zhou, X.D.",
        TITLE = "CAD-Llama: Leveraging Large Language Models for Computer-Aided Design
Parametric 3D Model Generation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "18563--18573",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT98255"}
Last update: Nov 26, 2025 at 20:24:09