% Bibliography entries bb99400 .. bb99499, one entry per block, one field per line.
%
% Conventions visible in these entries:
%   * Unquoted BOOKTITLE / JOURNAL values (CVPR23, ECCV24, IVC, SP:IC, PAMI, ...)
%     are string-macro references. Their definitions are not part of this span;
%     presumably they are declared elsewhere -- verify before compiling.
%   * Quoted BOOKTITLE values ("ICPR22", "3DV21", "3DV24") are literal strings.
%   * Some PAGES values carry a Roman-numeral prefix ("XXIII:274-289");
%     presumably the proceedings volume -- TODO confirm.
%   * Names are kept ASCII-only; characters outside ASCII are written as LaTeX
%     escapes so the file also works with 8-bit BibTeX.
%   * BIBSOURCE records the web page and anchor each entry refers to.

% ---- Entries whose BIBSOURCE page is describe489dift2i4.html ----

@inproceedings{bb99400,
  AUTHOR    = "Wu, Q.C. and Liu, Y.J. and Zhao, H. and Kale, A. and Bui, T. and Yu, T. and Lin, Z. and Zhang, Y. and Chang, S.Y.",
  TITLE     = "Uncovering the Disentanglement Capability in Text-to-Image Diffusion Models",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "1900-1910",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT96162"
}

@inproceedings{bb99401,
  AUTHOR    = "Jain, A. and Xie, A. and Abbeel, P.",
  TITLE     = "VectorFusion: Text-to-SVG by Abstracting Pixel-Based Diffusion Models",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "1911-1920",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT96163"
}

@inproceedings{bb99402,
  AUTHOR    = "Kumari, N. and Zhang, B.L. and Zhang, R. and Shechtman, E. and Zhu, J.Y.",
  TITLE     = "Multi-Concept Customization of Text-to-Image Diffusion",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "1931-1941",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT96164"
}

@inproceedings{bb99403,
  AUTHOR    = "Hui, M. and Zhang, Z.Z. and Zhang, X.Y. and Xie, W.X. and Wang, Y.W. and Lu, Y.",
  TITLE     = "Unifying Layout Generation with a Decoupled Diffusion Model",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "1942-1951",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT96165"
}

@inproceedings{bb99404,
  AUTHOR    = "Ruiz, N. and Li, Y.Z. and Jampani, V. and Pritch, Y. and Rubinstein, M. and Aberman, K.",
  TITLE     = "DreamBooth: Fine Tuning Text-to-Image Diffusion Models for Subject-Driven Generation",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "22500-22510",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT96166"
}

@inproceedings{bb99405,
  AUTHOR    = "Zheng, G.C. and Zhou, X.P. and Li, X.W. and Qi, Z.A. and Shan, Y. and Li, X.",
  TITLE     = "LayoutDiffusion: Controllable Diffusion Model for Layout-to-Image Generation",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "22490-22499",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT96167"
}

@inproceedings{bb99406,
  AUTHOR    = "Liu, X.H. and Park, D.H. and Azadi, S. and Zhang, G. and Chopikyan, A. and Hu, Y.X. and Shi, H. and Rohrbach, A. and Darrell, T.J.",
  TITLE     = "More Control for Free! Image Synthesis with Semantic Diffusion Guidance",
  BOOKTITLE = WACV23,
  YEAR      = "2023",
  PAGES     = "289-299",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT96168"
}

@inproceedings{bb99407,
  AUTHOR    = "Pan, Z.H. and Zhou, X. and Tian, H.",
  TITLE     = "Arbitrary Style Guidance for Enhanced Diffusion-Based Text-to-Image Generation",
  BOOKTITLE = WACV23,
  YEAR      = "2023",
  PAGES     = "4450-4460",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT96169"
}

@inproceedings{bb99408,
  AUTHOR    = "Gu, S.Y. and Chen, D. and Bao, J.M. and Wen, F. and Zhang, B. and Chen, D.D. and Yuan, L. and Guo, B.N.",
  TITLE     = "Vector Quantized Diffusion Model for Text-to-Image Synthesis",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "10686-10696",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT96170"
}

@inproceedings{bb99409,
  AUTHOR    = "Jing, B. and Corso, G. and Berlinghieri, R. and Jaakkola, T.",
  TITLE     = "Subspace Diffusion Generative Models",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXIII:274-289",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT96171"
}

@inproceedings{bb99410,
  AUTHOR    = "Han, L.G. and Li, Y.X. and Zhang, H. and Milanfar, P. and Metaxas, D.N. and Yang, F.",
  TITLE     = "SVDiff: Compact Parameter Space for Diffusion Fine-Tuning",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "7289-7300",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT96172"
}

@inproceedings{bb99411,
  AUTHOR    = "Nair, N.G. and Bandara, W.G.C. and Patel, V.M.",
  TITLE     = "Unite and Conquer: Plug and Play Multi-Modal Synthesis Using Diffusion Models",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "6070-6079",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT96173"
}

@inproceedings{bb99412,
  AUTHOR    = "Benny, Y. and Wolf, L.B.",
  TITLE     = "Dynamic Dual-Output Diffusion Models",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "11472-11481",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT96174"
}

@inproceedings{bb99413,
  AUTHOR    = "Hu, M.H. and Wang, Y.J. and Cham, T.J. and Yang, J.F. and Suganthan, P.N.",
  TITLE     = "Global Context with Discrete Diffusion in Vector Quantised Modelling for Image Generation",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "11492-11501",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT96175"
}

@inproceedings{bb99414,
  AUTHOR    = "Ma, H.Y. and Zhang, L. and Zhu, X.T. and Feng, J.F.",
  TITLE     = "Accelerating Score-Based Generative Models with Preconditioned Diffusion Sampling",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXIII:1-16",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT96176"
}

@inproceedings{bb99415,
  AUTHOR    = "Zheng, G. and Li, S. and Wang, H. and Yao, T.P. and Chen, Y. and Ding, S.H. and Li, X.",
  TITLE     = "Entropy-Driven Sampling and Training Scheme for Conditional Diffusion Generation",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXII:754-769",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT96177"
}

@inproceedings{bb99416,
  AUTHOR    = "Liu, N. and Li, S. and Du, Y.L. and Torralba, A. and Tenenbaum, J.B.",
  TITLE     = "Compositional Visual Generation with Composable Diffusion Models",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XVII:423-439",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT96178"
}

@inproceedings{bb99417,
  AUTHOR    = "Sehwag, V. and Hazirbas, C. and Gordo, A. and Ozgenel, F. and Ferrer, C.C.",
  TITLE     = "Generating High Fidelity Data from Low-density Regions using Diffusion Models",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "11482-11491",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489dift2i4.html#TT96179"
}

% ---- Entries whose BIBSOURCE page is describe489synvit5.html ----

@article{bb99418,
  AUTHOR    = "Naveen, S. and Ram Kiran, M.S. and Indupriya, M. and Manikanta, T.V. and Sudeep, P.V.",
  TITLE     = "Transformer models for enhancing AttnGAN based text to image generation",
  JOURNAL   = IVC,
  VOLUME    = "115",
  YEAR      = "2021",
  PAGES     = "104284",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96180"
}

@article{bb99419,
  AUTHOR    = "Dalmaz, O. and Yurt, M. and Cukur, T.",
  TITLE     = "ResViT: Residual Vision Transformers for Multimodal Medical Image Synthesis",
  JOURNAL   = MedImg,
  VOLUME    = "41",
  YEAR      = "2022",
  NUMBER    = "10",
  MONTH     = "October",
  PAGES     = "2598-2614",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96181"
}

@article{bb99420,
  AUTHOR    = "Zhang, X. and Jiao, W.T. and Wang, B. and Tian, X.D.",
  TITLE     = "CT-GAN: A conditional Generative Adversarial Network of transformer architecture for text-to-image",
  JOURNAL   = SP:IC,
  VOLUME    = "115",
  YEAR      = "2023",
  PAGES     = "116959",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96182"
}

@article{bb99421,
  AUTHOR    = "Sortino, R. and Palazzo, S. and Rundo, F. and Spampinato, C.",
  TITLE     = "Transformer-based image generation from scene graphs",
  JOURNAL   = CVIU,
  VOLUME    = "233",
  YEAR      = "2023",
  PAGES     = "103721",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96183"
}

@inproceedings{bb99422,
  AUTHOR    = "Sortino, R. and Palazzo, S. and Spampinato, C.",
  TITLE     = "Transforming Image Generation from Scene Graphs",
  BOOKTITLE = "ICPR22",
  YEAR      = "2022",
  PAGES     = "4118-4124",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96184"
}

@inproceedings{bb99423,
  AUTHOR    = "Wang, Z.C. and Ren, Q. and Wang, J.L. and Yan, C.G. and Jiang, C.J.",
  TITLE     = "Mush: Multi-scale Hierarchical Feature Extraction for Semantic Image Synthesis",
  BOOKTITLE = ACCV22,
  YEAR      = "2022",
  PAGES     = "VII:185-201",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96185"
}

@article{bb99424,
  AUTHOR    = "Wei, Z.P. and Chen, J.J. and Goldblum, M. and Wu, Z.X. and Goldstein, T. and Jiang, Y.G. and Davis, L.S.",
  TITLE     = "Towards Transferable Adversarial Attacks on Image and Video Transformers",
  JOURNAL   = IP,
  VOLUME    = "32",
  YEAR      = "2023",
  PAGES     = "6346-6358",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96186"
}

@article{bb99425,
  AUTHOR    = "Wei, Z.P. and Chen, J.J. and Wu, Z.X. and Jiang, Y.G.",
  TITLE     = "Adaptive Cross-Modal Transferable Adversarial Attacks From Images to Videos",
  JOURNAL   = PAMI,
  VOLUME    = "46",
  YEAR      = "2024",
  NUMBER    = "5",
  MONTH     = "May",
  PAGES     = "3772-3783",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96187"
}

@inproceedings{bb99426,
  AUTHOR    = "Wei, Z.P. and Chen, J.J. and Wu, Z.X. and Jiang, Y.G.",
  TITLE     = "Cross-Modal Transferable Adversarial Attacks from Images to Videos",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "15044-15053",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96188"
}

@article{bb99427,
  AUTHOR    = "Bahani, M. and El Ouaazizi, A. and Maalmi, K.",
  TITLE     = "The effectiveness of T5, GPT-2, and BERT on text-to-image generation task",
  JOURNAL   = PRL,
  VOLUME    = "173",
  YEAR      = "2023",
  PAGES     = "57-63",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96189"
}

@article{bb99428,
  AUTHOR    = "Su, S. and Zhu, J.C. and Gao, L.L. and Song, J.K.",
  TITLE     = "Utilizing Greedy Nature for Multimodal Conditional Image Synthesis in Transformers",
  JOURNAL   = MultMed,
  VOLUME    = "26",
  YEAR      = "2024",
  PAGES     = "2354-2366",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96190"
}

@article{bb99429,
  AUTHOR    = "Li, Z. and Liu, F.",
  TITLE     = "Scalable video transformer for full-frame video prediction",
  JOURNAL   = CVIU,
  VOLUME    = "249",
  YEAR      = "2024",
  PAGES     = "104166",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96191"
}

@article{bb99430,
  AUTHOR    = "Cao, B. and Qi, G.L. and Zhao, J. and Zhu, P.F. and Hu, Q.H. and Gao, X.B.",
  TITLE     = "RTF: Recursive TransFusion for Multi-Modal Image Synthesis",
  JOURNAL   = IP,
  VOLUME    = "34",
  YEAR      = "2025",
  PAGES     = "1573-1587",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96192"
}

@inproceedings{bb99431,
  AUTHOR    = "Choudhury, Z.Z. and McCane, B. and Coffey, S.",
  TITLE     = "Medical Image Synthesis Using Autoencoder with Vision Transformer",
  BOOKTITLE = IVCNZ24,
  YEAR      = "2024",
  PAGES     = "1-6",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96193"
}

@inproceedings{bb99432,
  AUTHOR    = "Tschannen, M. and Eastwood, C. and Mentzer, F.",
  TITLE     = "GIVT: Generative Infinite-vocabulary Transformers",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "LVII: 292-309",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96194"
}

@inproceedings{bb99433,
  AUTHOR    = "Ni, Z. and Wang, Y.L. and Zhou, R.P. and Lu, R. and Guo, J.Y. and Hu, J.Y. and Liu, Z.Y. and Yao, Y. and Huang, G.",
  TITLE     = "Adanat: Exploring Adaptive Policy for Token-based Image Generation",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "XVI: 302-319",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96195"
}

@inproceedings{bb99434,
  AUTHOR    = "Xu, M. and Lin, M.Y. and Ren, Q. and Jia, S.",
  TITLE     = "Ssthyper: Sparse Spectral Transformer for Hyperspectral Image Reconstruction",
  BOOKTITLE = ACCV24,
  YEAR      = "2024",
  PAGES     = "IV: 142-159",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96196"
}

@inproceedings{bb99435,
  AUTHOR    = "Hatamizadeh, A. and Song, J. and Liu, G.L. and Kautz, J. and Vahdat, A.",
  TITLE     = "Diffit: Diffusion Vision Transformers for Image Generation",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "VIII: 37-55",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96197"
}

@inproceedings{bb99436,
  AUTHOR    = "Gu, Y.C. and Wang, X. and Ge, Y.X. and Shan, Y. and Shou, M.Z.",
  TITLE     = "Rethinking the Objectives of Vector-Quantized Tokenizers for Image Synthesis",
  BOOKTITLE = CVPR24,
  YEAR      = "2024",
  PAGES     = "7631-7640",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96198"
}

@inproceedings{bb99437,
  AUTHOR    = "Ni, Z.L. and Wang, Y.L. and Zhou, R.P. and Guo, J.Y. and Hu, J.Y. and Liu, Z.Y. and Song, S. and Yao, Y. and Huang, G.",
  TITLE     = "Revisiting Non-Autoregressive Transformers for Efficient Image Synthesis",
  BOOKTITLE = CVPR24,
  YEAR      = "2024",
  PAGES     = "7007-7016",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96199"
}

@inproceedings{bb99438,
  AUTHOR    = "Zheng, S. and Yuan, X.",
  TITLE     = "Unfolding Framework with Prior of Convolution-Transformer Mixture and Uncertainty Estimation for Video Snapshot Compressive Imaging",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "12692-12703",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96200"
}

@inproceedings{bb99439,
  AUTHOR    = "Cao, S.Y. and Yin, Y.Q. and Huang, L.H. and Liu, Y. and Zhao, X. and Zhao, D.L. and Huang, K.Q.",
  TITLE     = "Efficient-VQGAN: Towards High-Resolution Image Generation with Efficient Vision Transformers",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "7334-7343",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96201"
}

@inproceedings{bb99440,
  AUTHOR    = "Yun, J. and Lee, S. and Park, M.H. and Choo, J.",
  TITLE     = "iColoriT: Towards Propagating Local Hints to the Right Region in Interactive Colorization by Leveraging Vision Transformer",
  BOOKTITLE = WACV23,
  YEAR      = "2023",
  PAGES     = "1787-1796",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96202"
}

@inproceedings{bb99441,
  AUTHOR    = "Lin, K.E. and Yen Chen, L. and Lai, W.S. and Lin, T.Y. and Shih, Y.C. and Ramamoorthi, R.",
  TITLE     = "Vision Transformer for NeRF-Based View Synthesis from a Single Input Image",
  BOOKTITLE = WACV23,
  YEAR      = "2023",
  PAGES     = "806-815",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96203"
}

@inproceedings{bb99442,
  AUTHOR    = "Lezama, J. and Chang, H. and Jiang, L. and Essa, I.",
  TITLE     = "Improved Masked Image Generation with Token-Critic",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXIII:70-86",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96204"
}

@inproceedings{bb99443,
  AUTHOR    = "Kong, X. and Jiang, L. and Chang, H. and Zhang, H. and Hao, Y. and Gong, H.F. and Essa, I.",
  TITLE     = "BLT: Bidirectional Layout Transformer for Controllable Layout Generation",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XVII:474-490",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96205"
}

@inproceedings{bb99444,
  AUTHOR    = "Kong, D. and Kong, K. and Kim, K. and Min, S.J. and Kang, S.J.",
  TITLE     = "Image-Adaptive Hint Generation via Vision Transformer for Outpainting",
  BOOKTITLE = WACV22,
  YEAR      = "2022",
  PAGES     = "4029-4038",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96206"
}

@inproceedings{bb99445,
  AUTHOR    = "Maharana, A. and Hannan, D. and Bansal, M.",
  TITLE     = "StoryDALL-E: Adapting Pretrained Text-to-Image Transformers for Story Continuation",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXXVII:70-87",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96207"
}

@inproceedings{bb99446,
  AUTHOR    = "Kim, T. and Song, G. and Lee, S. and Kim, S. and Seo, Y. and Lee, S. and Kim, S.H. and Lee, H.L. and Bae, K.",
  TITLE     = "L-Verse: Bidirectional Generation Between Image and Text",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "16505-16515",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96208"
}

@inproceedings{bb99447,
  AUTHOR    = "Wang, J.A. and Lu, G.S. and Xu, H. and Li, Z.G. and Xu, C.J. and Fu, Y.W.",
  TITLE     = "ManiTrans: Entity-Level Text-Guided Image Manipulation via Token-wise Semantic Alignment and Generation",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "10697-10707",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96209"
}

@inproceedings{bb99448,
  AUTHOR    = "Liu, Z.Z. and Wang, Y. and Qi, X.J. and Fu, C.W.",
  TITLE     = "Towards Implicit Text-Guided 3D Shape Generation",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "17875-17885",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96210"
}

@inproceedings{bb99449,
  AUTHOR    = "Wu, F.X. and Liu, L. and Hao, F.S. and He, F.X. and Cheng, J.",
  TITLE     = "Text-to-Image Synthesis based on Object-Guided Joint-Decoding Transformer",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "18092-18101",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96211"
}

@inproceedings{bb99450,
  AUTHOR    = "Wang, X.P. and Yeshwanth, C. and Nie{\ss}ner, M.",
  TITLE     = "SceneFormer: Indoor Scene Generation with Transformers",
  BOOKTITLE = "3DV21",
  YEAR      = "2021",
  PAGES     = "106-115",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96212"
}

@inproceedings{bb99451,
  AUTHOR    = "Mariotti, O. and Aodha, O.M. and Bilen, H.",
  TITLE     = "ViewNet: Unsupervised Viewpoint Estimation from Conditional Generation",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "10398-10408",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96213"
}

@inproceedings{bb99452,
  AUTHOR    = "Ribeiro, L.S.F. and Bui, T. and Collomosse, J. and Ponti, M.",
  TITLE     = "Scene Designer: A Unified Model for Scene Search and Synthesis from Sketch",
  BOOKTITLE = SHE21,
  YEAR      = "2021",
  PAGES     = "2424-2433",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96214"
}

@inproceedings{bb99453,
  AUTHOR    = "Yang, C.F. and Fan, W.C. and Yang, F.E. and Wang, Y.C.A.F.",
  TITLE     = "LayoutTransformer: Scene Layout Generation with Conceptual and Spatial Diversity",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "3731-3740",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96215"
}

@inproceedings{bb99454,
  AUTHOR    = "Lin, C. and Yumer, E. and Wang, O. and Shechtman, E. and Lucey, S.",
  TITLE     = "ST-GAN: Spatial Transformer Generative Adversarial Networks for Image Compositing",
  BOOKTITLE = CVPR18,
  YEAR      = "2018",
  PAGES     = "9455-9464",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489synvit5.html#TT96216"
}

% ---- Entries whose BIBSOURCE page is describe489tx23d6.html ----

@article{bb99455,
  AUTHOR    = "Li, M. and Zhou, P. and Liu, J.W. and Keppo, J. and Lin, M. and Yan, S.C. and Xu, X.Y.",
  TITLE     = "Instant3D: Instant Text-to-3D Generation",
  JOURNAL   = IJCV,
  VOLUME    = "132",
  YEAR      = "2024",
  NUMBER    = "10",
  MONTH     = "October",
  PAGES     = "4456-4472",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96217"
}

% NOTE(review): bb99456 has the same TITLE and the same BIBSOURCE anchor
% (TT96217) as bb99455, with the author list in reverse order and a single
% page. It looks like a follow-up notice (e.g. a correction) to bb99455 rather
% than an independent paper -- confirm against the journal before citing both.
@article{bb99456,
  AUTHOR    = "Xu, X.Y. and Yan, S.C. and Lin, M. and Keppo, J. and Liu, J.W. and Zhou, P. and Li, M.",
  TITLE     = "Instant3D: Instant Text-to-3D Generation",
  JOURNAL   = IJCV,
  VOLUME    = "133",
  YEAR      = "2025",
  NUMBER    = "1",
  MONTH     = "January",
  PAGES     = "509",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96217"
}

@article{bb99457,
  AUTHOR    = "Nie, W.Z. and Chen, R.D. and Wang, W.J. and Lepri, B. and Sebe, N.",
  TITLE     = "T2TD: Text-3D Generation Model Based on Prior Knowledge Guidance",
  JOURNAL   = PAMI,
  VOLUME    = "47",
  YEAR      = "2025",
  NUMBER    = "1",
  MONTH     = "January",
  PAGES     = "172-189",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96218"
}

@article{bb99458,
  AUTHOR    = "Ye, Z. and Liu, Y. and Peng, Y.X.",
  TITLE     = "MAAN: Memory-Augmented Auto-Regressive Network for Text-Driven 3D Indoor Scene Generation",
  JOURNAL   = MultMed,
  VOLUME    = "26",
  YEAR      = "2024",
  PAGES     = "11057-11069",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96219"
}

@article{bb99459,
  AUTHOR    = "Luo, X.Z. and Zhao, H.T. and Liu, Y.P. and Liu, N.N. and Chen, J. and Yang, H. and Pan, J.",
  TITLE     = "A High-Precision Virtual Central Projection Image Generation Method for an Aerial Dual-Camera",
  JOURNAL   = RS,
  VOLUME    = "17",
  YEAR      = "2025",
  NUMBER    = "4",
  PAGES     = "683",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96220"
}

@article{bb99460,
  AUTHOR    = "Di, D.L. and Yang, J.H. and Luo, C.F. and Xue, Z. and Chen, W. and Yang, X. and Gao, Y.",
  TITLE     = "Hyper-3DG: Text-to-3D Gaussian Generation via Hypergraph",
  JOURNAL   = IJCV,
  VOLUME    = "133",
  YEAR      = "2025",
  NUMBER    = "5",
  MONTH     = "May",
  PAGES     = "2886-2909",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96221"
}

% NOTE(review): "Yang, Y.Z." appears twice in the AUTHOR list of bb99461. This
% may be two distinct authors who share surname and initials -- confirm against
% the paper before removing either occurrence.
@inproceedings{bb99461,
  AUTHOR    = "Nath, U. and Goel, R. and Jeon, E.S. and Kim, C. and Min, K. and Yang, Y.Z. and Yang, Y.Z. and Turaga, P.",
  TITLE     = "Deep Geometric Moments Promote Shape Consistency in Text-to-3D Generation",
  BOOKTITLE = WACV25,
  YEAR      = "2025",
  PAGES     = "4331-4341",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96222"
}

@inproceedings{bb99462,
  AUTHOR    = "Attaiki, S. and Guerrero, P. and Ceylan, D. and Mitra, N.J. and Ovsjanikov, M.",
  TITLE     = "GANFusion: Feed-Forward Text-to-3D with Diffusion in GAN Space",
  BOOKTITLE = WACV25,
  YEAR      = "2025",
  PAGES     = "3985-3995",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96223"
}

@inproceedings{bb99463,
  AUTHOR    = "Mercier, A. and Nakhli, R. and Reddy, M. and Yasarla, R. and Cai, H. and Porikli, F.M. and Berger, G.",
  TITLE     = "HexaGen3D: StableDiffusion is One Step Away from Fast and Diverse Text-to-3D Generation",
  BOOKTITLE = WACV25,
  YEAR      = "2025",
  PAGES     = "1247-1257",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96224"
}

@inproceedings{bb99464,
  AUTHOR    = "Li, J. and Zhang, Z. and Yang, J.",
  TITLE     = "TP2O: Creative Text Pair-to-object Generation Using Balance Swap-Sampling",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "LXXII: 92-111",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96225"
}

@inproceedings{bb99465,
  AUTHOR    = "Xu, Y.H. and Shi, Z.F. and Wang, Y.F. and Chen, H.S. and Yang, C. and Peng, S. and Shen, Y.J. and Wetzstein, G.",
  TITLE     = "GRM: Large Gaussian Reconstruction Model for Efficient 3D Reconstruction and Generation",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "XV: 1-20",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96226"
}

@inproceedings{bb99466,
  AUTHOR    = "Liu, F.F. and Wang, H.Y. and Chen, W.L. and Sun, H.W. and Duan, Y.Q.",
  TITLE     = "Make-your-3D: Fast and Consistent Subject-driven 3D Content Generation",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "LXXXIV: 389-406",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96227"
}

@inproceedings{bb99467,
  AUTHOR    = "Tang, J.X. and Chen, Z.X. and Chen, X.K. and Wang, T.F. and Zeng, G. and Liu, Z.W.",
  TITLE     = "LGM: Large Multi-view Gaussian Model for High-resolution 3D Content Creation",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "IV: 1-18",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96228"
}

@inproceedings{bb99468,
  AUTHOR    = "Ocal, B.M. and Tatarchenko, M. and Karaoglu, S. and Gevers, T.",
  TITLE     = "Sceneteller: Language-to-3D Scene Generation",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "LXXXV: 362-378",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96229"
}

@inproceedings{bb99469,
  AUTHOR    = "Zuo, Q. and Gu, X.D. and Dong, Y. and Zhao, Z.Y. and Yuan, W.H. and Qiu, L.T. and Bo, L. and Dong, Z.L.",
  TITLE     = "High-fidelity 3D Textured Shapes Generation by Sparse Encoding and Adversarial Decoding",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "X: 52-69",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96230"
}

@inproceedings{bb99470,
  AUTHOR    = "Xie, K. and Lorraine, J. and Cao, T. and Gao, J. and Lucas, J. and Torralba, A. and Fidler, S. and Zeng, X.H.",
  TITLE     = "Latte3D: Large-scale Amortized Text-to-enhanced3D Synthesis",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "LXXVII: 305-322",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96231"
}

@inproceedings{bb99471,
  AUTHOR    = "Fu, R. and Wen, Z. and Liu, Z.C. and Sridhar, S.",
  TITLE     = "Anyhome: Open-vocabulary Generation of Structured and Textured 3D Homes",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "XXXIX: 52-70",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96232"
}

@inproceedings{bb99472,
  AUTHOR    = "Yang, H.B. and Chen, Y. and Pan, Y.W. and Yao, T. and Chen, Z. and Wu, Z.X. and Jiang, Y.G. and Mei, T.",
  TITLE     = "Dreammesh: Jointly Manipulating and Texturing Triangle Meshes for Text-to-3D Generation",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "LIX: 162-178",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96233"
}

@inproceedings{bb99473,
  AUTHOR    = "Ye, J.L. and Liu, F.F. and Li, Q.X. and Wang, Z.Y. and Wang, Y.K. and Wang, X.Z. and Duan, Y.Q. and Zhu, J.",
  TITLE     = "Dreamreward: Text-to-3D Generation with Human Preference",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "LXX: 259-276",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96234"
}

@inproceedings{bb99474,
  AUTHOR    = "Li, H.R. and Shi, H.L. and Zhang, W.L. and Wu, W.J. and Liao, Y. and Wang, L. and Lee, L.H. and Zhou, P.Y.",
  TITLE     = "Dreamscene: 3D Gaussian-based Text-to-3D Scene Generation via Formation Pattern Sampling",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "LXXIV: 214-230",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96235"
}

@inproceedings{bb99475,
  AUTHOR    = "Tran, U.D. and Luu, M. and Nguyen, P.H. and Nguyen, K. and Hua, B.S.",
  TITLE     = "Diverse Text-to-3D Synthesis with Augmented Text Embedding",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "LXXV: 217-235",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96236"
}

@inproceedings{bb99476,
  AUTHOR    = "Li, Z. and Hu, M.H. and Zheng, Q. and Jiang, X.D.",
  TITLE     = "Connecting Consistency Distillation to Score Distillation for Text-to-3D Generation",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "XLIII: 274-291",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96237"
}

@inproceedings{bb99477,
  AUTHOR    = "Jiang, C. and Zeng, Y. and Hu, T.Y. and Xu, S. and Zhang, W. and Xu, H. and Yeung, D.Y.",
  TITLE     = "Jointdreamer: Ensuring Geometry Consistency and Text Congruence in Text-to-3D Generation via Joint Score Distillation",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "XXVI: 439-456",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96238"
}

@inproceedings{bb99478,
  AUTHOR    = "Yan, J. and Gao, Y.P. and Yang, Q.Z. and Wei, X. and Xie, X. and Wu, A. and Zheng, W.S.",
  TITLE     = "Dreamview: Injecting View-specific Text Guidance Into Text-to-3D Generation",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "XXV: 358-374",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96239"
}

@inproceedings{bb99479,
  AUTHOR    = "He, X.L. and Chen, J. and Peng, S. and Huang, D. and Li, Y.G. and Huang, X.S. and Yuan, C. and Ouyang, W.L. and He, T.",
  TITLE     = "Gvgen: Text-to-3D Generation with Volumetric Representation",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "VIII: 463-479",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96240"
}

@inproceedings{bb99480,
  AUTHOR    = "Ma, Z.Y. and Wei, Y.X. and Zhang, Y. and Zhu, X.Y. and Lei, Z. and Zhang, L.",
  TITLE     = "Scaledreamer: Scalable Text-to-3D Synthesis with Asynchronous Score Distillation",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "VII: 1-19",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96241"
}

@inproceedings{bb99481,
  AUTHOR    = "Wu, B.S. and Chen, H.E. and Huang, S.Y. and Wang, Y.C.A.F.",
  TITLE     = "TPA3D: Triplane Attention for Fast Text-to-3D Generation",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "XVIII: 438-455",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96242"
}

@inproceedings{bb99482,
  AUTHOR    = "Zhuo, W.J. and Ma, F. and Fan, H. and Yang, Y.",
  TITLE     = "Vividdreamer: Invariant Score Distillation for Hyper-realistic Text-to-3D Generation",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "LXXXVIII: 122-139",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96243"
}

@inproceedings{bb99483,
  AUTHOR    = "Wang, D.Q. and Zhang, T. and Abboud, A. and Susstrunk, S.",
  TITLE     = "InNeRF360: Text-Guided 3D-Consistent Object Inpainting on 360{$^{\circ}$} Neural Radiance Fields",
  BOOKTITLE = CVPR24,
  YEAR      = "2024",
  PAGES     = "12677-12686",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96244"
}

@inproceedings{bb99484,
  AUTHOR    = "Zhang, Q.H. and Wang, C.Y. and Siarohin, A. and Zhuang, P. and Xu, Y.H. and Yang, C. and Lin, D. and Zhou, B. and Tulyakov, S. and Lee, H.Y.",
  TITLE     = "Towards Text-guided 3D Scene Composition",
  BOOKTITLE = CVPR24,
  YEAR      = "2024",
  PAGES     = "6829-6838",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96245"
}

@inproceedings{bb99485,
  AUTHOR    = "Wang, P.H. and Xu, D. and Fan, Z.W. and Wang, D. and Mohan, S. and Iandola, F. and Ranjan, R. and Li, Y.L. and Liu, Q. and Wang, Z.Y. and Chandra, V.",
  TITLE     = "Taming Mode Collapse in Score Distillation for Text-to-3D Generation",
  BOOKTITLE = CVPR24,
  YEAR      = "2024",
  PAGES     = "9037-9047",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96246"
}

@inproceedings{bb99486,
  AUTHOR    = "Wu, T. and Yang, G. and Li, Z.B. and Zhang, K. and Liu, Z.W. and Guibas, L.J. and Lin, D. and Wetzstein, G.",
  TITLE     = "GPT-4V(ision) is a Human-Aligned Evaluator for Text-to-3D Generation",
  BOOKTITLE = CVPR24,
  YEAR      = "2024",
  PAGES     = "22227-22238",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96247"
}

@inproceedings{bb99487,
  AUTHOR    = "Zhang, S. and Zhang, Y. and Zheng, Q. and Ma, R. and Hua, W. and Bao, H.J. and Xu, W.W. and Zou, C.Q.",
  TITLE     = "3D-SceneDreamer: Text-Driven 3D-Consistent Scene Generation",
  BOOKTITLE = CVPR24,
  YEAR      = "2024",
  PAGES     = "10170-10180",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96248"
}

@inproceedings{bb99488,
  AUTHOR    = "Kim, S. and Li, K. and Deng, X.Q. and Shi, Y.C. and Cho, M. and Wang, P.",
  TITLE     = "Enhancing 3D Fidelity of Text-to-3D using Cross-View Correspondences",
  BOOKTITLE = CVPR24,
  YEAR      = "2024",
  PAGES     = "10649-10658",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96249"
}

@inproceedings{bb99489,
  AUTHOR    = "Novotny, D. and Tseng, H.Y. and Richardt, C. and Zollhofer, M. and Nie{\ss}ner, M.",
  TITLE     = "ViewDiff: 3D-Consistent Image Generation with Text-to-Image Models",
  BOOKTITLE = CVPR24,
  YEAR      = "2024",
  PAGES     = "5043-5052",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96250"
}

@inproceedings{bb99490,
  AUTHOR    = "Wu, J. and Gao, X.B. and Liu, X. and Shen, Z.Y. and Zhao, C. and Feng, H.C. and Liu, J. and Ding, E.",
  TITLE     = "HD-Fusion: Detailed Text-to-3D Generation Leveraging Multiple Noise Estimation",
  BOOKTITLE = WACV24,
  YEAR      = "2024",
  PAGES     = "3190-3199",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96251"
}

@inproceedings{bb99491,
  AUTHOR    = "Tsalicoglou, C. and Manhardt, F. and Tonioni, A. and Niemeyer, M. and Tombari, F.",
  TITLE     = "TextMesh: Generation of Realistic 3D Meshes From Text Prompts",
  BOOKTITLE = "3DV24",
  YEAR      = "2024",
  PAGES     = "1554-1563",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96252"
}

@inproceedings{bb99492,
  AUTHOR    = "Liao, T.T. and Yi, H.W. and Xiu, Y.L. and Tang, J.X. and Huang, Y. and Thies, J. and Black, M.J.",
  TITLE     = "TADA! Text to Animatable Digital Avatars",
  BOOKTITLE = "3DV24",
  YEAR      = "2024",
  PAGES     = "1508-1519",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96253"
}

@inproceedings{bb99493,
  AUTHOR    = "Lorraine, J. and Xie, K. and Zeng, X.H. and Lin, C.H. and Takikawa, T. and Sharp, N. and Lin, T.Y. and Liu, M.Y. and Fidler, S. and Lucas, J.",
  TITLE     = "ATT3D: Amortized Text-to-3D Object Synthesis",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "17900-17910",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96254"
}

@inproceedings{bb99494,
  AUTHOR    = "Chen, R. and Chen, Y.W. and Jiao, N.X. and Jia, K.",
  TITLE     = "Fantasia3D: Disentangling Geometry and Appearance for High-quality Text-to-3D Content Creation",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "22189-22199",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96255"
}

@inproceedings{bb99495,
  AUTHOR    = "Amaduzzi, A. and Lisanti, G. and Salti, S. and di Stefano, L.",
  TITLE     = "Looking at Words and Points with Attention: A Benchmark for Text-to-Shape Coherence",
  BOOKTITLE = AI3DCC23,
  YEAR      = "2023",
  PAGES     = "2860-2869",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96256"
}

@inproceedings{bb99496,
  AUTHOR    = "Raj, A. and Kaza, S. and Poole, B. and Niemeyer, M. and Ruiz, N. and Mildenhall, B. and Zada, S. and Aberman, K. and Rubinstein, M. and Barron, J. and Li, Y.Z. and Jampani, V.",
  TITLE     = "DreamBooth3D: Subject-Driven Text-to-3D Generation",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "2349-2359",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96257"
}

@inproceedings{bb99497,
  AUTHOR    = "Lin, C.H. and Gao, J. and Tang, L. and Takikawa, T. and Zeng, X.H. and Huang, X. and Kreis, K. and Fidler, S. and Liu, M.Y. and Lin, T.Y.",
  TITLE     = "Magic3D: High-Resolution Text-to-3D Content Creation",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "300-309",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489tx23d6.html#TT96258"
}

% ---- Entries whose BIBSOURCE page is describe489diftx23d7.html ----

@article{bb99498,
  AUTHOR    = "Cao, Z. and Hong, F.Z. and Wu, T. and Pan, L. and Liu, Z.W.",
  TITLE     = "DiffTF++: 3D-Aware Diffusion Transformer for Large-Vocabulary 3D Generation",
  JOURNAL   = PAMI,
  VOLUME    = "47",
  YEAR      = "2025",
  NUMBER    = "4",
  MONTH     = "April",
  PAGES     = "3018-3030",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489diftx23d7.html#TT96259"
}

@article{bb99499,
  AUTHOR    = "Xu, H.F. and Huai, Y.J. and Nie, X.Y. and Meng, Q. and Zhao, X. and Pei, X. and Lu, H.",
  TITLE     = "Diff-Tree: A Diffusion Model for Diversified Tree Point Cloud Generation with High Realism",
  JOURNAL   = RS,
  VOLUME    = "17",
  YEAR      = "2025",
  NUMBER    = "5",
  PAGES     = "923",
  BIBSOURCE = "http://www.visionbib.com/bibliography/describe489diftx23d7.html#TT96260"
}