@inproceedings{d39d573aeb8b4708812fa3e129b2bba0,
title = "T4Di: A Hybrid TTT-Transformer Backbone for Scalable and Efficient Diffusion Model",
abstract = "Diffusion models have achieved significant progress in image generation, with backbone architectures evolving from U-Net to Transformers. However, the quadratic complexity of Transformer-based diffusion models limits their scalability and efficiency, and this limitation becomes more prominent with increasing resolution. Linear complexity models such as Mamba partially address this issue but struggle with spatial continuity when applied to two-dimensional image data. To tackle these challenges, we propose T4Di, a hybrid backbone architecture combining the efficiency of Test-Time Training (TTT) with the global modeling capability of Transformers. By introducing multidirectional scanning and lightweight local feature enhancement modules, T4Di adapts TTT to 2D image signals, improving spatial continuity and local coherence. Moreover, we explore adaptive block composition, adjusting the ratio between Transformer and TTT components to achieve a favorable balance between generation quality and computational cost. We evaluate T4Di on both unconditional and class-conditional image generation tasks across CIFAR-10, CelebA, and ImageNet benchmarks. Experimental results demonstrate that T4Di consistently outperforms existing diffusion models in terms of both generation quality and computational efficiency, establishing it as a scalable and effective solution for image synthesis.",
keywords = "Diffusion, Hybrid, Image Generator, Test-Time Training, Transformer",
author = "Xirui Wu and Haixia Pan and Ruijun Liu and Biao Dong and Ying Zheng and Huolong Ye",
note = "Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Singapore Pte Ltd. 2025.; 21st International Conference on Intelligent Computing, ICIC 2025 ; Conference date: 26-07-2025 Through 29-07-2025",
year = "2025",
doi = "10.1007/978-981-96-9812-7\_14",
language = "英语",
isbn = "9789819698110",
series = "Lecture Notes in Computer Science",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "162--173",
editor = "De-Shuang Huang and Qinhu Zhang and Chuanlei Zhang and Wei Chen",
booktitle = "Advanced Intelligent Computing Technology and Applications - 21st International Conference, ICIC 2025, Proceedings",
address = "德国",
}