@inproceedings{e763b8ba75454fa3bb439684396cbc90,
  title     = "Text-Guided Token Communication for Wireless Image Transmission",
  abstract  = "With the emergence of 6G networks and proliferation of visual applications, efficient image transmission under adverse channel conditions is critical. We present a text-guided token communication system leveraging pre-trained foundation models for wireless image transmission. Our approach converts images to discrete tokens, applies 5G NR polar codec on top of the tokenizeation, and employs text as a conditioning signal to generate lost tokens to mitigate the cliff effect at lower signal-to-noise ratios (SNRs). Evaluations on ImageNet show our method outperforms state-of-the-art deep joint source-channel coding scheme in perceptual quality and semantic preservation at extremely low bandwidth ratio, i.e., 1/96. In addition, Our system requires no scenario-specific retraining and exhibits superior cross-dataset generalization, establishing a new paradigm for efficient image transmission aligned with human perceptual priorities.",
  keywords  = "6 G networks, cross modality, foundation models, generative semantic communications, Token communication",
  author    = "Bole Liu and Li Qiao and Ye Wang and Zhen Gao and Yu Ma and Keke Ying and Tong Qin",
  note      = "Publisher Copyright: {\textcopyright} 2025 IEEE.; 2025 IEEE/CIC International Conference on Communications in China, ICCC 2025 ; Conference date: 10-08-2025 Through 13-08-2025",
  year      = "2025",
  doi       = "10.1109/ICCC65529.2025.11149073",
  language  = "English",
  series    = "2025 IEEE/CIC International Conference on Communications in China:Shaping the Future of Integrated Connectivity, ICCC 2025",
  publisher = "Institute of Electrical and Electronics Engineers Inc.",
  booktitle = "2025 IEEE/CIC International Conference on Communications in China:Shaping the Future of Integrated Connectivity, ICCC 2025",
  address   = "United States",
}