C3LLM: Conditional Multimodal Content Generation Using Large Language Models. Wang, Z., Duan, Q., Tai, Y.-W., & Tang, C.-K. arXiv preprint arXiv:2405.16136, 2024.
bibtex   
@comment{wang2024c3llm is an arXiv preprint: the identifier is stored in the eprint and archiveprefix fields instead of a journal field, and the acronym in the title is brace-protected against style recasing.}
@misc{wang2024c3llm,
  author        = {Wang, Zixuan and Duan, Qinkai and Tai, Yu-Wing and Tang, Chi-Keung},
  title         = {{C3LLM}: Conditional Multimodal Content Generation Using Large Language Models},
  year          = {2024},
  eprint        = {2405.16136},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2405.16136},
}

Downloads: 0