LEGO Co-builder: Exploring Fine-Grained Vision-Language Modeling for Multimodal LEGO Assembly Assistants. Huang, H., Pei, J., Aliannejadi, M., Sun, X., Ahsan, M., Yu, C., Ren, Z., César, P., & Wang, J. CoRR, 2025.
LEGO Co-builder: Exploring Fine-Grained Vision-Language Modeling for Multimodal LEGO Assembly Assistants [link]Paper  doi  bibtex   
@comment{DBLP export (see biburl and bibsource) for the arXiv preprint 2507.05515. The volume, doi, url and eprint fields all carry that same arXiv identifier. Author names are stored in the Last, First form so name parsing does not depend on capitalisation.}
@article{DBLP:journals/corr/abs-2507-05515,
  author       = {Huang, Haochen and
                  Pei, Jiahuan and
                  Aliannejadi, Mohammad and
                  Sun, Xin and
                  Ahsan, Moonisa and
                  Yu, Chuang and
                  Ren, Zhaochun and
                  C{\'{e}}sar, Pablo and
                  Wang, Junxiao},
  title        = {{LEGO} Co-builder: Exploring Fine-Grained Vision-Language Modeling
                  for Multimodal {LEGO} Assembly Assistants},
  journal      = {CoRR},
  volume       = {abs/2507.05515},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2507.05515},
  doi          = {10.48550/ARXIV.2507.05515},
  eprinttype   = {arXiv},
  eprint       = {2507.05515},
  timestamp    = {Sat, 15 Nov 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2507-05515.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

Downloads: 0