SnapNTell: Enhancing Entity-Centric Visual Question Answering with Retrieval Augmented Multimodal LLM

SnapNTell: Enhancing Entity-Centric Visual Question Answering with Retrieval Augmented Multimodal LLM. Qiu, J., Madotto, A., Lin, Z., Crook, P. A., Xu, Y. E., Damavandi, B., Dong, X., Faloutsos, C., Li, L., & Moon, S. In Al-Onaizan, Y., Bansal, M., & Chen, Y., editors, Findings of the Association for Computational Linguistics: EMNLP 2024, Miami, Florida, USA, November 12-16, 2024, pages 247–266, 2024. Association for Computational Linguistics.

Paper bibtex

@inproceedings{DBLP:conf/emnlp/QiuMLCXD0F0M24,
  author       = {Qiu, Jielin and
                  Madotto, Andrea and
                  Lin, Zhaojiang and
                  Crook, Paul A. and
                  Xu, Yifan Ethan and
                  Damavandi, Babak and
                  Dong, Xin and
                  Faloutsos, Christos and
                  Li, Lei and
                  Moon, Seungwhan},
  editor       = {Al{-}Onaizan, Yaser and
                  Bansal, Mohit and
                  Chen, Yun{-}Nung},
  title        = {{SnapNTell}: Enhancing Entity-Centric Visual Question Answering with
                  Retrieval Augmented Multimodal {LLM}},
  booktitle    = {Findings of the Association for Computational Linguistics: {EMNLP}
                  2024, Miami, Florida, USA, November 12-16, 2024},
  pages        = {247--266},
  publisher    = {Association for Computational Linguistics},
  year         = {2024},
  url          = {https://aclanthology.org/2024.findings-emnlp.14},
  timestamp    = {Mon, 18 Nov 2024 09:05:59 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/QiuMLCXD0F0M24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

Downloads: 0

{"_id":"TtrsbCJkNs79Eoab6","bibbaseid":"qiu-madotto-lin-crook-xu-damavandi-dong-faloutsos-etal-snapntellenhancingentitycentricvisualquestionansweringwithretrievalaugmentedmultimodalllm-2024","author_short":["Qiu, J.","Madotto, A.","Lin, Z.","Crook, P. A.","Xu, Y. E.","Damavandi, B.","Dong, X.","Faloutsos, C.","Li, L.","Moon, S."],"bibdata":{"bibtype":"inproceedings","type":"inproceedings","author":[{"firstnames":["Jielin"],"propositions":[],"lastnames":["Qiu"],"suffixes":[]},{"firstnames":["Andrea"],"propositions":[],"lastnames":["Madotto"],"suffixes":[]},{"firstnames":["Zhaojiang"],"propositions":[],"lastnames":["Lin"],"suffixes":[]},{"firstnames":["Paul","A."],"propositions":[],"lastnames":["Crook"],"suffixes":[]},{"firstnames":["Yifan","Ethan"],"propositions":[],"lastnames":["Xu"],"suffixes":[]},{"firstnames":["Babak"],"propositions":[],"lastnames":["Damavandi"],"suffixes":[]},{"firstnames":["Xin"],"propositions":[],"lastnames":["Dong"],"suffixes":[]},{"firstnames":["Christos"],"propositions":[],"lastnames":["Faloutsos"],"suffixes":[]},{"firstnames":["Lei"],"propositions":[],"lastnames":["Li"],"suffixes":[]},{"firstnames":["Seungwhan"],"propositions":[],"lastnames":["Moon"],"suffixes":[]}],"editor":[{"firstnames":["Yaser"],"propositions":[],"lastnames":["Al-Onaizan"],"suffixes":[]},{"firstnames":["Mohit"],"propositions":[],"lastnames":["Bansal"],"suffixes":[]},{"firstnames":["Yun-Nung"],"propositions":[],"lastnames":["Chen"],"suffixes":[]}],"title":"SnapNTell: Enhancing Entity-Centric Visual Question Answering with Retrieval Augmented Multimodal LLM","booktitle":"Findings of the Association for Computational Linguistics: EMNLP 2024, Miami, Florida, USA, November 12-16, 2024","pages":"247–266","publisher":"Association for Computational Linguistics","year":"2024","url":"https://aclanthology.org/2024.findings-emnlp.14","timestamp":"Mon, 18 Nov 2024 09:05:59 +0100","biburl":"https://dblp.org/rec/conf/emnlp/QiuMLCXD0F0M24.bib","bibsource":"dblp computer science bibliography, https://dblp.org","bibtex":"@inproceedings{DBLP:conf/emnlp/QiuMLCXD0F0M24,\n author = {Jielin Qiu and\n Andrea Madotto and\n Zhaojiang Lin and\n Paul A. Crook and\n Yifan Ethan Xu and\n Babak Damavandi and\n Xin Dong and\n Christos Faloutsos and\n Lei Li and\n Seungwhan Moon},\n editor = {Yaser Al{-}Onaizan and\n Mohit Bansal and\n Yun{-}Nung Chen},\n title = {SnapNTell: Enhancing Entity-Centric Visual Question Answering with\n Retrieval Augmented Multimodal {LLM}},\n booktitle = {Findings of the Association for Computational Linguistics: {EMNLP}\n 2024, Miami, Florida, USA, November 12-16, 2024},\n pages = {247--266},\n publisher = {Association for Computational Linguistics},\n year = {2024},\n url = {https://aclanthology.org/2024.findings-emnlp.14},\n timestamp = {Mon, 18 Nov 2024 09:05:59 +0100},\n biburl = {https://dblp.org/rec/conf/emnlp/QiuMLCXD0F0M24.bib},\n bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n","author_short":["Qiu, J.","Madotto, A.","Lin, Z.","Crook, P. A.","Xu, Y. E.","Damavandi, B.","Dong, X.","Faloutsos, C.","Li, L.","Moon, S."],"editor_short":["Al-Onaizan, Y.","Bansal, M.","Chen, Y."],"key":"DBLP:conf/emnlp/QiuMLCXD0F0M24","id":"DBLP:conf/emnlp/QiuMLCXD0F0M24","bibbaseid":"qiu-madotto-lin-crook-xu-damavandi-dong-faloutsos-etal-snapntellenhancingentitycentricvisualquestionansweringwithretrievalaugmentedmultimodalllm-2024","role":"author","urls":{"Paper":"https://aclanthology.org/2024.findings-emnlp.14"},"metadata":{"authorlinks":{}}},"bibtype":"inproceedings","biburl":"https://dblp.org/pid/f/CFaloutsos.bib","dataSources":["zM4wMHSu34vjmb6Cm"],"keywords":[],"search_terms":["snapntell","enhancing","entity","centric","visual","question","answering","retrieval","augmented","multimodal","llm","qiu","madotto","lin","crook","xu","damavandi","dong","faloutsos","li","moon"],"title":"SnapNTell: Enhancing Entity-Centric Visual Question Answering with Retrieval Augmented Multimodal LLM","year":2024}