Visual Cropping Improves Zero-Shot Question Answering of Multimodal Large Language Models. Zhang, J., Khayatkhoei, M., Chhikara, P., & Ilievski, F. In Advances in Neural Information Processing Systems Workshop on Robustness of Few-shot and Zero-shot Learning in Foundation Models, December, 2023. Paper Link bibtex @InProceedings{zhang2023visual-crop,
title={Visual Cropping Improves Zero-Shot Question Answering of Multimodal Large Language Models},
author={Zhang, Jiarui and Khayatkhoei, Mahyar and Chhikara, Prateek and Ilievski, Filip},
booktitle={Advances in Neural Information Processing Systems Workshop on Robustness of Few-shot and Zero-shot Learning in Foundation Models},
year={2023},
month={December},
url_Paper={https://openreview.net/pdf?id=YrYcoV2dAk},
url_Link={https://neurips.cc/virtual/2023/76680},
ISIArea = {ML, VISTA, NLP}
}
Downloads: 0
{"_id":"j9b9h5XczRnJiWTbh","bibbaseid":"zhang-khayatkhoei-chhikara-ilievski-visualcroppingimproveszeroshotquestionansweringofmultimodallargelanguagemodels-2023","author_short":["Zhang, J.","Khayatkhoei, M.","Chhikara, P.","Ilievski, F."],"bibdata":{"bibtype":"inproceedings","type":"inproceedings","title":"Visual Cropping Improves Zero-Shot Question Answering of Multimodal Large Language Models","author":[{"propositions":[],"lastnames":["Zhang"],"firstnames":["Jiarui"],"suffixes":[]},{"propositions":[],"lastnames":["Khayatkhoei"],"firstnames":["Mahyar"],"suffixes":[]},{"propositions":[],"lastnames":["Chhikara"],"firstnames":["Prateek"],"suffixes":[]},{"propositions":[],"lastnames":["Ilievski"],"firstnames":["Filip"],"suffixes":[]}],"booktitle":"Advances in Neural Information Processing Systems Workshop on Robustness of Few-shot and Zero-shot Learning in Foundation Models","year":"2023","month":"December","url_paper":"https://openreview.net/pdf?id=YrYcoV2dAk","url_link":"https://neurips.cc/virtual/2023/76680","isiarea":"ML, VISTA, NLP","bibtex":"@InProceedings{zhang2023visual-crop,\n title={Visual Cropping Improves Zero-Shot Question Answering of Multimodal Large Language Models},\n author={Zhang, Jiarui and Khayatkhoei, Mahyar and Chhikara, Prateek and Ilievski, Filip},\n booktitle={Advances in Neural Information Processing Systems Workshop on Robustness of Few-shot and Zero-shot Learning in Foundation Models},\n year={2023},\n month={December},\n url_Paper={https://openreview.net/pdf?id=YrYcoV2dAk},\n url_Link={https://neurips.cc/virtual/2023/76680},\n ISIArea = {ML, VISTA, NLP}\n}\n\n","author_short":["Zhang, J.","Khayatkhoei, M.","Chhikara, P.","Ilievski, F."],"bibbaseid":"zhang-khayatkhoei-chhikara-ilievski-visualcroppingimproveszeroshotquestionansweringofmultimodallargelanguagemodels-2023","role":"author","urls":{" paper":"https://openreview.net/pdf?id=YrYcoV2dAk"," link":"https://neurips.cc/virtual/2023/76680"},"metadata":{"authorlinks":{}}},"bibtype":"inproceedings","biburl":"https://bibbase.org/f/t575wpByatfqCc36x/mkhayat-2023.bib","dataSources":["pD7Fen8gEB6sGt3k6"],"keywords":[],"search_terms":["visual","cropping","improves","zero","shot","question","answering","multimodal","large","language","models","zhang","khayatkhoei","chhikara","ilievski"],"title":"Visual Cropping Improves Zero-Shot Question Answering of Multimodal Large Language Models","year":2023}