LAION-5B: An open large-scale dataset for training next generation image-text models. Schuhmann, C., Beaumont, R., Vencu, R., Gordon, C., Wightman, R., Cherti, M., Coombes, T., Katta, A., Mullis, C., Wortsman, M., Schramowski, P., Kundurthy, S., Crowson, K., Schmidt, L., Kaczmarczyk, R., & Jitsev, J. In Advances in Neural Information Processing Systems, volume 35, pages 25278–25294, December, 2022.
Paper bibtex @inproceedings{schuhmann_laion-5b_2022,
title = {{LAION}-{5B}: {An} open large-scale dataset for training next generation image-text models},
volume = {35},
shorttitle = {{LAION}-{5B}},
url = {https://papers.nips.cc/paper_files/paper/2022/hash/a1859debfb3b59d094f3504d5ebb6c25-Abstract-Datasets_and_Benchmarks.html},
language = {en},
urldate = {2023-08-16},
booktitle = {Advances in {Neural} {Information} {Processing} {Systems}},
author = {Schuhmann, Christoph and Beaumont, Romain and Vencu, Richard and Gordon, Cade and Wightman, Ross and Cherti, Mehdi and Coombes, Theo and Katta, Aarush and Mullis, Clayton and Wortsman, Mitchell and Schramowski, Patrick and Kundurthy, Srivatsa and Crowson, Katherine and Schmidt, Ludwig and Kaczmarczyk, Robert and Jitsev, Jenia},
month = dec,
year = {2022},
keywords = {\#LLM, \#Multi-Modal, \#NIPS{\textgreater}22, \#NLP, \#Vision, /unread, ❤️},
pages = {25278--25294},
}
Downloads: 0
{"_id":"rDENRqy66LJgtec3f","bibbaseid":"schuhmann-beaumont-vencu-gordon-wightman-cherti-coombes-katta-etal-laion5banopenlargescaledatasetfortrainingnextgenerationimagetextmodels-2022","author_short":["Schuhmann, C.","Beaumont, R.","Vencu, R.","Gordon, C.","Wightman, R.","Cherti, M.","Coombes, T.","Katta, A.","Mullis, C.","Wortsman, M.","Schramowski, P.","Kundurthy, S.","Crowson, K.","Schmidt, L.","Kaczmarczyk, R.","Jitsev, J."],"bibdata":{"bibtype":"inproceedings","type":"inproceedings","title":"LAION-5B: An open large-scale dataset for training next generation image-text models","volume":"35","shorttitle":"LAION-5B","url":"https://papers.nips.cc/paper_files/paper/2022/hash/a1859debfb3b59d094f3504d5ebb6c25-Abstract-Datasets_and_Benchmarks.html","language":"en","urldate":"2023-08-16","booktitle":"Advances in Neural Information Processing Systems","author":[{"propositions":[],"lastnames":["Schuhmann"],"firstnames":["Christoph"],"suffixes":[]},{"propositions":[],"lastnames":["Beaumont"],"firstnames":["Romain"],"suffixes":[]},{"propositions":[],"lastnames":["Vencu"],"firstnames":["Richard"],"suffixes":[]},{"propositions":[],"lastnames":["Gordon"],"firstnames":["Cade"],"suffixes":[]},{"propositions":[],"lastnames":["Wightman"],"firstnames":["Ross"],"suffixes":[]},{"propositions":[],"lastnames":["Cherti"],"firstnames":["Mehdi"],"suffixes":[]},{"propositions":[],"lastnames":["Coombes"],"firstnames":["Theo"],"suffixes":[]},{"propositions":[],"lastnames":["Katta"],"firstnames":["Aarush"],"suffixes":[]},{"propositions":[],"lastnames":["Mullis"],"firstnames":["Clayton"],"suffixes":[]},{"propositions":[],"lastnames":["Wortsman"],"firstnames":["Mitchell"],"suffixes":[]},{"propositions":[],"lastnames":["Schramowski"],"firstnames":["Patrick"],"suffixes":[]},{"propositions":[],"lastnames":["Kundurthy"],"firstnames":["Srivatsa"],"suffixes":[]},{"propositions":[],"lastnames":["Crowson"],"firstnames":["Katherine"],"suffixes":[]},{"propositions":[],"lastnames":["Schmidt"],"firstnames":
["Ludwig"],"suffixes":[]},{"propositions":[],"lastnames":["Kaczmarczyk"],"firstnames":["Robert"],"suffixes":[]},{"propositions":[],"lastnames":["Jitsev"],"firstnames":["Jenia"],"suffixes":[]}],"month":"December","year":"2022","keywords":"#LLM, #Multi-Modal, #NIPS\\textgreater22, #NLP, #Vision, /unread, ❤️","pages":"25278–25294","bibtex":"@inproceedings{schuhmann_laion-5b_2022,\n\ttitle = {{LAION}-{5B}: {An} open large-scale dataset for training next generation image-text models},\n\tvolume = {35},\n\tshorttitle = {{LAION}-{5B}},\n\turl = {https://papers.nips.cc/paper_files/paper/2022/hash/a1859debfb3b59d094f3504d5ebb6c25-Abstract-Datasets_and_Benchmarks.html},\n\tlanguage = {en},\n\turldate = {2023-08-16},\n\tbooktitle = {Advances in {Neural} {Information} {Processing} {Systems}},\n\tauthor = {Schuhmann, Christoph and Beaumont, Romain and Vencu, Richard and Gordon, Cade and Wightman, Ross and Cherti, Mehdi and Coombes, Theo and Katta, Aarush and Mullis, Clayton and Wortsman, Mitchell and Schramowski, Patrick and Kundurthy, Srivatsa and Crowson, Katherine and Schmidt, Ludwig and Kaczmarczyk, Robert and Jitsev, Jenia},\n\tmonth = dec,\n\tyear = {2022},\n\tkeywords = {\\#LLM, \\#Multi-Modal, \\#NIPS{\\textgreater}22, \\#NLP, \\#Vision, /unread, ❤️},\n\tpages = {25278--25294},\n}\n\n\n\n","author_short":["Schuhmann, C.","Beaumont, R.","Vencu, R.","Gordon, C.","Wightman, R.","Cherti, M.","Coombes, T.","Katta, A.","Mullis, C.","Wortsman, M.","Schramowski, P.","Kundurthy, S.","Crowson, K.","Schmidt, L.","Kaczmarczyk, R.","Jitsev, J."],
"key":"schuhmann_laion-5b_2022","id":"schuhmann_laion-5b_2022","bibbaseid":"schuhmann-beaumont-vencu-gordon-wightman-cherti-coombes-katta-etal-laion5banopenlargescaledatasetfortrainingnextgenerationimagetextmodels-2022","role":"author","urls":{"Paper":"https://papers.nips.cc/paper_files/paper/2022/hash/a1859debfb3b59d094f3504d5ebb6c25-Abstract-Datasets_and_Benchmarks.html"},"keyword":["#LLM","#Multi-Modal","#NIPS\\textgreater22","#NLP","#Vision","/unread","❤️"],"metadata":{"authorlinks":{}},"downloads":0,"html":""},"bibtype":"inproceedings","biburl":"https://bibbase.org/zotero/zzhenry2012","dataSources":["nZHrFJKyxKKDaWYM8"],"keywords":["#llm","#multi-modal","#nips\\textgreater22","#nlp","#vision","/unread","❤️"],"search_terms":["laion","open","large","scale","dataset","training","next","generation","image","text","models","schuhmann","beaumont","vencu","gordon","wightman","cherti","coombes","katta","mullis","wortsman","schramowski","kundurthy","crowson","schmidt","kaczmarczyk","jitsev"],"title":"LAION-5B: An open large-scale dataset for training next generation image-text models","year":2022}