Scaling Instruction-Finetuned Language Models. Chung, H. W., Hou, L., Longpre, S., Zoph, B., Tay, Y., Fedus, W., Li, Y., Wang, X., Dehghani, M., Brahma, S., Webson, A., Gu, S. S., Dai, Z., Suzgun, M., Chen, X., Chowdhery, A., Castro-Ros, A., Pellat, M., Robinson, K., Valter, D., Narang, S., Mishra, G., Yu, A., Zhao, V. Y., Huang, Y., Dai, A. M., Yu, H., Petrov, S., Chi, E. H., Dean, J., Devlin, J., Roberts, A., Zhou, D., Le, Q. V., & Wei, J. J. Mach. Learn. Res., 25:70:1–70:53, 2024. Paper bibtex @article{DBLP:journals/jmlr/ChungHLZTFL00BW24,
author = {Hyung Won Chung and
Le Hou and
Shayne Longpre and
Barret Zoph and
Yi Tay and
William Fedus and
Yunxuan Li and
Xuezhi Wang and
Mostafa Dehghani and
Siddhartha Brahma and
Albert Webson and
Shixiang Shane Gu and
Zhuyun Dai and
Mirac Suzgun and
Xinyun Chen and
Aakanksha Chowdhery and
Alex Castro{-}Ros and
Marie Pellat and
Kevin Robinson and
Dasha Valter and
Sharan Narang and
Gaurav Mishra and
Adams Yu and
Vincent Y. Zhao and
Yanping Huang and
Andrew M. Dai and
Hongkun Yu and
Slav Petrov and
Ed H. Chi and
Jeff Dean and
Jacob Devlin and
Adam Roberts and
Denny Zhou and
Quoc V. Le and
Jason Wei},
title = {Scaling Instruction-Finetuned Language Models},
journal = {J. Mach. Learn. Res.},
volume = {25},
pages = {70:1--70:53},
year = {2024},
url = {https://jmlr.org/papers/v25/23-0870.html},
timestamp = {Mon, 16 Sep 2024 01:00:00 +0200},
biburl = {https://dblp.org/rec/journals/jmlr/ChungHLZTFL00BW24.bib},
bibsource = {dblp computer science bibliography, https://dblp.org}
}
Downloads: 0
{"_id":"7T8zXdyAXEs9jbgEH","bibbaseid":"chung-hou-longpre-zoph-tay-fedus-li-wang-etal-scalinginstructionfinetunedlanguagemodels-2024","author_short":["Chung, H. W.","Hou, L.","Longpre, S.","Zoph, B.","Tay, Y.","Fedus, W.","Li, Y.","Wang, X.","Dehghani, M.","Brahma, S.","Webson, A.","Gu, S. S.","Dai, Z.","Suzgun, M.","Chen, X.","Chowdhery, A.","Castro-Ros, A.","Pellat, M.","Robinson, K.","Valter, D.","Narang, S.","Mishra, G.","Yu, A.","Zhao, V. Y.","Huang, Y.","Dai, A. M.","Yu, H.","Petrov, S.","Chi, E. H.","Dean, J.","Devlin, J.","Roberts, A.","Zhou, D.","Le, Q. V.","Wei, J."],"bibdata":{"bibtype":"article","type":"article","author":[{"firstnames":["Hyung","Won"],"propositions":[],"lastnames":["Chung"],"suffixes":[]},{"firstnames":["Le"],"propositions":[],"lastnames":["Hou"],"suffixes":[]},{"firstnames":["Shayne"],"propositions":[],"lastnames":["Longpre"],"suffixes":[]},{"firstnames":["Barret"],"propositions":[],"lastnames":["Zoph"],"suffixes":[]},{"firstnames":["Yi"],"propositions":[],"lastnames":["Tay"],"suffixes":[]},{"firstnames":["William"],"propositions":[],"lastnames":["Fedus"],"suffixes":[]},{"firstnames":["Yunxuan"],"propositions":[],"lastnames":["Li"],"suffixes":[]},{"firstnames":["Xuezhi"],"propositions":[],"lastnames":["Wang"],"suffixes":[]},{"firstnames":["Mostafa"],"propositions":[],"lastnames":["Dehghani"],"suffixes":[]},{"firstnames":["Siddhartha"],"propositions":[],"lastnames":["Brahma"],"suffixes":[]},{"firstnames":["Albert"],"propositions":[],"lastnames":["Webson"],"suffixes":[]},{"firstnames":["Shixiang","Shane"],"propositions":[],"lastnames":["Gu"],"suffixes":[]},{"firstnames":["Zhuyun"],"propositions":[],"lastnames":["Dai"],"suffixes":[]},{"firstnames":["Mirac"],"propositions":[],"lastnames":["Suzgun"],"suffixes":[]},{"firstnames":["Xinyun"],"propositions":[],"lastnames":["Chen"],"suffixes":[]},{"firstnames":["Aakanksha"],"propositions":[],"lastnames":["Chowdhery"],"suffixes":[]},{"firstnames":["Alex"],"propositions":[],"lastnames":["Castro-Ros"],"suffixes":[]},{"firstnames":["Marie"],"propositions":[],"lastnames":["Pellat"],"suffixes":[]},{"firstnames":["Kevin"],"propositions":[],"lastnames":["Robinson"],"suffixes":[]},{"firstnames":["Dasha"],"propositions":[],"lastnames":["Valter"],"suffixes":[]},{"firstnames":["Sharan"],"propositions":[],"lastnames":["Narang"],"suffixes":[]},{"firstnames":["Gaurav"],"propositions":[],"lastnames":["Mishra"],"suffixes":[]},{"firstnames":["Adams"],"propositions":[],"lastnames":["Yu"],"suffixes":[]},{"firstnames":["Vincent","Y."],"propositions":[],"lastnames":["Zhao"],"suffixes":[]},{"firstnames":["Yanping"],"propositions":[],"lastnames":["Huang"],"suffixes":[]},{"firstnames":["Andrew","M."],"propositions":[],"lastnames":["Dai"],"suffixes":[]},{"firstnames":["Hongkun"],"propositions":[],"lastnames":["Yu"],"suffixes":[]},{"firstnames":["Slav"],"propositions":[],"lastnames":["Petrov"],"suffixes":[]},{"firstnames":["Ed","H."],"propositions":[],"lastnames":["Chi"],"suffixes":[]},{"firstnames":["Jeff"],"propositions":[],"lastnames":["Dean"],"suffixes":[]},{"firstnames":["Jacob"],"propositions":[],"lastnames":["Devlin"],"suffixes":[]},{"firstnames":["Adam"],"propositions":[],"lastnames":["Roberts"],"suffixes":[]},{"firstnames":["Denny"],"propositions":[],"lastnames":["Zhou"],"suffixes":[]},{"firstnames":["Quoc","V."],"propositions":[],"lastnames":["Le"],"suffixes":[]},{"firstnames":["Jason"],"propositions":[],"lastnames":["Wei"],"suffixes":[]}],"title":"Scaling Instruction-Finetuned Language Models","journal":"J. Mach. Learn. Res.","volume":"25","pages":"70:1–70:53","year":"2024","url":"https://jmlr.org/papers/v25/23-0870.html","timestamp":"Mon, 16 Sep 2024 01:00:00 +0200","biburl":"https://dblp.org/rec/journals/jmlr/ChungHLZTFL00BW24.bib","bibsource":"dblp computer science bibliography, https://dblp.org","bibtex":"@article{DBLP:journals/jmlr/ChungHLZTFL00BW24,\n author = {Hyung Won Chung and\n Le Hou and\n Shayne Longpre and\n Barret Zoph and\n Yi Tay and\n William Fedus and\n Yunxuan Li and\n Xuezhi Wang and\n Mostafa Dehghani and\n Siddhartha Brahma and\n Albert Webson and\n Shixiang Shane Gu and\n Zhuyun Dai and\n Mirac Suzgun and\n Xinyun Chen and\n Aakanksha Chowdhery and\n Alex Castro{-}Ros and\n Marie Pellat and\n Kevin Robinson and\n Dasha Valter and\n Sharan Narang and\n Gaurav Mishra and\n Adams Yu and\n Vincent Y. Zhao and\n Yanping Huang and\n Andrew M. Dai and\n Hongkun Yu and\n Slav Petrov and\n Ed H. Chi and\n Jeff Dean and\n Jacob Devlin and\n Adam Roberts and\n Denny Zhou and\n Quoc V. Le and\n Jason Wei},\n title = {Scaling Instruction-Finetuned Language Models},\n journal = {J. Mach. Learn. Res.},\n volume = {25},\n pages = {70:1--70:53},\n year = {2024},\n url = {https://jmlr.org/papers/v25/23-0870.html},\n timestamp = {Mon, 16 Sep 2024 01:00:00 +0200},\n biburl = {https://dblp.org/rec/journals/jmlr/ChungHLZTFL00BW24.bib},\n bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n","author_short":["Chung, H. W.","Hou, L.","Longpre, S.","Zoph, B.","Tay, Y.","Fedus, W.","Li, Y.","Wang, X.","Dehghani, M.","Brahma, S.","Webson, A.","Gu, S. S.","Dai, Z.","Suzgun, M.","Chen, X.","Chowdhery, A.","Castro-Ros, A.","Pellat, M.","Robinson, K.","Valter, D.","Narang, S.","Mishra, G.","Yu, A.","Zhao, V. Y.","Huang, Y.","Dai, A. M.","Yu, H.","Petrov, S.","Chi, E. H.","Dean, J.","Devlin, J.","Roberts, A.","Zhou, D.","Le, Q. V.","Wei, J."],"key":"DBLP:journals/jmlr/ChungHLZTFL00BW24","id":"DBLP:journals/jmlr/ChungHLZTFL00BW24","bibbaseid":"chung-hou-longpre-zoph-tay-fedus-li-wang-etal-scalinginstructionfinetunedlanguagemodels-2024","role":"author","urls":{"Paper":"https://jmlr.org/papers/v25/23-0870.html"},"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"http://dblp.org/pers/tb2/d/Dean:Jeffrey","dataSources":["rMEZSGRpGTSfEZaHM"],"keywords":[],"search_terms":["scaling","instruction","finetuned","language","models","chung","hou","longpre","zoph","tay","fedus","li","wang","dehghani","brahma","webson","gu","dai","suzgun","chen","chowdhery","castro-ros","pellat","robinson","valter","narang","mishra","yu","zhao","huang","dai","yu","petrov","chi","dean","devlin","roberts","zhou","le","wei"],"title":"Scaling Instruction-Finetuned Language Models","year":2024}