Scaling Instruction-Finetuned Language Models. Chung, H. W., Hou, L., Longpre, S., Zoph, B., Tay, Y., Fedus, W., Li, Y., Wang, X., Dehghani, M., Brahma, S., Webson, A., Gu, S. S., Dai, Z., Suzgun, M., Chen, X., Chowdhery, A., Castro-Ros, A., Pellat, M., Robinson, K., Valter, D., Narang, S., Mishra, G., Yu, A., Zhao, V. Y., Huang, Y., Dai, A. M., Yu, H., Petrov, S., Chi, E. H., Dean, J., Devlin, J., Roberts, A., Zhou, D., Le, Q. V., & Wei, J. J. Mach. Learn. Res., 25:70:1–70:53, 2024.  
Paper  bibtex   @article{DBLP:journals/jmlr/ChungHLZTFL00BW24,
  author       = {Hyung Won Chung and
                  Le Hou and
                  Shayne Longpre and
                  Barret Zoph and
                  Yi Tay and
                  William Fedus and
                  Yunxuan Li and
                  Xuezhi Wang and
                  Mostafa Dehghani and
                  Siddhartha Brahma and
                  Albert Webson and
                  Shixiang Shane Gu and
                  Zhuyun Dai and
                  Mirac Suzgun and
                  Xinyun Chen and
                  Aakanksha Chowdhery and
                  Alex Castro{-}Ros and
                  Marie Pellat and
                  Kevin Robinson and
                  Dasha Valter and
                  Sharan Narang and
                  Gaurav Mishra and
                  Adams Yu and
                  Vincent Y. Zhao and
                  Yanping Huang and
                  Andrew M. Dai and
                  Hongkun Yu and
                  Slav Petrov and
                  Ed H. Chi and
                  Jeff Dean and
                  Jacob Devlin and
                  Adam Roberts and
                  Denny Zhou and
                  Quoc V. Le and
                  Jason Wei},
  title        = {Scaling Instruction-Finetuned Language Models},
  journal      = {J. Mach. Learn. Res.},
  volume       = {25},
  pages        = {70:1--70:53},
  year         = {2024},
  url          = {https://jmlr.org/papers/v25/23-0870.html},
  timestamp    = {Mon, 16 Sep 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/ChungHLZTFL00BW24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
} 
Downloads: 0
{"_id":"eH8cAdSQp8Y4cdssx","bibbaseid":"chung-hou-longpre-zoph-tay-fedus-li-wang-etal-scalinginstructionfinetunedlanguagemodels-2024","author_short":["Chung, H. W.","Hou, L.","Longpre, S.","Zoph, B.","Tay, Y.","Fedus, W.","Li, Y.","Wang, X.","Dehghani, M.","Brahma, S.","Webson, A.","Gu, S. S.","Dai, Z.","Suzgun, M.","Chen, X.","Chowdhery, A.","Castro-Ros, A.","Pellat, M.","Robinson, K.","Valter, D.","Narang, S.","Mishra, G.","Yu, A.","Zhao, V. Y.","Huang, Y.","Dai, A. M.","Yu, H.","Petrov, S.","Chi, E. H.","Dean, J.","Devlin, J.","Roberts, A.","Zhou, D.","Le, Q. V.","Wei, J."],"bibdata":{"bibtype":"article","type":"article","author":[{"firstnames":["Hyung","Won"],"propositions":[],"lastnames":["Chung"],"suffixes":[]},{"firstnames":["Le"],"propositions":[],"lastnames":["Hou"],"suffixes":[]},{"firstnames":["Shayne"],"propositions":[],"lastnames":["Longpre"],"suffixes":[]},{"firstnames":["Barret"],"propositions":[],"lastnames":["Zoph"],"suffixes":[]},{"firstnames":["Yi"],"propositions":[],"lastnames":["Tay"],"suffixes":[]},{"firstnames":["William"],"propositions":[],"lastnames":["Fedus"],"suffixes":[]},{"firstnames":["Yunxuan"],"propositions":[],"lastnames":["Li"],"suffixes":[]},{"firstnames":["Xuezhi"],"propositions":[],"lastnames":["Wang"],"suffixes":[]},{"firstnames":["Mostafa"],"propositions":[],"lastnames":["Dehghani"],"suffixes":[]},{"firstnames":["Siddhartha"],"propositions":[],"lastnames":["Brahma"],"suffixes":[]},{"firstnames":["Albert"],"propositions":[],"lastnames":["Webson"],"suffixes":[]},{"firstnames":["Shixiang","Shane"],"propositions":[],"lastnames":["Gu"],"suffixes":[]},{"firstnames":["Zhuyun"],"propositions":[],"lastnames":["Dai"],"suffixes":[]},{"firstnames":["Mirac"],"propositions":[],"lastnames":["Suzgun"],"suffixes":[]},{"firstnames":["Xinyun"],"propositions":[],"lastnames":["Chen"],"suffixes":[]},{"firstnames":["Aakanksha"],"propositions":[],"lastnames":["Chowdhery"],"suffixes":[]},{"firstnames":["Alex"],"propositions":[],"lastnames":["Castro-Ros"],"suffixes":[]},{"firstnames":["Marie"],"propositions":[],"lastnames":["Pellat"],"suffixes":[]},{"firstnames":["Kevin"],"propositions":[],"lastnames":["Robinson"],"suffixes":[]},{"firstnames":["Dasha"],"propositions":[],"lastnames":["Valter"],"suffixes":[]},{"firstnames":["Sharan"],"propositions":[],"lastnames":["Narang"],"suffixes":[]},{"firstnames":["Gaurav"],"propositions":[],"lastnames":["Mishra"],"suffixes":[]},{"firstnames":["Adams"],"propositions":[],"lastnames":["Yu"],"suffixes":[]},{"firstnames":["Vincent","Y."],"propositions":[],"lastnames":["Zhao"],"suffixes":[]},{"firstnames":["Yanping"],"propositions":[],"lastnames":["Huang"],"suffixes":[]},{"firstnames":["Andrew","M."],"propositions":[],"lastnames":["Dai"],"suffixes":[]},{"firstnames":["Hongkun"],"propositions":[],"lastnames":["Yu"],"suffixes":[]},{"firstnames":["Slav"],"propositions":[],"lastnames":["Petrov"],"suffixes":[]},{"firstnames":["Ed","H."],"propositions":[],"lastnames":["Chi"],"suffixes":[]},{"firstnames":["Jeff"],"propositions":[],"lastnames":["Dean"],"suffixes":[]},{"firstnames":["Jacob"],"propositions":[],"lastnames":["Devlin"],"suffixes":[]},{"firstnames":["Adam"],"propositions":[],"lastnames":["Roberts"],"suffixes":[]},{"firstnames":["Denny"],"propositions":[],"lastnames":["Zhou"],"suffixes":[]},{"firstnames":["Quoc","V."],"propositions":[],"lastnames":["Le"],"suffixes":[]},{"firstnames":["Jason"],"propositions":[],"lastnames":["Wei"],"suffixes":[]}],"title":"Scaling Instruction-Finetuned Language Models","journal":"J. Mach. Learn. Res.","volume":"25","pages":"70:1–70:53","year":"2024","url":"https://jmlr.org/papers/v25/23-0870.html","timestamp":"Mon, 16 Sep 2024 01:00:00 +0200","biburl":"https://dblp.org/rec/journals/jmlr/ChungHLZTFL00BW24.bib","bibsource":"dblp computer science bibliography, https://dblp.org","bibtex":"@article{DBLP:journals/jmlr/ChungHLZTFL00BW24,\n  author       = {Hyung Won Chung and\n                  Le Hou and\n                  Shayne Longpre and\n                  Barret Zoph and\n                  Yi Tay and\n                  William Fedus and\n                  Yunxuan Li and\n                  Xuezhi Wang and\n                  Mostafa Dehghani and\n                  Siddhartha Brahma and\n                  Albert Webson and\n                  Shixiang Shane Gu and\n                  Zhuyun Dai and\n                  Mirac Suzgun and\n                  Xinyun Chen and\n                  Aakanksha Chowdhery and\n                  Alex Castro{-}Ros and\n                  Marie Pellat and\n                  Kevin Robinson and\n                  Dasha Valter and\n                  Sharan Narang and\n                  Gaurav Mishra and\n                  Adams Yu and\n                  Vincent Y. Zhao and\n                  Yanping Huang and\n                  Andrew M. Dai and\n                  Hongkun Yu and\n                  Slav Petrov and\n                  Ed H. Chi and\n                  Jeff Dean and\n                  Jacob Devlin and\n                  Adam Roberts and\n                  Denny Zhou and\n                  Quoc V. Le and\n                  Jason Wei},\n  title        = {Scaling Instruction-Finetuned Language Models},\n  journal      = {J. Mach. Learn. Res.},\n  volume       = {25},\n  pages        = {70:1--70:53},\n  year         = {2024},\n  url          = {https://jmlr.org/papers/v25/23-0870.html},\n  timestamp    = {Mon, 16 Sep 2024 01:00:00 +0200},\n  biburl       = {https://dblp.org/rec/journals/jmlr/ChungHLZTFL00BW24.bib},\n  bibsource    = {dblp computer science bibliography, https://dblp.org}\n}\n\n","author_short":["Chung, H. W.","Hou, L.","Longpre, S.","Zoph, B.","Tay, Y.","Fedus, W.","Li, Y.","Wang, X.","Dehghani, M.","Brahma, S.","Webson, A.","Gu, S. S.","Dai, Z.","Suzgun, M.","Chen, X.","Chowdhery, A.","Castro-Ros, A.","Pellat, M.","Robinson, K.","Valter, D.","Narang, S.","Mishra, G.","Yu, A.","Zhao, V. Y.","Huang, Y.","Dai, A. M.","Yu, H.","Petrov, S.","Chi, E. H.","Dean, J.","Devlin, J.","Roberts, A.","Zhou, D.","Le, Q. V.","Wei, J."],"key":"DBLP:journals/jmlr/ChungHLZTFL00BW24","id":"DBLP:journals/jmlr/ChungHLZTFL00BW24","bibbaseid":"chung-hou-longpre-zoph-tay-fedus-li-wang-etal-scalinginstructionfinetunedlanguagemodels-2024","role":"author","urls":{"Paper":"https://jmlr.org/papers/v25/23-0870.html"},"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"http://dblp.org/pers/tb2/d/Dean:Jeffrey","dataSources":["rMEZSGRpGTSfEZaHM"],"keywords":[],"search_terms":["scaling","instruction","finetuned","language","models","chung","hou","longpre","zoph","tay","fedus","li","wang","dehghani","brahma","webson","gu","dai","suzgun","chen","chowdhery","castro-ros","pellat","robinson","valter","narang","mishra","yu","zhao","huang","dai","yu","petrov","chi","dean","devlin","roberts","zhou","le","wei"],"title":"Scaling Instruction-Finetuned Language Models","year":2024}