TeaMs-RL: Teaching LLMs to Generate Better Instruction Datasets via Reinforcement Learning. Gu, S., Knoll, A., & Jin, M. Transactions on Machine Learning Research, 2024.
Arxiv bibtex
% Journal article entry. Braced words in the title keep their capitalisation
% under styles that sentence-case titles. url_arXiv is not a standard BibTeX
% field (standard styles ignore unknown fields); it is kept unchanged, and the
% same arXiv identifier is also given in the eprint/archiveprefix fields.
@article{2024_4J_Teams,
  author        = {Gu, Shangding and Knoll, Alois and Jin, Ming},
  title         = {{TeaMs-RL}: Teaching {LLMs} to Generate Better Instruction Datasets via Reinforcement Learning},
  journal       = {Transactions on Machine Learning Research},
  year          = {2024},
  eprint        = {2403.08694},
  archiveprefix = {arXiv},
  url_arXiv     = {https://arxiv.org/abs/2403.08694},
}
Downloads: 0
{"_id":"J452nzW4mir3nEKnE","bibbaseid":"gu-knoll-jin-teamsrlteachingllmstogeneratebetterinstructiondatasetsviareinforcementlearning-2024","author_short":["Gu, S.","Knoll, A.","Jin, M."],"bibdata":{"bibtype":"article","type":"article","title":"TeaMs-RL: Teaching LLMs to Generate Better Instruction Datasets via Reinforcement Learning","author":[{"propositions":[],"lastnames":["Gu"],"firstnames":["Shangding"],"suffixes":[]},{"propositions":[],"lastnames":["Knoll"],"firstnames":["Alois"],"suffixes":[]},{"propositions":[],"lastnames":["Jin"],"firstnames":["Ming"],"suffixes":[]}],"journal":"Transactions on Machine Learning Research","year":"2024","url_arxiv":"https://arxiv.org/abs/2403.08694","bibtex":"@article{2024_4J_Teams,\n title={TeaMs-RL: Teaching LLMs to Generate Better Instruction Datasets via Reinforcement Learning},\n author={Gu, Shangding and Knoll, Alois and Jin, Ming},\n journal ={Transactions on Machine Learning Research},\n year={2024},\nurl_arXiv = {https://arxiv.org/abs/2403.08694}\n}\n\n","author_short":["Gu, S.","Knoll, A.","Jin, M."],"key":"2024_4J_Teams","id":"2024_4J_Teams","bibbaseid":"gu-knoll-jin-teamsrlteachingllmstogeneratebetterinstructiondatasetsviareinforcementlearning-2024","role":"author","urls":{" arxiv":"https://arxiv.org/abs/2403.08694"},"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"http://www.jinming.tech/papers/myref.bib","dataSources":["sTzDHHaipTZWjp8oe"],"keywords":[],"search_terms":["teams","teaching","llms","generate","better","instruction","datasets","via","reinforcement","learning","gu","knoll","jin"],"title":"TeaMs-RL: Teaching LLMs to Generate Better Instruction Datasets via Reinforcement Learning","year":2024}