PREDILECT: Preferences Delineated with Zero-Shot Language-based Reasoning in Reinforcement Learning. Holk, S., Marta, D., & Leite, I. CoRR, 2024.
Links: Paper | doi | bibtex

@article{DBLP:journals/corr/abs-2402-15420,
author = {Simon Holk and
Daniel Marta and
Iolanda Leite},
title = {{PREDILECT:} Preferences Delineated with Zero-Shot Language-based
Reasoning in Reinforcement Learning},
journal = {CoRR},
volume = {abs/2402.15420},
year = {2024},
url = {https://doi.org/10.48550/arXiv.2402.15420},
doi = {10.48550/ARXIV.2402.15420},
eprinttype = {arXiv},
eprint = {2402.15420},
timestamp = {Fri, 22 Mar 2024 00:00:00 +0100},
biburl = {https://dblp.org/rec/journals/corr/abs-2402-15420.bib},
bibsource = {dblp computer science bibliography, https://dblp.org}
}
Downloads: 0
{"_id":"Aa57cY7JGfKt6mCja","bibbaseid":"holk-marta-leite-predilectpreferencesdelineatedwithzeroshotlanguagebasedreasoninginreinforcementlearning-2024","author_short":["Holk, S.","Marta, D.","Leite, I."],"bibdata":{"bibtype":"article","type":"article","author":[{"firstnames":["Simon"],"propositions":[],"lastnames":["Holk"],"suffixes":[]},{"firstnames":["Daniel"],"propositions":[],"lastnames":["Marta"],"suffixes":[]},{"firstnames":["Iolanda"],"propositions":[],"lastnames":["Leite"],"suffixes":[]}],"title":"PREDILECT: Preferences Delineated with Zero-Shot Language-based Reasoning in Reinforcement Learning","journal":"CoRR","volume":"abs/2402.15420","year":"2024","url":"https://doi.org/10.48550/arXiv.2402.15420","doi":"10.48550/ARXIV.2402.15420","eprinttype":"arXiv","eprint":"2402.15420","timestamp":"Fri, 22 Mar 2024 00:00:00 +0100","biburl":"https://dblp.org/rec/journals/corr/abs-2402-15420.bib","bibsource":"dblp computer science bibliography, https://dblp.org","bibtex":"@article{DBLP:journals/corr/abs-2402-15420,\n author = {Simon Holk and\n Daniel Marta and\n Iolanda Leite},\n title = {{PREDILECT:} Preferences Delineated with Zero-Shot Language-based\n Reasoning in Reinforcement Learning},\n journal = {CoRR},\n volume = {abs/2402.15420},\n year = {2024},\n url = {https://doi.org/10.48550/arXiv.2402.15420},\n doi = {10.48550/ARXIV.2402.15420},\n eprinttype = {arXiv},\n eprint = {2402.15420},\n timestamp = {Fri, 22 Mar 2024 00:00:00 +0100},\n biburl = {https://dblp.org/rec/journals/corr/abs-2402-15420.bib},\n bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n","author_short":["Holk, S.","Marta, D.","Leite, I."],"key":"DBLP:journals/corr/abs-2402-15420","id":"DBLP:journals/corr/abs-2402-15420","bibbaseid":"holk-marta-leite-predilectpreferencesdelineatedwithzeroshotlanguagebasedreasoninginreinforcementlearning-2024","role":"author","urls":{"Paper":"https://doi.org/10.48550/arXiv.2402.15420"},"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"https://dblp.org/pid/23/6349.bib","dataSources":["x6aKtNirHZnXYoeQo"],"keywords":[],"search_terms":["predilect","preferences","delineated","zero","shot","language","based","reasoning","reinforcement","learning","holk","marta","leite"],"title":"PREDILECT: Preferences Delineated with Zero-Shot Language-based Reasoning in Reinforcement Learning","year":2024}