Improving Stability of Fine-Tuning Pretrained Language Models via Component-Wise Gradient Norm Clipping. Yang, C. & Ma, X. In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, pages 4854–4859, Abu Dhabi, United Arab Emirates, December, 2022. Association for Computational Linguistics. bibtex @inproceedings{yang-ma-2022-improving,
title = "Improving Stability of Fine-Tuning Pretrained Language Models via Component-Wise Gradient Norm Clipping",
author = "Yang, Chenghao and
Ma, Xuezhe",
booktitle = "Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates",
publisher = "Association for Computational Linguistics",
pages = "4854--4859",
}
Downloads: 0
{"_id":"ikwfd8S3H7S6oYWd5","bibbaseid":"yang-ma-improvingstabilityoffinetuningpretrainedlanguagemodelsviacomponentwisegradientnormclipping-2022","author_short":["Yang, C.","Ma, X."],"bibdata":{"bibtype":"inproceedings","type":"inproceedings","title":"Improving Stability of Fine-Tuning Pretrained Language Models via Component-Wise Gradient Norm Clipping","author":[{"propositions":[],"lastnames":["Yang"],"firstnames":["Chenghao"],"suffixes":[]},{"propositions":[],"lastnames":["Ma"],"firstnames":["Xuezhe"],"suffixes":[]}],"booktitle":"Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing","month":"December","year":"2022","address":"Abu Dhabi, United Arab Emirates","publisher":"Association for Computational Linguistics","pages":"4854–4859","bibtex":"@inproceedings{yang-ma-2022-improving,\n title = \"Improving Stability of Fine-Tuning Pretrained Language Models via Component-Wise Gradient Norm Clipping\",\n author = \"Yang, Chenghao and\n Ma, Xuezhe\",\n booktitle = \"Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing\",\n month = dec,\n year = \"2022\",\n address = \"Abu Dhabi, United Arab Emirates\",\n publisher = \"Association for Computational Linguistics\",\n pages = \"4854--4859\",\n}\n\n","author_short":["Yang, C.","Ma, X."],"bibbaseid":"yang-ma-improvingstabilityoffinetuningpretrainedlanguagemodelsviacomponentwisegradientnormclipping-2022","role":"author","urls":{},"metadata":{"authorlinks":{}}},"bibtype":"inproceedings","biburl":"https://bibbase.org/f/YKbTDpde2bBRHksm9/xuezhema-2023.bib","dataSources":["2oPPiCceKA3b52FNr","7qxSz9j9uMDqsXnhD"],"keywords":[],"search_terms":["improving","stability","fine","tuning","pretrained","language","models","via","component","wise","gradient","norm","clipping","yang","ma"],"title":"Improving Stability of Fine-Tuning Pretrained Language Models via Component-Wise Gradient Norm Clipping","year":2022}