Generalizability of NLP-based Models for Modern Software Development Cross-Domain Environments. Krasniqi, R. & Do, H. In 2023 IEEE/ACM 2nd International Workshop on Natural Language-Based Software Engineering (NLBSE) co-located with ICSE, pages 11–13, Melbourne, Australia, May, 2023. IEEE. Paper doi abstract bibtex Natural Language Processing (NLP) has shown to be effective for solving complex problems in the Software Engineering (SE) domain, such as building chatbots and its ability to translate multi-languages. Despite the advances allowed by NLP, there are technical loopholes that hinder its fullest potential within the SE domain. The open problem remains in their generalizability for modern software development tasks that typically operate in a dynamic environment, such as AWS and SaaS platforms. The problem with these setups is that they may not contain labeled data. This poses a challenge when applying most prominent data-centric NLP models such as BERT transformer models. This position paper highlights some of the most pressing challenges drawn between the intersection of NLP and SE domains. Our vision revolves around improving the NLP model generalizability for dynamic cross-domain environments that contain little or no labeled target-domain data. We discuss these challenges and propose a research roadmap to tackle this problem as a research community emanating from SE lenses.
@inproceedings{krasniqi_generalizability_2023,
address = {Melbourne, Australia},
title = {Generalizability of {NLP}-based {Models} for {Modern} {Software} {Development} {Cross}-{Domain} {Environments}},
isbn = {9798350301786},
url = {https://ieeexplore.ieee.org/document/10189135/},
doi = {10.1109/NLBSE59153.2023.00009},
abstract = {Natural Language Processing (NLP) has shown to be effective for solving complex problems in the Software Engineering (SE) domain, such as building chatbots and its ability to translate multi-languages. Despite the advances allowed by NLP, there are technical loopholes that hinder its fullest potential within the SE domain. The open problem remains in their generalizability for modern software development tasks that typically operate in a dynamic environment, such as AWS and SaaS platforms. The problem with these setups is that they may not contain labeled data. This poses a challenge when applying most prominent data-centric NLP models such as BERT transformer models. This position paper highlights some of the most pressing challenges drawn between the intersection of NLP and SE domains. Our vision revolves around improving the NLP model generalizability for dynamic cross-domain environments that contain little or no labeled target-domain data. We discuss these challenges and propose a research roadmap to tackle this problem as a research community emanating from SE lenses.},
urldate = {2023-07-30},
booktitle = {2023 {IEEE}/{ACM} 2nd {International} {Workshop} on {Natural} {Language}-{Based} {Software} {Engineering} ({NLBSE}) co-located with {ICSE}},
publisher = {IEEE},
author = {Krasniqi, Rrezarta and Do, Hyunsook},
month = may,
year = {2023},
keywords = {Conference Workshop Papers},
pages = {11--13},
}
Downloads: 0
{"_id":"aMFRsputiXwzCupoA","bibbaseid":"krasniqi-do-generalizabilityofnlpbasedmodelsformodernsoftwaredevelopmentcrossdomainenvironments-2023","author_short":["Krasniqi, R.","Do, H."],"bibdata":{"bibtype":"inproceedings","type":"inproceedings","address":"Melbourne, Australia","title":"Generalizability of NLP-based Models for Modern Software Development Cross-Domain Environments","isbn":"9798350301786","url":"https://ieeexplore.ieee.org/document/10189135/","doi":"10.1109/NLBSE59153.2023.00009","abstract":"Natural Language Processing (NLP) has shown to be effective for solving complex problems in the Software Engineering (SE) domain, such as building chatbots and its ability to translate multi-languages. Despite the advances allowed by NLP, there are technical loopholes that hinder its fullest potential within the SE domain. The open problem remains in their generalizability for modern software development tasks that typically operate in a dynamic environment, such as AWS and SaaS platforms. The problem with these setups is that they may not contain labeled data. This poses a challenge when applying most prominent data-centric NLP models such as BERT transformer models. This position paper highlights some of the most pressing challenges drawn between the intersection of NLP and SE domains. Our vision revolves around improving the NLP model generalizability for dynamic cross-domain environments that contain little or no labeled target-domain data. We discuss these challenges and propose a research roadmap to tackle this problem as a research community emanating from SE lenses.","urldate":"2023-07-30","booktitle":"2023 IEEE/ACM 2nd International Workshop on Natural Language-Based Software Engineering (NLBSE) co-located with ICSE","publisher":"IEEE","author":[{"propositions":[],"lastnames":["Krasniqi"],"firstnames":["Rrezarta"],"suffixes":[]},{"propositions":[],"lastnames":["Do"],"firstnames":["Hyunsook"],"suffixes":[]}],"month":"May","year":"2023","keywords":"Conference Workshop Papers","pages":"11–13","bibtex":"@inproceedings{krasniqi_generalizability_2023,\n\taddress = {Melbourne, Australia},\n\ttitle = {Generalizability of {NLP}-based {Models} for {Modern} {Software} {Development} {Cross}-{Domain} {Environments}},\n\tisbn = {9798350301786},\n\turl = {https://ieeexplore.ieee.org/document/10189135/},\n\tdoi = {10.1109/NLBSE59153.2023.00009},\n\tabstract = {Natural Language Processing (NLP) has shown to be effective for solving complex problems in the Software Engineering (SE) domain, such as building chatbots and its ability to translate multi-languages. Despite the advances allowed by NLP, there are technical loopholes that hinder its fullest potential within the SE domain. The open problem remains in their generalizability for modern software development tasks that typically operate in a dynamic environment, such as AWS and SaaS platforms. The problem with these setups is that they may not contain labeled data. This poses a challenge when applying most prominent data-centric NLP models such as BERT transformer models. This position paper highlights some of the most pressing challenges drawn between the intersection of NLP and SE domains. Our vision revolves around improving the NLP model generalizability for dynamic cross-domain environments that contain little or no labeled target-domain data. We discuss these challenges and propose a research roadmap to tackle this problem as a research community emanating from SE lenses.},\n\turldate = {2023-07-30},\n\tbooktitle = {2023 {IEEE}/{ACM} 2nd {International} {Workshop} on {Natural} {Language}-{Based} {Software} {Engineering} ({NLBSE}) co-located with {ICSE}},\n\tpublisher = {IEEE},\n\tauthor = {Krasniqi, Rrezarta and Do, Hyunsook},\n\tmonth = may,\n\tyear = {2023},\n\tkeywords = {Conference Workshop Papers},\n\tpages = {11--13},\n}\n\n","author_short":["Krasniqi, R.","Do, H."],"key":"krasniqi_generalizability_2023","id":"krasniqi_generalizability_2023","bibbaseid":"krasniqi-do-generalizabilityofnlpbasedmodelsformodernsoftwaredevelopmentcrossdomainenvironments-2023","role":"author","urls":{"Paper":"https://ieeexplore.ieee.org/document/10189135/"},"keyword":["Conference Workshop Papers"],"metadata":{"authorlinks":{}}},"bibtype":"inproceedings","biburl":"https://api.zotero.org/users/10198036/collections/2RHJXKSI/items?key=X0RoN8iO9RtTbrWfSkRasb7b&format=bibtex&limit=100","dataSources":["JHDShjsHrs6ZHE4bz","37aX9ioouEvzbunGp"],"keywords":["conference workshop papers"],"search_terms":["generalizability","nlp","based","models","modern","software","development","cross","domain","environments","krasniqi","do"],"title":"Generalizability of NLP-based Models for Modern Software Development Cross-Domain Environments","year":2023}