Mining the Lexicon Used by Programmers during Software Evolution. Antoniol, G., Guéhéneuc, Y., Merlo, E., & Tonella, P. In Tahvildari, L. & Canfora, G., editors, Proceedings of the 23rd International Conference on Software Maintenance (ICSM), pages 14–23, October 2007. IEEE CS Press. 10 pages. Paper abstract bibtex Identifiers represent an important source of information for programmers understanding and maintaining a system. Self-documenting identifiers reduce the time and effort necessary to obtain the level of understanding appropriate for the task at hand. While the role of the lexicon in program comprehension has long been recognized, only a few works have studied the quality and enhancement of the identifiers and no works have studied the evolution of the lexicon. In this paper, we characterize the evolution of program identifiers in terms of stability metrics and occurrences of renaming. We assess whether an evolution process similar to the one occurring for the program structure exists for identifiers. We report data and results about the evolution of three large systems, for which several releases are available. We have found evidence that the evolution of the lexicon is more limited and constrained than the evolution of the structure. We argue that the different evolution results from several factors including the lack of advanced tool support for lexicon construction, documentation, and evolution. Finally, we suggest the existence of rules on the co-evolution of structure and lexicon of software systems.
% Conference paper in the ICSM 2007 proceedings. The grant, kind and pdf
% fields are not part of the standard BibTeX field set; standard styles
% ignore fields they do not know, so they act as annotations only.
@INPROCEEDINGS{Antoniol07-ICSM-LexiconEvolution,
  author    = {Antoniol, Giuliano and Gu{\'e}h{\'e}neuc, Yann-Ga{\"e}l and Merlo, Ettore and Tonella, Paolo},
  title     = {Mining the Lexicon Used by Programmers during Software Evolution},
  booktitle = {Proceedings of the 23rd International Conference on Software Maintenance ({ICSM})},
  editor    = {Tahvildari, Ladan and Canfora, Gerardo},
  publisher = {IEEE CS Press},
  pages     = {14--23},
  year      = {2007},
  month     = oct,
  note      = {10 pages.},
  abstract  = {Identifiers represent an important source of information for programmers understanding and maintaining a system. Self-documenting identifiers reduce the time and effort necessary to obtain the level of understanding appropriate for the task at hand. While the role of the lexicon in program comprehension has long been recognized, only a few works have studied the quality and enhancement of the identifiers and no works have studied the evolution of the lexicon. In this paper, we characterize the evolution of program identifiers in terms of stability metrics and occurrences of renaming. We assess whether an evolution process similar to the one occurring for the program structure exists for identifiers. We report data and results about the evolution of three large systems, for which several releases are available. We have found evidence that the evolution of the lexicon is more limited and constrained than the evolution of the structure. We argue that the different evolution results from several factors including the lack of advanced tool support for lexicon construction, documentation, and evolution. Finally, we suggest the existence of rules on the co-evolution of structure and lexicon of software systems.},
  grant     = {NSERC DG},
  keywords  = {Identifier analysis ; ICSM},
  kind      = {MISA},
  language  = {english},
  url       = {http://www.ptidej.net/publications/documents/ICSM07.doc.pdf},
  pdf       = {http://www.ptidej.net/publications/documents/ICSM07.ppt.pdf},
}
Downloads: 0
{"_id":"MgzyGDTKTREAEy2qv","bibbaseid":"antoniol-guhneuc-merlo-tonella-miningthelexiconusedbyprogrammersduringsoftwareevolution-2007","downloads":0,"creationDate":"2018-01-17T20:29:42.536Z","title":"Mining the Lexicon Used by Programmers during Software Evolution","author_short":["Antoniol, G.","Guéhéneuc, Y.","Merlo, E.","Tonella, P."],"year":2007,"bibtype":"inproceedings","biburl":"http://www.yann-gael.gueheneuc.net/Work/BibBase/guehene (automatically cleaned).bib","bibdata":{"bibtype":"inproceedings","type":"inproceedings","author":[{"firstnames":["Giuliano"],"propositions":[],"lastnames":["Antoniol"],"suffixes":[]},{"firstnames":["Yann-Gaël"],"propositions":[],"lastnames":["Guéhéneuc"],"suffixes":[]},{"firstnames":["Ettore"],"propositions":[],"lastnames":["Merlo"],"suffixes":[]},{"firstnames":["Paolo"],"propositions":[],"lastnames":["Tonella"],"suffixes":[]}],"title":"Mining the Lexicon Used by Programmers during Software Evolution","booktitle":"Proceedings of the 23<sup>rd</sup> International Conference on Software Maintenance (ICSM)","year":"2007","month":"October","editor":[{"firstnames":["Ladan"],"propositions":[],"lastnames":["Tahvildari"],"suffixes":[]},{"firstnames":["Gerardo"],"propositions":[],"lastnames":["Canfora"],"suffixes":[]}],"publisher":"IEEE CS Press","note":"10 pages.","abstract":"Identifiers represent an important source of information for programmers understanding and maintaining a system. Self-documenting identifiers reduce the time and effort necessary to obtain the level of understanding appropriate for the task at hand. While the role of the lexicon in program comprehension has long been recognized, only a few works have studied the quality and enhancement of the identifiers and no works have studied the evolution of the lexicon. In this paper, we characterize the evolution of program identifiers in terms of stability metrics and occurrences of renaming. 
We assess whether an evolution process similar to the one occurring for the program structure exists for identifiers. We report data and results about the evolution of three large systems, for which several releases are available. We have found evidence that the evolution of the lexicon is more limited and constrained than the evolution of the structure. We argue that the different evolution results from several factors including the lack of advanced tool support for lexicon construction, documentation, and evolution. Finally, we suggest the existence of rules on the co-evolution of structure and lexicon of software systems.","grant":"NSERC DG","keywords":"Identifier analysis ; ICSM","kind":"MISA","language":"english","url":"http://www.ptidej.net/publications/documents/ICSM07.doc.pdf","pdf":"http://www.ptidej.net/publications/documents/ICSM07.ppt.pdf","pages":"14–23","bibtex":"@INPROCEEDINGS{Antoniol07-ICSM-LexiconEvolution,\n author = {Giuliano Antoniol and Yann-Ga{\\\"e}l Gu{\\'e}h{\\'e}neuc and Ettore Merlo and Paolo Tonella},\n title = {Mining the Lexicon Used by Programmers during Software Evolution},\n booktitle = {Proceedings of the 23<sup>{rd}</sup> International Conference on Software Maintenance ({ICSM})},\n year = {2007},\n month = {October},\n editor = {Ladan Tahvildari and Gerardo Canfora},\n publisher = {IEEE CS Press},\n note = {10 pages.},\n abstract = {Identifiers represent an important source of information for programmers understanding and maintaining a system. Self-documenting identifiers reduce the time and effort necessary to obtain the level of understanding appropriate for the task at hand. While the role of the lexicon in program comprehension has long been recognized, only a few works have studied the quality and enhancement of the identifiers and no works have studied the evolution of the lexicon. In this paper, we characterize the evolution of program identifiers in terms of stability metrics and occurrences of renaming. 
We assess whether an evolution process similar to the one occurring for the program structure exists for identifiers. We report data and results about the evolution of three large systems, for which several releases are available. We have found evidence that the evolution of the lexicon is more limited and constrained than the evolution of the structure. We argue that the different evolution results from several factors including the lack of advanced tool support for lexicon construction, documentation, and evolution. Finally, we suggest the existence of rules on the co-evolution of structure and lexicon of software systems.},\n grant = {NSERC DG},\n keywords = {Identifier analysis ; ICSM},\n kind = {MISA},\n language = {english},\n url = {http://www.ptidej.net/publications/documents/ICSM07.doc.pdf},\n pdf = {http://www.ptidej.net/publications/documents/ICSM07.ppt.pdf},\n pages = {14--23}\n}\n\n","author_short":["Antoniol, G.","Guéhéneuc, Y.","Merlo, E.","Tonella, P."],"editor_short":["Tahvildari, L.","Canfora, G."],"key":"Antoniol07-ICSM-LexiconEvolution","id":"Antoniol07-ICSM-LexiconEvolution","bibbaseid":"antoniol-guhneuc-merlo-tonella-miningthelexiconusedbyprogrammersduringsoftwareevolution-2007","role":"author","urls":{"Paper":"http://www.ptidej.net/publications/documents/ICSM07.doc.pdf"},"keyword":["Identifier analysis ; ICSM"],"metadata":{"authorlinks":{"gu�h�neuc, y":"https://bibbase.org/show?bib=http%3A%2F%2Fwww.yann-gael.gueheneuc.net%2FWork%2FPublications%2FBiblio%2Fcomplete-bibliography.bib&msg=embed","guéhéneuc, y":"https://bibbase.org/show?bib=http://www.yann-gael.gueheneuc.net/Work/BibBase/guehene%20(automatically%20cleaned).bib"}},"downloads":0,"html":""},"search_terms":["mining","lexicon","used","programmers","during","software","evolution","antoniol","guéhéneuc","merlo","tonella"],"keywords":["identifier analysis ; icsm"],"authorIDs":["AfJhKcg96muyPdu7S","xkviMnkrGBneANvMr"],"dataSources":["Sed98LbBeGaXxenrM","8vn5MSGYWB4fAx9Z4"]}