Cross-Language Source Code Plagiarism Detection using Explicit Semantic Analysis and Scored Greedy String Tilling. Foltýnek, T., Vsiansky, R., Meuschke, N., Dlabolova, D., & Gipp, B. In Proceedings of the ACM/IEEE Joint Conference on Digital Libraries (JCDL), Virtual Event, August, 2020. Venue Rating: CORE A*. Links: Paper, doi, abstract, bibtex. Abstract: We present a method for source code plagiarism detection that is independent of the programming language. Our method EsaGst combines Explicit Semantic Analysis and Greedy String Tiling. Using 25 cases of source code plagiarism in C++, Java, JavaScript, PHP, and Python, we show that EsaGst outperforms a baseline method in identifying plagiarism across programming languages.
@inproceedings{FoltynekVMD20,
address = {Virtual Event},
title = {Cross-{Language} {Source} {Code} {Plagiarism} {Detection} using {Explicit} {Semantic} {Analysis} and {Scored} {Greedy} {String} {Tilling}},
url = {https://www.gipp.com/wp-content/papercite-data/pdf/foltynek2020a.pdf},
doi = {10.1145/3383583.3398594},
abstract = {We present a method for source code plagiarism detection that is independent of the programming language. Our method EsaGst combines Explicit Semantic Analysis and Greedy String Tiling. Using 25 cases of source code plagiarism in C++, Java, JavaScript, PHP, and Python, we show that EsaGst outperforms a baseline method in identifying plagiarism across programming languages.},
booktitle = {Proceedings of the {ACM}/{IEEE} {Joint} {Conference} on {Digital} {Libraries} ({JCDL})},
author = {Foltýnek, Tomáš and Vsiansky, Richard and Meuschke, Norman and Dlabolova, Dita and Gipp, Bela},
month = aug,
year = {2020},
note = {Venue Rating: CORE A*},
keywords = {Plagiarism Detection},
}
Downloads: 0
{"_id":"YGnp7s885bTuJYNcv","bibbaseid":"foltnek-vsiansky-meuschke-dlabolova-gipp-crosslanguagesourcecodeplagiarismdetectionusingexplicitsemanticanalysisandscoredgreedystringtilling-2020","author_short":["Foltýnek, T.","Vsiansky, R.","Meuschke, N.","Dlabolova, D.","Gipp, B."],"bibdata":{"bibtype":"inproceedings","type":"inproceedings","address":"Virtual Event","title":"Cross-Language Source Code Plagiarism Detection using Explicit Semantic Analysis and Scored Greedy String Tilling","url":"https://www.gipp.com/wp-content/papercite-data/pdf/foltynek2020a.pdf","doi":"10.1145/3383583.3398594","abstract":"We present a method for source code plagiarism detection that is independent of the programming language. Our method EsaGst combines Explicit Semantic Analysis and Greedy String Tiling. Using 25 cases of source code plagiarism in C++, Java, JavaScript, PHP, and Python, we show that EsaGst outperforms a baseline method in identifying plagiarism across programming languages.","booktitle":"Proceedings of the ACM/IEEE Joint Conference on Digital Libraries (JCDL)","author":[{"propositions":[],"lastnames":["Foltýnek"],"firstnames":["Tomáš"],"suffixes":[]},{"propositions":[],"lastnames":["Vsiansky"],"firstnames":["Richard"],"suffixes":[]},{"propositions":[],"lastnames":["Meuschke"],"firstnames":["Norman"],"suffixes":[]},{"propositions":[],"lastnames":["Dlabolova"],"firstnames":["Dita"],"suffixes":[]},{"propositions":[],"lastnames":["Gipp"],"firstnames":["Bela"],"suffixes":[]}],"month":"August","year":"2020","note":"Venue Rating: CORE A*","keywords":"Plagiarism Detection","bibtex":"@inproceedings{FoltynekVMD20,\n\taddress = {Virtual Event},\n\ttitle = {Cross-{Language} {Source} {Code} {Plagiarism} {Detection} using {Explicit} {Semantic} {Analysis} and {Scored} {Greedy} {String} {Tilling}},\n\turl = {https://www.gipp.com/wp-content/papercite-data/pdf/foltynek2020a.pdf},\n\tdoi = {10.1145/3383583.3398594},\n\tabstract = {We present a method for source code plagiarism detection that is independent of the programming language. Our method EsaGst combines Explicit Semantic Analysis and Greedy String Tiling. Using 25 cases of source code plagiarism in C++, Java, JavaScript, PHP, and Python, we show that EsaGst outperforms a baseline method in identifying plagiarism across programming languages.},\n\tbooktitle = {Proceedings of the {ACM}/{IEEE} {Joint} {Conference} on {Digital} {Libraries} ({JCDL})},\n\tauthor = {Foltýnek, Tomáš and Vsiansky, Richard and Meuschke, Norman and Dlabolova, Dita and Gipp, Bela},\n\tmonth = aug,\n\tyear = {2020},\n\tnote = {Venue Rating: CORE A*},\n\tkeywords = {Plagiarism Detection},\n}\n\n","author_short":["Foltýnek, T.","Vsiansky, R.","Meuschke, N.","Dlabolova, D.","Gipp, B."],"key":"FoltynekVMD20","id":"FoltynekVMD20","bibbaseid":"foltnek-vsiansky-meuschke-dlabolova-gipp-crosslanguagesourcecodeplagiarismdetectionusingexplicitsemanticanalysisandscoredgreedystringtilling-2020","role":"author","urls":{"Paper":"https://www.gipp.com/wp-content/papercite-data/pdf/foltynek2020a.pdf"},"keyword":["Plagiarism Detection"],"metadata":{"authorlinks":{}}},"bibtype":"inproceedings","biburl":"https://api.zotero.org/groups/2532143/items?key=DOjJ33bOgISaFjBIBr7jCV5S&format=bibtex&limit=100","dataSources":["bQwdfx3o8Q3vnsqfH","SzFkcrpurPzNHEyqX","6KJgnNtYZiwwFkcGq","dHLtmS5G7GmooD755","EvZZTzAZvA3EsuMjm"],"keywords":["plagiarism detection"],"search_terms":["cross","language","source","code","plagiarism","detection","using","explicit","semantic","analysis","scored","greedy","string","tilling","foltýnek","vsiansky","meuschke","dlabolova","gipp"],"title":"Cross-Language Source Code Plagiarism Detection using Explicit Semantic Analysis and Scored Greedy String Tilling","year":2020}