Determining if two documents are written by the same author. Koppel, M. & Winter, Y. Journal of the Association for Information Science and Technology, 65(1):178–187, 2014. _eprint: https://onlinelibrary.wiley.com/doi/pdf/10.1002/asi.22954 Paper doi abstract bibtex Almost any conceivable authorship attribution problem can be reduced to one fundamental problem: whether a pair of (possibly short) documents were written by the same author. In this article, we offer an (almost) unsupervised method for solving this problem with surprisingly high accuracy. The main idea is to use repeated feature subsampling methods to determine if one document of the pair allows us to select the other from among a background set of “impostors” in a sufficiently robust manner.
@article{koppel_determining_2014,
title = {Determining if two documents are written by the same author},
volume = {65},
issn = {2330-1643},
url = {https://onlinelibrary.wiley.com/doi/abs/10.1002/asi.22954},
doi = {10.1002/asi.22954},
abstract = {Almost any conceivable authorship attribution problem can be reduced to one fundamental problem: whether a pair of (possibly short) documents were written by the same author. In this article, we offer an (almost) unsupervised method for solving this problem with surprisingly high accuracy. The main idea is to use repeated feature subsampling methods to determine if one document of the pair allows us to select the other from among a background set of “impostors” in a sufficiently robust manner.},
language = {en},
number = {1},
urldate = {2023-07-23},
journal = {Journal of the Association for Information Science and Technology},
author = {Koppel, Moshe and Winter, Yaron},
year = {2014},
note = {\_eprint: https://onlinelibrary.wiley.com/doi/pdf/10.1002/asi.22954},
keywords = {automatic classification, machine learning, natural language processing},
pages = {178--187},
}
Downloads: 0
{"_id":"E9hRMiFaK2nu2ssZe","bibbaseid":"koppel-winter-determiningiftwodocumentsarewrittenbythesameauthor-2014","author_short":["Koppel, M.","Winter, Y."],"bibdata":{"bibtype":"article","type":"article","title":"Determining if two documents are written by the same author","volume":"65","issn":"2330-1643","url":"https://onlinelibrary.wiley.com/doi/abs/10.1002/asi.22954","doi":"10.1002/asi.22954","abstract":"Almost any conceivable authorship attribution problem can be reduced to one fundamental problem: whether a pair of (possibly short) documents were written by the same author. In this article, we offer an (almost) unsupervised method for solving this problem with surprisingly high accuracy. The main idea is to use repeated feature subsampling methods to determine if one document of the pair allows us to select the other from among a background set of “impostors” in a sufficiently robust manner.","language":"en","number":"1","urldate":"2023-07-23","journal":"Journal of the Association for Information Science and Technology","author":[{"propositions":[],"lastnames":["Koppel"],"firstnames":["Moshe"],"suffixes":[]},{"propositions":[],"lastnames":["Winter"],"firstnames":["Yaron"],"suffixes":[]}],"year":"2014","note":"_eprint: https://onlinelibrary.wiley.com/doi/pdf/10.1002/asi.22954","keywords":"automatic classification, machine learning, natural language processing","pages":"178–187","bibtex":"@article{koppel_determining_2014,\n\ttitle = {Determining if two documents are written by the same author},\n\tvolume = {65},\n\tissn = {2330-1643},\n\turl = {https://onlinelibrary.wiley.com/doi/abs/10.1002/asi.22954},\n\tdoi = {10.1002/asi.22954},\n\tabstract = {Almost any conceivable authorship attribution problem can be reduced to one fundamental problem: whether a pair of (possibly short) documents were written by the same author. In this article, we offer an (almost) unsupervised method for solving this problem with surprisingly high accuracy. The main idea is to use repeated feature subsampling methods to determine if one document of the pair allows us to select the other from among a background set of “impostors” in a sufficiently robust manner.},\n\tlanguage = {en},\n\tnumber = {1},\n\turldate = {2023-07-23},\n\tjournal = {Journal of the Association for Information Science and Technology},\n\tauthor = {Koppel, Moshe and Winter, Yaron},\n\tyear = {2014},\n\tnote = {\\_eprint: https://onlinelibrary.wiley.com/doi/pdf/10.1002/asi.22954},\n\tkeywords = {automatic classification, machine learning, natural language processing},\n\tpages = {178--187},\n}\n\n\n\n","author_short":["Koppel, M.","Winter, Y."],"key":"koppel_determining_2014","id":"koppel_determining_2014","bibbaseid":"koppel-winter-determiningiftwodocumentsarewrittenbythesameauthor-2014","role":"author","urls":{"Paper":"https://onlinelibrary.wiley.com/doi/abs/10.1002/asi.22954"},"keyword":["automatic classification","machine learning","natural language processing"],"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"https://bibbase.org/zotero-group/schulzkx/5158478","dataSources":["JFDnASMkoQCjjGL8E"],"keywords":["automatic classification","machine learning","natural language processing"],"search_terms":["determining","two","documents","written","same","author","koppel","winter"],"title":"Determining if two documents are written by the same author","year":2014}