More Effective Boilerplate Removal - the GoldMiner Algorithm. Endrédy, I. & Novák, A. Polibits - Research journal on Computer science and computer engineering with applications, 2013. Paper bibtex @article{endredy_more_2013,
title = {More {Effective} {Boilerplate} {Removal} - the {GoldMiner} {Algorithm}},
issn = {1870-9044},
url = {http://polibits.gelbukh.com/2013_48},
language = {eng},
number = {48},
journal = {Polibits - Research journal on Computer science and computer engineering with applications},
author = {Endrédy, István and Novák, Attila},
year = {2013},
keywords = {Corpus building, boilerplate removal, the web as corpus},
pages = {79--83},
}
Downloads: 0
{"_id":"svd3a3xWSfRuxoo3t","bibbaseid":"endrdy-novk-moreeffectiveboilerplateremovalthegoldmineralgorithm-2013","author_short":["Endrédy, I.","Novák, A."],"bibdata":{"bibtype":"article","type":"article","title":"More Effective Boilerplate Removal - the GoldMiner Algorithm","issn":"1870-9044","url":"http://polibits.gelbukh.com/2013_48","language":"eng","number":"48","journal":"Polibits - Research journal on Computer science and computer engineering with applications","author":[{"propositions":[],"lastnames":["Endrédy"],"firstnames":["István"],"suffixes":[]},{"propositions":[],"lastnames":["Novák"],"firstnames":["Attila"],"suffixes":[]}],"year":"2013","keywords":"Corpus building, boilerplate removal, the web as corpus","pages":"79–83","bibtex":"@article{endredy_more_2013,\n\ttitle = {More {Effective} {Boilerplate} {Removal} - the {GoldMiner} {Algorithm}},\n\tissn = {1870-9044},\n\turl = {http://polibits.gelbukh.com/2013_48},\n\tlanguage = {eng},\n\tnumber = {48},\n\tjournal = {Polibits - Research journal on Computer science and computer engineering with applications},\n\tauthor = {Endrédy, István and Novák, Attila},\n\tyear = {2013},\n\tkeywords = {Corpus building, boilerplate removal, the web as corpus},\n\tpages = {79--83},\n}\n\n","author_short":["Endrédy, I.","Novák, A."],"key":"endredy_more_2013","id":"endredy_more_2013","bibbaseid":"endrdy-novk-moreeffectiveboilerplateremovalthegoldmineralgorithm-2013","role":"author","urls":{"Paper":"http://polibits.gelbukh.com/2013_48"},"keyword":["Corpus building","boilerplate removal","the web as corpus"],"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"https://api.zotero.org/groups/2532329/items?key=3gRHj8hfOfGJBww9EhlzpL4j&format=bibtex&limit=100","dataSources":["72w8hmKFm76DkeXyN","fQ66AuPM43rBsaruw"],"keywords":["corpus building","boilerplate removal","the web as corpus"],"search_terms":["more","effective","boilerplate","removal","goldminer","algorithm","endrédy","novák"],"title":"More Effective Boilerplate Removal - the GoldMiner Algorithm","year":2013}