A comparison of sampling techniques for web graph characterization. Becchetti, L., Castillo, C., & Donato, D. In LinkKDD, PA, USA, 2006. Paper abstract bibtex We present a detailed statistical analysis of the characteristics of partial Web graphs obtained by sub-sampling a large collection of Web pages. We show that in general the macroscopic properties of the Web are better represented by a shallow exploration of a large number of sites than by a deep exploration of a limited set of sites. We also describe and quantify the bias induced by the different sampling strategies, and show that it can be significant even if the sample covers a large fraction of the collection.
@comment{Becchetti2006: workshop paper. The `url` field holds a single primary PDF link; further links to the same paper are kept in the `alt-url-*` fields, which are not standard fields and are ignored by bibliography styles.}
@inproceedings{Becchetti2006,
  author        = {Becchetti, Luca and Castillo, Carlos and Donato, D.},
  title         = {A Comparison of Sampling Techniques for {Web} Graph Characterization},
  booktitle     = {LinkKDD},
  address       = {PA, USA},
  year          = {2006},
  url           = {http://ailab.ijs.si/dunja/LinkKDD2006/Papers/becchetti.pdf},
  alt-url-1     = {http://www.chato.cl/papers/donato_2006_comparing_sampling_techniques.pdf},
  alt-url-2     = {http://ailab.ijs.si/dunja/linkkdd2006/Papers/becchetti.pdf},
  alt-url-3     = {http://academic.research.microsoft.com/Publication/4568540/a-comparison-of-sampling-techniques-for-web-graph-characterization},
  abstract      = {We present a detailed statistical analysis of the characteristics of partial Web graphs obtained by sub-sampling a large collection of Web pages. We show that in general the macroscopic properties of the Web are better represented by a shallow exploration of a large number of sites than by a deep exploration of a limited set of sites. We also describe and quantify the bias induced by the different sampling strategies, and show that it can be significant even if the sample covers a large fraction of the collection.},
  keywords      = {BFS bias,sampling techniques,web,www},
  mendeley-tags = {BFS bias,sampling techniques,web,www},
  file          = {references/AComparisonOfSamplingTechniquesForWebGraphCharacterization.pdf},
}
Downloads: 0
{"_id":{"_str":"52b6131d9eb585cc260047db"},"__v":0,"authorIDs":[],"author_short":["Becchetti, L.","Castillo, C.","Donato, D."],"bibbaseid":"becchetti-castillo-donato-comparisonofsamplingtechniquesforwebgraphcharacterization-2006","bibdata":{"html":"<div class=\"bibbase_paper\"> \n\n\n<span class=\"bibbase_paper_titleauthoryear\">\n\t<span class=\"bibbase_paper_title\"><a name=\"Becchetti2006\"> </a>comparison of sampling techniques for web graph characterization.</span>\n\t<span class=\"bibbase_paper_author\">\n<a class=\"bibbase author link\" href=\"http://www.bibbase.org/show?bib=http%3A%2F%2Fwww.utdallas.edu%2F%7Eemrah.cem%2Frefs.bib&msg=embed\">Becchetti, L.</a>; Castillo, C.; and Donato, D.</span>\n\t<!-- <span class=\"bibbase_paper_year\">2006</span>. -->\n</span>\n\n\n\nIn\n<i>LinkKDD</i>, PA, USA, 2006.\n\n\n\n\n\n<br class=\"bibbase_paper_content\"/>\n\n<span class=\"bibbase_paper_content\">\n \n \n <!-- <i -->\n <!-- onclick=\"javascript:log_download('becchetti-castillo-donato-comparisonofsamplingtechniquesforwebgraphcharacterization-2006', 'http://ailab.ijs.si/dunja/LinkKDD2006/Papers/becchetti.pdf http://www.chato.cl/papers/donato_2006_comparing_sampling_techniques.pdf http://ailab.ijs.si/dunja/linkkdd2006/Papers/becchetti.pdf http://academic.research.microsoft.com/Publication/4568540/a-comparison-of-sampling-techniques-for-web-graph-characterization')\">DEBUG -->\n <!-- </i> -->\n\n <a href=\"http://ailab.ijs.si/dunja/LinkKDD2006/Papers/becchetti.pdf http://www.chato.cl/papers/donato_2006_comparing_sampling_techniques.pdf http://ailab.ijs.si/dunja/linkkdd2006/Papers/becchetti.pdf http://academic.research.microsoft.com/Publication/4568540/a-comparison-of-sampling-techniques-for-web-graph-characterization\"\n onclick=\"javascript:log_download('becchetti-castillo-donato-comparisonofsamplingtechniquesforwebgraphcharacterization-2006', 'http://ailab.ijs.si/dunja/LinkKDD2006/Papers/becchetti.pdf 
http://www.chato.cl/papers/donato_2006_comparing_sampling_techniques.pdf http://ailab.ijs.si/dunja/linkkdd2006/Papers/becchetti.pdf http://academic.research.microsoft.com/Publication/4568540/a-comparison-of-sampling-techniques-for-web-graph-characterization')\">\n <img src=\"http://www.bibbase.org/img/filetypes/blank.png\"\n\t alt=\"comparison of sampling techniques for web graph characterization [.com/Publication/4568540/a-comparison-of-sampling-techniques-for-web-graph-characterization]\" \n\t class=\"bibbase_icon\"\n\t style=\"width: 24px; height: 24px; border: 0px; vertical-align: text-top\" ><span class=\"bibbase_icon_text\">Paper</span></a> \n \n \n \n <a href=\"javascript:showBib('Becchetti2006')\"\n class=\"bibbase link\">\n <!-- <img src=\"http://www.bibbase.org/img/filetypes/bib.png\" -->\n\t<!-- alt=\"comparison of sampling techniques for web graph characterization [bib]\" -->\n\t<!-- class=\"bibbase_icon\" -->\n\t<!-- style=\"width: 24px; height: 24px; border: 0px; vertical-align: text-top\"><span class=\"bibbase_icon_text\">Bibtex</span> -->\n BibTeX\n <i class=\"fa fa-caret-down\"></i></a>\n \n \n \n <a class=\"bibbase_abstract_link bibbase link\"\n href=\"javascript:showAbstract('Becchetti2006')\">\n Abstract\n <i class=\"fa fa-caret-down\"></i></a>\n \n \n \n\n \n \n \n</span>\n\n<div class=\"well well-small bibbase\" id=\"bib_Becchetti2006\"\n style=\"display:none\">\n <pre>@inproceedings{ Becchetti2006,\n abstract = {We present a detailed statistical analysis of the characteris- tics of partial Web graphs obtained by sub-sampling a large collection of Web pages. We show that in general the macroscopic properties of the Web are better represented by a shallow exploration of a large number of sites than by a deep exploration of a limited set of sites. 
We also describe and quantify the bias induced by the different sampling strategies, and show that it can be significant even if the sample covers a large fraction of the collection.},\n address = {PA, USA},\n author = {Becchetti, Luca and Castillo, Carlos and Donato, D},\n booktitle = {LinkKDD},\n file = {references/AComparisonOfSamplingTechniquesForWebGraphCharacterization.pdf},\n keywords = {BFS bias,sampling techniques,web,www},\n mendeley-tags = {BFS bias,sampling techniques,web,www},\n title = {{comparison of sampling techniques for web graph characterization}},\n url = {http://ailab.ijs.si/dunja/LinkKDD2006/Papers/becchetti.pdf http://www.chato.cl/papers/donato_2006_comparing_sampling_techniques.pdf http://ailab.ijs.si/dunja/linkkdd2006/Papers/becchetti.pdf http://academic.research.microsoft.com/Publication/4568540/a-comparison-of-sampling-techniques-for-web-graph-characterization},\n year = {2006}\n}</pre>\n</div>\n\n\n<div class=\"well well-small bibbase\" id=\"abstract_Becchetti2006\"\n style=\"display:none\">\n We present a detailed statistical analysis of the characteris- tics of partial Web graphs obtained by sub-sampling a large collection of Web pages. We show that in general the macroscopic properties of the Web are better represented by a shallow exploration of a large number of sites than by a deep exploration of a limited set of sites. 
We also describe and quantify the bias induced by the different sampling strategies, and show that it can be significant even if the sample covers a large fraction of the collection.\n</div>\n\n\n</div>\n","downloads":0,"keyword":["BFS bias","sampling techniques","web","www"],"bibbaseid":"becchetti-castillo-donato-comparisonofsamplingtechniquesforwebgraphcharacterization-2006","urls":{"Paper":"http://ailab.ijs.si/dunja/LinkKDD2006/Papers/becchetti.pdf http://www.chato.cl/papers/donato_2006_comparing_sampling_techniques.pdf http://ailab.ijs.si/dunja/linkkdd2006/Papers/becchetti.pdf http://academic.research.microsoft.com/Publication/4568540/a-comparison-of-sampling-techniques-for-web-graph-characterization"},"role":"author","abstract":"We present a detailed statistical analysis of the characteris- tics of partial Web graphs obtained by sub-sampling a large collection of Web pages. We show that in general the macroscopic properties of the Web are better represented by a shallow exploration of a large number of sites than by a deep exploration of a limited set of sites. We also describe and quantify the bias induced by the different sampling strategies, and show that it can be significant even if the sample covers a large fraction of the collection.","address":"PA, USA","author":["Becchetti, Luca","Castillo, Carlos","Donato, D"],"author_short":["Becchetti, L.","Castillo, C.","Donato, D."],"bibtex":"@inproceedings{ Becchetti2006,\n abstract = {We present a detailed statistical analysis of the characteris- tics of partial Web graphs obtained by sub-sampling a large collection of Web pages. We show that in general the macroscopic properties of the Web are better represented by a shallow exploration of a large number of sites than by a deep exploration of a limited set of sites. 
We also describe and quantify the bias induced by the different sampling strategies, and show that it can be significant even if the sample covers a large fraction of the collection.},\n address = {PA, USA},\n author = {Becchetti, Luca and Castillo, Carlos and Donato, D},\n booktitle = {LinkKDD},\n file = {references/AComparisonOfSamplingTechniquesForWebGraphCharacterization.pdf},\n keywords = {BFS bias,sampling techniques,web,www},\n mendeley-tags = {BFS bias,sampling techniques,web,www},\n title = {{comparison of sampling techniques for web graph characterization}},\n url = {http://ailab.ijs.si/dunja/LinkKDD2006/Papers/becchetti.pdf http://www.chato.cl/papers/donato_2006_comparing_sampling_techniques.pdf http://ailab.ijs.si/dunja/linkkdd2006/Papers/becchetti.pdf http://academic.research.microsoft.com/Publication/4568540/a-comparison-of-sampling-techniques-for-web-graph-characterization},\n year = {2006}\n}","bibtype":"inproceedings","booktitle":"LinkKDD","file":"references/AComparisonOfSamplingTechniquesForWebGraphCharacterization.pdf","id":"Becchetti2006","key":"Becchetti2006","keywords":"BFS bias,sampling techniques,web,www","mendeley-tags":"BFS bias,sampling techniques,web,www","title":"comparison of sampling techniques for web graph characterization","type":"inproceedings","url":"http://ailab.ijs.si/dunja/LinkKDD2006/Papers/becchetti.pdf http://www.chato.cl/papers/donato_2006_comparing_sampling_techniques.pdf http://ailab.ijs.si/dunja/linkkdd2006/Papers/becchetti.pdf http://academic.research.microsoft.com/Publication/4568540/a-comparison-of-sampling-techniques-for-web-graph-characterization","year":"2006"},"bibtype":"inproceedings","biburl":"http://www.utdallas.edu/~emrah.cem/refs.bib","downloads":0,"search_terms":["comparison","sampling","techniques","web","graph","characterization","becchetti","castillo","donato"],"title":"comparison of sampling techniques for web graph characterization","year":2006,"dataSources":["EFHELostezG97KaGW"]}