Ranking web sites with real user traffic. Meiss, M. R., Menczer, F., Fortunato, S., Flammini, A., & Vespignani, A. In WSDM'08 - Proceedings of the 2008 International Conference on Web Search and Data Mining, pages 65-75, 2008.
Ranking web sites with real user traffic [link]Website  doi  abstract   bibtex   
We analyze the traffic-weighted Web host graph obtained from a large sample of real Web users over about seven months. A number of interesting structural properties are revealed by this complex dynamic network, some in line with the well-studied boolean link host graph and others pointing to important differences. We find that while search is directly involved in a surprisingly small fraction of user clicks, it leads to a much larger fraction of all sites visited. The temporal traffic patterns display strong regularities, with a large portion of future requests being statistically predictable by past ones. Given the importance of topological measures such as PageRank in modeling user navigation, as well as their role in ranking sites for Web search, we use the traffic data to validate the PageRank random surfing model. The ranking obtained by the actual frequency with which a site is visited by users differs significantly from that approximated by the uniform surfing/teleportation behavior modeled by PageRank, especially for the most important sites. To interpret this finding, we consider each of the fundamental assumptions underlying PageRank and show how each is violated by actual user behavior. © 2008 ACM.
@comment{Conference paper from WSDM 2008. The entry key mirrors the value of
 the citation_key field. Fields such as id, profile_id, folder_uuids, read,
 starred and hidden appear to be reference-manager bookkeeping; standard
 bibliography styles ignore unknown fields.}
@inproceedings{Meiss200865,
 title = {Ranking web sites with real user traffic},
 type = {inproceedings},
 year = {2008},
 keywords = {Boolean algebra; Graph theory; Statistical methods,Pagerank; Teleportation; Web traffic; Weighted ho,Websites},
 pages = {65--75},
 websites = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-42549123260&doi=10.1145%2F1341531.1341543&partnerID=40&md5=d340fd1de6e1e5c5a87fc9a7f9c6164f},
 city = {Palo Alto, CA},
 id = {5c446a95-0187-3529-9db4-5d20162b4e05},
 created = {2018-01-16T17:54:28.389Z},
 file_attached = {false},
 profile_id = {42d295c0-0737-38d6-8b43-508cab6ea85d},
 last_modified = {2018-03-12T19:03:19.297Z},
 read = {false},
 starred = {false},
 authored = {true},
 confirmed = {true},
 hidden = {false},
 citation_key = {Meiss200865},
 source_type = {conference},
 notes = {cited By 51; Conference of 2008 International Conference on Web Search and Data Mining, WSDM 2008 ; Conference Date: 11 February 2008 Through 12 February 2008; Conference Code:71934},
 folder_uuids = {971e10ae-b1f7-4c4b-8f99-aa55f77a64f6},
 private_publication = {false},
 abstract = {We analyze the traffic-weighted Web host graph obtained from a large sample of real Web users over about seven months. A number of interesting structural properties are revealed by this complex dynamic network, some in line with the well-studied boolean link host graph and others pointing to important differences. We find that while search is directly involved in a surprisingly small fraction of user clicks, it leads to a much larger fraction of all sites visited. The temporal traffic patterns display strong regularities, with a large portion of future requests being statistically predictable by past ones. Given the importance of topological measures such as PageRank in modeling user navigation, as well as their role in ranking sites for Web search, we use the traffic data to validate the PageRank random surfing model. The ranking obtained by the actual frequency with which a site is visited by users differs significantly from that approximated by the uniform surfing/teleportation behavior modeled by PageRank, especially for the most important sites. To interpret this finding, we consider each of the fundamental assumptions underlying PageRank and show how each is violated by actual user behavior. © 2008 ACM.},
 bibtype = {inproceedings},
 author = {Meiss, M R and Menczer, F and Fortunato, S and Flammini, A and Vespignani, A},
 doi = {10.1145/1341531.1341543},
 booktitle = {{WSDM}'08 - Proceedings of the 2008 International Conference on Web Search and Data Mining}
}

Downloads: 0