Cloud-Based Name Disambiguation Algorithm. Juan, Y., Hua, H., & Bin, W. 2010 International Conference of Information Science and Management Engineering, 2:155-158, Ieee, 2010.
Cloud-Based Name Disambiguation Algorithm [link]Website  abstract   bibtex   
In Scientific Collaboration Networks, the phenomenon that one author name corresponds to many author entities is very common. Traditional algorithms for name disambiguation performed inefficiently in dealing with massive data. This paper presents a parallel algorithm for solving the name disambiguation problem: first merge authors with same names and similar author information, then divide the scientific collaboration networks into author communities, authors with same name in one community is supposed as one entity with great possibility. The algorithm is based on the Cloud-Computing platform, and has the ability to deal with massive data. In our experiment, the algorithm efficiently processed massive data and achieved an average f-score of 0.93.
@article{
 title = {Cloud-Based Name Disambiguation Algorithm},
 type = {article},
 year = {2010},
 identifiers = {[object Object]},
 keywords = {cloud computing,community detection,similarity},
 pages = {155-158},
 volume = {2},
 websites = {http://ieeexplore.ieee.org/lpdocs/epic03/wrapper.htm?arnumber=5573917},
 publisher = {Ieee},
 id = {4c25e483-a465-3363-81bd-6ff3ffdf812f},
 created = {2012-02-28T00:51:15.000Z},
 file_attached = {false},
 profile_id = {5284e6aa-156c-3ce5-bc0e-b80cf09f3ef6},
 group_id = {066b42c8-f712-3fc3-abb2-225c158d2704},
 last_modified = {2017-03-14T14:36:19.698Z},
 tags = {personal name disambiguation},
 read = {false},
 starred = {false},
 authored = {false},
 confirmed = {true},
 hidden = {false},
 citation_key = {Juan2010},
 private_publication = {false},
 abstract = {In Scientific Collaboration Networks, the phenomenon that one author name corresponds to many author entities is very common. Traditional algorithms for name disambiguation performed inefficiently in dealing with massive data. This paper presents a parallel algorithm for solving the name disambiguation problem: first merge authors with same names and similar author information, then divide the scientific collaboration networks into author communities, authors with same name in one community is supposed as one entity with great possibility. The algorithm is based on the Cloud-Computing platform, and has the ability to deal with massive data. In our experiment, the algorithm efficiently processed massive data and achieved an average f-score of 0.93.},
 bibtype = {article},
 author = {Juan, Yang and Hua, He and Bin, Wu},
 journal = {2010 International Conference of Information Science and Management Engineering}
}

Downloads: 0