\n \n \n
\n
\n \n 2023\n \n \n (3)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n Semantics-aware Dataset Discovery from Data Lakes with Contextualized Column-based Representation Learning.\n \n \n \n\n\n \n Fan, G., Wang, J., Li, Y., Zhang, D., & Miller, R. J.\n\n\n \n\n\n\n
Proc. VLDB Endow., 16(7): 1726–1739. 2023.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pvldb/FanWLZM23,\n  author  = {Grace Fan and\n             Jin Wang and\n             Yuliang Li and\n             Dan Zhang and\n             Ren{\\'{e}}e J. Miller},\n  title   = {Semantics-aware Dataset Discovery from Data Lakes with Contextualized Column-based Representation Learning},\n  journal = {Proc. {VLDB} Endow.},\n  volume  = {16},\n  number  = {7},\n  pages   = {1726--1739},\n  year    = {2023},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n SANTOS: Relationship-based Semantic Table Union Search.\n \n \n \n\n\n \n Khatiwada, A., Fan, G., Shraga, R., Chen, Z., Gatterbauer, W., Miller, R. J., & Riedewald, M.\n\n\n \n\n\n\n In
SIGMOD, 2023. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{santos23,\n\tauthor = {Aamod Khatiwada and\n\tGrace Fan and\n\tRoee Shraga and\n\tZixuan Chen and\n\tWolfgang Gatterbauer and\n\tRen{\\'{e}}e J. Miller and\n\tMirek Riedewald},\n\ttitle = {{SANTOS}: Relationship-based Semantic Table Union Search},\n\tbooktitle = {SIGMOD},\n\tyear = {2023}\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Data Lake Organization.\n \n \n \n\n\n \n Nargesian, F., Pu, K. Q., Bashardoost, B. G., Zhu, E., & Miller, R. J.\n\n\n \n\n\n\n
IEEE Trans. Knowl. Data Eng., 35(1): 237–250. 2023.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/tkde/NargesianPBZM23,\n  author  = {Fatemeh Nargesian and\n             Ken Q. Pu and\n             Bahar Ghadiri Bashardoost and\n             Erkang Zhu and\n             Ren{\\'{e}}e J. Miller},\n  title   = {Data Lake Organization},\n  journal = {{IEEE} Trans. Knowl. Data Eng.},\n  volume  = {35},\n  number  = {1},\n  pages   = {237--250},\n  year    = {2023},\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2022\n \n \n (6)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n Annotating Columns with Pre-trained Language Models.\n \n \n \n\n\n \n Suhara, Y., Li, J., Li, Y., Zhang, D., Demiralp, Ç., Chen, C., & Tan, W.\n\n\n \n\n\n\n In
SIGMOD, pages 1493–1503, 2022. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/sigmod/SuharaL0ZDCT22,\n  author    = {Yoshihiko Suhara and\n               Jinfeng Li and\n               Yuliang Li and\n               Dan Zhang and\n               {\\c{C}}agatay Demiralp and\n               Chen Chen and\n               Wang{-}Chiew Tan},\n  title     = {Annotating Columns with Pre-trained Language Models},\n  booktitle = {SIGMOD},\n  pages     = {1493--1503},\n  year      = {2022},\n}\n
\n
\n\n\n\n
\n\n\n
\n\n\n \n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Integrating Data Lake Tables.\n \n \n \n\n\n \n Khatiwada, A., Shraga, R., Gatterbauer, W., & Miller, R. J.\n\n\n \n\n\n\n
Proc. VLDB Endow., 16(4): 932–945. 2022.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pvldb/KhatiwadaSGM22,\n  author  = {Aamod Khatiwada and\n             Roee Shraga and\n             Wolfgang Gatterbauer and\n             Ren{\\'{e}}e J. Miller},\n  title   = {Integrating Data Lake Tables},\n  journal = {Proc. {VLDB} Endow.},\n  volume  = {16},\n  number  = {4},\n  pages   = {932--945},\n  year    = {2022},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n WarpGate: A Semantic Join Discovery System for Cloud Data Warehouses.\n \n \n \n\n\n \n Cong, T., Gale, J., Frantz, J., Jagadish, H. V., & Demiralp, Ç.\n\n\n \n\n\n\n
CoRR, abs/2212.14155. 2022.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/corr/abs-2212-14155,\n author = {Tianji Cong and\n James Gale and\n Jason Frantz and\n H. V. Jagadish and\n {\\c{C}}agatay Demiralp},\n title = {{WarpGate}: {A} Semantic Join Discovery System for Cloud Data Warehouses},\n journal = {CoRR},\n volume = {abs/2212.14155},\n year = {2022},\n eprinttype = {arXiv},\n eprint = {2212.14155}\n}\n\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2021\n \n \n (9)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n Auctus: A Dataset Search Engine for Data Discovery and Augmentation.\n \n \n \n\n\n \n Castelo, S., Rampin, R., Santos, A. S. R., Bessa, A., Chirigati, F., & Freire, J.\n\n\n \n\n\n\n
Proc. VLDB Endow., 14(12): 2791–2794. 2021.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pvldb/CasteloRSBCF21,\n  author  = {Sonia Castelo and\n             R{\\'{e}}mi Rampin and\n             A{\\'{e}}cio S. R. Santos and\n             Aline Bessa and\n             Fernando Chirigati and\n             Juliana Freire},\n  title   = {Auctus: {A} Dataset Search Engine for Data Discovery and Augmentation},\n  journal = {Proc. {VLDB} Endow.},\n  volume  = {14},\n  number  = {12},\n  pages   = {2791--2794},\n  year    = {2021},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n RONIN: Data Lake Exploration.\n \n \n \n\n\n \n Ouellette, P., Sciortino, A., Nargesian, F., Bashardoost, B. G., Zhu, E., Pu, K., & Miller, R. J.\n\n\n \n\n\n\n
Proc. VLDB Endow., 14(12): 2863–2866. 2021.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pvldb/OuelletteSNBZPM21,\n  author  = {Paul Ouellette and\n             Aidan Sciortino and\n             Fatemeh Nargesian and\n             Bahar Ghadiri Bashardoost and\n             Erkang Zhu and\n             Ken Pu and\n             Ren{\\'{e}}e J. Miller},\n  title   = {{RONIN:} Data Lake Exploration},\n  journal = {Proc. {VLDB} Endow.},\n  volume  = {14},\n  number  = {12},\n  pages   = {2863--2866},\n  year    = {2021},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Efficient Joinable Table Discovery in Data Lakes: A High-Dimensional Similarity-Based Approach.\n \n \n \n\n\n \n Dong, Y., Takeoka, K., Xiao, C., & Oyamada, M.\n\n\n \n\n\n\n In
ICDE, pages 456–467, 2021. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/icde/DongT0O21,\n  author    = {Yuyang Dong and\n               Kunihiro Takeoka and\n               Chuan Xiao and\n               Masafumi Oyamada},\n  title     = {Efficient Joinable Table Discovery in Data Lakes: {A} High-Dimensional Similarity-Based Approach},\n  booktitle = {ICDE},\n  pages     = {456--467},\n  year      = {2021},\n}\n
\n
\n\n\n\n
\n\n\n \n\n\n
\n
\n\n \n \n \n \n \n Valentine: Evaluating Matching Techniques for Dataset Discovery.\n \n \n \n\n\n \n Koutras, C., Siachamis, G., Ionescu, A., Psarakis, K., Brons, J., Fragkoulis, M., Lofi, C., Bonifati, A., & Katsifodimos, A.\n\n\n \n\n\n\n In
ICDE, pages 468–479, 2021. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/icde/KoutrasSIPBFLBK21,\n  author    = {Christos Koutras and\n               George Siachamis and\n               Andra Ionescu and\n               Kyriakos Psarakis and\n               Jerry Brons and\n               Marios Fragkoulis and\n               Christoph Lofi and\n               Angela Bonifati and\n               Asterios Katsifodimos},\n  title     = {Valentine: Evaluating Matching Techniques for Dataset Discovery},\n  booktitle = {ICDE},\n  pages     = {468--479},\n  year      = {2021},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n TCN: Table Convolutional Network for Web Table Interpretation.\n \n \n \n\n\n \n Wang, D., Shiralkar, P., Lockard, C., Huang, B., Dong, X. L., & Jiang, M.\n\n\n \n\n\n\n In
WWW, pages 4020–4032, 2021. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/www/WangSLHDJ21,\n  author    = {Daheng Wang and\n               Prashant Shiralkar and\n               Colin Lockard and\n               Binxuan Huang and\n               Xin Luna Dong and\n               Meng Jiang},\n  title     = {{TCN:} Table Convolutional Network for Web Table Interpretation},\n  booktitle = {WWW},\n  pages     = {4020--4032},\n  year      = {2021},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Knowledge Graphs 2021: A Data Odyssey.\n \n \n \n\n\n \n Weikum, G.\n\n\n \n\n\n\n
Proc. VLDB Endow., 14(12): 3233–3238. 2021.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pvldb/Weikum21,\n  author  = {Gerhard Weikum},\n  title   = {Knowledge Graphs 2021: {A} Data Odyssey},\n  journal = {Proc. {VLDB} Endow.},\n  volume  = {14},\n  number  = {12},\n  pages   = {3233--3238},\n  year    = {2021},\n}\n\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n PLEX: Towards Practical Learned Indexing.\n \n \n \n\n\n \n Stoian, M., Kipf, A., Marcus, R., & Kraska, T.\n\n\n \n\n\n\n
CoRR, abs/2108.05117. 2021.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/corr/abs-2108-05117,\n author = {Mihail Stoian and\n Andreas Kipf and\n Ryan Marcus and\n Tim Kraska},\n title = {{PLEX:} Towards Practical Learned Indexing},\n journal = {CoRR},\n volume = {abs/2108.05117},\n year = {2021},\n eprinttype = {arXiv},\n eprint = {2108.05117}\n}\n\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n DomainNet: Homograph Detection for Data Lake Disambiguation.\n \n \n \n\n\n \n Leventidis, A., Rocco, L. D., Gatterbauer, W., Miller, R. J., & Riedewald, M.\n\n\n \n\n\n\n In
EDBT, pages 13–24, 2021. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/edbt/LeventidisRMRG21,\n author = {Aristotelis Leventidis and\n Laura Di Rocco and\n Wolfgang Gatterbauer and\n Ren{\\'{e}}e J. Miller and\n Mirek Riedewald},\n title = {{DomainNet}: Homograph Detection for Data Lake Disambiguation},\n booktitle = {EDBT},\n pages = {13--24},\n year = {2021}\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2020\n \n \n (11)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n Semantic Search over Structured Data.\n \n \n \n\n\n \n Galhotra, S., & Khurana, U.\n\n\n \n\n\n\n In
CIKM, 2020. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/cikm/GalhotraK20,\n  author    = {Sainyam Galhotra and\n               Udayan Khurana},\n  title     = {Semantic Search over Structured Data},\n  booktitle = {CIKM},\n  year      = {2020},\n}\n\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Dataset search: a survey.\n \n \n \n\n\n \n Chapman, A., Simperl, E., Koesten, L., Konstantinidis, G., Ibáñez, L., Kacprzak, E., & Groth, P.\n\n\n \n\n\n\n
VLDB J., 29(1): 251–272. 2020.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/vldb/ChapmanSKKIKG20,\n  author  = {Adriane Chapman and\n             Elena Simperl and\n             Laura Koesten and\n             George Konstantinidis and\n             Luis{-}Daniel Ib{\\'{a}}{\\~{n}}ez and\n             Emilia Kacprzak and\n             Paul Groth},\n  title   = {Dataset search: a survey},\n  journal = {{VLDB} J.},\n  volume  = {29},\n  number  = {1},\n  pages   = {251--272},\n  year    = {2020},\n}\n
\n
\n\n\n\n
\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Sato: Contextual Semantic Type Detection in Tables.\n \n \n \n\n\n \n Zhang, D., Suhara, Y., Li, J., Hulsebos, M., Demiralp, Ç., & Tan, W.\n\n\n \n\n\n\n
Proc. VLDB Endow., 13(11): 1835–1848. 2020.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pvldb/ZhangSLHDT20,\n  author  = {Dan Zhang and\n             Yoshihiko Suhara and\n             Jinfeng Li and\n             Madelon Hulsebos and\n             {\\c{C}}agatay Demiralp and\n             Wang{-}Chiew Tan},\n  title   = {Sato: Contextual Semantic Type Detection in Tables},\n  journal = {Proc. {VLDB} Endow.},\n  volume  = {13},\n  number  = {11},\n  pages   = {1835--1848},\n  year    = {2020},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Data-Driven Domain Discovery for Structured Datasets.\n \n \n \n\n\n \n Ota, M., Mueller, H., Freire, J., & Srivastava, D.\n\n\n \n\n\n\n
Proc. VLDB Endow., 13(7): 953–965. 2020.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pvldb/OtaMFS20,\n  author  = {Masayo Ota and\n             Heiko Mueller and\n             Juliana Freire and\n             Divesh Srivastava},\n  title   = {Data-Driven Domain Discovery for Structured Datasets},\n  journal = {Proc. {VLDB} Endow.},\n  volume  = {13},\n  number  = {7},\n  pages   = {953--965},\n  year    = {2020},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n TURL: Table Understanding through Representation Learning.\n \n \n \n\n\n \n Deng, X., Sun, H., Lees, A., Wu, Y., & Yu, C.\n\n\n \n\n\n\n
Proc. VLDB Endow., 14(3): 307–319. 2020.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pvldb/DengSL0020,\n  author  = {Xiang Deng and\n             Huan Sun and\n             Alyssa Lees and\n             You Wu and\n             Cong Yu},\n  title   = {{TURL:} Table Understanding through Representation Learning},\n  journal = {Proc. {VLDB} Endow.},\n  volume  = {14},\n  number  = {3},\n  pages   = {307--319},\n  year    = {2020},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Organizing Data Lakes for Navigation.\n \n \n \n\n\n \n Nargesian, F., Pu, K. Q., Zhu, E., Bashardoost, B. G., & Miller, R. J.\n\n\n \n\n\n\n In
SIGMOD, pages 1939–1950, 2020. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n \n \n 9 downloads\n \n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/sigmod/NargesianPZBM20,\n  author    = {Fatemeh Nargesian and\n               Ken Q. Pu and\n               Erkang Zhu and\n               Bahar Ghadiri Bashardoost and\n               Ren{\\'{e}}e J. Miller},\n  title     = {Organizing Data Lakes for Navigation},\n  booktitle = {SIGMOD},\n  pages     = {1939--1950},\n  year      = {2020},\n}\n
\n
\n\n\n\n
\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Creating Embeddings of Heterogeneous Relational Datasets for Data Integration Tasks.\n \n \n \n\n\n \n Cappuzzo, R., Papotti, P., & Thirumuruganathan, S.\n\n\n \n\n\n\n In
SIGMOD, pages 1335–1349, 2020. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/sigmod/CappuzzoPT20,\n  author    = {Riccardo Cappuzzo and\n               Paolo Papotti and\n               Saravanan Thirumuruganathan},\n  title     = {Creating Embeddings of Heterogeneous Relational Datasets for Data Integration Tasks},\n  booktitle = {SIGMOD},\n  pages     = {1335--1349},\n  year      = {2020},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Dataset Discovery in Data Lakes.\n \n \n \n\n\n \n Bogatu, A., Fernandes, A. A. A., Paton, N. W., & Konstantinou, N.\n\n\n \n\n\n\n In
ICDE, pages 709–720, 2020. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/icde/BogatuFP020,\n  author    = {Alex Bogatu and\n               Alvaro A. A. Fernandes and\n               Norman W. Paton and\n               Nikolaos Konstantinou},\n  title     = {Dataset Discovery in Data Lakes},\n  booktitle = {ICDE},\n  pages     = {709--720},\n  year      = {2020},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Efficient and Robust Approximate Nearest Neighbor Search Using Hierarchical Navigable Small World Graphs.\n \n \n \n\n\n \n Malkov, Y. A., & Yashunin, D. A.\n\n\n \n\n\n\n
IEEE Trans. Pattern Anal. Mach. Intell., 42(4): 824–836. 2020.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pami/MalkovY20,\n  author  = {Yury A. Malkov and\n             Dmitry A. Yashunin},\n  title   = {Efficient and Robust Approximate Nearest Neighbor Search Using Hierarchical Navigable Small World Graphs},\n  journal = {{IEEE} Trans. Pattern Anal. Mach. Intell.},\n  volume  = {42},\n  number  = {4},\n  pages   = {824--836},\n  year    = {2020},\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2019\n \n \n (6)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n Sherlock: A Deep Learning Approach to Semantic Data Type Detection.\n \n \n \n\n\n \n Hulsebos, M., Hu, K. Z., Bakker, M. A., Zgraggen, E., Satyanarayan, A., Kraska, T., Demiralp, Ç., & Hidalgo, C. A.\n\n\n \n\n\n\n In
SIGKDD, pages 1500–1508, 2019. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/kdd/HulsebosHBZSKDH19,\n  author    = {Madelon Hulsebos and\n               Kevin Zeng Hu and\n               Michiel A. Bakker and\n               Emanuel Zgraggen and\n               Arvind Satyanarayan and\n               Tim Kraska and\n               {\\c{C}}agatay Demiralp and\n               C{\\'{e}}sar A. Hidalgo},\n  title     = {Sherlock: {A} Deep Learning Approach to Semantic Data Type Detection},\n  booktitle = {SIGKDD},\n  pages     = {1500--1508},\n  year      = {2019},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Google Dataset Search: Building a search engine for datasets in an open Web ecosystem.\n \n \n \n\n\n \n Brickley, D., Burgess, M., & Noy, N. F.\n\n\n \n\n\n\n In
WWW, pages 1365–1375, 2019. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/www/BrickleyBN19,\n\tauthor = {Dan Brickley and\n\tMatthew Burgess and\n\tNatasha F. Noy},\n\ttitle = {Google {Dataset} {Search}: Building a search engine for datasets in an\n\topen {Web} ecosystem},\n\tbooktitle = {WWW},\n\tpages = {1365--1375},\n\tyear = {2019}\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n From Auto-tuning One Size Fits All to Self-designed and Learned Data-intensive Systems.\n \n \n \n\n\n \n Idreos, S., & Kraska, T.\n\n\n \n\n\n\n In
SIGMOD, pages 2054–2059, 2019. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/sigmod/IdreosK19,\n  author    = {Stratos Idreos and\n               Tim Kraska},\n  title     = {From Auto-tuning One Size Fits All to Self-designed and Learned Data-intensive Systems},\n  booktitle = {SIGMOD},\n  pages     = {2054--2059},\n  year      = {2019},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n JOSIE: Overlap Set Similarity Search for Finding Joinable Tables in Data Lakes.\n \n \n \n\n\n \n Zhu, E., Deng, D., Nargesian, F., & Miller, R. J.\n\n\n \n\n\n\n In
SIGMOD, pages 847–864, 2019. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n \n \n 4 downloads\n \n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/sigmod/ZhuDNM19,\n  author    = {Erkang Zhu and\n               Dong Deng and\n               Fatemeh Nargesian and\n               Ren{\\'{e}}e J. Miller},\n  title     = {{JOSIE:} Overlap Set Similarity Search for Finding Joinable Tables in Data Lakes},\n  booktitle = {SIGMOD},\n  pages     = {847--864},\n  year      = {2019},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Data Lake Management: Challenges and Opportunities.\n \n \n \n\n\n \n Nargesian, F., Zhu, E., Miller, R. J., Pu, K. Q., & Arocena, P. C.\n\n\n \n\n\n\n
Proc. VLDB Endow., 12(12): 1986–1989. 2019.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n \n \n 7 downloads\n \n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pvldb/NargesianZMPA19,\n  author  = {Fatemeh Nargesian and\n             Erkang Zhu and\n             Ren{\\'{e}}e J. Miller and\n             Ken Q. Pu and\n             Patricia C. Arocena},\n  title   = {Data Lake Management: Challenges and Opportunities},\n  journal = {Proc. {VLDB} Endow.},\n  volume  = {12},\n  number  = {12},\n  pages   = {1986--1989},\n  year    = {2019},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Synergy of Database Techniques and Machine Learning Models for String Similarity Search and Join.\n \n \n \n\n\n \n Lu, J., Lin, C., Wang, J., & Li, C.\n\n\n \n\n\n\n In
CIKM, pages 2975–2976, 2019. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/cikm/LuLW019,\n  author    = {Jiaheng Lu and\n               Chunbin Lin and\n               Jin Wang and\n               Chen Li},\n  title     = {Synergy of Database Techniques and Machine Learning Models for String Similarity Search and Join},\n  booktitle = {CIKM},\n  pages     = {2975--2976},\n  year      = {2019},\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2018\n \n \n (8)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n Making Open Data Transparent: Data Discovery on Open Data.\n \n \n \n\n\n \n Miller, R. J., Nargesian, F., Zhu, E., Christodoulakis, C., Pu, K. Q., & Andritsos, P.\n\n\n \n\n\n\n
IEEE Data Eng. Bull., 41(2): 59–70. 2018.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n \n \n 5 downloads\n \n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/debu/MillerNZCPA18,\n  author  = {Ren{\\'{e}}e J. Miller and\n             Fatemeh Nargesian and\n             Erkang Zhu and\n             Christina Christodoulakis and\n             Ken Q. Pu and\n             Periklis Andritsos},\n  title   = {Making Open Data Transparent: Data Discovery on Open Data},\n  journal = {{IEEE} Data Eng. Bull.},\n  volume  = {41},\n  number  = {2},\n  pages   = {59--70},\n  year    = {2018},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Table Union Search on Open Data.\n \n \n \n\n\n \n Nargesian, F., Zhu, E., Pu, K. Q., & Miller, R. J.\n\n\n \n\n\n\n
Proc. VLDB Endow., 11(7): 813–825. 2018.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n \n \n 3 downloads\n \n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pvldb/NargesianZPM18,\n  author  = {Fatemeh Nargesian and\n             Erkang Zhu and\n             Ken Q. Pu and\n             Ren{\\'{e}}e J. Miller},\n  title   = {Table Union Search on Open Data},\n  journal = {Proc. {VLDB} Endow.},\n  volume  = {11},\n  number  = {7},\n  pages   = {813--825},\n  year    = {2018},\n}\n
\n
\n\n\n\n
\n\n\n \n\n\n
\n
\n\n \n \n \n \n \n Open Data Integration.\n \n \n \n\n\n \n Miller, R. J.\n\n\n \n\n\n\n
Proc. VLDB Endow., 11(12): 2130–2139. 2018.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n \n \n 8 downloads\n \n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pvldb/Miller18,\n  author  = {Ren{\\'{e}}e J. Miller},\n  title   = {Open Data Integration},\n  journal = {Proc. {VLDB} Endow.},\n  volume  = {11},\n  number  = {12},\n  pages   = {2130--2139},\n  year    = {2018},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Seeping Semantics: Linking Datasets Using Word Embeddings for Data Discovery.\n \n \n \n\n\n \n Fernandez, R. C., Mansour, E., Qahtan, A. A., Elmagarmid, A. K., Ilyas, I. F., Madden, S., Ouzzani, M., Stonebraker, M., & Tang, N.\n\n\n \n\n\n\n In
ICDE, pages 989–1000, 2018. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/icde/FernandezMQEIMO18,\n  author    = {Raul Castro Fernandez and\n               Essam Mansour and\n               Abdulhakim Ali Qahtan and\n               Ahmed K. Elmagarmid and\n               Ihab F. Ilyas and\n               Samuel Madden and\n               Mourad Ouzzani and\n               Michael Stonebraker and\n               Nan Tang},\n  title     = {Seeping Semantics: Linking Datasets Using Word Embeddings for Data Discovery},\n  booktitle = {ICDE},\n  pages     = {989--1000},\n  year      = {2018},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Aurum: A Data Discovery System.\n \n \n \n\n\n \n Fernandez, R. C., Abedjan, Z., Koko, F., Yuan, G., Madden, S., & Stonebraker, M.\n\n\n \n\n\n\n In
ICDE, pages 1001–1012, 2018. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/icde/FernandezAKYMS18,\n  author    = {Raul Castro Fernandez and\n               Ziawasch Abedjan and\n               Famien Koko and\n               Gina Yuan and\n               Samuel Madden and\n               Michael Stonebraker},\n  title     = {Aurum: {A} Data Discovery System},\n  booktitle = {ICDE},\n  pages     = {1001--1012},\n  year      = {2018},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n The Periodic Table of Data Structures.\n \n \n \n\n\n \n Idreos, S., Zoumpatianos, K., Athanassoulis, M., Dayan, N., Hentschel, B., Kester, M. S., Guo, D., Maas, L. M., Qin, W., Wasay, A., & Sun, Y.\n\n\n \n\n\n\n
IEEE Data Eng. Bull., 41(3): 64–75. 2018.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/debu/IdreosZADHKGMQW18,\n  author  = {Stratos Idreos and\n             Kostas Zoumpatianos and\n             Manos Athanassoulis and\n             Niv Dayan and\n             Brian Hentschel and\n             Michael S. Kester and\n             Demi Guo and\n             Lukas M. Maas and\n             Wilson Qin and\n             Abdul Wasay and\n             Yiyou Sun},\n  title   = {The Periodic Table of Data Structures},\n  journal = {{IEEE} Data Eng. Bull.},\n  volume  = {41},\n  number  = {3},\n  pages   = {64--75},\n  year    = {2018},\n}\n\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Open Data Integration.\n \n \n \n\n\n \n Miller, R. J.\n\n\n \n\n\n\n
Proc. VLDB Endow., 11(12): 2130–2139. 2018.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n \n \n 8 downloads\n \n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
Duplicate of the DBLP:journals/pvldb/Miller18 entry listed earlier under 2018 (same key, same fields); the leading at-sign is dropped so BibTeX does not report a repeated entry.\narticle{DBLP:journals/pvldb/Miller18,\n author = {Ren{\\'{e}}e J. Miller},\n title = {Open Data Integration},\n journal = {Proc. {VLDB} Endow.},\n volume = {11},\n number = {12},\n pages = {2130--2139},\n year = {2018}\n}
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2017\n \n \n (2)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n Stitching Web Tables for Improving Matching Quality.\n \n \n \n\n\n \n Lehmberg, O., & Bizer, C.\n\n\n \n\n\n\n
Proc. VLDB Endow., 10(11): 1502–1513. 2017.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pvldb/LehmbergB17,\n  author  = {Oliver Lehmberg and\n             Christian Bizer},\n  title   = {Stitching Web Tables for Improving Matching Quality},\n  journal = {Proc. {VLDB} Endow.},\n  volume  = {10},\n  number  = {11},\n  pages   = {1502--1513},\n  year    = {2017},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Discovering Enterprise Concepts Using Spreadsheet Tables.\n \n \n \n\n\n \n Li, K., He, Y., & Ganjam, K.\n\n\n \n\n\n\n In
SIGKDD, pages 1873–1882, 2017. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/kdd/LiHG17,\n  author    = {Keqian Li and\n               Yeye He and\n               Kris Ganjam},\n  title     = {Discovering Enterprise Concepts Using Spreadsheet Tables},\n  booktitle = {SIGKDD},\n  pages     = {1873--1882},\n  year      = {2017},\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2016\n \n \n (5)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n A Large Public Corpus of Web Tables containing Time and Context Metadata.\n \n \n \n\n\n \n Lehmberg, O., Ritze, D., Meusel, R., & Bizer, C.\n\n\n \n\n\n\n In
WWW, pages 75–76, 2016. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/www/LehmbergRMB16,\n  author    = {Oliver Lehmberg and\n               Dominique Ritze and\n               Robert Meusel and\n               Christian Bizer},\n  title     = {A Large Public Corpus of Web Tables containing Time and Context Metadata},\n  booktitle = {WWW},\n  pages     = {75--76},\n  year      = {2016},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n LSH Ensemble: Internet-Scale Domain Search.\n \n \n \n\n\n \n Zhu, E., Nargesian, F., Pu, K. Q., & Miller, R. J.\n\n\n \n\n\n\n
Proc. VLDB Endow., 9(12): 1185–1196. 2016.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pvldb/ZhuNPM16,\n  author  = {Erkang Zhu and\n             Fatemeh Nargesian and\n             Ken Q. Pu and\n             Ren{\\'{e}}e J. Miller},\n  title   = {{LSH} Ensemble: Internet-Scale Domain Search},\n  journal = {Proc. {VLDB} Endow.},\n  volume  = {9},\n  number  = {12},\n  pages   = {1185--1196},\n  year    = {2016},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Goods: Organizing Google's Datasets.\n \n \n \n\n\n \n Halevy, A. Y., Korn, F., Noy, N. F., Olston, C., Polyzotis, N., Roy, S., & Whang, S. E.\n\n\n \n\n\n\n In
SIGMOD, pages 795–806, 2016. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/sigmod/HalevyKNOPRW16,\n author = {Alon Y. Halevy and\n Flip Korn and\n Natalya Fridman Noy and\n Christopher Olston and\n Neoklis Polyzotis and\n Sudip Roy and\n Steven Euijong Whang},\n title = {Goods: Organizing {Google's} Datasets},\n booktitle = {SIGMOD},\n pages = {795--806},\n year = {2016}\n}\n
\n
\n\n\n\n
\n\n\n \n\n\n
\n
\n\n \n \n \n \n \n CLAMS: Bringing Quality to Data Lakes.\n \n \n \n\n\n \n Farid, M. H., Roatis, A., Ilyas, I. F., Hoffmann, H., & Chu, X.\n\n\n \n\n\n\n In
SIGMOD, pages 2089–2092, 2016. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/sigmod/FaridRIHC16,\n  author    = {Mina H. Farid and\n               Alexandra Roatis and\n               Ihab F. Ilyas and\n               Hella{-}Franziska Hoffmann and\n               Xu Chu},\n  title     = {{CLAMS:} Bringing Quality to Data Lakes},\n  booktitle = {SIGMOD},\n  pages     = {2089--2092},\n  year      = {2016},\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2015\n \n \n (1)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n The Mannheim Search Join Engine.\n \n \n \n\n\n \n Lehmberg, O., Ritze, D., Ristoski, P., Meusel, R., Paulheim, H., & Bizer, C.\n\n\n \n\n\n\n
J. Web Semant., 35: 159–166. 2015.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/ws/LehmbergRRMPB15,\n author = {Oliver Lehmberg and\n Dominique Ritze and\n Petar Ristoski and\n Robert Meusel and\n Heiko Paulheim and\n Christian Bizer},\n title = {The {Mannheim} Search Join Engine},\n journal = {J. Web Semant.},\n volume = {35},\n pages = {159--166},\n year = {2015}\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2014\n \n \n (3)\n \n \n
\n
\n \n \n
\n\n\n
\n
\n\n \n \n \n \n \n MeanKS: meaningful keyword search in relational databases with complex schema.\n \n \n \n\n\n \n Kargar, M., An, A., Cercone, N., Godfrey, P., Szlichta, J., & Yu, X.\n\n\n \n\n\n\n In
SIGMOD, pages 905–908, 2014. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/sigmod/KargarACGSY14,\n author = {Mehdi Kargar and\n Aijun An and\n Nick Cercone and\n Parke Godfrey and\n Jaroslaw Szlichta and\n Xiaohui Yu},\n title = {{MeanKS}: meaningful keyword search in relational databases with complex\n schema},\n booktitle = {SIGMOD},\n pages = {905--908},\n year = {2014}\n}\n
\n
\n\n\n\n
\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2013\n \n \n (2)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n Synthesizing Union Tables from the Web.\n \n \n \n\n\n \n Ling, X., Halevy, A. Y., Wu, F., & Yu, C.\n\n\n \n\n\n\n In
IJCAI, pages 2677–2683, 2013. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/ijcai/LingH0Y13,\n  author    = {Xiao Ling and\n               Alon Y. Halevy and\n               Fei Wu and\n               Cong Yu},\n  title     = {Synthesizing Union Tables from the Web},\n  booktitle = {IJCAI},\n  pages     = {2677--2683},\n  year      = {2013},\n}\n
\n
\n\n\n\n
\n\n\n \n\n\n\n\n\n
\n
\n\n
\n
\n \n 2012\n \n \n (3)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n InfoGather: entity augmentation and attribute discovery by holistic matching with web tables.\n \n \n \n\n\n \n Yakout, M., Ganjam, K., Chakrabarti, K., & Chaudhuri, S.\n\n\n \n\n\n\n In
SIGMOD, pages 97–108, 2012. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/sigmod/YakoutGCC12,\n\tauthor = {Mohamed Yakout and\n\tKris Ganjam and\n\tKaushik Chakrabarti and\n\tSurajit Chaudhuri},\n\ttitle = {{InfoGather}: entity augmentation and attribute discovery by holistic\n\tmatching with web tables},\n\tbooktitle = {SIGMOD},\n\tpages = {97--108},\n\tyear = {2012}\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Answering Table Queries on the Web using Column Keywords.\n \n \n \n\n\n \n Pimplikar, R., & Sarawagi, S.\n\n\n \n\n\n\n
Proc. VLDB Endow., 5(10): 908–919. 2012.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pvldb/PimplikarS12,\n\tauthor = {Rakesh Pimplikar and Sunita Sarawagi},\n\ttitle = {Answering Table Queries on the Web using Column Keywords},\n\tjournal = {Proc. {VLDB} Endow.},\n\tvolume = {5},\n\tnumber = {10},\n\tpages = {908--919},\n\tyear = {2012},\n}\n
\n
\n\n\n\n
\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2011\n \n \n (1)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n Recovering Semantics of Tables on the Web.\n \n \n \n\n\n \n Venetis, P., Halevy, A. Y., Madhavan, J., Pasca, M., Shen, W., Wu, F., Miao, G., & Wu, C.\n\n\n \n\n\n\n
Proc. VLDB Endow., 4(9): 528–538. 2011.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pvldb/VenetisHMPSWMW11,\n\tauthor = {Petros Venetis and Alon Y. Halevy and Jayant Madhavan and Marius Pasca and Warren Shen and Fei Wu and Gengxin Miao and Chung Wu},\n\ttitle = {Recovering Semantics of Tables on the Web},\n\tjournal = {Proc. {VLDB} Endow.},\n\tvolume = {4},\n\tnumber = {9},\n\tpages = {528--538},\n\tyear = {2011},\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2010\n \n \n (2)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n Annotating and Searching Web Tables Using Entities, Types and Relationships.\n \n \n \n\n\n \n Limaye, G., Sarawagi, S., & Chakrabarti, S.\n\n\n \n\n\n\n
Proc. VLDB Endow., 3(1): 1338–1347. 2010.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pvldb/LimayeSC10,\n\tauthor = {Girija Limaye and Sunita Sarawagi and Soumen Chakrabarti},\n\ttitle = {Annotating and Searching Web Tables Using Entities, Types and Relationships},\n\tjournal = {Proc. {VLDB} Endow.},\n\tvolume = {3},\n\tnumber = {1},\n\tpages = {1338--1347},\n\tyear = {2010},\n}\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n On indexing error-tolerant set containment.\n \n \n \n\n\n \n Agrawal, P., Arasu, A., & Kaushik, R.\n\n\n \n\n\n\n In
SIGMOD, pages 927–938, 2010. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/sigmod/AgrawalAK10,\n\tauthor = {Parag Agrawal and Arvind Arasu and Raghav Kaushik},\n\ttitle = {On indexing error-tolerant set containment},\n\tbooktitle = {{SIGMOD}},\n\tpages = {927--938},\n\tyear = {2010},\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2009\n \n \n (1)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n Data Integration for the Relational Web.\n \n \n \n\n\n \n Cafarella, M. J., Halevy, A. Y., & Khoussainova, N.\n\n\n \n\n\n\n
Proc. VLDB Endow., 2(1): 1090–1101. 2009.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pvldb/CafarellaHK09,\n\tauthor = {Michael J. Cafarella and Alon Y. Halevy and Nodira Khoussainova},\n\ttitle = {Data Integration for the Relational Web},\n\tjournal = {Proc. {VLDB} Endow.},\n\tvolume = {2},\n\tnumber = {1},\n\tpages = {1090--1101},\n\tyear = {2009},\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2008\n \n \n (1)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n WebTables: exploring the power of tables on the web.\n \n \n \n\n\n \n Cafarella, M. J., Halevy, A. Y., Wang, D. Z., Wu, E., & Zhang, Y.\n\n\n \n\n\n\n
Proc. VLDB Endow., 1(1): 538–549. 2008.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{DBLP:journals/pvldb/CafarellaHWWZ08,\n\tauthor = {Michael J. Cafarella and\n\tAlon Y. Halevy and\n\tDaisy Zhe Wang and\n\tEugene Wu and\n\tYang Zhang},\n\ttitle = {{WebTables}: exploring the power of tables on the web},\n\tjournal = {Proc. {VLDB} Endow.},\n\tvolume = {1},\n\tnumber = {1},\n\tpages = {538--549},\n\tyear = {2008}\n}\n\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2004\n \n \n (1)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n Locality-sensitive hashing scheme based on p-stable distributions.\n \n \n \n\n\n \n Datar, M., Immorlica, N., Indyk, P., & Mirrokni, V. S.\n\n\n \n\n\n\n In
SCG, pages 253–262, 2004. ACM\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/compgeom/DatarIIM04,\n\tauthor = {Mayur Datar and Nicole Immorlica and Piotr Indyk and Vahab S. Mirrokni},\n\ttitle = {Locality-sensitive hashing scheme based on p-stable distributions},\n\tbooktitle = {{SCG}},\n\tpages = {253--262},\n\tpublisher = {{ACM}},\n\tyear = {2004},\n}\n\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2002\n \n \n (1)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n DISCOVER: Keyword Search in Relational Databases.\n \n \n \n\n\n \n Hristidis, V., & Papakonstantinou, Y.\n\n\n \n\n\n\n In
VLDB, pages 670–681, 2002. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/vldb/HristidisP02,\n author = {Vagelis Hristidis and\n Yannis Papakonstantinou},\n title = {{DISCOVER}: Keyword Search in Relational Databases},\n booktitle = {VLDB},\n pages = {670--681},\n year = {2002}\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n\n\n\n