var bibbase_data = {"data":"\"Loading..\"\n\n
\n\n \n\n \n\n \n \n\n \n\n \n \n\n \n\n \n
\n generated by\n \n \"bibbase.org\"\n\n \n
\n \n\n
\n\n \n\n\n
\n\n Excellent! Next you can\n create a new website with this list, or\n embed it in an existing web page by copying & pasting\n any of the following snippets.\n\n
\n JavaScript\n (easiest)\n
\n \n <script src=\"https://bibbase.org/show?bib=https%3A%2F%2Fgithub.com%2FRJMillerLab%2Fdata-lake-tutorial-slides%2Fraw%2Fmaster%2Fcitations.bib&jsonp=1&jsonp=1\"></script>\n \n
\n\n PHP\n
\n \n <?php\n $contents = file_get_contents(\"https://bibbase.org/show?bib=https%3A%2F%2Fgithub.com%2FRJMillerLab%2Fdata-lake-tutorial-slides%2Fraw%2Fmaster%2Fcitations.bib&jsonp=1\");\n print_r($contents);\n ?>\n \n
\n\n iFrame\n (not recommended)\n
\n \n <iframe src=\"https://bibbase.org/show?bib=https%3A%2F%2Fgithub.com%2FRJMillerLab%2Fdata-lake-tutorial-slides%2Fraw%2Fmaster%2Fcitations.bib&jsonp=1\"></iframe>\n \n
\n\n

\n For more details see the documention.\n

\n
\n
\n\n
\n\n This is a preview! To use this list on your own web site\n or create a new web site from it,\n create a free account. The file will be added\n and you will be able to edit it in the File Manager.\n We will show you instructions once you've created your account.\n
\n\n
\n\n

To the site owner:

\n\n

Action required! Mendeley is changing its\n API. In order to keep using Mendeley with BibBase past April\n 14th, you need to:\n

    \n
  1. renew the authorization for BibBase on Mendeley, and
  2. \n
  3. update the BibBase URL\n in your page the same way you did when you initially set up\n this page.\n
  4. \n
\n

\n\n

\n \n \n Fix it now\n

\n
\n\n
\n\n\n
\n \n \n
\n
\n  \n 2019\n \n \n (10)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n Parsing Gigabytes of JSON per Second.\n \n \n \n\n\n \n Langdale, G.; and Lemire, D.\n\n\n \n\n\n\n arXiv preprint arXiv:1902.08318. 2019.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{langdale2019parsing,\n  title={Parsing Gigabytes of JSON per Second},\n  author={Langdale, Geoff and Lemire, Daniel},\n  journal={arXiv preprint arXiv:1902.08318},\n  year={2019}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Speculative Distributed CSV Data Parsing for Big Data Analytics.\n \n \n \n\n\n \n Ge, C.; Li, Y.; Eilebrecht, E.; Chandramouli, B.; and Kossmann, D.\n\n\n \n\n\n\n In Proceedings of the 2019 International Conference on Management of Data, pages 883–899, 2019. ACM\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{ge2019speculative,\n  title={Speculative Distributed CSV Data Parsing for Big Data Analytics},\n  author={Ge, Chang and Li, Yinan and Eilebrecht, Eric and Chandramouli, Badrish and Kossmann, Donald},\n  booktitle={Proceedings of the 2019 International Conference on Management of Data},\n  pages={883--899},\n  year={2019},\n  organization={ACM}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Sherlock: A Deep Learning Approach to Semantic Data Type Detection.\n \n \n \n\n\n \n Hulsebos, M.; Hu, K.; Bakker, M.; Zgraggen, E.; Satyanarayan, A.; Kraska, T.; Demiralp, Ç.; and Hidalgo, C.\n\n\n \n\n\n\n arXiv preprint arXiv:1905.10688. 2019.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{hulsebos2019sherlock,\n  title={Sherlock: A Deep Learning Approach to Semantic Data Type Detection},\n  author={Hulsebos, Madelon and Hu, Kevin and Bakker, Michiel and Zgraggen, Emanuel and Satyanarayan, Arvind and Kraska, Tim and Demiralp, {\\c{C}}a{\\u{g}}atay and Hidalgo, C{\\'e}sar},\n  journal={arXiv preprint arXiv:1905.10688},\n  year={2019}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Unit Testing Data with Deequ.\n \n \n \n\n\n \n Schelter, S.; Biessmann, F.; Lange, D.; Rukat, T.; Schmidt, P.; Seufert, S.; Brunelle, P.; and Taptunov, A.\n\n\n \n\n\n\n In Proceedings of the 2019 International Conference on Management of Data, pages 1993–1996, 2019. ACM\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{schelter2019unit,\n  title={Unit Testing Data with Deequ},\n  author={Schelter, Sebastian and Biessmann, Felix and Lange, Dustin and Rukat, Tammo and Schmidt, Phillipp and Seufert, Stephan and Brunelle, Pierre and Taptunov, Andrey},\n  booktitle={Proceedings of the 2019 International Conference on Management of Data},\n  pages={1993--1996},\n  year={2019},\n  organization={ACM}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Lazo: A Cardinality-Based Method for Coupled Estimation of Jaccard Similarity and Containment.\n \n \n \n\n\n \n Fernandez, R. C.; Min, J.; Nava, D.; and Madden, S.\n\n\n \n\n\n\n In 2019 IEEE 35th International Conference on Data Engineering (ICDE), pages 1190–1201, 2019. IEEE\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n  \n \n 3 downloads\n \n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{fernandez2019lazo,\n  title={Lazo: A Cardinality-Based Method for Coupled Estimation of Jaccard Similarity and Containment},\n  author={Fernandez, Raul Castro and Min, Jisoo and Nava, Demitri and Madden, Samuel},\n  booktitle={2019 IEEE 35th International Conference on Data Engineering (ICDE)},\n  pages={1190--1201},\n  year={2019},\n  organization={IEEE}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n JOSIE: Overlap Set Similarity Search for Finding Joinable Tables in Data Lakes.\n \n \n \n\n\n \n Zhu, E.; Deng, D.; Nargesian, F.; and Miller, R. J\n\n\n \n\n\n\n In Proceedings of the 2019 International Conference on Management of Data, pages 847–864, 2019. ACM\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n  \n \n 4 downloads\n \n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{zhu2019josie,\n  title={JOSIE: Overlap Set Similarity Search for Finding Joinable Tables in Data Lakes},\n  author={Zhu, Erkang and Deng, Dong and Nargesian, Fatemeh and Miller, Ren{\\'e}e J},\n  booktitle={Proceedings of the 2019 International Conference on Management of Data},\n  pages={847--864},\n  year={2019},\n  organization={ACM}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Debugging Machine Learning Pipelines.\n \n \n \n\n\n \n Lourenço, R.; Freire, J.; and Shasha, D.\n\n\n \n\n\n\n In Proceedings of the 3rd International Workshop on Data Management for End-to-End Machine Learning, pages 3, 2019. ACM\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{lourencco2019debugging,\n  title={Debugging Machine Learning Pipelines},\n  author={Louren{\\c{c}}o, Raoni and Freire, Juliana and Shasha, Dennis},\n  booktitle={Proceedings of the 3rd International Workshop on Data Management for End-to-End Machine Learning},\n  pages={3},\n  year={2019},\n  organization={ACM}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n \n Large-Scale Schema Matching.\n \n \n \n \n\n\n \n Rahm, E.; and Peukert, E.\n\n\n \n\n\n\n In Encyclopedia of Big Data Technologies.. 2019.\n \n\n\n\n
\n\n\n\n \n \n \"Large-ScalePaper\n  \n \n\n \n \n doi\n  \n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@incollection{DBLP:reference/bdt/RahmP19b,\n  author    = {Erhard Rahm and\n               Eric Peukert},\n  title     = {Large-Scale Schema Matching},\n  booktitle = {Encyclopedia of Big Data Technologies.},\n  year      = {2019},\n  crossref  = {DBLP:reference/bdt/2019},\n  url       = {https://doi.org/10.1007/978-3-319-63962-8\\_330-1},\n  doi       = {10.1007/978-3-319-63962-8\\_330-1},\n  timestamp = {Thu, 14 Feb 2019 16:03:55 +0100},\n  biburl    = {https://dblp.org/rec/bib/reference/bdt/RahmP19b},\n  bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n \n Google Dataset Search: Building a search engine for datasets in an open Web ecosystem.\n \n \n \n \n\n\n \n Brickley, D.; Burgess, M.; and Noy, N. F.\n\n\n \n\n\n\n In The World Wide Web Conference, WWW 2019, San Francisco, CA, USA, May 13-17, 2019, pages 1365–1375, 2019. \n \n\n\n\n
\n\n\n\n \n \n \"GooglePaper\n  \n \n\n \n \n doi\n  \n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/www/BrickleyBN19,\n  author    = {Dan Brickley and\n               Matthew Burgess and\n               Natasha F. Noy},\n  title     = {Google Dataset Search: Building a search engine for datasets in an\n               open Web ecosystem},\n  booktitle = {The World Wide Web Conference, {WWW} 2019, San Francisco, CA, USA,\n               May 13-17, 2019},\n  pages     = {1365--1375},\n  year      = {2019},\n  crossref  = {DBLP:conf/www/2019},\n  url       = {https://doi.org/10.1145/3308558.3313685},\n  doi       = {10.1145/3308558.3313685},\n  timestamp = {Sun, 02 Jun 2019 21:15:59 +0200},\n  biburl    = {https://dblp.org/rec/bib/conf/www/BrickleyBN19},\n  bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n \n Debugging Machine Learning Pipelines.\n \n \n \n \n\n\n \n Lourenço, R.; Freire, J.; and Shasha, D.\n\n\n \n\n\n\n In Proceedings of the 3rd International Workshop on Data Management for End-to-End Machine Learning, of DEEM'19, pages 3:1–3:10, New York, NY, USA, 2019. ACM\n \n\n\n\n
\n\n\n\n \n \n \"DebuggingPaper\n  \n \n\n \n \n doi\n  \n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{Lourenco:2019:DML:3329486.3329489,\n author = {Louren\\c{c}o, Raoni and Freire, Juliana and Shasha, Dennis},\n title = {Debugging Machine Learning Pipelines},\n booktitle = {Proceedings of the 3rd International Workshop on Data Management for End-to-End Machine Learning},\n series = {DEEM'19},\n year = {2019},\n isbn = {978-1-4503-6797-4},\n location = {Amsterdam, Netherlands},\n pages = {3:1--3:10},\n articleno = {3},\n numpages = {10},\n url = {http://doi.acm.org/10.1145/3329486.3329489},\n doi = {10.1145/3329486.3329489},\n acmid = {3329489},\n publisher = {ACM},\n address = {New York, NY, USA},\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n  \n 2018\n \n \n (10)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n Filter before you parse: Faster analytics on raw data with sparser.\n \n \n \n\n\n \n Palkar, S.; Abuzaid, F.; Bailis, P.; and Zaharia, M.\n\n\n \n\n\n\n Proceedings of the VLDB Endowment, 11(11): 1576–1589. 2018.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{palkar2018filter,\n  title={Filter before you parse: Faster analytics on raw data with sparser},\n  author={Palkar, Shoumik and Abuzaid, Firas and Bailis, Peter and Zaharia, Matei},\n  journal={Proceedings of the VLDB Endowment},\n  volume={11},\n  number={11},\n  pages={1576--1589},\n  year={2018},\n  publisher={VLDB Endowment}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Navigating the data lake with datamaran: automatically extracting structure from log datasets.\n \n \n \n\n\n \n Gao, Y.; Huang, S.; and Parameswaran, A.\n\n\n \n\n\n\n In Proceedings of the 2018 International Conference on Management of Data, pages 943–958, 2018. ACM\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{gao2018navigating,\n  title={Navigating the data lake with datamaran: automatically extracting structure from log datasets},\n  author={Gao, Yihan and Huang, Silu and Parameswaran, Aditya},\n  booktitle={Proceedings of the 2018 International Conference on Management of Data},\n  pages={943--958},\n  year={2018},\n  organization={ACM}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Aurum: A data discovery system.\n \n \n \n\n\n \n Fernandez, R. C.; Abedjan, Z.; Koko, F.; Yuan, G.; Madden, S.; and Stonebraker, M.\n\n\n \n\n\n\n In 2018 IEEE 34th International Conference on Data Engineering (ICDE), pages 1001–1012, 2018. IEEE\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{fernandez2018aurum,\n  title={Aurum: A data discovery system},\n  author={Fernandez, Raul Castro and Abedjan, Ziawasch and Koko, Famien and Yuan, Gina and Madden, Samuel and Stonebraker, Michael},\n  booktitle={2018 IEEE 34th International Conference on Data Engineering (ICDE)},\n  pages={1001--1012},\n  year={2018},\n  organization={IEEE}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Seeping semantics: Linking datasets using word embeddings for data discovery.\n \n \n \n\n\n \n Fernandez, R. C.; Mansour, E.; Qahtan, A. A; Elmagarmid, A.; Ilyas, I.; Madden, S.; Ouzzani, M.; Stonebraker, M.; and Tang, N.\n\n\n \n\n\n\n In 2018 IEEE 34th International Conference on Data Engineering (ICDE), pages 989–1000, 2018. IEEE\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{fernandez2018seeping,\n  title={Seeping semantics: Linking datasets using word embeddings for data discovery},\n  author={Fernandez, Raul Castro and Mansour, Essam and Qahtan, Abdulhakim A and Elmagarmid, Ahmed and Ilyas, Ihab and Madden, Samuel and Ouzzani, Mourad and Stonebraker, Michael and Tang, Nan},\n  booktitle={2018 IEEE 34th International Conference on Data Engineering (ICDE)},\n  pages={989--1000},\n  year={2018},\n  organization={IEEE}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Skluma: An extensible metadata extraction pipeline for disorganized data.\n \n \n \n\n\n \n Skluzacek, T. J; Kumar, R.; Chard, R.; Harrison, G.; Beckman, P.; Chard, K.; and Foster, I.\n\n\n \n\n\n\n In 2018 IEEE 14th International Conference on e-Science (e-Science), pages 256–266, 2018. IEEE\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{skluzacek2018skluma,\n  title={Skluma: An extensible metadata extraction pipeline for disorganized data},\n  author={Skluzacek, Tyler J and Kumar, Rohan and Chard, Ryan and Harrison, Galen and Beckman, Paul and Chard, Kyle and Foster, Ian},\n  booktitle={2018 IEEE 14th International Conference on e-Science (e-Science)},\n  pages={256--266},\n  year={2018},\n  organization={IEEE}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Automating large-scale data quality verification.\n \n \n \n\n\n \n Schelter, S.; Lange, D.; Schmidt, P.; Celikel, M.; Biessmann, F.; and Grafberger, A.\n\n\n \n\n\n\n Proceedings of the VLDB Endowment, 11(12): 1781–1794. 2018.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{schelter2018automating,\n  title={Automating large-scale data quality verification},\n  author={Schelter, Sebastian and Lange, Dustin and Schmidt, Philipp and Celikel, Meltem and Biessmann, Felix and Grafberger, Andreas},\n  journal={Proceedings of the VLDB Endowment},\n  volume={11},\n  number={12},\n  pages={1781--1794},\n  year={2018},\n  publisher={VLDB Endowment}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Demonstration of a Multiresolution Schema Mapping System.\n \n \n \n\n\n \n Jin, Z.; Baik, C.; Cafarella, M.; Jagadish, H.; and Lou, Y.\n\n\n \n\n\n\n arXiv preprint arXiv:1812.07658. 2018.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{jin2018demonstration,\n  title={Demonstration of a Multiresolution Schema Mapping System},\n  author={Jin, Zhongjun and Baik, Christopher and Cafarella, Michael and Jagadish, HV and Lou, Yuze},\n  journal={arXiv preprint arXiv:1812.07658},\n  year={2018}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Apache calcite: A foundational framework for optimized query processing over heterogeneous data sources.\n \n \n \n\n\n \n Begoli, E.; Camacho-Rodrı́guez, Jesús; Hyde, J.; Mior, M. J; and Lemire, D.\n\n\n \n\n\n\n In Proceedings of the 2018 International Conference on Management of Data, pages 221–230, 2018. ACM\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{begoli2018apache,\n  title={Apache calcite: A foundational framework for optimized query processing over heterogeneous data sources},\n  author={Begoli, Edmon and Camacho-Rodr{\\'\\i}guez, Jes{\\'u}s and Hyde, Julian and Mior, Michael J and Lemire, Daniel},\n  booktitle={Proceedings of the 2018 International Conference on Management of Data},\n  pages={221--230},\n  year={2018},\n  organization={ACM}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Table union search on open data.\n \n \n \n\n\n \n Nargesian, F.; Zhu, E.; Pu, K. Q; and Miller, R. J\n\n\n \n\n\n\n Proceedings of the VLDB Endowment, 11(7): 813–825. 2018.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n  \n \n 3 downloads\n \n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{nargesian2018table,\n  title={Table union search on open data},\n  author={Nargesian, Fatemeh and Zhu, Erkang and Pu, Ken Q and Miller, Ren{\\'e}e J},\n  journal={Proceedings of the VLDB Endowment},\n  volume={11},\n  number={7},\n  pages={813--825},\n  year={2018},\n  publisher={VLDB Endowment}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n \n ProgressER: Adaptive Progressive Approach to Relational Entity Resolution.\n \n \n \n \n\n\n \n Altowim, Y.; Kalashnikov, D. V.; and Mehrotra, S.\n\n\n \n\n\n\n TKDD, 12(3): 33:1–33:45. 2018.\n \n\n\n\n
\n\n\n\n \n \n \"ProgressER:Paper\n  \n \n\n \n \n doi\n  \n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{DBLP:journals/tkdd/AltowimKM18,\n  author    = {Yasser Altowim and\n               Dmitri V. Kalashnikov and\n               Sharad Mehrotra},\n  title     = {ProgressER: Adaptive Progressive Approach to Relational Entity Resolution},\n  journal   = {{TKDD}},\n  volume    = {12},\n  number    = {3},\n  pages     = {33:1--33:45},\n  year      = {2018},\n  url       = {https://doi.org/10.1145/3154410},\n  doi       = {10.1145/3154410},\n  timestamp = {Wed, 21 Nov 2018 12:44:28 +0100},\n  biburl    = {https://dblp.org/rec/bib/journals/tkdd/AltowimKM18},\n  bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n  \n 2017\n \n \n (5)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n \n Data Profiling: A Tutorial.\n \n \n \n \n\n\n \n Abedjan, Z.; Golab, L.; and Naumann, F.\n\n\n \n\n\n\n In Proceedings of the 2017 ACM International Conference on Management of Data, SIGMOD Conference 2017, Chicago, IL, USA, May 14-19, 2017, pages 1747–1751, 2017. \n \n\n\n\n
\n\n\n\n \n \n \"DataPaper\n  \n \n\n \n \n doi\n  \n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/sigmod/AbedjanGN17,\n  author    = {Ziawasch Abedjan and\n               Lukasz Golab and\n               Felix Naumann},\n  title     = {Data Profiling: {A} Tutorial},\n  booktitle = {Proceedings of the 2017 {ACM} International Conference on Management\n               of Data, {SIGMOD} Conference 2017, Chicago, IL, USA, May 14-19, 2017},\n  pages     = {1747--1751},\n  year      = {2017},\n  crossref  = {DBLP:conf/sigmod/2017},\n  url       = {https://doi.org/10.1145/3035918.3054772},\n  doi       = {10.1145/3035918.3054772},\n  timestamp = {Tue, 06 Nov 2018 11:07:37 +0100},\n  biburl    = {https://dblp.org/rec/bib/conf/sigmod/AbedjanGN17},\n  bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n \n Skluma: A Statistical Learning Pipeline for Taming Unkempt Data Repositories.\n \n \n \n \n\n\n \n Beckman, P.; Skluzacek, T. J.; Chard, K.; and Foster, I.\n\n\n \n\n\n\n In Proceedings of the 29th International Conference on Scientific and Statistical Database Management, of SSDBM '17, pages 41:1–41:4, New York, NY, USA, 2017. ACM\n \n\n\n\n
\n\n\n\n \n \n \"Skluma:Paper\n  \n \n\n \n \n doi\n  \n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n \n \n \n \n \n \n \n \n\n\n\n
\n
@inproceedings{Beckman:2017:SSL:3085504.3091116,\n author = {Beckman, Paul and Skluzacek, Tyler J. and Chard, Kyle and Foster, Ian},\n title = {Skluma: A Statistical Learning Pipeline for Taming Unkempt Data Repositories},\n booktitle = {Proceedings of the 29th International Conference on Scientific and Statistical Database Management},\n series = {SSDBM '17},\n year = {2017},\n isbn = {978-1-4503-5282-6},\n location = {Chicago, IL, USA},\n pages = {41:1--41:4},\n articleno = {41},\n numpages = {4},\n url = {http://doi.acm.org/10.1145/3085504.3091116},\n doi = {10.1145/3085504.3091116},\n acmid = {3091116},\n publisher = {ACM},\n address = {New York, NY, USA},\n keywords = {data integration, data wrangling, metadata extraction, statistical learning},\n} \n\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n \n Parallel Progressive Approach to Entity Resolution Using MapReduce.\n \n \n \n \n\n\n \n Altowim, Y.; and Mehrotra, S.\n\n\n \n\n\n\n In 33rd IEEE International Conference on Data Engineering, ICDE 2017, San Diego, CA, USA, April 19-22, 2017, pages 909–920, 2017. \n \n\n\n\n
\n\n\n\n \n \n \"ParallelPaper\n  \n \n\n \n \n doi\n  \n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/icde/AltowimM17,\n  author    = {Yasser Altowim and\n               Sharad Mehrotra},\n  title     = {Parallel Progressive Approach to Entity Resolution Using MapReduce},\n  booktitle = {33rd {IEEE} International Conference on Data Engineering, {ICDE} 2017,\n               San Diego, CA, USA, April 19-22, 2017},\n  pages     = {909--920},\n  year      = {2017},\n  crossref  = {DBLP:conf/icde/2017},\n  url       = {https://doi.org/10.1109/ICDE.2017.139},\n  doi       = {10.1109/ICDE.2017.139},\n  timestamp = {Tue, 29 May 2018 16:11:42 +0200},\n  biburl    = {https://dblp.org/rec/bib/conf/icde/AltowimM17},\n  bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Ground: A Data Context Service.\n \n \n \n\n\n \n Hellerstein, J. M; Sreekanti, V.; Gonzalez, J. E; Dalton, J.; Dey, A.; Nag, S.; Ramachandran, K.; Arora, S.; Bhattacharyya, A.; Das, S.; and others\n\n\n \n\n\n\n In CIDR, 2017. \n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{hellerstein2017ground,\n  title={Ground: A Data Context Service.},\n  author={Hellerstein, Joseph M and Sreekanti, Vikram and Gonzalez, Joseph E and Dalton, James and Dey, Akon and Nag, Sreyashi and Ramachandran, Krishna and Arora, Sudhanshu and Bhattacharyya, Arka and Das, Shirshanka and others},\n  booktitle={CIDR},\n  year={2017}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Orpheus DB: bolt-on versioning for relational databases.\n \n \n \n\n\n \n Huang, S.; Xu, L.; Liu, J.; Elmore, A. J; and Parameswaran, A.\n\n\n \n\n\n\n Proceedings of the VLDB Endowment, 10(10): 1130–1141. 2017.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{huang2017rpheus,\n  title={Orpheus DB: bolt-on versioning for relational databases},\n  author={Huang, Silu and Xu, Liqi and Liu, Jialin and Elmore, Aaron J and Parameswaran, Aditya},\n  journal={Proceedings of the VLDB Endowment},\n  volume={10},\n  number={10},\n  pages={1130--1141},\n  year={2017},\n  publisher={VLDB Endowment}\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n  \n 2016\n \n \n (9)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n \n Goods: Organizing Google's Datasets.\n \n \n \n \n\n\n \n Halevy, A.; Korn, F.; Noy, N. F.; Olston, C.; Polyzotis, N.; Roy, S.; and Whang, S. E.\n\n\n \n\n\n\n In Proceedings of the 2016 International Conference on Management of Data, of SIGMOD '16, pages 795–806, New York, NY, USA, 2016. ACM\n \n\n\n\n
\n\n\n\n \n \n \"Goods:Paper\n  \n \n\n \n \n doi\n  \n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n\n\n\n
\n
@inproceedings{Halevy:2016:GOG:2882903.2903730,\n author = {Halevy, Alon and Korn, Flip and Noy, Natalya F. and Olston, Christopher and Polyzotis, Neoklis and Roy, Sudip and Whang, Steven Euijong},\n title = {Goods: Organizing Google's Datasets},\n booktitle = {Proceedings of the 2016 International Conference on Management of Data},\n series = {SIGMOD '16},\n year = {2016},\n isbn = {978-1-4503-3531-7},\n location = {San Francisco, California, USA},\n pages = {795--806},\n numpages = {12},\n url = {http://doi.acm.org/10.1145/2882903.2903730},\n doi = {10.1145/2882903.2903730},\n acmid = {2903730},\n publisher = {ACM},\n address = {New York, NY, USA},\n keywords = {data culture, data flow, data lakes, data monitoring, data organization, data provenance, data search, enterprise data management, metadata extraction},\n} \n\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n \n Constance: An Intelligent Data Lake System.\n \n \n \n \n\n\n \n Hai, R.; Geisler, S.; and Quix, C.\n\n\n \n\n\n\n In Proceedings of the 2016 International Conference on Management of Data, of SIGMOD '16, pages 2097–2100, New York, NY, USA, 2016. ACM\n \n\n\n\n
\n\n\n\n \n \n \"Constance:Paper\n  \n \n\n \n \n doi\n  \n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n \n \n \n \n \n \n\n\n\n
\n
@inproceedings{Hai:2016:CID:2882903.2899389,\n author = {Hai, Rihan and Geisler, Sandra and Quix, Christoph},\n title = {Constance: An Intelligent Data Lake System},\n booktitle = {Proceedings of the 2016 International Conference on Management of Data},\n series = {SIGMOD '16},\n year = {2016},\n isbn = {978-1-4503-3531-7},\n location = {San Francisco, California, USA},\n pages = {2097--2100},\n numpages = {4},\n url = {http://doi.acm.org/10.1145/2882903.2899389},\n doi = {10.1145/2882903.2899389},\n acmid = {2899389},\n publisher = {ACM},\n address = {New York, NY, USA},\n keywords = {data integration, data lake, data quality},\n} \n\n\n\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Extracting databases from dark data with DeepDive.\n \n \n \n\n\n \n Zhang, C.; Shin, J.; Ré, C.; Cafarella, M.; and Niu, F.\n\n\n \n\n\n\n In Proceedings of the 2016 International Conference on Management of Data, pages 847–859, 2016. ACM\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{zhang2016extracting,\n  title={Extracting databases from dark data with DeepDive},\n  author={Zhang, Ce and Shin, Jaeho and R{\\'e}, Christopher and Cafarella, Michael and Niu, Feng},\n  booktitle={Proceedings of the 2016 International Conference on Management of Data},\n  pages={847--859},\n  year={2016},\n  organization={ACM}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n A large public corpus of web tables containing time and context metadata.\n \n \n \n\n\n \n Lehmberg, O.; Ritze, D.; Meusel, R.; and Bizer, C.\n\n\n \n\n\n\n In Proceedings of the 25th International Conference Companion on World Wide Web, pages 75–76, 2016. International World Wide Web Conferences Steering Committee\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{lehmberg2016large,\n  title={A large public corpus of web tables containing time and context metadata},\n  author={Lehmberg, Oliver and Ritze, Dominique and Meusel, Robert and Bizer, Christian},\n  booktitle={Proceedings of the 25th International Conference Companion on World Wide Web},\n  pages={75--76},\n  year={2016},\n  organization={International World Wide Web Conferences Steering Committee}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Extracting databases from dark data with DeepDive.\n \n \n \n\n\n \n Zhang, C.; Shin, J.; Ré, C.; Cafarella, M.; and Niu, F.\n\n\n \n\n\n\n In Proceedings of the 2016 International Conference on Management of Data, pages 847–859, 2016. ACM\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{zhang2016extracting,\n  title={Extracting databases from dark data with DeepDive},\n  author={Zhang, Ce and Shin, Jaeho and R{\\'e}, Christopher and Cafarella, Michael and Niu, Feng},\n  booktitle={Proceedings of the 2016 International Conference on Management of Data},\n  pages={847--859},\n  year={2016},\n  organization={ACM}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n CLAMS: bringing quality to Data Lakes.\n \n \n \n\n\n \n Farid, undefined; Roatis, A.; Ilyas, I. F; Hoffmann, H.; and Chu, X.\n\n\n \n\n\n\n In Proceedings of the 2016 International Conference on Management of Data, pages 2089–2092, 2016. ACM\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{farid2016clams,\n  title={CLAMS: bringing quality to Data Lakes},\n  author={Farid, \n  and Roatis, Alexandra and Ilyas, Ihab F and Hoffmann, Hella-Franziska and Chu, Xu},\n  booktitle={Proceedings of the 2016 International Conference on Management of Data},\n  pages={2089--2092},\n  year={2016},\n  organization={ACM}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n LSH ensemble: internet-scale domain search.\n \n \n \n\n\n \n Zhu, E.; Nargesian, F.; Pu, K. Q; and Miller, R. J\n\n\n \n\n\n\n Proceedings of the VLDB Endowment, 9(12): 1185–1196. 2016.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{zhu2016lsh,\n  title={LSH ensemble: internet-scale domain search},\n  author={Zhu, Erkang and Nargesian, Fatemeh and Pu, Ken Q and Miller, Ren{\\'e}e J},\n  journal={Proceedings of the VLDB Endowment},\n  volume={9},\n  number={12},\n  pages={1185--1196},\n  year={2016},\n  publisher={VLDB Endowment}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n YAGO: A multilingual knowledge base from wikipedia, wordnet, and geonames.\n \n \n \n\n\n \n Rebele, T.; Suchanek, F.; Hoffart, J.; Biega, J.; Kuzey, E.; and Weikum, G.\n\n\n \n\n\n\n In International Semantic Web Conference, pages 177–185, 2016. Springer\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{rebele2016yago,\n  title={YAGO: A multilingual knowledge base from wikipedia, wordnet, and geonames},\n  author={Rebele, Thomas and Suchanek, Fabian and Hoffart, Johannes and Biega, Joanna and Kuzey, Erdal and Weikum, Gerhard},\n  booktitle={International Semantic Web Conference},\n  pages={177--185},\n  year={2016},\n  organization={Springer}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Leveraging the impact of ontology evolution on semantic annotations.\n \n \n \n\n\n \n Cardoso, S. D.; Pruski, C.; Da Silveira, M.; Lin, Y.; Groß, A.; Rahm, E.; and Reynaud-Delaı̂tre, Chantal\n\n\n \n\n\n\n In European Knowledge Acquisition Workshop, pages 68–82, 2016. Springer\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{cardoso2016leveraging,\n  title={Leveraging the impact of ontology evolution on semantic annotations},\n  author={Cardoso, Silvio Domingos and Pruski, C{\\'e}dric and Da Silveira, Marcos and Lin, Ying-Chi and Gro{\\ss}, Anika and Rahm, Erhard and Reynaud-Dela{\\^\\i}tre, Chantal},\n  booktitle={European Knowledge Acquisition Workshop},\n  pages={68--82},\n  year={2016},\n  organization={Springer}\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n  \n 2015\n \n \n (7)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n \n LabBook: Metadata-driven Social Collaborative Data Analysis.\n \n \n \n \n\n\n \n Kandogan, E.; Roth, M.; Schwarz, P.; Hui, J.; Terrizzano, I.; Christodoulakis, C.; and Miller, R. J.\n\n\n \n\n\n\n In Proceedings of the 2015 IEEE International Conference on Big Data (Big Data), of BIG DATA '15, pages 431–440, Washington, DC, USA, 2015. IEEE Computer Society\n \n\n\n\n
\n\n\n\n \n \n \"LabBook:Paper\n  \n \n\n \n \n doi\n  \n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n  \n \n 1 download\n \n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{Kandogan:2015:LMS:2877966.2878090,\n author = {Kandogan, Eser and Roth, Mary and Schwarz, Peter and Hui, Joshua and Terrizzano, Ignacio and Christodoulakis, Christina and Miller, Renee J.},\n title = {LabBook: Metadata-driven Social Collaborative Data Analysis},\n booktitle = {Proceedings of the 2015 IEEE International Conference on Big Data (Big Data)},\n series = {BIG DATA '15},\n year = {2015},\n isbn = {978-1-4799-9926-2},\n pages = {431--440},\n numpages = {10},\n url = {https://doi.org/10.1109/BigData.2015.7363784},\n doi = {10.1109/BigData.2015.7363784},\n acmid = {2878090},\n publisher = {IEEE Computer Society},\n address = {Washington, DC, USA},\n} \n\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Building the dresden web table corpus: A classification approach.\n \n \n \n\n\n \n Eberius, J.; Braunschweig, K.; Hentsch, M.; Thiele, M.; Ahmadov, A.; and Lehner, W.\n\n\n \n\n\n\n In 2015 IEEE/ACM 2nd International Symposium on Big Data Computing (BDC), pages 41–50, 2015. IEEE\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{eberius2015building,\n  title={Building the dresden web table corpus: A classification approach},\n  author={Eberius, Julian and Braunschweig, Katrin and Hentsch, Markus and Thiele, Maik and Ahmadov, Ahmad and Lehner, Wolfgang},\n  booktitle={2015 IEEE/ACM 2nd International Symposium on Big Data Computing (BDC)},\n  pages={41--50},\n  year={2015},\n  organization={IEEE}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Labbook: Metadata-driven social collaborative data analysis.\n \n \n \n\n\n \n Kandogan, E.; Roth, M.; Schwarz, P.; Hui, J.; Terrizzano, I.; Christodoulakis, C.; and Miller, R. J\n\n\n \n\n\n\n In 2015 IEEE International Conference on Big Data (Big Data), pages 431–440, 2015. IEEE\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n  \n \n 1 download\n \n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{kandogan2015labbook,\n  title={Labbook: Metadata-driven social collaborative data analysis},\n  author={Kandogan, Eser and Roth, Mary and Schwarz, Peter and Hui, Joshua and Terrizzano, Ignacio and Christodoulakis, Christina and Miller, Ren{\\'e}e J},\n  booktitle={2015 IEEE International Conference on Big Data (Big Data)},\n  pages={431--440},\n  year={2015},\n  organization={IEEE}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Data x-ray: A diagnostic tool for data errors.\n \n \n \n\n\n \n Wang, X.; Dong, X. L.; and Meliou, A.\n\n\n \n\n\n\n In Proceedings of the 2015 ACM SIGMOD International Conference on Management of Data, pages 1231–1245, 2015. ACM\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{wang2015data,\n  title={Data x-ray: A diagnostic tool for data errors},\n  author={Wang, Xiaolan and Dong, Xin Luna and Meliou, Alexandra},\n  booktitle={Proceedings of the 2015 ACM SIGMOD International Conference on Management of Data},\n  pages={1231--1245},\n  year={2015},\n  organization={ACM}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Principles of dataset versioning: Exploring the recreation/storage tradeoff.\n \n \n \n\n\n \n Bhattacherjee, S.; Chavan, A.; Huang, S.; Deshpande, A.; and Parameswaran, A.\n\n\n \n\n\n\n Proceedings of the VLDB Endowment, 8(12): 1346–1357. 2015.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{bhattacherjee2015principles,\n  title={Principles of dataset versioning: Exploring the recreation/storage tradeoff},\n  author={Bhattacherjee, Souvik and Chavan, Amit and Huang, Silu and Deshpande, Amol and Parameswaran, Aditya},\n  journal={Proceedings of the VLDB Endowment},\n  volume={8},\n  number={12},\n  pages={1346--1357},\n  year={2015},\n  publisher={VLDB Endowment}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Collaborative data analytics with DataHub.\n \n \n \n\n\n \n Bhardwaj, A.; Deshpande, A.; Elmore, A. J; Karger, D.; Madden, S.; Parameswaran, A.; Subramanyam, H.; Wu, E.; and Zhang, R.\n\n\n \n\n\n\n Proceedings of the VLDB Endowment, 8(12): 1916–1919. 2015.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{bhardwaj2015collaborative,\n  title={Collaborative data analytics with DataHub},\n  author={Bhardwaj, Anant and Deshpande, Amol and Elmore, Aaron J and Karger, David and Madden, Sam and Parameswaran, Aditya and Subramanyam, Harihar and Wu, Eugene and Zhang, Rebecca},\n  journal={Proceedings of the VLDB Endowment},\n  volume={8},\n  number={12},\n  pages={1916--1919},\n  year={2015},\n  publisher={VLDB Endowment}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Combining quantitative and logical data cleaning.\n \n \n \n\n\n \n Prokoshyna, N.; Szlichta, J.; Chiang, F.; Miller, R. J; and Srivastava, D.\n\n\n \n\n\n\n Proceedings of the VLDB Endowment, 9(4): 300–311. 2015.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{prokoshyna2015combining,\n  title={Combining quantitative and logical data cleaning},\n  author={Prokoshyna, Nataliya and Szlichta, Jaroslaw and Chiang, Fei and Miller, Ren{\\'e}e J and Srivastava, Divesh},\n  journal={Proceedings of the VLDB Endowment},\n  volume={9},\n  number={4},\n  pages={300--311},\n  year={2015},\n  publisher={VLDB Endowment}\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n  \n 2014\n \n \n (1)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n Orca: a modular query optimizer architecture for big data.\n \n \n \n\n\n \n Soliman, M. A; Antova, L.; Raghavan, V.; El-Helw, A.; Gu, Z.; Shen, E.; Caragea, G. C; Garcia-Alvarado, C.; Rahman, F.; Petropoulos, M.; and others\n\n\n \n\n\n\n In Proceedings of the 2014 ACM SIGMOD international conference on Management of data, pages 337–348, 2014. ACM\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{soliman2014orca,\n  title={Orca: a modular query optimizer architecture for big data},\n  author={Soliman, Mohamed A and Antova, Lyublena and Raghavan, Venkatesh and El-Helw, Amr and Gu, Zhongxian and Shen, Entong and Caragea, George C and Garcia-Alvarado, Carlos and Rahman, Foyzur and Petropoulos, Michalis and others},\n  booktitle={Proceedings of the 2014 ACM SIGMOD international conference on Management of data},\n  pages={337--348},\n  year={2014},\n  organization={ACM}\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n  \n 2013\n \n \n (2)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n \n Discovering Denial Constraints.\n \n \n \n \n\n\n \n Chu, X.; Ilyas, I. F.; and Papotti, P.\n\n\n \n\n\n\n Proc. VLDB Endow., 6(13): 1498–1509. August 2013.\n \n\n\n\n
\n\n\n\n \n \n \"DiscoveringPaper\n  \n \n\n \n \n doi\n  \n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{Chu:2013:DDC:2536258.2536262,\n author = {Chu, Xu and Ilyas, Ihab F. and Papotti, Paolo},\n title = {Discovering Denial Constraints},\n journal = {Proc. VLDB Endow.},\n issue_date = {August 2013},\n volume = {6},\n number = {13},\n month = aug,\n year = {2013},\n issn = {2150-8097},\n pages = {1498--1509},\n numpages = {12},\n url = {http://dx.doi.org/10.14778/2536258.2536262},\n doi = {10.14778/2536258.2536262},\n acmid = {2536262},\n publisher = {VLDB Endowment},\n} \n\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Schema mappings and data examples.\n \n \n \n\n\n \n Ten Cate, B.; Kolaitis, P. G; and Tan, W.\n\n\n \n\n\n\n In Proceedings of the 16th International Conference on Extending Database Technology, pages 777–780, 2013. ACM\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{ten2013schema,\n  title={Schema mappings and data examples},\n  author={Ten Cate, Balder and Kolaitis, Phokion G and Tan, Wang-Chiew},\n  booktitle={Proceedings of the 16th International Conference on Extending Database Technology},\n  pages={777--780},\n  year={2013},\n  organization={ACM}\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n  \n 2012\n \n \n (6)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n Answering table queries on the web using column keywords.\n \n \n \n\n\n \n Pimplikar, R.; and Sarawagi, S.\n\n\n \n\n\n\n Proceedings of the VLDB Endowment, 5(10): 908–919. 2012.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{pimplikar2012answering,\n  title={Answering table queries on the web using column keywords},\n  author={Pimplikar, Rakesh and Sarawagi, Sunita},\n  journal={Proceedings of the VLDB Endowment},\n  volume={5},\n  number={10},\n  pages={908--919},\n  year={2012},\n  publisher={VLDB Endowment}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Sample-driven schema mapping.\n \n \n \n\n\n \n Qian, L.; Cafarella, M. J; and Jagadish, H.\n\n\n \n\n\n\n In Proceedings of the 2012 ACM SIGMOD International Conference on Management of Data, pages 73–84, 2012. ACM\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{qian2012sample,\n  title={Sample-driven schema mapping},\n  author={Qian, Li and Cafarella, Michael J and Jagadish, HV},\n  booktitle={Proceedings of the 2012 ACM SIGMOD International Conference on Management of Data},\n  pages={73--84},\n  year={2012},\n  organization={ACM}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Infogather: entity augmentation and attribute discovery by holistic matching with web tables.\n \n \n \n\n\n \n Yakout, M.; Ganjam, K.; Chakrabarti, K.; and Chaudhuri, S.\n\n\n \n\n\n\n In Proceedings of the 2012 ACM SIGMOD International Conference on Management of Data, pages 97–108, 2012. ACM\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{yakout2012infogather,\n  title={Infogather: entity augmentation and attribute discovery by holistic matching with web tables},\n  author={Yakout, Mohamed and Ganjam, Kris and Chakrabarti, Kaushik and Chaudhuri, Surajit},\n  booktitle={Proceedings of the 2012 ACM SIGMOD International Conference on Management of Data},\n  pages={97--108},\n  year={2012},\n  organization={ACM}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Answering table queries on the web using column keywords.\n \n \n \n\n\n \n Pimplikar, R.; and Sarawagi, S.\n\n\n \n\n\n\n Proceedings of the VLDB Endowment, 5(10): 908–919. 2012.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{pimplikar2012answering,\n  title={Answering table queries on the web using column keywords},\n  author={Pimplikar, Rakesh and Sarawagi, Sunita},\n  journal={Proceedings of the VLDB Endowment},\n  volume={5},\n  number={10},\n  pages={908--919},\n  year={2012},\n  publisher={VLDB Endowment}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n \n LearnPADS + + : Incremental Inference of Ad Hoc Data Formats.\n \n \n \n \n\n\n \n Zhu, K. Q.; Fisher, K.; and Walker, D.\n\n\n \n\n\n\n In Practical Aspects of Declarative Languages - 14th International Symposium, PADL 2012, Philadelphia, PA, USA, January 23-24, 2012. Proceedings, pages 168–182, 2012. \n \n\n\n\n
\n\n\n\n \n \n \"LearnPADSPaper\n  \n \n\n \n \n doi\n  \n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/padl/ZhuFW12,\n  author    = {Kenny Qili Zhu and\n               Kathleen Fisher and\n               David Walker},\n  title     = {LearnPADS + + : Incremental Inference of Ad Hoc Data Formats},\n  booktitle = {Practical Aspects of Declarative Languages - 14th International Symposium,\n               {PADL} 2012, Philadelphia, PA, USA, January 23-24, 2012. Proceedings},\n  pages     = {168--182},\n  year      = {2012},\n  crossref  = {DBLP:conf/padl/2012},\n  url       = {https://doi.org/10.1007/978-3-642-27694-1\\_13},\n  doi       = {10.1007/978-3-642-27694-1\\_13},\n  timestamp = {Tue, 14 May 2019 10:00:42 +0200},\n  biburl    = {https://dblp.org/rec/bib/conf/padl/ZhuFW12},\n  bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n \n One Permutation Hashing.\n \n \n \n \n\n\n \n Li, P.; Owen, A. B; and Zhang, C.\n\n\n \n\n\n\n In Proceedings of the 25th International Conference on Neural Information Processing Systems - Volume 2, of NIPS'12, pages 3113–3121, USA, 2012. Curran Associates Inc.\n \n\n\n\n
\n\n\n\n \n \n \"OnePaper\n  \n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{Li:2012:OPH:2999325.2999482,\n author = {Li, Ping and Owen, Art B and Zhang, Cun-Hui},\n title = {One Permutation Hashing},\n booktitle = {Proceedings of the 25th International Conference on Neural Information Processing Systems - Volume 2},\n series = {NIPS'12},\n year = {2012},\n location = {Lake Tahoe, Nevada},\n pages = {3113--3121},\n numpages = {9},\n url = {http://dl.acm.org/citation.cfm?id=2999325.2999482},\n acmid = {2999482},\n publisher = {Curran Associates Inc.},\n address = {USA},\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n  \n 2011\n \n \n (3)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n Recovering semantics of tables on the web.\n \n \n \n\n\n \n Venetis, P.; Halevy, A.; Madhavan, J.; Paşca, M.; Shen, W.; Wu, F.; Miao, G.; and Wu, C.\n\n\n \n\n\n\n Proceedings of the VLDB Endowment, 4(9): 528–538. 2011.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{venetis2011recovering,\n  title={Recovering semantics of tables on the web},\n  author={Venetis, Petros and Halevy, Alon and Madhavan, Jayant and Pa{\\c{s}}ca, Marius and Shen, Warren and Wu, Fei and Miao, Gengxin and Wu, Chung},\n  journal={Proceedings of the VLDB Endowment},\n  volume={4},\n  number={9},\n  pages={528--538},\n  year={2011},\n  publisher={VLDB Endowment}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n A unified model for data and constraint repair.\n \n \n \n\n\n \n Chiang, F.; and Miller, R. J\n\n\n \n\n\n\n In 2011 IEEE 27th International Conference on Data Engineering, pages 446–457, 2011. IEEE\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n  \n \n 2 downloads\n \n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{chiang2011unified,\n  title={A unified model for data and constraint repair},\n  author={Chiang, Fei and Miller, Renee J},\n  booktitle={2011 IEEE 27th International Conference on Data Engineering},\n  pages={446--457},\n  year={2011},\n  organization={IEEE}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n \n Schema Mapping Evolution Through Composition and Inversion.\n \n \n \n \n\n\n \n Fagin, R.; Kolaitis, P. G.; Popa, L.; and Tan, W. C.\n\n\n \n\n\n\n In Schema Matching and Mapping, pages 191–222. 2011.\n \n\n\n\n
\n\n\n\n \n \n \"SchemaPaper\n  \n \n\n \n \n doi\n  \n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@incollection{DBLP:books/sp/bellahsene2011/FaginKPT11,\n  author    = {Ronald Fagin and\n               Phokion G. Kolaitis and\n               Lucian Popa and\n               Wang Chiew Tan},\n  title     = {Schema Mapping Evolution Through Composition and Inversion},\n  booktitle = {Schema Matching and Mapping},\n  pages     = {191--222},\n  year      = {2011},\n  url       = {https://doi.org/10.1007/978-3-642-16518-4\\_7},\n  doi       = {10.1007/978-3-642-16518-4\\_7},\n  timestamp = {Fri, 02 Nov 2018 09:27:04 +0100},\n  biburl    = {https://dblp.org/rec/bib/books/sp/bellahsene2011/FaginKPT11},\n  bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n  \n 2010\n \n \n (1)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n Annotating and searching web tables using entities, types and relationships.\n \n \n \n\n\n \n Limaye, G.; Sarawagi, S.; and Chakrabarti, S.\n\n\n \n\n\n\n Proceedings of the VLDB Endowment, 3(1-2): 1338–1347. 2010.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{limaye2010annotating,\n  title={Annotating and searching web tables using entities, types and relationships},\n  author={Limaye, Girija and Sarawagi, Sunita and Chakrabarti, Soumen},\n  journal={Proceedings of the VLDB Endowment},\n  volume={3},\n  number={1-2},\n  pages={1338--1347},\n  year={2010},\n  publisher={VLDB Endowment}\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n  \n 2009\n \n \n (1)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n Data integration for the relational web.\n \n \n \n\n\n \n Cafarella, M. J; Halevy, A.; and Khoussainova, N.\n\n\n \n\n\n\n Proceedings of the VLDB Endowment, 2(1): 1090–1101. 2009.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{cafarella2009data,\n  title={Data integration for the relational web},\n  author={Cafarella, Michael J and Halevy, Alon and Khoussainova, Nodira},\n  journal={Proceedings of the VLDB Endowment},\n  volume={2},\n  number={1},\n  pages={1090--1101},\n  year={2009},\n  publisher={VLDB Endowment}\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n  \n 2008\n \n \n (2)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n Webtables: exploring the power of tables on the web.\n \n \n \n\n\n \n Cafarella, M. J; Halevy, A.; Wang, D. Z.; Wu, E.; and Zhang, Y.\n\n\n \n\n\n\n Proceedings of the VLDB Endowment, 1(1): 538–549. 2008.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{cafarella2008webtables,\n  title={Webtables: exploring the power of tables on the web},\n  author={Cafarella, Michael J and Halevy, Alon and Wang, Daisy Zhe and Wu, Eugene and Zhang, Yang},\n  journal={Proceedings of the VLDB Endowment},\n  volume={1},\n  number={1},\n  pages={538--549},\n  year={2008},\n  publisher={VLDB Endowment}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Quantitative data cleaning for large databases.\n \n \n \n\n\n \n Hellerstein, J. M\n\n\n \n\n\n\n . 2008.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{hellerstein2008quantitative,\n  title={Quantitative data cleaning for large databases},\n  author={Hellerstein, Joseph M},\n  year={2008}\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n  \n 2007\n \n \n (4)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n PADS/ML: A functional data description language.\n \n \n \n\n\n \n Mandelbaum, Y.; Fisher, K.; Walker, D.; Fernandez, M.; and Gleyzer, A.\n\n\n \n\n\n\n In ACM SIGPLAN Notices, volume 42, pages 77–83, 2007. ACM\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{mandelbaum2007pads,\n  title={PADS/ML: A functional data description language},\n  author={Mandelbaum, Yitzhak and Fisher, Kathleen and Walker, David and Fernandez, Mary and Gleyzer, Artem},\n  booktitle={ACM SIGPLAN Notices},\n  volume={42},\n  number={1},\n  pages={77--83},\n  year={2007},\n  organization={ACM}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Yago: a core of semantic knowledge.\n \n \n \n\n\n \n Suchanek, F. M; Kasneci, G.; and Weikum, G.\n\n\n \n\n\n\n In Proceedings of the 16th international conference on World Wide Web, pages 697–706, 2007. ACM\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{suchanek2007yago,\n  title={Yago: a core of semantic knowledge},\n  author={Suchanek, Fabian M and Kasneci, Gjergji and Weikum, Gerhard},\n  booktitle={Proceedings of the 16th international conference on World Wide Web},\n  pages={697--706},\n  year={2007},\n  organization={ACM}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n \n Model Management and Schema Mappings: Theory and Practice.\n \n \n \n \n\n\n \n Bernstein, P. A.; and Ho, H.\n\n\n \n\n\n\n In Proceedings of the 33rd International Conference on Very Large Data Bases, University of Vienna, Austria, September 23-27, 2007, pages 1439–1440, 2007. \n \n\n\n\n
\n\n\n\n \n \n \"ModelPaper\n  \n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/vldb/BernsteinH07,\n  author    = {Philip A. Bernstein and\n               Howard Ho},\n  title     = {Model Management and Schema Mappings: Theory and Practice},\n  booktitle = {Proceedings of the 33rd International Conference on Very Large Data\n               Bases, University of Vienna, Austria, September 23-27, 2007},\n  pages     = {1439--1440},\n  year      = {2007},\n  crossref  = {DBLP:conf/vldb/2007},\n  url       = {http://www.vldb.org/conf/2007/papers/tutorials/p1439-bernstein.pdf},\n  timestamp = {Thu, 03 Mar 2016 17:54:19 +0100},\n  biburl    = {https://dblp.org/rec/bib/conf/vldb/BernsteinH07},\n  bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n \n Query-time Entity Resolution.\n \n \n \n \n\n\n \n Bhattacharya, I.; and Getoor, L.\n\n\n \n\n\n\n J. Artif. Intell. Res., 30: 621–657. 2007.\n \n\n\n\n
\n\n\n\n \n \n \"Query-timePaper\n  \n \n\n \n \n doi\n  \n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{DBLP:journals/jair/BhattacharyaG07,\n  author    = {Indrajit Bhattacharya and\n               Lise Getoor},\n  title     = {Query-time Entity Resolution},\n  journal   = {J. Artif. Intell. Res.},\n  volume    = {30},\n  pages     = {621--657},\n  year      = {2007},\n  url       = {https://doi.org/10.1613/jair.2290},\n  doi       = {10.1613/jair.2290},\n  timestamp = {Mon, 21 Jan 2019 15:01:17 +0100},\n  biburl    = {https://dblp.org/rec/bib/journals/jair/BhattacharyaG07},\n  bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n  \n 2006\n \n \n (1)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n Table extraction using spatial reasoning on the CSS2 visual box model.\n \n \n \n\n\n \n Gatterbauer, W.; and Bohunsky, P.\n\n\n \n\n\n\n In Proceedings of the National Conference on Artificial Intelligence, volume 21, pages 1313, 2006. Menlo Park, CA; Cambridge, MA; London; AAAI Press; MIT Press; 1999\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{gatterbauer2006table,\n  title={Table extraction using spatial reasoning on the CSS2 visual box model},\n  author={Gatterbauer, Wolfgang and Bohunsky, Paul},\n  booktitle={Proceedings of the National Conference on Artificial Intelligence},\n  volume={21},\n  number={2},\n  pages={1313},\n  year={2006},\n  organization={Menlo Park, CA; Cambridge, MA; London; AAAI Press; MIT Press; 1999}\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n  \n 2005\n \n \n (2)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n Data exchange: semantics and query answering.\n \n \n \n\n\n \n Fagin, R.; Kolaitis, P. G; Miller, R. J; and Popa, L.\n\n\n \n\n\n\n Theoretical Computer Science, 336(1): 89–124. 2005.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n  \n \n 2 downloads\n \n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{fagin2005data,\n  title={Data exchange: semantics and query answering},\n  author={Fagin, Ronald and Kolaitis, Phokion G and Miller, Ren{\\'e}e J and Popa, Lucian},\n  journal={Theoretical Computer Science},\n  volume={336},\n  number={1},\n  pages={89--124},\n  year={2005},\n  publisher={Elsevier}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n Schema and ontology matching with COMA++.\n \n \n \n\n\n \n Aumueller, D.; Do, H.; Massmann, S.; and Rahm, E.\n\n\n \n\n\n\n In Proceedings of the 2005 ACM SIGMOD international conference on Management of data, pages 906–908, 2005. Acm\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{aumueller2005schema,\n  title={Schema and ontology matching with COMA++},\n  author={Aumueller, David and Do, Hong-Hai and Massmann, Sabine and Rahm, Erhard},\n  booktitle={Proceedings of the 2005 ACM SIGMOD international conference on Management of data},\n  pages={906--908},\n  year={2005},\n  organization={Acm}\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n  \n 2004\n \n \n (1)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n \n Preserving mapping consistency under schema changes.\n \n \n \n \n\n\n \n Velegrakis, Y.; Miller, R. J.; and Popa, L.\n\n\n \n\n\n\n VLDB J., 13(3): 274–293. 2004.\n \n\n\n\n
\n\n\n\n \n \n \"PreservingPaper\n  \n \n\n \n \n doi\n  \n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n  \n \n 1 download\n \n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{DBLP:journals/vldb/VelegrakisMP04,\n  author    = {Yannis Velegrakis and\n               Ren{\\'{e}}e J. Miller and\n               Lucian Popa},\n  title     = {Preserving mapping consistency under schema changes},\n  journal   = {{VLDB} J.},\n  volume    = {13},\n  number    = {3},\n  pages     = {274--293},\n  year      = {2004},\n  url       = {https://doi.org/10.1007/s00778-004-0136-2},\n  doi       = {10.1007/s00778-004-0136-2},\n  timestamp = {Mon, 25 Dec 2017 02:18:30 +0100},\n  biburl    = {https://dblp.org/rec/bib/journals/vldb/VelegrakisMP04},\n  bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n  \n 2002\n \n \n (1)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n \n Data Integration: A Theoretical Perspective.\n \n \n \n \n\n\n \n Lenzerini, M.\n\n\n \n\n\n\n In Proceedings of the Twenty-first ACM SIGACT-SIGMOD-SIGART Symposium on Principles of Database Systems, June 3-5, Madison, Wisconsin, USA, pages 233–246, 2002. \n \n\n\n\n
\n\n\n\n \n \n \"DataPaper\n  \n \n\n \n \n doi\n  \n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{DBLP:conf/pods/Lenzerini02,\n  author    = {Maurizio Lenzerini},\n  title     = {Data Integration: {A} Theoretical Perspective},\n  booktitle = {Proceedings of the Twenty-first {ACM} {SIGACT-SIGMOD-SIGART} Symposium\n               on Principles of Database Systems, June 3-5, Madison, Wisconsin, {USA}},\n  pages     = {233--246},\n  year      = {2002},\n  crossref  = {DBLP:conf/pods/2002},\n  url       = {https://doi.org/10.1145/543613.543644},\n  doi       = {10.1145/543613.543644},\n  timestamp = {Tue, 06 Nov 2018 16:58:02 +0100},\n  biburl    = {https://dblp.org/rec/bib/conf/pods/Lenzerini02},\n  bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n  \n 2001\n \n \n (2)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n Generic schema matching with cupid.\n \n \n \n\n\n \n Madhavan, J.; Bernstein, P. A; and Rahm, E.\n\n\n \n\n\n\n In vldb, volume 1, pages 49–58, 2001. \n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{madhavan2001generic,\n  title={Generic schema matching with cupid},\n  author={Madhavan, Jayant and Bernstein, Philip A and Rahm, Erhard},\n  booktitle={vldb},\n  volume={1},\n  pages={49--58},\n  year={2001}\n}\n
\n
\n\n\n\n
\n\n\n
\n \n\n \n \n \n \n \n A survey of approaches to automatic schema matching.\n \n \n \n\n\n \n Rahm, E.; and Bernstein, P. A\n\n\n \n\n\n\n the VLDB Journal, 10(4): 334–350. 2001.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@article{rahm2001survey,\n  title={A survey of approaches to automatic schema matching},\n  author={Rahm, Erhard and Bernstein, Philip A},\n  journal={the VLDB Journal},\n  volume={10},\n  number={4},\n  pages={334--350},\n  year={2001},\n  publisher={Springer}\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n  \n 1999\n \n \n (1)\n \n \n
\n
\n \n \n
\n \n\n \n \n \n \n \n \n Consistent Query Answers in Inconsistent Databases.\n \n \n \n \n\n\n \n Arenas, M.; Bertossi, L.; and Chomicki, J.\n\n\n \n\n\n\n In Proceedings of the Eighteenth ACM SIGMOD-SIGACT-SIGART Symposium on Principles of Database Systems, of PODS '99, pages 68–79, New York, NY, USA, 1999. ACM\n \n\n\n\n
\n\n\n\n \n \n \"ConsistentPaper\n  \n \n\n \n \n doi\n  \n \n\n \n link\n  \n \n\n bibtex\n \n\n \n\n \n  \n \n 1 download\n \n \n\n \n \n \n \n \n \n \n\n  \n \n \n\n\n\n
\n
@inproceedings{Arenas:1999:CQA:303976.303983,\n author = {Arenas, Marcelo and Bertossi, Leopoldo and Chomicki, Jan},\n title = {Consistent Query Answers in Inconsistent Databases},\n booktitle = {Proceedings of the Eighteenth ACM SIGMOD-SIGACT-SIGART Symposium on Principles of Database Systems},\n series = {PODS '99},\n year = {1999},\n isbn = {1-58113-062-7},\n location = {Philadelphia, Pennsylvania, USA},\n pages = {68--79},\n numpages = {12},\n url = {http://doi.acm.org/10.1145/303976.303983},\n doi = {10.1145/303976.303983},\n acmid = {303983},\n publisher = {ACM},\n address = {New York, NY, USA},\n} \n\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n\n\n\n
\n\n\n \n\n \n \n \n \n\n
\n"}; document.write(bibbase_data.data);