AutoComp: Automated Data Compaction for Log-Structured Tables in Data Lake. Gruenheid, A., Camacho-Rodríguez, J., Curino, C., Ramakrishnan, R., Pak, S., Sakdeo, S., Gandhi, L., Singhal, S. K., Nilangekar, P., & Abadi, D. J. In SIGMOD, 2025.
Paper | BibTeX
@inproceedings{autocomp,
author = {Anja Gruenheid and Jesús Camacho-Rodríguez and Carlo Curino and Raghu Ramakrishnan and Stanislav Pak and Sumedh Sakdeo and Lenisha Gandhi and Sandeep K. Singhal and Pooja Nilangekar and Daniel J. Abadi},
title = {AutoComp: Automated Data Compaction for Log-Structured Tables in Data Lake},
booktitle = {SIGMOD},
year = {2025},
venue = {SIGMOD},
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = {http://www.cs.umd.edu/~abadi/papers/autocomp-sigmod.pdf},
keywords = {Open data formats, Data lakes},
}
Downloads: 0
{"_id":"h478DJ7P28TMH3Hi7","bibbaseid":"gruenheid-camachorodrguez-curino-ramakrishnan-pak-sakdeo-gandhi-singhal-etal-autocompautomateddatacompactionforlogstructuredtablesindatalake-2025","author_short":["Gruenheid, A.","Camacho-Rodríguez, J.","Curino, C.","Ramakrishnan, R.","Pak, S.","Sakdeo, S.","Gandhi, L.","Singhal, S. K.","Nilangekar, P.","Abadi, D. J."],"bibdata":{"bibtype":"inproceedings","type":"inproceedings","author":[{"firstnames":["Anja"],"propositions":[],"lastnames":["Gruenheid"],"suffixes":[]},{"firstnames":["Jesús"],"propositions":[],"lastnames":["Camacho-Rodríguez"],"suffixes":[]},{"firstnames":["Carlo"],"propositions":[],"lastnames":["Curino"],"suffixes":[]},{"firstnames":["Raghu"],"propositions":[],"lastnames":["Ramakrishnan"],"suffixes":[]},{"firstnames":["Stanislav"],"propositions":[],"lastnames":["Pak"],"suffixes":[]},{"firstnames":["Sumedh"],"propositions":[],"lastnames":["Sakdeo"],"suffixes":[]},{"firstnames":["Lenisha"],"propositions":[],"lastnames":["Gandhi"],"suffixes":[]},{"firstnames":["Sandeep","K."],"propositions":[],"lastnames":["Singhal"],"suffixes":[]},{"firstnames":["Pooja"],"propositions":[],"lastnames":["Nilangekar"],"suffixes":[]},{"firstnames":["Daniel","J."],"propositions":[],"lastnames":["Abadi"],"suffixes":[]}],"title":"AutoComp: Automated Data Compaction for Log-Structured Tables in Data Lake","booktitle":"SIGMOD","year":"2025","venue":"SIGMOD","publicationtype":"Conference Paper","displaycategory":"Conference or Journal Publication","url_paper":"http://www.cs.umd.edu/~abadi/papers/autocomp-sigmod.pdf","keywords":"Open data formats, Data lakes","bibtex":"@inproceedings{autocomp,\n author = {Anja Gruenheid and Jesús Camacho-Rodríguez and Carlo Curino and Raghu Ramakrishnan and Stanislav Pak and Sumedh Sakdeo and Lenisha Gandhi and Sandeep K. Singhal and Pooja Nilangekar and Daniel J. Abadi},\n title = {AutoComp: Automated Data Compaction for Log-Structured Tables in Data Lake},\n booktitle = {SIGMOD},\n year = {2025},\n venue = {SIGMOD},\n publicationtype = \"Conference Paper\",\n displayCategory = \"Conference or Journal Publication\",\n url_Paper = {http://www.cs.umd.edu/~abadi/papers/autocomp-sigmod.pdf},\n keywords = {Open data formats, Data lakes},\n}\n\n","author_short":["Gruenheid, A.","Camacho-Rodríguez, J.","Curino, C.","Ramakrishnan, R.","Pak, S.","Sakdeo, S.","Gandhi, L.","Singhal, S. K.","Nilangekar, P.","Abadi, D. J."],"key":"autocomp","id":"autocomp","bibbaseid":"gruenheid-camachorodrguez-curino-ramakrishnan-pak-sakdeo-gandhi-singhal-etal-autocompautomateddatacompactionforlogstructuredtablesindatalake-2025","role":"author","urls":{" paper":"http://www.cs.umd.edu/~abadi/papers/autocomp-sigmod.pdf"},"keyword":["Open data formats","Data lakes"],"metadata":{"authorlinks":{}}},"bibtype":"inproceedings","biburl":"cs.umd.edu/~abadi/pubs/abadirefs.bib","dataSources":["YdtR8AbetSqiZGCey","bHTCYJduhkrS5AHxu"],"keywords":["open data formats","data lakes"],"search_terms":["autocomp","automated","data","compaction","log","structured","tables","data","lake","gruenheid","camacho-rodríguez","curino","ramakrishnan","pak","sakdeo","gandhi","singhal","nilangekar","abadi"],"title":"AutoComp: Automated Data Compaction for Log-Structured Tables in Data Lake","year":2025}