C5: Cloned Concurrency Control That Always Keeps Up.
Helt, J.; Sharma, A.; Abadi, D. J.; Lloyd, W.; and Faleiro, J. M.
PVLDB 16(1), 2022.
paper
link
bibtex
@misc{c5,
author = {Jeffrey Helt and
Abhinav Sharma and
Daniel J. Abadi and
Wyatt Lloyd and
Jose M. Faleiro},
title = {{C5:} Cloned Concurrency Control That Always Keeps Up},
journal = {Proc. {VLDB} Endow.},
volume = {16},
number = {1},
pages = {1--14},
year = {2022},
howpublished = {PVLDB 16(1)},
venue = "PVLDB",
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/c5-paper.pdf",
}
BullFrog: Online Schema Evolution via Lazy Evaluation.
Bhattacherjee, S.; Liao, G.; Hicks, M.; and Abadi, D. J.
In
SIGMOD, 2021.
paper
link
bibtex
@inproceedings{bullfrog,
title = {BullFrog: Online Schema Evolution via Lazy Evaluation},
year = "2021",
booktitle = "SIGMOD",
venue = "SIGMOD",
author = {Souvik Bhattacherjee and Gang Liao and Michael Hicks and Daniel J. Abadi},
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/bullfrog-sigmod.pdf",
pdfKB = "1290",
iis1910613 = "Supported papers",
iis1718581 = "Supported papers",
keywords = "Schema evolution, Schema management, Scalable transactions",
}
AnyLog: a Grand Unification of the Internet of Things.
Abadi, D. J.; Arden, O.; Nawab, F.; and Shadmon, M.
In
CIDR, 2020.
paper
link
bibtex
1 download
@inproceedings{anylog,
author = {Daniel J. Abadi and Owen Arden and Faisal Nawab and Moshe Shadmon},
title = {AnyLog: a Grand Unification of the Internet of Things},
booktitle = "CIDR",
year = "2020",
venue = "CIDR",
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/anylogAbadiEtAl.pdf",
pdfKB = "256",
iis1910613 = "Supported papers",
keywords = "Decentralized database systems; Peer-to-peer database systems; Blockchain",
}
Integration of Large-Scale Data Processing Systems and Traditional Parallel Database Technology.
Abouzied, A.; Abadi, D. J.; Bajda-Pawlikowski, K.; and Silberschatz, A.
PVLDB 12(12), 2019.
paper
link
bibtex
3 downloads
@misc{hadoopdb-retrospective,
author = {Azza Abouzied and Daniel J. Abadi and Kamil Bajda-Pawlikowski and Avi Silberschatz},
title = {Integration of Large-Scale Data Processing Systems and Traditional Parallel Database Technology},
journal = {{PVLDB}},
volume = {12},
number = {12},
pages = {2290--2299},
year = {2019},
howpublished = {PVLDB 12(12)},
venue = "PVLDB",
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/20001-Abadi.pdf",
pdfKB = "",
iis1910613 = "Supported papers",
iis1718581 = "Supported papers",
keywords = "Scalable queries,Parallel database systems,Analytical database systems,HadoopDB,MapReduce,Non-relational data,Schema management,Graph database systems",
project:multiple = "HadoopDB",
}
SLOG: Serializable, Low-latency, Geo-replicated Transactions.
Ren, K.; Li, D.; and Abadi, D. J.
PVLDB 12(11), 2019.
paper
link
bibtex
@misc{slog,
author = {Kun Ren and Dennis Li and Daniel J. Abadi},
title = {SLOG: Serializable, Low-latency, Geo-replicated Transactions},
journal = {{PVLDB}},
volume = {12},
number = {11},
pages = {1747--1761},
year = {2019},
howpublished = {PVLDB 12(11)},
venue = "PVLDB",
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/1154-Abadi.pdf",
pdfKB = "",
iis1527118 = "Supported papers",
iis1718581 = "Supported papers",
keywords = "Scalable transactions,Deterministic systems,Distributed systems,Calvin",
project:multiple = "SLOG;Calvin",
}
The FuzzyLog: A Partially Ordered Shared Log.
Lockerman, J.; Faleiro, J. M.; Kim, J.; Sankaran, S.; Abadi, D. J.; Aspnes, J.; Sen, S.; and Balakrishnan, M.
In
OSDI, 2018.
paper
link
bibtex
1 download
@inproceedings {fuzzylog,
author = {Joshua Lockerman and Jose M. Faleiro and Juno Kim and Soham Sankaran and Daniel J. Abadi and James Aspnes and Siddhartha Sen and Mahesh Balakrishnan},
title = {The FuzzyLog: A Partially Ordered Shared Log},
booktitle = "OSDI",
year = "2018",
venue = "OSDI",
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/fuzzylog.pdf",
pdfKB = "7244",
iis1718581 = "Supported papers",
keywords = "Scalable transactions,Distributed systems",
project:multiple = "SLOG;Calvin",
}
An Overview of Deterministic Database Systems.
Abadi, D. J.; and Faleiro, J. M.
CACM, 61(9), September 2018.
paper
link
bibtex
1 download
@misc{determinism-cacm,
author = {Daniel J. Abadi and Jose M. Faleiro},
title = {An Overview of Deterministic Database Systems},
howpublished = {CACM, 61(9)},
month = {September},
year = {2018},
pages = {78-88},
venue = {CACM},
url_Paper = "http://www.cs.umd.edu/~abadi/papers/abadi-cacm2018.pdf",
pdfKB = "5530",
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
iis1527118 = "Supported papers",
iis1718581 = "Supported papers",
keywords = "Calvin,Scalable transactions,Distributed systems,Deterministic systems,Main-memory database systems",
project:multiple = "SLOG;Calvin",
}
Latch-free Synchronization in Database Systems: Silver Bullet or Fool's Gold?.
Faleiro, J. M.; and Abadi, D. J.
In
CIDR, 2017.
paper
link
bibtex
@inproceedings{latch-free-sync,
author = {Jose M. Faleiro and Daniel J. Abadi},
title = {Latch-free Synchronization in Database Systems: Silver Bullet or Fool's Gold?},
booktitle = "CIDR",
year = "2017",
venue = "CIDR",
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/latch-free-cidr2017.pdf",
pdfKB = "378",
iis1527118 = "Supported papers",
keywords = "Scalable transactions,Multi-core systems,Main-memory database systems",
}
Automatic Generation of Normalized Relational Schemas from Nested Key-Value Data.
DiScala, M.; and Abadi, D. J.
In
SIGMOD, 2016.
paper
link
bibtex
@inproceedings{schemagen,
title = {Automatic Generation of Normalized Relational Schemas from Nested Key-Value Data},
year = "2016",
booktitle = "SIGMOD",
venue = "SIGMOD",
author = {Michael DiScala and Daniel J. Abadi},
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/schemagen-sigmod16.pdf",
pdfKB = "926",
iis1527118 = "Supported papers",
keywords = "Non-relational data, Schema management",
}
Design Principles for Scaling Multi-core OLTP Under High Contention.
Ren, K.; Faleiro, J.; and Abadi, D. J.
In
SIGMOD, 2016.
paper
link
bibtex
@inproceedings{orthrus,
title = {Design Principles for Scaling Multi-core OLTP Under High Contention},
year = "2016",
booktitle = "SIGMOD",
venue = "SIGMOD",
author = {Kun Ren and Jose Faleiro and Daniel J. Abadi},
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/orthrus-sigmod16.pdf",
pdfKB = "349",
iis1527118 = "Supported papers",
keywords = "Scalable transactions,Multi-core systems,Main-memory database systems",
}
Low-Overhead Asynchronous Checkpointing in Main-Memory Database Systems.
Ren, K.; Diamond, T.; Abadi, D. J.; and Thomson, A.
In
SIGMOD, 2016.
paper
link
bibtex
@inproceedings{fast-checkpoint,
title = {Low-Overhead Asynchronous Checkpointing in Main-Memory Database Systems},
year = "2016",
booktitle = "SIGMOD",
venue = "SIGMOD",
author = {Kun Ren and Thaddeus Diamond and Daniel J. Abadi and Alexander Thomson},
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/fast-checkpoint-sigmod16.pdf",
pdfKB = "436",
iis1527118 = "Supported papers",
keywords = "Scalable transactions,Main-memory database systems,Deterministic systems",
}
Scalable Pattern Matching Over Compressed Graphs via Dedensification.
Maccioni, A.; and Abadi, D. J.
In
KDD, 2016.
paper
link
bibtex
1 download
@inproceedings{graph-dedense,
title = {Scalable Pattern Matching Over Compressed Graphs via Dedensification},
year = "2016",
booktitle = "KDD",
venue = "KDD",
author = {Antonio Maccioni and Daniel J. Abadi},
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/graph-dedense.pdf",
pdfKB = "678",
iis1527118 = "Supported papers",
keywords = "Non-relational data, Graph database systems",
}
LEOPARD: Lightweight Edge-Oriented Partitioning and Replication for Dynamic Graphs.
Huang, J.; and Abadi, D. J.
PVLDB 9(7): 540-551, 2016.
paper
link
bibtex
@misc{leopard,
author = {Jiewen Huang and Daniel J. Abadi},
title = {LEOPARD: Lightweight Edge-Oriented Partitioning and Replication for Dynamic Graphs},
journal = {{PVLDB}},
volume = {9},
number = {7},
pages = {540-551},
year = {2016},
howpublished = {PVLDB 9(7): 540-551},
venue = "PVLDB",
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/leopard-vldb16.pdf",
pdfKB = "609",
iis1527118 = "Supported papers",
keywords = "Non-relational data, Graph database systems,Distributed systems",
}
Rethinking serializable multiversion concurrency control.
Faleiro, J. M.; and Abadi, D. J.
PVLDB 8(11): 1190-1201, 2015.
paper
link
bibtex
1 download
@misc{rethink-mvcc,
author = {Jose M. Faleiro and Daniel J. Abadi},
title = {Rethinking serializable multiversion concurrency control},
journal = {{PVLDB}},
volume = {8},
number = {11},
pages = {1190-1201},
year = {2015},
howpublished = {PVLDB 8(11): 1190-1201},
venue = "PVLDB",
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/rethink-mvcc.pdf",
pdfKB = "524",
iis1527118 = "Relevant prior work",
iis1718581 = "Relevant prior work",
iis1249722 = "Supported papers",
keywords = "Scalable transactions,Multi-core systems,Main-memory database systems,Deterministic systems",
}
VLL: A Lock Manager Redesign for Main Memory Database Systems.
Ren, K.; Thomson, A.; and Abadi, D. J.
VLDB Journal 24(5): 681-705, October 2015.
paper
link
bibtex
@misc{vll-vldbj,
author = {Kun Ren and Alexander Thomson and Daniel J. Abadi},
title = {VLL: A Lock Manager Redesign for Main Memory Database Systems},
journal = {{VLDB Journal}},
volume = {24},
number = {5},
howpublished = {VLDB Journal 24(5): 681-705},
month = {October},
year = {2015},
pages = {681-705},
venue = {VLDB Journal},
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/vldbj-vll.pdf",
pdfKB = "3464",
publicationtype = "Journal Article",
iis1527118 = "Relevant prior work",
iis1249722 = "Supported papers",
keywords = "Scalable transactions,Multi-core systems,Main-memory database systems,Distributed systems,Calvin,Deterministic systems",
project:multiple = "Calvin",
}
Lazy Evaluation of Transactions in Database Systems.
Faleiro, J.; Thomson, A.; and Abadi, D. J.
In
SIGMOD, 2014.
paper
link
bibtex
@inproceedings{lazy-xacts,
title = "Lazy Evaluation of Transactions in Database Systems",
year = "2014",
booktitle = "SIGMOD",
venue = "SIGMOD",
author = {Jose Faleiro and Alexander Thomson and Daniel J. Abadi},
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/lazy-xacts.pdf",
pdfKB = "774",
iis1527118 = "Relevant prior work",
iis1718581 = "Relevant prior work",
iis1249722 = "Supported papers",
keywords = "Scalable transactions,Multi-core systems,Main-memory database systems,Deterministic systems",
}
Sinew: a SQL System for Unified Analytics of Multi-structured Data.
Tahara, D.; Diamond, T.; and Abadi, D. J.
In
SIGMOD, 2014.
paper
link
bibtex
@inproceedings{sinew,
title = "Sinew: a SQL System for Unified Analytics of Multi-structured Data",
year = "2014",
booktitle = "SIGMOD",
venue = "SIGMOD",
author = {Daniel Tahara and Thaddeus Diamond and Daniel J. Abadi},
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/sinew-sigmod14.pdf",
pdfKB = "715",
iis0845643 = "Supported papers",
keywords = "Non-relational data, Schema management",
}
An Evaluation of the Advantages and Disadvantages of Deterministic Database Systems.
Ren, K.; Thomson, A.; and Abadi, D. J.
PVLDB 7(10): 821-832, 2014.
paper
link
bibtex
@misc{determinism-eval,
title = "An Evaluation of the Advantages and Disadvantages of Deterministic Database Systems",
howpublished = {PVLDB 7(10): 821-832},
year = "2014",
venue = "PVLDB",
author = {Kun Ren and Alexander Thomson and Daniel J. Abadi},
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/determinism-eval.pdf",
pdfKB = "524",
iis1527118 = "Relevant prior work",
iis1249722 = "Supported papers",
keywords = "Scalable transactions,Distributed systems,Calvin,Deterministic systems",
project:multiple = "Calvin",
}
Fast Distributed Transactions and Strongly Consistent Replication for OLTP Database Systems.
Thomson, A.; Diamond, T.; Weng, S.; Ren, K.; Shao, P.; and Abadi, D. J.
ACM TODS 39(2): 11, 2014.
paper
link
bibtex
@misc{calvin-tods,
title = "Fast Distributed Transactions and Strongly Consistent Replication for OLTP Database Systems",
howpublished = {ACM TODS 39(2): 11},
year = "2014",
venue = "TODS",
author = {Alexander Thomson and Thaddeus Diamond and Shu-Chun Weng and Kun Ren and Philip Shao and Daniel J. Abadi},
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/calvin-tods14.pdf",
pdfKB = "1987",
keywords = "Scalable transactions,Distributed systems,Calvin,Deterministic systems",
project:multiple = "Calvin",
}
Query Optimization of Distributed Pattern Matching.
Huang, J.; Venkatraman, K.; and Abadi, D. J.
In
ICDE, 2014.
paper
link
bibtex
1 download
@inproceedings{subgraph-opt,
title = "Query Optimization of Distributed Pattern Matching",
year = "2014",
booktitle = "ICDE",
venue = "ICDE",
author = {Jiewen Huang and Kartik Venkatraman and Daniel J. Abadi},
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/subgraph-opt.pdf",
pdfKB = "446",
iis0845643 = "Supported papers",
keywords = "Non-relational data,Graph database systems,Distributed systems,Scalable queries,Parallel database systems",
}
The Beckman Report on Database Research.
Abadi, D. J.; Agrawal, R.; Ailamaki, A.; Balazinska, M.; Bernstein, P. A.; Carey, M. J.; Chaudhuri, S.; Dean, J.; Doan, A.; Franklin, M. J.; Gehrke, J.; Haas, L. M.; Halevy, A. Y.; Hellerstein, J. M.; Ioannidis, Y. E.; Jagadish, H. V.; Kossmann, D.; Madden, S.; Mehrotra, S.; Milo, T.; Naughton, J. F.; Ramakrishnan, R.; Markl, V.; Olston, C.; Ooi, B. C.; Re, C.; Suciu, D.; Stonebraker, M.; Walter, T.; and Widom, J.
SIGMOD Record, 43(3): 61-70, 2014.
paper
link
bibtex
@misc{beckman-report,
author = {Daniel J. Abadi and Rakesh Agrawal and Anastasia Ailamaki and Magdalena Balazinska and Philip A. Bernstein and Michael J. Carey and Surajit Chaudhuri and Jeffrey Dean and AnHai Doan and Michael J. Franklin and Johannes Gehrke and Laura M. Haas and Alon Y. Halevy and Joseph M. Hellerstein and Yannis E. Ioannidis and H. V. Jagadish and Donald Kossmann and Samuel Madden and Sharad Mehrotra and Tova Milo and Jeffrey F. Naughton and Raghu Ramakrishnan and Volker Markl and Christopher Olston and Beng Chin Ooi and Christopher Re and Dan Suciu and Michael Stonebraker and Todd Walter and Jennifer Widom},
title = {The Beckman Report on Database Research},
journal = {{SIGMOD} Record},
volume = {43},
number = {3},
pages = {61-70},
year = {2014},
howpublished = {SIGMOD Record, 43(3): 61-70},
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/beckman-report2013.pdf",
pdfKB = "122",
}
Modularity and Scalability in Calvin.
Thomson, A.; and Abadi, D. J.
IEEE Data Engineering Bulletin, 36(2): 48-55, 2013.
paper
link
bibtex
@misc{modular-calvin,
author = {Alexander Thomson and Daniel J. Abadi},
title = {Modularity and Scalability in Calvin},
howpublished = {IEEE Data Engineering Bulletin, 36(2): 48-55},
venue = {IEEE Data Engineering Bulletin},
volume = {36},
number = {2},
year = {2013},
pages = {48-55},
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/scalable-calvin.pdf",
pdfKB = "628",
iis1527118 = "Relevant prior work",
iis1249722 = "Supported papers",
keywords = "Scalable transactions,Distributed systems,Calvin,Deterministic systems",
project:multiple = "Calvin",
}
The Design and Implementation of Modern Column-Oriented Database Systems.
Abadi, D.; Boncz, P.; Harizopoulos, S.; Idreos, S.; and Madden, S.
Foundations and Trends in Databases, 5(3): 197-280, 2013.
paper
link
bibtex
2 downloads
@misc{abadi-column-store-survery,
number = {3},
volume = {5},
pages = {197-280},
year = {2013},
title = {The Design and Implementation of Modern Column-Oriented Database Systems},
author = {Daniel Abadi and Peter Boncz and Stavros Harizopoulos and Stratos Idreos and Samuel Madden},
howpublished = {Foundations and Trends in Databases, 5(3): 197-280},
venue = {Foundations and Trends in Databases},
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/abadi-column-stores.pdf",
pdfKB = "1997",
keywords = "Scalable queries,Parallel database systems,Analytical database systems,Column-stores,C-Store",
project:multiple = "C-Store",
}
Invisible Loading: Access-Driven Data Transfer from Raw Files into Database Systems.
Abouzied, A.; Abadi, D. J.; and Silberschatz, A.
In
EDBT, 2013.
paper
link
bibtex
@inproceedings{invisible-loading,
title = "Invisible Loading: Access-Driven Data Transfer from Raw Files into Database Systems",
year = "2013",
booktitle = "EDBT",
venue = "EDBT",
author = {Azza Abouzied and Daniel J. Abadi and Avi Silberschatz},
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/invisibleloading.pdf",
pdfKB = "470",
iis0845643 = "Supported papers",
keywords = "Scalable queries,Parallel database systems,Analytical database systems,HadoopDB,MapReduce",
project:multiple = "HadoopDB",
}
Lightweight Locking for Main Memory Database Systems.
Ren, K.; Thomson, A.; and Abadi, D. J.
PVLDB 6(2): 145-156, 2012.
paper
link
bibtex
@misc{abadi-vll,
title = "Lightweight Locking for Main Memory Database Systems",
howpublished = {PVLDB 6(2): 145-156},
year = "2012",
venue = "PVLDB",
author = {Kun Ren and Alexander Thomson and Daniel J. Abadi},
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/vll-vldb13.pdf",
pdfKB = "1018",
iis1249722 = "Supported papers",
keywords = "Scalable transactions,Multi-core systems,Main-memory database systems,Distributed systems,Calvin,Deterministic systems",
project:multiple = "Calvin",
}
Consistency Tradeoffs in Modern Distributed Database System Design: CAP is Only Part of the Story.
Abadi, D. J.
IEEE Computer, 45(2), 2012.
paper
link
bibtex
@misc{abadi-pacelc,
author = {Daniel J. Abadi},
title = {Consistency Tradeoffs in Modern Distributed Database System Design: CAP is Only Part of the Story},
howpublished = {IEEE Computer, 45(2)},
year = {2012},
pages = {37-42},
venue = {IEEE Computer},
url_Paper = "http://www.cs.umd.edu/~abadi/papers/abadi-pacelc.pdf",
pdfKB = "62",
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
keywords = "Scalable transactions,Distributed systems,Consistency guarantees,PACELC",
}
Calvin: Fast Distributed Transactions for Partitioned Database Systems.
Thomson, A.; Diamond, T.; Weng, S.; Ren, K.; Shao, P.; and Abadi, D. J.
In
SIGMOD, 2012.
paper
link
bibtex
1 download
@inproceedings{calvin,
title = "Calvin: Fast Distributed Transactions for Partitioned Database Systems",
year = "2012",
booktitle = "SIGMOD",
venue = "SIGMOD",
author = {Alexander Thomson and Thaddeus Diamond and Shu-Chun Weng and Kun Ren and Philip Shao and Daniel J. Abadi},
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/calvin-sigmod12.pdf",
pdfKB = "544",
iis1527118 = "Relevant prior work",
iis0845643 = "Supported papers",
keywords = "Scalable transactions,Distributed systems,Calvin,Deterministic systems",
project:multiple = "Calvin",
}
Scalable SPARQL Querying of Large RDF Graphs.
Huang, J.; Abadi, D. J.; and Ren, K.
PVLDB, 4(21), August 2011.
paper
link
bibtex
@misc{scalable-subgraphs,
author = {Jiewen Huang and Daniel J. Abadi and Kun Ren},
title = {Scalable SPARQL Querying of Large RDF Graphs},
howpublished = {PVLDB, 4(21)},
month = {August},
year = {2011},
pages = {1123-1134},
venue = {PVLDB},
url_Paper = "http://www.cs.umd.edu/~abadi/papers/sw-graph-scale.pdf",
pdfKB = "457",
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
iis0845643 = "Supported papers",
keywords = "Non-relational data, Graph database systems, Distributed systems,Scalable queries,Parallel database systems,Analytical database systems",
}
Efficient Processing of Data Warehousing Queries in a Split Execution Environment.
Bajda-Pawlikowski, K.; Abadi, D. J.; Silberschatz, A.; and Paulson, E.
In
SIGMOD, 2011.
paper
link
bibtex
@inproceedings{split-execution,
title = "Efficient Processing of Data Warehousing Queries in a Split Execution Environment",
year = "2011",
booktitle = "SIGMOD",
venue = "SIGMOD",
author = {Kamil Bajda-Pawlikowski and Daniel J. Abadi and Avi Silberschatz and Erik Paulson},
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/split-execution-hadoopdb.pdf",
pdfKB = "609",
nsfclue = "Supported papers",
keywords = "Scalable queries,Parallel database systems,Analytical database systems,HadoopDB,MapReduce",
project:multiple = "HadoopDB",
}
Building Deterministic Transaction Processing Systems without Deterministic Thread Scheduling.
Thomson, A.; and Abadi, D. J.
In
WODET, 2011.
paper
link
bibtex
@inproceedings{transactions-wodet11,
title = "Building Deterministic Transaction Processing Systems without Deterministic Thread Scheduling",
year = "2011",
booktitle = "WODET",
venue = "The 2nd Workshop on Determinism and Correctness in Parallel Programming",
author = {Alexander Thomson and Daniel J. Abadi},
publicationtype = "Workshop Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/transactions-wodet11.pdf",
pdfKB = "223",
keywords = "Scalable transactions,Calvin,Deterministic systems",
project:multiple = "Calvin",
}
The Case for Determinism in Database Systems.
Thomson, A.; and Abadi, D. J.
PVLDB, 3(1), September 2010.
paper
link
bibtex
1 download
@misc{dbms-determinism,
title = "The Case for Determinism in Database Systems",
howpublished = {PVLDB, 3(1)},
month = {September},
year = "2010",
venue = "PVLDB",
pages = {70-80},
author = {Alexander Thomson and Daniel J. Abadi},
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/determinism-vldb10.pdf",
pdfKB = "550",
iis0845643 = "Supported papers",
keywords = "Scalable transactions,Distributed systems,Calvin,Deterministic systems",
project:multiple = "Calvin",
}
Low Overhead Concurrency Control for Partitioned Main Memory Databases.
Jones, E. P. C.; Abadi, D. J.; and Madden, S.
In
SIGMOD, 2010.
paper
link
bibtex
@inproceedings{hstore-cc,
title = "Low Overhead Concurrency Control for Partitioned Main Memory Databases",
year = "2010",
booktitle = "SIGMOD",
venue = "SIGMOD",
author = {Evan P. C. Jones and Daniel J. Abadi and Samuel Madden},
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/hstore-cc.pdf",
pdfKB = "300",
iis0845643 = "Supported papers",
keywords = "Scalable transactions,Multi-core systems,Main-memory database systems,Distributed systems,H-Store",
project:multiple = "H-Store",
}
MapReduce and Parallel DBMSs: Friends or Foes?.
Stonebraker, M.; Abadi, D. J.; DeWitt, D. J.; Madden, S.; Paulson, E.; Pavlo, A.; and Rasin, A.
CACM, 53(1), January 2010.
paper
link
bibtex
1 download
@misc{mr-cacm,
author = {Michael Stonebraker and Daniel J. Abadi and David. J. DeWitt and Samuel Madden and Erik Paulson and Andrew Pavlo and Alexander Rasin},
title = {MapReduce and Parallel DBMSs: Friends or Foes?},
howpublished = {CACM, 53(1)},
month = {January},
year = {2010},
pages = {64-71},
venue = {CACM},
url_Paper = "http://www.cs.umd.edu/~abadi/papers/mr-cacm2010.pdf",
pdfKB = "3625",
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
nsfclue = "Supported papers",
keywords = "Scalable queries,Parallel database systems,Analytical database systems,MapReduce",
}
HadoopDB: An Architectural Hybrid of MapReduce and DBMS Technologies for Analytical Workloads.
Abouzied, A.; Bajda-Pawlikowski, K.; Abadi, D. J.; Silberschatz, A.; and Rasin, A.
PVLDB, 2(1), August 2009.
VLDB Test of Time Award
paper
link
bibtex
@misc{hadoopdb,
title = "HadoopDB: An Architectural Hybrid of MapReduce and DBMS Technologies for Analytical Workloads",
howpublished = {PVLDB, 2(1)},
month = {August},
year = {2009},
pages = {922-933},
venue = {PVLDB},
author = {Azza Abouzied and Kamil Bajda-Pawlikowski and Daniel J. Abadi and Avi Silberschatz and Alexander Rasin},
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/hadoopdb.pdf",
pdfKB = "400",
iis0845643 = "Supported papers",
award = "VLDB Test of Time Award",
note = "<u>VLDB Test of Time Award</u>",
nsfclue = "Supported papers",
keywords = "Scalable queries,Parallel database systems,Analytical database systems,HadoopDB,MapReduce",
project:multiple = "HadoopDB",
}
A Comparison of Approaches to Large Scale Data Analysis.
Pavlo, A.; Paulson, E.; Rasin, A.; Abadi, D. J.; DeWitt, D. J.; Madden, S. R.; and Stonebraker, M.
In
SIGMOD, Providence, Rhode Island, USA, 2009.
paper
link
bibtex
1 download
@inproceedings{benchmarks-sigmod09,
title = "A Comparison of Approaches to Large Scale Data Analysis",
year = "2009",
booktitle = "SIGMOD",
venue = "SIGMOD",
address = "Providence, Rhode Island, USA",
author = {Andrew Pavlo and Erik Paulson and Alexander Rasin and Daniel J. Abadi and David J. DeWitt and Samuel R. Madden and Michael Stonebraker},
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/benchmarks-sigmod09.pdf",
pdfKB = "251",
nsfclue = "Supported papers",
keywords = "Scalable queries,Parallel database systems,Analytical database systems,MapReduce",
}
Data Management in the Cloud: Limitations and Opportunities.
Abadi, D. J.
IEEE Data Engineering Bulletin, 32(1), March 2009.
paper
link
bibtex
1 download
@misc{abadi-ieee-cloud,
author = {Daniel J. Abadi},
title = {Data Management in the Cloud: Limitations and Opportunities},
howpublished = {IEEE Data Engineering Bulletin, 32(1)},
month = {March},
year = {2009},
pages = {3-12},
venue = {IEEE Data Engineering Bulletin},
url_Paper = "http://www.cs.umd.edu/~abadi/papers/abadi-cloud-ieee09.pdf",
pdfKB = "62",
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
iis0845643 = "Supported papers",
keywords = "Scalable queries,Parallel database systems,Analytical database systems,MapReduce",
}
SW-Store: A Vertically Partitioned DBMS for Semantic Web Data Management.
Abadi, D. J.; Marcus, A.; Madden, S. R.; and Hollenbach, K.
VLDB Journal, 18(2), April 2009.
paper
link
bibtex
@misc{abadi-swstore,
author = {Daniel J. Abadi and Adam Marcus and Samuel R. Madden and Kate Hollenbach},
title = {SW-Store: A Vertically Partitioned DBMS for Semantic Web Data Management},
howpublished = {VLDB Journal, 18(2)},
month = {April},
year = {2009},
pages = {385-406},
venue = {VLDB Journal},
url_Paper = "http://www.cs.umd.edu/~abadi/papers/abadi-rdf-vldbj.pdf",
pdfKB = "1124",
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
iis0845643 = "Supported papers",
keywords = "Non-relational data,Scalable queries,Parallel database systems,Analytical database systems,Column-stores,C-Store",
project:multiple = "C-Store",
}
Column-Stores vs. Row-Stores: How Different Are They Really?.
Abadi, D. J.; Madden, S. R.; and Hachem, N.
In
SIGMOD, Vancouver, Canada, 2008.
paper
link
bibtex
3 downloads
@inproceedings{abadi-sigmod08,
title = "Column-Stores vs. Row-Stores: How Different Are They Really?",
year = "2008",
booktitle = "SIGMOD",
venue = "SIGMOD",
address = "Vancouver, Canada",
author = {Daniel J. Abadi and Samuel R. Madden and Nabil Hachem},
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/abadi-sigmod08.pdf",
pdfKB = "424",
keywords = "Analytical database systems,Column-stores,C-Store",
project:multiple = "C-Store",
}
OLTP Through the Looking Glass, And What We Found There.
Harizopoulos, S.; Abadi, D. J.; Madden, S. R.; and Stonebraker, M.
In
SIGMOD, Vancouver, Canada, 2008.
paper
link
bibtex
4 downloads
@inproceedings{oltp-perf,
title = "OLTP Through the Looking Glass, And What We Found There",
year = "2008",
booktitle = "SIGMOD",
venue = "SIGMOD",
address = "Vancouver, Canada",
author = {Stavros Harizopoulos and Daniel J. Abadi and Samuel R. Madden and Michael Stonebraker},
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
pdfKB = "287",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/oltpperf-sigmod08.pdf",
keywords = "Scalable transactions,Multi-core systems,Main-memory database systems,H-Store",
project:multiple = "H-Store",
}
Scalable Semantic Web Data Management Using Vertical Partitioning.
Abadi, D. J.; Marcus, A.; Madden, S. R.; and Hollenbach, K.
In
VLDB, Vienna, Austria, 2007.
Best Paper Award
paper
link
bibtex
abstract
@inproceedings{abadi-rdf,
title = "Scalable Semantic Web Data Management Using Vertical Partitioning",
year = "2007",
booktitle = "VLDB",
address = "Vienna, Austria",
venue = "VLDB",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/abadirdf.pdf",
author = {Daniel J. Abadi and Adam Marcus and Samuel R. Madden and Kate Hollenbach},
abstract = "Efficient management of RDF data is an important factor in realizing the Semantic Web vision. Performance and scalability issues are becoming increasingly pressing as Semantic Web technology is applied to real-world applications. In this paper, we examine the reasons why current data management solutions for RDF data scale poorly, and explore the fundamental scalability limitations of these approaches. We review the state of the art for improving performance for RDF databases and consider a recent suggestion, 'property tables'. We then discuss practically and empirically why this solution has undesirable features. As an improvement, we propose an alternative solution: vertically partitioning the RDF data. We compare the performance of vertical partitioning with prior art on queries generated by a Web-based RDF browser over a large-scale (more than 50 million triples) catalog of library data. Our results show that a vertical partitioned schema achieves similar performance to the property table technique while being much simpler to design. Further, if a column-oriented DBMS (a database architected specially for the vertically partitioned case) is used instead of a row-oriented DBMS, another order of magnitude performance improvement is observed, with query times dropping from minutes to several seconds.",
pdfKB = "246",
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
award = "Best Paper Award",
note = "<u>Best Paper Award</u>",
keywords = "Scalable queries,Parallel database systems,Analytical database systems,Column-stores,C-Store,Non-relational data",
project:multiple = "C-Store",
}
Efficient management of RDF data is an important factor in realizing the Semantic Web vision. Performance and scalability issues are becoming increasingly pressing as Semantic Web technology is applied to real-world applications. In this paper, we examine the reasons why current data management solutions for RDF data scale poorly, and explore the fundamental scalability limitations of these approaches. We review the state of the art for improving performance for RDF databases and consider a recent suggestion, 'property tables'. We then discuss practically and empirically why this solution has undesirable features. As an improvement, we propose an alternative solution: vertically partitioning the RDF data. We compare the performance of vertical partitioning with prior art on queries generated by a Web-based RDF browser over a large-scale (more than 50 million triples) catalog of library data. Our results show that a vertical partitioned schema achieves similar performance to the property table technique while being much simpler to design. Further, if a column-oriented DBMS (a database architected specially for the vertically partitioned case) is used instead of a row-oriented DBMS, another order of magnitude performance improvement is observed, with query times dropping from minutes to several seconds.
The End of an Architectural Era (It's Time for a Complete Rewrite).
Stonebraker, M.; Madden, S. R.; Abadi, D. J.; Harizopoulos, S.; Hachem, N.; and Helland, P.
In
VLDB, Vienna, Austria, 2007.
paper
link
bibtex
abstract
1 download
@inproceedings{hstore,
author = {Michael Stonebraker and Samuel R. Madden and Daniel J. Abadi and Stavros Harizopoulos and Nabil Hachem and Pat Helland},
title = {The End of an Architectural Era (It's Time for a Complete Rewrite)},
booktitle = {VLDB},
year = {2007},
address = {Vienna, Austria},
venue = "VLDB",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/vldb07hstore.pdf",
abstract = "In previous papers, some of us predicted the end of 'one size fits all' as a commercial relational DBMS paradigm. These papers presented reasons and experimental evidence that showed that the major relational RDBMS vendors can be outperformed by 1-2 orders of magnitude by specialized engines in the data warehouse, stream processing, text, and scientific database markets. Assuming that specialized engines dominate these markets over time, the current relational DBMS code lines will be left with the business data processing (OLTP) market and hybrid markets where more than one capability is required. In this paper we show that current RDBMSs can be beaten by nearly two orders of magnitude in the OLTP market as well. The experimental evidence comes from comparing a new OLTP prototype, H-Store, which we have built at M.I.T., to a popular RDBMS on the standard transactional benchmark, TPC-C. We conclude that current RDBMS code lines, while attempting to be a 'one size fits all' solution, in fact, excel at nothing. Hence, they are 25 year old legacy code lines that should be retired in favor of a collection of 'from scratch' specialized engines. The DBMS vendors (and research community) should start with a clean sheet of paper and design systems for tomorrow's requirements, not continue to push code lines and architectures designed for yesterday's needs.",
pdfKB = "444",
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
keywords = "Scalable transactions,Multi-core systems,Main-memory database systems,Distributed systems,H-Store",
project:multiple = "H-Store",
}
In previous papers, some of us predicted the end of 'one size fits all' as a commercial relational DBMS paradigm. These papers presented reasons and experimental evidence that showed that the major relational RDBMS vendors can be outperformed by 1-2 orders of magnitude by specialized engines in the data warehouse, stream processing, text, and scientific database markets. Assuming that specialized engines dominate these markets over time, the current relational DBMS code lines will be left with the business data processing (OLTP) market and hybrid markets where more than one capability is required. In this paper we show that current RDBMSs can be beaten by nearly two orders of magnitude in the OLTP market as well. The experimental evidence comes from comparing a new OLTP prototype, H-Store, which we have built at M.I.T., to a popular RDBMS on the standard transactional benchmark, TPC-C. We conclude that current RDBMS code lines, while attempting to be a 'one size fits all' solution, in fact, excel at nothing. Hence, they are 25 year old legacy code lines that should be retired in favor of a collection of 'from scratch' specialized engines. The DBMS vendors (and research community) should start with a clean sheet of paper and design systems for tomorrow's requirements, not continue to push code lines and architectures designed for yesterday's needs.
Column Stores for Wide and Sparse Data.
Abadi, D. J.
In
CIDR, Asilomar, CA, USA, 2007.
paper
link
bibtex
abstract
@inproceedings{abadi-cidr,
author = {Daniel J. Abadi},
title = {Column Stores for Wide and Sparse Data},
booktitle = {CIDR},
year = {2007},
address = {Asilomar, CA, USA},
venue = "CIDR",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/abadicidr07.pdf",
abstract = "While it is generally accepted that data warehouses and OLAP workloads are excellent applications for column-stores, this paper speculates that column-stores may well be suited for additional applications. In particular we observe that column-stores do not see a performance degradation when storing extremely wide tables, and column-stores handle sparse data very well. These two properties lead us to conjecture that column-stores may be good storage layers for Semantic Web data, XML data, and data with GEM-style schemas.",
pdfKB = "156",
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
keywords = "Column-stores,C-Store",
project:multiple = "C-Store",
}
While it is generally accepted that data warehouses and OLAP workloads are excellent applications for column-stores, this paper speculates that column-stores may well be suited for additional applications. In particular we observe that column-stores do not see a performance degradation when storing extremely wide tables, and column-stores handle sparse data very well. These two properties lead us to conjecture that column-stores may be good storage layers for Semantic Web data, XML data, and data with GEM-style schemas.
Materialization Strategies in a Column-Oriented DBMS.
Abadi, D. J.; Myers, D. S.; DeWitt, D. J.; and Madden, S. R.
In
ICDE, pages 466-475, Istanbul, Turkey, 2007.
paper
link
bibtex
abstract
@inproceedings{cstore-mat,
author = {Daniel J. Abadi and Daniel S. Myers and David J. DeWitt and Samuel R. Madden},
title = {Materialization Strategies in a Column-Oriented DBMS},
booktitle = {ICDE},
year = {2007},
address = {Istanbul, Turkey},
pages = {466-475},
venue = "ICDE",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/abadiicde2007.pdf",
abstract = "There has been renewed interest in column-oriented database architectures in recent years. For read-mostly query workloads such as those found in data warehouse and decision support applications, column-stores have been shown to perform particularly well relative to row-stores. In order for column-stores to be readily adopted as a replacement for row-stores, however, they must present the same interface to client applications as do row stores, which implies that they must output row-store-style tuples. Thus, the input columns stored on disk must be converted to rows at some point in the query plan, but the optimal point at which to do the conversion is not obvious. This problem can be considered as the opposite of the projection problem in row-store systems: while row-stores need to determine where in query plans to place projection operators to make tuples narrower, column-stores need to determine when to combine single-column projections into wider tuples. This paper describes a variety of strategies for tuple construction and intermediate result representations and provides a systematic evaluation of these strategies.",
pdfKB = "327",
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
keywords = "Analytical database systems,Column-stores,C-Store",
project:multiple = "C-Store",
}
There has been renewed interest in column-oriented database architectures in recent years. For read-mostly query workloads such as those found in data warehouse and decision support applications, column-stores have been shown to perform particularly well relative to row-stores. In order for column-stores to be readily adopted as a replacement for row-stores, however, they must present the same interface to client applications as do row stores, which implies that they must output row-store-style tuples. Thus, the input columns stored on disk must be converted to rows at some point in the query plan, but the optimal point at which to do the conversion is not obvious. This problem can be considered as the opposite of the projection problem in row-store systems: while row-stores need to determine where in query plans to place projection operators to make tuples narrower, column-stores need to determine when to combine single-column projections into wider tuples. This paper describes a variety of strategies for tuple construction and intermediate result representations and provides a systematic evaluation of these strategies.
Integrating Compression and Execution in Column-Oriented Database Systems.
Abadi, D. J.; Madden, S. R.; and Ferreira, M.
In
SIGMOD, pages 671-682, Chicago, IL, USA, 2006.
paper
link
bibtex
abstract
@inproceedings{cstore-comp,
author = {Daniel J. Abadi and Samuel R. Madden and Miguel Ferreira},
title = {Integrating Compression and Execution in Column-Oriented Database Systems},
booktitle = {SIGMOD},
year = {2006},
address = {Chicago, IL, USA},
pages = {671-682},
venue = "SIGMOD",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/abadisigmod06.pdf",
abstract = "Column-oriented database system architectures invite a re-evaluation of how and when data in databases is compressed. Storing data in a column-oriented fashion greatly increases the similarity of adjacent records on disk and thus opportunities for compression. The ability to compress many adjacent tuples at once lowers the per-tuple cost of compression, both in terms of CPU and space overheads. In this paper, we discuss how we extended C-Store (a column-oriented DBMS) with a compression sub-system. We show how compression schemes not traditionally used in row-oriented DBMSs can be applied to column-oriented systems. We then evaluate a set of compression schemes and show that the best scheme depends not only on the properties of the data but also on the nature of the query workload.",
pdfKB = "265",
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
keywords = "Scalable queries,Analytical database systems,Column-stores,C-Store",
project:multiple = "C-Store",
}
Column-oriented database system architectures invite a re-evaluation of how and when data in databases is compressed. Storing data in a column-oriented fashion greatly increases the similarity of adjacent records on disk and thus opportunities for compression. The ability to compress many adjacent tuples at once lowers the per-tuple cost of compression, both in terms of CPU and space overheads. In this paper, we discuss how we extended C-Store (a column-oriented DBMS) with a compression sub-system. We show how compression schemes not traditionally used in row-oriented DBMSs can be applied to column-oriented systems. We then evaluate a set of compression schemes and show that the best scheme depends not only on the properties of the data but also on the nature of the query workload.
REED: Robust, Efficient Filtering and Event Detection in Sensor Networks.
Abadi, D. J.; Madden, S. R.; and Lindner, W.
In
VLDB, pages 769-780, Trondheim, Norway, 2005.
paper
link
bibtex
abstract
@inproceedings{reed,
author = {Daniel J. Abadi and Samuel R. Madden and Wolfgang Lindner},
title = {REED: Robust, Efficient Filtering and Event Detection in Sensor Networks},
booktitle = {VLDB},
year = {2005},
address = {Trondheim, Norway},
pages = {769-780},
venue = "VLDB",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/abadivldb05.pdf",
abstract = "This paper presents a set of algorithms for efficiently evaluating join queries over static data tables in sensor networks. We describe and evaluate three algorithms that take advantage of distributed join techniques. Our algorithms are capable of running in limited amounts of RAM, can distribute the storage burden over groups of nodes, and are tolerant to dropped packets and node failures. REED is thus suitable for a wide range of event-detection applications that traditional sensor network database and data collection systems cannot be used to implement.",
pdfKB = "292",
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
keywords = "Analytical database systems,Distributed systems,Streaming data,Stream database systems",
}
This paper presents a set of algorithms for efficiently evaluating join queries over static data tables in sensor networks. We describe and evaluate three algorithms that take advantage of distributed join techniques. Our algorithms are capable of running in limited amounts of RAM, can distribute the storage burden over groups of nodes, and are tolerant to dropped packets and node failures. REED is thus suitable for a wide range of event-detection applications that traditional sensor network database and data collection systems cannot be used to implement.
C-Store: A Column-Oriented DBMS.
Stonebraker, M.; Abadi, D. J.; Batkin, A.; Chen, X.; Cherniack, M.; Ferreira, M.; Lau, E.; Lin, A.; Madden, S. R.; O'Neil, E. J.; O'Neil, P. E.; Rasin, A.; Tran, N.; and Zdonik, S. B.
In
VLDB, pages 553-564, Trondheim, Norway, 2005.
10 Year Best Paper Award
paper
link
bibtex
abstract
@inproceedings{cstore,
author = {Michael Stonebraker and Daniel J. Abadi and Adam Batkin and Xuedong Chen and Mitch Cherniack and Miguel Ferreira and Edmond Lau and Amerson Lin and Samuel R. Madden and Elizabeth J. O'Neil and Patrick E. O'Neil and Alexander Rasin and Nga Tran and Stan B. Zdonik},
title = {C-Store: A Column-Oriented DBMS},
booktitle = {VLDB},
year = {2005},
address = {Trondheim, Norway},
pages = {553-564},
venue = "VLDB",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/vldb.pdf",
abstract = "This paper presents the design of a read-optimized relational DBMS that contrasts sharply with most current systems, which are write-optimized. Among the many differences in its design are: storage of data by column rather than by row, careful coding and packing of objects into storage including main memory during query processing, storing an overlapping collection of column-oriented projections, rather than the current fare of tables and indexes, a non-traditional implementation of transactions which includes high availability and snapshot isolation for read-only transactions, and the extensive use of bitmap indexes to complement B-tree structures. We present preliminary performance data on a subset of TPC-H and show that the system we are building, C-Store, is substantially faster than popular commercial products. Hence, the architecture looks very encouraging.",
pdfKB = "170",
publicationtype = "Conference Paper",
award = "10 Year Best Paper Award",
note = "<u>10 Year Best Paper Award</u>",
displayCategory = "Conference or Journal Publication",
keywords = "Scalable queries,Parallel database systems,Analytical database systems,Column-stores,C-Store",
project:multiple = "C-Store",
}
This paper presents the design of a read-optimized relational DBMS that contrasts sharply with most current systems, which are write-optimized. Among the many differences in its design are: storage of data by column rather than by row, careful coding and packing of objects into storage including main memory during query processing, storing an overlapping collection of column-oriented projections, rather than the current fare of tables and indexes, a non-traditional implementation of transactions which includes high availability and snapshot isolation for read-only transactions, and the extensive use of bitmap indexes to complement B-tree structures. We present preliminary performance data on a subset of TPC-H and show that the system we are building, C-Store, is substantially faster than popular commercial products. Hence, the architecture looks very encouraging.
The Design of the Borealis Stream Processing Engine.
Abadi, D. J.; Ahmad, Y.; Balazinska, M.; Cetintemel, U.; Cherniack, M.; Hwang, J.; Lindner, W.; Maskey, A. S.; Rasin, A.; Ryvkina, E.; Tatbul, N.; Xing, Y.; and Zdonik, S. B.
In
CIDR, Asilomar, CA, USA, 2005.
paper
link
bibtex
abstract
@inproceedings{borealis,
author = {Daniel J. Abadi and Yanif Ahmad and Magdalena Balazinska and Ugur Cetintemel and Mitch Cherniack and Jeong-Hyon Hwang and Wolfgang Lindner and Anurag S. Maskey and Alexander Rasin and Esther Ryvkina and Nesime Tatbul and Ying Xing and Stan B. Zdonik},
title = {The Design of the Borealis Stream Processing Engine},
booktitle = {CIDR},
year = {2005},
address = {Asilomar, CA, USA},
venue = "CIDR",
url_Paper = "http://www.cs.umd.edu/~abadi/papers/cidr05.pdf",
abstract = "Borealis is a second-generation distributed stream processing engine that is being developed at Brandeis University, Brown University, and MIT. Borealis inherits core stream processing functionality from Aurora and distribution functionality from Medusa. Borealis modifies and extends both systems in non-trivial and critical ways to provide advanced capabilities that are commonly required by newly-emerging stream processing applications. In this paper, we outline the basic design and functionality of Borealis. Through sample real-world applications, we motivate the need for dynamically revising query results and modifying query specifications. We then describe how Borealis addresses these challenges through an innovative set of features, including revision records, time travel, and control lines. Finally, we present a highly flexible and scalable QoS-based optimization model that operates across server and sensor networks and a new fault-tolerance model with flexible consistency-availability trade-offs.",
pdfKB = "143",
publicationtype = "Conference Paper",
displayCategory = "Conference or Journal Publication",
keywords = "Streaming data, Stream database systems,Distributed systems",
project:multiple = "Aurora",
}
Borealis is a second-generation distributed stream processing engine that is being developed at Brandeis University, Brown University, and MIT. Borealis inherits core stream processing functionality from Aurora and distribution functionality from Medusa. Borealis modifies and extends both systems in non-trivial and critical ways to provide advanced capabilities that are commonly required by newly-emerging stream processing applications. In this paper, we outline the basic design and functionality of Borealis. Through sample real-world applications, we motivate the need for dynamically revising query results and modifying query specifications. We then describe how Borealis addresses these challenges through an innovative set of features, including revision records, time travel, and control lines. Finally, we present a highly flexible and scalable QoS-based optimization model that operates across server and sensor networks and a new fault-tolerance model with flexible consistency-availability trade-offs.
Aurora: A New Model and Architecture for Data Stream Management.
Abadi, D. J.; Carney, D.; Cetintemel, U.; Cherniack, M.; Convey, C.; Lee, S.; Stonebraker, M.; Tatbul, N.; and Zdonik, S. B.
VLDB Journal, 12(2), September 2003.
paper
link
bibtex
abstract
@misc{aurora,
author = {Daniel J. Abadi and Don Carney and Ugur Cetintemel and Mitch Cherniack and Christian Convey and Sangdon Lee and Michael Stonebraker and Nesime Tatbul and Stan B. Zdonik},
title = {Aurora: A New Model and Architecture for Data Stream Management},
howpublished = {VLDB Journal, 12(2)},
month = {September},
year = {2003},
pages = {120-139},
venue = {VLDB Journal},
url_Paper = "http://www.cs.umd.edu/~abadi/papers/vldb095.pdf",
abstract = "This paper describes the basic processing model and architecture of Aurora, a new system to manage data streams for monitoring applications. Monitoring applications differ substantially from conventional business data processing. The fact that a software system must process and react to continual inputs from many sources (e.g., sensors) rather than from human operators requires one to rethink the fundamental architecture of a DBMS for this application area. In this paper, we present Aurora, a new DBMS currently under construction at Brandeis University, Brown University, and M.I.T. We first provide an overview of the basic Aurora model and architecture and then describe in detail a stream-oriented set of operators.",
pdfKB = "984",
publicationtype = "Journal Article",
displayCategory = "Conference or Journal Publication",
keywords = "Streaming data, Stream database systems",
project:multiple = "Aurora",
}
%% Technical Reports
This paper describes the basic processing model and architecture of Aurora, a new system to manage data streams for monitoring applications. Monitoring applications differ substantially from conventional business data processing. The fact that a software system must process and react to continual inputs from many sources (e.g., sensors) rather than from human operators requires one to rethink the fundamental architecture of a DBMS for this application area. In this paper, we present Aurora, a new DBMS currently under construction at Brandeis University, Brown University, and M.I.T. We first provide an overview of the basic Aurora model and architecture and then describe in detail a stream-oriented set of operators.