paper-2019-CIDR/oliver.bib

756 lines
21 KiB
BibTeX

% Proceedings volume of SIGMOD 2004 (editors, full title, year).
@proceedings{DBLP:conf/sigmod/2004,
  editor = {Gerhard Weikum and Arnd Christian König and Stefan Deßloch},
  title  = {Proceedings of the ACM SIGMOD International Conference on Management of Data, Paris, France, June 13-18, 2004},
  year   = {2004},
}
% Proceedings volume of ICDE 2009 (editors, full title, year).
@proceedings{DBLP:conf/icde/2009,
  editor = {Yannis E. Ioannidis and Dik Lun Lee and Raymond T. Ng},
  title  = {Proceedings of the 25th International Conference on Data Engineering, ICDE 2009, March 29 2009 - April 2 2009, Shanghai, China},
  year   = {2009},
}
% Proceedings volume of SIGMOD 2016 (editors, full title, year).
@proceedings{DBLP:conf/sigmod/2016,
  editor = {Fatma Özcan and Georgia Koutrika and Sam Madden},
  title  = {Proceedings of the 2016 International Conference on Management of Data, SIGMOD Conference 2016, San Francisco, CA, USA, June 26 - July 01, 2016},
  year   = {2016},
}
% Proceedings volume of ICDE 2018 (no editor recorded).
@proceedings{DBLP:conf/icde/2018,
  title = {34th IEEE International Conference on Data Engineering, ICDE 2018, Paris, France, April 16-19, 2018},
  year  = {2018},
}
% PODS 2003 conference paper.
@inproceedings{CL03b,
  author    = {Andrea Calì and Domenico Lembo and Riccardo Rosati},
  title     = {On the decidability and complexity of query answering over inconsistent and incomplete databases},
  booktitle = {PODS},
  editor    = {Frank Neven and Catriel Beeri and Tova Milo},
  pages     = {260--271},
  year      = {2003},
}
% ICDE 2007 paper. Entered as inproceedings (the conference type is only a
% legacy alias); the system name MayBMS is braced so sentence-casing styles
% do not turn it into Maybms.
@inproceedings{AK07,
  author    = {Antova, L. and Koch, C. and Olteanu, D.},
  title     = {{MayBMS}: Managing incomplete information with probabilistic world-set decompositions},
  booktitle = {ICDE},
  pages     = {1479--1480},
  year      = {2007},
}
% TKDE 30(3), 2018 journal article; projects is a non-standard annotation field.
@article{AG17c,
  author   = {Bahareh Arab and Dieter Gawlick and Vasudha Krishnaswamy and Venkatesh Radhakrishnan and Boris Glavic},
  title    = {Using Reenactment to Retroactively Capture Provenance for Transactions},
  journal  = {TKDE},
  volume   = {30},
  number   = {3},
  pages    = {599--612},
  year     = {2018},
  projects = {GProM; Reenactment},
}
% IEEE Data Eng. Bull. 41(1), 2018. The proper noun Swiss Army is braced so
% that sentence-casing styles do not lowercase it.
@article{AF18,
  author   = {Bahareh Arab and Su Feng and Boris Glavic and Seokki Lee and Xing Niu and Qitian Zeng},
  title    = {{GProM} - A {Swiss} {Army} Knife for Your Provenance Needs},
  journal  = {IEEE Data Eng. Bull.},
  volume   = {41},
  number   = {1},
  pages    = {51--62},
  year     = {2018},
  projects = {GProM; Reenactment},
}
% Book chapter. The incollection type requires a publisher, so it is supplied
% here to avoid a missing-field warning.
@incollection{BC04a,
  author    = {Bertossi, Leopoldo and Chomicki, Jan},
  title     = {Query answering in inconsistent databases},
  booktitle = {Logics for emerging applications of databases},
  publisher = {Springer},
  pages     = {43--83},
  year      = {2004},
}
% PVLDB 8(12), 2015. DataHub is braced to survive sentence-casing styles.
@article{BD15,
  author  = {Bhardwaj, Anant and Deshpande, Amol and Elmore, Aaron J and Karger, David and Madden, Sam and Parameswaran, Aditya and Subramanyam, Harihar and Wu, Eugene and Zhang, Rebecca},
  title   = {Collaborative data analytics with {DataHub}},
  journal = {PVLDB},
  volume  = {8},
  number  = {12},
  pages   = {1916--1919},
  year    = {2015},
}
% PVLDB 8(12), 2015 journal article.
@article{BC15a,
  author  = {Bhattacherjee, Souvik and Chavan, Amit and Huang, Silu and Deshpande, Amol and Parameswaran, Aditya},
  title   = {Principles of dataset versioning: Exploring the recreation/storage tradeoff},
  journal = {PVLDB},
  volume  = {8},
  number  = {12},
  pages   = {1346--1357},
  year    = {2015},
}
% ICDE 2009 conference paper.
@inproceedings{DBLP:conf/icde/LiuJ09,
  author    = {Bin Liu and H. V. Jagadish},
  title     = {A Spreadsheet Algebra for a Direct Data Manipulation Query Interface},
  booktitle = {ICDE},
  pages     = {417--428},
  year      = {2009},
}
% ACM Comput. Surv. 41(1), 2009; articleno, issue_date and numpages are
% publisher-export fields kept as recorded.
@article{BN09,
  author     = {Bleiholder, Jens and Naumann, Felix},
  title      = {Data fusion},
  journal    = {ACM Comput. Surv.},
  volume     = {41},
  number     = {1},
  pages      = {1:1--1:41},
  year       = {2009},
  articleno  = {1},
  numpages   = {41},
  issue_date = {December 2008},
  issn       = {0360-0300},
  address    = {New York, NY, USA},
}
% Chapter in a Festschrift volume. It is a contribution to a book, so the book
% title belongs in booktitle of an incollection entry rather than in the
% journal field of an article. SQL is braced against sentence-casing styles.
@incollection{GM13,
  author    = {Boris Glavic and Renée J. Miller and Gustavo Alonso},
  title     = {Using {SQL} for Efficient Generation and Querying of Provenance Information},
  booktitle = {In search of elegance in the theory and practice of computation: a Festschrift in honour of Peter Buneman},
  publisher = {Springer},
  pages     = {291--320},
  year      = {2013},
  projects  = {Perm},
}
% Concurrency and Computation: Practice and Experience 20(5), 2008.
@article{BM08,
  author  = {Bowers, Shawn and McPhillips, Timothy and Ludäscher, Bertram},
  title   = {Provenance in Collection-oriented Scientific Workflows},
  journal = {Concurrency and Computation: Practice and Experience},
  volume  = {20},
  number  = {5},
  pages   = {519--529},
  year    = {2008},
}
% ICDE Workshops 2006, single-page paper: a one-page item is written as a
% single page number rather than a degenerate range. VisTrails casing is
% restored and braced so styles cannot lowercase it.
@inproceedings{CF06b,
  author    = {Callahan, Steven P and Freire, Juliana and Santos, Emanuele and Scheidegger, Carlos E and Silva, Claudio T and Vo, Huy T},
  title     = {Managing the evolution of dataflows with {VisTrails}},
  booktitle = {ICDE Workshops},
  pages     = {71},
  year      = {2006},
}
% Concurrency and Computation: Practice and Experience 20(5), 2008.
@article{DBLP:journals/concurrency/ScheideggerKSVCFS08,
  author  = {Carlos Eduardo Scheidegger and David Koop and Emanuele Santos and Huy T. Vo and Steven P. Callahan and Juliana Freire and Cláudio T. Silva},
  title   = {Tackling the Provenance Challenge one layer at a time},
  journal = {Concurrency and Computation: Practice and Experience},
  volume  = {20},
  number  = {5},
  pages   = {473--483},
  year    = {2008},
}
% K-CAP Workshops 2017. The title carries no trailing period (the style adds
% punctuation) and the acronym NiW is braced against sentence-casing.
@inproceedings{CW17a,
  author    = {Carvalho, Lucas AMC and Wang, Regina and Gil, Yolanda and Garijo, Daniel},
  title     = {{NiW}: Converting Notebooks into Workflows to Capture Dataflow and Provenance},
  booktitle = {K-CAP Workshops},
  pages     = {12--16},
  year      = {2017},
}
% Foundations and Trends in Databases 1(4), 2009 survey.
@article{CC09,
  author  = {Cheney, James and Chiticariu, Laura and Tan, Wang-Chiew},
  title   = {Provenance in Databases: Why, How, and Where},
  journal = {Foundations and Trends in Databases},
  volume  = {1},
  number  = {4},
  pages   = {379--474},
  year    = {2009},
}
% KR 2018 conference paper. The booktitle has no trailing period, since the
% bibliography style supplies the punctuation after it.
@inproceedings{CL18a,
  author    = {Cristina Civili and Leonid Libkin},
  title     = {Approximating Certainty in Querying Data and Metadata},
  booktitle = {Principles of Knowledge Representation and Reasoning: Proceedings of the Sixteenth International Conference, KR 2018, Tempe, Arizona, 30 October - 2 November 2018},
  pages     = {582--591},
  year      = {2018},
}
% PVLDB 1(1), 2008. The acronym PRISM is braced against sentence-casing styles.
@article{Curino:2008:GDS:1453856.1453939,
  author  = {Curino, Carlo A. and Moon, Hyun J. and Zaniolo, Carlo},
  title   = {Graceful Database Schema Evolution: The {PRISM} Workbench},
  journal = {PVLDB},
  volume  = {1},
  number  = {1},
  pages   = {761--772},
  year    = {2008},
}
% IPAW 2016 conference paper.
@inproceedings{DBLP:conf/ipaw/Koop16,
  author    = {David Koop},
  title     = {Versioning Version Trees: The Provenance of Actions that Affect Multiple Versions},
  booktitle = {IPAW},
  pages     = {109--121},
  year      = {2016},
}
% SIGMOD 2008 conference paper.
@inproceedings{DF08,
  author    = {Davidson, Susan B and Freire, Juliana},
  title     = {Provenance and scientific workflows: challenges and opportunities},
  booktitle = {SIGMOD},
  pages     = {1345--1350},
  year      = {2008},
}
% IEEE Data Eng. Bull., 2007, issue 4. The bulletin publishes one volume per
% year (volume 29 in 2006, 35 in 2012, 41 in 2018 in this file), so the 2007
% volume is 30.
@article{DC07,
  author  = {Davidson, Susan B. and Cohen-Boulakia, Sarah and Eyal, Anat and Ludäscher, Bertram and McPhillips, Timothy and Bowers, Shawn and Freire, Juliana},
  title   = {Provenance in Scientific Workflow Systems},
  journal = {IEEE Data Eng. Bull.},
  volume  = {30},
  number  = {4},
  pages   = {44--50},
  year    = {2007},
}
% VLDBJ 14(4), 2005 journal article.
@article{DBLP:journals/vldb/BhagwatCTV05,
  author  = {Deepavali Bhagwat and Laura Chiticariu and Wang Chiew Tan and Gaurav Vijayvargiya},
  title   = {An annotation management system for relational databases},
  journal = {VLDBJ},
  volume  = {14},
  number  = {4},
  pages   = {373--396},
  year    = {2005},
}
% SIGMOD 2016 conference paper.
@inproceedings{DBLP:conf/sigmod/BakkeK16,
  author    = {Eirik Bakke and David R. Karger},
  title     = {Expressive Query Construction through Direct Manipulation of Nested Relational Results},
  booktitle = {SIGMOD},
  pages     = {1377--1392},
  year      = {2016},
}
% IEEE Data Eng. Bull. 35(3), 2012. The acronym HCI is braced so that
% sentence-casing styles do not render it as hci.
@article{DBLP:journals/debu/LiJ12,
  author  = {Fei Li and H. V. Jagadish},
  title   = {Usability, Databases, and {HCI}},
  journal = {IEEE Data Eng. Bull.},
  volume  = {35},
  number  = {3},
  pages   = {37--45},
  year    = {2012},
}
% SIGMOD 2019 conference paper (no page range recorded).
@inproceedings{feng:2019:sigmod:uncertainty,
  author    = {Feng, Su and Huber, Aaron and Glavic, Boris and Kennedy, Oliver},
  title     = {Uncertainty Annotated Databases - A Lightweight Approach for Approximating Certain Answers},
  booktitle = {SIGMOD},
  year      = {2019},
}
% ICDE 2006, single-page paper. The system name MONDRIAN is braced; without
% braces sentence-casing styles print it as Mondrian.
@inproceedings{DBLP:conf/icde/GeertsKM06,
  author    = {Floris Geerts and Anastasios Kementsietsidis and Diego Milano},
  title     = {{MONDRIAN}: Annotating and Querying Databases through Colors and Blocks},
  booktitle = {ICDE},
  pages     = {82},
  year      = {2006},
}
% HILDA 2016 workshop paper (no page range recorded).
@inproceedings{freire:2016:hilda:exception,
  author    = {Freire, Juliana and Glavic, Boris and Kennedy, Oliver and Mueller, Heiko},
  title     = {The Exception That Improves The Rule},
  booktitle = {HILDA},
  year      = {2016},
}
% ICDT 2005 conference paper.
@inproceedings{FM05,
  author    = {Fuxman, Ariel D and Miller, Renée J},
  title     = {First-order query rewriting for inconsistent databases},
  booktitle = {ICDT},
  pages     = {337--351},
  year      = {2005},
}
% International Journal of Approximate Reasoning, volume 83, 2017.
@article{GP17,
  author  = {Geerts, Floris and Pijcke, Fabian and Wijsen, Jef},
  title   = {First-order under-approximations of consistent query answers},
  journal = {International Journal of Approximate Reasoning},
  volume  = {83},
  pages   = {337--355},
  year    = {2017},
}
% PVLDB 3(1), 2010 journal article.
@article{DBLP:journals/pvldb/BeskalesIG10,
  author  = {George Beskales and Ihab F. Ilyas and Lukasz Golab},
  title   = {Sampling the Repairs of Functional Dependency Violations under Hard Constraints},
  journal = {PVLDB},
  volume  = {3},
  number  = {1},
  pages   = {197--207},
  year    = {2010},
}
% ICDE 2010 paper. ProbClean is braced so its internal capital survives
% sentence-casing styles.
@inproceedings{BS10a,
  author    = {George Beskales and Mohamed A. Soliman and Ihab F. Ilyas and Shai Ben-David and Yubin Kim},
  title     = {{ProbClean}: A probabilistic duplicate detection system},
  booktitle = {ICDE},
  pages     = {1193--1196},
  year      = {2010},
}
% PVLDB 5(12), 2012; the ampersand in the title is TeX-escaped.
@article{GM12,
  author  = {Getoor, Lise and Machanavajjhala, Ashwin},
  title   = {Entity resolution: theory, practice \& open challenges},
  journal = {PVLDB},
  volume  = {5},
  number  = {12},
  pages   = {2018--2019},
  year    = {2012},
}
% SIGMOD Record 46(3), 2017. SQL is braced against sentence-casing styles.
@article{GL17,
  author  = {Guagliardo, Paolo and Libkin, Leonid},
  title   = {Correctness of {SQL} Queries on Databases with Nulls},
  journal = {SIGMOD Record},
  volume  = {46},
  number  = {3},
  pages   = {5--16},
  year    = {2017},
}
% OSDI 2010 paper. The title carries no trailing period; the bibliography
% style supplies the closing punctuation.
@inproceedings{GR10,
  author    = {Gunda, Pradeep Kumar and Ravindranath, Lenin and Thekkath, Chandramohan A and Yu, Yuan and Zhuang, Li},
  title     = {Nectar: Automatic Management of Data and Computation in Datacenters},
  booktitle = {OSDI},
  pages     = {75--88},
  year      = {2010},
}
% VLDB Journal survey. The journal is abbreviated VLDBJ like the other VLDB
% Journal entries in this file; volume, issue and pages are those of the
% printed issue rather than the online-first pagination.
% NOTE(review): volume/number/pages entered from the published record; confirm.
@article{HD17,
  author  = {Herschel, Melanie and Diestelkämper, Ralf and Lahmar, Houssem Ben},
  title   = {A survey on provenance: What for? What form? What from?},
  journal = {VLDBJ},
  volume  = {26},
  number  = {6},
  pages   = {881--906},
  year    = {2017},
}
% JACM 31(4), 1984. The second author is written in the "Last, Jr., First"
% form so that Jr. is parsed as a suffix rather than as part of the surname,
% and the accented n uses the brace-first form BibTeX treats as one letter.
% NOTE(review): this is the same article as the entry keyed
% Imielinski:1984:IIR:1634.1886; cite only one of the two keys per document.
@article{IL84a,
  author  = {Imieli{\'n}ski, Tomasz and Lipski, Jr., Witold},
  title   = {Incomplete Information in Relational Databases},
  journal = {JACM},
  volume  = {31},
  number  = {4},
  pages   = {761--791},
  year    = {1984},
}
% J. ACM 31(4), 1984 (publisher export). The accented n uses the brace-first
% form BibTeX treats as one letter, and the Jr. suffix is spaced normally.
% NOTE(review): this is the same article as the entry keyed IL84a; cite only
% one of the two keys per document.
@article{Imielinski:1984:IIR:1634.1886,
  author    = {Imieli{\'n}ski, Tomasz and Lipski, Jr., Witold},
  title     = {Incomplete Information in Relational Databases},
  journal   = {J. ACM},
  volume    = {31},
  number    = {4},
  pages     = {761--791},
  year      = {1984},
  numpages  = {31},
  issuedate = {Oct. 1984},
  issn      = {0004-5411},
  address   = {New York, NY, USA},
}
% PVLDB 10(7), 2017 journal article.
@article{DBLP:journals/pvldb/SzlichtaGGKS17,
  author  = {Jaroslaw Szlichta and Parke Godfrey and Lukasz Golab and Mehdi Kargar and Divesh Srivastava},
  title   = {Effective and Complete Discovery of Order Dependencies via Set-based Axiomatization},
  journal = {PVLDB},
  volume  = {10},
  number  = {7},
  pages   = {721--732},
  year    = {2017},
}
% ICDE 2008 paper. Authors are listed in the order of the published paper, and
% the compound surname Das Sarma uses the comma form so BibTeX does not treat
% Das as a given name.
% NOTE(review): author order taken from the published record; confirm.
@inproceedings{WT08,
  author    = {Das Sarma, Anish and Theobald, Martin and Widom, Jennifer},
  title     = {Exploiting Lineage for Confidence Computation in Uncertain and Probabilistic Databases},
  booktitle = {ICDE},
  pages     = {1023--1032},
  year      = {2008},
}
% Online video talk, 2018; the link is stored in howpublished.
@misc{grus:2018:notebooks,
  author       = {Joel Grus},
  title        = {I don't like notebooks.},
  howpublished = {https://www.youtube.com/watch?v=7jiPeIFXb6U},
  year         = {2018},
}
% Computing in Science and Engineering 14(4), 2012. VisTrails is braced
% against sentence-casing styles; ee is a non-standard link field kept as is.
@article{FS12,
  author  = {Juliana Freire and Cláudio T. Silva},
  title   = {Making Computations and Publications Reproducible with {VisTrails}},
  journal = {Computing in Science and Engineering},
  volume  = {14},
  number  = {4},
  pages   = {18--25},
  year    = {2012},
  ee      = {http://doi.ieeecomputersociety.org/10.1109/MCSE.2012.76},
}
% VLDBJ 27(4), 2018 journal article.
@article{DBLP:journals/vldb/HerrmannVPL18,
  author  = {Kai Herrmann and Hannes Voigt and Torben Bach Pedersen and Wolfgang Lehner},
  title   = {Multi-schema-version data management: data independence in the twenty-first century},
  journal = {VLDBJ},
  volume  = {27},
  number  = {4},
  pages   = {547--571},
  year    = {2018},
}
% SIGMOD Record 41(3), 2012. Initials are space-separated so BibTeX sees two
% given-name tokens; glued initials lose the second one in abbreviating styles.
@article{KG12,
  author  = {Karvounarakis, G. and Green, T. J.},
  title   = {Semiring-Annotated Data: Queries and Provenance},
  journal = {SIGMOD Record},
  volume  = {41},
  number  = {3},
  pages   = {5--14},
  year    = {2012},
}
% TaPP 2017 workshop paper (no page range recorded).
% NOTE(review): the citation key contains an at-sign, which some BibTeX
% tooling may reject; it is kept unchanged because documents may cite it.
@inproceedings{koop@tapp2017,
  author    = {Koop, David and Patel, Jay},
  title     = {Dataflow Notebooks: Encoding and Tracking Dependencies of Cells},
  booktitle = {TaPP},
  year      = {2017},
}
% QDB 2016 workshop paper (no page range recorded).
@inproceedings{kumari:2016:qdb:communicating,
  author    = {Kumari, Poonam and Achmiz, Said and Kennedy, Oliver},
  title     = {Communicating Data Quality in On-Demand Curation},
  booktitle = {QDB},
  year      = {2016},
}
% IEEE Visualization 2005 paper. VisTrails is braced; unbraced, sentence-casing
% styles print it as Vistrails.
@inproceedings{DBLP:conf/visualization/BavoilCSVCSF05,
  author    = {Louis Bavoil and Steven P. Callahan and Carlos Eduardo Scheidegger and Huy T. Vo and Patricia Crossno and Cláudio T. Silva and Juliana Freire},
  title     = {{VisTrails}: Enabling Interactive Multiple-View Visualizations},
  booktitle = {IEEE Visualization},
  pages     = {135--142},
  year      = {2005},
}
% PVLDB 9(9), 2016 journal article.
@article{MG16a,
  author  = {Maddox, Michael and Goehring, David and Elmore, Aaron J and Madden, Samuel and Parameswaran, Aditya and Deshpande, Amol},
  title   = {Decibel: The relational dataset branching system},
  journal = {PVLDB},
  volume  = {9},
  number  = {9},
  pages   = {624--635},
  year    = {2016},
}
% PVLDB 8(12), 2015. The all-caps system name DATASPREAD is braced; unbraced,
% sentence-casing styles print it as Dataspread.
@article{DBLP:journals/pvldb/BendreSZZCP15,
  author  = {Mangesh Bendre and Bofan Sun and Ding Zhang and Xinyan Zhou and Kevin Chen-Chuan Chang and Aditya G. Parameswaran},
  title   = {{DATASPREAD}: Unifying Databases and Spreadsheets},
  journal = {PVLDB},
  volume  = {8},
  number  = {12},
  pages   = {2000--2003},
  year    = {2015},
}
% ICDE 2018 conference paper.
@inproceedings{DBLP:conf/icde/BendreVZCP18,
  author    = {Mangesh Bendre and Vipul Venkataraman and Xinyan Zhou and Kevin Chen-Chuan Chang and Aditya G. Parameswaran},
  title     = {Towards a Holistic Integration of Spreadsheets with Databases: A Scalable Storage Engine for Presentational Data Management},
  booktitle = {ICDE},
  pages     = {113--124},
  year      = {2018},
}
% NSDI 2012 conference paper.
% NOTE(review): the sixth author's surname is spelled McCauley here, as in the
% paper's own author list; the DBLP export spells it McCauly. Confirm.
@inproceedings{DBLP:conf/nsdi/ZahariaCDDMMFSS12,
  author    = {Matei Zaharia and Mosharaf Chowdhury and Tathagata Das and Ankur Dave and Justin Ma and Murphy McCauley and Michael J. Franklin and Scott Shenker and Ion Stoica},
  title     = {Resilient Distributed Datasets: A Fault-Tolerant Abstraction for In-Memory Cluster Computing},
  booktitle = {NSDI},
  pages     = {15--28},
  year      = {2012},
}
% SIGMOD 2019 paper. The system name Vizier is braced so sentence-casing
% styles keep its capital.
@inproceedings{DBLP:conf/sigmod/BrachmannBCFFGK19,
  author    = {Mike Brachmann and Carlos Bautista and Sonia Castelo and Su Feng and Juliana Freire and Boris Glavic and Oliver Kennedy and Heiko Mueller and Rémi Rampin and William Spoth and Ying Yang},
  title     = {Data Debugging and Exploration with {Vizier}},
  booktitle = {SIGMOD},
  pages     = {1877--1880},
  year      = {2019},
}
% EDBT 2013 paper. W3C and PROV are braced so sentence-casing styles do not
% lowercase them.
@inproceedings{MB13a,
  author    = {Missier, Paolo and Belhajjame, Khalid and Cheney, James},
  title     = {The {W3C} {PROV} family of specifications for modelling provenance metadata},
  booktitle = {EDBT},
  pages     = {773--776},
  year      = {2013},
}
% PVLDB 11(11), 2018. The title gets the missing space after the quoted
% Where, the pronoun I and the acronym SQL are braced against sentence-casing
% styles, and the page range is supplied.
% NOTE(review): pages entered from the published record; confirm.
@article{MD18,
  author  = {Müller, Tobias and Dietrich, Benjamin and Grust, Torsten},
  title   = {You Say `What', {I} Hear `Where' and `Why'---(Mis-)Interpreting {SQL} to Derive Fine-Grained Provenance},
  journal = {PVLDB},
  volume  = {11},
  number  = {11},
  pages   = {1536--1549},
  year    = {2018},
}
% Technical report, 2016. CTables is braced so its internal capital survives
% sentence-casing styles.
% NOTE(review): the techreport type requires an institution field and none is
% recorded; the key suggests an arXiv preprint. Confirm and add the
% institution or eprint details.
@techreport{nandi:2016:arxiv:mimir,
  author = {Nandi, Arindam and Yang, Ying and Kennedy, Oliver and Glavic, Boris and Fehling, Ronny and Liu, Zhen Hua and Gawlick, Dieter},
  title  = {Mimir: Bringing {CTables} into Practice},
  year   = {2016},
}
% ICDE 2010 paper, entered as inproceedings (the conference type is only a
% legacy alias for it).
@inproceedings{OH10,
  author    = {Olteanu, D. and Huang, J. and Koch, C.},
  title     = {Approximate confidence computation in probabilistic databases},
  booktitle = {ICDE},
  pages     = {145--156},
  year      = {2010},
}
% SIGMOD 2004 paper. ORDPATHs and XML are braced so sentence-casing styles
% keep their capitalisation.
@inproceedings{DBLP:conf/sigmod/ONeilOPCSW04,
  author    = {Patrick E. O'Neil and Elizabeth J. O'Neil and Shankar Pal and Istvan Cseri and Gideon Schaller and Nigel Westbury},
  title     = {{ORDPATHs}: Insert-Friendly {XML} Node Labels},
  booktitle = {SIGMOD},
  pages     = {903--908},
  year      = {2004},
}
% ICDT 2001 paper, published in Lecture Notes in Computer Science volume 1973.
@inproceedings{DBLP:conf/icdt/BunemanKT01,
  author    = {Peter Buneman and Sanjeev Khanna and Wang Chiew Tan},
  title     = {Why and Where: A Characterization of Data Provenance},
  booktitle = {ICDT},
  series    = {Lecture Notes in Computer Science},
  volume    = {1973},
  pages     = {316--330},
  year      = {2001},
}
% Springer book, 2012, in the Data-Centric Systems and Applications series.
@book{DBLP:books/daglib/0030287,
  author    = {Peter Christen},
  title     = {Data Matching - Concepts and Techniques for Record Linkage, Entity Resolution, and Duplicate Detection},
  series    = {Data-Centric Systems and Applications},
  publisher = {Springer},
  year      = {2012},
}
% MSR 2019 paper (no page range recorded). Jupyter is braced so
% sentence-casing styles keep its capital.
@inproceedings{pimentel:2019:msr:large,
  author    = {Pimentel, João Felipe and Murta, Leonardo and Braganholo, Vanessa and Freire, Juliana},
  title     = {A Large-scale Study About Quality and Reproducibility of {Jupyter} Notebooks},
  booktitle = {MSR},
  year      = {2019},
}
% IEEE Data Eng. Bull. 29(1), 2006. The first author's surname carries its
% accent, matching the spelling used for the same author in entry SO11.
@article{RD06a,
  author  = {Ré, C. and Dalvi, N. and Suciu, D.},
  title   = {Query evaluation on probabilistic databases},
  journal = {IEEE Data Eng. Bull.},
  volume  = {29},
  number  = {1},
  pages   = {25--31},
  year    = {2006},
}
% SIGMOD 2008 paper. VisTrails is braced against sentence-casing styles.
@inproceedings{SV08,
  author    = {Scheidegger, Carlos Eduardo and Vo, Huy and Koop, David and Freire, Juliana and Silva, Claudio T.},
  title     = {Querying and Re-using Workflows with {VisTrails}},
  booktitle = {SIGMOD},
  pages     = {1251--1254},
  year      = {2008},
}
% CHI 2011 conference paper.
@inproceedings{DBLP:conf/chi/KandelPHH11,
  author    = {Sean Kandel and Andreas Paepcke and Joseph M. Hellerstein and Jeffrey Heer},
  title     = {Wrangler: interactive visual specification of data transformation scripts},
  booktitle = {CHI},
  pages     = {3363--3372},
  year      = {2011},
}
% PVLDB 11(12), 2018. The product names ProvSQL and PostgreSQL are written
% with their standard capitalisation and braced against sentence-casing styles.
@article{SJ18,
  author  = {Senellart, Pierre and Jachiet, Louis and Maniu, Silviu and Ramusat, Yann},
  title   = {{ProvSQL}: provenance and probability management in {PostgreSQL}},
  journal = {PVLDB},
  volume  = {11},
  number  = {12},
  pages   = {2034--2037},
  year    = {2018},
}
% IDEAS 2018 conference paper.
@inproceedings{GM18a,
  author    = {Sergio Greco and Cristian Molinaro and Irina Trubitsyna},
  title     = {Algorithms for Computing Approximate Certain Answers over Incomplete Databases},
  booktitle = {IDEAS},
  pages     = {1--4},
  year      = {2018},
}
% SOSP 2017 conference paper.
@inproceedings{DBLP:conf/sosp/VenkataramanPOA17,
  author    = {Shivaram Venkataraman and Aurojit Panda and Kay Ousterhout and Michael Armbrust and Ali Ghodsi and Michael J. Franklin and Benjamin Recht and Ion Stoica},
  title     = {Drizzle: Fast and Adaptable Stream Processing at Scale},
  booktitle = {SOSP},
  pages     = {374--389},
  year      = {2017},
}
% Synthesis Lectures on Data Management 3(2), 2011.
@article{SO11,
  author  = {Suciu, Dan and Olteanu, Dan and Ré, Christopher and Koch, Christoph},
  title   = {Probabilistic databases},
  journal = {Synthesis Lectures on Data Management},
  volume  = {3},
  number  = {2},
  pages   = {1--180},
  year    = {2011},
}
% Project web site (no year recorded). The group name is a corporate author,
% so it sits in a second pair of braces; otherwise BibTeX parses it as a
% person with surname Group and given names The VizierDB.
@misc{vizier,
  author       = {{The VizierDB Group}},
  title        = {Vizier: Built for Data Exploration},
  howpublished = {http://vizierdb.info},
}
% Book chapter. The incollection type requires a publisher, so it is supplied
% here to avoid a missing-field warning.
% NOTE(review): publisher entered from the published record; confirm.
@incollection{M98b,
  author    = {van der Meyden, Ron},
  title     = {Logical approaches to incomplete information: A survey},
  booktitle = {Logics for databases and information systems},
  publisher = {Kluwer Academic Publishers},
  pages     = {307--356},
  year      = {1998},
}
% PVLDB 1(2), 2008 journal article.
@article{DBLP:journals/pvldb/FanGJ08a,
  author  = {Wenfei Fan and Floris Geerts and Xibei Jia},
  title   = {A revival of integrity constraints for data cleaning},
  journal = {PVLDB},
  volume  = {1},
  number  = {2},
  pages   = {1522--1523},
  year    = {2008},
}
% TaPP 2016 workshop paper; isworkshop and projects are non-standard
% annotation fields.
@inproceedings{XN16,
  author     = {Xing Niu and Bahareh Arab and Dieter Gawlick and Zhen Hua Liu and Vasudha Krishnaswamy and Oliver Kennedy and Boris Glavic},
  title      = {Provenance-aware Versioned Dataworkspaces},
  booktitle  = {TaPP},
  year       = {2016},
  isworkshop = {true},
  projects   = {GProM},
}
% PVLDB 10(12), 2017 journal article.
@article{DBLP:journals/pvldb/NiuALFZGKLG17,
  author  = {Xing Niu and Bahareh Sadat Arab and Seokki Lee and Su Feng and Xun Zou and Dieter Gawlick and Vasudha Krishnaswamy and Zhen Hua Liu and Boris Glavic},
  title   = {Debugging Transactions and Tracking their Provenance with Reenactment},
  journal = {PVLDB},
  volume  = {10},
  number  = {12},
  pages   = {1857--1860},
  year    = {2017},
}
% SIGMOD 2016 conference paper.
@inproceedings{DBLP:conf/sigmod/ChuIKW16,
  author    = {Xu Chu and Ihab F. Ilyas and Sanjay Krishnan and Jiannan Wang},
  title     = {Data Cleaning: Overview and Emerging Challenges},
  booktitle = {SIGMOD},
  pages     = {2201--2206},
  year      = {2016},
}
% SIGMOD 2017 paper. The fourth author's given name is spelled out as in the
% other entries of this file that list him (Elmore, Aaron J).
% NOTE(review): assumes this is the same Elmore as in entries BD15 and MG16a; confirm.
@inproceedings{XH,
  author    = {Xu, Liqi and Huang, Silu and Hui, Sili and Elmore, Aaron J and Parameswaran, Aditya},
  title     = {{OrpheusDB}: {A} Lightweight Approach to Relational Dataset Versioning},
  booktitle = {SIGMOD},
  pages     = {1655--1658},
  year      = {2017},
}
% PVLDB 8(12), 2015. The acronym ETL is braced against sentence-casing styles
% and the page range is supplied.
% NOTE(review): pages entered from the published record; confirm.
@article{yang2015lenses,
  author  = {Yang, Ying and Meneghetti, Niccolo and Fehling, Ronny and Liu, Zhen Hua and Kennedy, Oliver},
  title   = {Lenses: An On-Demand Approach to {ETL}},
  journal = {PVLDB},
  volume  = {8},
  number  = {12},
  pages   = {1578--1589},
  year    = {2015},
}
% PPPJ 2007 paper (publisher export). Java is braced in the title so
% sentence-casing styles keep its capital.
@inproceedings{Zhang:2007:SEH:1294325.1294349,
  author    = {Zhang, Lingli and Krintz, Chandra and Nagpurkar, Priya},
  title     = {Supporting Exception Handling for Futures in {Java}},
  booktitle = {Proceedings of the 5th International Symposium on Principles and Practice of Programming in Java},
  series    = {PPPJ '07},
  pages     = {175--184},
  year      = {2007},
  numpages  = {10},
  address   = {New York, NY, USA},
}
% PVLDB 9(12), 2016 journal article.
@article{DBLP:journals/pvldb/AbedjanCDFIOPST16,
  author  = {Ziawasch Abedjan and Xu Chu and Dong Deng and Raul Castro Fernandez and Ihab F. Ilyas and Mourad Ouzzani and Paolo Papotti and Michael Stonebraker and Nan Tang},
  title   = {Detecting Data Errors: Where are we and what needs to be done?},
  journal = {PVLDB},
  volume  = {9},
  number  = {12},
  pages   = {993--1004},
  year    = {2016},
}