<!--
Website/slides/talks/2019-1-VizierPitch/index.html

195 lines
7.2 KiB
HTML
-->

<!doctype html>
<html lang="en">
<head>
  <meta charset="utf-8">
  <!-- Zoom is intentionally left enabled (no maximum-scale / user-scalable=no)
       so viewers can magnify the slides. -->
  <meta name="viewport" content="width=device-width, initial-scale=1.0">
  <title>Vizier: Sustainable Data On-boarding</title>

  <!-- reveal.js core styles and the black theme, then the local stylesheet
       (loaded last so its rules can take precedence). -->
  <link rel="stylesheet" href="../../reveal.js-3.7.0/css/reveal.css">
  <link rel="stylesheet" href="../../reveal.js-3.7.0/css/theme/black.css">
  <link rel="stylesheet" href="style.css">

  <!-- Theme used for syntax highlighting of code -->
  <link rel="stylesheet" href="../../reveal.js-3.7.0/lib/css/zenburn.css">

  <!-- Printing and PDF exports: when the query string contains "print-pdf"
       the PDF stylesheet is appended to <head>, otherwise the paper one. -->
  <script>
    var link = document.createElement( 'link' );
    link.rel = 'stylesheet';
    link.href = window.location.search.match( /print-pdf/gi )
      ? '../../reveal.js-3.7.0/css/print/pdf.css'
      : '../../reveal.js-3.7.0/css/print/paper.css';
    document.getElementsByTagName( 'head' )[0].appendChild( link );
  </script>
</head>
<body>
<div class="reveal"><div class="slides">
<!-- Title slide: logo image and tagline.
     NOTE(review): alt text assumes vizier.svg is the project logo; confirm. -->
<section>
  <img src="vizier.svg" alt="Vizier logo" width="300">
  <h3>Sustainable Data On-boarding</h3>
</section>
<!-- Vertical stack: the data cycle diagram followed by two cited statistics -->
<section>

  <!-- Diagram slide; the svg element carries a data-src pointing at Data_Cycle.svg -->
  <section>
    <svg data-src="Data_Cycle.svg" height="500px"></svg>
    <attribution>Images from <a href="https://openclipart.org/">OpenClipArt</a></attribution>
  </section>

  <!-- Statistic attributed to the NY Times, with the source link below it -->
  <section>
    <h3>50-80% of a Data Scientist's time is spent on <u>curation</u></h3>
    <h4 style="text-align: right">- NY Times</h4>
    <attribution><a href="https://www.nytimes.com/2014/08/18/technology/for-big-data-scientists-hurdle-to-insights-is-janitor-work.html">https://www.nytimes.com/2014/08/18/technology/for-big-data-scientists-hurdle-to-insights-is-janitor-work.html</a></attribution>
  </section>

  <!-- Statistic attributed to IBM, with the source link below it -->
  <section>
    <h3>Bad Data Quality costs</h3>
    <h2>$3.1 Trillion</h2>
    <h3>per year in the US alone</h3>
    <h4 style="text-align: right">- IBM</h4>
    <attribution><a href="https://www.ibmbigdatahub.com/infographic/four-vs-big-data">https://www.ibmbigdatahub.com/infographic/four-vs-big-data</a></attribution>
  </section>

</section>
<!-- Vertical stack: NYS Open Data Portal example, a "before" and an "after" image.
     NOTE(review): alt text is derived from the file names and captions only;
     confirm it against the actual images. -->
<section>
  <section>
    <h3>NYS Open Data Portal</h3>
  </section>

  <section>
    <img src="malefemale_before.png" alt="Male/female data from Causes of Death in NYC, 2008-2014">
    <attribution>NYS Open Data Portal: Causes of Death in NYC 2008-2014</attribution>
  </section>

  <section>
    <img src="malefemale_after.png" alt="Male/female data from Causes of Death in NYC, 2008-2016">
    <!-- The end year is enlarged to draw attention to the extended date range -->
    <attribution>NYS Open Data Portal: Causes of Death in NYC 2008-<b style="font-size: 120%;">2016</b></attribution>
  </section>
</section>
<!-- Vertical stack: VizierDB capability overview, then how it tracks data bugs.
     NOTE(review): alt text is derived from file names and slide headings only;
     confirm it against the actual images. -->
<section>

  <!-- Overview: screenshot beside the VizierDB capability list.
       The two inline-block wrappers must stay separated by whitespace. -->
  <section>
    <div style="display: inline-block; vertical-align: middle;">
      <img src="1.2.Multilingual.png" alt="Screenshot of a multilingual Vizier notebook" width="500">
    </div>
    <div style="display: inline-block; vertical-align: middle; padding-left: 30px;">
      <div style="vertical-align: baseline; font-weight: bold; border-bottom: 2px solid white; margin-bottom: 40px;">
        <!-- Empty alt: the adjacent "VizierDB" text already names the product -->
        <img src="vizier.svg" alt="" width="50" style="vertical-align: middle;">
        VizierDB
      </div>
      <ul>
        <!-- Items sharing data-fragment-index="1" get the highlight-grey
             fragment applied in the same step; Validate and Curate do not. -->
        <li style="margin-top: 10px;" class="fragment highlight-grey" data-fragment-index="1">Explore</li>
        <li style="margin-top: 10px;">Validate</li>
        <li style="margin-top: 10px;">Curate</li>
        <li style="margin-top: 10px;" class="fragment highlight-grey" data-fragment-index="1">Audit</li>
        <li style="margin-top: 10px;" class="fragment highlight-grey" data-fragment-index="1">Reuse</li>
      </ul>
    </div>
  </section>

  <section>
    <h3>Vizier Tracks Data Bugs</h3>
    <ul>
      <li style="margin-top: 10px;">Recoverable Errors</li>
      <li style="margin-top: 10px;">Automatic Data Warnings</li>
      <li style="margin-top: 10px;">User-Provided Unit Tests</li>
    </ul>
  </section>

  <section>
    <img src="4.2.ErrorList.png" alt="Screenshot of the Vizier error list" height="400">
  </section>

  <section>
    <h3>Error Alerts in the Data</h3>
    <img src="ErrorWarnings.png" alt="Screenshot of error alerts shown in the data">
  </section>

</section>
<!-- Vertical stack: ways to fix errors, then the spreadsheet view.
     NOTE(review): alt text is derived from the file name and slide heading only;
     confirm it against the actual image. -->
<section>

  <section>
    <h3>Fixing Errors</h3>
    <!-- The whole list is one fragment; the last two items are additional
         fragments nested inside it. -->
    <ul class="fragment">
      <li>Python</li>
      <li>SQL</li>
      <li>Scala</li>
      <li class="fragment">Automatic Suggestions</li>
      <li class="fragment">Spreadsheets</li>
    </ul>
  </section>

  <section>
    <h3>Spreadsheet View</h3>
    <h4>Easily Fix One-Off Errors</h4>
    <img src="2.1.Spreadsheets.png" alt="Screenshot of the Vizier spreadsheet view">
    <p class="fragment">Edits are tracked and versioned to make auditing and debugging easy</p>
  </section>

</section>
<!-- Closing vertical stack: availability, recap with project link, demo link.
     The outer section is now closed explicitly; it was previously left open and
     only closed implicitly by the parser at the wrapper's closing div tags.
     NOTE(review): alt text is derived from the file name only; confirm it
     against the actual image. -->
<section>

  <section>
    <h3>Available Now</h3>
    <ul>
      <li style="margin-top: 10px;">Cloud Deployment</li>
      <li style="margin-top: 10px;">On-Prem with Support</li>
      <li style="margin-top: 10px;">Workflow Appliance</li>
    </ul>
  </section>

  <!-- Recap: same screenshot-plus-list layout as the earlier overview slide,
       without fragments. The two inline-block wrappers must stay separated by
       whitespace. -->
  <section>
    <div style="display: inline-block; vertical-align: middle;">
      <img src="1.2.Multilingual.png" alt="Screenshot of a multilingual Vizier notebook" width="500">
    </div>
    <div style="display: inline-block; vertical-align: middle; padding-left: 30px;">
      <div style="vertical-align: baseline; font-weight: bold; border-bottom: 2px solid white; margin-bottom: 40px;">
        <!-- Empty alt: the adjacent "VizierDB" text already names the product -->
        <img src="vizier.svg" alt="" width="50" style="vertical-align: middle;">
        VizierDB
      </div>
      <ul>
        <li style="margin-top: 10px;">Explore</li>
        <li style="margin-top: 10px;">Validate</li>
        <li style="margin-top: 10px;">Curate</li>
        <li style="margin-top: 10px;">Audit</li>
        <li style="margin-top: 10px;">Reuse</li>
      </ul>
    </div>
    <div>
      <h4><a href="https://vizierdb.info">https://vizierdb.info</a></h4>
    </div>
  </section>

  <section>
    <h1>
      <a href="https://demo.vizierdb.info/vizier-db">Demo</a>
    </h1>
  </section>

</section>
</div></div>
<!-- reveal.js runtime: head.min.js is loaded before reveal.js itself -->
<script src="../../reveal.js-3.7.0/lib/js/head.min.js"></script>
<script src="../../reveal.js-3.7.0/js/reveal.js"></script>
<script>
  // Authoring switch: when true, the `history` option is enabled and the
  // livereload client script is written into the page (see below).
  var debug = false;

  // Configuration and dependency reference:
  //   https://github.com/hakimel/reveal.js#configuration
  //   https://github.com/hakimel/reveal.js#dependencies
  Reveal.initialize({
    history: debug,
    dependencies: [
      { src: '../../reveal.js-3.7.0/plugin/svginline/data-src-svg.js' },
      { src: '../../reveal.js-3.7.0/plugin/markdown/marked.js' },
      { src: '../../reveal.js-3.7.0/plugin/markdown/markdown.js' },
      { src: '../../reveal.js-3.7.0/plugin/notes/notes.js', async: true },
      {
        src: '../../reveal.js-3.7.0/plugin/highlight/highlight.js',
        async: true,
        callback: function() { hljs.initHighlightingOnLoad(); }
      }
    ]
  });

  if (debug) {
    // Load livereload.js from port 35729 on the current host name
    // (falling back to 'localhost' when location.host is empty).
    // The closing tag is split so it does not terminate this script element.
    document.write(
      '<script src="http://' + (location.host || 'localhost').split(':')[0] + ':35729/livereload.js?snipver=1"></' + 'script>'
    );
  }
</script>
<script>
</script>
</body>
</html>