From 361900d19dd10a8c585b07c20180d81676f0f744 Mon Sep 17 00:00:00 2001
From: Oliver Kennedy <okennedy@buffalo.edu>
Date: Sun, 4 Mar 2018 16:37:37 -0500
Subject: [PATCH] Add Limitations, Sampling, and Histograms slides to cost-based optimization lecture

---
 .../2018-03-05-CostBasedOptimization2.html    | 112 +++++++++++++++++-
 1 file changed, 108 insertions(+), 4 deletions(-)
diff --git a/slides/cse4562sp2018/2018-03-05-CostBasedOptimization2.html b/slides/cse4562sp2018/2018-03-05-CostBasedOptimization2.html
index aac71888..7d001ee6 100644
--- a/slides/cse4562sp2018/2018-03-05-CostBasedOptimization2.html
+++ b/slides/cse4562sp2018/2018-03-05-CostBasedOptimization2.html
@@ -359,8 +359,8 @@
           <h3>(Some) Estimation Techniques</h3>
 
           <dl style="font-size: 80%">
-            <dt>Guess Randomly</dt>
-            <dd>Rules of thumb if you have no other options...</dd>
+            <dt style="color: blue;">Guess Randomly</dt>
+            <dd style="color: blue;">Rules of thumb if you have no other options...</dd>
 
             <dt style="color: grey;">Uniform Prior</dt>
             <dd style="color: grey;">Use basic statistics to make a very rough guess.</dd>
@@ -415,8 +415,8 @@
             <dt style="color: grey;">Guess Randomly</dt>
             <dd style="color: grey;">Rules of thumb if you have no other options...</dd>
 
-            <dt>Uniform Prior</dt>
-            <dd>Use basic statistics to make a very rough guess.</dd>
+            <dt style="color: blue;">Uniform Prior</dt>
+            <dd style="color: blue;">Use basic statistics to make a very rough guess.</dd>
 
             <dt style="color: grey;">Sampling / History</dt>
             <dd style="color: grey;">Small, Quick Sampling Runs (or prior executions of the query).</dd>
@@ -500,6 +500,110 @@
 
           <p style="font-size: 60%">(With constants $x_1$, $x_2$, ...)</p>
         </section>
+
+        <section>
+          <h3>Limitations</h3>
+
+          <dl>
+            <div class="fragment">
+              <dt>Don't always have statistics for $Q$</dt>
+              <dd>For example, $\pi_{A \leftarrow (B \times C)}(R)$</dd>
+            </div>
+
+            <div class="fragment">
+              <dt>Don't always have clear rules for $c$</dt>
+              <dd>For example, $\sigma_{\texttt{FitsModel}(A, B, C)}(R)$</dd>
+            </div>
+
+            <div class="fragment">
+              <dt>Attribute values are not always uniformly distributed.</dt>
+              <dd>For example, <span style="font-size: 60%"> $|\sigma_{SPC\_COMMON = \texttt{'pin oak'}}(T)|$ vs $|\sigma_{SPC\_COMMON = \texttt{'honeylocust'}}(T)|$</span></dd>
+            </div>
+
+            <div class="fragment">
+              <dt>Attribute values are sometimes correlated.</dt>
+              <dd>For example, $\sigma_{(stump &lt; 5) \wedge (diam &gt; 3)}(T)$</dd>
+            </div>
+
+          </dl>
+        </section>
+      </section>
+      <section>
+        <section>
+          <h3>(Some) Estimation Techniques</h3>
+
+          <dl style="font-size: 80%">
+            <dt style="color: grey;">Guess Randomly</dt>
+            <dd style="color: grey;">Rules of thumb if you have no other options...</dd>
+
+            <dt style="color: grey;">Uniform Prior</dt>
+            <dd style="color: grey;">Use basic statistics to make a very rough guess.</dd>
+
+            <dt style="color: blue;">Sampling / History</dt>
+            <dd style="color: blue;">Small, Quick Sampling Runs (or prior executions of the query).</dd>
+
+            <dt style="color: grey;">Histograms</dt>
+            <dd style="color: grey;">Using more detailed statistics for improved guesses.</dd>
+
+            <dt style="color: grey;">Constraints</dt>
+            <dd style="color: grey;">Using rules about the data for improved guesses.</dd>
+          </dl>
+        </section>
+
+        <section>
+          <p><b>Idea 1:</b> Pick 100 tuples at random from each input table.</p>
+        </section>
+      </section>
+
+      <section>
+        <section>
+          <h3>Limitations</h3>
+
+          <dl>
+            <div class="fragment highlight-grey">
+              <dt>Don't always have statistics for $Q$</dt>
+              <dd>For example, $\pi_{A \leftarrow (B \times C)}(R)$</dd>
+            </div>
+
+            <div class="fragment highlight-grey">
+              <dt>Don't always have clear rules for $c$</dt>
+              <dd>For example, $\sigma_{\texttt{FitsModel}(A, B, C)}(R)$</dd>
+            </div>
+
+            <div class="fragment highlight-blue">
+              <dt>Attribute values are not always uniformly distributed.</dt>
+              <dd>For example, <span style="font-size: 60%"> $|\sigma_{SPC\_COMMON = \texttt{'pin oak'}}(T)|$ vs $|\sigma_{SPC\_COMMON = \texttt{'honeylocust'}}(T)|$</span></dd>
+            </div>
+
+            <div class="fragment highlight-grey">
+              <dt>Attribute values are sometimes correlated.</dt>
+              <dd>For example, $\sigma_{(stump &lt; 5) \wedge (diam &gt; 3)}(T)$</dd>
+            </div>
+
+          </dl>
+        </section>
+
+        <section>
+          <h3>(Some) Estimation Techniques</h3>
+
+          <dl style="font-size: 80%">
+            <dt style="color: grey;">Guess Randomly</dt>
+            <dd style="color: grey;">Rules of thumb if you have no other options...</dd>
+
+            <dt style="color: grey;">Uniform Prior</dt>
+            <dd style="color: grey;">Use basic statistics to make a very rough guess.</dd>
+
+            <dt style="color: grey;">Sampling / History</dt>
+            <dd style="color: grey;">Small, Quick Sampling Runs (or prior executions of the query).</dd>
+
+            <dt style="color: blue;">Histograms</dt>
+            <dd style="color: blue;">Using more detailed statistics for improved guesses.</dd>
+
+            <dt style="color: grey;">Constraints</dt>
+            <dd style="color: grey;">Using rules about the data for improved guesses.</dd>
+          </dl>
+        </section>
+
       </section>
 
     </div></div>