datafu-commits mailing list archives

Site index · List index
Message view « Date » · « Thread »
Top « Date » · « Thread »
From mha...@apache.org
Subject svn commit: r1827525 [40/49] - in /datafu/site/docs: datafu/1.4.0/ datafu/1.4.0/datafu/ datafu/1.4.0/datafu/pig/ datafu/1.4.0/datafu/pig/bags/ datafu/1.4.0/datafu/pig/geo/ datafu/1.4.0/datafu/pig/hash/ datafu/1.4.0/datafu/pig/hash/lsh/ datafu/1.4.0/dat...
Date Thu, 22 Mar 2018 19:01:10 GMT
Added: datafu/site/docs/hourglass/1.4.0/datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html
URL: http://svn.apache.org/viewvc/datafu/site/docs/hourglass/1.4.0/datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html?rev=1827525&view=auto
==============================================================================
--- datafu/site/docs/hourglass/1.4.0/datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html (added)
+++ datafu/site/docs/hourglass/1.4.0/datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html Thu Mar 22 19:01:04 2018
@@ -0,0 +1,504 @@
+<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
+<!-- NewPage -->
+<html lang="en">
+<head>
+<!-- Generated by javadoc (version 1.7.0_79) on Thu Mar 22 11:58:07 PDT 2018 -->
+<title>PartitionCollapsingExecutionPlanner (datafu-hourglass 1.4.0 API)</title>
+<meta name="date" content="2018-03-22">
+<link rel="stylesheet" type="text/css" href="../../../stylesheet.css" title="Style">
+</head>
+<body>
+<script type="text/javascript"><!--
+    if (location.href.indexOf('is-external=true') == -1) {
+        parent.document.title="PartitionCollapsingExecutionPlanner (datafu-hourglass 1.4.0 API)";
+    }
+//-->
+</script>
+<noscript>
+<div>JavaScript is disabled on your browser.</div>
+</noscript>
+<!-- ========= START OF TOP NAVBAR ======= -->
+<div class="topNav"><a name="navbar_top">
+<!--   -->
+</a><a href="#skip-navbar_top" title="Skip navigation links"></a><a name="navbar_top_firstrow">
+<!--   -->
+</a>
+<ul class="navList" title="Navigation">
+<li><a href="../../../overview-summary.html">Overview</a></li>
+<li><a href="package-summary.html">Package</a></li>
+<li class="navBarCell1Rev">Class</li>
+<li><a href="package-tree.html">Tree</a></li>
+<li><a href="../../../deprecated-list.html">Deprecated</a></li>
+<li><a href="../../../index-all.html">Index</a></li>
+<li><a href="../../../help-doc.html">Help</a></li>
+</ul>
+</div>
+<div class="subNav">
+<ul class="navList">
+<li><a href="../../../datafu/hourglass/jobs/MaxInputDataExceededException.html" title="class in datafu.hourglass.jobs"><span class="strong">Prev Class</span></a></li>
+<li><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html" title="class in datafu.hourglass.jobs"><span class="strong">Next Class</span></a></li>
+</ul>
+<ul class="navList">
+<li><a href="../../../index.html?datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html" target="_top">Frames</a></li>
+<li><a href="PartitionCollapsingExecutionPlanner.html" target="_top">No Frames</a></li>
+</ul>
+<ul class="navList" id="allclasses_navbar_top">
+<li><a href="../../../allclasses-noframe.html">All Classes</a></li>
+</ul>
+<div>
+<script type="text/javascript"><!--
+  allClassesLink = document.getElementById("allclasses_navbar_top");
+  if(window==top) {
+    allClassesLink.style.display = "block";
+  }
+  else {
+    allClassesLink.style.display = "none";
+  }
+  //-->
+</script>
+</div>
+<div>
+<ul class="subNavList">
+<li>Summary:&nbsp;</li>
+<li>Nested&nbsp;|&nbsp;</li>
+<li>Field&nbsp;|&nbsp;</li>
+<li><a href="#constructor_summary">Constr</a>&nbsp;|&nbsp;</li>
+<li><a href="#method_summary">Method</a></li>
+</ul>
+<ul class="subNavList">
+<li>Detail:&nbsp;</li>
+<li>Field&nbsp;|&nbsp;</li>
+<li><a href="#constructor_detail">Constr</a>&nbsp;|&nbsp;</li>
+<li><a href="#method_detail">Method</a></li>
+</ul>
+</div>
+<a name="skip-navbar_top">
+<!--   -->
+</a></div>
+<!-- ========= END OF TOP NAVBAR ========= -->
+<!-- ======== START OF CLASS DATA ======== -->
+<div class="header">
+<div class="subTitle">datafu.hourglass.jobs</div>
+<h2 title="Class PartitionCollapsingExecutionPlanner" class="title">Class PartitionCollapsingExecutionPlanner</h2>
+</div>
+<div class="contentContainer">
+<ul class="inheritance">
+<li>java.lang.Object</li>
+<li>
+<ul class="inheritance">
+<li><a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html" title="class in datafu.hourglass.jobs">datafu.hourglass.jobs.ExecutionPlanner</a></li>
+<li>
+<ul class="inheritance">
+<li>datafu.hourglass.jobs.PartitionCollapsingExecutionPlanner</li>
+</ul>
+</li>
+</ul>
+</li>
+</ul>
+<div class="description">
+<ul class="blockList">
+<li class="blockList">
+<hr>
+<br>
+<pre>public class <span class="strong">PartitionCollapsingExecutionPlanner</span>
+extends <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html" title="class in datafu.hourglass.jobs">ExecutionPlanner</a></pre>
+<div class="block">Execution planner used by <a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html" title="class in datafu.hourglass.jobs"><code>AbstractPartitionCollapsingIncrementalJob</code></a> and its derived classes.
+ This creates a plan to process partitioned input data and collapse the partitions into a single output.
+ 
+ <p>
+ To use this class, the input and output paths must be specified.  In addition the desired input date
+ range can be specified through several methods.  Then <a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#createPlan()"><code>createPlan()</code></a> can be called and the
+ execution plan will be created.  The inputs to process will be available from <a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#getInputsToProcess()"><code>getInputsToProcess()</code></a>,
+ the number of reducers to use will be available from <a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#getNumReducers()"><code>getNumReducers()</code></a>, and the input schemas
+ will be available from <a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#getInputSchemas()"><code>getInputSchemas()</code></a>.
+ </p>
+ 
+ <p>
+ Previous output may be reused by using <a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#setReusePreviousOutput(boolean)"><code>setReusePreviousOutput(boolean)</code></a>.  If previous output exists
+ and it is to be reused then it will be available from <a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#getPreviousOutputToProcess()"><code>getPreviousOutputToProcess()</code></a>.  New input data
+ to process that is after the previous output time range is available from <a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#getNewInputsToProcess()"><code>getNewInputsToProcess()</code></a>.
+ Old input data to process that is before the previous output time range and should be subtracted from the
+ previous output is available from <a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#getOldInputsToProcess()"><code>getOldInputsToProcess()</code></a>.
+ </p>
+ 
+ <p>
+ Configuration properties are used to configure a <a href="../../../datafu/hourglass/jobs/ReduceEstimator.html" title="class in datafu.hourglass.jobs"><code>ReduceEstimator</code></a> instance.  This is used to 
+ calculate how many reducers should be used.  
+ The number of reducers to use is based on the input data size and the 
+ <em>num.reducers.bytes.per.reducer</em> property.  This setting can be controlled more granularly
+ through <em>num.reducers.input.bytes.per.reducer</em> and <em>num.reducers.previous.bytes.per.reducer</em>.
+ Check <a href="../../../datafu/hourglass/jobs/ReduceEstimator.html" title="class in datafu.hourglass.jobs"><code>ReduceEstimator</code></a> for more details on how the properties are used.
+ </p></div>
+</li>
+</ul>
+</div>
+<div class="summary">
+<ul class="blockList">
+<li class="blockList">
+<!-- ======== CONSTRUCTOR SUMMARY ======== -->
+<ul class="blockList">
+<li class="blockList"><a name="constructor_summary">
+<!--   -->
+</a>
+<h3>Constructor Summary</h3>
+<table class="overviewSummary" border="0" cellpadding="3" cellspacing="0" summary="Constructor Summary table, listing constructors, and an explanation">
+<caption><span>Constructors</span><span class="tabEnd">&nbsp;</span></caption>
+<tr>
+<th class="colOne" scope="col">Constructor and Description</th>
+</tr>
+<tr class="altColor">
+<td class="colOne"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#PartitionCollapsingExecutionPlanner(org.apache.hadoop.fs.FileSystem,%20java.util.Properties)">PartitionCollapsingExecutionPlanner</a></strong>(org.apache.hadoop.fs.FileSystem&nbsp;fs,
+                                   java.util.Properties&nbsp;props)</code>
+<div class="block">Initializes the execution planner.</div>
+</td>
+</tr>
+</table>
+</li>
+</ul>
+<!-- ========== METHOD SUMMARY =========== -->
+<ul class="blockList">
+<li class="blockList"><a name="method_summary">
+<!--   -->
+</a>
+<h3>Method Summary</h3>
+<table class="overviewSummary" border="0" cellpadding="3" cellspacing="0" summary="Method Summary table, listing methods, and an explanation">
+<caption><span>Methods</span><span class="tabEnd">&nbsp;</span></caption>
+<tr>
+<th class="colFirst" scope="col">Modifier and Type</th>
+<th class="colLast" scope="col">Method and Description</th>
+</tr>
+<tr class="altColor">
+<td class="colFirst"><code>void</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#createPlan()">createPlan</a></strong>()</code>
+<div class="block">Create the execution plan.</div>
+</td>
+</tr>
+<tr class="rowColor">
+<td class="colFirst"><code><a href="../../../datafu/hourglass/fs/DateRange.html" title="class in datafu.hourglass.fs">DateRange</a></code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#getCurrentDateRange()">getCurrentDateRange</a></strong>()</code>&nbsp;</td>
+</tr>
+<tr class="altColor">
+<td class="colFirst"><code>java.util.List&lt;org.apache.avro.Schema&gt;</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#getInputSchemas()">getInputSchemas</a></strong>()</code>
+<div class="block">Gets the input schemas.</div>
+</td>
+</tr>
+<tr class="rowColor">
+<td class="colFirst"><code>java.util.Map&lt;java.lang.String,org.apache.avro.Schema&gt;</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#getInputSchemasByPath()">getInputSchemasByPath</a></strong>()</code>
+<div class="block">Gets a map from input path to schema.</div>
+</td>
+</tr>
+<tr class="altColor">
+<td class="colFirst"><code>java.util.List&lt;<a href="../../../datafu/hourglass/fs/DatePath.html" title="class in datafu.hourglass.fs">DatePath</a>&gt;</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#getInputsToProcess()">getInputsToProcess</a></strong>()</code>
+<div class="block">Gets all inputs that will be processed.</div>
+</td>
+</tr>
+<tr class="rowColor">
+<td class="colFirst"><code>boolean</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#getNeedsAnotherPass()">getNeedsAnotherPass</a></strong>()</code>
+<div class="block">Gets whether another pass will be required.</div>
+</td>
+</tr>
+<tr class="altColor">
+<td class="colFirst"><code>java.util.List&lt;<a href="../../../datafu/hourglass/fs/DatePath.html" title="class in datafu.hourglass.fs">DatePath</a>&gt;</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#getNewInputsToProcess()">getNewInputsToProcess</a></strong>()</code>
+<div class="block">Gets only the new data that will be processed.</div>
+</td>
+</tr>
+<tr class="rowColor">
+<td class="colFirst"><code>int</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#getNumReducers()">getNumReducers</a></strong>()</code>
+<div class="block">Get the number of reducers to use based on the input and previous output data size.</div>
+</td>
+</tr>
+<tr class="altColor">
+<td class="colFirst"><code>java.util.List&lt;<a href="../../../datafu/hourglass/fs/DatePath.html" title="class in datafu.hourglass.fs">DatePath</a>&gt;</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#getOldInputsToProcess()">getOldInputsToProcess</a></strong>()</code>
+<div class="block">Gets only the old data that will be processed.</div>
+</td>
+</tr>
+<tr class="rowColor">
+<td class="colFirst"><code><a href="../../../datafu/hourglass/fs/DatePath.html" title="class in datafu.hourglass.fs">DatePath</a></code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#getPreviousOutputToProcess()">getPreviousOutputToProcess</a></strong>()</code>
+<div class="block">Gets the previous output to reuse, or null if no output is being reused.</div>
+</td>
+</tr>
+<tr class="altColor">
+<td class="colFirst"><code>boolean</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#getReusePreviousOutput()">getReusePreviousOutput</a></strong>()</code>
+<div class="block">Gets whether previous output should be reused, if it exists.</div>
+</td>
+</tr>
+<tr class="rowColor">
+<td class="colFirst"><code>void</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#setReusePreviousOutput(boolean)">setReusePreviousOutput</a></strong>(boolean&nbsp;reuse)</code>
+<div class="block">Sets whether previous output should be reused, if it exists.</div>
+</td>
+</tr>
+</table>
+<ul class="blockList">
+<li class="blockList"><a name="methods_inherited_from_class_datafu.hourglass.jobs.ExecutionPlanner">
+<!--   -->
+</a>
+<h3>Methods inherited from class&nbsp;datafu.hourglass.jobs.<a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html" title="class in datafu.hourglass.jobs">ExecutionPlanner</a></h3>
+<code><a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#determineAvailableInputDates()">determineAvailableInputDates</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#determineDateRange()">determineDateRange</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#getAvailableInputsByDate()">getAvailableInputsByDate</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#getDailyData(org.apache.hadoop.fs.Path)">getDailyData</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#getDatedData(org.apache.hadoop.fs.Path)">getDatedData</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#getDateRange()">getDateRange</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#getDaysAgo()">getDaysAgo</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#getEndDate()">getEndDate</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#getFileSystem()">getFileSystem</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#getInputPaths()">getInputPaths</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#getMaxToProcess()">getMaxToProcess</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#getNumDays()">getNumDays</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#getOutputPath()">getOutputPath</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#getProps()">getProps</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#getStartDate()">getStartDate</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#isFailOnMissing()">isFailOnMissing</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#loadInputData()">loadInputData</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#setDaysAgo(java.lang.Integer)">setDaysAgo</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#setEndDate(java.util.Date)">setEndDate</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#setFailOnMissing(boolean)">setFailOnMissing</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#setInputPaths(java.util.List)">setInputPaths</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#setMaxToProcess(java.lang.Integer)">setMaxToProcess</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#setNumDays(java.lang.Integer)">setNumDays</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#setOutputPath(org.apache.hadoop.fs.Path)">setOutputPath</a>, <a href="../../../datafu/hourglass/jobs/ExecutionPlanner.html#setStartDate(java.util.Date)">setStartDate</a></code></li>
+</ul>
+<ul class="blockList">
+<li class="blockList"><a name="methods_inherited_from_class_java.lang.Object">
+<!--   -->
+</a>
+<h3>Methods inherited from class&nbsp;java.lang.Object</h3>
+<code>clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait</code></li>
+</ul>
+</li>
+</ul>
+</li>
+</ul>
+</div>
+<div class="details">
+<ul class="blockList">
+<li class="blockList">
+<!-- ========= CONSTRUCTOR DETAIL ======== -->
+<ul class="blockList">
+<li class="blockList"><a name="constructor_detail">
+<!--   -->
+</a>
+<h3>Constructor Detail</h3>
+<a name="PartitionCollapsingExecutionPlanner(org.apache.hadoop.fs.FileSystem, java.util.Properties)">
+<!--   -->
+</a>
+<ul class="blockListLast">
+<li class="blockList">
+<h4>PartitionCollapsingExecutionPlanner</h4>
+<pre>public&nbsp;PartitionCollapsingExecutionPlanner(org.apache.hadoop.fs.FileSystem&nbsp;fs,
+                                   java.util.Properties&nbsp;props)</pre>
+<div class="block">Initializes the execution planner.</div>
+<dl><dt><span class="strong">Parameters:</span></dt><dd><code>fs</code> - file system</dd><dd><code>props</code> - configuration properties</dd></dl>
+</li>
+</ul>
+</li>
+</ul>
+<!-- ============ METHOD DETAIL ========== -->
+<ul class="blockList">
+<li class="blockList"><a name="method_detail">
+<!--   -->
+</a>
+<h3>Method Detail</h3>
+<a name="createPlan()">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>createPlan</h4>
+<pre>public&nbsp;void&nbsp;createPlan()
+                throws java.io.IOException</pre>
+<div class="block">Create the execution plan.</div>
+<dl><dt><span class="strong">Throws:</span></dt>
+<dd><code>java.io.IOException</code> - IOException</dd></dl>
+</li>
+</ul>
+<a name="getReusePreviousOutput()">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>getReusePreviousOutput</h4>
+<pre>public&nbsp;boolean&nbsp;getReusePreviousOutput()</pre>
+<div class="block">Gets whether previous output should be reused, if it exists.</div>
+<dl><dt><span class="strong">Returns:</span></dt><dd>true if previous output should be reused</dd></dl>
+</li>
+</ul>
+<a name="setReusePreviousOutput(boolean)">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>setReusePreviousOutput</h4>
+<pre>public&nbsp;void&nbsp;setReusePreviousOutput(boolean&nbsp;reuse)</pre>
+<div class="block">Sets whether previous output should be reused, if it exists.</div>
+<dl><dt><span class="strong">Parameters:</span></dt><dd><code>reuse</code> - true if previous output should be reused</dd></dl>
+</li>
+</ul>
+<a name="getNumReducers()">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>getNumReducers</h4>
+<pre>public&nbsp;int&nbsp;getNumReducers()</pre>
+<div class="block">Get the number of reducers to use based on the input and previous output data size.
+ Must call <a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#createPlan()"><code>createPlan()</code></a> first.</div>
+<dl><dt><span class="strong">Returns:</span></dt><dd>number of reducers to use</dd></dl>
+</li>
+</ul>
+<a name="getCurrentDateRange()">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>getCurrentDateRange</h4>
+<pre>public&nbsp;<a href="../../../datafu/hourglass/fs/DateRange.html" title="class in datafu.hourglass.fs">DateRange</a>&nbsp;getCurrentDateRange()</pre>
+</li>
+</ul>
+<a name="getPreviousOutputToProcess()">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>getPreviousOutputToProcess</h4>
+<pre>public&nbsp;<a href="../../../datafu/hourglass/fs/DatePath.html" title="class in datafu.hourglass.fs">DatePath</a>&nbsp;getPreviousOutputToProcess()</pre>
+<div class="block">Gets the previous output to reuse, or null if no output is being reused.
+ Must call <a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#createPlan()"><code>createPlan()</code></a> first.</div>
+<dl><dt><span class="strong">Returns:</span></dt><dd>previous output to reuse, or null</dd></dl>
+</li>
+</ul>
+<a name="getInputsToProcess()">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>getInputsToProcess</h4>
+<pre>public&nbsp;java.util.List&lt;<a href="../../../datafu/hourglass/fs/DatePath.html" title="class in datafu.hourglass.fs">DatePath</a>&gt;&nbsp;getInputsToProcess()</pre>
+<div class="block">Gets all inputs that will be processed.  This includes both old and new data.
+ Must call <a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#createPlan()"><code>createPlan()</code></a> first.</div>
+<dl><dt><span class="strong">Returns:</span></dt><dd>inputs to process</dd></dl>
+</li>
+</ul>
+<a name="getNewInputsToProcess()">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>getNewInputsToProcess</h4>
+<pre>public&nbsp;java.util.List&lt;<a href="../../../datafu/hourglass/fs/DatePath.html" title="class in datafu.hourglass.fs">DatePath</a>&gt;&nbsp;getNewInputsToProcess()</pre>
+<div class="block">Gets only the new data that will be processed.  New data is data that falls within the 
+ desired date range.
+ Must call <a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#createPlan()"><code>createPlan()</code></a> first.</div>
+<dl><dt><span class="strong">Returns:</span></dt><dd>new inputs to process</dd></dl>
+</li>
+</ul>
+<a name="getOldInputsToProcess()">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>getOldInputsToProcess</h4>
+<pre>public&nbsp;java.util.List&lt;<a href="../../../datafu/hourglass/fs/DatePath.html" title="class in datafu.hourglass.fs">DatePath</a>&gt;&nbsp;getOldInputsToProcess()</pre>
+<div class="block">Gets only the old data that will be processed.  Old data is data that falls before the
+ desired date range.  It will be subtracted out from the previous output.
+ Must call <a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#createPlan()"><code>createPlan()</code></a> first.</div>
+<dl><dt><span class="strong">Returns:</span></dt><dd>old inputs to process</dd></dl>
+</li>
+</ul>
+<a name="getNeedsAnotherPass()">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>getNeedsAnotherPass</h4>
+<pre>public&nbsp;boolean&nbsp;getNeedsAnotherPass()</pre>
+<div class="block">Gets whether another pass will be required.  Because there may be a limit on the number of inputs processed 
+ in a single run, multiple runs may be required to process all data in the desired date range.  
+ Must call <a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#createPlan()"><code>createPlan()</code></a> first.</div>
+<dl><dt><span class="strong">Returns:</span></dt><dd>true if another pass is required</dd></dl>
+</li>
+</ul>
+<a name="getInputSchemas()">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>getInputSchemas</h4>
+<pre>public&nbsp;java.util.List&lt;org.apache.avro.Schema&gt;&nbsp;getInputSchemas()</pre>
+<div class="block">Gets the input schemas.  Because multiple inputs are allowed, there may be multiple schemas.
+ Must call <a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#createPlan()"><code>createPlan()</code></a> first.
+ 
+ <p>
+ This does not include the output schema, even though previous output may be fed back as input.
+ The reason is that the output schema is determined based on the input schema.
+ </p></div>
+<dl><dt><span class="strong">Returns:</span></dt><dd>input schemas</dd></dl>
+</li>
+</ul>
+<a name="getInputSchemasByPath()">
+<!--   -->
+</a>
+<ul class="blockListLast">
+<li class="blockList">
+<h4>getInputSchemasByPath</h4>
+<pre>public&nbsp;java.util.Map&lt;java.lang.String,org.apache.avro.Schema&gt;&nbsp;getInputSchemasByPath()</pre>
+<div class="block">Gets a map from input path to schema.  Because multiple inputs are allowed, there may be multiple schemas.
+ Must call <a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html#createPlan()"><code>createPlan()</code></a> first.</div>
+<dl><dt><span class="strong">Returns:</span></dt><dd>map from path to input schema</dd></dl>
+</li>
+</ul>
+</li>
+</ul>
+</li>
+</ul>
+</div>
+</div>
+<!-- ========= END OF CLASS DATA ========= -->
+<!-- ======= START OF BOTTOM NAVBAR ====== -->
+<div class="bottomNav"><a name="navbar_bottom">
+<!--   -->
+</a><a href="#skip-navbar_bottom" title="Skip navigation links"></a><a name="navbar_bottom_firstrow">
+<!--   -->
+</a>
+<ul class="navList" title="Navigation">
+<li><a href="../../../overview-summary.html">Overview</a></li>
+<li><a href="package-summary.html">Package</a></li>
+<li class="navBarCell1Rev">Class</li>
+<li><a href="package-tree.html">Tree</a></li>
+<li><a href="../../../deprecated-list.html">Deprecated</a></li>
+<li><a href="../../../index-all.html">Index</a></li>
+<li><a href="../../../help-doc.html">Help</a></li>
+</ul>
+</div>
+<div class="subNav">
+<ul class="navList">
+<li><a href="../../../datafu/hourglass/jobs/MaxInputDataExceededException.html" title="class in datafu.hourglass.jobs"><span class="strong">Prev Class</span></a></li>
+<li><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html" title="class in datafu.hourglass.jobs"><span class="strong">Next Class</span></a></li>
+</ul>
+<ul class="navList">
+<li><a href="../../../index.html?datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html" target="_top">Frames</a></li>
+<li><a href="PartitionCollapsingExecutionPlanner.html" target="_top">No Frames</a></li>
+</ul>
+<ul class="navList" id="allclasses_navbar_bottom">
+<li><a href="../../../allclasses-noframe.html">All Classes</a></li>
+</ul>
+<div>
+<script type="text/javascript"><!--
+  allClassesLink = document.getElementById("allclasses_navbar_bottom");
+  if(window==top) {
+    allClassesLink.style.display = "block";
+  }
+  else {
+    allClassesLink.style.display = "none";
+  }
+  //-->
+</script>
+</div>
+<div>
+<ul class="subNavList">
+<li>Summary:&nbsp;</li>
+<li>Nested&nbsp;|&nbsp;</li>
+<li>Field&nbsp;|&nbsp;</li>
+<li><a href="#constructor_summary">Constr</a>&nbsp;|&nbsp;</li>
+<li><a href="#method_summary">Method</a></li>
+</ul>
+<ul class="subNavList">
+<li>Detail:&nbsp;</li>
+<li>Field&nbsp;|&nbsp;</li>
+<li><a href="#constructor_detail">Constr</a>&nbsp;|&nbsp;</li>
+<li><a href="#method_detail">Method</a></li>
+</ul>
+</div>
+<a name="skip-navbar_bottom">
+<!--   -->
+</a></div>
+<!-- ======== END OF BOTTOM NAVBAR ======= -->
+</body>
+</html>

Added: datafu/site/docs/hourglass/1.4.0/datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html
URL: http://svn.apache.org/viewvc/datafu/site/docs/hourglass/1.4.0/datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html?rev=1827525&view=auto
==============================================================================
--- datafu/site/docs/hourglass/1.4.0/datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html (added)
+++ datafu/site/docs/hourglass/1.4.0/datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html Thu Mar 22 19:01:04 2018
@@ -0,0 +1,709 @@
+<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
+<!-- NewPage -->
+<html lang="en">
+<head>
+<!-- Generated by javadoc (version 1.7.0_79) on Thu Mar 22 11:58:07 PDT 2018 -->
+<title>PartitionCollapsingIncrementalJob (datafu-hourglass 1.4.0 API)</title>
+<meta name="date" content="2018-03-22">
+<link rel="stylesheet" type="text/css" href="../../../stylesheet.css" title="Style">
+</head>
+<body>
+<script type="text/javascript"><!--
+    if (location.href.indexOf('is-external=true') == -1) {
+        parent.document.title="PartitionCollapsingIncrementalJob (datafu-hourglass 1.4.0 API)";
+    }
+//-->
+</script>
+<noscript>
+<div>JavaScript is disabled on your browser.</div>
+</noscript>
+<!-- ========= START OF TOP NAVBAR ======= -->
+<div class="topNav"><a name="navbar_top">
+<!--   -->
+</a><a href="#skip-navbar_top" title="Skip navigation links"></a><a name="navbar_top_firstrow">
+<!--   -->
+</a>
+<ul class="navList" title="Navigation">
+<li><a href="../../../overview-summary.html">Overview</a></li>
+<li><a href="package-summary.html">Package</a></li>
+<li class="navBarCell1Rev">Class</li>
+<li><a href="package-tree.html">Tree</a></li>
+<li><a href="../../../deprecated-list.html">Deprecated</a></li>
+<li><a href="../../../index-all.html">Index</a></li>
+<li><a href="../../../help-doc.html">Help</a></li>
+</ul>
+</div>
+<div class="subNav">
+<ul class="navList">
+<li><a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html" title="class in datafu.hourglass.jobs"><span class="strong">Prev Class</span></a></li>
+<li><a href="../../../datafu/hourglass/jobs/PartitionPreservingExecutionPlanner.html" title="class in datafu.hourglass.jobs"><span class="strong">Next Class</span></a></li>
+</ul>
+<ul class="navList">
+<li><a href="../../../index.html?datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html" target="_top">Frames</a></li>
+<li><a href="PartitionCollapsingIncrementalJob.html" target="_top">No Frames</a></li>
+</ul>
+<ul class="navList" id="allclasses_navbar_top">
+<li><a href="../../../allclasses-noframe.html">All Classes</a></li>
+</ul>
+<div>
+<script type="text/javascript"><!--
+  allClassesLink = document.getElementById("allclasses_navbar_top");
+  if(window==top) {
+    allClassesLink.style.display = "block";
+  }
+  else {
+    allClassesLink.style.display = "none";
+  }
+  //-->
+</script>
+</div>
+<div>
+<ul class="subNavList">
+<li>Summary:&nbsp;</li>
+<li><a href="#nested_classes_inherited_from_class_datafu.hourglass.jobs.AbstractPartitionCollapsingIncrementalJob">Nested</a>&nbsp;|&nbsp;</li>
+<li><a href="#fields_inherited_from_class_datafu.hourglass.jobs.AbstractPartitionCollapsingIncrementalJob">Field</a>&nbsp;|&nbsp;</li>
+<li><a href="#constructor_summary">Constr</a>&nbsp;|&nbsp;</li>
+<li><a href="#method_summary">Method</a></li>
+</ul>
+<ul class="subNavList">
+<li>Detail:&nbsp;</li>
+<li>Field&nbsp;|&nbsp;</li>
+<li><a href="#constructor_detail">Constr</a>&nbsp;|&nbsp;</li>
+<li><a href="#method_detail">Method</a></li>
+</ul>
+</div>
+<a name="skip-navbar_top">
+<!--   -->
+</a></div>
+<!-- ========= END OF TOP NAVBAR ========= -->
+<!-- ======== START OF CLASS DATA ======== -->
+<div class="header">
+<div class="subTitle">datafu.hourglass.jobs</div>
+<h2 title="Class PartitionCollapsingIncrementalJob" class="title">Class PartitionCollapsingIncrementalJob</h2>
+</div>
+<div class="contentContainer">
+<ul class="inheritance">
+<li>java.lang.Object</li>
+<li>
+<ul class="inheritance">
+<li>org.apache.hadoop.conf.Configured</li>
+<li>
+<ul class="inheritance">
+<li><a href="../../../datafu/hourglass/jobs/AbstractJob.html" title="class in datafu.hourglass.jobs">datafu.hourglass.jobs.AbstractJob</a></li>
+<li>
+<ul class="inheritance">
+<li><a href="../../../datafu/hourglass/jobs/TimeBasedJob.html" title="class in datafu.hourglass.jobs">datafu.hourglass.jobs.TimeBasedJob</a></li>
+<li>
+<ul class="inheritance">
+<li><a href="../../../datafu/hourglass/jobs/IncrementalJob.html" title="class in datafu.hourglass.jobs">datafu.hourglass.jobs.IncrementalJob</a></li>
+<li>
+<ul class="inheritance">
+<li><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html" title="class in datafu.hourglass.jobs">datafu.hourglass.jobs.AbstractPartitionCollapsingIncrementalJob</a></li>
+<li>
+<ul class="inheritance">
+<li>datafu.hourglass.jobs.PartitionCollapsingIncrementalJob</li>
+</ul>
+</li>
+</ul>
+</li>
+</ul>
+</li>
+</ul>
+</li>
+</ul>
+</li>
+</ul>
+</li>
+</ul>
+<div class="description">
+<ul class="blockList">
+<li class="blockList">
+<dl>
+<dt>All Implemented Interfaces:</dt>
+<dd>org.apache.hadoop.conf.Configurable</dd>
+</dl>
+<hr>
+<br>
+<pre>public class <span class="strong">PartitionCollapsingIncrementalJob</span>
+extends <a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html" title="class in datafu.hourglass.jobs">AbstractPartitionCollapsingIncrementalJob</a></pre>
+<div class="block">A concrete version of <a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html" title="class in datafu.hourglass.jobs"><code>AbstractPartitionCollapsingIncrementalJob</code></a>.
+ 
+ This provides an alternative to extending <a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html" title="class in datafu.hourglass.jobs"><code>AbstractPartitionCollapsingIncrementalJob</code></a>.
+ Rather than extending that class and implementing its abstract methods, this concrete version
+ can be used directly.  Getters and setters have been provided for the abstract methods.</div>
+</li>
+</ul>
+</div>
+<div class="summary">
+<ul class="blockList">
+<li class="blockList">
+<!-- ======== NESTED CLASS SUMMARY ======== -->
+<ul class="blockList">
+<li class="blockList"><a name="nested_class_summary">
+<!--   -->
+</a>
+<h3>Nested Class Summary</h3>
+<ul class="blockList">
+<li class="blockList"><a name="nested_classes_inherited_from_class_datafu.hourglass.jobs.AbstractPartitionCollapsingIncrementalJob">
+<!--   -->
+</a>
+<h3>Nested classes/interfaces inherited from class&nbsp;datafu.hourglass.jobs.<a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html" title="class in datafu.hourglass.jobs">AbstractPartitionCollapsingIncrementalJob</a></h3>
+<code><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.Report.html" title="class in datafu.hourglass.jobs">AbstractPartitionCollapsingIncrementalJob.Report</a></code></li>
+</ul>
+</li>
+</ul>
+<!-- =========== FIELD SUMMARY =========== -->
+<ul class="blockList">
+<li class="blockList"><a name="field_summary">
+<!--   -->
+</a>
+<h3>Field Summary</h3>
+<ul class="blockList">
+<li class="blockList"><a name="fields_inherited_from_class_datafu.hourglass.jobs.AbstractPartitionCollapsingIncrementalJob">
+<!--   -->
+</a>
+<h3>Fields inherited from class&nbsp;datafu.hourglass.jobs.<a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html" title="class in datafu.hourglass.jobs">AbstractPartitionCollapsingIncrementalJob</a></h3>
+<code><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#_reusePreviousOutput">_reusePreviousOutput</a></code></li>
+</ul>
+</li>
+</ul>
+<!-- ======== CONSTRUCTOR SUMMARY ======== -->
+<ul class="blockList">
+<li class="blockList"><a name="constructor_summary">
+<!--   -->
+</a>
+<h3>Constructor Summary</h3>
+<table class="overviewSummary" border="0" cellpadding="3" cellspacing="0" summary="Constructor Summary table, listing constructors, and an explanation">
+<caption><span>Constructors</span><span class="tabEnd">&nbsp;</span></caption>
+<tr>
+<th class="colOne" scope="col">Constructor and Description</th>
+</tr>
+<tr class="altColor">
+<td class="colOne"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#PartitionCollapsingIncrementalJob(java.lang.Class)">PartitionCollapsingIncrementalJob</a></strong>(java.lang.Class&nbsp;cls)</code>
+<div class="block">Initializes the job.</div>
+</td>
+</tr>
+</table>
+</li>
+</ul>
+<!-- ========== METHOD SUMMARY =========== -->
+<ul class="blockList">
+<li class="blockList"><a name="method_summary">
+<!--   -->
+</a>
+<h3>Method Summary</h3>
+<table class="overviewSummary" border="0" cellpadding="3" cellspacing="0" summary="Method Summary table, listing methods, and an explanation">
+<caption><span>Methods</span><span class="tabEnd">&nbsp;</span></caption>
+<tr>
+<th class="colFirst" scope="col">Modifier and Type</th>
+<th class="colLast" scope="col">Method and Description</th>
+</tr>
+<tr class="altColor">
+<td class="colFirst"><code>void</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#config(org.apache.hadoop.conf.Configuration)">config</a></strong>(org.apache.hadoop.conf.Configuration&nbsp;conf)</code>
+<div class="block">Overridden to provide custom configuration before the job starts.</div>
+</td>
+</tr>
+<tr class="rowColor">
+<td class="colFirst"><code><a href="../../../datafu/hourglass/model/Accumulator.html" title="interface in datafu.hourglass.model">Accumulator</a>&lt;org.apache.avro.generic.GenericRecord,org.apache.avro.generic.GenericRecord&gt;</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#getCombinerAccumulator()">getCombinerAccumulator</a></strong>()</code>
+<div class="block">Gets the accumulator used for the combiner.</div>
+</td>
+</tr>
+<tr class="altColor">
+<td class="colFirst"><code>protected org.apache.avro.Schema</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#getIntermediateValueSchema()">getIntermediateValueSchema</a></strong>()</code>
+<div class="block">Gets the Avro schema for the intermediate value.</div>
+</td>
+</tr>
+<tr class="rowColor">
+<td class="colFirst"><code>protected org.apache.avro.Schema</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#getKeySchema()">getKeySchema</a></strong>()</code>
+<div class="block">Gets the Avro schema for the key.</div>
+</td>
+</tr>
+<tr class="altColor">
+<td class="colFirst"><code><a href="../../../datafu/hourglass/model/Mapper.html" title="interface in datafu.hourglass.model">Mapper</a>&lt;org.apache.avro.generic.GenericRecord,org.apache.avro.generic.GenericRecord,org.apache.avro.generic.GenericRecord&gt;</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#getMapper()">getMapper</a></strong>()</code>
+<div class="block">Gets the mapper.</div>
+</td>
+</tr>
+<tr class="rowColor">
+<td class="colFirst"><code><a href="../../../datafu/hourglass/model/Merger.html" title="interface in datafu.hourglass.model">Merger</a>&lt;org.apache.avro.generic.GenericRecord&gt;</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#getOldRecordMerger()">getOldRecordMerger</a></strong>()</code>
+<div class="block">Gets the record merger that is capable of unmerging old partial output from the new output.</div>
+</td>
+</tr>
+<tr class="altColor">
+<td class="colFirst"><code>protected org.apache.avro.Schema</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#getOutputValueSchema()">getOutputValueSchema</a></strong>()</code>
+<div class="block">Gets the Avro schema for the output data.</div>
+</td>
+</tr>
+<tr class="rowColor">
+<td class="colFirst"><code><a href="../../../datafu/hourglass/model/Merger.html" title="interface in datafu.hourglass.model">Merger</a>&lt;org.apache.avro.generic.GenericRecord&gt;</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#getRecordMerger()">getRecordMerger</a></strong>()</code>
+<div class="block">Gets the record merger that is capable of merging previous output with a new partial output.</div>
+</td>
+</tr>
+<tr class="altColor">
+<td class="colFirst"><code><a href="../../../datafu/hourglass/model/Accumulator.html" title="interface in datafu.hourglass.model">Accumulator</a>&lt;org.apache.avro.generic.GenericRecord,org.apache.avro.generic.GenericRecord&gt;</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#getReducerAccumulator()">getReducerAccumulator</a></strong>()</code>
+<div class="block">Gets the accumulator used for the reducer.</div>
+</td>
+</tr>
+<tr class="rowColor">
+<td class="colFirst"><code>void</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#setCombinerAccumulator(datafu.hourglass.model.Accumulator)">setCombinerAccumulator</a></strong>(<a href="../../../datafu/hourglass/model/Accumulator.html" title="interface in datafu.hourglass.model">Accumulator</a>&lt;org.apache.avro.generic.GenericRecord,org.apache.avro.generic.GenericRecord&gt;&nbsp;combiner)</code>
+<div class="block">Set the accumulator for the combiner.</div>
+</td>
+</tr>
+<tr class="altColor">
+<td class="colFirst"><code>void</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#setIntermediateValueSchema(org.apache.avro.Schema)">setIntermediateValueSchema</a></strong>(org.apache.avro.Schema&nbsp;intermediateValueSchema)</code>
+<div class="block">Sets the Avro schema for the intermediate value.</div>
+</td>
+</tr>
+<tr class="rowColor">
+<td class="colFirst"><code>void</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#setKeySchema(org.apache.avro.Schema)">setKeySchema</a></strong>(org.apache.avro.Schema&nbsp;keySchema)</code>
+<div class="block">Sets the Avro schema for the key.</div>
+</td>
+</tr>
+<tr class="altColor">
+<td class="colFirst"><code>void</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#setMapper(datafu.hourglass.model.Mapper)">setMapper</a></strong>(<a href="../../../datafu/hourglass/model/Mapper.html" title="interface in datafu.hourglass.model">Mapper</a>&lt;org.apache.avro.generic.GenericRecord,org.apache.avro.generic.GenericRecord,org.apache.avro.generic.GenericRecord&gt;&nbsp;mapper)</code>
+<div class="block">Set the mapper.</div>
+</td>
+</tr>
+<tr class="rowColor">
+<td class="colFirst"><code>void</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#setMerger(datafu.hourglass.model.Merger)">setMerger</a></strong>(<a href="../../../datafu/hourglass/model/Merger.html" title="interface in datafu.hourglass.model">Merger</a>&lt;org.apache.avro.generic.GenericRecord&gt;&nbsp;merger)</code>
+<div class="block">Sets the record merger that is capable of merging previous output with a new partial output.</div>
+</td>
+</tr>
+<tr class="altColor">
+<td class="colFirst"><code>void</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#setOldMerger(datafu.hourglass.model.Merger)">setOldMerger</a></strong>(<a href="../../../datafu/hourglass/model/Merger.html" title="interface in datafu.hourglass.model">Merger</a>&lt;org.apache.avro.generic.GenericRecord&gt;&nbsp;oldMerger)</code>
+<div class="block">Sets the record merger that is capable of unmerging old partial output from the new output.</div>
+</td>
+</tr>
+<tr class="rowColor">
+<td class="colFirst"><code>void</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#setOnSetup(datafu.hourglass.jobs.Setup)">setOnSetup</a></strong>(<a href="../../../datafu/hourglass/jobs/Setup.html" title="interface in datafu.hourglass.jobs">Setup</a>&nbsp;setup)</code>
+<div class="block">Set callback to provide custom configuration before job begins execution.</div>
+</td>
+</tr>
+<tr class="altColor">
+<td class="colFirst"><code>void</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#setOutputValueSchema(org.apache.avro.Schema)">setOutputValueSchema</a></strong>(org.apache.avro.Schema&nbsp;outputValueSchema)</code>
+<div class="block">Sets the Avro schema for the output data.</div>
+</td>
+</tr>
+<tr class="rowColor">
+<td class="colFirst"><code>void</code></td>
+<td class="colLast"><code><strong><a href="../../../datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html#setReducerAccumulator(datafu.hourglass.model.Accumulator)">setReducerAccumulator</a></strong>(<a href="../../../datafu/hourglass/model/Accumulator.html" title="interface in datafu.hourglass.model">Accumulator</a>&lt;org.apache.avro.generic.GenericRecord,org.apache.avro.generic.GenericRecord&gt;&nbsp;reducer)</code>
+<div class="block">Set the accumulator for the reducer.</div>
+</td>
+</tr>
+</table>
+<ul class="blockList">
+<li class="blockList"><a name="methods_inherited_from_class_datafu.hourglass.jobs.AbstractPartitionCollapsingIncrementalJob">
+<!--   -->
+</a>
+<h3>Methods inherited from class&nbsp;datafu.hourglass.jobs.<a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html" title="class in datafu.hourglass.jobs">AbstractPartitionCollapsingIncrementalJob</a></h3>
+<code><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#getOutputSchemaName()">getOutputSchemaName</a>, <a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#getOutputSchemaNamespace()">getOutputSchemaNamespace</a>, <a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#getReports()">getReports</a>, <a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#getReusePreviousOutput()">getReusePreviousOutput</a>, <a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#initialize()">initialize</a>, <a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#run()">run</a>, <a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#setProperties(java.util.Properties)">setProperties</a>, <a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#setReusePreviousOutput(boolean)">setReusePreviousOutput</a></code></li>
+</ul>
+<ul class="blockList">
+<li class="blockList"><a name="methods_inherited_from_class_datafu.hourglass.jobs.IncrementalJob">
+<!--   -->
+</a>
+<h3>Methods inherited from class&nbsp;datafu.hourglass.jobs.<a href="../../../datafu/hourglass/jobs/IncrementalJob.html" title="class in datafu.hourglass.jobs">IncrementalJob</a></h3>
+<code><a href="../../../datafu/hourglass/jobs/IncrementalJob.html#getMaxIterations()">getMaxIterations</a>, <a href="../../../datafu/hourglass/jobs/IncrementalJob.html#getMaxToProcess()">getMaxToProcess</a>, <a href="../../../datafu/hourglass/jobs/IncrementalJob.html#getSchemas()">getSchemas</a>, <a href="../../../datafu/hourglass/jobs/IncrementalJob.html#isFailOnMissing()">isFailOnMissing</a>, <a href="../../../datafu/hourglass/jobs/IncrementalJob.html#setFailOnMissing(boolean)">setFailOnMissing</a>, <a href="../../../datafu/hourglass/jobs/IncrementalJob.html#setMaxIterations(java.lang.Integer)">setMaxIterations</a>, <a href="../../../datafu/hourglass/jobs/IncrementalJob.html#setMaxToProcess(java.lang.Integer)">setMaxToProcess</a></code></li>
+</ul>
+<ul class="blockList">
+<li class="blockList"><a name="methods_inherited_from_class_datafu.hourglass.jobs.TimeBasedJob">
+<!--   -->
+</a>
+<h3>Methods inherited from class&nbsp;datafu.hourglass.jobs.<a href="../../../datafu/hourglass/jobs/TimeBasedJob.html" title="class in datafu.hourglass.jobs">TimeBasedJob</a></h3>
+<code><a href="../../../datafu/hourglass/jobs/TimeBasedJob.html#getDaysAgo()">getDaysAgo</a>, <a href="../../../datafu/hourglass/jobs/TimeBasedJob.html#getEndDate()">getEndDate</a>, <a href="../../../datafu/hourglass/jobs/TimeBasedJob.html#getNumDays()">getNumDays</a>, <a href="../../../datafu/hourglass/jobs/TimeBasedJob.html#getStartDate()">getStartDate</a>, <a href="../../../datafu/hourglass/jobs/TimeBasedJob.html#setDaysAgo(java.lang.Integer)">setDaysAgo</a>, <a href="../../../datafu/hourglass/jobs/TimeBasedJob.html#setEndDate(java.util.Date)">setEndDate</a>, <a href="../../../datafu/hourglass/jobs/TimeBasedJob.html#setNumDays(java.lang.Integer)">setNumDays</a>, <a href="../../../datafu/hourglass/jobs/TimeBasedJob.html#setStartDate(java.util.Date)">setStartDate</a>, <a href="../../../datafu/hourglass/jobs/TimeBasedJob.html#validate()">validate</a></code></li>
+</ul>
+<ul class="blockList">
+<li class="blockList"><a name="methods_inherited_from_class_datafu.hourglass.jobs.AbstractJob">
+<!--   -->
+</a>
+<h3>Methods inherited from class&nbsp;datafu.hourglass.jobs.<a href="../../../datafu/hourglass/jobs/AbstractJob.html" title="class in datafu.hourglass.jobs">AbstractJob</a></h3>
+<code><a href="../../../datafu/hourglass/jobs/AbstractJob.html#createRandomTempPath()">createRandomTempPath</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#ensurePath(org.apache.hadoop.fs.Path)">ensurePath</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#getCountersParentPath()">getCountersParentPath</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#getFileSystem()">getFileSystem</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#getInputPaths()">getInputPaths</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#getName()">getName</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#getNumReducers()">getNumReducers</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#getOutputPath()">getOutputPath</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#getProperties()">getProperties</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#getRetentionCount()">getRetentionCount</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#getTempPath()">getTempPath</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#isUseCombiner()">isUseCombiner</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#randomTempPath()">randomTempPath</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#setCountersParentPath(org.apache.hadoop.fs.Path)">setCountersParentPath</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#setInputPaths(java.util.List)">setInputPaths</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#setName(java.lang.String)">setName</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#setNumReducers(java.lang.Integer)">setNumReducers</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#setOutputPath(org.apache.hadoop.fs.Path)">setOutputPath</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#setRetentionCount(java.lang.Integer)">setRetentionCount</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#setTempPath(org.apache.hadoop.fs.Path)">setTempPath</a>, <a href="../../../datafu/hourglass/jobs/AbstractJob.html#setUseCombiner(boolean)">setUseCombiner</a></code></li>
+</ul>
+<ul class="blockList">
+<li class="blockList"><a name="methods_inherited_from_class_org.apache.hadoop.conf.Configured">
+<!--   -->
+</a>
+<h3>Methods inherited from class&nbsp;org.apache.hadoop.conf.Configured</h3>
+<code>getConf, setConf</code></li>
+</ul>
+<ul class="blockList">
+<li class="blockList"><a name="methods_inherited_from_class_java.lang.Object">
+<!--   -->
+</a>
+<h3>Methods inherited from class&nbsp;java.lang.Object</h3>
+<code>clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait</code></li>
+</ul>
+</li>
+</ul>
+</li>
+</ul>
+</div>
+<div class="details">
+<ul class="blockList">
+<li class="blockList">
+<!-- ========= CONSTRUCTOR DETAIL ======== -->
+<ul class="blockList">
+<li class="blockList"><a name="constructor_detail">
+<!--   -->
+</a>
+<h3>Constructor Detail</h3>
+<a name="PartitionCollapsingIncrementalJob(java.lang.Class)">
+<!--   -->
+</a>
+<ul class="blockListLast">
+<li class="blockList">
+<h4>PartitionCollapsingIncrementalJob</h4>
+<pre>public&nbsp;PartitionCollapsingIncrementalJob(java.lang.Class&nbsp;cls)
+                                  throws java.io.IOException</pre>
+<div class="block">Initializes the job.  The job name is derived from the name of a provided class.</div>
+<dl><dt><span class="strong">Parameters:</span></dt><dd><code>cls</code> - class to base job name on</dd>
+<dt><span class="strong">Throws:</span></dt>
+<dd><code>java.io.IOException</code> - IOException</dd></dl>
+</li>
+</ul>
+</li>
+</ul>
+<!-- ============ METHOD DETAIL ========== -->
+<ul class="blockList">
+<li class="blockList"><a name="method_detail">
+<!--   -->
+</a>
+<h3>Method Detail</h3>
+<a name="getMapper()">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>getMapper</h4>
+<pre>public&nbsp;<a href="../../../datafu/hourglass/model/Mapper.html" title="interface in datafu.hourglass.model">Mapper</a>&lt;org.apache.avro.generic.GenericRecord,org.apache.avro.generic.GenericRecord,org.apache.avro.generic.GenericRecord&gt;&nbsp;getMapper()</pre>
+<div class="block"><strong>Description copied from class:&nbsp;<code><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#getMapper()">AbstractPartitionCollapsingIncrementalJob</a></code></strong></div>
+<div class="block">Gets the mapper.</div>
+<dl>
+<dt><strong>Specified by:</strong></dt>
+<dd><code><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#getMapper()">getMapper</a></code>&nbsp;in class&nbsp;<code><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html" title="class in datafu.hourglass.jobs">AbstractPartitionCollapsingIncrementalJob</a></code></dd>
+<dt><span class="strong">Returns:</span></dt><dd>mapper</dd></dl>
+</li>
+</ul>
+<a name="getCombinerAccumulator()">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>getCombinerAccumulator</h4>
+<pre>public&nbsp;<a href="../../../datafu/hourglass/model/Accumulator.html" title="interface in datafu.hourglass.model">Accumulator</a>&lt;org.apache.avro.generic.GenericRecord,org.apache.avro.generic.GenericRecord&gt;&nbsp;getCombinerAccumulator()</pre>
+<div class="block"><strong>Description copied from class:&nbsp;<code><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#getCombinerAccumulator()">AbstractPartitionCollapsingIncrementalJob</a></code></strong></div>
+<div class="block">Gets the accumulator used for the combiner.</div>
+<dl>
+<dt><strong>Overrides:</strong></dt>
+<dd><code><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#getCombinerAccumulator()">getCombinerAccumulator</a></code>&nbsp;in class&nbsp;<code><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html" title="class in datafu.hourglass.jobs">AbstractPartitionCollapsingIncrementalJob</a></code></dd>
+<dt><span class="strong">Returns:</span></dt><dd>combiner accumulator</dd></dl>
+</li>
+</ul>
+<a name="getReducerAccumulator()">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>getReducerAccumulator</h4>
+<pre>public&nbsp;<a href="../../../datafu/hourglass/model/Accumulator.html" title="interface in datafu.hourglass.model">Accumulator</a>&lt;org.apache.avro.generic.GenericRecord,org.apache.avro.generic.GenericRecord&gt;&nbsp;getReducerAccumulator()</pre>
+<div class="block"><strong>Description copied from class:&nbsp;<code><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#getReducerAccumulator()">AbstractPartitionCollapsingIncrementalJob</a></code></strong></div>
+<div class="block">Gets the accumulator used for the reducer.</div>
+<dl>
+<dt><strong>Specified by:</strong></dt>
+<dd><code><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#getReducerAccumulator()">getReducerAccumulator</a></code>&nbsp;in class&nbsp;<code><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html" title="class in datafu.hourglass.jobs">AbstractPartitionCollapsingIncrementalJob</a></code></dd>
+<dt><span class="strong">Returns:</span></dt><dd>reducer accumulator</dd></dl>
+</li>
+</ul>
+<a name="getKeySchema()">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>getKeySchema</h4>
+<pre>protected&nbsp;org.apache.avro.Schema&nbsp;getKeySchema()</pre>
+<div class="block"><strong>Description copied from class:&nbsp;<code><a href="../../../datafu/hourglass/jobs/IncrementalJob.html#getKeySchema()">IncrementalJob</a></code></strong></div>
+<div class="block">Gets the Avro schema for the key.
+ <p>
+ This is also used as the key for the map output.</div>
+<dl>
+<dt><strong>Specified by:</strong></dt>
+<dd><code><a href="../../../datafu/hourglass/jobs/IncrementalJob.html#getKeySchema()">getKeySchema</a></code>&nbsp;in class&nbsp;<code><a href="../../../datafu/hourglass/jobs/IncrementalJob.html" title="class in datafu.hourglass.jobs">IncrementalJob</a></code></dd>
+<dt><span class="strong">Returns:</span></dt><dd>key schema.</dd></dl>
+</li>
+</ul>
+<a name="getIntermediateValueSchema()">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>getIntermediateValueSchema</h4>
+<pre>protected&nbsp;org.apache.avro.Schema&nbsp;getIntermediateValueSchema()</pre>
+<div class="block"><strong>Description copied from class:&nbsp;<code><a href="../../../datafu/hourglass/jobs/IncrementalJob.html#getIntermediateValueSchema()">IncrementalJob</a></code></strong></div>
+<div class="block">Gets the Avro schema for the intermediate value.
+ <p>
+ This is also used for the value for the map output.</div>
+<dl>
+<dt><strong>Specified by:</strong></dt>
+<dd><code><a href="../../../datafu/hourglass/jobs/IncrementalJob.html#getIntermediateValueSchema()">getIntermediateValueSchema</a></code>&nbsp;in class&nbsp;<code><a href="../../../datafu/hourglass/jobs/IncrementalJob.html" title="class in datafu.hourglass.jobs">IncrementalJob</a></code></dd>
+<dt><span class="strong">Returns:</span></dt><dd>intermediate value schema</dd></dl>
+</li>
+</ul>
+<a name="getOutputValueSchema()">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>getOutputValueSchema</h4>
+<pre>protected&nbsp;org.apache.avro.Schema&nbsp;getOutputValueSchema()</pre>
+<div class="block"><strong>Description copied from class:&nbsp;<code><a href="../../../datafu/hourglass/jobs/IncrementalJob.html#getOutputValueSchema()">IncrementalJob</a></code></strong></div>
+<div class="block">Gets the Avro schema for the output data.</div>
+<dl>
+<dt><strong>Specified by:</strong></dt>
+<dd><code><a href="../../../datafu/hourglass/jobs/IncrementalJob.html#getOutputValueSchema()">getOutputValueSchema</a></code>&nbsp;in class&nbsp;<code><a href="../../../datafu/hourglass/jobs/IncrementalJob.html" title="class in datafu.hourglass.jobs">IncrementalJob</a></code></dd>
+<dt><span class="strong">Returns:</span></dt><dd>output data schema</dd></dl>
+</li>
+</ul>
+<a name="getRecordMerger()">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>getRecordMerger</h4>
+<pre>public&nbsp;<a href="../../../datafu/hourglass/model/Merger.html" title="interface in datafu.hourglass.model">Merger</a>&lt;org.apache.avro.generic.GenericRecord&gt;&nbsp;getRecordMerger()</pre>
+<div class="block"><strong>Description copied from class:&nbsp;<code><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#getRecordMerger()">AbstractPartitionCollapsingIncrementalJob</a></code></strong></div>
+<div class="block">Gets the record merger that is capable of merging previous output with a new partial output.
+ This is only needed when reusing previous output where the intermediate and output schemas are different.
+ New partial output is produced by the reducer from new input that is after the previous output.</div>
+<dl>
+<dt><strong>Overrides:</strong></dt>
+<dd><code><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#getRecordMerger()">getRecordMerger</a></code>&nbsp;in class&nbsp;<code><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html" title="class in datafu.hourglass.jobs">AbstractPartitionCollapsingIncrementalJob</a></code></dd>
+<dt><span class="strong">Returns:</span></dt><dd>merger</dd></dl>
+</li>
+</ul>
+<a name="getOldRecordMerger()">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>getOldRecordMerger</h4>
+<pre>public&nbsp;<a href="../../../datafu/hourglass/model/Merger.html" title="interface in datafu.hourglass.model">Merger</a>&lt;org.apache.avro.generic.GenericRecord&gt;&nbsp;getOldRecordMerger()</pre>
+<div class="block"><strong>Description copied from class:&nbsp;<code><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#getOldRecordMerger()">AbstractPartitionCollapsingIncrementalJob</a></code></strong></div>
+<div class="block">Gets the record merger that is capable of unmerging old partial output from the new output.
+ This is only needed when reusing previous output for a fixed-length sliding window.
+ The new output is the result of merging the previous output with the new partial output.
+ The old partial output is produced by the reducer from old input data before the time range of
+ the previous output.</div>
+<dl>
+<dt><strong>Overrides:</strong></dt>
+<dd><code><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html#getOldRecordMerger()">getOldRecordMerger</a></code>&nbsp;in class&nbsp;<code><a href="../../../datafu/hourglass/jobs/AbstractPartitionCollapsingIncrementalJob.html" title="class in datafu.hourglass.jobs">AbstractPartitionCollapsingIncrementalJob</a></code></dd>
+<dt><span class="strong">Returns:</span></dt><dd>merger</dd></dl>
+</li>
+</ul>
+<a name="setMapper(datafu.hourglass.model.Mapper)">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>setMapper</h4>
+<pre>public&nbsp;void&nbsp;setMapper(<a href="../../../datafu/hourglass/model/Mapper.html" title="interface in datafu.hourglass.model">Mapper</a>&lt;org.apache.avro.generic.GenericRecord,org.apache.avro.generic.GenericRecord,org.apache.avro.generic.GenericRecord&gt;&nbsp;mapper)</pre>
+<div class="block">Set the mapper.</div>
+<dl><dt><span class="strong">Parameters:</span></dt><dd><code>mapper</code> - the mapper</dd></dl>
+</li>
+</ul>
+<a name="setCombinerAccumulator(datafu.hourglass.model.Accumulator)">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>setCombinerAccumulator</h4>
+<pre>public&nbsp;void&nbsp;setCombinerAccumulator(<a href="../../../datafu/hourglass/model/Accumulator.html" title="interface in datafu.hourglass.model">Accumulator</a>&lt;org.apache.avro.generic.GenericRecord,org.apache.avro.generic.GenericRecord&gt;&nbsp;combiner)</pre>
+<div class="block">Set the accumulator for the combiner.</div>
+<dl><dt><span class="strong">Parameters:</span></dt><dd><code>combiner</code> - accumulator for the combiner</dd></dl>
+</li>
+</ul>
+<a name="setReducerAccumulator(datafu.hourglass.model.Accumulator)">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>setReducerAccumulator</h4>
+<pre>public&nbsp;void&nbsp;setReducerAccumulator(<a href="../../../datafu/hourglass/model/Accumulator.html" title="interface in datafu.hourglass.model">Accumulator</a>&lt;org.apache.avro.generic.GenericRecord,org.apache.avro.generic.GenericRecord&gt;&nbsp;reducer)</pre>
+<div class="block">Set the accumulator for the reducer.</div>
+<dl><dt><span class="strong">Parameters:</span></dt><dd><code>reducer</code> - accumulator for the reducer</dd></dl>
+</li>
+</ul>
+<a name="setKeySchema(org.apache.avro.Schema)">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>setKeySchema</h4>
+<pre>public&nbsp;void&nbsp;setKeySchema(org.apache.avro.Schema&nbsp;keySchema)</pre>
+<div class="block">Sets the Avro schema for the key.
+ <p>
+ This is also used as the key for the map output.</div>
+<dl><dt><span class="strong">Parameters:</span></dt><dd><code>keySchema</code> - key schema</dd></dl>
+</li>
+</ul>
+<a name="setIntermediateValueSchema(org.apache.avro.Schema)">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>setIntermediateValueSchema</h4>
+<pre>public&nbsp;void&nbsp;setIntermediateValueSchema(org.apache.avro.Schema&nbsp;intermediateValueSchema)</pre>
+<div class="block">Sets the Avro schema for the intermediate value.
+ <p>
+ This is also used as the value for the map output.</div>
+<dl><dt><span class="strong">Parameters:</span></dt><dd><code>intermediateValueSchema</code> - intermediate value schema</dd></dl>
+</li>
+</ul>
+<a name="setOutputValueSchema(org.apache.avro.Schema)">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>setOutputValueSchema</h4>
+<pre>public&nbsp;void&nbsp;setOutputValueSchema(org.apache.avro.Schema&nbsp;outputValueSchema)</pre>
+<div class="block">Sets the Avro schema for the output data.</div>
+<dl><dt><span class="strong">Parameters:</span></dt><dd><code>outputValueSchema</code> - output value schema</dd></dl>
+</li>
+</ul>
+<a name="setMerger(datafu.hourglass.model.Merger)">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>setMerger</h4>
+<pre>public&nbsp;void&nbsp;setMerger(<a href="../../../datafu/hourglass/model/Merger.html" title="interface in datafu.hourglass.model">Merger</a>&lt;org.apache.avro.generic.GenericRecord&gt;&nbsp;merger)</pre>
+<div class="block">Sets the record merger that is capable of merging previous output with a new partial output.
+ This is only needed when reusing previous output where the intermediate and output schemas are different.
+ New partial output is produced by the reducer from new input that is after the previous output.</div>
+<dl><dt><span class="strong">Parameters:</span></dt><dd><code>merger</code> - the merger</dd></dl>
+</li>
+</ul>
+<a name="setOldMerger(datafu.hourglass.model.Merger)">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>setOldMerger</h4>
+<pre>public&nbsp;void&nbsp;setOldMerger(<a href="../../../datafu/hourglass/model/Merger.html" title="interface in datafu.hourglass.model">Merger</a>&lt;org.apache.avro.generic.GenericRecord&gt;&nbsp;oldMerger)</pre>
+<div class="block">Sets the record merger that is capable of unmerging old partial output from the new output.
+ This is only needed when reusing previous output for a fixed-length sliding window.
+ The new output is the result of merging the previous output with the new partial output.
+ The old partial output is produced by the reducer from old input data before the time range of
+ the previous output.</div>
+<dl><dt><span class="strong">Parameters:</span></dt><dd><code>oldMerger</code> - merger</dd></dl>
+</li>
+</ul>
+<a name="setOnSetup(datafu.hourglass.jobs.Setup)">
+<!--   -->
+</a>
+<ul class="blockList">
+<li class="blockList">
+<h4>setOnSetup</h4>
+<pre>public&nbsp;void&nbsp;setOnSetup(<a href="../../../datafu/hourglass/jobs/Setup.html" title="interface in datafu.hourglass.jobs">Setup</a>&nbsp;setup)</pre>
+<div class="block">Set callback to provide custom configuration before job begins execution.</div>
+<dl><dt><span class="strong">Parameters:</span></dt><dd><code>setup</code> - object with callback method</dd></dl>
+</li>
+</ul>
+<a name="config(org.apache.hadoop.conf.Configuration)">
+<!--   -->
+</a>
+<ul class="blockListLast">
+<li class="blockList">
+<h4>config</h4>
+<pre>public&nbsp;void&nbsp;config(org.apache.hadoop.conf.Configuration&nbsp;conf)</pre>
+<div class="block"><strong>Description copied from class:&nbsp;<code><a href="../../../datafu/hourglass/jobs/AbstractJob.html#config(org.apache.hadoop.conf.Configuration)">AbstractJob</a></code></strong></div>
+<div class="block">Overridden to provide custom configuration before the job starts.</div>
+<dl>
+<dt><strong>Overrides:</strong></dt>
+<dd><code><a href="../../../datafu/hourglass/jobs/AbstractJob.html#config(org.apache.hadoop.conf.Configuration)">config</a></code>&nbsp;in class&nbsp;<code><a href="../../../datafu/hourglass/jobs/AbstractJob.html" title="class in datafu.hourglass.jobs">AbstractJob</a></code></dd>
+<dt><span class="strong">Parameters:</span></dt><dd><code>conf</code> - configuration</dd></dl>
+</li>
+</ul>
+</li>
+</ul>
+</li>
+</ul>
+</div>
+</div>
+<!-- ========= END OF CLASS DATA ========= -->
+<!-- ======= START OF BOTTOM NAVBAR ====== -->
+<div class="bottomNav"><a name="navbar_bottom">
+<!--   -->
+</a><a href="#skip-navbar_bottom" title="Skip navigation links"></a><a name="navbar_bottom_firstrow">
+<!--   -->
+</a>
+<ul class="navList" title="Navigation">
+<li><a href="../../../overview-summary.html">Overview</a></li>
+<li><a href="package-summary.html">Package</a></li>
+<li class="navBarCell1Rev">Class</li>
+<li><a href="package-tree.html">Tree</a></li>
+<li><a href="../../../deprecated-list.html">Deprecated</a></li>
+<li><a href="../../../index-all.html">Index</a></li>
+<li><a href="../../../help-doc.html">Help</a></li>
+</ul>
+</div>
+<div class="subNav">
+<ul class="navList">
+<li><a href="../../../datafu/hourglass/jobs/PartitionCollapsingExecutionPlanner.html" title="class in datafu.hourglass.jobs"><span class="strong">Prev Class</span></a></li>
+<li><a href="../../../datafu/hourglass/jobs/PartitionPreservingExecutionPlanner.html" title="class in datafu.hourglass.jobs"><span class="strong">Next Class</span></a></li>
+</ul>
+<ul class="navList">
+<li><a href="../../../index.html?datafu/hourglass/jobs/PartitionCollapsingIncrementalJob.html" target="_top">Frames</a></li>
+<li><a href="PartitionCollapsingIncrementalJob.html" target="_top">No Frames</a></li>
+</ul>
+<ul class="navList" id="allclasses_navbar_bottom">
+<li><a href="../../../allclasses-noframe.html">All Classes</a></li>
+</ul>
+<div>
+<script type="text/javascript"><!--
+  allClassesLink = document.getElementById("allclasses_navbar_bottom");
+  if(window==top) {
+    allClassesLink.style.display = "block";
+  }
+  else {
+    allClassesLink.style.display = "none";
+  }
+  //-->
+</script>
+</div>
+<div>
+<ul class="subNavList">
+<li>Summary:&nbsp;</li>
+<li><a href="#nested_classes_inherited_from_class_datafu.hourglass.jobs.AbstractPartitionCollapsingIncrementalJob">Nested</a>&nbsp;|&nbsp;</li>
+<li><a href="#fields_inherited_from_class_datafu.hourglass.jobs.AbstractPartitionCollapsingIncrementalJob">Field</a>&nbsp;|&nbsp;</li>
+<li><a href="#constructor_summary">Constr</a>&nbsp;|&nbsp;</li>
+<li><a href="#method_summary">Method</a></li>
+</ul>
+<ul class="subNavList">
+<li>Detail:&nbsp;</li>
+<li>Field&nbsp;|&nbsp;</li>
+<li><a href="#constructor_detail">Constr</a>&nbsp;|&nbsp;</li>
+<li><a href="#method_detail">Method</a></li>
+</ul>
+</div>
+<a name="skip-navbar_bottom">
+<!--   -->
+</a></div>
+<!-- ======== END OF BOTTOM NAVBAR ======= -->
+</body>
+</html>



Mime
View raw message