blob: 30e8ba18773a282ab8d6169a3912803b26fb5624 [file] [log] [blame]
<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
<!-- NewPage -->
<html lang="en">
<head>
<!-- Generated by javadoc (1.8.0_181-google-v7) on Wed Aug 14 17:37:13 PDT 2019 -->
<title>Watch (Apache Beam 2.15.0-SNAPSHOT)</title>
<meta name="date" content="2019-08-14">
<link rel="stylesheet" type="text/css" href="../../../../../stylesheet.css" title="Style">
<script type="text/javascript" src="../../../../../script.js"></script>
</head>
<body>
<script type="text/javascript"><!--
try {
if (location.href.indexOf('is-external=true') == -1) {
parent.document.title="Watch (Apache Beam 2.15.0-SNAPSHOT)";
}
}
catch(err) {
}
//-->
var methods = {"i0":9,"i1":9,"i2":9};
var tabs = {65535:["t0","All Methods"],1:["t1","Static Methods"],8:["t4","Concrete Methods"]};
var altColor = "altColor";
var rowColor = "rowColor";
var tableTab = "tableTab";
var activeTableTab = "activeTableTab";
</script>
<noscript>
<div>JavaScript is disabled on your browser.</div>
</noscript>
<!-- ========= START OF TOP NAVBAR ======= -->
<div class="topNav"><a name="navbar.top">
<!-- -->
</a>
<div class="skipNav"><a href="#skip.navbar.top" title="Skip navigation links">Skip navigation links</a></div>
<a name="navbar.top.firstrow">
<!-- -->
</a>
<ul class="navList" title="Navigation">
<li><a href="../../../../../overview-summary.html">Overview</a></li>
<li><a href="package-summary.html">Package</a></li>
<li class="navBarCell1Rev">Class</li>
<li><a href="package-tree.html">Tree</a></li>
<li><a href="../../../../../deprecated-list.html">Deprecated</a></li>
<li><a href="../../../../../index-all.html">Index</a></li>
<li><a href="../../../../../help-doc.html">Help</a></li>
</ul>
</div>
<div class="subNav">
<ul class="navList">
<li><a href="../../../../../org/apache/beam/sdk/transforms/Wait.OnSignal.html" title="class in org.apache.beam.sdk.transforms"><span class="typeNameLink">Prev&nbsp;Class</span></a></li>
<li><a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.html" title="class in org.apache.beam.sdk.transforms"><span class="typeNameLink">Next&nbsp;Class</span></a></li>
</ul>
<ul class="navList">
<li><a href="../../../../../index.html?org/apache/beam/sdk/transforms/Watch.html" target="_top">Frames</a></li>
<li><a href="Watch.html" target="_top">No&nbsp;Frames</a></li>
</ul>
<ul class="navList" id="allclasses_navbar_top">
<li><a href="../../../../../allclasses-noframe.html">All&nbsp;Classes</a></li>
</ul>
<div>
<script type="text/javascript"><!--
allClassesLink = document.getElementById("allclasses_navbar_top");
if(window==top) {
allClassesLink.style.display = "block";
}
else {
allClassesLink.style.display = "none";
}
//-->
</script>
</div>
<div>
<ul class="subNavList">
<li>Summary:&nbsp;</li>
<li><a href="#nested.class.summary">Nested</a>&nbsp;|&nbsp;</li>
<li>Field&nbsp;|&nbsp;</li>
<li><a href="#constructor.summary">Constr</a>&nbsp;|&nbsp;</li>
<li><a href="#method.summary">Method</a></li>
</ul>
<ul class="subNavList">
<li>Detail:&nbsp;</li>
<li>Field&nbsp;|&nbsp;</li>
<li><a href="#constructor.detail">Constr</a>&nbsp;|&nbsp;</li>
<li><a href="#method.detail">Method</a></li>
</ul>
</div>
<a name="skip.navbar.top">
<!-- -->
</a></div>
<!-- ========= END OF TOP NAVBAR ========= -->
<!-- ======== START OF CLASS DATA ======== -->
<div class="header">
<div class="subTitle">org.apache.beam.sdk.transforms</div>
<h2 title="Class Watch" class="title">Class Watch</h2>
</div>
<div class="contentContainer">
<ul class="inheritance">
<li>java.lang.Object</li>
<li>
<ul class="inheritance">
<li>org.apache.beam.sdk.transforms.Watch</li>
</ul>
</li>
</ul>
<div class="description">
<ul class="blockList">
<li class="blockList">
<hr>
<br>
<pre><a href="../../../../../org/apache/beam/sdk/annotations/Experimental.html" title="annotation in org.apache.beam.sdk.annotations">@Experimental</a>(<a href="../../../../../org/apache/beam/sdk/annotations/Experimental.html#value--">value</a>=<a href="../../../../../org/apache/beam/sdk/annotations/Experimental.Kind.html#SPLITTABLE_DO_FN">SPLITTABLE_DO_FN</a>)
public class <span class="typeNameLabel">Watch</span>
extends java.lang.Object</pre>
<div class="block">Given a "poll function" that produces a potentially growing set of outputs for an input, this
transform continuously and simultaneously watches the growth of the output sets of all inputs, until a
per-input termination condition is reached.
<p>The output is returned as an unbounded <a href="../../../../../org/apache/beam/sdk/values/PCollection.html" title="class in org.apache.beam.sdk.values"><code>PCollection</code></a> of <code>KV&lt;InputT, OutputT&gt;</code>,
where each <code>OutputT</code> is associated with the <code>InputT</code> that produced it, and is
assigned the timestamp that the poll function returned when this output was detected for the
first time.
<p>Hypothetical usage example for watching new files in a collection of directories, where for
each directory we assume that new files will not appear if the directory contains a file named
".complete":
<pre><code>
PCollection&lt;String&gt; directories = ...; // E.g. Create.of(single directory)
PCollection&lt;KV&lt;String, String&gt;&gt; matches = directories.apply(Watch.&lt;String, String&gt;growthOf(
new PollFn&lt;String, String&gt;() {
public PollResult&lt;String&gt; apply(TimestampedValue&lt;String&gt; input) {
String directory = input.getValue();
List&lt;TimestampedValue&lt;String&gt;&gt; outputs = new ArrayList&lt;&gt;();
... List the directory and get creation times of all files ...
boolean isComplete = ... does a file ".complete" exist in the directory ...
return isComplete ? PollResult.complete(outputs) : PollResult.incomplete(outputs);
}
})
// Poll each directory every 5 seconds
.withPollInterval(Duration.standardSeconds(5))
// Stop watching each directory 12 hours after it's seen even if it's incomplete
.withTerminationPerInput(afterTotalOf(Duration.standardHours(12))));
</code></pre>
<p>By default, the watermark for a particular input is computed from a poll result as "earliest
timestamp of new elements in this poll result". It can also be set explicitly via <a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.PollResult.html#withWatermark-org.joda.time.Instant-"><code>Watch.Growth.PollResult.withWatermark(org.joda.time.Instant)</code></a> if the <a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.PollFn.html" title="class in org.apache.beam.sdk.transforms"><code>Watch.Growth.PollFn</code></a> can provide a more optimistic
estimate.
<p>Note: This transform works only in runners supporting Splittable DoFn: see <a
href="https://beam.apache.org/documentation/runners/capability-matrix/">capability matrix</a>.</div>
</li>
</ul>
</div>
<div class="summary">
<ul class="blockList">
<li class="blockList">
<!-- ======== NESTED CLASS SUMMARY ======== -->
<ul class="blockList">
<li class="blockList"><a name="nested.class.summary">
<!-- -->
</a>
<h3>Nested Class Summary</h3>
<table class="memberSummary" border="0" cellpadding="3" cellspacing="0" summary="Nested Class Summary table, listing nested classes, and an explanation">
<caption><span>Nested Classes</span><span class="tabEnd">&nbsp;</span></caption>
<tr>
<th class="colFirst" scope="col">Modifier and Type</th>
<th class="colLast" scope="col">Class and Description</th>
</tr>
<tr class="altColor">
<td class="colFirst"><code>static class&nbsp;</code></td>
<td class="colLast"><code><span class="memberNameLink"><a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.html" title="class in org.apache.beam.sdk.transforms">Watch.Growth</a>&lt;<a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.html" title="type parameter in Watch.Growth">InputT</a>,<a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.html" title="type parameter in Watch.Growth">OutputT</a>,<a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.html" title="type parameter in Watch.Growth">KeyT</a>&gt;</span></code>
<div class="block">Implementation of <a href="../../../../../org/apache/beam/sdk/transforms/Watch.html#growthOf-org.apache.beam.sdk.transforms.Watch.Growth.PollFn-org.apache.beam.sdk.transforms.Requirements-"><code>growthOf(org.apache.beam.sdk.transforms.Watch.Growth.PollFn&lt;InputT, OutputT&gt;, org.apache.beam.sdk.transforms.Requirements)</code></a>.</div>
</td>
</tr>
</table>
</li>
</ul>
<!-- ======== CONSTRUCTOR SUMMARY ======== -->
<ul class="blockList">
<li class="blockList"><a name="constructor.summary">
<!-- -->
</a>
<h3>Constructor Summary</h3>
<table class="memberSummary" border="0" cellpadding="3" cellspacing="0" summary="Constructor Summary table, listing constructors, and an explanation">
<caption><span>Constructors</span><span class="tabEnd">&nbsp;</span></caption>
<tr>
<th class="colOne" scope="col">Constructor and Description</th>
</tr>
<tr class="altColor">
<td class="colOne"><code><span class="memberNameLink"><a href="../../../../../org/apache/beam/sdk/transforms/Watch.html#Watch--">Watch</a></span>()</code>&nbsp;</td>
</tr>
</table>
</li>
</ul>
<!-- ========== METHOD SUMMARY =========== -->
<ul class="blockList">
<li class="blockList"><a name="method.summary">
<!-- -->
</a>
<h3>Method Summary</h3>
<table class="memberSummary" border="0" cellpadding="3" cellspacing="0" summary="Method Summary table, listing methods, and an explanation">
<caption><span id="t0" class="activeTableTab"><span>All Methods</span><span class="tabEnd">&nbsp;</span></span><span id="t1" class="tableTab"><span><a href="javascript:show(1);">Static Methods</a></span><span class="tabEnd">&nbsp;</span></span><span id="t4" class="tableTab"><span><a href="javascript:show(8);">Concrete Methods</a></span><span class="tabEnd">&nbsp;</span></span></caption>
<tr>
<th class="colFirst" scope="col">Modifier and Type</th>
<th class="colLast" scope="col">Method and Description</th>
</tr>
<tr id="i0" class="altColor">
<td class="colFirst"><code>static &lt;InputT,OutputT,KeyT&gt;<br><a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.html" title="class in org.apache.beam.sdk.transforms">Watch.Growth</a>&lt;InputT,OutputT,KeyT&gt;</code></td>
<td class="colLast"><code><span class="memberNameLink"><a href="../../../../../org/apache/beam/sdk/transforms/Watch.html#growthOf-org.apache.beam.sdk.transforms.Contextful-org.apache.beam.sdk.transforms.SerializableFunction-">growthOf</a></span>(<a href="../../../../../org/apache/beam/sdk/transforms/Contextful.html" title="class in org.apache.beam.sdk.transforms">Contextful</a>&lt;<a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.PollFn.html" title="class in org.apache.beam.sdk.transforms">Watch.Growth.PollFn</a>&lt;InputT,OutputT&gt;&gt;&nbsp;pollFn,
<a href="../../../../../org/apache/beam/sdk/transforms/SerializableFunction.html" title="interface in org.apache.beam.sdk.transforms">SerializableFunction</a>&lt;OutputT,KeyT&gt;&nbsp;outputKeyFn)</code>
<div class="block">Watches the growth of the given poll function, using the given "key function" to deduplicate
outputs.</div>
</td>
</tr>
<tr id="i1" class="rowColor">
<td class="colFirst"><code>static &lt;InputT,OutputT&gt;<br><a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.html" title="class in org.apache.beam.sdk.transforms">Watch.Growth</a>&lt;InputT,OutputT,OutputT&gt;</code></td>
<td class="colLast"><code><span class="memberNameLink"><a href="../../../../../org/apache/beam/sdk/transforms/Watch.html#growthOf-org.apache.beam.sdk.transforms.Watch.Growth.PollFn-">growthOf</a></span>(<a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.PollFn.html" title="class in org.apache.beam.sdk.transforms">Watch.Growth.PollFn</a>&lt;InputT,OutputT&gt;&nbsp;pollFn)</code>
<div class="block">Watches the growth of the given poll function.</div>
</td>
</tr>
<tr id="i2" class="altColor">
<td class="colFirst"><code>static &lt;InputT,OutputT&gt;<br><a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.html" title="class in org.apache.beam.sdk.transforms">Watch.Growth</a>&lt;InputT,OutputT,OutputT&gt;</code></td>
<td class="colLast"><code><span class="memberNameLink"><a href="../../../../../org/apache/beam/sdk/transforms/Watch.html#growthOf-org.apache.beam.sdk.transforms.Watch.Growth.PollFn-org.apache.beam.sdk.transforms.Requirements-">growthOf</a></span>(<a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.PollFn.html" title="class in org.apache.beam.sdk.transforms">Watch.Growth.PollFn</a>&lt;InputT,OutputT&gt;&nbsp;pollFn,
<a href="../../../../../org/apache/beam/sdk/transforms/Requirements.html" title="class in org.apache.beam.sdk.transforms">Requirements</a>&nbsp;requirements)</code>
<div class="block">Watches the growth of the given poll function.</div>
</td>
</tr>
</table>
<ul class="blockList">
<li class="blockList"><a name="methods.inherited.from.class.java.lang.Object">
<!-- -->
</a>
<h3>Methods inherited from class&nbsp;java.lang.Object</h3>
<code>clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait</code></li>
</ul>
</li>
</ul>
</li>
</ul>
</div>
<div class="details">
<ul class="blockList">
<li class="blockList">
<!-- ========= CONSTRUCTOR DETAIL ======== -->
<ul class="blockList">
<li class="blockList"><a name="constructor.detail">
<!-- -->
</a>
<h3>Constructor Detail</h3>
<a name="Watch--">
<!-- -->
</a>
<ul class="blockListLast">
<li class="blockList">
<h4>Watch</h4>
<pre>public&nbsp;Watch()</pre>
</li>
</ul>
</li>
</ul>
<!-- ============ METHOD DETAIL ========== -->
<ul class="blockList">
<li class="blockList"><a name="method.detail">
<!-- -->
</a>
<h3>Method Detail</h3>
<a name="growthOf-org.apache.beam.sdk.transforms.Watch.Growth.PollFn-org.apache.beam.sdk.transforms.Requirements-">
<!-- -->
</a>
<ul class="blockList">
<li class="blockList">
<h4>growthOf</h4>
<pre>public static&nbsp;&lt;InputT,OutputT&gt;&nbsp;<a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.html" title="class in org.apache.beam.sdk.transforms">Watch.Growth</a>&lt;InputT,OutputT,OutputT&gt;&nbsp;growthOf(<a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.PollFn.html" title="class in org.apache.beam.sdk.transforms">Watch.Growth.PollFn</a>&lt;InputT,OutputT&gt;&nbsp;pollFn,
<a href="../../../../../org/apache/beam/sdk/transforms/Requirements.html" title="class in org.apache.beam.sdk.transforms">Requirements</a>&nbsp;requirements)</pre>
<div class="block">Watches the growth of the given poll function. See class documentation for more details.</div>
</li>
</ul>
<a name="growthOf-org.apache.beam.sdk.transforms.Watch.Growth.PollFn-">
<!-- -->
</a>
<ul class="blockList">
<li class="blockList">
<h4>growthOf</h4>
<pre>public static&nbsp;&lt;InputT,OutputT&gt;&nbsp;<a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.html" title="class in org.apache.beam.sdk.transforms">Watch.Growth</a>&lt;InputT,OutputT,OutputT&gt;&nbsp;growthOf(<a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.PollFn.html" title="class in org.apache.beam.sdk.transforms">Watch.Growth.PollFn</a>&lt;InputT,OutputT&gt;&nbsp;pollFn)</pre>
<div class="block">Watches the growth of the given poll function. See class documentation for more details.</div>
</li>
</ul>
<a name="growthOf-org.apache.beam.sdk.transforms.Contextful-org.apache.beam.sdk.transforms.SerializableFunction-">
<!-- -->
</a>
<ul class="blockListLast">
<li class="blockList">
<h4>growthOf</h4>
<pre>public static&nbsp;&lt;InputT,OutputT,KeyT&gt;&nbsp;<a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.html" title="class in org.apache.beam.sdk.transforms">Watch.Growth</a>&lt;InputT,OutputT,KeyT&gt;&nbsp;growthOf(<a href="../../../../../org/apache/beam/sdk/transforms/Contextful.html" title="class in org.apache.beam.sdk.transforms">Contextful</a>&lt;<a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.PollFn.html" title="class in org.apache.beam.sdk.transforms">Watch.Growth.PollFn</a>&lt;InputT,OutputT&gt;&gt;&nbsp;pollFn,
<a href="../../../../../org/apache/beam/sdk/transforms/SerializableFunction.html" title="interface in org.apache.beam.sdk.transforms">SerializableFunction</a>&lt;OutputT,KeyT&gt;&nbsp;outputKeyFn)</pre>
<div class="block">Watches the growth of the given poll function, using the given "key function" to deduplicate
outputs. For example, if OutputT is a filename + file size, this can be a function that returns
just the filename, so that if the same file is observed multiple times with different sizes,
only the first observation is emitted.
<p>By default, this is the identity function, i.e. the output is used as its own key.</div>
</li>
</ul>
</li>
</ul>
</li>
</ul>
</div>
</div>
<!-- ========= END OF CLASS DATA ========= -->
<!-- ======= START OF BOTTOM NAVBAR ====== -->
<div class="bottomNav"><a name="navbar.bottom">
<!-- -->
</a>
<div class="skipNav"><a href="#skip.navbar.bottom" title="Skip navigation links">Skip navigation links</a></div>
<a name="navbar.bottom.firstrow">
<!-- -->
</a>
<ul class="navList" title="Navigation">
<li><a href="../../../../../overview-summary.html">Overview</a></li>
<li><a href="package-summary.html">Package</a></li>
<li class="navBarCell1Rev">Class</li>
<li><a href="package-tree.html">Tree</a></li>
<li><a href="../../../../../deprecated-list.html">Deprecated</a></li>
<li><a href="../../../../../index-all.html">Index</a></li>
<li><a href="../../../../../help-doc.html">Help</a></li>
</ul>
</div>
<div class="subNav">
<ul class="navList">
<li><a href="../../../../../org/apache/beam/sdk/transforms/Wait.OnSignal.html" title="class in org.apache.beam.sdk.transforms"><span class="typeNameLink">Prev&nbsp;Class</span></a></li>
<li><a href="../../../../../org/apache/beam/sdk/transforms/Watch.Growth.html" title="class in org.apache.beam.sdk.transforms"><span class="typeNameLink">Next&nbsp;Class</span></a></li>
</ul>
<ul class="navList">
<li><a href="../../../../../index.html?org/apache/beam/sdk/transforms/Watch.html" target="_top">Frames</a></li>
<li><a href="Watch.html" target="_top">No&nbsp;Frames</a></li>
</ul>
<ul class="navList" id="allclasses_navbar_bottom">
<li><a href="../../../../../allclasses-noframe.html">All&nbsp;Classes</a></li>
</ul>
<div>
<script type="text/javascript"><!--
allClassesLink = document.getElementById("allclasses_navbar_bottom");
if(window==top) {
allClassesLink.style.display = "block";
}
else {
allClassesLink.style.display = "none";
}
//-->
</script>
</div>
<div>
<ul class="subNavList">
<li>Summary:&nbsp;</li>
<li><a href="#nested.class.summary">Nested</a>&nbsp;|&nbsp;</li>
<li>Field&nbsp;|&nbsp;</li>
<li><a href="#constructor.summary">Constr</a>&nbsp;|&nbsp;</li>
<li><a href="#method.summary">Method</a></li>
</ul>
<ul class="subNavList">
<li>Detail:&nbsp;</li>
<li>Field&nbsp;|&nbsp;</li>
<li><a href="#constructor.detail">Constr</a>&nbsp;|&nbsp;</li>
<li><a href="#method.detail">Method</a></li>
</ul>
</div>
<a name="skip.navbar.bottom">
<!-- -->
</a></div>
<!-- ======== END OF BOTTOM NAVBAR ======= -->
</body>
</html>