<!-- blob: 051f8ff8b484d1a43778d7ce316036cd20a67522 [file] [log] [blame] -->
<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
<!-- NewPage -->
<html lang="en">
<head>
<!-- Generated by javadoc -->
<title>DynamoDBIO (Apache Beam 2.38.0-SNAPSHOT)</title>
<link rel="stylesheet" type="text/css" href="../../../../../../../stylesheet.css" title="Style">
<script type="text/javascript" src="../../../../../../../script.js"></script>
</head>
<body>
<script type="text/javascript"><!--
try {
if (location.href.indexOf('is-external=true') == -1) {
parent.document.title="DynamoDBIO (Apache Beam 2.38.0-SNAPSHOT)";
}
}
catch(err) {
}
//-->
var methods = {"i0":9,"i1":9};
var tabs = {65535:["t0","All Methods"],1:["t1","Static Methods"],8:["t4","Concrete Methods"]};
var altColor = "altColor";
var rowColor = "rowColor";
var tableTab = "tableTab";
var activeTableTab = "activeTableTab";
</script>
<noscript>
<div>JavaScript is disabled on your browser.</div>
</noscript>
<!-- ========= START OF TOP NAVBAR ======= -->
<div class="topNav"><a name="navbar.top">
<!-- -->
</a>
<div class="skipNav"><a href="#skip.navbar.top" title="Skip navigation links">Skip navigation links</a></div>
<a name="navbar.top.firstrow">
<!-- -->
</a>
<ul class="navList" title="Navigation">
<li><a href="../../../../../../../overview-summary.html">Overview</a></li>
<li><a href="package-summary.html">Package</a></li>
<li class="navBarCell1Rev">Class</li>
<li><a href="package-tree.html">Tree</a></li>
<li><a href="../../../../../../../deprecated-list.html">Deprecated</a></li>
<li><a href="../../../../../../../index-all.html">Index</a></li>
<li><a href="../../../../../../../help-doc.html">Help</a></li>
</ul>
</div>
<div class="subNav">
<ul class="navList">
<li><a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDbClientProvider.html" title="interface in org.apache.beam.sdk.io.aws2.dynamodb"><span class="typeNameLink">Prev&nbsp;Class</span></a></li>
<li><a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.Read.html" title="class in org.apache.beam.sdk.io.aws2.dynamodb"><span class="typeNameLink">Next&nbsp;Class</span></a></li>
</ul>
<ul class="navList">
<li><a href="../../../../../../../index.html?org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.html" target="_top">Frames</a></li>
<li><a href="DynamoDBIO.html" target="_top">No&nbsp;Frames</a></li>
</ul>
<ul class="navList" id="allclasses_navbar_top">
<li><a href="../../../../../../../allclasses-noframe.html">All&nbsp;Classes</a></li>
</ul>
<div>
<script type="text/javascript"><!--
allClassesLink = document.getElementById("allclasses_navbar_top");
if(window==top) {
allClassesLink.style.display = "block";
}
else {
allClassesLink.style.display = "none";
}
//-->
</script>
</div>
<div>
<ul class="subNavList">
<li>Summary:&nbsp;</li>
<li><a href="#nested.class.summary">Nested</a>&nbsp;|&nbsp;</li>
<li>Field&nbsp;|&nbsp;</li>
<li><a href="#constructor.summary">Constr</a>&nbsp;|&nbsp;</li>
<li><a href="#method.summary">Method</a></li>
</ul>
<ul class="subNavList">
<li>Detail:&nbsp;</li>
<li>Field&nbsp;|&nbsp;</li>
<li><a href="#constructor.detail">Constr</a>&nbsp;|&nbsp;</li>
<li><a href="#method.detail">Method</a></li>
</ul>
</div>
<a name="skip.navbar.top">
<!-- -->
</a></div>
<!-- ========= END OF TOP NAVBAR ========= -->
<!-- ======== START OF CLASS DATA ======== -->
<div class="header">
<div class="subTitle">org.apache.beam.sdk.io.aws2.dynamodb</div>
<h2 title="Class DynamoDBIO" class="title">Class DynamoDBIO</h2>
</div>
<div class="contentContainer">
<ul class="inheritance">
<li>java.lang.Object</li>
<li>
<ul class="inheritance">
<li>org.apache.beam.sdk.io.aws2.dynamodb.DynamoDBIO</li>
</ul>
</li>
</ul>
<div class="description">
<ul class="blockList">
<li class="blockList">
<hr>
<br>
<pre><a href="../../../../../../../org/apache/beam/sdk/annotations/Experimental.html" title="annotation in org.apache.beam.sdk.annotations">@Experimental</a>(<a href="../../../../../../../org/apache/beam/sdk/annotations/Experimental.html#value--">value</a>=<a href="../../../../../../../org/apache/beam/sdk/annotations/Experimental.Kind.html#SOURCE_SINK">SOURCE_SINK</a>)
public final class <span class="typeNameLabel">DynamoDBIO</span>
extends java.lang.Object</pre>
<div class="block">IO to read from and write to <a href="https://aws.amazon.com/dynamodb/">DynamoDB</a> tables.
<h3>Reading from DynamoDB</h3>
<p>Example usage:
<pre><code>
PCollection&lt;List&lt;Map&lt;String, AttributeValue&gt;&gt;&gt; output =
pipeline.apply(
DynamoDBIO.&lt;List&lt;Map&lt;String, AttributeValue&gt;&gt;&gt;read()
.withScanRequestFn(in -&gt; ScanRequest.builder().tableName(tableName).totalSegments(1).build())
.items()); // ScanResponse items mapper
</code></pre>
<p>At a minimum you have to provide:
<ul>
<li>a <code>scanRequestFn</code> providing the <a href="https://static.javadoc.io/software.amazon.awssdk/dynamodb/2.17.127/software/amazon/awssdk/services/dynamodb/model/ScanRequest.html?is-external=true" title="class or interface in software.amazon.awssdk.services.dynamodb.model"><code>ScanRequest</code></a> instance; <code>table name</code> and
<code>total segments</code> are required. Note: Choose <code>total segments</code> according to the
number of workers used.
<li>a <code>scanResponseMapperFn</code> to map the <a href="https://static.javadoc.io/software.amazon.awssdk/dynamodb/2.17.127/software/amazon/awssdk/services/dynamodb/model/ScanResponse.html?is-external=true" title="class or interface in software.amazon.awssdk.services.dynamodb.model"><code>ScanResponse</code></a> to the expected output type,
such as <a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.Read.html#items--"><code>DynamoDBIO.Read.items()</code></a>.
</ul>
<h3>Writing to DynamoDB</h3>
<p>Example usage:
<pre><code>
PCollection&lt;T&gt; data = ...;
SerializableFunction&lt;T, WriteRequest&gt; requestBuilder = ...;
data.apply(
DynamoDBIO.&lt;WriteRequest&gt;write()
.withWriteRequestMapperFn(t -&gt; KV.of(tableName, requestBuilder.apply(t))));
</code></pre>
<p>At a minimum you have to provide a <code>writeRequestMapperFn</code> to map each element into a
<a href="../../../../../../../org/apache/beam/sdk/values/KV.html" title="class in org.apache.beam.sdk.values"><code>KV</code></a> of <code>table name</code> and <a href="https://static.javadoc.io/software.amazon.awssdk/dynamodb/2.17.127/software/amazon/awssdk/services/dynamodb/model/WriteRequest.html?is-external=true" title="class or interface in software.amazon.awssdk.services.dynamodb.model"><code>WriteRequest</code></a>.
<p><b>Note:</b> AWS does not allow writing duplicate keys within a single batch operation. If
primary keys possibly repeat in your stream (i.e. an upsert stream), you may encounter a
<code>ValidationError</code>. To address this you have to provide the key names corresponding to your
primary key using <a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.Write.html#withDeduplicateKeys-java.util.List-"><code>DynamoDBIO.Write.withDeduplicateKeys(List)</code></a>. Based on these keys only the last
observed element is kept. Nevertheless, if no deduplication keys are provided, identical elements
are still deduplicated.
<h3>Configuration of AWS clients</h3>
<p>AWS clients for all AWS IOs can be configured using <a href="../../../../../../../org/apache/beam/sdk/io/aws2/options/AwsOptions.html" title="interface in org.apache.beam.sdk.io.aws2.options"><code>AwsOptions</code></a>, e.g. <code>--awsRegion=us-west-1</code>. <a href="../../../../../../../org/apache/beam/sdk/io/aws2/options/AwsOptions.html" title="interface in org.apache.beam.sdk.io.aws2.options"><code>AwsOptions</code></a> contains reasonable defaults based on default providers
for <a href="https://static.javadoc.io/software.amazon.awssdk/regions/2.17.127/software/amazon/awssdk/regions/Region.html?is-external=true" title="class or interface in software.amazon.awssdk.regions"><code>Region</code></a> and <a href="https://static.javadoc.io/software.amazon.awssdk/auth/2.17.127/software/amazon/awssdk/auth/credentials/AwsCredentialsProvider.html?is-external=true" title="class or interface in software.amazon.awssdk.auth.credentials"><code>AwsCredentialsProvider</code></a>.
<p>If you require more advanced configuration, you may change the <a href="../../../../../../../org/apache/beam/sdk/io/aws2/common/ClientBuilderFactory.html" title="interface in org.apache.beam.sdk.io.aws2.common"><code>ClientBuilderFactory</code></a>
using <a href="../../../../../../../org/apache/beam/sdk/io/aws2/options/AwsOptions.html#setClientBuilderFactory-java.lang.Class-"><code>AwsOptions.setClientBuilderFactory(Class)</code></a>.
<p>Configuration for a specific IO can be overridden using <code>withClientConfiguration()</code>,
which also allows configuring the retry behavior for the respective IO.
<h4>Retries</h4>
<p>Retries for failed requests can be configured using <code>ClientConfiguration.Builder#retry(Consumer)</code> and are handled by the AWS SDK unless there's a
partial success (batch requests). The SDK uses a backoff strategy with equal jitter for computing
the delay before the next retry.
<p><b>Note:</b> Once retries are exhausted the error is surfaced to the runner, which <em>may</em>
then opt to retry the current partition in its entirety or abort if the runner's maximum number of
retries is reached.</div>
</li>
</ul>
</div>
<div class="summary">
<ul class="blockList">
<li class="blockList">
<!-- ======== NESTED CLASS SUMMARY ======== -->
<ul class="blockList">
<li class="blockList"><a name="nested.class.summary">
<!-- -->
</a>
<h3>Nested Class Summary</h3>
<table class="memberSummary" border="0" cellpadding="3" cellspacing="0" summary="Nested Class Summary table, listing nested classes, and an explanation">
<caption><span>Nested Classes</span><span class="tabEnd">&nbsp;</span></caption>
<tr>
<th class="colFirst" scope="col">Modifier and Type</th>
<th class="colLast" scope="col">Class and Description</th>
</tr>
<tr class="altColor">
<td class="colFirst"><code>static class&nbsp;</code></td>
<td class="colLast"><code><span class="memberNameLink"><a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.Read.html" title="class in org.apache.beam.sdk.io.aws2.dynamodb">DynamoDBIO.Read</a>&lt;<a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.Read.html" title="type parameter in DynamoDBIO.Read">T</a>&gt;</span></code>
<div class="block">Read data from DynamoDB using <a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.Read.html#getScanRequestFn--"><code>DynamoDBIO.Read.getScanRequestFn()</code></a> and emit an element of type <code>T</code>
for each <a href="https://static.javadoc.io/software.amazon.awssdk/dynamodb/2.17.127/software/amazon/awssdk/services/dynamodb/model/ScanResponse.html?is-external=true" title="class or interface in software.amazon.awssdk.services.dynamodb.model"><code>ScanResponse</code></a> using the mapping function <a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.Read.html#getScanResponseMapperFn--"><code>DynamoDBIO.Read.getScanResponseMapperFn()</code></a>.</div>
</td>
</tr>
<tr class="rowColor">
<td class="colFirst"><code>static class&nbsp;</code></td>
<td class="colLast"><code><span class="memberNameLink"><a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.RetryConfiguration.html" title="class in org.apache.beam.sdk.io.aws2.dynamodb">DynamoDBIO.RetryConfiguration</a></span></code>
<div class="block"><span class="deprecatedLabel">Deprecated.</span>&nbsp;
<div class="block"><span class="deprecationComment">Use <a href="../../../../../../../org/apache/beam/sdk/io/aws2/common/RetryConfiguration.html" title="class in org.apache.beam.sdk.io.aws2.common"><code>RetryConfiguration</code></a> instead to
delegate retries to the AWS SDK.</span></div>
</div>
</td>
</tr>
<tr class="altColor">
<td class="colFirst"><code>static class&nbsp;</code></td>
<td class="colLast"><code><span class="memberNameLink"><a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.Write.html" title="class in org.apache.beam.sdk.io.aws2.dynamodb">DynamoDBIO.Write</a>&lt;<a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.Write.html" title="type parameter in DynamoDBIO.Write">T</a>&gt;</span></code>
<div class="block">Write a <code>PCollection&lt;T&gt;</code> of data into DynamoDB.</div>
</td>
</tr>
</table>
</li>
</ul>
<!-- ======== CONSTRUCTOR SUMMARY ======== -->
<ul class="blockList">
<li class="blockList"><a name="constructor.summary">
<!-- -->
</a>
<h3>Constructor Summary</h3>
<table class="memberSummary" border="0" cellpadding="3" cellspacing="0" summary="Constructor Summary table, listing constructors, and an explanation">
<caption><span>Constructors</span><span class="tabEnd">&nbsp;</span></caption>
<tr>
<th class="colOne" scope="col">Constructor and Description</th>
</tr>
<tr class="altColor">
<td class="colOne"><code><span class="memberNameLink"><a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.html#DynamoDBIO--">DynamoDBIO</a></span>()</code>&nbsp;</td>
</tr>
</table>
</li>
</ul>
<!-- ========== METHOD SUMMARY =========== -->
<ul class="blockList">
<li class="blockList"><a name="method.summary">
<!-- -->
</a>
<h3>Method Summary</h3>
<table class="memberSummary" border="0" cellpadding="3" cellspacing="0" summary="Method Summary table, listing methods, and an explanation">
<caption><span id="t0" class="activeTableTab"><span>All Methods</span><span class="tabEnd">&nbsp;</span></span><span id="t1" class="tableTab"><span><a href="javascript:show(1);">Static Methods</a></span><span class="tabEnd">&nbsp;</span></span><span id="t4" class="tableTab"><span><a href="javascript:show(8);">Concrete Methods</a></span><span class="tabEnd">&nbsp;</span></span></caption>
<tr>
<th class="colFirst" scope="col">Modifier and Type</th>
<th class="colLast" scope="col">Method and Description</th>
</tr>
<tr id="i0" class="altColor">
<td class="colFirst"><code>static &lt;T&gt;&nbsp;<a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.Read.html" title="class in org.apache.beam.sdk.io.aws2.dynamodb">DynamoDBIO.Read</a>&lt;T&gt;</code></td>
<td class="colLast"><code><span class="memberNameLink"><a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.html#read--">read</a></span>()</code>&nbsp;</td>
</tr>
<tr id="i1" class="rowColor">
<td class="colFirst"><code>static &lt;T&gt;&nbsp;<a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.Write.html" title="class in org.apache.beam.sdk.io.aws2.dynamodb">DynamoDBIO.Write</a>&lt;T&gt;</code></td>
<td class="colLast"><code><span class="memberNameLink"><a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.html#write--">write</a></span>()</code>&nbsp;</td>
</tr>
</table>
<ul class="blockList">
<li class="blockList"><a name="methods.inherited.from.class.java.lang.Object">
<!-- -->
</a>
<h3>Methods inherited from class&nbsp;java.lang.Object</h3>
<code>clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait</code></li>
</ul>
</li>
</ul>
</li>
</ul>
</div>
<div class="details">
<ul class="blockList">
<li class="blockList">
<!-- ========= CONSTRUCTOR DETAIL ======== -->
<ul class="blockList">
<li class="blockList"><a name="constructor.detail">
<!-- -->
</a>
<h3>Constructor Detail</h3>
<a name="DynamoDBIO--">
<!-- -->
</a>
<ul class="blockListLast">
<li class="blockList">
<h4>DynamoDBIO</h4>
<pre>public&nbsp;DynamoDBIO()</pre>
</li>
</ul>
</li>
</ul>
<!-- ============ METHOD DETAIL ========== -->
<ul class="blockList">
<li class="blockList"><a name="method.detail">
<!-- -->
</a>
<h3>Method Detail</h3>
<a name="read--">
<!-- -->
</a>
<ul class="blockList">
<li class="blockList">
<h4>read</h4>
<pre>public static&nbsp;&lt;T&gt;&nbsp;<a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.Read.html" title="class in org.apache.beam.sdk.io.aws2.dynamodb">DynamoDBIO.Read</a>&lt;T&gt;&nbsp;read()</pre>
</li>
</ul>
<a name="write--">
<!-- -->
</a>
<ul class="blockListLast">
<li class="blockList">
<h4>write</h4>
<pre>public static&nbsp;&lt;T&gt;&nbsp;<a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.Write.html" title="class in org.apache.beam.sdk.io.aws2.dynamodb">DynamoDBIO.Write</a>&lt;T&gt;&nbsp;write()</pre>
</li>
</ul>
</li>
</ul>
</li>
</ul>
</div>
</div>
<!-- ========= END OF CLASS DATA ========= -->
<!-- ======= START OF BOTTOM NAVBAR ====== -->
<div class="bottomNav"><a name="navbar.bottom">
<!-- -->
</a>
<div class="skipNav"><a href="#skip.navbar.bottom" title="Skip navigation links">Skip navigation links</a></div>
<a name="navbar.bottom.firstrow">
<!-- -->
</a>
<ul class="navList" title="Navigation">
<li><a href="../../../../../../../overview-summary.html">Overview</a></li>
<li><a href="package-summary.html">Package</a></li>
<li class="navBarCell1Rev">Class</li>
<li><a href="package-tree.html">Tree</a></li>
<li><a href="../../../../../../../deprecated-list.html">Deprecated</a></li>
<li><a href="../../../../../../../index-all.html">Index</a></li>
<li><a href="../../../../../../../help-doc.html">Help</a></li>
</ul>
</div>
<div class="subNav">
<ul class="navList">
<li><a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDbClientProvider.html" title="interface in org.apache.beam.sdk.io.aws2.dynamodb"><span class="typeNameLink">Prev&nbsp;Class</span></a></li>
<li><a href="../../../../../../../org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.Read.html" title="class in org.apache.beam.sdk.io.aws2.dynamodb"><span class="typeNameLink">Next&nbsp;Class</span></a></li>
</ul>
<ul class="navList">
<li><a href="../../../../../../../index.html?org/apache/beam/sdk/io/aws2/dynamodb/DynamoDBIO.html" target="_top">Frames</a></li>
<li><a href="DynamoDBIO.html" target="_top">No&nbsp;Frames</a></li>
</ul>
<ul class="navList" id="allclasses_navbar_bottom">
<li><a href="../../../../../../../allclasses-noframe.html">All&nbsp;Classes</a></li>
</ul>
<div>
<script type="text/javascript"><!--
allClassesLink = document.getElementById("allclasses_navbar_bottom");
if(window==top) {
allClassesLink.style.display = "block";
}
else {
allClassesLink.style.display = "none";
}
//-->
</script>
</div>
<div>
<ul class="subNavList">
<li>Summary:&nbsp;</li>
<li><a href="#nested.class.summary">Nested</a>&nbsp;|&nbsp;</li>
<li>Field&nbsp;|&nbsp;</li>
<li><a href="#constructor.summary">Constr</a>&nbsp;|&nbsp;</li>
<li><a href="#method.summary">Method</a></li>
</ul>
<ul class="subNavList">
<li>Detail:&nbsp;</li>
<li>Field&nbsp;|&nbsp;</li>
<li><a href="#constructor.detail">Constr</a>&nbsp;|&nbsp;</li>
<li><a href="#method.detail">Method</a></li>
</ul>
</div>
<a name="skip.navbar.bottom">
<!-- -->
</a></div>
<!-- ======== END OF BOTTOM NAVBAR ======= -->
</body>
</html>