// blob: e36e08d54dc04269d23fd6459938a41542eb22e0 [file] [log] [blame]
import{_ as n,c as a,b as s,o as i}from"./app-DuBhTZk6.js";const t={};function l(r,e){return i(),a("div",null,e[0]||(e[0]=[s(`<h1 id="data-synchronisation" tabindex="-1"><a class="header-anchor" href="#data-synchronisation"><span>Data Synchronisation</span></a></h1><p>Data synchronisation is a typical requirement of industrial IoT. Through the data synchronisation mechanism, data sharing between IoTDBs can be achieved, and a complete data link can be built to meet the needs of intranet and extranet data interoperability, end-to-end cloud synchronisation, data migration, data backup, and so on.</p><h2 id="introduction" tabindex="-1"><a class="header-anchor" href="#introduction"><span>Introduction</span></a></h2><h3 id="synchronisation-task-overview" tabindex="-1"><a class="header-anchor" href="#synchronisation-task-overview"><span>Synchronisation Task Overview</span></a></h3><p>A data synchronisation task consists of 2 phases:</p><ul><li>Source phase: This part is used to extract data from the source IoTDB, which is defined in the source part of the SQL statement.</li><li>Sink phase: This part is used to send data to the target IoTDB and is defined in the sink part of the SQL statement.</li></ul><p>Flexible data synchronisation capabilities can be achieved by declaratively configuring the specifics of the 2 sections through SQL statements.</p><h3 id="synchronisation-task-create" tabindex="-1"><a class="header-anchor" href="#synchronisation-task-create"><span>Synchronisation Task - Create</span></a></h3><p>Use the <code>CREATE PIPE</code> statement to create a data synchronisation task, the following attributes <code>PipeId</code> and <code>sink</code> are mandatory, <code>source</code> and <code>processor</code> are optional, when entering the SQL note that the order of the <code>SOURCE </code> and <code>SINK</code> plugins are not interchangeable.</p><p>The SQL example is as follows:</p><div class="language-SQL line-numbers-mode" data-highlighter="prismjs" 
data-ext="SQL" data-title="SQL"><pre><code><span class="line">CREATE PIPE &lt;PipeId&gt; -- PipeId is the name that uniquely identifies the task.</span>
<span class="line">-- Data extraction plugin, optional</span>
<span class="line">WITH SOURCE (</span>
<span class="line"> [&lt;parameter&gt; = &lt;value&gt;,],</span>
<span class="line">)</span>
<span class="line">-- Data connection plugin, required</span>
<span class="line">WITH SINK (</span>
<span class="line"> [&lt;parameter&gt; = &lt;value&gt;,], -- data connection plugin, required.</span>
<span class="line">)</span>
<span class="line"></span></code></pre><div class="line-numbers" aria-hidden="true" style="counter-reset:line-number 0;"><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div></div></div><blockquote><p>πŸ“Œ Note: To use the data synchronisation feature, make sure that automatic metadata creation is enabled on the receiving side</p></blockquote><h3 id="synchronisation-tasks-management" tabindex="-1"><a class="header-anchor" href="#synchronisation-tasks-management"><span>Synchronisation Tasks - Management</span></a></h3><p>The Data Synchronisation task has three states; RUNNING, STOPPED and DROPPED.The task state transitions are shown below:</p><figure><img src="https://alioss.timecho.com/docs/img/ηŠΆζ€θΏη§»ε›Ύ.png" alt="State Migration Diagram" tabindex="0" loading="lazy"><figcaption>State Migration Diagram</figcaption></figure><p>A data synchronisation task passes through multiple states during its lifecycle:</p><ul><li>RUNNING: Running state. <ul><li>Explanation 1: The initial state of the task is the running state(V1.3.1+).</li></ul></li><li>STOPPED: Stopped state. <ul><li>Description 1: The initial state of the task is the stopped state(V1.3.0). 
A SQL statement is required to start the task.</li><li>Description 2: You can manually stop a running task with a SQL statement, and the state will change from RUNNING to STOPPED.</li><li>Description 3: When a task has an unrecoverable error, its status will automatically change from RUNNING to STOPPED.</li></ul></li><li>DROPPED: deleted state.</li></ul><p>We provide the following SQL statements to manage the status of synchronisation tasks.</p><h4 id="starting-a-task" tabindex="-1"><a class="header-anchor" href="#starting-a-task"><span>Starting a Task</span></a></h4><p>After creation, the task will not be processed immediately, you need to start the task. Use the <code>START PIPE</code> statement to start the task so that it can begin processing data:</p><div class="language-Go line-numbers-mode" data-highlighter="prismjs" data-ext="Go" data-title="Go"><pre><code><span class="line">START PIPE&lt;PipeId&gt;</span>
<span class="line"></span></code></pre><div class="line-numbers" aria-hidden="true" style="counter-reset:line-number 0;"><div class="line-number"></div></div></div><h4 id="stop-the-task" tabindex="-1"><a class="header-anchor" href="#stop-the-task"><span>Stop the task</span></a></h4><p>Stop processing data:</p><div class="language-Go line-numbers-mode" data-highlighter="prismjs" data-ext="Go" data-title="Go"><pre><code><span class="line">STOP PIPE &lt;PipeId&gt;</span>
<span class="line"></span></code></pre><div class="line-numbers" aria-hidden="true" style="counter-reset:line-number 0;"><div class="line-number"></div></div></div><h4 id="delete-a-task" tabindex="-1"><a class="header-anchor" href="#delete-a-task"><span>Delete a task</span></a></h4><p>Deletes the specified task:</p><div class="language-Go line-numbers-mode" data-highlighter="prismjs" data-ext="Go" data-title="Go"><pre><code><span class="line">DROP PIPE &lt;PipeId&gt;</span>
<span class="line"></span></code></pre><div class="line-numbers" aria-hidden="true" style="counter-reset:line-number 0;"><div class="line-number"></div></div></div><p>Deleting a task does not require you to stop synchronising the task first.</p><h4 id="viewing-tasks" tabindex="-1"><a class="header-anchor" href="#viewing-tasks"><span>Viewing Tasks</span></a></h4><p>View all tasks:</p><div class="language-Go line-numbers-mode" data-highlighter="prismjs" data-ext="Go" data-title="Go"><pre><code><span class="line">SHOW PIPES</span>
<span class="line"></span></code></pre><div class="line-numbers" aria-hidden="true" style="counter-reset:line-number 0;"><div class="line-number"></div></div></div><p>To view a specified task:</p><div class="language-Go line-numbers-mode" data-highlighter="prismjs" data-ext="Go" data-title="Go"><pre><code><span class="line">SHOW PIPE &lt;PipeId&gt;</span>
<span class="line"></span></code></pre><div class="line-numbers" aria-hidden="true" style="counter-reset:line-number 0;"><div class="line-number"></div></div></div><h3 id="plugin" tabindex="-1"><a class="header-anchor" href="#plugin"><span>Plugin</span></a></h3><p>In order to make the overall architecture more flexible to match different synchronisation scenarios, IoTDB supports plugin assembly in the above synchronisation task framework. Some common plugins are pre-built for you to use directly, and you can also customise sink plugins and load them into the IoTDB system for use.</p><table><thead><tr><th>Modules</th><th>Plugins</th><th>Pre-configured Plugins</th><th>Customised Plugins</th></tr></thead><tbody><tr><td>Extract (Source)</td><td>Source Plugin</td><td>iotdb-source</td><td>Not Supported</td></tr><tr><td>Send (Sink)</td><td>Sink plugin</td><td>iotdb-thrift-sink</td><td>Support</td></tr></tbody></table><h4 id="preconfigured-plugins" tabindex="-1"><a class="header-anchor" href="#preconfigured-plugins"><span>Preconfigured Plugins</span></a></h4><p>The preset plugins are listed below:</p><table><thead><tr><th>Plugin Name</th><th>Type</th><th>Introduction</th><th>Available Versions</th></tr></thead><tbody><tr><td>iotdb-source</td><td>source plugin</td><td>Default source plugin for extracting IoTDB historical or real-time data</td><td>1.2.x</td></tr><tr><td>iotdb-thrift-sink</td><td>sink plugin</td><td>Used for data transfer between IoTDB (v1.2.0 and above) and IoTDB (v1.2.0 and above). 
Uses the Thrift RPC framework to transfer data, multi-threaded async non-blocking IO model, high transfer performance, especially for scenarios where the target is distributed</td><td>1.2.x</td></tr></tbody></table><p>Detailed parameters for each plugin can be found in the <a href="#sink-parameters">Parameter Description</a> section of this document.</p><h4 id="view-plugins" tabindex="-1"><a class="header-anchor" href="#view-plugins"><span>View Plugins</span></a></h4><p>To view the plugins in the system (including custom and built-in plugins) you can use the following statement:</p><div class="language-Go line-numbers-mode" data-highlighter="prismjs" data-ext="Go" data-title="Go"><pre><code><span class="line">SHOW PIPEPLUGINS</span>
<span class="line"></span></code></pre><div class="line-numbers" aria-hidden="true" style="counter-reset:line-number 0;"><div class="line-number"></div></div></div><p>The following results are returned:</p><div class="language-Go line-numbers-mode" data-highlighter="prismjs" data-ext="Go" data-title="Go"><pre><code><span class="line">IoTDB&gt; show pipeplugins</span>
<span class="line">+------------------------------+----------+---------------------------------------------------------------------------------+---------+</span>
<span class="line">| PluginName|PluginType| ClassName|PluginJar|</span>
<span class="line">+------------------------------+----------+---------------------------------------------------------------------------------+---------+</span>
<span class="line">| DO-NOTHING-PROCESSOR| Builtin| org.apache.iotdb.commons.pipe.plugin.builtin.processor.DoNothingProcessor| |</span>
<span class="line">| DO-NOTHING-SINK| Builtin| org.apache.iotdb.commons.pipe.plugin.builtin.sink.DoNothingSink| |</span>
<span class="line">| IOTDB-SOURCE| Builtin| org.apache.iotdb.commons.pipe.plugin.builtin.source.IoTDBSOURCE| |</span>
<span class="line">| IOTDB-THRIFT-SINK| Builtin| org.apache.iotdb.commons.pipe.plugin.builtin.sink.IoTDBThriftSink| |</span>
<span class="line">+------------------------------+----------+---------------------------------------------------------------------------------+---------+</span>
<span class="line"></span>
<span class="line"></span></code></pre><div class="line-numbers" aria-hidden="true" style="counter-reset:line-number 0;"><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div></div></div><h2 id="use-examples" tabindex="-1"><a class="header-anchor" href="#use-examples"><span>Use examples</span></a></h2><h3 id="full-data-synchronisation" tabindex="-1"><a class="header-anchor" href="#full-data-synchronisation"><span>Full data synchronisation</span></a></h3><p>This example is used to demonstrate the synchronisation of all data from one IoTDB to another IoTDB with the data link as shown below:</p><figure><img src="https://alioss.timecho.com/upload/pipe1.jpg" alt="" tabindex="0" loading="lazy"><figcaption></figcaption></figure><p>In this example, we can create a synchronisation task named A2B to synchronise the full amount of data from IoTDB A to IoTDB B. Here we need to use the iotdb-thrift-sink plugin (built-in plugin) which uses sink, and we need to specify the address of the receiving end, in this example, we have specified &#39;sink.ip&#39; and &#39;sink.port&#39;, and we can also specify &#39;sink.port&#39;. This example specifies &#39;sink.ip&#39; and &#39;sink.port&#39;, and also &#39;sink.node-urls&#39;, as in the following example statement:</p><div class="language-Go line-numbers-mode" data-highlighter="prismjs" data-ext="Go" data-title="Go"><pre><code><span class="line">create pipe A2B</span>
<span class="line">with sink (</span>
<span class="line"> &#39;sink&#39;=&#39;iotdb-thrift-sink&#39;, </span>
<span class="line"> &#39;sink.ip&#39;=&#39;127.0.0.1&#39;,</span>
<span class="line"> &#39;sink.port&#39;=&#39;6668&#39;</span>
<span class="line">)</span>
<span class="line"></span></code></pre><div class="line-numbers" aria-hidden="true" style="counter-reset:line-number 0;"><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div></div></div><h3 id="synchronising-historical-data" tabindex="-1"><a class="header-anchor" href="#synchronising-historical-data"><span>Synchronising historical data</span></a></h3><p>This example is used to demonstrate the synchronisation of data from a certain historical time range (8:00pm 23 August 2023 to 8:00pm 23 October 2023) to another IoTDB, the data link is shown below:</p><figure><img src="https://alioss.timecho.com/upload/pipe2.jpg" alt="" tabindex="0" loading="lazy"><figcaption></figcaption></figure><p>In this example we can create a synchronisation task called A2B. First of all, we need to define the range of data to be transferred in source, since the data to be transferred is historical data (historical data refers to the data that existed before the creation of the synchronisation task), we need to configure the source.realtime.enable parameter to false; at the same time, we need to configure the start-time and end-time of the data and the mode of the transfer. At the same time, you need to configure the start-time and end-time of the data and the mode of transmission, and it is recommended that the mode be set to hybrid mode (hybrid mode is a mixed transmission mode, which adopts the real-time transmission mode when there is no backlog of data, and adopts the batch transmission mode when there is a backlog of data, and automatically switches according to the internal situation of the system).</p><p>The detailed statements are as follows:</p><div class="language-SQL line-numbers-mode" data-highlighter="prismjs" data-ext="SQL" data-title="SQL"><pre><code><span class="line">create pipe A2B</span>
<span class="line">WITH SOURCE (</span>
<span class="line">&#39;source&#39;= &#39;iotdb-source&#39;,</span>
<span class="line">&#39;source.realtime.mode&#39;=&#39;hybrid&#39;,</span>
<span class="line">&#39;source.history.start-time&#39; = &#39;2023.08.23T08:00:00+00:00&#39;,</span>
<span class="line">&#39;source.history.end-time&#39; = &#39;2023.10.23T08:00:00+00:00&#39;) </span>
<span class="line">with SINK (</span>
<span class="line">&#39;sink&#39;=&#39;iotdb-thrift-async-sink&#39;,</span>
<span class="line">&#39;sink.node-urls&#39;=&#39;xxxx:6668&#39;,</span>
<span class="line">&#39;sink.batch.enable&#39;=&#39;false&#39;)</span>
<span class="line"></span></code></pre><div class="line-numbers" aria-hidden="true" style="counter-reset:line-number 0;"><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div></div></div><h3 id="cascading-data-transfer" tabindex="-1"><a class="header-anchor" href="#cascading-data-transfer"><span>Cascading Data Transfer</span></a></h3><p>This example is used to demonstrate a cascading data transfer scenario between multiple IoTDBs, where data is synchronised from cluster A to cluster B and then to cluster C. The data link is shown in the figure below:</p><figure><img src="https://alioss.timecho.com/upload/pipe4.jpg" alt="" tabindex="0" loading="lazy"><figcaption></figcaption></figure><p>In this example, in order to synchronise the data from cluster A to C, the pipe between BC needs to be configured with <code>source.forwarding-pipe-requests</code> to <code>true</code>, the detailed statement is as follows:</p><p>Execute the following statement on A IoTDB to synchronise data from A to B:</p><div class="language-Go line-numbers-mode" data-highlighter="prismjs" data-ext="Go" data-title="Go"><pre><code><span class="line">create pipe AB</span>
<span class="line">with sink (</span>
<span class="line"> &#39;sink&#39;=&#39;iotdb-thrift-sink&#39;,</span>
<span class="line"> &#39;sink.ip&#39;=&#39;127.0.0.1&#39;,</span>
<span class="line"> &#39;sink.port&#39;=&#39;6668&#39;</span>
<span class="line">)</span>
<span class="line"></span></code></pre><div class="line-numbers" aria-hidden="true" style="counter-reset:line-number 0;"><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div></div></div><p>Execute the following statement on B IoTDB to synchronise data in B to C:</p><div class="language-Go line-numbers-mode" data-highlighter="prismjs" data-ext="Go" data-title="Go"><pre><code><span class="line">create pipe BC</span>
<span class="line">with source (</span>
<span class="line"> &#39;source.forwarding-pipe-requests&#39; = &#39;true&#39;)</span>
<span class="line">with sink (</span>
<span class="line"> &#39;sink&#39;=&#39;iotdb-thrift-sink&#39;,</span>
<span class="line"> &#39;sink.ip&#39;=&#39;127.0.0.1&#39;,</span>
<span class="line"> &#39;sink.port&#39;=&#39;6669&#39;</span>
<span class="line">)</span>
<span class="line"></span></code></pre><div class="line-numbers" aria-hidden="true" style="counter-reset:line-number 0;"><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div></div></div><h2 id="reference-notes" tabindex="-1"><a class="header-anchor" href="#reference-notes"><span>Reference: Notes</span></a></h2><p>The IoTDB configuration file (iotdb-common.properties) can be modified in order to adjust the parameters for data synchronisation, such as the synchronisation data storage directory. The complete configuration is as follows:</p><p>V1.3.0+:</p><div class="language-Properties line-numbers-mode" data-highlighter="prismjs" data-ext="Properties" data-title="Properties"><pre><code><span class="line">####################</span>
<span class="line">### Pipe Configuration</span>
<span class="line">####################</span>
<span class="line"></span>
<span class="line"># Uncomment the following field to configure the pipe lib directory.</span>
<span class="line"># For Windows platform</span>
<span class="line"># If its prefix is a drive specifier followed by &quot;\\\\&quot;, or if its prefix is &quot;\\\\\\\\&quot;, then the path is</span>
<span class="line"># absolute. Otherwise, it is relative.</span>
<span class="line"># pipe_lib_dir=ext\\\\pipe</span>
<span class="line"># For Linux platform</span>
<span class="line"># If its prefix is &quot;/&quot;, then the path is absolute. Otherwise, it is relative.</span>
<span class="line"># pipe_lib_dir=ext/pipe</span>
<span class="line"></span>
<span class="line"># The maximum number of threads that can be used to execute the pipe subtasks in PipeSubtaskExecutor.</span>
<span class="line"># The actual value will be min(pipe_subtask_executor_max_thread_num, max(1, CPU core number / 2)).</span>
<span class="line"># pipe_subtask_executor_max_thread_num=5</span>
<span class="line"></span>
<span class="line"># The connection timeout (in milliseconds) for the thrift client.</span>
<span class="line"># pipe_connector_timeout_ms=900000</span>
<span class="line"></span>
<span class="line"># The maximum number of selectors that can be used in the async connector.</span>
<span class="line"># pipe_async_connector_selector_number=1</span>
<span class="line"></span>
<span class="line"># The core number of clients that can be used in the async connector.</span>
<span class="line"># pipe_async_connector_core_client_number=8</span>
<span class="line"></span>
<span class="line"># The maximum number of clients that can be used in the async connector.</span>
<span class="line"># pipe_async_connector_max_client_number=16</span>
<span class="line"></span>
<span class="line"></span></code></pre><div class="line-numbers" aria-hidden="true" style="counter-reset:line-number 0;"><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div></div></div><p>V1.3.1+:</p><div class="language-Properties line-numbers-mode" data-highlighter="prismjs" data-ext="Properties" data-title="Properties"><pre><code><span class="line">####################</span>
<span class="line">### Pipe Configuration</span>
<span class="line">####################</span>
<span class="line"></span>
<span class="line"># Uncomment the following field to configure the pipe lib directory.</span>
<span class="line"># For Windows platform</span>
<span class="line"># If its prefix is a drive specifier followed by &quot;\\\\&quot;, or if its prefix is &quot;\\\\\\\\&quot;, then the path is</span>
<span class="line"># absolute. Otherwise, it is relative.</span>
<span class="line"># pipe_lib_dir=ext\\\\pipe</span>
<span class="line"># For Linux platform</span>
<span class="line"># If its prefix is &quot;/&quot;, then the path is absolute. Otherwise, it is relative.</span>
<span class="line"># pipe_lib_dir=ext/pipe</span>
<span class="line"></span>
<span class="line"># The maximum number of threads that can be used to execute the pipe subtasks in PipeSubtaskExecutor.</span>
<span class="line"># The actual value will be min(pipe_subtask_executor_max_thread_num, max(1, CPU core number / 2)).</span>
<span class="line"># pipe_subtask_executor_max_thread_num=5</span>
<span class="line"></span>
<span class="line"># The connection timeout (in milliseconds) for the thrift client.</span>
<span class="line"># pipe_sink_timeout_ms=900000</span>
<span class="line"></span>
<span class="line"></span></code></pre><div class="line-numbers" aria-hidden="true" style="counter-reset:line-number 0;"><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div></div></div><h2 id="reference-parameter-description" tabindex="-1"><a class="header-anchor" href="#reference-parameter-description"><span>Reference: parameter description</span></a></h2><p>πŸ“Œ Notes: for version 1.3.1 or later, any parameters other than &quot;source&quot;, &quot;processor&quot;, &quot;sink&quot; themselves need not be with the prefixes. For instance:</p><div class="language-Sql line-numbers-mode" data-highlighter="prismjs" data-ext="Sql" data-title="Sql"><pre><code><span class="line">create pipe A2B</span>
<span class="line">with sink (</span>
<span class="line"> &#39;sink&#39;=&#39;iotdb-air-gap-sink&#39;,</span>
<span class="line"> &#39;sink.ip&#39;=&#39;10.53.53.53&#39;,</span>
<span class="line"> &#39;sink.port&#39;=&#39;9780&#39;</span>
<span class="line">)</span>
<span class="line"></span></code></pre><div class="line-numbers" aria-hidden="true" style="counter-reset:line-number 0;"><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div></div></div><p>can be written as</p><div class="language-Sql line-numbers-mode" data-highlighter="prismjs" data-ext="Sql" data-title="Sql"><pre><code><span class="line">create pipe A2B</span>
<span class="line">with sink (</span>
<span class="line"> &#39;sink&#39;=&#39;iotdb-air-gap-sink&#39;,</span>
<span class="line"> &#39;ip&#39;=&#39;10.53.53.53&#39;,</span>
<span class="line"> &#39;port&#39;=&#39;9780&#39;</span>
<span class="line">)</span>
<span class="line"></span></code></pre><div class="line-numbers" aria-hidden="true" style="counter-reset:line-number 0;"><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div></div></div><h3 id="source-parameter" tabindex="-1"><a class="header-anchor" href="#source-parameter"><span>source parameter</span></a></h3><table><thead><tr><th>key</th><th>value</th><th>value range</th><th>required or not</th><th>default value</th></tr></thead><tbody><tr><td>source</td><td>iotdb-source</td><td>String: iotdb-source</td><td>required</td><td>-</td></tr><tr><td>source.pattern</td><td>Path prefix for filtering time series</td><td>String: any time series prefix</td><td>optional</td><td>root</td></tr><tr><td>source.history.start-time</td><td>Synchronise the start event time of historical data, including start-time</td><td>Long: [Long.MIN_VALUE, Long.MAX_VALUE]</td><td>optional</td><td>Long.MIN_VALUE</td></tr><tr><td>source.history.end-time</td><td>end event time for synchronised history data, contains end-time</td><td>Long: [Long.MIN_VALUE, Long.MAX_VALUE]</td><td>optional</td><td>Long.MAX_VALUE</td></tr><tr><td>start-time(V1.3.1+)</td><td>Synchronise the start event time of all data, including start-time</td><td>Long: [Long.MIN_VALUE, Long.MAX_VALUE]</td><td>optional</td><td>Long.MIN_VALUE</td></tr><tr><td>end-time(V1.3.1+)</td><td>end event time for synchronised all data, contains end-time</td><td>Long: [Long.MIN_VALUE, Long.MAX_VALUE]</td><td>optional</td><td>Long.MAX_VALUE</td></tr><tr><td>source.realtime.mode</td><td>Extraction mode of data</td><td>String: batch</td><td>optional</td><td>hybrid</td></tr></tbody></table><blockquote><p>πŸ’Ž <strong>Note: Difference between historical and real-time data</strong></p><ul><li><strong>Historical data</strong>: all data with arrival time &lt; current system time when the pipe was created is called 
historical data</li><li><strong>Real-time data</strong>: All data with arrival time &gt;= current system time when the pipe was created is called real-time data.</li><li><strong>Full data</strong>: full data = historical data + real time data</li></ul></blockquote><blockquote><p>πŸ’Ž <strong>Explanation: The meaning of batch mode</strong></p><ul><li><strong>batch</strong>: In this mode, the task will process and send data in batch (by underlying data file), which is characterised by low latency and high throughput.</li></ul></blockquote><h3 id="sink-parameters" tabindex="-1"><a class="header-anchor" href="#sink-parameters"><span>sink parameters</span></a></h3><h4 id="iotdb-thrift-sink" tabindex="-1"><a class="header-anchor" href="#iotdb-thrift-sink"><span>iotdb-thrift-sink</span></a></h4><table><thead><tr><th>key</th><th>value</th><th>value range</th><th>required or not</th><th>default value</th></tr></thead><tbody><tr><td>sink</td><td>iotdb-thrift-sink or iotdb-thrift-async-sink</td><td>String: iotdb-thrift-sink or iotdb-thrift-async-sink</td><td>required</td><td></td></tr><tr><td>sink.ip</td><td>Data service IP of a DataNode in the target IoTDB (note that the synchronisation task does not support forwarding to its own service)</td><td>String</td><td>Optional</td><td>Fill in either sink.node-urls</td></tr><tr><td>sink.port</td><td>Data service port of a DataNode in the target IoTDB (note that the synchronisation task does not support forwarding to its own service)</td><td>Integer</td><td>Optional</td><td>Fill in either sink.node-urls</td></tr><tr><td>sink.node-urls</td><td>The url of the data service port of any number of DataNodes on the target IoTDB (note that the synchronisation task does not support forwarding to its own service)</td><td>String. 
Example: &#39;127.0.0.1:6667,127.0.0.1:6668,127.0.0.1:6669&#39;, &#39;127.0.0.1:6667&#39;</td><td>Optional</td><td>Fill in either sink.ip:sink.port</td></tr><tr><td>sink.batch.enable</td><td>Whether to enable the log saving wholesale delivery mode, which is used to improve transmission throughput and reduce IOPS</td><td>Boolean: true, false</td><td>Optional</td><td>true</td></tr><tr><td>sink.batch.max-delay-seconds</td><td>Effective when the log save and send mode is turned on, indicates the longest time a batch of data waits before being sent (unit: s)</td><td>Integer</td><td>Optional</td><td>1</td></tr><tr><td>sink.batch.size-bytes</td><td>Effective when log saving and delivery mode is enabled, indicates the maximum saving size of a batch of data (unit: byte)</td><td>Long</td><td>Optional</td><td></td></tr></tbody></table>`,83)]))}const o=n(t,[["render",l],["__file","Data-Sync_apache.html.vue"]]),c=JSON.parse('{"path":"/UserGuide/latest/User-Manual/Data-Sync_apache.html","title":"Data Synchronisation","lang":"en-US","frontmatter":{"description":"Data Synchronisation Data synchronisation is a typical requirement of industrial IoT. Through the data synchronisation mechanism, data sharing between IoTDBs can be achieved, an...","head":[["link",{"rel":"alternate","hreflang":"zh-cn","href":"https://iotdb.apache.org/zh/UserGuide/latest/User-Manual/Data-Sync_apache.html"}],["meta",{"property":"og:url","content":"https://iotdb.apache.org/UserGuide/latest/User-Manual/Data-Sync_apache.html"}],["meta",{"property":"og:site_name","content":"IoTDB Website"}],["meta",{"property":"og:title","content":"Data Synchronisation"}],["meta",{"property":"og:description","content":"Data Synchronisation Data synchronisation is a typical requirement of industrial IoT. 
Through the data synchronisation mechanism, data sharing between IoTDBs can be achieved, an..."}],["meta",{"property":"og:type","content":"article"}],["meta",{"property":"og:image","content":"https://alioss.timecho.com/docs/img/%E7%8A%B6%E6%80%81%E8%BF%81%E7%A7%BB%E5%9B%BE.png"}],["meta",{"property":"og:locale","content":"en-US"}],["meta",{"property":"og:locale:alternate","content":"zh-CN"}],["meta",{"property":"og:updated_time","content":"2024-09-06T06:43:31.000Z"}],["meta",{"property":"article:modified_time","content":"2024-09-06T06:43:31.000Z"}],["script",{"type":"application/ld+json"},"{\\"@context\\":\\"https://schema.org\\",\\"@type\\":\\"Article\\",\\"headline\\":\\"Data Synchronisation\\",\\"image\\":[\\"https://alioss.timecho.com/docs/img/%E7%8A%B6%E6%80%81%E8%BF%81%E7%A7%BB%E5%9B%BE.png\\",\\"https://alioss.timecho.com/upload/pipe1.jpg\\",\\"https://alioss.timecho.com/upload/pipe2.jpg\\",\\"https://alioss.timecho.com/upload/pipe4.jpg\\"],\\"dateModified\\":\\"2024-09-06T06:43:31.000Z\\",\\"author\\":[]}"]]},"headers":[{"level":2,"title":"Introduction","slug":"introduction","link":"#introduction","children":[{"level":3,"title":"Synchronisation Task Overview","slug":"synchronisation-task-overview","link":"#synchronisation-task-overview","children":[]},{"level":3,"title":"Synchronisation Task - Create","slug":"synchronisation-task-create","link":"#synchronisation-task-create","children":[]},{"level":3,"title":"Synchronisation Tasks - Management","slug":"synchronisation-tasks-management","link":"#synchronisation-tasks-management","children":[]},{"level":3,"title":"Plugin","slug":"plugin","link":"#plugin","children":[]}]},{"level":2,"title":"Use examples","slug":"use-examples","link":"#use-examples","children":[{"level":3,"title":"Full data synchronisation","slug":"full-data-synchronisation","link":"#full-data-synchronisation","children":[]},{"level":3,"title":"Synchronising historical 
data","slug":"synchronising-historical-data","link":"#synchronising-historical-data","children":[]},{"level":3,"title":"Cascading Data Transfer","slug":"cascading-data-transfer","link":"#cascading-data-transfer","children":[]}]},{"level":2,"title":"Reference: Notes","slug":"reference-notes","link":"#reference-notes","children":[]},{"level":2,"title":"Reference: parameter description","slug":"reference-parameter-description","link":"#reference-parameter-description","children":[{"level":3,"title":"source parameter","slug":"source-parameter","link":"#source-parameter","children":[]},{"level":3,"title":"sink parameters","slug":"sink-parameters","link":"#sink-parameters","children":[]}]}],"git":{"createdTime":1696932526000,"updatedTime":1725605011000,"contributors":[{"name":"majialin","email":"107627937+mal117@users.noreply.github.com","commits":4},{"name":"W1y1r","email":"150988475+W1y1r@users.noreply.github.com","commits":2},{"name":"ηŸ³ζž—ζΎ","email":"50943998+shi10lin0s@users.noreply.github.com","commits":1}]},"readingTime":{"minutes":7.01,"words":2104},"filePathRelative":"UserGuide/latest/User-Manual/Data-Sync_apache.md","localizedDate":"October 10, 2023","autoDesc":true}');export{o as comp,c as data};