| <!DOCTYPE html> |
| <html lang="en"> |
| <head> |
| <meta charset="utf-8" /> |
| <meta http-equiv="X-UA-Compatible" content="IE=edge" /> |
| <meta name="viewport" content="width=device-width, initial-scale=1" /> |
| <!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags --> |
| <meta name="description" content="A new open source Apache Hadoop ecosystem project, Apache Kudu completes Hadoop's storage layer to enable fast analytics on fast data" /> |
| <meta name="author" content="Cloudera" /> |
| <title>Apache Kudu - Apache Kudu Prior Version Release Notes</title> |
| <!-- Bootstrap core CSS --> |
| <link rel="stylesheet" href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.6/css/bootstrap.min.css" |
| integrity="sha384-1q8mTJOASx8j1Au+a5WDVnPi2lkFfwwEAa8hDDdjZlpLegxhjVME1fgjWPGmkzs7" |
| crossorigin="anonymous"> |
| |
| <!-- Custom styles for this template --> |
| <link href="/css/kudu.css" rel="stylesheet"/> |
| <link href="/css/asciidoc.css" rel="stylesheet"/> |
| <link rel="shortcut icon" href="/img/logo-favicon.ico" /> |
| <link rel="stylesheet" href="https://maxcdn.bootstrapcdn.com/font-awesome/4.6.1/css/font-awesome.min.css" /> |
| |
| |
| |
| <!-- HTML5 shim and Respond.js for IE8 support of HTML5 elements and media queries --> |
| <!--[if lt IE 9]> |
| <script src="https://oss.maxcdn.com/html5shiv/3.7.2/html5shiv.min.js"></script> |
| <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script> |
| <![endif]--> |
| </head> |
| <body> |
| <div class="kudu-site container-fluid"> |
| <!-- Static navbar --> |
| <nav class="navbar navbar-default"> |
| <div class="container-fluid"> |
| <div class="navbar-header"> |
| <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar" aria-expanded="false" aria-controls="navbar"> |
| <span class="sr-only">Toggle navigation</span> |
| <span class="icon-bar"></span> |
| <span class="icon-bar"></span> |
| <span class="icon-bar"></span> |
| </button> |
| |
| <a class="logo" href="/"><img |
| src="//d3dr9sfxru4sde.cloudfront.net/i/k/apachekudu_logo_0716_80px.png" |
| srcset="//d3dr9sfxru4sde.cloudfront.net/i/k/apachekudu_logo_0716_80px.png 1x, //d3dr9sfxru4sde.cloudfront.net/i/k/apachekudu_logo_0716_160px.png 2x" |
| alt="Apache Kudu"/></a> |
| |
| </div> |
| <div id="navbar" class="collapse navbar-collapse"> |
| <ul class="nav navbar-nav navbar-right"> |
| <li > |
| <a href="/">Home</a> |
| </li> |
| <li > |
| <a href="/overview.html">Overview</a> |
| </li> |
| <li class="active"> |
| <a href="/docs/">Documentation</a> |
| </li> |
| <li > |
| <a href="/releases/">Releases</a> |
| </li> |
| <li > |
| <a href="/blog/">Blog</a> |
| </li> |
| <!-- NOTE: this dropdown menu does not appear on Mobile, so don't add anything here |
| that doesn't also appear elsewhere on the site. --> |
| <li class="dropdown"> |
| <a href="/community.html" role="button" aria-haspopup="true" aria-expanded="false">Community <span class="caret"></span></a> |
| <ul class="dropdown-menu"> |
| <li class="dropdown-header">GET IN TOUCH</li> |
| <li><a class="icon email" href="/community.html">Mailing Lists</a></li> |
| <li><a class="icon slack" href="https://getkudu-slack.herokuapp.com/">Slack Channel</a></li> |
| <li role="separator" class="divider"></li> |
| <li><a href="/community.html#meetups-user-groups-and-conference-presentations">Events and Meetups</a></li> |
| <li><a href="/committers.html">Project Committers</a></li> |
| <li><a href="/ecosystem.html">Ecosystem</a></li> |
| <!--<li><a href="/roadmap.html">Roadmap</a></li>--> |
| <li><a href="/community.html#contributions">How to Contribute</a></li> |
| <li role="separator" class="divider"></li> |
| <li class="dropdown-header">DEVELOPER RESOURCES</li> |
| <li><a class="icon github" href="https://github.com/apache/incubator-kudu">GitHub</a></li> |
| <li><a class="icon gerrit" href="http://gerrit.cloudera.org:8080/#/q/status:open+project:kudu">Gerrit Code Review</a></li> |
| <li><a class="icon jira" href="https://issues.apache.org/jira/browse/KUDU">JIRA Issue Tracker</a></li> |
| <li role="separator" class="divider"></li> |
| <li class="dropdown-header">SOCIAL MEDIA</li> |
| <li><a class="icon twitter" href="https://twitter.com/ApacheKudu">Twitter</a></li> |
| <li><a href="https://www.reddit.com/r/kudu/">Reddit</a></li> |
| <li role="separator" class="divider"></li> |
| <li class="dropdown-header">APACHE SOFTWARE FOUNDATION</li> |
| <li><a href="https://www.apache.org/security/" target="_blank">Security</a></li> |
| <li><a href="https://www.apache.org/foundation/sponsorship.html" target="_blank">Sponsorship</a></li> |
| <li><a href="https://www.apache.org/foundation/thanks.html" target="_blank">Thanks</a></li> |
| <li><a href="https://www.apache.org/licenses/" target="_blank">License</a></li> |
| </ul> |
| </li> |
| <li > |
| <a href="/faq.html">FAQ</a> |
| </li> |
| </ul><!-- /.nav --> |
| </div><!-- /#navbar --> |
| </div><!-- /.container-fluid --> |
| </nav> |
| |
| <!-- |
| |
| Licensed under the Apache License, Version 2.0 (the "License"); |
| you may not use this file except in compliance with the License. |
| You may obtain a copy of the License at |
| |
| http://www.apache.org/licenses/LICENSE-2.0 |
| |
| Unless required by applicable law or agreed to in writing, software |
| distributed under the License is distributed on an "AS IS" BASIS, |
| WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| See the License for the specific language governing permissions and |
| limitations under the License. |
| --> |
| |
| |
| <div class="container"> |
| <div class="row"> |
| <div class="col-md-9"> |
| |
| <h1>Apache Kudu Prior Version Release Notes</h1> |
| <div id="preamble"> |
| <div class="sectionbody"> |
| <div class="paragraph"> |
| <p>This section reproduces the release notes for new features and incompatible |
| changes in prior releases of Apache Kudu.</p> |
| </div> |
| <div class="admonitionblock note"> |
| <table> |
| <tr> |
| <td class="icon"> |
| <i class="fa icon-note" title="Note"></i> |
| </td> |
| <td class="content"> |
| The list of known issues and limitations for prior releases are not |
| reproduced on this page. Please consult the |
| <a href="http://kudu.apache.org/releases/">documentation of the appropriate release</a> |
| for a list of known issues and limitations. |
| </td> |
| </tr> |
| </table> |
| </div> |
| </div> |
| </div> |
| <div class="sect1"> |
| <h2 id="rn_1.1.0"><a class="link" href="#rn_1.1.0">Release notes specific to 1.1.0</a></h2> |
| <div class="sectionbody"> |
| |
| </div> |
| </div> |
| <div class="sect1"> |
| <h2 id="rn_1.1.0_new_features"><a class="link" href="#rn_1.1.0_new_features">New features</a></h2> |
| <div class="sectionbody"> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>The Python client has been brought up to feature parity with the Java and C++ clients |
| and as such the package version will be brought to 1.1 with this release (from 0.3). A |
| list of the highlights can be found below.</p> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>Improved Partial Row semantics</p> |
| </li> |
| <li> |
| <p>Range partition support</p> |
| </li> |
| <li> |
| <p>Scan Token API</p> |
| </li> |
| <li> |
| <p>Enhanced predicate support</p> |
| </li> |
| <li> |
| <p>Support for all Kudu data types (including a mapping of Python’s <code>datetime.datetime</code> to |
| <code>UNIXTIME_MICROS</code>)</p> |
| </li> |
| <li> |
| <p>Alter table support</p> |
| </li> |
| <li> |
| <p>Enabled Read at Snapshot for Scanners</p> |
| </li> |
| <li> |
| <p>Enabled Scanner Replica Selection</p> |
| </li> |
| <li> |
| <p>A few bug fixes for Python 3 in addition to various other improvements.</p> |
| </li> |
| </ul> |
| </div> |
| </li> |
| <li> |
| <p>IN LIST predicate pushdown support was added to allow optimized execution of filters which |
| match on a set of column values. Support for Spark, Map Reduce and Impala queries utilizing |
| IN LIST pushdown is not yet complete.</p> |
| </li> |
| <li> |
| <p>The Java client now features client-side request tracing in order to help troubleshoot timeouts. |
| Error messages are now augmented with traces that show which servers were contacted before the |
| timeout occured instead of just the last error. The traces also contain RPCs that were |
| required to fulfill the client’s request, such as contacting the master to discover a tablet’s |
| location. Note that the traces are not available for successful requests and are not |
| programatically queryable.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| </div> |
| <div class="sect1"> |
| <h2 id="_optimizations_and_improvements"><a class="link" href="#_optimizations_and_improvements">Optimizations and improvements</a></h2> |
| <div class="sectionbody"> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>Kudu now publishes JAR files for Spark 2.0 compiled with Scala 2.11 along with the |
| existing Spark 1.6 JAR compiled with Scala 2.10.</p> |
| </li> |
| <li> |
| <p>The Java client now allows configuring scanners to read from the closest replica instead of |
| the known leader replica. The default remains the latter. Use the relevant <code>ReplicaSelection</code> |
| enum with the scanner’s builder to change this behavior.</p> |
| </li> |
| <li> |
| <p>Tablet servers use a new policy for retaining write-ahead log (WAL) segments. |
| Previously, servers used the 'log_min_segments_to_retain' flag to prioritize |
| any flushes which were retaining log segments past the configured value (default 2). |
| This policy caused servers to flush in-memory data more frequently than necessary, |
| limiting write performance.</p> |
| <div class="paragraph"> |
| <p>The new policy introduces a new flag 'log_target_replay_size_mb' which |
| determines the threshold at which write-ahead log retention will prioritize flushes. |
| The new flag is considered experimental and users should not need to modify |
| its value.</p> |
| </div> |
| <div class="paragraph"> |
| <p>The improved policy has been seen to improve write performance in some use cases |
| by a factor of 2x relative to the old policy.</p> |
| </div> |
| </li> |
| <li> |
| <p>Kudu’s implementation of the Raft consensus algorithm has been improved to include |
| a "pre-election" phase. This can improve the stability of tablet leader election |
| in high-load scenarios, especially if each server hosts a high number of tablets.</p> |
| </li> |
| <li> |
| <p>Tablet server start-up time has been substantially improved in the case that |
| the server contains a high number of tombstoned tablet replicas.</p> |
| </li> |
| </ul> |
| </div> |
| <div class="sect2"> |
| <h3 id="_command_line_tools"><a class="link" href="#_command_line_tools">Command line tools</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>The tool <code>kudu tablet leader_step_down</code> has been added to manually force a leader to step down.</p> |
| </li> |
| <li> |
| <p>The tool <code>kudu remote_replica copy</code> has been added to manually copy a replica from |
| one running tablet server to another.</p> |
| </li> |
| <li> |
| <p>The tool <code>kudu local_replica delete</code> has been added to delete a replica of a tablet.</p> |
| </li> |
| <li> |
| <p>The <code>kudu test loadgen</code> tool has been added to replace the obsoleted |
| <code>insert-generated-rows</code> standalone binary. The new tool is enriched with |
| additional functionality and can be used to run load generation tests against |
| a Kudu cluster.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| </div> |
| </div> |
| <div class="sect1"> |
| <h2 id="_wire_protocol_compatibility"><a class="link" href="#_wire_protocol_compatibility">Wire protocol compatibility</a></h2> |
| <div class="sectionbody"> |
| <div class="paragraph"> |
| <p>Kudu 1.1.0 is wire-compatible with previous versions of Kudu:</p> |
| </div> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>Kudu 1.1 clients may connect to servers running Kudu 1.0. If the client uses the new |
| 'IN LIST' predicate type, an error will be returned.</p> |
| </li> |
| <li> |
| <p>Kudu 1.0 clients may connect to servers running Kudu 1.1 without limitations.</p> |
| </li> |
| <li> |
| <p>Rolling upgrade between Kudu 1.0 and Kudu 1.1 servers is believed to be possible |
| though has not been sufficiently tested. Users are encouraged to shut down all nodes |
| in the cluster, upgrade the software, and then restart the daemons on the new version.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| </div> |
| <div class="sect1"> |
| <h2 id="rn_1.1.0_incompatible_changes"><a class="link" href="#rn_1.1.0_incompatible_changes">Incompatible changes in Kudu 1.1.0</a></h2> |
| <div class="sectionbody"> |
| <div class="sect2"> |
| <h3 id="_client_apis_c_java_python"><a class="link" href="#_client_apis_c_java_python">Client APIs (C++/Java/Python)</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>The C++ client no longer requires the |
| <a href="https://gcc.gnu.org/onlinedocs/libstdc++/manual/using_dual_abi.html">old gcc5 ABI</a>. |
| Which ABI is actually used depends on the compiler configuration. Some new distros |
| (e.g. Ubuntu 16.04) will use the new ABI. Your application must use the same ABI as is |
| used by the client library; an easy way to guarantee this is to use the same compiler |
| to build both.</p> |
| </li> |
| <li> |
| <p>The C++ client’s <code>KuduSession::CountBufferedOperations()</code> method is |
| deprecated. Its behavior is inconsistent unless the session runs in the |
| <code>MANUAL_FLUSH</code> mode. Instead, to get number of buffered operations, count |
| invocations of the <code>KuduSession::Apply()</code> method since last |
| <code>KuduSession::Flush()</code> call or, if using asynchronous flushing, since last |
| invocation of the callback passed into <code>KuduSession::FlushAsync()</code>.</p> |
| </li> |
| <li> |
| <p>The Java client’s <code>OperationResponse.getWriteTimestamp</code> method was renamed to <code>getWriteTimestampRaw</code> |
| to emphasize that it doesn’t return milliseconds, unlike what its Javadoc indicated. The renamed |
| method was also hidden from the public APIs and should not be used.</p> |
| </li> |
| <li> |
| <p>The Java client’s sync API (<code>KuduClient</code>, <code>KuduSession</code>, <code>KuduScanner</code>) used to throw either |
| a <code>NonRecoverableException</code> or a <code>TimeoutException</code> for a timeout, and now it’s only possible for the |
| client to throw the former.</p> |
| </li> |
| <li> |
| <p>The Java client’s handling of errors in <code>KuduSession</code> was modified so that subclasses of |
| <code>KuduException</code> are converted into RowErrors instead of being thrown.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| </div> |
| </div> |
| <div class="sect1"> |
| <h2 id="rn_1.0.1"><a class="link" href="#rn_1.0.1">Release notes specific to 1.0.1</a></h2> |
| <div class="sectionbody"> |
| <div class="paragraph"> |
| <p>Apache Kudu 1.0.1 is a bug fix release, with no new features or backwards |
| incompatible changes.</p> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_1.0.1_fixed_issues"><a class="link" href="#rn_1.0.1_fixed_issues">Fixed Issues</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1681">KUDU-1681</a> Fixed a bug in |
| the tablet server which could cause a crash when the DNS lookup during master |
| heartbeat failed.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1660">KUDU-1660</a>: Fixed a bug |
| which would cause the Kudu master and tablet server to fail to start on single |
| CPU systems.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1651">KUDU-1652</a>: Fixed a bug |
| that would cause the C++ client, tablet server, and Java client to crash or |
| throw an exception when attempting to scan a table with a predicate which |
| simplifies to <code>IS NOT NULL</code> on a non-nullable column. For instance, setting a |
| <code>⇐ 127</code> predicate on an <code>INT8</code> column could trigger this bug, since the |
| predicate only filters null values.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1651">KUDU-1651</a>: Fixed a bug |
| that would cause the tablet server to crash when evaluating a scan with |
| predicates over a dictionary encoded column containing an entire block of null |
| values.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1623">KUDU-1623</a>: Fixed a bug |
| that would cause the tablet server to crash when handling UPSERT operations |
| that only set values for the primary key columns.</p> |
| </li> |
| <li> |
| <p><a href="http://gerrit.cloudera.org:8080/4488">Gerrit #4488</a> Fixed a bug in the |
| Java client’s KuduException class which could cause an unexpected |
| NullPointerException to be thrown when the exception did not have an |
| associated message.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1090">KUDU-1090</a> Fixed a bug in |
| the memory tracker which could cause a rare crash during tablet server |
| startup.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| </div> |
| </div> |
| <div class="sect1"> |
| <h2 id="rn_1.0.0"><a class="link" href="#rn_1.0.0">Release notes specific to 1.0.0</a></h2> |
| <div class="sectionbody"> |
| <div class="paragraph"> |
| <p>After approximately a year of beta releases, Apache Kudu has reached version 1.0. |
| This version number signifies that the development team feels that Kudu is stable |
| enough for usage in production environments.</p> |
| </div> |
| <div class="paragraph"> |
| <p>If you are new to Kudu, check out its list of <a href="index.html">features and benefits</a>.</p> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_1.0.0_new_features"><a class="link" href="#rn_1.0.0_new_features">New features</a></h3> |
| <div class="paragraph"> |
| <p>Kudu 1.0.0 delivers a number of new features, bug fixes, and optimizations.</p> |
| </div> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>Removal of multiversion concurrency control (MVCC) history is now supported. |
| This is known as tablet history GC. This allows Kudu to reclaim disk space, |
| where previously Kudu would keep a full history of all changes made to a |
| given table since the beginning of time. Previously, the only way to reclaim |
| disk space was to drop a table.</p> |
| <div class="paragraph"> |
| <p>Kudu will still keep historical data, and the amount of history retained is |
| controlled by setting the configuration flag <code>--tablet_history_max_age_sec</code>, |
| which defaults to 15 minutes (expressed in seconds). The timestamp |
| represented by the current time minus <code>tablet_history_max_age_sec</code> is known |
| as the ancient history mark (AHM). When a compaction or flush occurs, Kudu |
| will remove the history of changes made prior to the ancient history mark. |
| This only affects historical data; currently-visible data will not be |
| removed. A specialized maintenance manager background task to remove existing |
| "cold" historical data that is not in a row affected by the normal compaction |
| process will be added in a future release.</p> |
| </div> |
| </li> |
| <li> |
| <p>Most of Kudu’s command line tools have been consolidated under a new |
| top-level <code>kudu</code> tool. This reduces the number of large binaries distributed |
| with Kudu and also includes much-improved help output.</p> |
| </li> |
| <li> |
| <p>The Kudu Flume Sink now supports processing events containing Avro-encoded |
| records, using the new <code>AvroKuduOperationsProducer</code>.</p> |
| </li> |
| <li> |
| <p>Administrative tools including <code>kudu cluster ksck</code> now support running |
| against multi-master Kudu clusters.</p> |
| </li> |
| <li> |
| <p>The output of the <code>ksck</code> tool is now colorized and much easier to read.</p> |
| </li> |
| <li> |
| <p>The C++ client API now supports writing data in <code>AUTO_FLUSH_BACKGROUND</code> mode. |
| This can provide higher throughput for ingest workloads.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="_optimizations_and_improvements_2"><a class="link" href="#_optimizations_and_improvements_2">Optimizations and improvements</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>The performance of comparison predicates on dictionary-encoded columns has |
| been substantially optimized. Users are encouraged to use dictionary encoding |
| on any string or binary columns with low cardinality, especially if these |
| columns will be filtered with predicates.</p> |
| </li> |
| <li> |
| <p>The Java client is now able to prune partitions from scanners based on the |
| provided predicates. For example, an equality predicate on a hash-partitioned |
| column will now only access those tablets that could possibly contain matching |
| data. This is expected to improve performance for the Spark integration as well |
| as applications using the Java client API.</p> |
| </li> |
| <li> |
| <p>The performance of compaction selection in the tablet server has been |
| substantially improved. This can increase the efficiency of the background |
| maintenance threads and improve overall throughput of heavy write workloads.</p> |
| </li> |
| <li> |
| <p>The policy by which the tablet server retains write-ahead log (WAL) files has |
| been improved so that it takes into account other replicas of the tablet. |
| This should help mitigate the spurious eviction of tablet replicas on machines |
| that temporarily lag behind the other replicas.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="_wire_protocol_compatibility_2"><a class="link" href="#_wire_protocol_compatibility_2">Wire protocol compatibility</a></h3> |
| <div class="paragraph"> |
| <p>Kudu 1.0.0 maintains client-server wire-compatibility with previous releases. |
| Applications using the Kudu client libraries may be upgraded either |
| before, at the same time, or after the Kudu servers.</p> |
| </div> |
| <div class="paragraph"> |
| <p>Kudu 1.0.0 does <em>not</em> maintain server-server wire compatibility with previous |
| releases. Therefore, rolling upgrades between earlier versions of Kudu and |
| Kudu 1.0.0 are not supported.</p> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_1.0.0_incompatible_changes"><a class="link" href="#rn_1.0.0_incompatible_changes">Incompatible changes in Kudu 1.0.0</a></h3> |
| <div class="sect3"> |
| <h4 id="_command_line_tools_2"><a class="link" href="#_command_line_tools_2">Command line tools</a></h4> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>The <code>kudu-pbc-dump</code> tool has been removed. The same functionality is now |
| implemented as <code>kudu pbc dump</code>.</p> |
| </li> |
| <li> |
| <p>The <code>kudu-ksck</code> tool has been removed. The same functionality is now |
| implemented as <code>kudu cluster ksck</code>.</p> |
| </li> |
| <li> |
| <p>The <code>cfile-dump</code> tool has been removed. The same functionality is now |
| implemented as <code>kudu fs cfile dump</code>.</p> |
| </li> |
| <li> |
| <p>The <code>log-dump</code> tool has been removed. The same functionality is now |
| implemented as <code>kudu wal dump</code> and <code>kudu local_replica dump wals</code>.</p> |
| </li> |
| <li> |
| <p>The <code>kudu-admin</code> tool has been removed. The same functionality is now |
| implemented within <code>kudu table</code> and <code>kudu tablet</code>.</p> |
| </li> |
| <li> |
| <p>The <code>kudu-fs_dump</code> tool has been removed. The same functionality is now |
| implemented as <code>kudu fs dump</code>.</p> |
| </li> |
| <li> |
| <p>The <code>kudu-ts-cli</code> tool has been removed. The same functionality is now |
| implemented within <code>kudu master</code>, <code>kudu remote_replica</code>, and <code>kudu tserver</code>.</p> |
| </li> |
| <li> |
| <p>The <code>kudu-fs_list</code> tool has been removed and some similar useful |
| functionality has been moved under 'kudu local_replica'.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect3"> |
| <h4 id="_configuration_flags"><a class="link" href="#_configuration_flags">Configuration flags</a></h4> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>Some configuration flags are now marked as 'unsafe' and 'experimental'. Such flags |
| are disallowed by default. Users may access these flags by enabling the additional |
| flags <code>--unlock_unsafe_flags</code> and <code>--unlock_experimental_flags</code>. Usage of such flags |
| is not recommended, as the flags may be removed or modified with no deprecation period |
| and without notice in future Kudu releases.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect3"> |
| <h4 id="_client_apis_c_java_python_2"><a class="link" href="#_client_apis_c_java_python_2">Client APIs (C++/Java/Python)</a></h4> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>The <code>TIMESTAMP</code> column type has been renamed to <code>UNIXTIME_MICROS</code> in order to |
| reduce confusion between Kudu’s timestamp support and the timestamps supported |
| by other systems such as Apache Hive and Apache Impala (incubating). Existing |
| tables will automatically be updated to use the new name for the type.</p> |
| <div class="paragraph"> |
| <p>Clients upgrading to the new client libraries must move to the new name for |
| the type. Clients using old client libraries will continue to operate using |
| the old type name, even when connected to clusters that have been |
| upgraded. Similarly, if clients are upgraded before servers, existing |
| timestamp columns will be available using the new type name.</p> |
| </div> |
| </li> |
| <li> |
| <p><code>KuduSession</code> methods in the C++ library are no longer advertised as thread-safe |
| to have one set of semantics for both C++ and Java Kudu client libraries.</p> |
| </li> |
| <li> |
| <p>The <code>KuduScanToken::TabletServers</code> method in the C++ library has been removed. |
| The same information can now be found in the KuduScanToken::tablet method.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect3"> |
| <h4 id="_apache_flume_integration"><a class="link" href="#_apache_flume_integration">Apache Flume Integration</a></h4> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>The <code>KuduEventProducer</code> interface used to process Flume events into Kudu operations |
| for the Kudu Flume Sink has changed, and has been renamed <code>KuduOperationsProducer</code>. |
| The existing `KuduEventProducer`s have been updated for the new interface, and have |
| been renamed similarly.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| </div> |
| </div> |
| </div> |
| <div class="sect1"> |
| <h2 id="rn_0.10.0"><a class="link" href="#rn_0.10.0">Release notes specific to 0.10.0</a></h2> |
| <div class="sectionbody"> |
| <div class="paragraph"> |
| <p>Kudu 0.10.0 delivers a number of new features, bug fixes, and optimizations, |
| detailed below.</p> |
| </div> |
| <div class="paragraph"> |
| <p>Kudu 0.10.0 maintains wire-compatibility with previous releases, meaning |
| that applications using the Kudu client libraries may be upgraded either |
| before, at the same time, or after the Kudu servers. However, if you begin |
| using new features of Kudu 0.10.0 such as manually range-partitioned tables, |
| you must first upgrade all clients to this release.</p> |
| </div> |
| <div class="paragraph"> |
| <p>This release does not maintain full Java API or ABI compatibility with |
| Kudu 0.9.x due to a package rename and some other small changes. See below for details.</p> |
| </div> |
| <div class="paragraph"> |
| <p>See also <a href="https://issues.apache.org/jira/issues/?jql=project%20%3D%20KUDU%20AND%20status%20%3D%20Resolved |
| %20AND%20fixVersion%20%3D%200.10.0">JIRAs resolved |
| for Kudu 0.10.0</a> and <a href="https://github.com/apache/kudu/compare/0.9.1...0.10.0">Git |
| changes between 0.9.1 and 0.10.0</a>.</p> |
| </div> |
| <div class="paragraph"> |
| <p>To upgrade to Kudu 0.10.0, see <a href="#rn_0.10.0_upgrade">[rn_0.10.0_upgrade]</a>.</p> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.10.0_incompatible_changes"><a class="link" href="#rn_0.10.0_incompatible_changes">Incompatible changes and deprecated APIs in 0.10.0</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p><a href="http://gerrit.cloudera.org:8080/3737">Gerrit #3737</a> The Java client has been repackaged |
| under <code>org.apache.kudu</code> instead of <code>org.kududb</code>. Import statements for Kudu classes must |
| be modified in order to compile against 0.10.0. Wire compatibility is maintained.</p> |
| </li> |
| <li> |
| <p><a href="https://gerrit.cloudera.org/#/c/3055/">Gerrit #3055</a> The Java client’s |
| synchronous API methods now throw <code>KuduException</code> instead of <code>Exception</code>. |
| Existing code that catches <code>Exception</code> should still compile, but introspection of an |
| exception’s message may be impacted. This change was made to allow thrown exceptions to be |
| queried more easily using <code>KuduException.getStatus</code> and calling one of <code>Status’s methods. |
| For example, an operation that tries to delete a table that doesn’t exist would return a |
| `Status</code> that returns true when queried on <code>isNotFound()</code>.</p> |
| </li> |
| <li> |
| <p>The Java client’s <code>KuduTable.getTabletsLocations</code> set of methods is now |
| deprecated. Additionally, they now take an exclusive end partition key instead |
| of an inclusive key. Applications are encouraged to use the scan tokens API |
| instead of these methods in the future.</p> |
| </li> |
| <li> |
| <p>The C++ API for specifying split points on range-partitioned tables has been improved |
| to make it easier for callers to properly manage the ownership of the provided rows.</p> |
| <div class="paragraph"> |
| <p>The <code>TableCreator::split_rows</code> API took a <code>vector<const KuduPartialRow*></code>, which |
| made it very difficult for the calling application to do proper error handling with |
| cleanup when setting the fields of the <code>KuduPartialRow</code>. This API has been now been |
| deprecated and replaced by a new method <code>TableCreator::add_range_split</code> which allows |
| easier use of smart pointers for safe memory management.</p> |
| </div> |
| </li> |
| <li> |
| <p>The Java client’s internal buffering has been reworked. Previously, the number of |
| buffered write operations was constrained on a per-tablet-server basis. Now, the configured |
| maximum buffer size constrains the total number of buffered operations across all |
| tablet servers in the cluster. This provides a more consistent bound on the memory |
| usage of the client regardless of the size of the cluster to which it is writing.</p> |
| <div class="paragraph"> |
| <p>This change can negatively affect the write performance of Java clients which rely on |
| buffered writes. Consider using the <code>setMutationBufferSpace</code> API to increase a |
| session’s maximum buffer size if write performance seems to be degraded after upgrading |
| to Kudu 0.10.0.</p> |
| </div> |
| </li> |
| <li> |
| <p>The "remote bootstrap" process used to copy a tablet replica from one host to |
| another has been renamed to "Tablet Copy". This resulted in the renaming of |
| several RPC metrics. Any users previously explicitly fetching or monitoring metrics |
| related to Remote Bootstrap should update their scripts to reflect the new names.</p> |
| </li> |
| <li> |
| <p>The SparkSQL datasource for Kudu no longer supports mode <code>Overwrite</code>. Users should |
| use the new <code>KuduContext.upsertRows</code> method instead. Additionally, inserts using the |
| datasource are now upserts by default. The older behavior can be restored by setting |
| the <code>operation</code> parameter to <code>insert</code>.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.10.0_new_features"><a class="link" href="#rn_0.10.0_new_features">New features</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>Users may now manually manage the partitioning of a range-partitioned table. |
| When a table is created, the user may specify a set of range partitions that |
| do not cover the entire available key space. A user may add or drop range |
| partitions to existing tables.</p> |
| <div class="paragraph"> |
| <p>This feature can be particularly helpful with time series workloads in which |
| new partitions can be created on an hourly or daily basis. Old partitions |
| may be efficiently dropped if the application does not need to retain historical |
| data past a certain point.</p> |
| </div> |
| <div class="paragraph"> |
| <p>This feature is considered experimental for the 0.10 release. More details of |
| the new feature can be found in the accompanying |
| <a href="https://kudu.apache.org/2016/08/23/new-range-partitioning-features.html">blog post</a>.</p> |
| </div> |
| </li> |
| <li> |
| <p>Support for running Kudu clusters with multiple masters has been stabilized. |
| Users may start a cluster with three or five masters to provide fault tolerance |
| despite a failure of one or two masters, respectively.</p> |
| <div class="paragraph"> |
| <p>Note that certain tools (e.g. <code>ksck</code>) are still lacking complete support for |
| multiple masters. These deficiencies will be addressed in a following release.</p> |
| </div> |
| </li> |
| <li> |
| <p>Kudu now supports the ability to reserve a certain amount of free disk space |
| in each of its configured data directories. If a directory’s free disk space |
| drops to less than the configured minimum, Kudu will stop writing to that |
| directory until space becomes available. If no space is available in any |
| configured directory, Kudu will abort.</p> |
| <div class="paragraph"> |
| <p>This feature may be configured using the <code>fs_data_dirs_reserved_bytes</code> and |
| <code>fs_wal_dir_reserved_bytes</code> flags.</p> |
| </div> |
| </li> |
| <li> |
| <p>The Spark integration’s <code>KuduContext</code> now supports four new methods for writing to |
| Kudu tables: <code>insertRows</code>, <code>upsertRows</code>, <code>updateRows</code>, and <code>deleteRows</code>. These are |
| now the preferred way to write to Kudu tables from Spark.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.10.0_improvements"><a class="link" href="#rn_0.10.0_improvements">Improvements and optimizations</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1516">KUDU-1516</a> The <code>kudu-ksck</code> tool |
| has been improved and now detects problems such as when a tablet does not have |
| a majority of replicas on live tablet servers, or if those replicas aren’t in a |
| good state. Users who currently depend on the tool to detect inconsistencies may now see |
| failures when before they wouldn’t see any.</p> |
| </li> |
| <li> |
| <p><a href="https://gerrit.cloudera.org:8080/3477">Gerrit #3477</a> The way operations are buffered in |
| the Java client has been reworked. Previously, the session’s buffer size was set per tablet, meaning that a buffer |
| size of 1,000 for 10 tablets being written to allowed for 10,000 operations to be buffered at the |
| same time. With this change, all the tablets share one buffer, so users might need to set a |
| bigger buffer size in order to reach the same level of performance as before.</p> |
| </li> |
| <li> |
| <p><a href="https://gerrit.cloudera.org/#/c/3674/">Gerrit #3674</a> Added LESS and GREATER options for |
| column predicates.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1444">KUDU-1444</a> added support for passing |
| back basic per-scan metrics (e.g cache hit rate) from the server to the C++ client. See the |
| <code>KuduScanner::GetResourceMetrics()</code> API for detailed usage. This feature will be supported |
| in the Java client API in a future release.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1446">KUDU-1446</a> improved the order in |
| which the tablet server evaluates predicates, so that predicates on smaller columns |
| are evaluated first. This may improve performance on queries which apply predicates |
| on multiple columns of different sizes.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1398">KUDU-1398</a> improved the storage |
| efficiency of Kudu’s internal primary key indexes. This optimization should decrease space |
| usage and improve random access performance, particularly for workloads with lengthy |
| primary keys.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.10.0_fixed_issues"><a class="link" href="#rn_0.10.0_fixed_issues">Fixed Issues</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p><a href="https://gerrit.cloudera.org/#/c/3541/">Gerrit #3541</a> Fixed a problem in the Java client |
| whereby an RPC could be dropped when a connection to a tablet server or master was forcefully |
| closed on the server-side while RPCs to that server were in the process of being encoded. |
| The effect was that the RPC would not be sent, and users of the synchronous API would receive |
| a <code>TimeoutException</code>. Several other Java client bugs which could cause similar spurious timeouts |
| were also fixed in this release.</p> |
| </li> |
| <li> |
| <p><a href="https://gerrit.cloudera.org/<mark>/c/3724/">Gerrit #3724</a> Fixed a problem in the Java client |
| whereby an RPC could be dropped when a socket timeout was fired while that RPC was being sent to |
| a tablet server or master. This would manifest itself in the same way |
| <a href="https://gerrit.cloudera.org/</mark>/c/3541/">Gerrit #3541</a>.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1538">KUDU-1538</a> fixed a bug in which recycled |
| block identifiers could cause the tablet server to lose data. Following this bug fix, block |
| identifiers will no longer be reused.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.10.0_changes"><a class="link" href="#rn_0.10.0_changes">Other noteworthy changes</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>This is the first release of Apache Kudu as a top-level (non-incubating) |
| project!</p> |
| </li> |
| <li> |
| <p>The default false positive rate for Bloom filters has been changed |
| from 1% to 0.01%. This will increase the space consumption of Bloom |
| filters by a factor of two (from approximately 10 bits per row to |
| approximately 20 bits per row). This is expected to substantially |
| improve the performance of random-write workloads at the cost of an |
| incremental increase in disk space usage.</p> |
| </li> |
| <li> |
| <p>The Kudu C++ client library now has Doxygen-based |
| <a href="http://kudu.apache.org/cpp-client-api/">API documentation</a> |
| available online.</p> |
| </li> |
| <li> |
| <p>Kudu now |
| <a href="http://kudu.apache.org/2016/06/17/raft-consensus-single-node.html"> |
| uses the Raft consensus algorithm even for unreplicated tables</a>. |
| This change simplifies code and will also allow administrators to enable |
| replication on a previously-unreplicated table. This change is internal and |
| should not be visible to users.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| </div> |
| </div> |
| <div class="sect1"> |
| <h2 id="rn_0.9.1"><a class="link" href="#rn_0.9.1">Release notes specific to 0.9.1</a></h2> |
| <div class="sectionbody"> |
| <div class="paragraph"> |
| <p>Kudu 0.9.1 delivers incremental bug fixes over Kudu 0.9.0. It is fully compatible with |
| Kudu 0.9.0.</p> |
| </div> |
| <div class="paragraph"> |
| <p>See also <a href="https://issues.apache.org/jira/issues/?jql=project%20%3D%20KUDU%20AND%20status%20%3D%20Resolved |
| %20AND%20fixVersion%20%3D%200.9.1">JIRAs resolved |
| for Kudu 0.9.1</a> and <a href="https://github.com/apache/kudu/compare/0.9.0...0.9.1">Git |
| changes between 0.9.0 and 0.9.1</a>.</p> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.9.1_fixed_issues"><a class="link" href="#rn_0.9.1_fixed_issues">Fixed Issues</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1469">KUDU-1469</a> fixed a bug in |
| our Raft consensus implementation that could cause a tablet to stop making progress after a leader |
| election.</p> |
| </li> |
| <li> |
| <p><a href="https://gerrit.cloudera.org/#/c/3456/">Gerrit #3456</a> fixed a bug in which |
| servers under high load could store metric information in incorrect memory |
| locations, causing crashes or data corruption.</p> |
| </li> |
| <li> |
| <p><a href="https://gerrit.cloudera.org/#/c/3457/">Gerrit #3457</a> fixed a bug in which |
| errors from the Java client would carry an incorrect error message.</p> |
| </li> |
| <li> |
| <p>Several other small bug fixes were backported to improve stability.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| </div> |
| </div> |
| <div class="sect1"> |
| <h2 id="rn_0.9.0"><a class="link" href="#rn_0.9.0">Release notes specific to 0.9.0</a></h2> |
| <div class="sectionbody"> |
| <div class="paragraph"> |
| <p>Kudu 0.9.0 delivers incremental features, improvements, and bug fixes over the previous versions.</p> |
| </div> |
| <div class="paragraph"> |
| <p>See also <a href="https://issues.apache.org/jira/issues/?jql=project%20%3D%20KUDU%20AND%20status%20%3D%20Resolved |
| %20AND%20fixVersion%20%3D%200.9.0">JIRAs resolved |
| for Kudu 0.9.0</a> and <a href="https://github.com/apache/kudu/compare/0.8.0...0.9.0">Git |
| changes between 0.8.0 and 0.9.0</a>.</p> |
| </div> |
| <div class="paragraph"> |
| <p>To upgrade to Kudu 0.10.0, see <a href="#rn_0.9.0_upgrade">[rn_0.9.0_upgrade]</a>.</p> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.9.0_incompatible_changes"><a class="link" href="#rn_0.9.0_incompatible_changes">Incompatible changes</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>The <code>KuduTableInputFormat</code> command has changed the way in which it handles |
| scan predicates, including how it serializes predicates to the job configuration |
| object. The new configuration key is <code>kudu.mapreduce.encoded.predicate</code>. Clients |
| using the <code>TableInputFormatConfigurator</code> are not affected.</p> |
| </li> |
| <li> |
| <p>The <code>kudu-spark</code> sub-project has been renamed to follow naming conventions for |
| Scala. The new name is <code>kudu-spark_2.10</code>.</p> |
| </li> |
| <li> |
| <p>Default table partitioning has been removed. All tables must now be created |
| with explicit partitioning. Existing tables are unaffected. See the |
| <a href="schema_design.html#no_default_partitioning">schema design guide</a> for more |
| details.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.9.0_new_features"><a class="link" href="#rn_0.9.0_new_features">New features</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1002">KUDU-1002</a> Added support for |
| <code>UPSERT</code> operations, whereby a row is inserted if it does not already exist, but |
| updated if it does. Support for <code>UPSERT</code> is included in Java, C++, and Python APIs, |
| but not in Impala.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1306">KUDU-1306</a> Scan token API |
| for creating partition-aware scan descriptors. This API simplifies executing |
| parallel scans for clients and query engines.</p> |
| </li> |
| <li> |
| <p><a href="http://gerrit.cloudera.org:8080/#/c/2848/">Gerrit 2848</a> Added a kudu datasource |
| for Spark. This datasource uses the Kudu client directly instead of |
| using the MapReduce API. Predicate pushdowns for <code>spark-sql</code> and Spark filters are |
| included, as well as parallel retrieval for multiple tablets and column projections. |
| See an example of <a href="developing.html#_kudu_integration_with_spark">Kudu integration with Spark</a>.</p> |
| </li> |
| <li> |
| <p><a href="http://gerrit.cloudera.org:8080/#/c/2992/">Gerrit 2992</a> Added the ability |
| to update and insert from Spark using a Kudu datasource.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.9.0_improvements"><a class="link" href="#rn_0.9.0_improvements">Improvements</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1415">KUDU-1415</a> Added statistics in the Java |
| client such as the number of bytes written and the number of operations applied.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1451">KUDU-1451</a> Improved tablet server restart |
| time when the tablet server needs to clean up of a lot previously deleted tablets. Tablets are |
| now cleaned up after they are deleted.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.9.0_fixed_issues"><a class="link" href="#rn_0.9.0_fixed_issues">Fixed Issues</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-678">KUDU-678</a> Fixed a leak that happened during |
| DiskRowSet compactions where tiny blocks were still written to disk even if there were no REDO |
| records. With the default block manager, it usually resulted in block containers with thousands |
| of tiny blocks.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1437">KUDU-1437</a> Fixed a data corruption issue |
| that occured after compacting sequences of negative INT32 values in a column that |
| was configured with RLE encoding.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.9.0_changes"><a class="link" href="#rn_0.9.0_changes">Other noteworthy changes</a></h3> |
| <div class="paragraph"> |
| <p>All Kudu clients have longer default timeout values, as listed below.</p> |
| </div> |
| <div class="ulist"> |
| <div class="title">Java</div> |
| <ul> |
| <li> |
| <p>The default operation timeout and the default admin operation timeout |
| are now set to 30 seconds instead of 10.</p> |
| </li> |
| <li> |
| <p>The default socket read timeout is now 10 seconds instead of 5.</p> |
| </li> |
| </ul> |
| </div> |
| <div class="ulist"> |
| <div class="title">C++</div> |
| <ul> |
| <li> |
| <p>The default admin timeout is now 30 seconds instead of 10.</p> |
| </li> |
| <li> |
| <p>The default RPC timeout is now 10 seconds instead of 5.</p> |
| </li> |
| <li> |
| <p>The default scan timeout is now 30 seconds instead of 15.</p> |
| </li> |
| <li> |
| <p>Some default settings related to I/O behavior during flushes and compactions have been changed: |
| The default for <code>flush_threshold_mb</code> has been increased from 64MB to 1000MB. The default |
| <code>cfile_do_on_finish</code> has been changed from <code>close</code> to <code>flush</code>. |
| <a href="http://getkudu.io/2016/04/26/ycsb.html">Experiments using YCSB</a> indicate that these |
| values will provide better throughput for write-heavy applications on typical server hardware.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| </div> |
| </div> |
| <div class="sect1"> |
| <h2 id="rn_0.8.0"><a class="link" href="#rn_0.8.0">Release notes specific to 0.8.0</a></h2> |
| <div class="sectionbody"> |
| <div class="paragraph"> |
| <p>Kudu 0.8.0 delivers incremental features, improvements, and bug fixes over the previous versions.</p> |
| </div> |
| <div class="paragraph"> |
| <p>See also <a href="https://issues.apache.org/jira/issues/?jql=project%20%3D%20KUDU%20AND%20status%20%3D%20Resolved |
| %20AND%20fixVersion%20%3D%200.8.0">JIRAs resolved |
| for Kudu 0.8.0</a> and <a href="https://github.com/apache/kudu/compare/0.7.1...0.8.0">Git |
| changes between 0.7.1 and 0.8.0</a>.</p> |
| </div> |
| <div class="paragraph"> |
| <p>To upgrade to Kudu 0.8.0, see <a href="installation.html#upgrade">Upgrade from 0.7.1 to 0.8.0</a>.</p> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.8.0_incompatible_changes"><a class="link" href="#rn_0.8.0_incompatible_changes">Incompatible changes</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>0.8.0 clients are not fully compatible with servers running Kudu 0.7.1 or lower. |
| In particular, scans that specify column predicates will fail. To work around this |
| issue, upgrade all Kudu servers before upgrading clients.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.8.0_new_features"><a class="link" href="#rn_0.8.0_new_features">New features</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-431">KUDU-431</a> A simple Flume |
| sink has been implemented.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.8.0_improvements"><a class="link" href="#rn_0.8.0_improvements">Improvements</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-839">KUDU-839</a> Java RowError now uses an enum error code.</p> |
| </li> |
| <li> |
| <p><a href="http://gerrit.cloudera.org:8080/#/c/2138/">Gerrit 2138</a> The handling of |
| column predicates has been re-implemented in the server and clients.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1379">KUDU-1379</a> Partition pruning |
| has been implemented for C++ clients (but not yet for the Java client). This feature |
| allows you to avoid reading a tablet if you know it does not serve the row keys you are querying.</p> |
| </li> |
| <li> |
| <p><a href="http://gerrit.cloudera.org:8080/#/c/2641">Gerrit 2641</a> Kudu now uses |
| <code>earliest-deadline-first</code> RPC scheduling and rejection. This changes the behavior |
| of the RPC service queue to prevent unfairness when processing a backlog of RPC |
| threads and to increase the likelihood that an RPC will be processed before it |
| can time out.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.8.0_fixed_issues"><a class="link" href="#rn_0.8.0_fixed_issues">Fixed Issues</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p><a href="https://issues.cloudera.org/browse/KUDU-1337">KUDU-1337</a> Tablets from tables |
| that were deleted might be unnecessarily re-bootstrapped when the leader gets the |
| notification to delete itself after the replicas do.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.cloudera.org/browse/KUDU-969">KUDU-969</a> If a tablet server |
| shuts down while compacting a rowset and receiving updates for it, it might immediately |
| crash upon restart while bootstrapping that rowset’s tablet.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.cloudera.org/browse/KUDU-1354">KUDU-1354</a> Due to a bug in Kudu’s |
| MVCC implementation where row locks were released before the MVCC commit happened, |
| flushed data would include out-of-order transactions, triggering a crash on the |
| next compaction.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1322">KUDU-1322</a> The C++ client |
| now retries write operations if the tablet it is trying to reach has already been |
| deleted.</p> |
| </li> |
| <li> |
| <p><a href="http://gerrit.cloudera.org:8080/#/c/2571/">Gerrit 2571</a> Due to a bug in the |
| Java client, users were unable to close the <code>kudu-spark</code> shell because of |
| lingering non-daemon threads.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.8.0_changes"><a class="link" href="#rn_0.8.0_changes">Other noteworthy changes</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p><a href="http://gerrit.cloudera.org:8080/#/c/2239/">Gerrit 2239</a> The concept of "feature flags" |
| was introduced in order to manage compatibility between different |
| Kudu versions. One case where this is helpful is if a newer client attempts to use |
| a feature unsupported by the currently-running tablet server. Rather than receiving |
| a cryptic error, the user gets an error message that is easier to interpret. |
| This is an internal change for Kudu system developers and requires no action by |
| users of the clients or API.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| </div> |
| </div> |
| <div class="sect1"> |
| <h2 id="rn_0.7.1"><a class="link" href="#rn_0.7.1">Release notes specific to 0.7.1</a></h2> |
| <div class="sectionbody"> |
| <div class="paragraph"> |
| <p>Kudu 0.7.1 is a bug fix release for 0.7.0.</p> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.7.1_fixed_issues"><a class="link" href="#rn_0.7.1_fixed_issues">Fixed Issues</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1325">KUDU-1325</a> fixes a tablet server crash that could |
| occur during table deletion. In some cases, while a table was being deleted, other replicas would |
| attempt to re-replicate tablets to servers that had already processed the deletion. This could |
| trigger a race condition that caused a crash.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1341">KUDU-1341</a> fixes a potential data corruption and |
| crash that could happen shortly after tablet server restarts in workloads that repeatedly delete |
| and re-insert rows with the same primary key. In most cases, this corruption affected only a single |
| replica and could be repaired by re-replicating from another.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1343">KUDU-1343</a> fixes a bug in the Java client that |
| occurs when a scanner has to scan multiple batches from one tablet and then start scanning from |
| another. In particular, this would affect any scans using the Java client that read large numbers |
| of rows from multi-tablet tables.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1345">KUDU-1345</a> fixes a bug where in some cases the |
| hybrid clock could jump backwards, resulting in a crash followed by an inability to |
| restart the affected tablet server.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.apache.org/jira/browse/KUDU-1360">KUDU-1360</a> fixes a bug in the kudu-spark module |
| which prevented reading rows with <code>NULL</code> values.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| </div> |
| </div> |
| <div class="sect1"> |
| <h2 id="rn_0.7.0"><a class="link" href="#rn_0.7.0">Release notes specific to 0.7.0</a></h2> |
| <div class="sectionbody"> |
| <div class="paragraph"> |
| <p>Kudu 0.7.0 is the first release done as part of the Apache Incubator and includes a number |
| of changes, new features, improvements, and fixes.</p> |
| </div> |
| <div class="paragraph"> |
| <p>See also <a href="https://issues.cloudera.org/issues/?jql=project%20%3D%20Kudu%20AND%20status%20in%20 |
| (Resolved)%20AND%20fixVersion%20%3D%200.7.0%20ORDER%20BY%20key%20ASC">JIRAs resolved |
| for Kudu 0.7.0</a> and <a href="https://github.com/apache/kudu/compare/branch-0.6.0...branch-0.7.0">Git |
| changes between 0.6.0 and 0.7.0</a>.</p> |
| </div> |
| <div class="paragraph"> |
| <p>The upgrade instructions can be found at <a href="installation.html#upgrade">Upgrade from 0.6.0 to 0.7.0</a>.</p> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.7.0_incompatible_changes"><a class="link" href="#rn_0.7.0_incompatible_changes">Incompatible changes</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>The C++ client includes a new API, <code>KuduScanBatch</code>, which performs better when a |
| large number of small rows are returned in a batch. The old API of <code>vector<KuduRowResult></code> |
| is deprecated.</p> |
| <div class="admonitionblock note"> |
| <table> |
| <tr> |
| <td class="icon"> |
| <i class="fa icon-note" title="Note"></i> |
| </td> |
| <td class="content"> |
| This change is API-compatible but <strong>not</strong> ABI-compatible. |
| </td> |
| </tr> |
| </table> |
| </div> |
| </li> |
| <li> |
| <p>The default replication factor has been changed from 1 to 3. Existing tables will |
| continue to use the replication factor they were created with. Applications that create |
| tables may not work properly if they assume a replication factor of 1 and fewer than |
| 3 replicas are available. To use the previous default replication factor, start the |
| master with the configuration flag <code>--default_num_replicas=1</code>.</p> |
| </li> |
| <li> |
| <p>The Python client has been completely rewritten, with a focus on improving code |
| quality and testing. The read path (scanners) has been improved by adding many of |
| the features already supported by the C++ and Java clients. The Python client is no |
| longer considered experimental.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.7.0_new_features"><a class="link" href="#rn_0.7.0_new_features">New features</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>With the goal of Spark integration in mind, a new <code>kuduRDD</code> API has been added, |
| which wraps <code>newAPIHadoopRDD</code> and includes a default source for Spark SQL.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.7.0_improvements"><a class="link" href="#rn_0.7.0_improvements">Improvements</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>The Java client includes new methods <code>countPendingErrors()</code> and |
| <code>getPendingErrors()</code> on <code>KuduSession</code>. These methods allow you to count and |
| retrieve outstanding row errors when configuring sessions with <code>AUTO_FLUSH_BACKGROUND</code>.</p> |
| </li> |
| <li> |
| <p>New server-level metrics allow you to monitor CPU usage and context switching.</p> |
| </li> |
| <li> |
| <p>Kudu now builds on RHEL 7, CentOS 7, and SLES 12. Extra instructions are included |
| for SLES 12.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.7.0_fixed_issues"><a class="link" href="#rn_0.7.0_fixed_issues">Fixed Issues</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p><a href="https://issues.cloudera.org/browse/KUDU-1288">KUDU-1288</a> fixes a severe file descriptor |
| leak, which could previously only be resolved by restarting the tablet server.</p> |
| </li> |
| <li> |
| <p><a href="https://issues.cloudera.org/browse/KUDU-1250">KUDU-1250</a> fixes a hang in the Java |
| client when processing an in-flight batch and the previous batch encountered an error.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| <div class="sect2"> |
| <h3 id="rn_0.7.0_changes"><a class="link" href="#rn_0.7.0_changes">Other noteworthy changes</a></h3> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>The file block manager’s performance was improved, but it is still not recommended for |
| real-world use.</p> |
| </li> |
| <li> |
| <p>The master now attempts to spread tablets more evenly across the cluster during |
| table creation. This has no impact on existing tables, but will improve the speed |
| at which under-replicated tabletsare re-replicated after a tablet server failure.</p> |
| </li> |
| <li> |
| <p>All licensing documents have been modified to adhere to ASF guidelines.</p> |
| </li> |
| <li> |
| <p>Kudu now requires an out-of-tree build directory. Review the build instructions |
| for additional information.</p> |
| </li> |
| <li> |
| <p>The <code>C` client library is now explicitly built against the |
| link:https://gcc.gnu.org/onlinedocs/libstdc/manual/using_dual_abi.html[old gcc5 ABI]. |
| If you use gcc5 to build a Kudu application, your application must use the old ABI |
| as well. This is typically achieved by defining the `_GLIBCXX_USE_CXX11_ABI</code> macro |
| at compile-time when building your application. For more information, see the |
| previous link and link:http://developerblog.redhat.com/2015/02/05/gcc5-and-the-c11-abi/.</p> |
| </li> |
| <li> |
| <p>The Python client is no longer considered experimental.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| </div> |
| </div> |
| <div class="sect1"> |
| <h2 id="rn_0.6.0"><a class="link" href="#rn_0.6.0">Release notes specific to 0.6.0</a></h2> |
| <div class="sectionbody"> |
| <div class="paragraph"> |
| <p>The 0.6.0 release contains incremental improvements and bug fixes. The most notable |
| changes are:</p> |
| </div> |
| <div class="ulist"> |
| <ul> |
| <li> |
| <p>The Java client’s CreateTableBuilder and AlterTableBuilder classes have been renamed |
| to CreateTableOptions and AlterTableOptions. Their methods now also return <code>this</code> objects, |
| allowing them to be used as builders.</p> |
| </li> |
| <li> |
| <p>The Java client’s AbstractKuduScannerBuilder#maxNumBytes() setter is now called |
| batchSizeBytes as is the corresponding property in AsyncKuduScanner. This makes it |
| consistent with the C++ client.</p> |
| </li> |
| <li> |
| <p>The "kudu-admin" tool can now list and delete tables via its new subcommands |
| "list_tables" and "delete_table <table_name>".</p> |
| </li> |
| <li> |
| <p>OSX is now supported for single-host development. Please consult its specific installation |
| instructions in <a href="installation.html#osx_from_source">OS X</a>.</p> |
| </li> |
| </ul> |
| </div> |
| </div> |
| </div> |
| <div class="sect1"> |
| <h2 id="rn_0.5.0"><a class="link" href="#rn_0.5.0">Release Notes Specific to 0.5.0</a></h2> |
| <div class="sectionbody"> |
| <div class="paragraph"> |
| <p>Kudu 0.5.0 was the first public release. As such, no improvements or changes were |
| noted in its release notes.</p> |
| </div> |
| </div> |
| </div> |
| </div> |
| <div class="col-md-3"> |
| |
| <div id="toc" data-spy="affix" data-offset-top="70"> |
| <ul> |
| |
| <li> |
| |
| <a href="index.html">Introducing Kudu</a> |
| </li> |
| <li> |
| |
| <a href="release_notes.html">Kudu Release Notes</a> |
| </li> |
| <li> |
| |
| <a href="quickstart.html">Getting Started with Kudu</a> |
| </li> |
| <li> |
| |
| <a href="installation.html">Installation Guide</a> |
| </li> |
| <li> |
| |
| <a href="configuration.html">Configuring Kudu</a> |
| </li> |
| <li> |
| |
| <a href="kudu_impala_integration.html">Using Impala with Kudu</a> |
| </li> |
| <li> |
| |
| <a href="administration.html">Administering Kudu</a> |
| </li> |
| <li> |
| |
| <a href="troubleshooting.html">Troubleshooting Kudu</a> |
| </li> |
| <li> |
| |
| <a href="developing.html">Developing Applications with Kudu</a> |
| </li> |
| <li> |
| |
| <a href="schema_design.html">Kudu Schema Design</a> |
| </li> |
| <li> |
| |
| <a href="transaction_semantics.html">Kudu Transaction Semantics</a> |
| </li> |
| <li> |
| |
| <a href="contributing.html">Contributing to Kudu</a> |
| </li> |
| <li> |
| |
| <a href="style_guide.html">Kudu Documentation Style Guide</a> |
| </li> |
| <li> |
| |
| <a href="configuration_reference.html">Kudu Configuration Reference</a> |
| </li> |
| <li> |
| |
| <a href="known_issues.html">Known Issues and Limitations</a> |
| </li> |
| <li> |
| |
| <a href="export_control.html">Export Control Notice</a> |
| </li> |
| </ul> |
| </div> |
| </div> |
| </div> |
| </div> |
| <footer class="footer"> |
| <div class="row"> |
| <div class="col-md-9"> |
| <p class="small"> |
| Copyright © 2020 The Apache Software Foundation. Last updated 2017-01-12 12:48:06 PST |
| </p> |
| <p class="small"> |
| Apache Kudu, Kudu, Apache, the Apache feather logo, and the Apache Kudu |
| project logo are either registered trademarks or trademarks of The |
| Apache Software Foundation in the United States and other countries. |
| </p> |
| </div> |
| <div class="col-md-3"> |
| <a class="pull-right" href="https://www.apache.org/events/current-event.html"> |
| <img src="https://www.apache.org/events/current-event-234x60.png"/> |
| </a> |
| </div> |
| </div> |
| </footer> |
| </div> |
| <script src="https://cdnjs.cloudflare.com/ajax/libs/jquery/1.11.3/jquery.min.js"></script> |
| <script> |
| // Try to detect touch-screen devices. Note: Many laptops have touch screens. |
| $(document).ready(function() { |
| if ("ontouchstart" in document.documentElement) { |
| $(document.documentElement).addClass("touch"); |
| } else { |
| $(document.documentElement).addClass("no-touch"); |
| } |
| }); |
| </script> |
| <script src="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.6/js/bootstrap.min.js" |
| integrity="sha384-0mSbJDEHialfmuBBQP6A4Qrprq5OVfW37PRR3j5ELqxss1yVqOtnepnHVP9aJ7xS" |
| crossorigin="anonymous"></script> |
| <script> |
| (function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){ |
| (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o), |
| m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m) |
| })(window,document,'script','//www.google-analytics.com/analytics.js','ga'); |
| |
| ga('create', 'UA-68448017-1', 'auto'); |
| ga('send', 'pageview'); |
| </script> |
| <script src="https://cdnjs.cloudflare.com/ajax/libs/anchor-js/3.1.0/anchor.js"></script> |
| <script> |
| anchors.options = { |
| placement: 'right', |
| visible: 'touch', |
| }; |
| anchors.add(); |
| </script> |
| </body> |
| </html> |
| |