<!-- blob: 0c072f84afafc79c1379b7ee879936cc39753a24 [file] [log] [blame] -->
<!DOCTYPE html>
<html lang="en">
<head>
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1.0">
<title>
Spark Release 3.0.1 | Apache Spark
</title>
<link href="https://cdn.jsdelivr.net/npm/bootstrap@5.0.2/dist/css/bootstrap.min.css" rel="stylesheet"
integrity="sha384-EVSTQN3/azprG1Anm3QDgpJLIm9Nao0Yz1ztcQTwFspd3yD65VohhpuuCOmLASjC" crossorigin="anonymous">
<link rel="preconnect" href="https://fonts.googleapis.com">
<link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
<!-- Google Fonts CSS2 request: each font family needs its own "family=" parameter, and "&" is written as "&amp;" inside an attribute value. -->
<link href="https://fonts.googleapis.com/css2?family=DM+Sans:ital,wght@0,400;0,500;0,700;1,400;1,500;1,700&amp;family=Courier+Prime:wght@400;700&amp;display=swap" rel="stylesheet">
<link href="/css/custom.css" rel="stylesheet">
<!-- Code highlighter CSS -->
<link href="/css/pygments-default.css" rel="stylesheet">
<link rel="icon" href="/favicon.ico" type="image/x-icon">
<!-- Matomo -->
<script>
// Matomo command queue: reuse window._paq if it already exists, otherwise start with an empty array.
var _paq = window._paq = window._paq || [];
/* tracker methods like "setCustomDimension" should be called before "trackPageView" */
_paq.push(["disableCookies"]);
_paq.push(['trackPageView']);
_paq.push(['enableLinkTracking']);
(function() {
  var baseUrl = "https://analytics.apache.org/";
  _paq.push(['setTrackerUrl', baseUrl + 'matomo.php']);
  _paq.push(['setSiteId', '40']);

  // Build an async <script> for matomo.js and insert it ahead of the first script element in the document.
  var loader = document.createElement('script');
  var firstScript = document.getElementsByTagName('script')[0];
  loader.async = true;
  loader.src = baseUrl + 'matomo.js';
  firstScript.parentNode.insertBefore(loader, firstScript);
})();
</script>
<!-- End Matomo Code -->
</head>
<body class="global">
<nav class="navbar navbar-expand-lg navbar-dark p-0 px-4" style="background: #1D6890;">
<!-- The logo is the only content of this link, so its alt text provides the link's accessible name. -->
<a class="navbar-brand" href="/">
<img src="/images/spark-logo-rev.svg" alt="Apache Spark" width="141" height="72">
</a>
<button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbarContent"
aria-controls="navbarContent" aria-expanded="false" aria-label="Toggle navigation">
<span class="navbar-toggler-icon"></span>
</button>
<div class="collapse navbar-collapse col-md-12 col-lg-auto pt-4" id="navbarContent">
<ul class="navbar-nav me-auto">
<li class="nav-item">
<!-- No aria-current here: this link targets /downloads.html, which is not the page being displayed. -->
<a class="nav-link active" href="/downloads.html">Download</a>
</li>
<li class="nav-item dropdown">
<a class="nav-link dropdown-toggle" href="#" id="libraries" role="button" data-bs-toggle="dropdown"
aria-expanded="false">
Libraries
</a>
<ul class="dropdown-menu" aria-labelledby="libraries">
<li><a class="dropdown-item" href="/sql/">SQL and DataFrames</a></li>
<li><a class="dropdown-item" href="/spark-connect/">Spark Connect</a></li>
<li><a class="dropdown-item" href="/streaming/">Spark Streaming</a></li>
<li><a class="dropdown-item" href="/mllib/">MLlib (machine learning)</a></li>
<li><a class="dropdown-item" href="/graphx/">GraphX (graph)</a></li>
<li>
<hr class="dropdown-divider">
</li>
<li><a class="dropdown-item" href="/third-party-projects.html">Third-Party Projects</a></li>
</ul>
</li>
<li class="nav-item dropdown">
<a class="nav-link dropdown-toggle" href="#" id="documentation" role="button" data-bs-toggle="dropdown"
aria-expanded="false">
Documentation
</a>
<ul class="dropdown-menu" aria-labelledby="documentation">
<li><a class="dropdown-item" href="/docs/latest/">Latest Release</a></li>
<li><a class="dropdown-item" href="/documentation.html">Older Versions and Other Resources</a></li>
<li><a class="dropdown-item" href="/faq.html">Frequently Asked Questions</a></li>
</ul>
</li>
<li class="nav-item">
<!-- No aria-current here: this link targets /examples.html, which is not the page being displayed. -->
<a class="nav-link active" href="/examples.html">Examples</a>
</li>
<li class="nav-item dropdown">
<a class="nav-link dropdown-toggle" href="#" id="community" role="button" data-bs-toggle="dropdown"
aria-expanded="false">
Community
</a>
<ul class="dropdown-menu" aria-labelledby="community">
<li><a class="dropdown-item" href="/community.html">Mailing Lists &amp; Resources</a></li>
<li><a class="dropdown-item" href="/contributing.html">Contributing to Spark</a></li>
<li><a class="dropdown-item" href="/improvement-proposals.html">Improvement Proposals (SPIP)</a>
</li>
<li><a class="dropdown-item" href="https://issues.apache.org/jira/browse/SPARK">Issue Tracker</a>
</li>
<li><a class="dropdown-item" href="/powered-by.html">Powered By</a></li>
<li><a class="dropdown-item" href="/committers.html">Project Committers</a></li>
<li><a class="dropdown-item" href="/history.html">Project History</a></li>
</ul>
</li>
<li class="nav-item dropdown">
<a class="nav-link dropdown-toggle" href="#" id="developers" role="button" data-bs-toggle="dropdown"
aria-expanded="false">
Developers
</a>
<ul class="dropdown-menu" aria-labelledby="developers">
<li><a class="dropdown-item" href="/developer-tools.html">Useful Developer Tools</a></li>
<li><a class="dropdown-item" href="/versioning-policy.html">Versioning Policy</a></li>
<li><a class="dropdown-item" href="/release-process.html">Release Process</a></li>
<li><a class="dropdown-item" href="/security.html">Security</a></li>
</ul>
</li>
</ul>
<!-- Right-hand navbar menu. Uses the Bootstrap 5 utility name "ms-auto" (Bootstrap 4's "ml-auto" no longer exists in the 5.x stylesheet loaded by this page). -->
<ul class="navbar-nav ms-auto">
<li class="nav-item dropdown">
<a class="nav-link dropdown-toggle" href="#" id="apacheFoundation" role="button"
data-bs-toggle="dropdown" aria-expanded="false">
Apache Software Foundation
</a>
<ul class="dropdown-menu" aria-labelledby="apacheFoundation">
<li><a class="dropdown-item" href="https://www.apache.org/">Apache Homepage</a></li>
<li><a class="dropdown-item" href="https://www.apache.org/licenses/">License</a></li>
<li><a class="dropdown-item"
href="https://www.apache.org/foundation/sponsorship.html">Sponsorship</a></li>
<li><a class="dropdown-item" href="https://www.apache.org/foundation/thanks.html">Thanks</a></li>
<li><a class="dropdown-item" href="https://www.apache.org/security/">Security</a></li>
<li><a class="dropdown-item" href="https://www.apache.org/events/current-event">Event</a></li>
</ul>
</li>
</ul>
</div>
</nav>
<div class="container">
<div class="row mt-4">
<div class="col-12 col-md-9">
<h2>Spark Release 3.0.1</h2>
<p>Spark 3.0.1 is a maintenance release containing stability fixes. This release is based on the branch-3.0 maintenance branch of Spark. We strongly recommend that all 3.0 users upgrade to this stable release.</p>
<h3 id="notable-changes">Notable changes</h3>
<ul>
<li><a href="https://issues.apache.org/jira/browse/SPARK-26905">[SPARK-26905]</a>: Revisit reserved/non-reserved keywords based on the ANSI SQL standard</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-31220">[SPARK-31220]</a>: repartition obeys spark.sql.adaptive.coalescePartitions.initialPartitionNum when spark.sql.adaptive.enabled</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-31703">[SPARK-31703]</a>: Changes made by SPARK-26985 break reading parquet files correctly in BigEndian architectures (AIX + LinuxPPC64)</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-31915">[SPARK-31915]</a>: Resolve the grouping column properly per the case sensitivity in grouped and cogrouped pandas UDFs</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-31923">[SPARK-31923]</a>: Event log cannot be generated when some internal accumulators use unexpected types</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-31935">[SPARK-31935]</a>: Hadoop file system config should be effective in data source options</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-31968">[SPARK-31968]</a>: write.partitionBy() creates duplicate subdirectories when user provides duplicate columns</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-31983">[SPARK-31983]</a>: Tables of structured streaming tab show wrong result for duration column</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-31990">[SPARK-31990]</a>: Streaming&#8217;s state store compatibility is broken</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32003">[SPARK-32003]</a>: Shuffle files for lost executor are not unregistered if fetch failure occurs after executor is lost</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32038">[SPARK-32038]</a>: Regression in handling NaN values in COUNT(DISTINCT)</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32073">[SPARK-32073]</a>: Drop R &lt; 3.5 support</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32092">[SPARK-32092]</a>: CrossvalidatorModel does not save all submodels (it saves only 3)</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32136">[SPARK-32136]</a>: Spark producing incorrect groupBy results when key is a struct with nullable properties</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32148">[SPARK-32148]</a>: LEFT JOIN generating non-deterministic and unexpected result (regression in Spark 3.0)</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32220">[SPARK-32220]</a>: Cartesian Product Hint cause data error</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32310">[SPARK-32310]</a>: ML params default value parity</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32339">[SPARK-32339]</a>: Improve MLlib BLAS native acceleration docs</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32424">[SPARK-32424]</a>: Fix silent data change for timestamp parsing if overflow happens</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32451">[SPARK-32451]</a>: Support Apache Arrow 1.0.0 in SparkR</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32456">[SPARK-32456]</a>: Check the Distinct by assuming it as Aggregate for Structured Streaming</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32608">[SPARK-32608]</a>: Script Transform DELIMIT value should be formatted</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32646">[SPARK-32646]</a>: ORC predicate pushdown should work with case-insensitive analysis</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32658">[SPARK-32658]</a>: Partition length number overflow in PartitionWriterStream</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32676">[SPARK-32676]</a>: Fix double caching in KMeans/BiKMeans</li>
</ul>
<h3 id="known-issues">Known issues</h3>
<ul>
<li><a href="https://issues.apache.org/jira/browse/SPARK-31511">[SPARK-31511]</a>: Make BytesToBytesMap iterator() thread-safe. This will be fixed in Spark 3.0.2.</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32779">[SPARK-32779]</a>: Spark/Hive3 interaction potentially causes deadlock. This will be fixed in Spark 3.0.2.</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32788">[SPARK-32788]</a>: non-partitioned table scan should not have partition filter. This will be fixed in Spark 3.0.2.</li>
<li><a href="https://issues.apache.org/jira/browse/SPARK-32810">[SPARK-32810]</a>: CSV/JSON data sources should avoid globbing paths when inferring schema. This will be fixed in Spark 3.0.2.</li>
</ul>
<p>You can consult JIRA for the <a href="https://s.apache.org/spark-3.0.1">detailed changes</a>.</p>
<p>We would like to acknowledge all community members for contributing patches to this release.</p>
<p>
<br/>
<a href="/news/">Spark News Archive</a>
</p>
</div>
<div class="col-12 col-md-3">
<div class="news" style="margin-bottom: 20px;">
<h5>Latest News</h5>
<ul class="list-unstyled">
<li><a href="/news/spark-3-5-1-released.html">Spark 3.5.1 released</a>
<span class="small">(Feb 23, 2024)</span></li>
<li><a href="/news/spark-3-3-4-released.html">Spark 3.3.4 released</a>
<span class="small">(Dec 16, 2023)</span></li>
<li><a href="/news/spark-3-4-2-released.html">Spark 3.4.2 released</a>
<span class="small">(Nov 30, 2023)</span></li>
<li><a href="/news/spark-3-5-0-released.html">Spark 3.5.0 released</a>
<span class="small">(Sep 13, 2023)</span></li>
</ul>
<p class="small" style="text-align: right;"><a href="/news/index.html">Archive</a></p>
</div>
<!-- Sidebar banner linking to the current Apache event page. -->
<div style="text-align:center; margin-bottom: 20px;">
<a href="https://www.apache.org/events/current-event.html">
<!-- The image is the link's only content, so the alt text doubles as the link's accessible name. -->
<img src="https://www.apache.org/events/current-event-234x60.png" alt="Current Apache Software Foundation event" style="max-width: 100%;">
</a>
</div>
<div class="hidden-xs hidden-sm">
<a href="/downloads.html" class="btn btn-cta btn-lg d-grid" style="margin-bottom: 30px;">
Download Spark
</a>
<p style="font-size: 16px; font-weight: 500; color: #555;">
Built-in Libraries:
</p>
<ul class="list-none">
<li><a href="/sql/">SQL and DataFrames</a></li>
<li><a href="/streaming/">Spark Streaming</a></li>
<li><a href="/mllib/">MLlib (machine learning)</a></li>
<li><a href="/graphx/">GraphX (graph)</a></li>
</ul>
<a href="/third-party-projects.html">Third-Party Projects</a>
</div>
</div>
</div>
<footer class="small">
<hr>
Apache Spark, Spark, Apache, the Apache feather logo, and the Apache Spark project logo are either registered
trademarks or trademarks of The Apache Software Foundation in the United States and other countries.
See guidance on use of Apache Spark <a href="/trademarks.html">trademarks</a>.
All other marks mentioned may be trademarks or registered trademarks of their respective owners.
Copyright &copy; 2018 The Apache Software Foundation, Licensed under the
<a href="https://www.apache.org/licenses/">Apache License, Version 2.0</a>.
</footer>
</div>
<!-- Page scripts, loaded at the end of the body: the Bootstrap bundle (pinned to 5.0.2 with an integrity hash), then jQuery, then two site-local scripts. -->
<script src="https://cdn.jsdelivr.net/npm/bootstrap@5.0.2/dist/js/bootstrap.bundle.min.js"
integrity="sha384-MrcW6ZMFYlzcLA8Nl+NtUVF0sA7MsXsP1UyJoMp4YLEuNSfAP+JcXn/tWtIaxVXM"
crossorigin="anonymous"></script>
<!-- NOTE(review): this jQuery URL carries no version number and no integrity/crossorigin attributes, unlike the Bootstrap bundle; consider pinning a specific release with SRI after confirming which version the local scripts expect. -->
<script src="https://code.jquery.com/jquery.js"></script>
<!-- Site-local scripts; presumably they depend on jQuery being loaded first (TODO confirm). -->
<script src="/js/lang-tabs.js"></script>
<script src="/js/downloads.js"></script>
</body>
</html>