blob: aacc5f443a8f66d41fa22ac96dd67255a6a2fa32 [file] [log] [blame]
<!DOCTYPE html>
<html lang="en">
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<meta name="viewport" content="width=device-width, initial-scale=1.0">
<title>Spark Release 1.0.2 | Apache Spark</title>
<link href="" rel="stylesheet"
integrity="sha384-EVSTQN3/azprG1Anm3QDgpJLIm9Nao0Yz1ztcQTwFspd3yD65VohhpuuCOmLASjC" crossorigin="anonymous">
<link rel="preconnect" href="">
<link rel="preconnect" href="" crossorigin>
<link href=",wght@0,400;0,500;0,700;1,400;1,500;1,700&Courier+Prime:wght@400;700&display=swap" rel="stylesheet">
<link href="/css/custom.css" rel="stylesheet">
<!-- Code highlighter CSS -->
<link href="/css/pygments-default.css" rel="stylesheet">
<link rel="icon" href="/favicon.ico" type="image/x-icon">
<!-- Matomo -->
<script>
var _paq = window._paq = window._paq || [];
/* tracker methods like "setCustomDimension" should be called before "trackPageView" */
(function() {
var u="";
_paq.push(['setTrackerUrl', u+'matomo.php']);
_paq.push(['setSiteId', '40']);
var d=document, g=d.createElement('script'), s=d.getElementsByTagName('script')[0];
g.async=true; g.src=u+'matomo.js'; s.parentNode.insertBefore(g,s);
})();
</script>
<!-- End Matomo Code -->
<body class="global">
<nav class="navbar navbar-expand-lg navbar-dark p-0 px-4" style="background: #1D6890;">
<a class="navbar-brand" href="/">
<img src="/images/spark-logo-rev.svg" alt="" width="141" height="72">
<button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbarContent"
aria-controls="navbarContent" aria-expanded="false" aria-label="Toggle navigation">
<span class="navbar-toggler-icon"></span>
<div class="collapse navbar-collapse col-md-12 col-lg-auto pt-4" id="navbarContent">
<ul class="navbar-nav me-auto">
<li class="nav-item">
<a class="nav-link active" aria-current="page" href="/downloads.html">Download</a>
<li class="nav-item dropdown">
<a class="nav-link dropdown-toggle" href="#" id="libraries" role="button" data-bs-toggle="dropdown"
aria-expanded="false">
Libraries
</a>
<ul class="dropdown-menu" aria-labelledby="libraries">
<li><a class="dropdown-item" href="/sql/">SQL and DataFrames</a></li>
<li><a class="dropdown-item" href="/spark-connect/">Spark Connect</a></li>
<li><a class="dropdown-item" href="/streaming/">Spark Streaming</a></li>
<li><a class="dropdown-item" href="/mllib/">MLlib (machine learning)</a></li>
<li><a class="dropdown-item" href="/graphx/">GraphX (graph)</a></li>
<hr class="dropdown-divider">
<li><a class="dropdown-item" href="/third-party-projects.html">Third-Party Projects</a></li>
<li class="nav-item dropdown">
<a class="nav-link dropdown-toggle" href="#" id="documentation" role="button" data-bs-toggle="dropdown"
aria-expanded="false">
Documentation
</a>
<ul class="dropdown-menu" aria-labelledby="documentation">
<li><a class="dropdown-item" href="/docs/latest/">Latest Release</a></li>
<li><a class="dropdown-item" href="/documentation.html">Older Versions and Other Resources</a></li>
<li><a class="dropdown-item" href="/faq.html">Frequently Asked Questions</a></li>
<li class="nav-item">
<a class="nav-link active" aria-current="page" href="/examples.html">Examples</a>
<li class="nav-item dropdown">
<a class="nav-link dropdown-toggle" href="#" id="community" role="button" data-bs-toggle="dropdown"
aria-expanded="false">
Community
</a>
<ul class="dropdown-menu" aria-labelledby="community">
<li><a class="dropdown-item" href="/community.html">Mailing Lists &amp; Resources</a></li>
<li><a class="dropdown-item" href="/contributing.html">Contributing to Spark</a></li>
<li><a class="dropdown-item" href="/improvement-proposals.html">Improvement Proposals (SPIP)</a>
<li><a class="dropdown-item" href="">Issue Tracker</a>
<li><a class="dropdown-item" href="/powered-by.html">Powered By</a></li>
<li><a class="dropdown-item" href="/committers.html">Project Committers</a></li>
<li><a class="dropdown-item" href="/history.html">Project History</a></li>
<li class="nav-item dropdown">
<a class="nav-link dropdown-toggle" href="#" id="developers" role="button" data-bs-toggle="dropdown"
aria-expanded="false">
Developers
</a>
<ul class="dropdown-menu" aria-labelledby="developers">
<li><a class="dropdown-item" href="/developer-tools.html">Useful Developer Tools</a></li>
<li><a class="dropdown-item" href="/versioning-policy.html">Versioning Policy</a></li>
<li><a class="dropdown-item" href="/release-process.html">Release Process</a></li>
<li><a class="dropdown-item" href="/security.html">Security</a></li>
<ul class="navbar-nav ml-auto">
<li class="nav-item dropdown">
<a class="nav-link dropdown-toggle" href="#" id="apacheFoundation" role="button"
data-bs-toggle="dropdown" aria-expanded="false">
Apache Software Foundation
<ul class="dropdown-menu" aria-labelledby="apacheFoundation">
<li><a class="dropdown-item" href="">Apache Homepage</a></li>
<li><a class="dropdown-item" href="">License</a></li>
<li><a class="dropdown-item" href="">Sponsorship</a></li>
<li><a class="dropdown-item" href="">Thanks</a></li>
<li><a class="dropdown-item" href="">Security</a></li>
<li><a class="dropdown-item" href="">Event</a></li>
<div class="container">
<div class="row mt-4">
<div class="col-12 col-md-9">
<h2>Spark Release 1.0.2</h2>
<p>Spark 1.0.2 is a maintenance release with bug fixes. This release is based on the <a href="">branch-1.0</a> maintenance branch of Spark. We recommend that all 1.0.x users upgrade to this stable release. Contributions to this release came from 30 developers.</p>
<p>You can download Spark 1.0.2 as either a
<a href="" onclick="trackOutboundLink(this, 'Release Download Links', 'cloudfront_spark-1.0.2.tgz'); return false;">source package</a>
(6 MB tgz) or a prebuilt package for
<a href="" onclick="trackOutboundLink(this, 'Release Download Links', 'cloudfront_spark-1.0.2-bin-hadoop1.tgz'); return false;">Hadoop 1 / CDH3</a> (156 MB tgz),
<a href="" onclick="trackOutboundLink(this, 'Release Download Links', 'cloudfront_spark-1.0.2-bin-cdh4.tgz'); return false;">CDH4</a> (161 MB tgz), or
<a href="" onclick="trackOutboundLink(this, 'Release Download Links', 'cloudfront_spark-1.0.2-bin-hadoop2.tgz'); return false;">Hadoop 2 / CDH5 / HDP2</a>
(168 MB tgz). Release signatures and checksums are available at the official <a href="">Apache download site</a>.</p>
<h3 id="fixes">Fixes</h3>
<p>Spark 1.0.2 contains bug fixes in several components. Some of the more important fixes are highlighted below. You can visit the <a href="">Spark issue tracker</a> for the full list of fixes.</p>
<h4 id="spark-core">Spark Core</h4>
<li>Avoid pulling in the entire RDD or PairRDDFunctions in various operators (<a href="">SPARK-2534</a>)</li>
<li>RangePartitioner&#8217;s binary search does not use the given Ordering (<a href="">SPARK-2598</a>)</li>
<li>Exception in accumulator update should not crash DAGScheduler and SparkContext (<a href="">SPARK-2323</a>)</li>
<h4 id="sql">SQL</h4>
<li>Slave node throws NoClassDefFoundError $line11.$read$ when executing a Spark SQL query on HDFS CSV file (<a href="">SPARK-2576</a>)</li>
<li>Concurrent initialization of various DataType objects causes exceptions (<a href="">SPARK-2498</a>)</li>
<li>Multiple instances of an InMemoryRelation in a single plan result in recaching (<a href="">SPARK-2405</a>)</li>
<h4 id="pyspark">PySpark</h4>
<li>Make hash of None consistent across machines (<a href="">SPARK-2494</a>)</li>
<h4 id="mllib">MLlib</h4>
<li>mutable.BitSet in ALS not serializable with KryoSerializer (<a href="">SPARK-1977</a>)</li>
<li>Fix bin offset in DecisionTree node aggregations (<a href="">SPARK-2152</a>)</li>
<h4 id="streaming">Streaming</h4>
<li>Ability to limit the Receiver data rate to prevent overloading of data and Spark crash (<a href="">SPARK-1341</a>)</li>
<li>File stream processes existing files in a directory even if newFilesOnly = true (<a href="">SPARK-2362</a>)</li>
<li>QueueInputDStream with oneAtATime=false does not dequeue items (<a href="">SPARK-2343</a>)</li>
<h4 id="graphx">GraphX</h4>
<li>VertexPartition is not serializable (<a href="">SPARK-2455</a>)</li>
<h3 id="contributors">Contributors</h3>
<p>The following developers contributed to this release:</p>
<li>Aaron Davidson - Bug fixes in core</li>
<li>Aaron Staple - Bug fix in SQL</li>
<li>Andrew Or - Bug fix in core</li>
<li>Ankur Dave - Bug fix in GraphX</li>
<li>Artjom-Metro - Bug fix in examples</li>
<li>Basit Mustafa - Added t2 EC2 instance support</li>
<li>Cesar Arevalo - Doc fix</li>
<li>Cheng Hao - Bug fix in SQL</li>
<li>Daniel Darabos - Bug fix in core</li>
<li>Davies Liu - Bug fix in PySpark</li>
<li>Gabriele Nizzoli - Bug fix in Streaming</li>
<li>Hossein - Bug fix in core</li>
<li>Issac Buenrostro - Added support for throttling Streaming receiver</li>
<li>Manuel Laflamme - Bug fix in Streaming</li>
<li>Michael Armbrust - Bug fix and performance improvements in SQL</li>
<li>Neville Li - Bug fix in MLlib</li>
<li>Patrick Wendell - Bug fixes in core</li>
<li>Reynold Xin - Bug fixes in core and SQL</li>
<li>Sarah Gerweck - Bug fix in core</li>
<li>Takuya UESHIN - Bug fixes in SQL</li>
<li>Tathagata Das - Bug fix in Streaming</li>
<li>William Benton - Bug fix in SQL</li>
<li>Yin Huai - Bug fixes in SQL</li>
<li>Zongheng Yang - Bug fixes in SQL</li>
<li>baishuo(白硕) - Bug fix in SQL</li>
<li>johnnywalleye - Bug fixes in MLlib</li>
<li>joyyoj - Bug fix in Streaming</li>
<li>kballou - Doc fix</li>
<li>lianhuiwang - Doc fix</li>
<li>witgo - Bug fix in sbt</li>
<p><em>Thanks to everyone who contributed!</em></p>
<a href="/news/">Spark News Archive</a>
<div class="col-12 col-md-3">
<div class="news" style="margin-bottom: 20px;">
<h5>Latest News</h5>
<ul class="list-unstyled">
<li><a href="/news/spark-3-5-1-released.html">Spark 3.5.1 released</a>
<span class="small">(Feb 23, 2024)</span></li>
<li><a href="/news/spark-3-3-4-released.html">Spark 3.3.4 released</a>
<span class="small">(Dec 16, 2023)</span></li>
<li><a href="/news/spark-3-4-2-released.html">Spark 3.4.2 released</a>
<span class="small">(Nov 30, 2023)</span></li>
<li><a href="/news/spark-3-5-0-released.html">Spark 3.5.0 released</a>
<span class="small">(Sep 13, 2023)</span></li>
<p class="small" style="text-align: right;"><a href="/news/index.html">Archive</a></p>
<div style="text-align:center; margin-bottom: 20px;">
<a href="">
<img src="" style="max-width: 100%;"/>
<div class="hidden-xs hidden-sm">
<a href="/downloads.html" class="btn btn-cta btn-lg d-grid" style="margin-bottom: 30px;">
Download Spark
<p style="font-size: 16px; font-weight: 500; color: #555;">
Built-in Libraries:
<ul class="list-none">
<li><a href="/sql/">SQL and DataFrames</a></li>
<li><a href="/streaming/">Spark Streaming</a></li>
<li><a href="/mllib/">MLlib (machine learning)</a></li>
<li><a href="/graphx/">GraphX (graph)</a></li>
<a href="/third-party-projects.html">Third-Party Projects</a>
<footer class="small">
Apache Spark, Spark, Apache, the Apache feather logo, and the Apache Spark project logo are either registered
trademarks or trademarks of The Apache Software Foundation in the United States and other countries.
See guidance on use of Apache Spark <a href="/trademarks.html">trademarks</a>.
All other marks mentioned may be trademarks or registered trademarks of their respective owners.
Copyright &copy; 2018 The Apache Software Foundation, Licensed under the
<a href="">Apache License, Version 2.0</a>.
<script src=""></script>
<script src=""></script>
<script src="/js/lang-tabs.js"></script>
<script src="/js/downloads.js"></script>