<!-- blob: 0b0502bcd64afc748f8c6fdde4704612bc617826 [file] [log] [blame] -->
<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
<!-- NewPage -->
<html lang="en">
<head>
<!-- Generated by javadoc (1.8.0_65) on Wed Apr 20 18:03:36 PDT 2016 -->
<title>ChunkRecordReader</title>
<meta name="date" content="2016-04-20">
<link rel="stylesheet" type="text/css" href="../../../../../../stylesheet.css" title="Style">
<script type="text/javascript" src="../../../../../../script.js"></script>
</head>
<body>
<script type="text/javascript"><!--
try {
if (location.href.indexOf('is-external=true') == -1) {
parent.document.title="ChunkRecordReader";
}
}
catch(err) {
}
//-->
var methods = {"i0":10,"i1":10,"i2":10,"i3":10,"i4":10,"i5":10,"i6":10};
var tabs = {65535:["t0","All Methods"],2:["t2","Instance Methods"],8:["t4","Concrete Methods"]};
var altColor = "altColor";
var rowColor = "rowColor";
var tableTab = "tableTab";
var activeTableTab = "activeTableTab";
</script>
<noscript>
<div>JavaScript is disabled in your browser.</div>
</noscript>
<!-- ========= START OF TOP NAVBAR ======= -->
<div class="topNav"><a name="navbar.top">
<!-- -->
</a>
<div class="skipNav"><a href="#skip.navbar.top" title="Skip navigation links">Skip navigation links</a></div>
<a name="navbar.top.firstrow">
<!-- -->
</a>
<ul class="navList" title="Navigation">
<li><a href="../../../../../../overview-summary.html">Overview</a></li>
<li><a href="package-summary.html">Package</a></li>
<li class="navBarCell1Rev">Class</li>
<li><a href="package-tree.html">Tree</a></li>
<li><a href="../../../../../../deprecated-list.html">Deprecated</a></li>
<li><a href="../../../../../../index-all.html">Index</a></li>
<li><a href="../../../../../../help-doc.html">Help</a></li>
</ul>
</div>
<div class="subNav">
<ul class="navList">
<li><a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkReader.html" title="class in org.apache.hawq.pxf.plugins.hdfs"><span class="typeNameLink">Prev&nbsp;Class</span></a></li>
<li><a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkWritable.html" title="class in org.apache.hawq.pxf.plugins.hdfs"><span class="typeNameLink">Next&nbsp;Class</span></a></li>
</ul>
<ul class="navList">
<li><a href="../../../../../../index.html?org/apache/hawq/pxf/plugins/hdfs/ChunkRecordReader.html" target="_top">Frames</a></li>
<li><a href="ChunkRecordReader.html" target="_top">No&nbsp;Frames</a></li>
</ul>
<ul class="navList" id="allclasses_navbar_top">
<li><a href="../../../../../../allclasses-noframe.html">All&nbsp;Classes</a></li>
</ul>
<div>
<script type="text/javascript"><!--
allClassesLink = document.getElementById("allclasses_navbar_top");
if(window==top) {
allClassesLink.style.display = "block";
}
else {
allClassesLink.style.display = "none";
}
//-->
</script>
</div>
<div>
<ul class="subNavList">
<li>Summary:&nbsp;</li>
<li>Nested&nbsp;|&nbsp;</li>
<li>Field&nbsp;|&nbsp;</li>
<li><a href="#constructor.summary">Constr</a>&nbsp;|&nbsp;</li>
<li><a href="#method.summary">Method</a></li>
</ul>
<ul class="subNavList">
<li>Detail:&nbsp;</li>
<li>Field&nbsp;|&nbsp;</li>
<li><a href="#constructor.detail">Constr</a>&nbsp;|&nbsp;</li>
<li><a href="#method.detail">Method</a></li>
</ul>
</div>
<a name="skip.navbar.top">
<!-- -->
</a></div>
<!-- ========= END OF TOP NAVBAR ========= -->
<!-- ======== START OF CLASS DATA ======== -->
<div class="header">
<div class="subTitle">org.apache.hawq.pxf.plugins.hdfs</div>
<h2 title="Class ChunkRecordReader" class="title">Class ChunkRecordReader</h2>
</div>
<div class="contentContainer">
<ul class="inheritance">
<li>java.lang.Object</li>
<li>
<ul class="inheritance">
<li>org.apache.hawq.pxf.plugins.hdfs.ChunkRecordReader</li>
</ul>
</li>
</ul>
<div class="description">
<ul class="blockList">
<li class="blockList">
<dl>
<dt>All Implemented Interfaces:</dt>
<dd>org.apache.hadoop.mapred.RecordReader&lt;org.apache.hadoop.io.LongWritable,<a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkWritable.html" title="class in org.apache.hawq.pxf.plugins.hdfs">ChunkWritable</a>&gt;</dd>
</dl>
<hr>
<br>
<pre>public class <span class="typeNameLabel">ChunkRecordReader</span>
extends java.lang.Object
implements org.apache.hadoop.mapred.RecordReader&lt;org.apache.hadoop.io.LongWritable,<a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkWritable.html" title="class in org.apache.hawq.pxf.plugins.hdfs">ChunkWritable</a>&gt;</pre>
<div class="block">ChunkRecordReader is designed for fast reading of a file split. The idea is
to fetch chunks of data instead of single records. Each chunk contains many
records, and the end of a chunk is not aligned on a record boundary. The chunk
size is a hardcoded class parameter, CHUNK_SIZE. This behaviour sets this
reader apart from other readers, which fetch one record and stop when
reaching a record delimiter.</div>
</li>
</ul>
</div>
<div class="summary">
<ul class="blockList">
<li class="blockList">
<!-- ======== CONSTRUCTOR SUMMARY ======== -->
<ul class="blockList">
<li class="blockList"><a name="constructor.summary">
<!-- -->
</a>
<h3>Constructor Summary</h3>
<table class="memberSummary" border="0" cellpadding="3" cellspacing="0" summary="Constructor Summary table, listing constructors, and an explanation">
<caption><span>Constructors</span><span class="tabEnd">&nbsp;</span></caption>
<tr>
<th class="colOne" scope="col">Constructor and Description</th>
</tr>
<tr class="altColor">
<td class="colOne"><code><span class="memberNameLink"><a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkRecordReader.html#ChunkRecordReader-org.apache.hadoop.conf.Configuration-org.apache.hadoop.mapred.FileSplit-">ChunkRecordReader</a></span>(org.apache.hadoop.conf.Configuration&nbsp;job,
org.apache.hadoop.mapred.FileSplit&nbsp;split)</code>
<div class="block">Constructs a ChunkRecordReader instance.</div>
</td>
</tr>
</table>
</li>
</ul>
<!-- ========== METHOD SUMMARY =========== -->
<ul class="blockList">
<li class="blockList"><a name="method.summary">
<!-- -->
</a>
<h3>Method Summary</h3>
<table class="memberSummary" border="0" cellpadding="3" cellspacing="0" summary="Method Summary table, listing methods, and an explanation">
<caption><span id="t0" class="activeTableTab"><span>All Methods</span><span class="tabEnd">&nbsp;</span></span><span id="t2" class="tableTab"><span><a href="javascript:show(2);">Instance Methods</a></span><span class="tabEnd">&nbsp;</span></span><span id="t4" class="tableTab"><span><a href="javascript:show(8);">Concrete Methods</a></span><span class="tabEnd">&nbsp;</span></span></caption>
<tr>
<th class="colFirst" scope="col">Modifier and Type</th>
<th class="colLast" scope="col">Method and Description</th>
</tr>
<tr id="i0" class="altColor">
<td class="colFirst"><code>void</code></td>
<td class="colLast"><code><span class="memberNameLink"><a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkRecordReader.html#close--">close</a></span>()</code>
<div class="block">Closes the input stream.</div>
</td>
</tr>
<tr id="i1" class="rowColor">
<td class="colFirst"><code>org.apache.hadoop.io.LongWritable</code></td>
<td class="colLast"><code><span class="memberNameLink"><a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkRecordReader.html#createKey--">createKey</a></span>()</code>
<div class="block">Used by the client of this class to create the 'key' output parameter for
the next() method.</div>
</td>
</tr>
<tr id="i2" class="altColor">
<td class="colFirst"><code><a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkWritable.html" title="class in org.apache.hawq.pxf.plugins.hdfs">ChunkWritable</a></code></td>
<td class="colLast"><code><span class="memberNameLink"><a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkRecordReader.html#createValue--">createValue</a></span>()</code>
<div class="block">Used by the client of this class to create the 'value' output parameter
for the next() method.</div>
</td>
</tr>
<tr id="i3" class="rowColor">
<td class="colFirst"><code>long</code></td>
<td class="colLast"><code><span class="memberNameLink"><a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkRecordReader.html#getPos--">getPos</a></span>()</code>
<div class="block">Returns the position of the unread tail of the file.</div>
</td>
</tr>
<tr id="i4" class="altColor">
<td class="colFirst"><code>float</code></td>
<td class="colLast"><code><span class="memberNameLink"><a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkRecordReader.html#getProgress--">getProgress</a></span>()</code>
<div class="block">Gets the progress within the split.</div>
</td>
</tr>
<tr id="i5" class="rowColor">
<td class="colFirst"><code>org.apache.hadoop.hdfs.DFSInputStream.ReadStatistics</code></td>
<td class="colLast"><code><span class="memberNameLink"><a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkRecordReader.html#getReadStatistics--">getReadStatistics</a></span>()</code>
<div class="block">Returns statistics of the input stream's read operation: total bytes
read, bytes read locally, bytes read in short-circuit (directly from file
descriptor).</div>
</td>
</tr>
<tr id="i6" class="altColor">
<td class="colFirst"><code>boolean</code></td>
<td class="colLast"><code><span class="memberNameLink"><a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkRecordReader.html#next-org.apache.hadoop.io.LongWritable-org.apache.hawq.pxf.plugins.hdfs.ChunkWritable-">next</a></span>(org.apache.hadoop.io.LongWritable&nbsp;key,
<a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkWritable.html" title="class in org.apache.hawq.pxf.plugins.hdfs">ChunkWritable</a>&nbsp;value)</code>
<div class="block">Fetches the next data chunk from the file split.</div>
</td>
</tr>
</table>
<ul class="blockList">
<li class="blockList"><a name="methods.inherited.from.class.java.lang.Object">
<!-- -->
</a>
<h3>Methods inherited from class&nbsp;java.lang.Object</h3>
<code>clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait</code></li>
</ul>
</li>
</ul>
</li>
</ul>
</div>
<div class="details">
<ul class="blockList">
<li class="blockList">
<!-- ========= CONSTRUCTOR DETAIL ======== -->
<ul class="blockList">
<li class="blockList"><a name="constructor.detail">
<!-- -->
</a>
<h3>Constructor Detail</h3>
<a name="ChunkRecordReader-org.apache.hadoop.conf.Configuration-org.apache.hadoop.mapred.FileSplit-">
<!-- -->
</a>
<ul class="blockListLast">
<li class="blockList">
<h4>ChunkRecordReader</h4>
<pre>public&nbsp;ChunkRecordReader(org.apache.hadoop.conf.Configuration&nbsp;job,
org.apache.hadoop.mapred.FileSplit&nbsp;split)
throws java.io.IOException</pre>
<div class="block">Constructs a ChunkRecordReader instance.</div>
<dl>
<dt><span class="paramLabel">Parameters:</span></dt>
<dd><code>job</code> - the job configuration</dd>
<dd><code>split</code> - contains the file name, the start byte of the split and its
length in bytes</dd>
<dt><span class="throwsLabel">Throws:</span></dt>
<dd><code>java.io.IOException</code> - if an I/O error occurs when accessing the file or
creating the input stream to read from it</dd>
</dl>
</li>
</ul>
</li>
</ul>
<!-- ============ METHOD DETAIL ========== -->
<ul class="blockList">
<li class="blockList"><a name="method.detail">
<!-- -->
</a>
<h3>Method Detail</h3>
<a name="getReadStatistics--">
<!-- -->
</a>
<ul class="blockList">
<li class="blockList">
<h4>getReadStatistics</h4>
<pre>public&nbsp;org.apache.hadoop.hdfs.DFSInputStream.ReadStatistics&nbsp;getReadStatistics()</pre>
<div class="block">Returns statistics of the input stream's read operation: total bytes
read, bytes read locally, bytes read in short-circuit (directly from file
descriptor).</div>
<dl>
<dt><span class="returnLabel">Returns:</span></dt>
<dd>an instance of ReadStatistics class</dd>
</dl>
</li>
</ul>
<a name="createKey--">
<!-- -->
</a>
<ul class="blockList">
<li class="blockList">
<h4>createKey</h4>
<pre>public&nbsp;org.apache.hadoop.io.LongWritable&nbsp;createKey()</pre>
<div class="block">Used by the client of this class to create the 'key' output parameter for
the next() method.</div>
<dl>
<dt><span class="overrideSpecifyLabel">Specified by:</span></dt>
<dd><code>createKey</code>&nbsp;in interface&nbsp;<code>org.apache.hadoop.mapred.RecordReader&lt;org.apache.hadoop.io.LongWritable,<a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkWritable.html" title="class in org.apache.hawq.pxf.plugins.hdfs">ChunkWritable</a>&gt;</code></dd>
<dt><span class="returnLabel">Returns:</span></dt>
<dd>an instance of LongWritable</dd>
</dl>
</li>
</ul>
<a name="createValue--">
<!-- -->
</a>
<ul class="blockList">
<li class="blockList">
<h4>createValue</h4>
<pre>public&nbsp;<a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkWritable.html" title="class in org.apache.hawq.pxf.plugins.hdfs">ChunkWritable</a>&nbsp;createValue()</pre>
<div class="block">Used by the client of this class to create the 'value' output parameter
for the next() method.</div>
<dl>
<dt><span class="overrideSpecifyLabel">Specified by:</span></dt>
<dd><code>createValue</code>&nbsp;in interface&nbsp;<code>org.apache.hadoop.mapred.RecordReader&lt;org.apache.hadoop.io.LongWritable,<a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkWritable.html" title="class in org.apache.hawq.pxf.plugins.hdfs">ChunkWritable</a>&gt;</code></dd>
<dt><span class="returnLabel">Returns:</span></dt>
<dd>an instance of ChunkWritable</dd>
</dl>
</li>
</ul>
<a name="next-org.apache.hadoop.io.LongWritable-org.apache.hawq.pxf.plugins.hdfs.ChunkWritable-">
<!-- -->
</a>
<ul class="blockList">
<li class="blockList">
<h4>next</h4>
<pre>public&nbsp;boolean&nbsp;next(org.apache.hadoop.io.LongWritable&nbsp;key,
<a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkWritable.html" title="class in org.apache.hawq.pxf.plugins.hdfs">ChunkWritable</a>&nbsp;value)
throws java.io.IOException</pre>
<div class="block">Fetches the next data chunk from the file split. The chunk size is a
hardcoded class parameter, CHUNK_SIZE. This behaviour sets this reader
apart from other readers, which fetch one record and stop when
reaching a record delimiter.</div>
<dl>
<dt><span class="overrideSpecifyLabel">Specified by:</span></dt>
<dd><code>next</code>&nbsp;in interface&nbsp;<code>org.apache.hadoop.mapred.RecordReader&lt;org.apache.hadoop.io.LongWritable,<a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkWritable.html" title="class in org.apache.hawq.pxf.plugins.hdfs">ChunkWritable</a>&gt;</code></dd>
<dt><span class="paramLabel">Parameters:</span></dt>
<dd><code>key</code> - output parameter. When the method returns, it will contain the key:
the number of the start byte of the chunk</dd>
<dd><code>value</code> - output parameter. When the method returns, it will contain the
value: the chunk, a byte array inside the ChunkWritable
instance</dd>
<dt><span class="returnLabel">Returns:</span></dt>
<dd>false when the end of the split was reached</dd>
<dt><span class="throwsLabel">Throws:</span></dt>
<dd><code>java.io.IOException</code> - if an I/O error occurred while reading the next chunk
or line</dd>
</dl>
</li>
</ul>
<a name="getProgress--">
<!-- -->
</a>
<ul class="blockList">
<li class="blockList">
<h4>getProgress</h4>
<pre>public&nbsp;float&nbsp;getProgress()
throws java.io.IOException</pre>
<div class="block">Gets the progress within the split.</div>
<dl>
<dt><span class="overrideSpecifyLabel">Specified by:</span></dt>
<dd><code>getProgress</code>&nbsp;in interface&nbsp;<code>org.apache.hadoop.mapred.RecordReader&lt;org.apache.hadoop.io.LongWritable,<a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkWritable.html" title="class in org.apache.hawq.pxf.plugins.hdfs">ChunkWritable</a>&gt;</code></dd>
<dt><span class="throwsLabel">Throws:</span></dt>
<dd><code>java.io.IOException</code></dd>
</dl>
</li>
</ul>
<a name="getPos--">
<!-- -->
</a>
<ul class="blockList">
<li class="blockList">
<h4>getPos</h4>
<pre>public&nbsp;long&nbsp;getPos()
throws java.io.IOException</pre>
<div class="block">Returns the position of the unread tail of the file.</div>
<dl>
<dt><span class="overrideSpecifyLabel">Specified by:</span></dt>
<dd><code>getPos</code>&nbsp;in interface&nbsp;<code>org.apache.hadoop.mapred.RecordReader&lt;org.apache.hadoop.io.LongWritable,<a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkWritable.html" title="class in org.apache.hawq.pxf.plugins.hdfs">ChunkWritable</a>&gt;</code></dd>
<dt><span class="returnLabel">Returns:</span></dt>
<dd>pos - start byte of the unread tail of the file</dd>
<dt><span class="throwsLabel">Throws:</span></dt>
<dd><code>java.io.IOException</code></dd>
</dl>
</li>
</ul>
<a name="close--">
<!-- -->
</a>
<ul class="blockListLast">
<li class="blockList">
<h4>close</h4>
<pre>public&nbsp;void&nbsp;close()
throws java.io.IOException</pre>
<div class="block">Closes the input stream.</div>
<dl>
<dt><span class="overrideSpecifyLabel">Specified by:</span></dt>
<dd><code>close</code>&nbsp;in interface&nbsp;<code>org.apache.hadoop.mapred.RecordReader&lt;org.apache.hadoop.io.LongWritable,<a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkWritable.html" title="class in org.apache.hawq.pxf.plugins.hdfs">ChunkWritable</a>&gt;</code></dd>
<dt><span class="throwsLabel">Throws:</span></dt>
<dd><code>java.io.IOException</code></dd>
</dl>
</li>
</ul>
</li>
</ul>
</li>
</ul>
</div>
</div>
<!-- ========= END OF CLASS DATA ========= -->
<!-- ======= START OF BOTTOM NAVBAR ====== -->
<div class="bottomNav"><a name="navbar.bottom">
<!-- -->
</a>
<div class="skipNav"><a href="#skip.navbar.bottom" title="Skip navigation links">Skip navigation links</a></div>
<a name="navbar.bottom.firstrow">
<!-- -->
</a>
<ul class="navList" title="Navigation">
<li><a href="../../../../../../overview-summary.html">Overview</a></li>
<li><a href="package-summary.html">Package</a></li>
<li class="navBarCell1Rev">Class</li>
<li><a href="package-tree.html">Tree</a></li>
<li><a href="../../../../../../deprecated-list.html">Deprecated</a></li>
<li><a href="../../../../../../index-all.html">Index</a></li>
<li><a href="../../../../../../help-doc.html">Help</a></li>
</ul>
</div>
<div class="subNav">
<ul class="navList">
<li><a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkReader.html" title="class in org.apache.hawq.pxf.plugins.hdfs"><span class="typeNameLink">Prev&nbsp;Class</span></a></li>
<li><a href="../../../../../../org/apache/hawq/pxf/plugins/hdfs/ChunkWritable.html" title="class in org.apache.hawq.pxf.plugins.hdfs"><span class="typeNameLink">Next&nbsp;Class</span></a></li>
</ul>
<ul class="navList">
<li><a href="../../../../../../index.html?org/apache/hawq/pxf/plugins/hdfs/ChunkRecordReader.html" target="_top">Frames</a></li>
<li><a href="ChunkRecordReader.html" target="_top">No&nbsp;Frames</a></li>
</ul>
<ul class="navList" id="allclasses_navbar_bottom">
<li><a href="../../../../../../allclasses-noframe.html">All&nbsp;Classes</a></li>
</ul>
<div>
<script type="text/javascript"><!--
allClassesLink = document.getElementById("allclasses_navbar_bottom");
if(window==top) {
allClassesLink.style.display = "block";
}
else {
allClassesLink.style.display = "none";
}
//-->
</script>
</div>
<div>
<ul class="subNavList">
<li>Summary:&nbsp;</li>
<li>Nested&nbsp;|&nbsp;</li>
<li>Field&nbsp;|&nbsp;</li>
<li><a href="#constructor.summary">Constr</a>&nbsp;|&nbsp;</li>
<li><a href="#method.summary">Method</a></li>
</ul>
<ul class="subNavList">
<li>Detail:&nbsp;</li>
<li>Field&nbsp;|&nbsp;</li>
<li><a href="#constructor.detail">Constr</a>&nbsp;|&nbsp;</li>
<li><a href="#method.detail">Method</a></li>
</ul>
</div>
<a name="skip.navbar.bottom">
<!-- -->
</a></div>
<!-- ======== END OF BOTTOM NAVBAR ======= -->
</body>
</html>