<!-- blob: 4aff28aa92c286a38d4dbebd8f003b60665849d5 [file] [log] [blame] -->
<!DOCTYPE HTML>
<!-- NewPage -->
<html lang="en">
<head>
<!-- Generated by javadoc (11.0.12) on Wed Aug 18 10:34:26 PDT 2021 -->
<!-- Character encoding is declared first so it applies before any text is parsed -->
<meta charset="utf-8">
<title>ParquetSchemaUtil</title>
<meta name="dc.created" content="2021-08-18">
<!-- Stylesheets: site styles first, then the jQuery UI theme -->
<link rel="stylesheet" href="../../../../stylesheet.css" title="Style">
<link rel="stylesheet" href="../../../../jquery/jquery-ui.css" title="Style">
<!-- Scripts load synchronously and in this order; the inline scripts in the body call into them -->
<script src="../../../../script.js"></script>
<script src="../../../../jquery/jszip/dist/jszip.min.js"></script>
<script src="../../../../jquery/jszip-utils/dist/jszip-utils.min.js"></script>
<!--[if IE]>
<script type="text/javascript" src="../../../../jquery/jszip-utils/dist/jszip-utils-ie.min.js"></script>
<![endif]-->
<script src="../../../../jquery/jquery-3.5.1.js"></script>
<script src="../../../../jquery/jquery-ui.js"></script>
</head>
<body>
<script type="text/javascript">
// Copy this page's title onto the parent document, unless the URL marks the
// page as an external link ("is-external=true").
try {
    if (location.href.indexOf('is-external=true') === -1) {
        parent.document.title="ParquetSchemaUtil";
    }
} catch (err) {
    // Deliberately ignored: failing to set the parent title must not stop the page.
}

// Page-level globals. They are not read in this file; presumably the external
// script.js consumes them (e.g. for the method-table tabs) - verify there.
// "data" has one entry per method summary row id (i0..i7).
var data = {"i0":9,"i1":9,"i2":9,"i3":9,"i4":9,"i5":9,"i6":9,"i7":9};
// "tabs" maps a numeric key to [tab element id, tab caption].
var tabs = {65535:["t0","All Methods"],1:["t1","Static Methods"],8:["t4","Concrete Methods"]};
// CSS class names used by the summary table rows and tabs.
var altColor = "altColor";
var rowColor = "rowColor";
var tableTab = "tableTab";
var activeTableTab = "activeTableTab";
// Relative path from this page to the documentation root.
var pathtoroot = "../../../../";
var useModuleDirectories = true;
// loadScripts is not defined in this file (presumably provided by script.js).
loadScripts(document, 'script');
</script>
<noscript>
<div>JavaScript is disabled on your browser.</div>
</noscript>
<header role="banner">
<!-- Top navigation landmark. It carries a label because the page also has a
     bottom navigation bar, and assistive technology needs to tell them apart. -->
<nav role="navigation" aria-label="Top">
<div class="fixedNav">
<!-- ========= START OF TOP NAVBAR ======= -->
<div class="topNav"><a id="navbar.top">
<!-- -->
</a>
<div class="skipNav"><a href="#skip.navbar.top" title="Skip navigation links">Skip navigation links</a></div>
<a id="navbar.top.firstrow">
<!-- -->
</a>
<ul class="navList" title="Navigation">
<li><a href="../../../../index.html">Overview</a></li>
<li><a href="package-summary.html">Package</a></li>
<li class="navBarCell1Rev">Class</li>
<li><a href="package-tree.html">Tree</a></li>
<li><a href="../../../../deprecated-list.html">Deprecated</a></li>
<li><a href="../../../../index-all.html">Index</a></li>
<li><a href="../../../../help-doc.html">Help</a></li>
</ul>
</div>
<div class="subNav">
<ul class="navList" id="allclasses_navbar_top">
<li><a href="../../../../allclasses.html">All&nbsp;Classes</a></li>
</ul>
<!-- Search box; rendered disabled in the static markup -->
<ul class="navListSearch">
<li><label for="search">SEARCH:</label>
<input type="text" id="search" value="search" disabled="disabled">
<input type="reset" id="reset" value="reset" disabled="disabled">
</li>
</ul>
<div>
<script type="text/javascript">
// Show the "All Classes" link only when this page is the top-level window
// (window == top); hide it otherwise. Declared with var so the script no
// longer relies on an implicit global assignment.
var allClassesLink = document.getElementById("allclasses_navbar_top");
allClassesLink.style.display = (window == top) ? "block" : "none";
</script>
<noscript>
<div>JavaScript is disabled on your browser.</div>
</noscript>
</div>
<div>
<!-- In-page jump links to the summary sections -->
<ul class="subNavList">
<li>Summary:&nbsp;</li>
<li><a href="#nested.class.summary">Nested</a>&nbsp;|&nbsp;</li>
<li>Field&nbsp;|&nbsp;</li>
<li>Constr&nbsp;|&nbsp;</li>
<li><a href="#method.summary">Method</a></li>
</ul>
<!-- In-page jump links to the detail sections -->
<ul class="subNavList">
<li>Detail:&nbsp;</li>
<li>Field&nbsp;|&nbsp;</li>
<li>Constr&nbsp;|&nbsp;</li>
<li><a href="#method.detail">Method</a></li>
</ul>
</div>
<a id="skip.navbar.top">
<!-- -->
</a></div>
<!-- ========= END OF TOP NAVBAR ========= -->
</div>
<div class="navPadding">&nbsp;</div>
<script type="text/javascript">
// Give the spacer a top padding equal to the computed height of .fixedNav.
// Uses the jQuery "$" global, which is not defined in this file.
$('.navPadding').css('padding-top', $('.fixedNav').css("height"));
</script>
</nav>
</header>
<!-- ======== START OF CLASS DATA ======== -->
<main role="main">
<!-- Page heading: link to the containing package, then the class title -->
<div class="header">
<div class="subTitle"><span class="packageLabelInType">Package</span>&nbsp;<a href="package-summary.html">org.apache.iceberg.parquet</a></div>
<h2 title="Class ParquetSchemaUtil" class="title">Class ParquetSchemaUtil</h2>
</div>
<div class="contentContainer">
<!-- Inheritance chain, outermost ancestor first; each nested list is one level down -->
<ul class="inheritance">
<li>java.lang.Object</li>
<li>
<ul class="inheritance">
<li>org.apache.iceberg.parquet.ParquetSchemaUtil</li>
</ul>
</li>
</ul>
<!-- Class declaration as written in the source; this class has no class-level description text -->
<div class="description">
<ul class="blockList">
<li class="blockList">
<hr>
<pre>public class <span class="typeNameLabel">ParquetSchemaUtil</span>
extends java.lang.Object</pre>
</li>
</ul>
</div>
<div class="summary">
<ul class="blockList">
<li class="blockList">
<!-- ======== NESTED CLASS SUMMARY ======== -->
<!-- A region landmark needs an accessible name; the label repeats the visible heading text -->
<section role="region" aria-label="Nested Class Summary">
<ul class="blockList">
<li class="blockList"><a id="nested.class.summary">
<!-- -->
</a>
<h3>Nested Class Summary</h3>
<!-- One row per nested class: modifiers, linked class name, description -->
<table class="memberSummary">
<caption><span>Nested Classes</span><span class="tabEnd">&nbsp;</span></caption>
<tr>
<th class="colFirst" scope="col">Modifier and Type</th>
<th class="colSecond" scope="col">Class</th>
<th class="colLast" scope="col">Description</th>
</tr>
<tr class="altColor">
<td class="colFirst"><code>static class&nbsp;</code></td>
<th class="colSecond" scope="row"><code><span class="memberNameLink"><a href="ParquetSchemaUtil.HasIds.html" title="class in org.apache.iceberg.parquet">ParquetSchemaUtil.HasIds</a></span></code></th>
<td class="colLast">&nbsp;</td>
</tr>
</table>
</li>
</ul>
</section>
<!-- ========== METHOD SUMMARY =========== -->
<!-- A region landmark needs an accessible name; the label repeats the visible heading text -->
<section role="region" aria-label="Method Summary">
<ul class="blockList">
<li class="blockList"><a id="method.summary">
<!-- -->
</a>
<h3>Method Summary</h3>
<!-- The caption holds the filter tabs (t0, t1, t4); the tab links call show(n), which is not defined in this file.
     Row ids i0..i7 match the keys of the "data" object declared in the page's first inline script. -->
<table class="memberSummary">
<caption><span id="t0" class="activeTableTab"><span>All Methods</span><span class="tabEnd">&nbsp;</span></span><span id="t1" class="tableTab"><span><a href="javascript:show(1);">Static Methods</a></span><span class="tabEnd">&nbsp;</span></span><span id="t4" class="tableTab"><span><a href="javascript:show(8);">Concrete Methods</a></span><span class="tabEnd">&nbsp;</span></span></caption>
<tr>
<th class="colFirst" scope="col">Modifier and Type</th>
<th class="colSecond" scope="col">Method</th>
<th class="colLast" scope="col">Description</th>
</tr>
<tr id="i0" class="altColor">
<td class="colFirst"><code>static org.apache.parquet.schema.MessageType</code></td>
<th class="colSecond" scope="row"><code><span class="memberNameLink"><a href="#addFallbackIds(org.apache.parquet.schema.MessageType)">addFallbackIds</a></span>&#8203;(org.apache.parquet.schema.MessageType&nbsp;fileSchema)</code></th>
<td class="colLast">&nbsp;</td>
</tr>
<tr id="i1" class="rowColor">
<td class="colFirst"><code>static org.apache.parquet.schema.MessageType</code></td>
<th class="colSecond" scope="row"><code><span class="memberNameLink"><a href="#applyNameMapping(org.apache.parquet.schema.MessageType,org.apache.iceberg.mapping.NameMapping)">applyNameMapping</a></span>&#8203;(org.apache.parquet.schema.MessageType&nbsp;fileSchema,
<a href="../mapping/NameMapping.html" title="class in org.apache.iceberg.mapping">NameMapping</a>&nbsp;nameMapping)</code></th>
<td class="colLast">&nbsp;</td>
</tr>
<tr id="i2" class="altColor">
<td class="colFirst"><code>static org.apache.parquet.schema.MessageType</code></td>
<th class="colSecond" scope="row"><code><span class="memberNameLink"><a href="#convert(org.apache.iceberg.Schema,java.lang.String)">convert</a></span>&#8203;(<a href="../Schema.html" title="class in org.apache.iceberg">Schema</a>&nbsp;schema,
java.lang.String&nbsp;name)</code></th>
<td class="colLast">&nbsp;</td>
</tr>
<tr id="i3" class="rowColor">
<td class="colFirst"><code>static <a href="../Schema.html" title="class in org.apache.iceberg">Schema</a></code></td>
<th class="colSecond" scope="row"><code><span class="memberNameLink"><a href="#convert(org.apache.parquet.schema.MessageType)">convert</a></span>&#8203;(org.apache.parquet.schema.MessageType&nbsp;parquetSchema)</code></th>
<td class="colLast">
<div class="block">Converts a Parquet schema to an Iceberg schema.</div>
</td>
</tr>
<tr id="i4" class="altColor">
<td class="colFirst"><code>static <a href="../Schema.html" title="class in org.apache.iceberg">Schema</a></code></td>
<th class="colSecond" scope="row"><code><span class="memberNameLink"><a href="#convertAndPrune(org.apache.parquet.schema.MessageType)">convertAndPrune</a></span>&#8203;(org.apache.parquet.schema.MessageType&nbsp;parquetSchema)</code></th>
<td class="colLast">
<div class="block">Converts a Parquet schema to an Iceberg schema and prunes fields without IDs.</div>
</td>
</tr>
<tr id="i5" class="rowColor">
<td class="colFirst"><code>static boolean</code></td>
<th class="colSecond" scope="row"><code><span class="memberNameLink"><a href="#hasIds(org.apache.parquet.schema.MessageType)">hasIds</a></span>&#8203;(org.apache.parquet.schema.MessageType&nbsp;fileSchema)</code></th>
<td class="colLast">&nbsp;</td>
</tr>
<tr id="i6" class="altColor">
<td class="colFirst"><code>static org.apache.parquet.schema.MessageType</code></td>
<th class="colSecond" scope="row"><code><span class="memberNameLink"><a href="#pruneColumns(org.apache.parquet.schema.MessageType,org.apache.iceberg.Schema)">pruneColumns</a></span>&#8203;(org.apache.parquet.schema.MessageType&nbsp;fileSchema,
<a href="../Schema.html" title="class in org.apache.iceberg">Schema</a>&nbsp;expectedSchema)</code></th>
<td class="colLast">&nbsp;</td>
</tr>
<tr id="i7" class="rowColor">
<td class="colFirst"><code>static org.apache.parquet.schema.MessageType</code></td>
<th class="colSecond" scope="row"><code><span class="memberNameLink"><a href="#pruneColumnsFallback(org.apache.parquet.schema.MessageType,org.apache.iceberg.Schema)">pruneColumnsFallback</a></span>&#8203;(org.apache.parquet.schema.MessageType&nbsp;fileSchema,
<a href="../Schema.html" title="class in org.apache.iceberg">Schema</a>&nbsp;expectedSchema)</code></th>
<td class="colLast">
<div class="block">Prunes columns from a Parquet file schema that was written without field ids.</div>
</td>
</tr>
</table>
<!-- Methods inherited unchanged from java.lang.Object -->
<ul class="blockList">
<li class="blockList"><a id="methods.inherited.from.class.java.lang.Object">
<!-- -->
</a>
<h3>Methods inherited from class&nbsp;java.lang.Object</h3>
<code>clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait</code></li>
</ul>
</li>
</ul>
</section>
</li>
</ul>
</div>
<div class="details">
<ul class="blockList">
<li class="blockList">
<!-- ============ METHOD DETAIL ========== -->
<!-- A region landmark needs an accessible name; the label repeats the visible heading text.
     Each method below is preceded by an empty anchor whose id is the method signature;
     the links in the method summary table point at those ids. -->
<section role="region" aria-label="Method Detail">
<ul class="blockList">
<li class="blockList"><a id="method.detail">
<!-- -->
</a>
<h3>Method Detail</h3>
<a id="convert(org.apache.iceberg.Schema,java.lang.String)">
<!-- -->
</a>
<ul class="blockList">
<li class="blockList">
<h4>convert</h4>
<pre class="methodSignature">public static&nbsp;org.apache.parquet.schema.MessageType&nbsp;convert&#8203;(<a href="../Schema.html" title="class in org.apache.iceberg">Schema</a>&nbsp;schema,
java.lang.String&nbsp;name)</pre>
</li>
</ul>
<a id="convert(org.apache.parquet.schema.MessageType)">
<!-- -->
</a>
<ul class="blockList">
<li class="blockList">
<h4>convert</h4>
<pre class="methodSignature">public static&nbsp;<a href="../Schema.html" title="class in org.apache.iceberg">Schema</a>&nbsp;convert&#8203;(org.apache.parquet.schema.MessageType&nbsp;parquetSchema)</pre>
<div class="block">Converts a Parquet schema to an Iceberg schema. Fields without IDs are kept and assigned fallback IDs.</div>
<dl>
<dt><span class="paramLabel">Parameters:</span></dt>
<dd><code>parquetSchema</code> - a Parquet schema</dd>
<dt><span class="returnLabel">Returns:</span></dt>
<dd>a matching Iceberg schema for the provided Parquet schema</dd>
</dl>
</li>
</ul>
<a id="convertAndPrune(org.apache.parquet.schema.MessageType)">
<!-- -->
</a>
<ul class="blockList">
<li class="blockList">
<h4>convertAndPrune</h4>
<pre class="methodSignature">public static&nbsp;<a href="../Schema.html" title="class in org.apache.iceberg">Schema</a>&nbsp;convertAndPrune&#8203;(org.apache.parquet.schema.MessageType&nbsp;parquetSchema)</pre>
<div class="block">Converts a Parquet schema to an Iceberg schema and prunes fields without IDs.</div>
<dl>
<dt><span class="paramLabel">Parameters:</span></dt>
<dd><code>parquetSchema</code> - a Parquet schema</dd>
<dt><span class="returnLabel">Returns:</span></dt>
<dd>a matching Iceberg schema for the provided Parquet schema</dd>
</dl>
</li>
</ul>
<a id="pruneColumns(org.apache.parquet.schema.MessageType,org.apache.iceberg.Schema)">
<!-- -->
</a>
<ul class="blockList">
<li class="blockList">
<h4>pruneColumns</h4>
<pre class="methodSignature">public static&nbsp;org.apache.parquet.schema.MessageType&nbsp;pruneColumns&#8203;(org.apache.parquet.schema.MessageType&nbsp;fileSchema,
<a href="../Schema.html" title="class in org.apache.iceberg">Schema</a>&nbsp;expectedSchema)</pre>
</li>
</ul>
<a id="pruneColumnsFallback(org.apache.parquet.schema.MessageType,org.apache.iceberg.Schema)">
<!-- -->
</a>
<ul class="blockList">
<li class="blockList">
<h4>pruneColumnsFallback</h4>
<pre class="methodSignature">public static&nbsp;org.apache.parquet.schema.MessageType&nbsp;pruneColumnsFallback&#8203;(org.apache.parquet.schema.MessageType&nbsp;fileSchema,
<a href="../Schema.html" title="class in org.apache.iceberg">Schema</a>&nbsp;expectedSchema)</pre>
<div class="block">Prunes columns from a Parquet file schema that was written without field ids.
<p>
Files that were written without field ids are read assuming that schema evolution preserved
column order. Deleting columns was not allowed.
<p>
The order of columns in the resulting Parquet schema matches the Parquet file.</div>
<dl>
<dt><span class="paramLabel">Parameters:</span></dt>
<dd><code>fileSchema</code> - schema from a Parquet file that does not have field ids.</dd>
<dd><code>expectedSchema</code> - expected schema</dd>
<dt><span class="returnLabel">Returns:</span></dt>
<dd>a parquet schema pruned using the expected schema</dd>
</dl>
</li>
</ul>
<a id="hasIds(org.apache.parquet.schema.MessageType)">
<!-- -->
</a>
<ul class="blockList">
<li class="blockList">
<h4>hasIds</h4>
<pre class="methodSignature">public static&nbsp;boolean&nbsp;hasIds&#8203;(org.apache.parquet.schema.MessageType&nbsp;fileSchema)</pre>
</li>
</ul>
<a id="addFallbackIds(org.apache.parquet.schema.MessageType)">
<!-- -->
</a>
<ul class="blockList">
<li class="blockList">
<h4>addFallbackIds</h4>
<pre class="methodSignature">public static&nbsp;org.apache.parquet.schema.MessageType&nbsp;addFallbackIds&#8203;(org.apache.parquet.schema.MessageType&nbsp;fileSchema)</pre>
</li>
</ul>
<a id="applyNameMapping(org.apache.parquet.schema.MessageType,org.apache.iceberg.mapping.NameMapping)">
<!-- -->
</a>
<ul class="blockListLast">
<li class="blockList">
<h4>applyNameMapping</h4>
<pre class="methodSignature">public static&nbsp;org.apache.parquet.schema.MessageType&nbsp;applyNameMapping&#8203;(org.apache.parquet.schema.MessageType&nbsp;fileSchema,
<a href="../mapping/NameMapping.html" title="class in org.apache.iceberg.mapping">NameMapping</a>&nbsp;nameMapping)</pre>
</li>
</ul>
</li>
</ul>
</section>
</li>
</ul>
</div>
</div>
</main>
<!-- ========= END OF CLASS DATA ========= -->
<footer role="contentinfo">
<!-- Bottom navigation landmark. It carries a label because the page also has a
     top navigation bar, and assistive technology needs to tell them apart. -->
<nav role="navigation" aria-label="Bottom">
<!-- ======= START OF BOTTOM NAVBAR ====== -->
<div class="bottomNav"><a id="navbar.bottom">
<!-- -->
</a>
<div class="skipNav"><a href="#skip.navbar.bottom" title="Skip navigation links">Skip navigation links</a></div>
<a id="navbar.bottom.firstrow">
<!-- -->
</a>
<ul class="navList" title="Navigation">
<li><a href="../../../../index.html">Overview</a></li>
<li><a href="package-summary.html">Package</a></li>
<li class="navBarCell1Rev">Class</li>
<li><a href="package-tree.html">Tree</a></li>
<li><a href="../../../../deprecated-list.html">Deprecated</a></li>
<li><a href="../../../../index-all.html">Index</a></li>
<li><a href="../../../../help-doc.html">Help</a></li>
</ul>
</div>
<div class="subNav">
<ul class="navList" id="allclasses_navbar_bottom">
<li><a href="../../../../allclasses.html">All&nbsp;Classes</a></li>
</ul>
<div>
<script type="text/javascript">
// Show the "All Classes" link only when this page is the top-level window
// (window == top); hide it otherwise. Declared with var so the script does
// not rely on an implicit global assignment.
var allClassesLink = document.getElementById("allclasses_navbar_bottom");
allClassesLink.style.display = (window == top) ? "block" : "none";
</script>
<noscript>
<div>JavaScript is disabled on your browser.</div>
</noscript>
</div>
<div>
<!-- In-page jump links to the summary sections -->
<ul class="subNavList">
<li>Summary:&nbsp;</li>
<li><a href="#nested.class.summary">Nested</a>&nbsp;|&nbsp;</li>
<li>Field&nbsp;|&nbsp;</li>
<li>Constr&nbsp;|&nbsp;</li>
<li><a href="#method.summary">Method</a></li>
</ul>
<!-- In-page jump links to the detail sections -->
<ul class="subNavList">
<li>Detail:&nbsp;</li>
<li>Field&nbsp;|&nbsp;</li>
<li>Constr&nbsp;|&nbsp;</li>
<li><a href="#method.detail">Method</a></li>
</ul>
</div>
<a id="skip.navbar.bottom">
<!-- -->
</a></div>
<!-- ======== END OF BOTTOM NAVBAR ======= -->
</nav>
</footer>
</body>
</html>