<!-- blob: 1db6dca5c4fabab8fa81549fb2e240a85a8d2a40 [file] [log] [blame] -->
<!doctype html>
<html lang="en" dir="ltr" class="docs-wrapper docs-doc-page docs-version-current plugin-docs plugin-id-default docs-doc-id-development/extensions-core/avro">
<head>
<!-- Page metadata for the "Apache Avro" documentation page (generator: Docusaurus v2.4.1). -->
<meta charset="UTF-8">
<meta name="generator" content="Docusaurus v2.4.1">
<title data-rh="true">Apache Avro | Apache® Druid</title>
<meta data-rh="true" name="viewport" content="width=device-width,initial-scale=1">
<!-- Social card and search-index metadata. -->
<meta data-rh="true" name="twitter:card" content="summary_large_image">
<meta data-rh="true" property="og:image" content="https://druid.apache.org/img/druid_nav.png">
<meta data-rh="true" name="twitter:image" content="https://druid.apache.org/img/druid_nav.png">
<meta data-rh="true" property="og:url" content="https://druid.apache.org/docs/latest/development/extensions-core/avro">
<meta data-rh="true" name="docusaurus_locale" content="en">
<meta data-rh="true" name="docsearch:language" content="en">
<meta data-rh="true" name="docusaurus_version" content="current">
<meta data-rh="true" name="docusaurus_tag" content="docs-default-current">
<meta data-rh="true" name="docsearch:version" content="current">
<meta data-rh="true" name="docsearch:docusaurus_tag" content="docs-default-current">
<meta data-rh="true" property="og:title" content="Apache Avro | Apache® Druid">
<!-- Both descriptions repeat the page's opening sentence; a stray comment-opening token is not a usable summary. -->
<meta data-rh="true" name="description" content="This Apache Druid extension enables Druid to ingest and parse the Apache Avro data format.">
<meta data-rh="true" property="og:description" content="This Apache Druid extension enables Druid to ingest and parse the Apache Avro data format.">
<link data-rh="true" rel="icon" href="/img/favicon.png">
<link data-rh="true" rel="canonical" href="https://druid.apache.org/docs/latest/development/extensions-core/avro">
<link data-rh="true" rel="alternate" href="https://druid.apache.org/docs/latest/development/extensions-core/avro" hreflang="en">
<link data-rh="true" rel="alternate" href="https://druid.apache.org/docs/latest/development/extensions-core/avro" hreflang="x-default">
<!-- gtag.js loader and configuration for property UA-131010415-1. -->
<link rel="preconnect" href="https://www.google-analytics.com">
<link rel="preconnect" href="https://www.googletagmanager.com">
<script async src="https://www.googletagmanager.com/gtag/js?id=UA-131010415-1"></script>
<script>function gtag(){dataLayer.push(arguments)}window.dataLayer=window.dataLayer||[],gtag("js",new Date),gtag("config","UA-131010415-1",{})</script>
<!-- Third-party assets (Font Awesome CSS, clipboard.js) followed by the site stylesheet. -->
<!-- NOTE(review): the two CDN assets are loaded without integrity hashes; consider adding SRI once the hashes are confirmed. -->
<link rel="stylesheet" href="https://use.fontawesome.com/releases/v5.7.2/css/all.css">
<script src="https://cdnjs.cloudflare.com/ajax/libs/clipboard.js/2.0.4/clipboard.min.js"></script>
<link rel="stylesheet" href="/assets/css/styles.546f39eb.css">
<!-- Preload the two application bundles that are executed at the end of the body. -->
<link rel="preload" href="/assets/js/runtime~main.4c9a7172.js" as="script">
<link rel="preload" href="/assets/js/main.3a5ab01b.js" as="script">
</head>
<body class="navigation-with-keyboard">
<script>
// Picks the colour theme and records it as data-theme on the root element.
// Precedence: "docusaurus-theme" query parameter, then localStorage "theme", then "light".
(function () {
  // Either lookup may throw (e.g. missing API or blocked storage); treat that as "no preference".
  function themeFromQuery() {
    try {
      return new URLSearchParams(window.location.search).get("docusaurus-theme");
    } catch (err) {
      return null;
    }
  }

  function themeFromStorage() {
    try {
      return localStorage.getItem("theme");
    } catch (err) {
      return null;
    }
  }

  // `||` means an empty query value also falls through to the stored value.
  var chosen = themeFromQuery() || themeFromStorage();
  document.documentElement.setAttribute("data-theme", chosen !== null ? chosen : "light");
})();
</script><div id="__docusaurus">
<!-- Skip link; fixed top navbar (brand logo, section links, Apache® dropdown of external links, Download link, search input rendered disabled with a "Loading..." placeholder); back-to-top button; then the opening of the doc article: mobile "On this page" toggle, the h1 title, the intro list of Avro input formats, and the "Load the Avro extension" section. The containers opened here are closed further down the page. -->
<div role="region" aria-label="Skip to main content"><a class="skipToContent_fXgn" href="#__docusaurus_skipToContent_fallback">Skip to main content</a></div><nav aria-label="Main" class="navbar navbar--fixed-top navbar--dark"><div class="navbar__inner"><div class="navbar__items"><button aria-label="Toggle navigation bar" aria-expanded="false" class="navbar__toggle clean-btn" type="button"><svg width="30" height="30" viewBox="0 0 30 30" aria-hidden="true"><path stroke="currentColor" stroke-linecap="round" stroke-miterlimit="10" stroke-width="2" d="M4 7h22M4 15h22M4 23h22"></path></svg></button><a class="navbar__brand" href="/"><div class="navbar__logo"><img src="/img/druid_nav.png" alt="Apache® Druid" class="themedImage_ToTc themedImage--light_HNdA"><img src="/img/druid_nav.png" alt="Apache® Druid" class="themedImage_ToTc themedImage--dark_i4oU"></div></a></div><div class="navbar__items navbar__items--right"><a class="navbar__item navbar__link" href="/technology">Technology</a><a class="navbar__item navbar__link" href="/use-cases">Use Cases</a><a class="navbar__item navbar__link" href="/druid-powered">Powered By</a><a class="navbar__item navbar__link" href="/docs/latest/design/">Docs</a><a class="navbar__item navbar__link" href="/community/">Community</a><div class="navbar__item dropdown dropdown--hoverable dropdown--right"><a href="#" aria-haspopup="true" aria-expanded="false" role="button" class="navbar__link">Apache®</a><ul class="dropdown__menu"><li><a href="https://www.apache.org/" target="_blank" rel="noopener noreferrer" class="dropdown__link">Foundation<svg width="12" height="12" aria-hidden="true" viewBox="0 0 24 24" class="iconExternalLink_nPIU"><path fill="currentColor" d="M21 13v10h-21v-19h12v2h-10v15h17v-8h2zm3-12h-10.988l4.035 4-6.977 7.07 2.828 2.828 6.977-7.07 4.125 4.172v-11z"></path></svg></a></li><li><a href="https://apachecon.com/?ref=druid.apache.org" target="_blank" rel="noopener noreferrer" class="dropdown__link">Events<svg width="12" 
height="12" aria-hidden="true" viewBox="0 0 24 24" class="iconExternalLink_nPIU"><path fill="currentColor" d="M21 13v10h-21v-19h12v2h-10v15h17v-8h2zm3-12h-10.988l4.035 4-6.977 7.07 2.828 2.828 6.977-7.07 4.125 4.172v-11z"></path></svg></a></li><li><a href="https://www.apache.org/licenses/" target="_blank" rel="noopener noreferrer" class="dropdown__link">License<svg width="12" height="12" aria-hidden="true" viewBox="0 0 24 24" class="iconExternalLink_nPIU"><path fill="currentColor" d="M21 13v10h-21v-19h12v2h-10v15h17v-8h2zm3-12h-10.988l4.035 4-6.977 7.07 2.828 2.828 6.977-7.07 4.125 4.172v-11z"></path></svg></a></li><li><a href="https://www.apache.org/foundation/thanks.html" target="_blank" rel="noopener noreferrer" class="dropdown__link">Thanks<svg width="12" height="12" aria-hidden="true" viewBox="0 0 24 24" class="iconExternalLink_nPIU"><path fill="currentColor" d="M21 13v10h-21v-19h12v2h-10v15h17v-8h2zm3-12h-10.988l4.035 4-6.977 7.07 2.828 2.828 6.977-7.07 4.125 4.172v-11z"></path></svg></a></li><li><a href="https://www.apache.org/security/" target="_blank" rel="noopener noreferrer" class="dropdown__link">Security<svg width="12" height="12" aria-hidden="true" viewBox="0 0 24 24" class="iconExternalLink_nPIU"><path fill="currentColor" d="M21 13v10h-21v-19h12v2h-10v15h17v-8h2zm3-12h-10.988l4.035 4-6.977 7.07 2.828 2.828 6.977-7.07 4.125 4.172v-11z"></path></svg></a></li><li><a href="https://www.apache.org/foundation/sponsorship.html" target="_blank" rel="noopener noreferrer" class="dropdown__link">Sponsorship<svg width="12" height="12" aria-hidden="true" viewBox="0 0 24 24" class="iconExternalLink_nPIU"><path fill="currentColor" d="M21 13v10h-21v-19h12v2h-10v15h17v-8h2zm3-12h-10.988l4.035 4-6.977 7.07 2.828 2.828 6.977-7.07 4.125 4.172v-11z"></path></svg></a></li></ul></div><a class="navbar__item navbar__link" href="/downloads/">Download</a><div class="searchBox_ZlJk"><div class="navbar__search"><span aria-label="expand searchbar" role="button" class="search-icon" 
tabindex="0"></span><input type="search" id="search_input_react" placeholder="Loading..." aria-label="Search" class="navbar__search-input search-bar" disabled=""></div></div></div></div><div role="presentation" class="navbar-sidebar__backdrop"></div></nav><div id="__docusaurus_skipToContent_fallback" class="main-wrapper mainWrapper_z2l0 docsWrapper_BCFX"><button aria-label="Scroll back to top" class="clean-btn theme-back-to-top-button backToTopButton_sjWU" type="button"></button><div class="docPage__5DB"><main class="docMainContainer_gTbr docMainContainerEnhanced_Uz_u"><div class="container padding-top--md padding-bottom--lg"><div class="row"><div class="col docItemCol_VOVn"><div class="docItemContainer_Djhp"><article><div class="tocCollapsible_ETCw theme-doc-toc-mobile tocMobile_ITEo"><button type="button" class="clean-btn tocCollapsibleButton_TO0P">On this page</button></div><div class="theme-doc-markdown markdown"><header><h1>Apache Avro</h1></header><p>This Apache Druid extension enables Druid to ingest and parse the Apache Avro data format as follows:</p><ul><li><a href="/docs/latest/ingestion/data-formats#avro-stream">Avro stream input format</a> for Kafka and Kinesis.</li><li><a href="/docs/latest/ingestion/data-formats#avro-ocf">Avro OCF input format</a> for native batch ingestion.</li><li><a href="/docs/latest/ingestion/data-formats#avro-hadoop-parser">Avro Hadoop Parser</a>.</li></ul><p>The <a href="/docs/latest/ingestion/data-formats#avro-stream-parser">Avro Stream Parser</a> is deprecated.</p><h2 class="anchor anchorWithStickyNavbar_LWe7" id="load-the-avro-extension">Load the Avro extension<a href="#load-the-avro-extension" class="hash-link" aria-label="Direct link to Load the Avro extension" title="Direct link to Load the Avro extension"></a></h2><p>To use the Avro extension, add the <code>druid-avro-extensions</code> to the list of loaded extensions. 
See <a href="/docs/latest/configuration/extensions#loading-extensions">Loading extensions</a> for more information.</p><h2 class="anchor anchorWithStickyNavbar_LWe7" id="avro-types">Avro types<a href="#avro-types" class="hash-link" aria-label="Direct link to Avro types" title="Direct link to Avro types"></a></h2><p>Druid supports most Avro types natively. This section describes some exceptions.</p><h3 class="anchor anchorWithStickyNavbar_LWe7" id="unions">Unions<a href="#unions" class="hash-link" aria-label="Direct link to Unions" title="Direct link to Unions"></a></h3><p>Druid has two modes for supporting <code>union</code> types.</p><p>The default mode treats unions as a single value regardless of the type of data populating the union.</p><p>If you want to operate on individual members of a union, set <code>extractUnionsByType</code> on the Avro parser. This configuration expands union values into nested objects according to the following rules:</p><ul><li>Primitive types and unnamed complex types are keyed by their type name, such as <code>int</code> and <code>string</code>.</li><li>Complex named types are keyed by their names; this includes <code>record</code>, <code>fixed</code>, and <code>enum</code>.</li><li>The Avro null type is elided as its value can only ever be null.</li></ul><p>This is safe because an Avro union can only contain a single member of each unnamed type and duplicates of the same named type are not allowed. 
For example, only a single array is allowed, but multiple records (or other named types) are allowed as long as each has a unique name.</p><p>You can then access the members of the union with a <a href="/docs/latest/ingestion/data-formats#flattenspec">flattenSpec</a> like you would for other nested types.</p><h3 class="anchor anchorWithStickyNavbar_LWe7" id="binary-types">Binary types<a href="#binary-types" class="hash-link" aria-label="Direct link to Binary types" title="Direct link to Binary types"></a></h3><p>The extension returns <code>bytes</code> and <code>fixed</code> Avro types as base64-encoded strings by default. To decode these types as UTF-8 strings, enable the <code>binaryAsString</code> option on the Avro parser.</p><h3 class="anchor anchorWithStickyNavbar_LWe7" id="enums">Enums<a href="#enums" class="hash-link" aria-label="Direct link to Enums" title="Direct link to Enums"></a></h3><p>The extension returns <code>enum</code> types as the <code>string</code> value of the enum symbol.</p><h3 class="anchor anchorWithStickyNavbar_LWe7" id="complex-types">Complex types<a href="#complex-types" class="hash-link" aria-label="Direct link to Complex types" title="Direct link to Complex types"></a></h3><p>You can ingest <code>record</code> and <code>map</code> types representing nested data with a <a href="/docs/latest/ingestion/data-formats#flattenspec">flattenSpec</a> on the parser.</p><h3 class="anchor anchorWithStickyNavbar_LWe7" id="logical-types">Logical types<a href="#logical-types" class="hash-link" aria-label="Direct link to Logical types" title="Direct link to Logical types"></a></h3><p>Druid does not currently support Avro logical types. 
It ignores them and handles fields according to the underlying primitive type.</p></div></article><nav class="pagination-nav docusaurus-mt-lg" aria-label="Docs pages"></nav></div></div><div class="col col--3"><div class="tableOfContents_bqdL thin-scrollbar theme-doc-toc-desktop"><ul class="table-of-contents table-of-contents__left-border"><li><a href="#load-the-avro-extension" class="table-of-contents__link toc-highlight">Load the Avro extension</a></li><li><a href="#avro-types" class="table-of-contents__link toc-highlight">Avro types</a><ul><li><a href="#unions" class="table-of-contents__link toc-highlight">Unions</a></li><li><a href="#binary-types" class="table-of-contents__link toc-highlight">Binary types</a></li><li><a href="#enums" class="table-of-contents__link toc-highlight">Enums</a></li><li><a href="#complex-types" class="table-of-contents__link toc-highlight">Complex types</a></li><li><a href="#logical-types" class="table-of-contents__link toc-highlight">Logical types</a></li></ul></li></ul></div></div></div></div></main></div></div><!-- Site footer. The two themed logo images are decorative (the copyright text carries the information), so each has an empty alt to keep assistive technology from announcing the file name. --><footer class="footer"><div class="container container-fluid"><div class="footer__bottom text--center"><div class="margin-bottom--sm"><img src="/img/favicon.png" alt="" class="themedImage_ToTc themedImage--light_HNdA footer__logo"><img src="/img/favicon.png" alt="" class="themedImage_ToTc themedImage--dark_i4oU footer__logo"></div><div class="footer__copyright">Copyright © 2023 Apache Software Foundation. Except where otherwise noted, licensed under CC BY-SA 4.0. Apache Druid, Druid, and the Druid logo are either registered trademarks or trademarks of The Apache Software Foundation in the United States and other countries.</div></div></div></footer></div>
<script src="/assets/js/runtime~main.4c9a7172.js"></script>
<script src="/assets/js/main.3a5ab01b.js"></script>
</body>
</html>