blob: 98985a3e1dbaf1ad0ae620994343c27a05c5e4f5 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.orc;
import java.io.IOException;
import java.nio.ByteBuffer;
import org.apache.orc.impl.StreamName;
import org.apache.orc.impl.writer.StreamOptions;
import org.apache.orc.impl.writer.WriterEncryptionVariant;
/**
* This interface separates the physical layout of ORC files from the higher
* level details.
*
* This API is limited to being used by LLAP.
*/
public interface PhysicalWriter {
/**
* The target of an output stream.
*/
interface OutputReceiver {
/**
* Output the given buffer to the final destination
*
* @param buffer the buffer to output
*/
void output(ByteBuffer buffer) throws IOException;
/**
* Suppress this stream from being written to the stripe.
*/
void suppress();
}
/**
* Writes the header of the file, which consists of the magic "ORC" bytes.
*/
void writeHeader() throws IOException;
/**
* Create an OutputReceiver for the given name.
* @param name the name of the stream
*/
OutputReceiver createDataStream(StreamName name) throws IOException;
/**
* Write an index in the given stream name.
* @param name the name of the stream
* @param index the bloom filter to write
*/
void writeIndex(StreamName name,
OrcProto.RowIndex.Builder index) throws IOException;
/**
* Write a bloom filter index in the given stream name.
* @param name the name of the stream
* @param bloom the bloom filter to write
*/
void writeBloomFilter(StreamName name,
OrcProto.BloomFilterIndex.Builder bloom) throws IOException;
/**
* Flushes the data in all the streams, spills them to disk, write out stripe
* footer.
* @param footer Stripe footer to be updated with relevant data and written out.
* @param dirEntry File metadata entry for the stripe, to be updated with
* relevant data.
*/
void finalizeStripe(OrcProto.StripeFooter.Builder footer,
OrcProto.StripeInformation.Builder dirEntry) throws IOException;
/**
* Write a stripe or file statistics to the file.
* @param name the name of the stream
* @param statistics the statistics to write
*/
void writeStatistics(StreamName name,
OrcProto.ColumnStatistics.Builder statistics
) throws IOException;
/**
* Writes out the file metadata.
* @param builder Metadata builder to finalize and write.
*/
void writeFileMetadata(OrcProto.Metadata.Builder builder) throws IOException;
/**
* Writes out the file footer.
* @param builder Footer builder to finalize and write.
*/
void writeFileFooter(OrcProto.Footer.Builder builder) throws IOException;
/**
* Writes out the postscript (including the size byte if needed).
* @param builder Postscript builder to finalize and write.
*/
long writePostScript(OrcProto.PostScript.Builder builder) throws IOException;
/**
* Closes the writer.
*/
void close() throws IOException;
/**
* Flushes the writer so that readers can see the preceeding postscripts.
*/
void flush() throws IOException;
/**
* Appends raw stripe data (e.g. for file merger).
* @param stripe Stripe data buffer.
* @param dirEntry File metadata entry for the stripe, to be updated with
* relevant data.
*/
void appendRawStripe(ByteBuffer stripe,
OrcProto.StripeInformation.Builder dirEntry
) throws IOException;
/**
* Get the number of bytes for a file in a givem column.
* @param column column from which to get file size
* @param variant the encryption variant to check
* @return number of bytes for the given column
*/
long getFileBytes(int column, WriterEncryptionVariant variant);
/**
* Get the unencrypted stream options for this file. This class needs the
* stream options to write the indexes and footers.
*
* Additionally, the LLAP CacheWriter wants to disable the generic compression.
*/
StreamOptions getStreamOptions();
}