tez-api/src/main/java/org/apache/tez/dag/api/DataSinkDescriptor.java - tez - Git at Google

 /**
  * Licensed to the Apache Software Foundation (ASF) under one
  * or more contributor license agreements.  See the NOTICE file
  * distributed with this work for additional information
  * regarding copyright ownership.  The ASF licenses this file
  * to you under the Apache License, Version 2.0 (the
  * "License"); you may not use this file except in compliance
  * with the License.  You may obtain a copy of the License at
  *
  *     http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */

 package org.apache.tez.dag.api;

 import javax.annotation.Nullable;

 import org.apache.hadoop.classification.InterfaceAudience.Public;
 import org.apache.hadoop.security.Credentials;

 /**
  * Defines the output, the optional output committer and the optional
  * credentials for a data sink. Instances are immutable: all fields are
  * assigned once at construction time.
  */
 @Public
 public class DataSinkDescriptor {
   private final OutputDescriptor outputDescriptor;
   private final OutputCommitterDescriptor committerDescriptor;
   private final Credentials credentials;

   /**
    * Create a {@link DataSinkDescriptor}.
    *
    * @param outputDescriptor
    *          The {@link OutputDescriptor} for the output
    * @param committerDescriptor
    *          The committer to be used for the output. Can be null. See
    *          {@link #create(OutputDescriptor, OutputCommitterDescriptor, Credentials)}
    *          for a description of the commit operation.
    * @param credentials
    *          Credentials needed to access the data sink. Can be null.
    * @deprecated Prefer
    *          {@link #create(OutputDescriptor, OutputCommitterDescriptor, Credentials)}.
    */
   @Deprecated
   public DataSinkDescriptor(
       OutputDescriptor outputDescriptor,
       @Nullable OutputCommitterDescriptor committerDescriptor,
       @Nullable Credentials credentials) {
     this.credentials = credentials;
     this.committerDescriptor = committerDescriptor;
     this.outputDescriptor = outputDescriptor;
   }

   /**
    * Create a {@link DataSinkDescriptor}.
    *
    * @param outputDescriptor
    *          The {@link OutputDescriptor} for the output
    * @param committerDescriptor
    *          The committer to be used for the output. Can be null. After all
    *          tasks in the vertex (or in the DAG) have completed, the
    *          committer (if specified) is invoked to commit the outputs.
    *          Commit is a data sink specific operation that usually
    *          determines the visibility of the output to external observers,
    *          e.g. moving output files from temporary dirs to the real output
    *          dir. When there are multiple executions of a task, the commit
    *          process also helps decide which execution will be included in
    *          the final output. Users should consider whether their
    *          application or data sink needs a commit operation.
    * @param credentials
    *          Credentials needed to access the data sink. Can be null.
    * @return a new {@link DataSinkDescriptor} holding the given arguments
    */
   public static DataSinkDescriptor create(
       OutputDescriptor outputDescriptor,
       @Nullable OutputCommitterDescriptor committerDescriptor,
       @Nullable Credentials credentials) {
     final DataSinkDescriptor sink =
         new DataSinkDescriptor(outputDescriptor, committerDescriptor, credentials);
     return sink;
   }

   /**
    * @return the {@link OutputDescriptor} this descriptor was created with
    */
   public OutputDescriptor getOutputDescriptor() {
     return this.outputDescriptor;
   }

   /**
    * @return the {@link OutputCommitterDescriptor} this descriptor was
    *         created with, or null if none was specified
    */
   @Nullable
   public OutputCommitterDescriptor getOutputCommitterDescriptor() {
     return this.committerDescriptor;
   }

   /**
    * @return the {@link Credentials} this descriptor was created with, or
    *         null if none were specified
    */
   @Nullable
   public Credentials getCredentials() {
     return this.credentials;
   }

 }
	/**
	* Licensed to the Apache Software Foundation (ASF) under one
	* or more contributor license agreements. See the NOTICE file
	* distributed with this work for additional information
	* regarding copyright ownership. The ASF licenses this file
	* to you under the Apache License, Version 2.0 (the
	* "License"); you may not use this file except in compliance
	* with the License. You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/

	package org.apache.tez.dag.api;

	import javax.annotation.Nullable;

	import org.apache.hadoop.classification.InterfaceAudience.Public;
	import org.apache.hadoop.security.Credentials;

	/**
	 * Defines the output, the optional output committer and the optional
	 * credentials for a data sink. Instances are immutable: all fields are
	 * assigned once at construction time.
	 */
	@Public
	public class DataSinkDescriptor {
	  private final OutputDescriptor outputDescriptor;
	  private final OutputCommitterDescriptor committerDescriptor;
	  private final Credentials credentials;

	  /**
	   * Create a {@link DataSinkDescriptor}.
	   *
	   * @param outputDescriptor
	   *          The {@link OutputDescriptor} for the output
	   * @param committerDescriptor
	   *          The committer to be used for the output. Can be null. See
	   *          {@link #create(OutputDescriptor, OutputCommitterDescriptor, Credentials)}
	   *          for a description of the commit operation.
	   * @param credentials
	   *          Credentials needed to access the data sink. Can be null.
	   * @deprecated Prefer
	   *          {@link #create(OutputDescriptor, OutputCommitterDescriptor, Credentials)}.
	   */
	  @Deprecated
	  public DataSinkDescriptor(
	      OutputDescriptor outputDescriptor,
	      @Nullable OutputCommitterDescriptor committerDescriptor,
	      @Nullable Credentials credentials) {
	    this.credentials = credentials;
	    this.committerDescriptor = committerDescriptor;
	    this.outputDescriptor = outputDescriptor;
	  }

	  /**
	   * Create a {@link DataSinkDescriptor}.
	   *
	   * @param outputDescriptor
	   *          The {@link OutputDescriptor} for the output
	   * @param committerDescriptor
	   *          The committer to be used for the output. Can be null. After all
	   *          tasks in the vertex (or in the DAG) have completed, the
	   *          committer (if specified) is invoked to commit the outputs.
	   *          Commit is a data sink specific operation that usually
	   *          determines the visibility of the output to external observers,
	   *          e.g. moving output files from temporary dirs to the real output
	   *          dir. When there are multiple executions of a task, the commit
	   *          process also helps decide which execution will be included in
	   *          the final output. Users should consider whether their
	   *          application or data sink needs a commit operation.
	   * @param credentials
	   *          Credentials needed to access the data sink. Can be null.
	   * @return a new {@link DataSinkDescriptor} holding the given arguments
	   */
	  public static DataSinkDescriptor create(
	      OutputDescriptor outputDescriptor,
	      @Nullable OutputCommitterDescriptor committerDescriptor,
	      @Nullable Credentials credentials) {
	    final DataSinkDescriptor sink =
	        new DataSinkDescriptor(outputDescriptor, committerDescriptor, credentials);
	    return sink;
	  }

	  /**
	   * @return the {@link OutputDescriptor} this descriptor was created with
	   */
	  public OutputDescriptor getOutputDescriptor() {
	    return this.outputDescriptor;
	  }

	  /**
	   * @return the {@link OutputCommitterDescriptor} this descriptor was
	   *         created with, or null if none was specified
	   */
	  @Nullable
	  public OutputCommitterDescriptor getOutputCommitterDescriptor() {
	    return this.committerDescriptor;
	  }

	  /**
	   * @return the {@link Credentials} this descriptor was created with, or
	   *         null if none were specified
	   */
	  @Nullable
	  public Credentials getCredentials() {
	    return this.credentials;
	  }

	}