blob: 63689809ea5bc1c4de72eeb24750908646209e62 [file] [log] [blame]
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.cloudera.sqoop.testutil;
import java.io.EOFException;
import java.io.IOException;
import java.util.ArrayList;
import java.util.List;
import org.apache.commons.lang.RandomStringUtils;
import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FileStatus;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import com.cloudera.sqoop.SqoopOptions;
import com.cloudera.sqoop.Sqoop;
import com.cloudera.sqoop.orm.CompilationManager;
import com.cloudera.sqoop.tool.SqoopTool;
import com.cloudera.sqoop.tool.ImportTool;
import com.cloudera.sqoop.util.ClassLoaderStack;
import org.junit.Before;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.fail;
/**
* Class that implements common methods required for tests which import data
* from SQL into HDFS and verify correct import.
*/
public abstract class ImportJobTestCase extends BaseSqoopTestCase {
public static final Log LOG = LogFactory.getLog(
ImportJobTestCase.class.getName());
@Before
public void setUp() {
super.setUp();
removeTableDir();
}
protected String getTablePrefix() {
return "IMPORT_TABLE_";
}
/**
* @return a list of additional args to pass to the sqoop command line.
*/
protected List<String> getExtraArgs(Configuration conf) {
return new ArrayList<String>();
}
/**
* Create the argv to pass to Sqoop.
* @param includeHadoopFlags if true, then include -D various.settings=values
* @param colNames the columns to import. If null, all columns are used.
* @param conf a Configuration specifying additional properties to use when
* determining the arguments.
* @return the argv as an array of strings.
*/
protected String [] getArgv(boolean includeHadoopFlags, String [] colNames,
Configuration conf) {
if (null == colNames) {
colNames = getColNames();
}
String splitByCol = colNames[0];
String columnsString = "";
for (String col : colNames) {
columnsString += col + ",";
}
ArrayList<String> args = new ArrayList<String>();
if (includeHadoopFlags) {
CommonArgs.addHadoopFlags(args);
}
args.add("--table");
args.add(getTableName());
args.add("--columns");
args.add(columnsString);
args.add("--split-by");
args.add(splitByCol);
args.add("--warehouse-dir");
args.add(getWarehouseDir());
args.add("--connect");
args.add(getConnectString());
args.add("--as-sequencefile");
args.add("--num-mappers");
args.add("1");
args.addAll(getExtraArgs(conf));
return args.toArray(new String[0]);
}
/**
* Do a MapReduce-based import of the table and verify that the results
* were imported as expected. (tests readFields(ResultSet) and toString())
* @param expectedVal the value we injected into the table.
* @param importCols the columns to import. If null, all columns are used.
*/
protected void verifyImport(String expectedVal, String [] importCols) {
// paths to where our output file will wind up.
Path tableDirPath = getTablePath();
removeTableDir();
Configuration conf = getConf();
//Need to disable OraOop for existing tests
conf.set("oraoop.disabled", "true");
SqoopOptions opts = getSqoopOptions(conf);
// run the tool through the normal entry-point.
int ret;
try {
Sqoop importer = new Sqoop(new ImportTool(), conf, opts);
ret = Sqoop.runSqoop(importer, getArgv(true, importCols, conf));
} catch (Exception e) {
LOG.error("Got exception running Sqoop: " + e.toString());
throw new RuntimeException(e);
}
// expect a successful return.
assertEquals("Failure during job", 0, ret);
opts = getSqoopOptions(conf);
try {
ImportTool importTool = new ImportTool();
opts = importTool.parseArguments(getArgv(false, importCols, conf), conf,
opts, true);
} catch (Exception e) {
fail(e.toString());
}
CompilationManager compileMgr = new CompilationManager(opts);
String jarFileName = compileMgr.getJarFilename();
ClassLoader prevClassLoader = null;
try {
prevClassLoader = ClassLoaderStack.addJarFile(jarFileName,
getTableName());
// Now open and check all part-files in the table path until we find
// a non-empty one that we can verify contains the value.
if (!BaseSqoopTestCase.isOnPhysicalCluster()) {
conf.set(CommonArgs.FS_DEFAULT_NAME, CommonArgs.LOCAL_FS);
}
FileSystem fs = FileSystem.get(conf);
FileStatus [] stats = fs.listStatus(tableDirPath);
if (stats == null || stats.length == 0) {
fail("Error: no files in " + tableDirPath);
}
boolean foundRecord = false;
for (FileStatus stat : stats) {
if (!stat.getPath().getName().startsWith("part-")
&& !stat.getPath().getName().startsWith("data-")) {
// This isn't a data file. Ignore it.
continue;
}
try {
Object readValue = SeqFileReader.getFirstValue(
stat.getPath().toString());
LOG.info("Read back from sequencefile: " + readValue);
foundRecord = true;
// Add trailing '\n' to expected value since SqoopRecord.toString()
// encodes the record delim.
if (null == expectedVal) {
assertEquals("Error validating result from SeqFile", "null\n",
readValue.toString());
} else {
assertEquals("Error validating result from SeqFile",
expectedVal + "\n", readValue.toString());
}
} catch (EOFException eoe) {
// EOF in a file isn't necessarily a problem. We may have some
// empty sequence files, which will throw this. Just continue
// in the loop.
}
}
if (!foundRecord) {
fail("Couldn't read any records from SequenceFiles");
}
} catch (IOException ioe) {
fail("IOException: " + ioe.toString());
} finally {
if (null != prevClassLoader) {
ClassLoaderStack.setCurrentClassLoader(prevClassLoader);
}
}
}
/**
* Run a MapReduce-based import (using the argv provided to control
* execution).
*/
protected void runImport(SqoopTool tool, String [] argv) throws IOException {
// run the tool through the normal entry-point.
int ret;
try {
Configuration conf = getConf();
//Need to disable OraOop for existing tests
conf.set("oraoop.disabled", "true");
SqoopOptions opts = getSqoopOptions(conf);
Sqoop sqoop = new Sqoop(tool, conf, opts);
ret = Sqoop.runSqoop(sqoop, argv);
} catch (Exception e) {
LOG.error("Got exception running Sqoop: " + e.toString());
e.printStackTrace();
ret = 1;
}
// expect a successful return.
if (0 != ret) {
throw new IOException("Failure during job; return status " + ret);
}
}
/** run an import using the default ImportTool. */
protected void runImport(String [] argv) throws IOException {
runImport(new ImportTool(), argv);
}
}