blob: d4bcc5bdc81306df57770d2832c71f651d4cccc9 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
* <p>
* http://www.apache.org/licenses/LICENSE-2.0
* <p>
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.hive.spark;
import com.esotericsoftware.kryo.Kryo;
import com.esotericsoftware.kryo.Serializer;
import com.esotericsoftware.kryo.io.Input;
import com.esotericsoftware.kryo.io.Output;
import org.apache.hadoop.hive.ql.io.HiveKey;
import org.apache.hadoop.io.BytesWritable;
import org.apache.spark.SparkConf;
import org.apache.spark.serializer.KryoSerializer;
/**
* A {@link KryoSerializer} that does not serialize hash codes while serializing a
* {@link HiveKey}. This decreases the amount of data to be shuffled during a Spark shuffle.
*/
public class NoHashCodeKryoSerializer extends KryoSerializer {
private static final long serialVersionUID = 3350910170041648022L;
public NoHashCodeKryoSerializer(SparkConf conf) {
super(conf);
}
@Override
public Kryo newKryo() {
Kryo kryo = super.newKryo();
kryo.register(HiveKey.class, new HiveKeySerializer());
kryo.register(BytesWritable.class, new HiveKryoRegistrator.BytesWritableSerializer());
return kryo;
}
private static class HiveKeySerializer extends Serializer<HiveKey> {
public void write(Kryo kryo, Output output, HiveKey object) {
output.writeVarInt(object.getLength(), true);
output.write(object.getBytes(), 0, object.getLength());
}
public HiveKey read(Kryo kryo, Input input, Class<HiveKey> type) {
int len = input.readVarInt(true);
byte[] bytes = new byte[len];
input.readBytes(bytes);
return new HiveKey(bytes);
}
}
}