HADOOP-6443. Serialization classes accept invalid metadata. Contributed by Aaron Kimball.
git-svn-id: https://svn.apache.org/repos/asf/hadoop/common/trunk@895831 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
parent
3cb2e3112b
commit
efcad06506
@ -80,6 +80,9 @@ Trunk (unreleased changes)
|
|||||||
HADOOP-6472. add tokenCache option to GenericOptionsParser for passing
|
HADOOP-6472. add tokenCache option to GenericOptionsParser for passing
|
||||||
file with secret keys to a map reduce job. (boryas)
|
file with secret keys to a map reduce job. (boryas)
|
||||||
|
|
||||||
|
HADOOP-6443. Serialization classes accept invalid metadata.
|
||||||
|
(Aaron Kimball via tomwhite)
|
||||||
|
|
||||||
OPTIMIZATIONS
|
OPTIMIZATIONS
|
||||||
|
|
||||||
BUG FIXES
|
BUG FIXES
|
||||||
|
@ -99,9 +99,7 @@ public class JavaSerialization extends SerializationBase<Serializable> {
|
|||||||
}
|
}
|
||||||
|
|
||||||
public boolean accept(Map<String, String> metadata) {
|
public boolean accept(Map<String, String> metadata) {
|
||||||
String intendedSerializer = metadata.get(SERIALIZATION_KEY);
|
if (!checkSerializationKey(metadata)) {
|
||||||
if (intendedSerializer != null &&
|
|
||||||
!getClass().getName().equals(intendedSerializer)) {
|
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -101,4 +101,17 @@ public abstract class SerializationBase<T> extends Configured
|
|||||||
* for this given metadata.
|
* for this given metadata.
|
||||||
*/
|
*/
|
||||||
public abstract RawComparator<T> getRawComparator(Map<String,String> metadata);
|
public abstract RawComparator<T> getRawComparator(Map<String,String> metadata);
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Check that the SERIALIZATION_KEY, if set, matches the current class.
|
||||||
|
* @param metadata the serialization metadata to check.
|
||||||
|
* @return true if SERIALIZATION_KEY is unset, or if it matches the current class
|
||||||
|
* (meaning that accept() should continue processing), or false if it is a mismatch,
|
||||||
|
* meaning that accept() should return false.
|
||||||
|
*/
|
||||||
|
protected boolean checkSerializationKey(Map<String, String> metadata) {
|
||||||
|
String intendedSerializer = metadata.get(SERIALIZATION_KEY);
|
||||||
|
return intendedSerializer == null ||
|
||||||
|
getClass().getName().equals(intendedSerializer);
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
@ -135,11 +135,10 @@ public class WritableSerialization extends SerializationBase<Writable> {
|
|||||||
|
|
||||||
@Override
|
@Override
|
||||||
public boolean accept(Map<String, String> metadata) {
|
public boolean accept(Map<String, String> metadata) {
|
||||||
String intendedSerializer = metadata.get(SERIALIZATION_KEY);
|
if (!checkSerializationKey(metadata)) {
|
||||||
if (intendedSerializer != null &&
|
|
||||||
!getClass().getName().equals(intendedSerializer)) {
|
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
Class<?> c = getClassFromMetadata(metadata);
|
Class<?> c = getClassFromMetadata(metadata);
|
||||||
return c == null ? false : Writable.class.isAssignableFrom(c);
|
return c == null ? false : Writable.class.isAssignableFrom(c);
|
||||||
}
|
}
|
||||||
|
@ -30,16 +30,18 @@ import org.apache.hadoop.io.serializer.SerializationBase;
|
|||||||
|
|
||||||
/**
|
/**
|
||||||
* Serialization for Avro Generic classes. For a class to be accepted by this
|
* Serialization for Avro Generic classes. For a class to be accepted by this
|
||||||
* serialization it must have metadata with key
|
* serialization it must have a schema specified.
|
||||||
* {@link SerializationBase#SERIALIZATION_KEY} set to {@link AvroGenericSerialization}'s
|
|
||||||
* fully-qualified classname.
|
|
||||||
* The schema used is the one set by {@link AvroSerialization#AVRO_SCHEMA_KEY}.
|
* The schema used is the one set by {@link AvroSerialization#AVRO_SCHEMA_KEY}.
|
||||||
*/
|
*/
|
||||||
@SuppressWarnings("unchecked")
|
@SuppressWarnings("unchecked")
|
||||||
public class AvroGenericSerialization extends AvroSerialization<Object> {
|
public class AvroGenericSerialization extends AvroSerialization<Object> {
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public boolean accept(Map<String, String> metadata) {
|
public boolean accept(Map<String, String> metadata) {
|
||||||
|
if (!checkSerializationKey(metadata)) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
return metadata.get(AVRO_SCHEMA_KEY) != null;
|
return metadata.get(AVRO_SCHEMA_KEY) != null;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -54,8 +54,8 @@ public class AvroReflectSerialization extends AvroSerialization<Object>{
|
|||||||
if (packages == null) {
|
if (packages == null) {
|
||||||
getPackages();
|
getPackages();
|
||||||
}
|
}
|
||||||
if (getClass().getName().equals(metadata.get(SERIALIZATION_KEY))) {
|
if (!checkSerializationKey(metadata)) {
|
||||||
return true;
|
return false;
|
||||||
}
|
}
|
||||||
Class<?> c = getClassFromMetadata(metadata);
|
Class<?> c = getClassFromMetadata(metadata);
|
||||||
if (c == null) {
|
if (c == null) {
|
||||||
|
@ -141,8 +141,7 @@ public abstract class AvroSerialization<T> extends SerializationBase<T> {
|
|||||||
* @return a RawComparator parameterized for the specified Avro schema.
|
* @return a RawComparator parameterized for the specified Avro schema.
|
||||||
*/
|
*/
|
||||||
public RawComparator<T> getRawComparator(Map<String, String> metadata) {
|
public RawComparator<T> getRawComparator(Map<String, String> metadata) {
|
||||||
Schema schema = Schema.parse(metadata.get(AVRO_SCHEMA_KEY));
|
Schema schema = getSchema(metadata);
|
||||||
return new AvroComparator(schema);
|
return new AvroComparator(schema);
|
||||||
}
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
|
@ -39,8 +39,8 @@ public class AvroSpecificSerialization
|
|||||||
|
|
||||||
@Override
|
@Override
|
||||||
public boolean accept(Map<String, String> metadata) {
|
public boolean accept(Map<String, String> metadata) {
|
||||||
if (getClass().getName().equals(metadata.get(SERIALIZATION_KEY))) {
|
if (!checkSerializationKey(metadata)) {
|
||||||
return true;
|
return false;
|
||||||
}
|
}
|
||||||
Class<?> c = getClassFromMetadata(metadata);
|
Class<?> c = getClassFromMetadata(metadata);
|
||||||
return c == null ? false : SpecificRecord.class.isAssignableFrom(c);
|
return c == null ? false : SpecificRecord.class.isAssignableFrom(c);
|
||||||
|
@ -23,15 +23,20 @@ import static org.apache.hadoop.io.TestGenericWritable.CONF_TEST_VALUE;
|
|||||||
import junit.framework.TestCase;
|
import junit.framework.TestCase;
|
||||||
|
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
|
import java.util.HashMap;
|
||||||
import java.util.Map;
|
import java.util.Map;
|
||||||
|
|
||||||
import org.apache.hadoop.conf.Configuration;
|
import org.apache.hadoop.conf.Configuration;
|
||||||
import org.apache.hadoop.io.DataOutputBuffer;
|
import org.apache.hadoop.io.DataOutputBuffer;
|
||||||
|
import org.apache.hadoop.io.RawComparator;
|
||||||
import org.apache.hadoop.io.Text;
|
import org.apache.hadoop.io.Text;
|
||||||
import org.apache.hadoop.io.TestGenericWritable.Foo;
|
import org.apache.hadoop.io.TestGenericWritable.Foo;
|
||||||
import org.apache.hadoop.io.TestGenericWritable.Bar;
|
import org.apache.hadoop.io.TestGenericWritable.Bar;
|
||||||
import org.apache.hadoop.io.TestGenericWritable.Baz;
|
import org.apache.hadoop.io.TestGenericWritable.Baz;
|
||||||
import org.apache.hadoop.io.TestGenericWritable.FooGenericWritable;
|
import org.apache.hadoop.io.TestGenericWritable.FooGenericWritable;
|
||||||
|
import org.apache.hadoop.io.serializer.DeserializerBase;
|
||||||
|
import org.apache.hadoop.io.serializer.SerializationBase;
|
||||||
|
import org.apache.hadoop.io.serializer.SerializerBase;
|
||||||
import org.apache.hadoop.util.GenericsUtil;
|
import org.apache.hadoop.util.GenericsUtil;
|
||||||
|
|
||||||
public class TestWritableSerialization extends TestCase {
|
public class TestWritableSerialization extends TestCase {
|
||||||
@ -61,6 +66,26 @@ public class TestWritableSerialization extends TestCase {
|
|||||||
assertNotNull(result.getConf());
|
assertNotNull(result.getConf());
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@SuppressWarnings("unchecked")
|
||||||
|
public void testIgnoreMisconfiguredMetadata() throws IOException {
|
||||||
|
// If SERIALIZATION_KEY is set, still need class name.
|
||||||
|
|
||||||
|
Configuration conf = new Configuration();
|
||||||
|
Map<String, String> metadata = new HashMap<String, String>();
|
||||||
|
metadata.put(SerializationBase.SERIALIZATION_KEY,
|
||||||
|
WritableSerialization.class.getName());
|
||||||
|
SerializationFactory factory = new SerializationFactory(conf);
|
||||||
|
SerializationBase serialization = factory.getSerialization(metadata);
|
||||||
|
assertNull("Got serializer without any class info", serialization);
|
||||||
|
|
||||||
|
metadata.put(SerializationBase.CLASS_KEY,
|
||||||
|
Text.class.getName());
|
||||||
|
serialization = factory.getSerialization(metadata);
|
||||||
|
assertNotNull("Didn't get serialization!", serialization);
|
||||||
|
assertTrue("Wrong serialization class",
|
||||||
|
serialization instanceof WritableSerialization);
|
||||||
|
}
|
||||||
|
|
||||||
@SuppressWarnings("unchecked")
|
@SuppressWarnings("unchecked")
|
||||||
public void testReuseSerializer() throws IOException {
|
public void testReuseSerializer() throws IOException {
|
||||||
// Test that we can write multiple objects of the same type
|
// Test that we can write multiple objects of the same type
|
||||||
@ -112,4 +137,46 @@ public class TestWritableSerialization extends TestCase {
|
|||||||
barSerializer.close();
|
barSerializer.close();
|
||||||
out.reset();
|
out.reset();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
// Test the SerializationBase.checkSerializationKey() method.
|
||||||
|
class DummySerializationBase extends SerializationBase<Object> {
|
||||||
|
public boolean accept(Map<String, String> metadata) {
|
||||||
|
return checkSerializationKey(metadata);
|
||||||
|
}
|
||||||
|
|
||||||
|
public SerializerBase<Object> getSerializer(Map<String, String> metadata) {
|
||||||
|
return null;
|
||||||
|
}
|
||||||
|
|
||||||
|
public DeserializerBase<Object> getDeserializer(Map<String, String> metadata) {
|
||||||
|
return null;
|
||||||
|
}
|
||||||
|
|
||||||
|
public RawComparator<Object> getRawComparator(Map<String, String> metadata) {
|
||||||
|
return null;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
public void testSerializationKeyCheck() {
|
||||||
|
DummySerializationBase dummy = new DummySerializationBase();
|
||||||
|
Map<String, String> metadata = new HashMap<String, String>();
|
||||||
|
|
||||||
|
assertTrue("Didn't accept empty metadata", dummy.accept(metadata));
|
||||||
|
|
||||||
|
metadata.put(SerializationBase.SERIALIZATION_KEY,
|
||||||
|
DummySerializationBase.class.getName());
|
||||||
|
assertTrue("Didn't accept valid metadata", dummy.accept(metadata));
|
||||||
|
|
||||||
|
metadata.put(SerializationBase.SERIALIZATION_KEY, "foo");
|
||||||
|
assertFalse("Accepted invalid metadata", dummy.accept(metadata));
|
||||||
|
|
||||||
|
try {
|
||||||
|
dummy.accept((Map<String, String>) null);
|
||||||
|
// Shouldn't get here!
|
||||||
|
fail("Somehow didn't actually test the method we expected");
|
||||||
|
} catch (NullPointerException npe) {
|
||||||
|
// expected this.
|
||||||
|
}
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
@ -26,12 +26,38 @@ import junit.framework.TestCase;
|
|||||||
import org.apache.avro.util.Utf8;
|
import org.apache.avro.util.Utf8;
|
||||||
import org.apache.hadoop.conf.Configuration;
|
import org.apache.hadoop.conf.Configuration;
|
||||||
import org.apache.hadoop.io.serializer.SerializationBase;
|
import org.apache.hadoop.io.serializer.SerializationBase;
|
||||||
|
import org.apache.hadoop.io.serializer.SerializationFactory;
|
||||||
import org.apache.hadoop.io.serializer.SerializationTestUtil;
|
import org.apache.hadoop.io.serializer.SerializationTestUtil;
|
||||||
|
|
||||||
public class TestAvroSerialization extends TestCase {
|
public class TestAvroSerialization extends TestCase {
|
||||||
|
|
||||||
private static final Configuration conf = new Configuration();
|
private static final Configuration conf = new Configuration();
|
||||||
|
|
||||||
|
@SuppressWarnings("unchecked")
|
||||||
|
public void testIgnoreMisconfiguredMetadata() {
|
||||||
|
// If SERIALIZATION_KEY is set, still need class name.
|
||||||
|
|
||||||
|
Configuration conf = new Configuration();
|
||||||
|
Map<String, String> metadata = new HashMap<String, String>();
|
||||||
|
SerializationFactory factory = new SerializationFactory(conf);
|
||||||
|
SerializationBase serialization = null;
|
||||||
|
|
||||||
|
metadata.put(SerializationBase.SERIALIZATION_KEY,
|
||||||
|
AvroGenericSerialization.class.getName());
|
||||||
|
serialization = factory.getSerialization(metadata);
|
||||||
|
assertNull("Got serializer without any class info", serialization);
|
||||||
|
|
||||||
|
metadata.put(SerializationBase.SERIALIZATION_KEY,
|
||||||
|
AvroReflectSerialization.class.getName());
|
||||||
|
serialization = factory.getSerialization(metadata);
|
||||||
|
assertNull("Got serializer without any class info", serialization);
|
||||||
|
|
||||||
|
metadata.put(SerializationBase.SERIALIZATION_KEY,
|
||||||
|
AvroSpecificSerialization.class.getName());
|
||||||
|
serialization = factory.getSerialization(metadata);
|
||||||
|
assertNull("Got serializer without any class info", serialization);
|
||||||
|
}
|
||||||
|
|
||||||
public void testSpecific() throws Exception {
|
public void testSpecific() throws Exception {
|
||||||
AvroRecord before = new AvroRecord();
|
AvroRecord before = new AvroRecord();
|
||||||
before.intField = 5;
|
before.intField = 5;
|
||||||
|
Loading…
x
Reference in New Issue
Block a user