From 035ed477ca3d80ac844678b475d519cc22769455 Mon Sep 17 00:00:00 2001 From: Krisso Date: Thu, 18 Jan 2024 10:33:13 +0100 Subject: [PATCH] TDD approach - adding unit tests which should pass but they fail. --- .../recordWithNestedNotNullComplexFields.avsc | 35 ++++++ ...recordWithNestedNullableComplexFields.avsc | 50 ++++++++ .../FastGenericDeserializerGeneratorTest.java | 32 ++++- ...FastSpecificDeserializerGeneratorTest.java | 66 ++++++++++ ...nericDeserializer_1244262185_49792023.java | 113 ++++++++++++++++++ ...cificDeserializer_1244262185_49792023.java | 100 ++++++++++++++++ 6 files changed, 395 insertions(+), 1 deletion(-) create mode 100644 fastserde/avro-fastserde-tests-common/src/test/avro/recordWithNestedNotNullComplexFields.avsc create mode 100644 fastserde/avro-fastserde-tests-common/src/test/avro/recordWithNestedNullableComplexFields.avsc create mode 100644 fastserde/avro-fastserde-tests111/build/codegen/java/com/linkedin/avro/fastserde/generated/deserialization/AVRO_1_11/OuterRecordWithNestedNullableComplexFields_GenericDeserializer_1244262185_49792023.java create mode 100644 fastserde/avro-fastserde-tests111/build/codegen/java/com/linkedin/avro/fastserde/generated/deserialization/AVRO_1_11/OuterRecordWithNestedNullableComplexFields_SpecificDeserializer_1244262185_49792023.java diff --git a/fastserde/avro-fastserde-tests-common/src/test/avro/recordWithNestedNotNullComplexFields.avsc b/fastserde/avro-fastserde-tests-common/src/test/avro/recordWithNestedNotNullComplexFields.avsc new file mode 100644 index 000000000..241f5d2cd --- /dev/null +++ b/fastserde/avro-fastserde-tests-common/src/test/avro/recordWithNestedNotNullComplexFields.avsc @@ -0,0 +1,35 @@ +{ + "type": "record", + "name": "OuterRecordWithNestedNotNullComplexFields", + "namespace": "com.linkedin.avro.fastserde.generated.avro", + "doc": "Used in tests of fast-serde to serialize record with schema having not-null complex fields", + "fields": [ + { + "name": "innerRecord", + "type": { + "name": "InnerRecordNotNull", + "type": "record", + "fields": [ + { + "name": "comment", + "type": "string" + } + ] + } + }, + { + "name": "innerMap", + "type": { + "type": "map", + "values": "int" + } + }, + { + "name": "innerArray", + "type": { + "type": "array", + "items": "int" + } + } + ] +} diff --git a/fastserde/avro-fastserde-tests-common/src/test/avro/recordWithNestedNullableComplexFields.avsc b/fastserde/avro-fastserde-tests-common/src/test/avro/recordWithNestedNullableComplexFields.avsc new file mode 100644 index 000000000..c0777fde9 --- /dev/null +++ b/fastserde/avro-fastserde-tests-common/src/test/avro/recordWithNestedNullableComplexFields.avsc @@ -0,0 +1,50 @@ +{ + "type": "record", + "name": "OuterRecordWithNestedNullableComplexFields", + "aliases": [ + "OuterRecordWithNestedNotNullComplexFields" + ], + "namespace": "com.linkedin.avro.fastserde.generated.avro", + "doc": "Used in tests of fast-serde to deserialize record serialized with schema having not-null complex fields", + "fields": [ + { + "name": "innerRecord", + "type": [ + "null", + { + "name": "InnerRecordNullable", + "aliases": [ + "InnerRecordNotNull" + ], + "type": "record", + "fields": [ + { + "name": "comment", + "type": "string" + } + ] + } + ] + }, + { + "name": "innerMap", + "type": [ + "null", + { + "type": "map", + "values": "int" + } + ] + }, + { + "name": "innerArray", + "type": [ + "null", + { + "type": "array", + "items": "int" + } + ] + } + ] +} diff --git a/fastserde/avro-fastserde-tests-common/src/test/java/com/linkedin/avro/fastserde/FastGenericDeserializerGeneratorTest.java b/fastserde/avro-fastserde-tests-common/src/test/java/com/linkedin/avro/fastserde/FastGenericDeserializerGeneratorTest.java index 6c2194254..70f3acc19 100644 --- a/fastserde/avro-fastserde-tests-common/src/test/java/com/linkedin/avro/fastserde/FastGenericDeserializerGeneratorTest.java +++ b/fastserde/avro-fastserde-tests-common/src/test/java/com/linkedin/avro/fastserde/FastGenericDeserializerGeneratorTest.java @@ -5,8 +5,14 @@ import com.linkedin.avro.api.PrimitiveFloatList; import com.linkedin.avro.api.PrimitiveIntList; import com.linkedin.avro.api.PrimitiveLongList; +import com.linkedin.avro.fastserde.generated.avro.InnerRecordNotNull; +import com.linkedin.avro.fastserde.generated.avro.OuterRecordWithNestedNotNullComplexFields; +import com.linkedin.avro.fastserde.generated.avro.OuterRecordWithNestedNullableComplexFields; import com.linkedin.avroutil1.compatibility.AvroCompatibilityHelper; +import com.linkedin.avroutil1.compatibility.AvroRecordUtil; import com.linkedin.avroutil1.compatibility.AvroVersion; + +import java.io.ByteArrayOutputStream; import java.io.File; import java.io.IOException; import java.lang.reflect.Method; @@ -26,16 +32,21 @@ import org.apache.avro.generic.GenericData; import org.apache.avro.generic.GenericDatumReader; import org.apache.avro.generic.GenericRecord; +import org.apache.avro.io.BinaryDecoder; +import org.apache.avro.io.BinaryEncoder; import org.apache.avro.io.Decoder; +import org.apache.avro.specific.SpecificDatumWriter; import org.apache.avro.util.Utf8; import org.testng.Assert; import org.testng.SkipException; import org.testng.annotations.BeforeTest; import org.testng.annotations.DataProvider; import org.testng.annotations.Test; +import org.testng.collections.Lists; +import org.testng.internal.collections.Pair; import static com.linkedin.avro.fastserde.FastSerdeTestsSupport.*; - +import static com.linkedin.avro.fastserde.FastSpecificDeserializerGeneratorTest.createAndSerializeOuterRecordWithNotNullComplexFields; public class FastGenericDeserializerGeneratorTest { @@ -1590,6 +1601,25 @@ record = new GenericData.Record(recordWithUnionMapOfUnionValuesSchema); Assert.assertEquals(((Map) recordB.get("someInts")).get(new Utf8("3")), Integer.valueOf(3)); } + @Test(groups = {"deserializationTest"}, dataProvider = "Implementation") + void deserializeNullableFieldsPreviouslySerializedAsNotNull(Implementation implementation) throws IOException { + // given: outerRecord1 serialized using schema with not-null complex fields + Pair pair = createAndSerializeOuterRecordWithNotNullComplexFields(); + OuterRecordWithNestedNotNullComplexFields outerRecord1 = pair.first(); + byte[] serializedOuterRecord1 = pair.second(); + + Schema writerSchema = OuterRecordWithNestedNotNullComplexFields.SCHEMA$; // without nullable fields + Schema readerSchema = OuterRecordWithNestedNullableComplexFields.SCHEMA$; // contains nullable fields + BinaryDecoder binaryDecoder = AvroCompatibilityHelper.newBinaryDecoder(serializedOuterRecord1); + + // when: serialized outerRecord1 is deserialized using readerSchema with nullable complex fields + GenericRecord outerRecord2 = implementation.decode(writerSchema, readerSchema, binaryDecoder); + + // then: deserialized outerRecord2 is the same as outerRecord1 (initial one) + Assert.assertNotNull(outerRecord2); + Assert.assertEquals(outerRecord2.toString(), outerRecord1.toString()); + } + private static T decodeRecordColdFast(Schema writerSchema, Schema readerSchema, Decoder decoder) { FastDeserializer deserializer = new FastSerdeUtils.FastDeserializerWithAvroGenericImpl<>(writerSchema, readerSchema, GenericData.get(), false); diff --git a/fastserde/avro-fastserde-tests-common/src/test/java/com/linkedin/avro/fastserde/FastSpecificDeserializerGeneratorTest.java b/fastserde/avro-fastserde-tests-common/src/test/java/com/linkedin/avro/fastserde/FastSpecificDeserializerGeneratorTest.java index 327ebdbc1..04b39c2a6 100644 --- a/fastserde/avro-fastserde-tests-common/src/test/java/com/linkedin/avro/fastserde/FastSpecificDeserializerGeneratorTest.java +++ b/fastserde/avro-fastserde-tests-common/src/test/java/com/linkedin/avro/fastserde/FastSpecificDeserializerGeneratorTest.java @@ -2,9 +2,12 @@ package com.linkedin.avro.fastserde; import com.linkedin.avro.fastserde.generated.avro.FullRecord; +import com.linkedin.avro.fastserde.generated.avro.InnerRecordNotNull; import com.linkedin.avro.fastserde.generated.avro.IntRecord; import com.linkedin.avro.fastserde.generated.avro.MyEnumV2; import com.linkedin.avro.fastserde.generated.avro.MyRecordV2; +import com.linkedin.avro.fastserde.generated.avro.OuterRecordWithNestedNotNullComplexFields; +import com.linkedin.avro.fastserde.generated.avro.OuterRecordWithNestedNullableComplexFields; import com.linkedin.avro.fastserde.generated.avro.RecordWithLargeUnionField; import com.linkedin.avro.fastserde.generated.avro.RemovedTypesTestRecord; import com.linkedin.avro.fastserde.generated.avro.SplitRecordTest1; @@ -16,6 +19,9 @@ import com.linkedin.avro.fastserde.generated.avro.TestRecord; import com.linkedin.avro.fastserde.generated.avro.UnionOfRecordsWithSameNameEnumField; import com.linkedin.avroutil1.compatibility.AvroCompatibilityHelper; +import com.linkedin.avroutil1.compatibility.AvroRecordUtil; + +import java.io.ByteArrayOutputStream; import java.io.File; import java.io.IOException; import java.net.URL; @@ -31,13 +37,18 @@ import org.apache.avro.Schema; import org.apache.avro.generic.GenericData; import org.apache.avro.generic.GenericRecord; +import org.apache.avro.io.BinaryDecoder; +import org.apache.avro.io.BinaryEncoder; import org.apache.avro.io.Decoder; import org.apache.avro.specific.SpecificDatumReader; +import org.apache.avro.specific.SpecificDatumWriter; import org.apache.avro.util.Utf8; import org.testng.Assert; import org.testng.annotations.BeforeTest; import org.testng.annotations.DataProvider; import org.testng.annotations.Test; +import org.testng.collections.Lists; +import org.testng.internal.collections.Pair; import static com.linkedin.avro.fastserde.FastSerdeTestsSupport.*; @@ -844,6 +855,61 @@ public void largeSchemasWithUnionCanBeHandled() { } } + @Test(groups = {"deserializationTest"}, dataProvider = "SlowFastDeserializer") + void deserializeNullableFieldsPreviouslySerializedAsNotNull(boolean useFastSerializer) throws IOException { + // given: outerRecord1 serialized using schema with not-null complex fields + Pair pair = createAndSerializeOuterRecordWithNotNullComplexFields(); + OuterRecordWithNestedNotNullComplexFields outerRecord1 = pair.first(); + byte[] serializedOuterRecord1 = pair.second(); + BinaryDecoder binaryDecoder = AvroCompatibilityHelper.newBinaryDecoder(serializedOuterRecord1); + + Schema writerSchema = OuterRecordWithNestedNotNullComplexFields.SCHEMA$; // without nullable fields + Schema readerSchema = OuterRecordWithNestedNullableComplexFields.SCHEMA$; // contains nullable fields + + // when: serialized outerRecord1 is deserialized using readerSchema with nullable complex fields + OuterRecordWithNestedNullableComplexFields outerRecord2; + if (useFastSerializer) { + outerRecord2 = decodeRecordFast(readerSchema, writerSchema, binaryDecoder); + } else { + outerRecord2 = decodeRecordSlow(readerSchema, writerSchema, binaryDecoder); + } + + // then: deserialized outerRecord2 is the same as outerRecord1 (initial one) + Assert.assertNotNull(outerRecord2); + Assert.assertEquals(outerRecord2.toString(), outerRecord1.toString()); + } + + /** + * @return serialized {@link OuterRecordWithNestedNotNullComplexFields} + */ + static Pair createAndSerializeOuterRecordWithNotNullComplexFields() throws IOException { + InnerRecordNotNull innerRecord = AvroRecordUtil.setField(new InnerRecordNotNull(), "comment", "awesome comment"); + + Map innerMap = new HashMap<>(); + innerMap.put("one", 1); + innerMap.put("twotwo", 22); + innerMap.put("three x 3", 333); + + List innerArray = Lists.newArrayList(234, 2342, 948563); + + OuterRecordWithNestedNotNullComplexFields outerRecord1 = new OuterRecordWithNestedNotNullComplexFields(); + AvroRecordUtil.setField(outerRecord1, "innerRecord", innerRecord); + AvroRecordUtil.setField(outerRecord1, "innerMap", innerMap); + AvroRecordUtil.setField(outerRecord1, "innerArray", innerArray); + + Schema writerSchema = OuterRecordWithNestedNotNullComplexFields.SCHEMA$; + SpecificDatumWriter datumWriter = new SpecificDatumWriter<>(writerSchema); + ByteArrayOutputStream baos = new ByteArrayOutputStream(); + BinaryEncoder binaryEncoder = AvroCompatibilityHelper.newBinaryEncoder(baos); + + datumWriter.write(outerRecord1, binaryEncoder); + binaryEncoder.flush(); + + byte[] serializedOuterRecord1 = baos.toByteArray(); + + return Pair.of(outerRecord1, serializedOuterRecord1); + } + private T decodeRecordFast(Schema readerSchema, Schema writerSchema, Decoder decoder) { FastDeserializer deserializer = new FastSpecificDeserializerGenerator(writerSchema, readerSchema, tempDir, classLoader, diff --git a/fastserde/avro-fastserde-tests111/build/codegen/java/com/linkedin/avro/fastserde/generated/deserialization/AVRO_1_11/OuterRecordWithNestedNullableComplexFields_GenericDeserializer_1244262185_49792023.java b/fastserde/avro-fastserde-tests111/build/codegen/java/com/linkedin/avro/fastserde/generated/deserialization/AVRO_1_11/OuterRecordWithNestedNullableComplexFields_GenericDeserializer_1244262185_49792023.java new file mode 100644 index 000000000..6ae8626dc --- /dev/null +++ b/fastserde/avro-fastserde-tests111/build/codegen/java/com/linkedin/avro/fastserde/generated/deserialization/AVRO_1_11/OuterRecordWithNestedNullableComplexFields_GenericDeserializer_1244262185_49792023.java @@ -0,0 +1,113 @@ + +package com.linkedin.avro.fastserde.generated.deserialization.AVRO_1_11; + +import java.io.IOException; +import java.util.Map; +import com.linkedin.avro.api.PrimitiveIntList; +import com.linkedin.avro.fastserde.FastDeserializer; +import com.linkedin.avro.fastserde.customized.DatumReaderCustomization; +import com.linkedin.avro.fastserde.primitive.PrimitiveIntArrayList; +import org.apache.avro.Schema; +import org.apache.avro.generic.IndexedRecord; +import org.apache.avro.io.Decoder; +import org.apache.avro.util.Utf8; + +public class OuterRecordWithNestedNullableComplexFields_GenericDeserializer_1244262185_49792023 + implements FastDeserializer +{ + + private final Schema readerSchema; + private final Schema innerRecord0; + private final Schema innerRecordNullableRecordSchema0; + private final Schema innerMap0; + private final Schema innerMapMapSchema0; + private final Schema innerArray0; + private final Schema innerArrayArraySchema0; + + public OuterRecordWithNestedNullableComplexFields_GenericDeserializer_1244262185_49792023(Schema readerSchema) { + this.readerSchema = readerSchema; + this.innerRecord0 = readerSchema.getField("innerRecord").schema(); + this.innerRecordNullableRecordSchema0 = innerRecord0 .getTypes().get(1); + this.innerMap0 = readerSchema.getField("innerMap").schema(); + this.innerMapMapSchema0 = innerMap0 .getTypes().get(1); + this.innerArray0 = readerSchema.getField("innerArray").schema(); + this.innerArrayArraySchema0 = innerArray0 .getTypes().get(1); + } + + public IndexedRecord deserialize(IndexedRecord reuse, Decoder decoder, DatumReaderCustomization customization) + throws IOException + { + return deserializeOuterRecordWithNestedNullableComplexFields0((reuse), (decoder), (customization)); + } + + public IndexedRecord deserializeOuterRecordWithNestedNullableComplexFields0(Object reuse, Decoder decoder, DatumReaderCustomization customization) + throws IOException + { + IndexedRecord OuterRecordWithNestedNullableComplexFields; + if ((((reuse)!= null)&&((reuse) instanceof IndexedRecord))&&(((IndexedRecord)(reuse)).getSchema() == readerSchema)) { + OuterRecordWithNestedNullableComplexFields = ((IndexedRecord)(reuse)); + } else { + OuterRecordWithNestedNullableComplexFields = new org.apache.avro.generic.GenericData.Record(readerSchema); + } + OuterRecordWithNestedNullableComplexFields.put(0, deserializeInnerRecordNullable0(OuterRecordWithNestedNullableComplexFields.get(0), (decoder), (customization))); + populate_OuterRecordWithNestedNullableComplexFields0((OuterRecordWithNestedNullableComplexFields), (customization), (decoder)); + return OuterRecordWithNestedNullableComplexFields; + } + + public IndexedRecord deserializeInnerRecordNullable0(Object reuse, Decoder decoder, DatumReaderCustomization customization) + throws IOException + { + IndexedRecord InnerRecordNullable; + if ((((reuse)!= null)&&((reuse) instanceof IndexedRecord))&&(((IndexedRecord)(reuse)).getSchema() == innerRecordNullableRecordSchema0)) { + InnerRecordNullable = ((IndexedRecord)(reuse)); + } else { + InnerRecordNullable = new org.apache.avro.generic.GenericData.Record(innerRecordNullableRecordSchema0); + } + Utf8 charSequence0; + Object oldString0 = InnerRecordNullable.get(0); + if (oldString0 instanceof Utf8) { + charSequence0 = (decoder).readString(((Utf8) oldString0)); + } else { + charSequence0 = (decoder).readString(null); + } + InnerRecordNullable.put(0, charSequence0); + return InnerRecordNullable; + } + + private void populate_OuterRecordWithNestedNullableComplexFields0(IndexedRecord OuterRecordWithNestedNullableComplexFields, DatumReaderCustomization customization, Decoder decoder) + throws IOException + { + Map innerMap1 = null; + long chunkLen0 = (decoder.readMapStart()); + if (chunkLen0 > 0) { + innerMap1 = ((Map)(customization).getNewMapOverrideFunc().apply(OuterRecordWithNestedNullableComplexFields.get(1), ((int) chunkLen0))); + do { + for (int counter0 = 0; (counter0 0); + } else { + innerMap1 = ((Map)(customization).getNewMapOverrideFunc().apply(OuterRecordWithNestedNullableComplexFields.get(1), 0)); + } + OuterRecordWithNestedNullableComplexFields.put(1, innerMap1); + PrimitiveIntList innerArray1 = null; + long chunkLen1 = (decoder.readArrayStart()); + Object oldArray0 = OuterRecordWithNestedNullableComplexFields.get(2); + if (oldArray0 instanceof PrimitiveIntList) { + innerArray1 = ((PrimitiveIntList) oldArray0); + innerArray1 .clear(); + } else { + innerArray1 = new PrimitiveIntArrayList(((int) chunkLen1)); + } + while (chunkLen1 > 0) { + for (int counter1 = 0; (counter1 +{ + + private final Schema readerSchema; + + public OuterRecordWithNestedNullableComplexFields_SpecificDeserializer_1244262185_49792023(Schema readerSchema) { + this.readerSchema = readerSchema; + } + + public com.linkedin.avro.fastserde.generated.avro.OuterRecordWithNestedNullableComplexFields deserialize(com.linkedin.avro.fastserde.generated.avro.OuterRecordWithNestedNullableComplexFields reuse, Decoder decoder, DatumReaderCustomization customization) + throws IOException + { + return deserializeOuterRecordWithNestedNullableComplexFields0((reuse), (decoder), (customization)); + } + + public com.linkedin.avro.fastserde.generated.avro.OuterRecordWithNestedNullableComplexFields deserializeOuterRecordWithNestedNullableComplexFields0(Object reuse, Decoder decoder, DatumReaderCustomization customization) + throws IOException + { + com.linkedin.avro.fastserde.generated.avro.OuterRecordWithNestedNullableComplexFields OuterRecordWithNestedNullableComplexFields; + if ((reuse)!= null) { + OuterRecordWithNestedNullableComplexFields = ((com.linkedin.avro.fastserde.generated.avro.OuterRecordWithNestedNullableComplexFields)(reuse)); + } else { + OuterRecordWithNestedNullableComplexFields = new com.linkedin.avro.fastserde.generated.avro.OuterRecordWithNestedNullableComplexFields(); + } + OuterRecordWithNestedNullableComplexFields.put(0, deserializeInnerRecordNullable0(OuterRecordWithNestedNullableComplexFields.get(0), (decoder), (customization))); + populate_OuterRecordWithNestedNullableComplexFields0((OuterRecordWithNestedNullableComplexFields), (customization), (decoder)); + return OuterRecordWithNestedNullableComplexFields; + } + + public com.linkedin.avro.fastserde.generated.avro.InnerRecordNullable deserializeInnerRecordNullable0(Object reuse, Decoder decoder, DatumReaderCustomization customization) + throws IOException + { + com.linkedin.avro.fastserde.generated.avro.InnerRecordNullable InnerRecordNullable; + if ((reuse)!= null) { + InnerRecordNullable = ((com.linkedin.avro.fastserde.generated.avro.InnerRecordNullable)(reuse)); + } else { + InnerRecordNullable = new com.linkedin.avro.fastserde.generated.avro.InnerRecordNullable(); + } + Utf8 charSequence0; + Object oldString0 = InnerRecordNullable.get(0); + if (oldString0 instanceof Utf8) { + charSequence0 = (decoder).readString(((Utf8) oldString0)); + } else { + charSequence0 = (decoder).readString(null); + } + InnerRecordNullable.put(0, charSequence0); + return InnerRecordNullable; + } + + private void populate_OuterRecordWithNestedNullableComplexFields0(com.linkedin.avro.fastserde.generated.avro.OuterRecordWithNestedNullableComplexFields OuterRecordWithNestedNullableComplexFields, DatumReaderCustomization customization, Decoder decoder) + throws IOException + { + Map innerMap0 = null; + long chunkLen0 = (decoder.readMapStart()); + if (chunkLen0 > 0) { + innerMap0 = ((Map)(customization).getNewMapOverrideFunc().apply(OuterRecordWithNestedNullableComplexFields.get(1), ((int) chunkLen0))); + do { + for (int counter0 = 0; (counter0 0); + } else { + innerMap0 = ((Map)(customization).getNewMapOverrideFunc().apply(OuterRecordWithNestedNullableComplexFields.get(1), 0)); + } + OuterRecordWithNestedNullableComplexFields.put(1, innerMap0); + PrimitiveIntList innerArray0 = null; + long chunkLen1 = (decoder.readArrayStart()); + Object oldArray0 = OuterRecordWithNestedNullableComplexFields.get(2); + if (oldArray0 instanceof PrimitiveIntList) { + innerArray0 = ((PrimitiveIntList) oldArray0); + innerArray0 .clear(); + } else { + innerArray0 = new PrimitiveIntArrayList(((int) chunkLen1)); + } + while (chunkLen1 > 0) { + for (int counter1 = 0; (counter1