From 798a8eeb509209015e619f0ec4b6826f2754634f Mon Sep 17 00:00:00 2001 From: Matthew Burgess Date: Thu, 12 Mar 2020 14:46:58 -0400 Subject: [PATCH] NIFI-7249: Force String keys in maps in DataTypeUtils.inferDataType() Signed-off-by: Pierre Villard This closes #4139. --- .../record/util/DataTypeUtils.java | 18 ++++++- .../record/TestDataTypeUtils.java | 31 +++++++++++ .../apache/nifi/avro/TestAvroTypeUtil.java | 51 +++++++++++++++++++ 3 files changed, 99 insertions(+), 1 deletion(-) diff --git a/nifi-commons/nifi-record/src/main/java/org/apache/nifi/serialization/record/util/DataTypeUtils.java b/nifi-commons/nifi-record/src/main/java/org/apache/nifi/serialization/record/util/DataTypeUtils.java index b1daa917d7..009332eb83 100644 --- a/nifi-commons/nifi-record/src/main/java/org/apache/nifi/serialization/record/util/DataTypeUtils.java +++ b/nifi-commons/nifi-record/src/main/java/org/apache/nifi/serialization/record/util/DataTypeUtils.java @@ -474,7 +474,23 @@ public class DataTypeUtils { // A value of a Map could be either a Record or a Map type. In either case, it must have Strings as keys. if (value instanceof Map) { - final Map map = (Map) value; + final Map map; + // Only transform the map if the keys aren't strings + boolean allStrings = true; + for (final Object key : ((Map) value).keySet()) { + if (!(key instanceof String)) { + allStrings = false; + break; + } + } + + if (allStrings) { + map = (Map) value; + } else { + final Map m = (Map) value; + map = new HashMap<>(m.size()); + m.forEach((k, v) -> map.put(k == null ? null : k.toString(), v)); + } return inferRecordDataType(map); // // Check if all types are the same. // if (map.isEmpty()) { diff --git a/nifi-commons/nifi-record/src/test/java/org/apache/nifi/serialization/record/TestDataTypeUtils.java b/nifi-commons/nifi-record/src/test/java/org/apache/nifi/serialization/record/TestDataTypeUtils.java index 30b2a60ab3..8152d4f67b 100644 --- a/nifi-commons/nifi-record/src/test/java/org/apache/nifi/serialization/record/TestDataTypeUtils.java +++ b/nifi-commons/nifi-record/src/test/java/org/apache/nifi/serialization/record/TestDataTypeUtils.java @@ -19,6 +19,7 @@ package org.apache.nifi.serialization.record; import org.apache.nifi.serialization.SimpleRecordSchema; import org.apache.nifi.serialization.record.type.ChoiceDataType; +import org.apache.nifi.serialization.record.type.RecordDataType; import org.apache.nifi.serialization.record.util.DataTypeUtils; import org.apache.nifi.serialization.record.util.IllegalTypeConversionException; import org.junit.Test; @@ -442,6 +443,36 @@ public class TestDataTypeUtils { assertEquals(expected, actual); } + @Test + public void testInferTypeWithMapStringKeys() { + Map map = new HashMap<>(); + map.put("a", "Hello"); + map.put("b", "World"); + + RecordDataType expected = (RecordDataType)RecordFieldType.RECORD.getRecordDataType(new SimpleRecordSchema(Arrays.asList( + new RecordField("a", RecordFieldType.STRING.getDataType()), + new RecordField("b", RecordFieldType.STRING.getDataType()) + ))); + + DataType actual = DataTypeUtils.inferDataType(map, null); + assertEquals(expected, actual); + } + + @Test + public void testInferTypeWithMapNonStringKeys() { + Map map = new HashMap<>(); + map.put(1, "Hello"); + map.put(2, "World"); + + RecordDataType expected = (RecordDataType)RecordFieldType.RECORD.getRecordDataType(new SimpleRecordSchema(Arrays.asList( + new RecordField("1", RecordFieldType.STRING.getDataType()), + new RecordField("2", RecordFieldType.STRING.getDataType()) + ))); + + DataType actual = DataTypeUtils.inferDataType(map, null); + assertEquals(expected, actual); + } + @Test public void testFindMostSuitableTypeWithBoolean() { testFindMostSuitableType(true, RecordFieldType.BOOLEAN.getDataType()); diff --git a/nifi-nar-bundles/nifi-extension-utils/nifi-record-utils/nifi-avro-record-utils/src/test/java/org/apache/nifi/avro/TestAvroTypeUtil.java b/nifi-nar-bundles/nifi-extension-utils/nifi-record-utils/nifi-avro-record-utils/src/test/java/org/apache/nifi/avro/TestAvroTypeUtil.java index a89ebe479c..5b5f55dd52 100644 --- a/nifi-nar-bundles/nifi-extension-utils/nifi-record-utils/nifi-avro-record-utils/src/test/java/org/apache/nifi/avro/TestAvroTypeUtil.java +++ b/nifi-nar-bundles/nifi-extension-utils/nifi-record-utils/nifi-avro-record-utils/src/test/java/org/apache/nifi/avro/TestAvroTypeUtil.java @@ -29,6 +29,7 @@ import org.apache.avro.generic.GenericDatumReader; import org.apache.avro.generic.GenericFixed; import org.apache.avro.generic.GenericRecord; import org.apache.avro.generic.GenericRecordBuilder; +import org.apache.avro.util.Utf8; import org.apache.nifi.schema.access.SchemaNotFoundException; import org.apache.nifi.serialization.SimpleRecordSchema; import org.apache.nifi.serialization.record.DataType; @@ -640,4 +641,54 @@ public class TestAvroTypeUtil { // THEN assertEquals(expected, actualAfterReverse); } + + @Test + public void testConvertAvroMap() { + // GIVEN + Map expected = new HashMap() {{ + put( + "nullableMapField", + new HashMap() {{ + put("key1", "value1"); + put("key2", "value2"); + }} + ); + }}; + + Schema nullableMapFieldAvroSchema = Schema.createUnion( + Schema.create(Type.NULL), + Schema.create(Type.INT), + Schema.createMap(Schema.create(Type.STRING)) + ); + + Schema avroRecordSchema = Schema.createRecord( + "record", "doc", "namespace", false, + Arrays.asList( + new Field("nullableMapField", nullableMapFieldAvroSchema, "nullable map field", (Object)null) + ) + ); + + Map value = new HashMap(){{ + put(new Utf8("key1"), "value1"); + put(new Utf8("key2"), "value2"); + }}; + + Record avroRecord = new GenericRecordBuilder(avroRecordSchema) + .set("nullableMapField", value) + .build(); + + RecordSchema nifiRecordSchema = new SimpleRecordSchema( + Arrays.asList( + new RecordField("nullableMapField", RecordFieldType.CHOICE.getChoiceDataType( + RecordFieldType.MAP.getMapDataType(RecordFieldType.STRING.getDataType()) + )) + ) + ); + + // WHEN + Object actual = AvroTypeUtil.convertAvroRecordToMap(avroRecord, nifiRecordSchema); + + // THEN + assertEquals(expected, actual); + } }