Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

nested columns + arrays = array columns! #13803

Merged
merged 24 commits into from
Mar 27, 2023
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
24 commits
Select commit Hold shift + click to select a range
a8bf82c
array columns!
clintropolis Feb 8, 2023
f66f0e5
add v4 segment test
clintropolis Feb 14, 2023
1acdad4
adjustments
clintropolis Feb 14, 2023
eb6976a
Merge remote-tracking branch 'upstream/master' into nested-array-columns
clintropolis Feb 19, 2023
524975b
add array element indexes
clintropolis Feb 20, 2023
dd4b899
Merge remote-tracking branch 'upstream/master' into nested-array-columns
clintropolis Mar 1, 2023
d8e1b3f
fixup
clintropolis Mar 2, 2023
8ff7933
Merge remote-tracking branch 'upstream/master' into nested-array-columns
clintropolis Mar 2, 2023
4f72c47
Merge remote-tracking branch 'upstream/master' into nested-array-columns
clintropolis Mar 3, 2023
0070157
more test
clintropolis Mar 3, 2023
ae382d0
Merge remote-tracking branch 'upstream/master' into nested-array-columns
clintropolis Mar 14, 2023
6712e7a
Merge remote-tracking branch 'upstream/master' into nested-array-columns
clintropolis Mar 15, 2023
26ebeef
Merge remote-tracking branch 'upstream/master' into nested-array-columns
clintropolis Mar 21, 2023
2ecd8bd
Merge remote-tracking branch 'upstream/master' into nested-array-columns
clintropolis Mar 22, 2023
7bfb113
Merge remote-tracking branch 'upstream/master' into nested-array-columns
clintropolis Mar 23, 2023
9ea04a3
changes:
clintropolis Mar 23, 2023
82f01aa
reuse field index for stuff
clintropolis Mar 23, 2023
810649c
fix tests
clintropolis Mar 23, 2023
76da0fb
adjust
clintropolis Mar 23, 2023
313f486
adjust again
clintropolis Mar 23, 2023
665e0bc
nested array tests
clintropolis Mar 24, 2023
e3f48a7
style and comments
clintropolis Mar 24, 2023
e988d05
remove negative tests
clintropolis Mar 24, 2023
1515267
fix stuff
clintropolis Mar 27, 2023
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
Expand Up @@ -106,7 +106,6 @@ public class AvroStreamInputFormatTest extends InitializedNullHandlingTest
private static final String TOPIC = "aTopic";
static final List<String> DIMENSIONS = Arrays.asList(EVENT_TYPE, ID, SOME_OTHER_ID, IS_VALID);
private static final List<String> DIMENSIONS_SCHEMALESS = Arrays.asList(
"nested",
SOME_OTHER_ID,
"someIntArray",
"someFloat",
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -86,7 +86,6 @@ public class AvroStreamInputRowParserTest
private static final ZonedDateTime DATE_TIME = ZonedDateTime.of(2015, 10, 25, 19, 30, 0, 0, ZoneOffset.UTC);
static final List<String> DIMENSIONS = Arrays.asList(EVENT_TYPE, ID, SOME_OTHER_ID, IS_VALID);
private static final List<String> DIMENSIONS_SCHEMALESS = Arrays.asList(
"nested",
SOME_OTHER_ID,
"someIntArray",
"someFloat",
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -36,7 +36,6 @@
import org.apache.druid.java.util.common.parsers.JSONPathFieldSpec;
import org.apache.druid.java.util.common.parsers.JSONPathFieldType;
import org.apache.druid.java.util.common.parsers.JSONPathSpec;
import org.apache.druid.math.expr.ExpressionProcessing;
import org.apache.druid.query.expression.TestExprMacroTable;
import org.apache.druid.segment.NestedDataDimensionSchema;
import org.apache.druid.segment.transform.ExpressionTransform;
Expand Down Expand Up @@ -453,7 +452,6 @@ public void testNestedColumnSchemaless() throws IOException
"middle",
"list",
"map",
"ts",
"decimal1"
);
try (CloseableIterator<InputRow> iterator = reader.read()) {
Expand Down Expand Up @@ -593,7 +591,6 @@ public void testListMap() throws IOException
@Test
public void testNestedArray() throws IOException
{
ExpressionProcessing.initializeForTests(true);
final InputFormat inputFormat = new OrcInputFormat(
new JSONPathSpec(
true,
Expand Down Expand Up @@ -669,9 +666,6 @@ public void testNestedArray() throws IOException
Assert.assertArrayEquals(new Object[]{1L, 2L}, (Object[]) row.getRaw("t_d_0"));
Assert.assertFalse(iterator.hasNext());
}
finally {
ExpressionProcessing.initializeForTests(null);
}
}

@Test
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -181,7 +181,7 @@ public void testNestedColumnSchemalessNestedTestFileNoNested() throws IOExceptio
);

List<InputRow> rows = readAllRows(reader);
Assert.assertEquals(ImmutableList.of("dim1", "metric1", "timestamp"), rows.get(0).getDimensions());
Assert.assertEquals(ImmutableList.of("dim1", "metric1"), rows.get(0).getDimensions());
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Why the change in expectation?

Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This is related to the change to the dimension filtering in MapBasedInputRow, which now always filters out the timestamp spec column.

In 'normal' production code the timestamp spec is added to the dimension exclusions, so the code in MapBasedInputRow that computes dimensions ensures the time column is not in the dimensions list. However, in test code — especially in processing, which doesn't have access to the methods that take a dataschema and transform it into an input row schema — it's pretty easy to forget to explicitly add the timestamp column to the dimension exclusion list. As a result of not manually adding the timestamp column to the exclusions, it would end up in the dimensions list in schema discovery modes, as a string (or nested column, depending on config), which in rollup tests means it ends up as part of the rollup key, and so on. (Again, this doesn't happen in current production code because it goes through that translator utility method.)

I made the change there to always filter the timestamp spec column from the dimensions list to make it easier to not write wrong tests for schema discovery mode, which caused the change here and other places.

Assert.assertEquals(FlattenSpecParquetInputTest.TS1, rows.get(0).getTimestamp().toString());
Assert.assertEquals(ImmutableList.of("d1v1"), rows.get(0).getDimension("dim1"));
Assert.assertEquals("d1v1", rows.get(0).getRaw("dim1"));
Expand Down Expand Up @@ -218,7 +218,7 @@ public void testNestedColumnSchemalessNestedTestFile() throws IOException
);

List<InputRow> rows = readAllRows(reader);
Assert.assertEquals(ImmutableList.of("nestedData", "dim1", "metric1", "timestamp"), rows.get(0).getDimensions());
Assert.assertEquals(ImmutableList.of("nestedData", "dim1", "metric1"), rows.get(0).getDimensions());
Assert.assertEquals(FlattenSpecParquetInputTest.TS1, rows.get(0).getTimestamp().toString());
Assert.assertEquals(ImmutableList.of("d1v1"), rows.get(0).getDimension("dim1"));
Assert.assertEquals("d1v1", rows.get(0).getRaw("dim1"));
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -75,7 +75,7 @@ public class ProtobufInputFormatTest
public void setUp() throws Exception
{
NullHandling.initializeForTests();
ExpressionProcessing.initializeForTests(null);
ExpressionProcessing.initializeForTests();
timestampSpec = new TimestampSpec("timestamp", "iso", null);
dimensionsSpec = new DimensionsSpec(Lists.newArrayList(
new StringDimensionSchema("event"),
Expand Down Expand Up @@ -243,7 +243,6 @@ public void testParseFlattenDataDiscover() throws Exception
.add("someFloatColumn")
.add("id")
.add("someBytesColumn")
.add("timestamp")
.build(),
row.getDimensions()
);
Expand Down Expand Up @@ -380,8 +379,7 @@ public void testParseNestedDataSchemaless() throws Exception
"someFloatColumn",
"eventType",
"id",
"someBytesColumn",
"timestamp"
"someBytesColumn"
),
row.getDimensions()
);
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -41,6 +41,7 @@
public class DelimitedInputFormat extends FlatTextInputFormat
{
public static final String TYPE_KEY = "tsv";

private static final String DEFAULT_DELIMITER = "\t";

@JsonCreator
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -40,7 +40,6 @@
public class JsonInputFormat extends NestedInputFormat
{
public static final String TYPE_KEY = "json";

private final Map<String, Boolean> featureSpec;
private final ObjectMapper objectMapper;
private final boolean keepNullColumns;
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -23,7 +23,6 @@
import com.fasterxml.jackson.annotation.JsonProperty;
import com.google.common.annotations.VisibleForTesting;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.Sets;
import org.apache.druid.data.input.InputRow;
import org.apache.druid.data.input.InputRowSchema;
import org.apache.druid.data.input.MapBasedInputRow;
Expand All @@ -36,6 +35,7 @@
import java.util.LinkedHashSet;
import java.util.List;
import java.util.Map;
import java.util.Set;

public class MapInputRowParser implements InputRowParser<Map<String, Object>>
{
Expand Down Expand Up @@ -77,22 +77,38 @@ public static InputRow parse(InputRowSchema inputRowSchema, Map<String, Object>
* 3) If isIncludeAllDimensions is not set and {@link DimensionsSpec#getDimensionNames()} is empty,
* the dimensions in the given map is returned.
*
* In any case, the returned list does not include any dimensions in {@link DimensionsSpec#getDimensionExclusions()}.
* In any case, the returned list does not include any dimensions in {@link DimensionsSpec#getDimensionExclusions()}
* or {@link TimestampSpec#getTimestampColumn()}.
*/
private static List<String> findDimensions(
    TimestampSpec timestampSpec,
    DimensionsSpec dimensionsSpec,
    Map<String, Object> rawInputRow
)
{
  // The timestamp column is always filtered from the returned dimensions, in addition to any
  // explicitly configured dimension exclusions, so schema-discovery modes never treat the
  // time column as a regular dimension.
  final String timestampColumn = timestampSpec.getTimestampColumn();
  final Set<String> exclusions = dimensionsSpec.getDimensionExclusions();
  if (dimensionsSpec.isIncludeAllDimensions()) {
    // Explicitly declared dimensions first (preserving declaration order), then any
    // additional fields discovered in the input row.
    LinkedHashSet<String> dimensions = new LinkedHashSet<>(dimensionsSpec.getDimensionNames());
    for (String field : rawInputRow.keySet()) {
      if (timestampColumn.equals(field) || exclusions.contains(field)) {
        continue;
      }
      dimensions.add(field);
    }
    return new ArrayList<>(dimensions);
  } else {
    if (!dimensionsSpec.getDimensionNames().isEmpty()) {
      // An explicit dimension list takes precedence; use it as-is.
      return dimensionsSpec.getDimensionNames();
    } else {
      // Schemaless: discover dimensions from the raw input row, skipping the timestamp
      // column and any configured exclusions.
      List<String> dimensions = new ArrayList<>();
      for (String field : rawInputRow.keySet()) {
        if (timestampColumn.equals(field) || exclusions.contains(field)) {
          continue;
        }
        dimensions.add(field);
      }
      return dimensions;
    }
  }
}
Expand All @@ -104,7 +120,7 @@ static InputRow parse(
Map<String, Object> theMap
) throws ParseException
{
final List<String> dimensionsToUse = findDimensions(dimensionsSpec, theMap);
final List<String> dimensionsToUse = findDimensions(timestampSpec, dimensionsSpec, theMap);

final DateTime timestamp;
try {
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -379,7 +379,6 @@ public ArrayExpr(ExpressionType outputType, @Nullable Object[] value)
{
super(outputType, value);
Preconditions.checkArgument(outputType.isArray(), "Output type %s is not an array", outputType);
ExpressionType.checkNestedArrayAllowed(outputType);
}

@Override
Expand Down
33 changes: 18 additions & 15 deletions processing/src/main/java/org/apache/druid/math/expr/ExprEval.java
Original file line number Diff line number Diff line change
Expand Up @@ -370,11 +370,26 @@ public static ExprEval ofComplex(ExpressionType outputType, @Nullable Object val
return new ComplexExprEval(outputType, value);
}

public static ExprEval bestEffortArray(@Nullable List<?> theList)
{
// do not convert empty lists to arrays with a single null element here, because that should have been done
// by the selectors preparing their ObjectBindings if necessary. If we get to this point it was legitimately
// empty
NonnullPair<ExpressionType, Object[]> coerced = coerceListToArray(theList, false);
if (coerced == null) {
return bestEffortOf(null);
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Calling bestEffortOf(null) looks to me like it's going to go through like 15 if statements, failing them all before just returning new StringExprEval(null). Why not just return the good thing here given that we already know what it should be and avoid the potential branches?

Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I think it would probably be best to have null handled first in bestEffortOf so that if we ever decide to represent null as something more sensible (like introduce a null type), we won't be making a 'string' here, not to mention the saving of not running through a bunch of checks for a null value.

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Sure, I expected you to actually to create a method for makeNullNode() or something in ExprEval instead of newing it up directly here. Just moving around the ordering of the statements is 🤷 . Though, checking for null first is probably better than last.

}
return ofArray(coerced.lhs, coerced.rhs);
}

/**
* Examine java type to find most appropriate expression type
*/
public static ExprEval bestEffortOf(@Nullable Object val)
{
if (val == null) {
return new StringExprEval(null);
}
if (val instanceof ExprEval) {
return (ExprEval) val;
}
Expand Down Expand Up @@ -468,14 +483,7 @@ public static ExprEval bestEffortOf(@Nullable Object val)

if (val instanceof List || val instanceof Object[]) {
final List<?> theList = val instanceof List ? ((List<?>) val) : Arrays.asList((Object[]) val);
// do not convert empty lists to arrays with a single null element here, because that should have been done
// by the selectors preparing their ObjectBindings if necessary. If we get to this point it was legitimately
// empty
NonnullPair<ExpressionType, Object[]> coerced = coerceListToArray(theList, false);
if (coerced == null) {
return bestEffortOf(null);
}
return ofArray(coerced.lhs, coerced.rhs);
return bestEffortArray(theList);
}

// in 'best effort' mode, we couldn't possibly use byte[] as a complex or anything else useful without type
Expand All @@ -485,12 +493,8 @@ public static ExprEval bestEffortOf(@Nullable Object val)
return new StringExprEval(StringUtils.encodeBase64String((byte[]) val));
}

if (val != null) {
// is this cool?
return new ComplexExprEval(ExpressionType.UNKNOWN_COMPLEX, val);
}

return new StringExprEval(null);
// is this cool?
return new ComplexExprEval(ExpressionType.UNKNOWN_COMPLEX, val);
}

public static ExprEval ofType(@Nullable ExpressionType type, @Nullable Object value)
Expand Down Expand Up @@ -1109,7 +1113,6 @@ private ArrayExprEval(ExpressionType arrayType, @Nullable Object[] value)
super(value);
this.arrayType = arrayType;
Preconditions.checkArgument(arrayType.isArray(), "Output type %s is not an array", arrayType);
ExpressionType.checkNestedArrayAllowed(arrayType);
}

@Override
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -22,8 +22,6 @@
import com.google.common.annotations.VisibleForTesting;
import com.google.inject.Inject;

import javax.annotation.Nullable;

/**
* Like {@link org.apache.druid.common.config.NullHandling}, except for expressions processing configs
*/
Expand All @@ -43,33 +41,23 @@ public class ExpressionProcessing
/**
* Many unit tests do not setup modules for this value to be injected, this method provides a manual way to initialize
* {@link #INSTANCE}
* @param allowNestedArrays
*/
@VisibleForTesting
public static void initializeForTests(@Nullable Boolean allowNestedArrays)
public static void initializeForTests()
{
INSTANCE = new ExpressionProcessingConfig(allowNestedArrays, null, null, null);
INSTANCE = new ExpressionProcessingConfig(null, null, null);
}

@VisibleForTesting
public static void initializeForStrictBooleansTests(boolean useStrict)
{
INSTANCE = new ExpressionProcessingConfig(null, useStrict, null, null);
INSTANCE = new ExpressionProcessingConfig(useStrict, null, null);
}

@VisibleForTesting
public static void initializeForHomogenizeNullMultiValueStrings()
{
INSTANCE = new ExpressionProcessingConfig(null, null, null, true);
}

/**
* [['is expression support for'],['nested arrays'],['enabled?']]
*/
public static boolean allowNestedArrays()
{
checkInitialized();
return INSTANCE.allowNestedArrays();
INSTANCE = new ExpressionProcessingConfig(null, null, true);
}

/**
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,6 @@

public class ExpressionProcessingConfig
{
public static final String NESTED_ARRAYS_CONFIG_STRING = "druid.expressions.allowNestedArrays";
public static final String NULL_HANDLING_LEGACY_LOGICAL_OPS_STRING = "druid.expressions.useStrictBooleans";
// Coerce arrays to multi value strings
public static final String PROCESS_ARRAYS_AS_MULTIVALUE_STRINGS_CONFIG_STRING =
Expand All @@ -35,9 +34,6 @@ public class ExpressionProcessingConfig
public static final String HOMOGENIZE_NULL_MULTIVALUE_STRING_ARRAYS =
"druid.expressions.homogenizeNullMultiValueStringArrays";

@JsonProperty("allowNestedArrays")
private final boolean allowNestedArrays;

@JsonProperty("useStrictBooleans")
private final boolean useStrictBooleans;

Expand All @@ -49,13 +45,11 @@ public class ExpressionProcessingConfig

@JsonCreator
public ExpressionProcessingConfig(
@JsonProperty("allowNestedArrays") @Nullable Boolean allowNestedArrays,
@JsonProperty("useStrictBooleans") @Nullable Boolean useStrictBooleans,
@JsonProperty("processArraysAsMultiValueStrings") @Nullable Boolean processArraysAsMultiValueStrings,
@JsonProperty("homogenizeNullMultiValueStringArrays") @Nullable Boolean homogenizeNullMultiValueStringArrays
)
{
this.allowNestedArrays = getWithPropertyFallbackFalse(allowNestedArrays, NESTED_ARRAYS_CONFIG_STRING);
this.useStrictBooleans = getWithPropertyFallbackFalse(useStrictBooleans, NULL_HANDLING_LEGACY_LOGICAL_OPS_STRING);
this.processArraysAsMultiValueStrings = getWithPropertyFallbackFalse(
processArraysAsMultiValueStrings,
Expand All @@ -67,11 +61,6 @@ public ExpressionProcessingConfig(
);
}

public boolean allowNestedArrays()
{
return allowNestedArrays;
}

public boolean isUseStrictBooleans()
{
return useStrictBooleans;
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -23,7 +23,6 @@
import com.fasterxml.jackson.annotation.JsonProperty;
import com.fasterxml.jackson.databind.annotation.JsonSerialize;
import com.fasterxml.jackson.databind.ser.std.ToStringSerializer;
import org.apache.druid.java.util.common.IAE;
import org.apache.druid.java.util.common.ISE;
import org.apache.druid.segment.column.BaseTypeSignature;
import org.apache.druid.segment.column.ColumnType;
Expand Down Expand Up @@ -210,11 +209,4 @@ public static ColumnType toColumnType(ExpressionType exprType)
throw new ISE("Unsupported expression type[%s]", exprType);
}
}

public static void checkNestedArrayAllowed(ExpressionType outputType)
{
if (outputType.isArray() && outputType.getElementType().isArray() && !ExpressionProcessing.allowNestedArrays()) {
throw new IAE("Cannot create a nested array type [%s], 'druid.expressions.allowNestedArrays' must be set to true", outputType);
}
}
}
Original file line number Diff line number Diff line change
Expand Up @@ -3054,7 +3054,6 @@ static ExpressionType setArrayOutput(@Nullable ExpressionType arrayType, Object[
if (arrayType == null) {
arrayType = ExpressionTypeFactory.getInstance().ofArray(evaluated.type());
}
ExpressionType.checkNestedArrayAllowed(arrayType);
if (arrayType.getElementType().isNumeric() && evaluated.isNumericNull()) {
out[i] = null;
} else if (!evaluated.asArrayType().equals(arrayType)) {
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -480,10 +480,25 @@ public Expr apply(List<Expr> args)
final StructuredDataProcessor processor = new StructuredDataProcessor()
{
@Override
public StructuredDataProcessor.ProcessedLiteral<?> processLiteralField(ArrayList<NestedPathPart> fieldPath, Object fieldValue)
public ProcessedValue<?> processField(ArrayList<NestedPathPart> fieldPath, @Nullable Object fieldValue)
{
// do nothing, we only want the list of fields returned by this processor
return StructuredDataProcessor.ProcessedLiteral.NULL_LITERAL;
return ProcessedValue.NULL_LITERAL;
}

@Nullable
@Override
public ProcessedValue<?> processArrayField(
ArrayList<NestedPathPart> fieldPath,
@Nullable List<?> array
)
{
// we only want to return a non-null value here if the value is an array of primitive values
ExprEval<?> eval = ExprEval.bestEffortArray(array);
if (eval.type().isArray() && eval.type().getElementType().isPrimitive()) {
return ProcessedValue.NULL_LITERAL;
}
return null;
}
};

Expand Down
Loading