You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@nifi.apache.org by ma...@apache.org on 2020/12/03 22:23:27 UTC

[nifi] branch main updated: NIFI-8070: Added coalesce function to RecordPath

This is an automated email from the ASF dual-hosted git repository.

markap14 pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/nifi.git


The following commit(s) were added to refs/heads/main by this push:
     new d845836  NIFI-8070: Added coalesce function to RecordPath
d845836 is described below

commit d84583690f9323932cce851679770dea9d7a435f
Author: Mark Payne <ma...@hotmail.com>
AuthorDate: Thu Dec 3 16:05:26 2020 -0500

    NIFI-8070: Added coalesce function to RecordPath
---
 .../nifi/record/path/functions/Coalesce.java       | 53 ++++++++++++++++
 .../nifi/record/path/paths/RecordPathCompiler.java | 71 ++++++++++++---------
 .../apache/nifi/record/path/TestRecordPath.java    | 60 ++++++++++++++++++
 nifi-docs/src/main/asciidoc/record-path-guide.adoc | 73 ++++++++++++++++++++++
 4 files changed, 227 insertions(+), 30 deletions(-)

diff --git a/nifi-commons/nifi-record-path/src/main/java/org/apache/nifi/record/path/functions/Coalesce.java b/nifi-commons/nifi-record-path/src/main/java/org/apache/nifi/record/path/functions/Coalesce.java
new file mode 100644
index 0000000..24945d3
--- /dev/null
+++ b/nifi-commons/nifi-record-path/src/main/java/org/apache/nifi/record/path/functions/Coalesce.java
@@ -0,0 +1,53 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.nifi.record.path.functions;
+
+import org.apache.nifi.record.path.FieldValue;
+import org.apache.nifi.record.path.RecordPathEvaluationContext;
+import org.apache.nifi.record.path.paths.RecordPathSegment;
+
+import java.util.Optional;
+import java.util.stream.Stream;
+
+public class Coalesce extends RecordPathSegment {
+    // Argument paths of the "coalesce" function; evaluate() tries them in array order.
+    private final RecordPathSegment[] valuePaths;
+
+    public Coalesce(final RecordPathSegment[] valuePaths, final boolean absolute) {
+        super("coalesce", null, absolute);
+        this.valuePaths = valuePaths;
+    }
+    // Returns a single-element Stream for the first argument whose first FieldValue is non-null, otherwise an empty Stream.
+    @Override
+    public Stream<FieldValue> evaluate(final RecordPathEvaluationContext context) {
+        for (final RecordPathSegment valuePath : valuePaths) {
+            final Stream<FieldValue> stream = valuePath.evaluate(context);
+            final Optional<FieldValue> firstFieldValue = stream.findFirst();
+            // Only the first FieldValue produced by each argument path is inspected; any further elements are ignored.
+            if (firstFieldValue.isPresent()) {
+                // A present Optional only means the path selected a field; its value may still be explicitly null, in which case the next argument is tried.
+                final FieldValue fieldValue = firstFieldValue.get();
+                if (fieldValue.getValue() != null) {
+                    return Stream.of(firstFieldValue.get());
+                }
+            }
+        }
+        // No argument path produced a first FieldValue with a non-null value.
+        return Stream.empty();
+    }
+}
diff --git a/nifi-commons/nifi-record-path/src/main/java/org/apache/nifi/record/path/paths/RecordPathCompiler.java b/nifi-commons/nifi-record-path/src/main/java/org/apache/nifi/record/path/paths/RecordPathCompiler.java
index 8b09243..7cb1ead 100644
--- a/nifi-commons/nifi-record-path/src/main/java/org/apache/nifi/record/path/paths/RecordPathCompiler.java
+++ b/nifi-commons/nifi-record-path/src/main/java/org/apache/nifi/record/path/paths/RecordPathCompiler.java
@@ -17,35 +17,6 @@
 
 package org.apache.nifi.record.path.paths;
 
-import static org.apache.nifi.record.path.RecordPathParser.ARRAY_INDEX;
-import static org.apache.nifi.record.path.RecordPathParser.CHILD_REFERENCE;
-import static org.apache.nifi.record.path.RecordPathParser.CURRENT_FIELD;
-import static org.apache.nifi.record.path.RecordPathParser.DESCENDANT_REFERENCE;
-import static org.apache.nifi.record.path.RecordPathParser.EQUAL;
-import static org.apache.nifi.record.path.RecordPathParser.FIELD_NAME;
-import static org.apache.nifi.record.path.RecordPathParser.FUNCTION;
-import static org.apache.nifi.record.path.RecordPathParser.GREATER_THAN;
-import static org.apache.nifi.record.path.RecordPathParser.GREATER_THAN_EQUAL;
-import static org.apache.nifi.record.path.RecordPathParser.LESS_THAN;
-import static org.apache.nifi.record.path.RecordPathParser.LESS_THAN_EQUAL;
-import static org.apache.nifi.record.path.RecordPathParser.MAP_KEY;
-import static org.apache.nifi.record.path.RecordPathParser.NOT_EQUAL;
-import static org.apache.nifi.record.path.RecordPathParser.NUMBER;
-import static org.apache.nifi.record.path.RecordPathParser.NUMBER_LIST;
-import static org.apache.nifi.record.path.RecordPathParser.NUMBER_RANGE;
-import static org.apache.nifi.record.path.RecordPathParser.PARENT_REFERENCE;
-import static org.apache.nifi.record.path.RecordPathParser.PATH;
-import static org.apache.nifi.record.path.RecordPathParser.PREDICATE;
-import static org.apache.nifi.record.path.RecordPathParser.RELATIVE_PATH;
-import static org.apache.nifi.record.path.RecordPathParser.ROOT_REFERENCE;
-import static org.apache.nifi.record.path.RecordPathParser.STRING_LIST;
-import static org.apache.nifi.record.path.RecordPathParser.STRING_LITERAL;
-import static org.apache.nifi.record.path.RecordPathParser.WILDCARD;
-
-import java.util.ArrayList;
-import java.util.List;
-import java.util.function.BiFunction;
-
 import org.antlr.runtime.tree.Tree;
 import org.apache.nifi.record.path.NumericRange;
 import org.apache.nifi.record.path.exception.RecordPathException;
@@ -66,9 +37,10 @@ import org.apache.nifi.record.path.filter.RecordPathFilter;
 import org.apache.nifi.record.path.filter.StartsWith;
 import org.apache.nifi.record.path.functions.Base64Decode;
 import org.apache.nifi.record.path.functions.Base64Encode;
+import org.apache.nifi.record.path.functions.Coalesce;
 import org.apache.nifi.record.path.functions.Concat;
-import org.apache.nifi.record.path.functions.Format;
 import org.apache.nifi.record.path.functions.FieldName;
+import org.apache.nifi.record.path.functions.Format;
 import org.apache.nifi.record.path.functions.Hash;
 import org.apache.nifi.record.path.functions.PadLeft;
 import org.apache.nifi.record.path.functions.PadRight;
@@ -88,6 +60,35 @@ import org.apache.nifi.record.path.functions.ToUpperCase;
 import org.apache.nifi.record.path.functions.TrimString;
 import org.apache.nifi.record.path.functions.UUID5;
 
+import java.util.ArrayList;
+import java.util.List;
+import java.util.function.BiFunction;
+
+import static org.apache.nifi.record.path.RecordPathParser.ARRAY_INDEX;
+import static org.apache.nifi.record.path.RecordPathParser.CHILD_REFERENCE;
+import static org.apache.nifi.record.path.RecordPathParser.CURRENT_FIELD;
+import static org.apache.nifi.record.path.RecordPathParser.DESCENDANT_REFERENCE;
+import static org.apache.nifi.record.path.RecordPathParser.EQUAL;
+import static org.apache.nifi.record.path.RecordPathParser.FIELD_NAME;
+import static org.apache.nifi.record.path.RecordPathParser.FUNCTION;
+import static org.apache.nifi.record.path.RecordPathParser.GREATER_THAN;
+import static org.apache.nifi.record.path.RecordPathParser.GREATER_THAN_EQUAL;
+import static org.apache.nifi.record.path.RecordPathParser.LESS_THAN;
+import static org.apache.nifi.record.path.RecordPathParser.LESS_THAN_EQUAL;
+import static org.apache.nifi.record.path.RecordPathParser.MAP_KEY;
+import static org.apache.nifi.record.path.RecordPathParser.NOT_EQUAL;
+import static org.apache.nifi.record.path.RecordPathParser.NUMBER;
+import static org.apache.nifi.record.path.RecordPathParser.NUMBER_LIST;
+import static org.apache.nifi.record.path.RecordPathParser.NUMBER_RANGE;
+import static org.apache.nifi.record.path.RecordPathParser.PARENT_REFERENCE;
+import static org.apache.nifi.record.path.RecordPathParser.PATH;
+import static org.apache.nifi.record.path.RecordPathParser.PREDICATE;
+import static org.apache.nifi.record.path.RecordPathParser.RELATIVE_PATH;
+import static org.apache.nifi.record.path.RecordPathParser.ROOT_REFERENCE;
+import static org.apache.nifi.record.path.RecordPathParser.STRING_LIST;
+import static org.apache.nifi.record.path.RecordPathParser.STRING_LITERAL;
+import static org.apache.nifi.record.path.RecordPathParser.WILDCARD;
+
 public class RecordPathCompiler {
 
     public static RecordPathSegment compile(final Tree pathTree, final RecordPathSegment root, final boolean absolute) {
@@ -343,6 +344,16 @@ public class RecordPathCompiler {
                             return new UUID5(args[0], null, absolute);
                         }
                     }
+                    case "coalesce": {
+                        final int numArgs = argumentListTree.getChildCount();
+
+                        final RecordPathSegment[] argPaths = new RecordPathSegment[numArgs];
+                        for (int i = 0; i < numArgs; i++) {
+                            argPaths[i] = buildPath(argumentListTree.getChild(i), null, absolute);
+                        }
+
+                        return new Coalesce(argPaths, absolute);
+                    }
                     default: {
                         throw new RecordPathException("Invalid function call: The '" + functionName + "' function does not exist or can only "
                             + "be used within a predicate, not as a standalone function");
diff --git a/nifi-commons/nifi-record-path/src/test/java/org/apache/nifi/record/path/TestRecordPath.java b/nifi-commons/nifi-record-path/src/test/java/org/apache/nifi/record/path/TestRecordPath.java
index 5ef4099..682ab7f 100644
--- a/nifi-commons/nifi-record-path/src/test/java/org/apache/nifi/record/path/TestRecordPath.java
+++ b/nifi-commons/nifi-record-path/src/test/java/org/apache/nifi/record/path/TestRecordPath.java
@@ -48,6 +48,7 @@ import java.util.stream.IntStream;
 
 import static org.junit.Assert.assertArrayEquals;
 import static org.junit.Assert.assertEquals;
+import static org.junit.Assert.assertFalse;
 import static org.junit.Assert.assertNull;
 import static org.junit.Assert.assertTrue;
 
@@ -1215,6 +1216,65 @@ public class TestRecordPath {
         assertEquals("John Doe: 48", RecordPath.compile("concat(/firstName, ' ', /lastName, ': ', 48)").evaluate(record).getSelectedFields().findFirst().get().getValue());
     }
 
+
+    @Test
+    public void testCoalesce() {
+        final List<RecordField> fields = new ArrayList<>();
+        fields.add(new RecordField("id", RecordFieldType.INT.getDataType()));
+        fields.add(new RecordField("name", RecordFieldType.STRING.getDataType()));
+
+        final RecordSchema schema = new SimpleRecordSchema(fields);
+        // Note: "id" is declared INT in the schema but populated with the String "1234"; the assertions below expect that String back.
+        final Map<String, Object> values = new HashMap<>();
+        values.put("id", "1234");
+        values.put("name", null);
+        Record record = new MapRecord(schema, values);
+        // The same compiled path is evaluated against several records that differ only in which fields are null or absent.
+        final RecordPath recordPath = RecordPath.compile("coalesce(/id, /name)");
+
+        // Test where the first argument (/id) is populated and the second (/name) is null
+        FieldValue fieldValue = recordPath.evaluate(record).getSelectedFields().findFirst().get();
+        assertEquals("1234", fieldValue.getValue());
+        assertEquals("id", fieldValue.getField().getFieldName());
+
+        // Test where the first argument is null, so the second argument (/name) is selected
+        values.clear();
+        values.put("id", null);
+        values.put("name", "John Doe");
+
+        record = new MapRecord(schema, values);
+        fieldValue = recordPath.evaluate(record).getSelectedFields().findFirst().get();
+        assertEquals("John Doe", fieldValue.getValue());
+        assertEquals("name", fieldValue.getField().getFieldName());
+
+        // Test all null: no field is selected at all
+        values.clear();
+        values.put("id", null);
+        values.put("name", null);
+
+        record = new MapRecord(schema, values);
+        assertFalse(recordPath.evaluate(record).getSelectedFields().findFirst().isPresent());
+
+        // Test where neither value is null: the first argument (/id) wins
+        values.clear();
+        values.put("id", "1234");
+        values.put("name", "John Doe");
+
+        record = new MapRecord(schema, values);
+        fieldValue = recordPath.evaluate(record).getSelectedFields().findFirst().get();
+        assertEquals("1234", fieldValue.getValue());
+        assertEquals("id", fieldValue.getField().getFieldName());
+
+        // Test missing field: "id" is not put into the value map at all, and /name is expected to be selected
+        values.clear();
+        values.put("name", "John Doe");
+
+        record = new MapRecord(schema, values);
+        fieldValue = recordPath.evaluate(record).getSelectedFields().findFirst().get();
+        assertEquals("John Doe", fieldValue.getValue());
+        assertEquals("name", fieldValue.getField().getFieldName());
+    }
+
     private Record getCaseTestRecord() {
         final List<RecordField> fields = new ArrayList<>();
         fields.add(new RecordField("middleName", RecordFieldType.STRING.getDataType()));
diff --git a/nifi-docs/src/main/asciidoc/record-path-guide.adoc b/nifi-docs/src/main/asciidoc/record-path-guide.adoc
index 996d3fd..0f2f2dc 100644
--- a/nifi-docs/src/main/asciidoc/record-path-guide.adoc
+++ b/nifi-docs/src/main/asciidoc/record-path-guide.adoc
@@ -561,6 +561,79 @@ The following record path would convert the String field into a byte array using
 
 `toBytes( /s, "UTF-16")`
 
+=== coalesce
+
+Returns the first value from the given arguments that is non-null. For example, given a record such as:
+
+----
+{
+  "id": null,
+  "name": "John Doe"
+}
+----
+
+The following record path would return "John Doe":
+
+`coalesce(/id, /name)`
+
+Given the record:
+
+----
+{
+  "id": "1234",
+  "name": null
+}
+----
+
+The same record path would return "1234".
+
+Given the record:
+
+----
+{
+  "id": null,
+  "name": null
+}
+----
+
+The record path would return `null` (no field is selected), because neither argument has a non-null value.
+
+Given the record:
+
+----
+{
+  "id": "null",
+  "name": "John Doe"
+}
+----
+
+The record path would return the String "null". Note here the very important difference in that the `id`
+field does not have a null value but rather the value of the field is the literal string "null".
+
+Given the record:
+
+----
+{
+  "name": null
+}
+----
+
+The record path would return `null`. Given that the `id` field is not present, it is treated as a `null` value.
+
+Given the record:
+
+----
+{
+  "id": "1234",
+  "name": "John Doe"
+}
+----
+
+The record path would return "1234". However, the record path `coalesce(/name, /id)` would return "John Doe" because
+both fields given are non-null, so the `coalesce` function returns the first value that is referenced in its arguments,
+not the first value that is encountered in the Record itself.
+
+
 === format
 
 Converts a Date to a String in the given format with the given time zone(optional, default time zone is GMT).