/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.nifi.processors.standard;
import org.apache.commons.lang3.StringUtils;
import org.apache.nifi.annotation.behavior.InputRequirement;
import org.apache.nifi.annotation.behavior.InputRequirement.Requirement;
import org.apache.nifi.annotation.behavior.SideEffectFree;
import org.apache.nifi.annotation.behavior.SupportsBatching;
import org.apache.nifi.annotation.behavior.WritesAttribute;
import org.apache.nifi.annotation.behavior.WritesAttributes;
import org.apache.nifi.annotation.documentation.CapabilityDescription;
import org.apache.nifi.annotation.documentation.Tags;
import org.apache.nifi.components.AllowableValue;
import org.apache.nifi.components.PropertyDescriptor;
import org.apache.nifi.components.ValidationContext;
import org.apache.nifi.components.ValidationResult;
import org.apache.nifi.components.Validator;
import org.apache.nifi.expression.AttributeExpression;
import org.apache.nifi.expression.ExpressionLanguageScope;
import org.apache.nifi.flowfile.FlowFile;
import org.apache.nifi.flowfile.attributes.CoreAttributes;
import org.apache.nifi.processor.AbstractProcessor;
import org.apache.nifi.processor.ProcessContext;
import org.apache.nifi.processor.ProcessSession;
import org.apache.nifi.processor.Relationship;
import org.apache.nifi.processor.exception.ProcessException;
import org.apache.nifi.processor.io.InputStreamCallback;
import org.apache.nifi.processor.util.StandardValidators;
import org.apache.nifi.record.path.FieldValue;
import org.apache.nifi.record.path.RecordPath;
import org.apache.nifi.record.path.util.RecordPathCache;
import org.apache.nifi.record.path.validation.RecordPathValidator;
import org.apache.nifi.schema.access.SchemaNotFoundException;
import org.apache.nifi.serialization.MalformedRecordException;
import org.apache.nifi.serialization.RecordReader;
import org.apache.nifi.serialization.RecordReaderFactory;
import org.apache.nifi.serialization.RecordSetWriter;
import org.apache.nifi.serialization.RecordSetWriterFactory;
import org.apache.nifi.serialization.WriteResult;
import org.apache.nifi.serialization.record.DataType;
import org.apache.nifi.serialization.record.Record;
import org.apache.nifi.serialization.record.RecordFieldType;
import org.apache.nifi.serialization.record.RecordSchema;
import org.apache.nifi.serialization.record.type.ArrayDataType;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.util.ArrayList;
import java.util.Collection;
import java.util.HashMap;
import java.util.HashSet;
import java.util.Iterator;
import java.util.List;
import java.util.Map;
import java.util.NoSuchElementException;
import java.util.Set;
import java.util.concurrent.atomic.AtomicInteger;
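/**
 * Forks each incoming record on one or more array fields identified by RecordPath dynamic properties.
 * <p>
 * Illustrative example (field names and values are hypothetical): given the record
 * {@code {id: 1, addresses: [{city: "A"}, {city: "B"}]}} and a dynamic property whose RecordPath is
 * {@code /addresses}, 'split' mode emits two records that keep the full input schema but hold a
 * single-element {@code addresses} array, while 'extract' mode emits the two address records themselves,
 * optionally enriched with the parent fields (here {@code id}) when 'Include Parent Fields' is true.
 */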
@SideEffectFree
@SupportsBatching
@InputRequirement(Requirement.INPUT_REQUIRED)
@Tags({"fork", "record", "content", "array", "stream", "event"})
@CapabilityDescription("This processor allows the user to fork a record into multiple records. The user must specify at least one "
+ "Record Path, as a dynamic property, pointing to a field of type ARRAY containing RECORD objects. The processor accepts "
+ "two modes: 'split' and 'extract'. In both modes, there is one record generated per element contained in the designated "
+ "array. In the 'split' mode, each generated record will preserve the same schema as given in the input but the array "
+ "will contain only one element. In the 'extract' mode, the element of the array must be of record type and will be the "
+ "generated record. Additionally, in the 'extract' mode, it is possible to specify if each generated record should contain "
+ "all the fields of the parent records from the root level to the extracted record. This assumes that the fields to add in "
+ "the record are defined in the schema of the Record Writer controller service. See examples in the additional details "
+ "documentation of this processor.")
@WritesAttributes({
@WritesAttribute(attribute = "record.count", description = "The generated FlowFile will have a 'record.count' attribute indicating "
+ "the number of records that were written to the FlowFile."),
@WritesAttribute(attribute = "mime.type", description = "The MIME Type indicated by the Record Writer"),
@WritesAttribute(attribute = "<Attributes from Record Writer>", description = "Any Attribute that the configured Record Writer "
+ "returns will be added to the FlowFile.")
})
public class ForkRecord extends AbstractProcessor {
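// Caches up to 25 compiled RecordPaths so that dynamic property values are not re-parsed for every FlowFile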
private volatile RecordPathCache recordPathCache = new RecordPathCache(25);
static final AllowableValue MODE_EXTRACT = new AllowableValue("extract", "Extract",
"Generated records will be the elements of the array");
static final AllowableValue MODE_SPLIT = new AllowableValue("split", "Split",
"Generated records will preserve the input schema and will contain a one-element array");
public static final PropertyDescriptor RECORD_READER = new PropertyDescriptor.Builder()
.name("record-reader")
.displayName("Record Reader")
.description("Specifies the Controller Service to use for reading incoming data")
.identifiesControllerService(RecordReaderFactory.class)
.required(true)
.build();
public static final PropertyDescriptor RECORD_WRITER = new PropertyDescriptor.Builder()
.name("record-writer")
.displayName("Record Writer")
.description("Specifies the Controller Service to use for writing out the records")
.identifiesControllerService(RecordSetWriterFactory.class)
.required(true)
.build();
public static final PropertyDescriptor MODE = new PropertyDescriptor.Builder()
.name("fork-mode")
.displayName("Mode")
.description("Specifies the forking mode of the processor")
.allowableValues(MODE_EXTRACT, MODE_SPLIT)
.defaultValue(MODE_SPLIT.getValue())
.required(true)
.build();
public static final PropertyDescriptor INCLUDE_PARENT_FIELDS = new PropertyDescriptor.Builder()
.name("include-parent-fields")
.displayName("Include Parent Fields")
.description("This parameter is only valid with the 'extract' mode. If set to true, all the fields "
+ "from the root level to the given array will be added as fields of each element of the "
+ "array to fork.")
.allowableValues("true", "false")
.defaultValue("false")
.required(true)
.build();
public static final Relationship REL_FORK = new Relationship.Builder()
.name("fork")
.description("The FlowFiles containing the forked records will be routed to this relationship")
.build();
public static final Relationship REL_ORIGINAL = new Relationship.Builder()
.name("original")
.description("The original FlowFiles will be routed to this relationship")
.build();
public static final Relationship REL_FAILURE = new Relationship.Builder()
.name("failure")
.description("In case a FlowFile generates an error during the fork operation, it will be routed to this relationship")
.build();
@Override
protected List<PropertyDescriptor> getSupportedPropertyDescriptors() {
final List<PropertyDescriptor> properties = new ArrayList<>();
properties.add(RECORD_READER);
properties.add(RECORD_WRITER);
properties.add(MODE);
properties.add(INCLUDE_PARENT_FIELDS);
return properties;
}
@Override
public Set<Relationship> getRelationships() {
final Set<Relationship> relationships = new HashSet<>();
relationships.add(REL_ORIGINAL);
relationships.add(REL_FAILURE);
relationships.add(REL_FORK);
return relationships;
}
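// Every dynamic property value is interpreted as a RecordPath pointing to an ARRAY field; Expression
// Language against FlowFile attributes is supported, so the effective path may only be known at runtime.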
@Override
protected PropertyDescriptor getSupportedDynamicPropertyDescriptor(final String propertyDescriptorName) {
return new PropertyDescriptor.Builder()
.name(propertyDescriptorName)
.required(false)
.addValidator(StandardValidators.createAttributeExpressionLanguageValidator(AttributeExpression.ResultType.STRING, true))
.addValidator(StandardValidators.ATTRIBUTE_KEY_PROPERTY_NAME_VALIDATOR)
.expressionLanguageSupported(ExpressionLanguageScope.FLOWFILE_ATTRIBUTES)
.dynamic(true)
.build();
}
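// Validates dynamic property values as RecordPaths at configuration time. Values containing Expression
// Language are skipped here because they can only be resolved against a FlowFile's attributes at runtime.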
@Override
protected Collection<ValidationResult> customValidate(ValidationContext validationContext) {
final List<ValidationResult> results = new ArrayList<>(super.customValidate(validationContext));
Validator validator = new RecordPathValidator();
Map<PropertyDescriptor, String> processorProperties = validationContext.getProperties();
for (final Map.Entry<PropertyDescriptor, String> entry : processorProperties.entrySet()) {
PropertyDescriptor property = entry.getKey();
if (property.isDynamic() && property.isExpressionLanguageSupported()) {
String dynamicValue = validationContext.getProperty(property).getValue();
if(!validationContext.isExpressionLanguagePresent(dynamicValue)) {
results.add(validator.validate(property.getDisplayName(), dynamicValue, validationContext));
}
}
}
return results;
}
@Override
public void onTrigger(final ProcessContext context, final ProcessSession session) throws ProcessException {
FlowFile flowFile = session.get();
if (flowFile == null) {
return;
}
final List<RecordPath> recordPaths = new ArrayList<>();
Map<PropertyDescriptor, String> processorProperties = context.getProperties();
for (final Map.Entry<PropertyDescriptor, String> entry : processorProperties.entrySet()) {
PropertyDescriptor property = entry.getKey();
if (property.isDynamic() && property.isExpressionLanguageSupported()) {
String path = context.getProperty(property).evaluateAttributeExpressions(flowFile).getValue();
if(StringUtils.isNotBlank(path)) {
recordPaths.add(recordPathCache.getCompiled(path));
}
}
}
final RecordReaderFactory readerFactory = context.getProperty(RECORD_READER).asControllerService(RecordReaderFactory.class);
final RecordSetWriterFactory writerFactory = context.getProperty(RECORD_WRITER).asControllerService(RecordSetWriterFactory.class);
final boolean addParentFields = context.getProperty(INCLUDE_PARENT_FIELDS).asBoolean();
final boolean isSplitMode = context.getProperty(MODE).getValue().equals(MODE_SPLIT.getValue());
final FlowFile original = flowFile;
final Map<String, String> originalAttributes = original.getAttributes();
final FlowFile outFlowFile = session.create(original);
final AtomicInteger readCount = new AtomicInteger(0);
final AtomicInteger writeCount = new AtomicInteger(0);
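// Read the input a single time; for every record and every configured RecordPath, the matching array
// elements are forked into the single output FlowFile created above.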
try {
session.read(flowFile, new InputStreamCallback() {
@Override
public void process(final InputStream in) throws IOException {
try (final RecordReader reader = readerFactory.createRecordReader(originalAttributes, in, original.getSize(), getLogger())) {
final RecordSchema writeSchema = writerFactory.getSchema(originalAttributes, reader.getSchema());
final OutputStream out = session.write(outFlowFile);
try (final RecordSetWriter recordSetWriter = writerFactory.createWriter(getLogger(), writeSchema, out, outFlowFile)) {
recordSetWriter.beginRecordSet();
// we read each record of the input flow file
Record record;
while ((record = reader.nextRecord()) != null) {
readCount.incrementAndGet();
for(RecordPath recordPath : recordPaths) {
// evaluate record path in each record of the flow file
Iterator<FieldValue> it = recordPath.evaluate(record).getSelectedFields().iterator();
while(it.hasNext()) {
FieldValue fieldValue = it.next();
RecordFieldType fieldType = fieldValue.getField().getDataType().getFieldType();
// we want to have an array here, nothing else allowed
if(fieldType != RecordFieldType.ARRAY) {
getLogger().debug("The record path " + recordPath.getPath() + " is matching a field "
+ "of type " + fieldType + " when the type ARRAY is expected.");
continue;
}
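// 'split' mode: write one copy of the current record per array element, replacing the array in place
// with a single-element array before each write.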
if(isSplitMode) {
Object[] items = (Object[]) fieldValue.getValue();
for (Object item : items) {
fieldValue.updateValue(new Object[]{item});
recordSetWriter.write(record);
}
} else {
// we get the type of the elements of the array
final ArrayDataType arrayDataType = (ArrayDataType) fieldValue.getField().getDataType();
final DataType elementType = arrayDataType.getElementType();
// we want to have records in the array
if(elementType.getFieldType() != RecordFieldType.RECORD) {
getLogger().debug("The record path " + recordPath.getPath() + " is matching an array field with "
+ "values of type " + elementType.getFieldType() + " when the type RECORD is expected.");
continue;
}
Object[] records = (Object[]) fieldValue.getValue();
for (Object elementRecord : records) {
if(elementRecord == null) {
continue;
}
Record recordToWrite = (Record) elementRecord;
if(addParentFields) {
// in this case we want to recursively add the parent fields into the record to write
// but we need to ensure that the Record has the appropriate schema for that
recordToWrite.incorporateSchema(writeSchema);
recursivelyAddParentFields(recordToWrite, fieldValue);
}
recordSetWriter.write(recordToWrite);
}
}
}
}
}
final WriteResult writeResult = recordSetWriter.finishRecordSet();
try {
recordSetWriter.close();
} catch (final IOException ioe) {
getLogger().warn("Failed to close Writer for {}", new Object[] {outFlowFile});
}
final Map<String, String> attributes = new HashMap<>();
writeCount.set(writeResult.getRecordCount());
attributes.put("record.count", String.valueOf(writeResult.getRecordCount()));
attributes.put(CoreAttributes.MIME_TYPE.key(), recordSetWriter.getMimeType());
attributes.putAll(writeResult.getAttributes());
session.transfer(session.putAllAttributes(outFlowFile, attributes), REL_FORK);
}
} catch (final SchemaNotFoundException | MalformedRecordException e) {
throw new ProcessException("Could not parse incoming data: " + e.getLocalizedMessage(), e);
}
}
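// Copies the fields of every ancestor record into the record to write, walking up the RecordPath parent
// chain. The recursion stops at the root, where Optional.get() throws NoSuchElementException.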
private void recursivelyAddParentFields(Record recordToWrite, FieldValue fieldValue) {
try {
// we get the parent data
FieldValue parentField = fieldValue.getParent().get();
Record parentRecord = fieldValue.getParentRecord().get();
// for each field of the parent
for (String field : parentRecord.getSchema().getFieldNames()) {
// copy the parent value only if the field is not already set
// (deeper fields take priority over parent fields with the same name)
if(recordToWrite.getValue(field) == null) {
// setValue updates the field with the given name; if the field is not
// present in the record's schema, the call does nothing
recordToWrite.setValue(field, parentRecord.getValue(field));
}
}
// recursive call
recursivelyAddParentFields(recordToWrite, parentField);
} catch (NoSuchElementException e) {
return;
}
}
});
} catch (Exception e) {
getLogger().error("Failed to fork {}", new Object[] {flowFile, e});
session.remove(outFlowFile);
session.transfer(original, REL_FAILURE);
return;
}
session.adjustCounter("Records Processed", readCount.get(), false);
session.adjustCounter("Records Generated", writeCount.get(), false);
getLogger().debug("Successfully forked {} records into {} records in {}", new Object[] {readCount.get(), writeCount.get(), flowFile});
session.transfer(original, REL_ORIGINAL);
}
}