blob: 62e490aeba1b28127d985a96f6abc3a6c8e66ab2 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.solr.client.solrj.io.stream;
import java.io.IOException;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.LinkedHashMap;
import java.util.List;
import java.util.Locale;
import java.util.Map;
import java.util.Set;
import org.apache.solr.client.solrj.io.Tuple;
import org.apache.solr.client.solrj.io.comp.StreamComparator;
import org.apache.solr.client.solrj.io.eval.EvaluatorException;
import org.apache.solr.client.solrj.io.eval.StreamEvaluator;
import org.apache.solr.client.solrj.io.ops.StreamOperation;
import org.apache.solr.client.solrj.io.stream.expr.Explanation;
import org.apache.solr.client.solrj.io.stream.expr.Explanation.ExpressionType;
import org.apache.solr.client.solrj.io.stream.expr.Expressible;
import org.apache.solr.client.solrj.io.stream.expr.StreamExplanation;
import org.apache.solr.client.solrj.io.stream.expr.StreamExpression;
import org.apache.solr.client.solrj.io.stream.expr.StreamExpressionParameter;
import org.apache.solr.client.solrj.io.stream.expr.StreamExpressionParser;
import org.apache.solr.client.solrj.io.stream.expr.StreamExpressionValue;
import org.apache.solr.client.solrj.io.stream.expr.StreamFactory;
/**
 * Selects fields from the incoming stream and applies optional field renaming.
 * Does not reorder the outgoing stream.
 *
 * <p>Besides plain fields ({@code fieldA}) and aliased fields ({@code fieldA as alias}), a
 * select may carry named evaluators ({@code add(a,b) as total}) whose results are added to
 * each outgoing tuple, and stream operations which are applied to each tuple before the
 * evaluators run.
 *
 * @since 6.0.0
 **/
public class SelectStream extends TupleStream implements Expressible {

  private static final long serialVersionUID = 1;

  /** The wrapped stream tuples are read from. */
  private TupleStream stream;
  /** Context handed in through {@link #setStreamContext}; null until that call is made. */
  private StreamContext streamContext;
  /** Incoming field name to outgoing field name. */
  private Map<String,String> selectedFields;
  /** Evaluator to the outgoing field name its result is stored under (insertion ordered). */
  private Map<StreamEvaluator,String> selectedEvaluators;
  /** Operations applied to every tuple before the evaluators run. */
  private List<StreamOperation> operations;

  /**
   * Creates a select which passes the given fields through under their own names.
   *
   * @param stream the stream to read tuples from
   * @param selectedFields names of the fields to keep
   * @throws IOException declared for parity with the other constructors
   */
  public SelectStream(TupleStream stream, List<String> selectedFields) throws IOException {
    this.stream = stream;
    this.selectedFields = new HashMap<>();
    for (String selectedField : selectedFields) {
      // a non-aliased field maps onto itself
      this.selectedFields.put(selectedField, selectedField);
    }
    operations = new ArrayList<>();
    selectedEvaluators = new LinkedHashMap<>();
  }

  /**
   * Creates a select which keeps the keys of the given map and emits them under the mapped
   * names. The map is stored as given, not copied.
   *
   * @param stream the stream to read tuples from
   * @param selectedFields incoming field name to outgoing field name
   * @throws IOException declared for parity with the other constructors
   */
  public SelectStream(TupleStream stream, Map<String,String> selectedFields) throws IOException {
    this.stream = stream;
    this.selectedFields = selectedFields;
    operations = new ArrayList<>();
    selectedEvaluators = new LinkedHashMap<>();
  }

  /**
   * Builds a select from a parsed streaming expression.
   *
   * <p>The expression must contain exactly one stream operand and at least one value operand.
   * Each value operand is either {@code field}, {@code field as alias} or
   * {@code evaluator(...) as alias}; the {@code as} keyword is matched case-insensitively and
   * a pair of wrapping double quotes around the operand is removed first.
   *
   * @param expression the select expression
   * @param factory factory used to construct the inner stream, evaluators and operations
   * @throws IOException if the expression is malformed, or if constructing an evaluator
   *     failed with an {@link EvaluatorException} somewhere in the cause chain
   */
  @SuppressWarnings({"unchecked"})
  public SelectStream(StreamExpression expression, StreamFactory factory) throws IOException {
    // grab all parameters out
    List<StreamExpression> streamExpressions = factory.getExpressionOperandsRepresentingTypes(expression, Expressible.class, TupleStream.class);
    List<StreamExpressionParameter> selectAsFieldsExpressions = factory.getOperandsOfType(expression, StreamExpressionValue.class);
    List<StreamExpression> operationExpressions = factory.getExpressionOperandsRepresentingTypes(expression, StreamOperation.class);
    List<StreamExpression> evaluatorExpressions = factory.getExpressionOperandsRepresentingTypes(expression, StreamEvaluator.class);

    // validate expression contains only what we want.
    // NOTE(review): evaluator operands are not part of this sum, so an un-named evaluator
    // presumably trips this check before reaching the dedicated check below - confirm.
    if (expression.getParameters().size() != streamExpressions.size() + selectAsFieldsExpressions.size() + operationExpressions.size()) {
      throw new IOException(String.format(Locale.ROOT,"Invalid expression %s - unknown operands found", expression));
    }

    if (1 != streamExpressions.size()) {
      throw new IOException(String.format(Locale.ROOT,"Invalid expression %s - expecting single stream but found %d (must be TupleStream types)",expression, streamExpressions.size()));
    }

    if (0 == selectAsFieldsExpressions.size()) {
      // report the number of select fields found (previously the stream count was reported)
      throw new IOException(String.format(Locale.ROOT,"Invalid expression %s - expecting at least one select field but found %d",expression, selectAsFieldsExpressions.size()));
    }

    if (0 != evaluatorExpressions.size()) {
      throw new IOException(String.format(Locale.ROOT,"Invalid expression %s - evaluators must be given a name, like 'add(...) as result' but found %d evaluators without names",expression, evaluatorExpressions.size()));
    }

    stream = factory.constructStream(streamExpressions.get(0));

    selectedFields = new HashMap<String,String>();
    selectedEvaluators = new LinkedHashMap<>();
    for (StreamExpressionParameter parameter : selectAsFieldsExpressions) {
      StreamExpressionValue selectField = (StreamExpressionValue)parameter;
      String value = selectField.getValue().trim();

      // remove possible wrapping quotes
      if (value.length() > 2 && value.startsWith("\"") && value.endsWith("\"")) {
        value = value.substring(1, value.length() - 1);
      }

      if (!value.toLowerCase(Locale.ROOT).contains(" as ")) {
        // plain field, emitted under its own name
        selectedFields.put(value, value);
        continue;
      }

      String[] parts = value.split("(?i) as "); // ensure we are splitting in a case-insensitive way
      if (2 != parts.length) {
        throw new IOException(String.format(Locale.ROOT,"Invalid expression %s - expecting select field of form 'fieldA' or 'fieldA as alias' but found %s",expression, value));
      }

      String asValue = parts[0].trim();
      String asName = parts[1].trim();

      boolean handled = false;
      if (asValue.contains("(")) {
        // possible evaluator
        try {
          StreamExpression asValueExpression = StreamExpressionParser.parse(asValue);
          if (factory.doesRepresentTypes(asValueExpression, StreamEvaluator.class)) {
            selectedEvaluators.put(factory.constructEvaluator(asValueExpression), asName);
            handled = true;
          }
        } catch (Throwable e) {
          // Only an EvaluatorException (at any depth of the cause chain) is reported;
          // any other failure means the text is not an evaluator after all.
          for (Throwable t = e; t != null; t = t.getCause()) {
            if (t instanceof EvaluatorException) {
              throw new IOException(t);
            }
          }
          // it was not handled, so treat as a non-evaluator
        }
      }

      if (!handled) {
        selectedFields.put(asValue, asName);
      }
    }

    operations = new ArrayList<>();
    for (StreamExpression expr : operationExpressions) {
      operations.add(factory.constructOperation(expr));
    }
  }

  /**
   * Converts this stream, including its inner stream, back into an expression.
   *
   * @param factory factory used to look up function names
   * @return the expression form of this select
   * @throws IOException if the inner stream is not {@link Expressible}
   */
  @Override
  public StreamExpression toExpression(StreamFactory factory) throws IOException {
    return toExpression(factory, true);
  }

  /**
   * Converts this stream into an expression.
   *
   * @param factory factory used to look up function names
   * @param includeStreams when false the inner stream is replaced by the literal
   *     {@code <stream>} placeholder
   * @return the expression form of this select
   * @throws IOException if {@code includeStreams} is true and the inner stream is not
   *     {@link Expressible}
   */
  private StreamExpression toExpression(StreamFactory factory, boolean includeStreams) throws IOException {
    // function name
    StreamExpression expression = new StreamExpression(factory.getFunctionName(this.getClass()));

    // stream
    if (!includeStreams) {
      expression.addParameter("<stream>");
    } else if (stream instanceof Expressible) {
      expression.addParameter(((Expressible)stream).toExpression(factory));
    } else {
      throw new IOException("This SelectStream contains a non-expressible TupleStream - it cannot be converted to an expression");
    }

    // selected fields
    for (Map.Entry<String, String> selectField : selectedFields.entrySet()) {
      String fieldName = selectField.getKey();
      String alias = selectField.getValue();
      if (fieldName.equals(alias)) {
        expression.addParameter(fieldName);
      } else {
        expression.addParameter(String.format(Locale.ROOT, "%s as %s", fieldName, alias));
      }
    }

    // selected evaluators
    for (Map.Entry<StreamEvaluator, String> selectedEvaluator : selectedEvaluators.entrySet()) {
      expression.addParameter(String.format(Locale.ROOT, "%s as %s", selectedEvaluator.getKey().toExpression(factory), selectedEvaluator.getValue()));
    }

    // operations
    for (StreamOperation operation : operations) {
      expression.addParameter(operation.toExpression(factory));
    }

    return expression;
  }

  /**
   * Builds the explanation of this stream: the inner stream as its child and every evaluator
   * and operation as a helper.
   *
   * @param factory factory used to look up function names
   * @return the explanation of this select
   * @throws IOException if a nested explanation or expression cannot be produced
   */
  @Override
  public Explanation toExplanation(StreamFactory factory) throws IOException {
    Explanation explanation = new StreamExplanation(getStreamNodeId().toString())
        .withChildren(new Explanation[]{
            stream.toExplanation(factory)
        })
        .withFunctionName(factory.getFunctionName(this.getClass()))
        .withImplementingClass(this.getClass().getName())
        .withExpressionType(ExpressionType.STREAM_DECORATOR)
        .withExpression(toExpression(factory, false).toString());

    for (StreamEvaluator evaluator : selectedEvaluators.keySet()) {
      explanation.addHelper(evaluator.toExplanation(factory));
    }

    for (StreamOperation operation : operations) {
      explanation.addHelper(operation.toExplanation(factory));
    }

    return explanation;
  }

  /**
   * Stores the context and passes it on to the inner stream and to every evaluator.
   *
   * @param context the context to use
   */
  public void setStreamContext(StreamContext context) {
    this.streamContext = context;
    this.stream.setStreamContext(context);
    Set<StreamEvaluator> evaluators = selectedEvaluators.keySet();
    for (StreamEvaluator evaluator : evaluators) {
      evaluator.setStreamContext(context);
    }
  }

  /**
   * @return a new list holding the single inner stream
   */
  public List<TupleStream> children() {
    List<TupleStream> l = new ArrayList<>();
    l.add(stream);
    return l;
  }

  /** Opens the inner stream. */
  public void open() throws IOException {
    stream.open();
  }

  /** Closes the inner stream. */
  public void close() throws IOException {
    stream.close();
  }

  /**
   * Reads the next tuple from the inner stream and reduces it to the selected fields.
   *
   * <p>The EOF tuple is returned untouched. For every other tuple the selected fields are
   * copied under their outgoing names, then each operation is applied, then each evaluator is
   * run and its non-null result stored under the evaluator's name.
   *
   * @return the EOF tuple of the inner stream, or a new tuple holding the selected values
   * @throws IOException if reading or evaluating fails
   */
  public Tuple read() throws IOException {
    Tuple original = stream.read();

    if (original.EOF) {
      return original;
    }

    // create a copy with the limited set of fields
    Tuple workingToReturn = new Tuple();
    // evaluators see every incoming field, not only the selected ones
    Tuple workingForEvaluators = new Tuple();

    //Clear the TupleContext before running the evaluators.
    //The TupleContext allows evaluators to cache values within the scope of a single tuple.
    //For example a LocalDateTime could be parsed by one evaluator and used by other evaluators within the scope of the tuple.
    //This avoids the need to create multiple LocalDateTime instances for the same tuple to satisfy a select expression.
    //The context is null when setStreamContext was never called; there is nothing to clear then.
    if (streamContext != null) {
      streamContext.getTupleContext().clear();
    }

    for (Object fieldName : original.getFields().keySet()) {
      Object fieldValue = original.get(fieldName);
      workingForEvaluators.put(fieldName, fieldValue);
      if (selectedFields.containsKey(fieldName)) {
        workingToReturn.put(selectedFields.get(fieldName), fieldValue);
      }
    }

    // apply all operations
    for (StreamOperation operation : operations) {
      operation.operate(workingToReturn);
      operation.operate(workingForEvaluators);
    }

    // Apply all evaluators
    for (Map.Entry<StreamEvaluator, String> selectedEvaluator : selectedEvaluators.entrySet()) {
      Object o = selectedEvaluator.getKey().evaluate(workingForEvaluators);
      if (o != null) {
        // also stored in the evaluator tuple so later evaluators can use the result
        workingForEvaluators.put(selectedEvaluator.getValue(), o);
        workingToReturn.put(selectedEvaluator.getValue(), o);
      }
    }

    return workingToReturn;
  }

  /**
   * Return the stream sort - ie, the order in which records are returned
   *
   * @return the inner stream's sort with this select's field aliases applied, or null when
   *     the inner stream returns a null sort
   */
  public StreamComparator getStreamSort() {
    StreamComparator innerSort = stream.getStreamSort();
    if (innerSort == null) {
      return null;
    }
    // apply aliasing to comparator
    return innerSort.copyAliased(selectedFields);
  }

  /** @return always 0 */
  public int getCost() {
    return 0;
  }
}