samoa-api/src/main/java/org/apache/samoa/learners/classifiers/rules/distributed/AMRLearnerProcessor.java - incubator-samoa - Git at Google

 package org.apache.samoa.learners.classifiers.rules.distributed;

 /*
  * #%L
  * SAMOA
  * %%
  * Copyright (C) 2014 - 2015 Apache Software Foundation
  * %%
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
  * You may obtain a copy of the License at
  *
  *      http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  * #L%
  */

 import java.util.Iterator;
 import java.util.LinkedList;
 import java.util.List;

 import org.apache.samoa.core.ContentEvent;
 import org.apache.samoa.core.Processor;
 import org.apache.samoa.instances.Instance;
 import org.apache.samoa.instances.Instances;
 import org.apache.samoa.learners.classifiers.rules.common.ActiveRule;
 import org.apache.samoa.learners.classifiers.rules.common.LearningRule;
 import org.apache.samoa.learners.classifiers.rules.common.RuleActiveRegressionNode;
 import org.apache.samoa.learners.classifiers.rules.common.RulePassiveRegressionNode;
 import org.apache.samoa.learners.classifiers.rules.common.RuleSplitNode;
 import org.apache.samoa.topology.Stream;
 import org.slf4j.Logger;
 import org.slf4j.LoggerFactory;

 /**
  * Learner Processor (HAMR).
  *
  * <p>Holds a local list of {@link ActiveRule}s. A non-removing {@link RuleContentEvent} adds a
  * rule to the list; an {@link AssignmentContentEvent} trains the rule whose ID it carries on the
  * instance it carries. Rule removals (after change detection) and rule expansions are reported
  * on the output stream.
  *
  * @author Anh Thu Vu
  *
  */
 public class AMRLearnerProcessor implements Processor {

   private static final long serialVersionUID = -2302897295090248013L;

   private static final Logger logger = LoggerFactory.getLogger(AMRLearnerProcessor.class);

   /** Rules held by this processor. Transient; (re)created empty in {@link #onCreate(int)}. */
   private transient List<ActiveRule> ruleSet;

   /** Stream on which rule-removal and predicate events are emitted. */
   private Stream outputStream;

   // Rule expansion settings.
   private double splitConfidence;
   private double tieThreshold;
   // NOTE(review): used as the right operand of % in trainRuleOnInstance; a value of 0 would
   // throw there if getInstancesSeen() is integral - confirm callers always set it.
   private int gracePeriod;

   // Anomaly detection settings (read only by isAnomaly).
   private boolean noAnomalyDetection;
   private double multivariateAnomalyProbabilityThreshold;
   private double univariateAnomalyprobabilityThreshold;
   private int anomalyNumInstThreshold;

   /**
    * Creates a processor configured from the given builder.
    *
    * @param builder
    *          source of all expansion and anomaly-detection settings
    */
   public AMRLearnerProcessor(Builder builder) {
     this.splitConfidence = builder.splitConfidence;
     this.tieThreshold = builder.tieThreshold;
     this.gracePeriod = builder.gracePeriod;

     this.noAnomalyDetection = builder.noAnomalyDetection;
     this.multivariateAnomalyProbabilityThreshold = builder.multivariateAnomalyProbabilityThreshold;
     this.univariateAnomalyprobabilityThreshold = builder.univariateAnomalyprobabilityThreshold;
     this.anomalyNumInstThreshold = builder.anomalyNumInstThreshold;
   }

   /**
    * Dispatches an incoming event: assignment events train a rule, non-removing rule events add
    * a rule. Any other event (including removing rule events) is ignored.
    *
    * @param event
    *          the incoming event
    * @return always {@code false}
    */
   @Override
   public boolean process(ContentEvent event) {
     if (event instanceof AssignmentContentEvent) {
       AssignmentContentEvent assignment = (AssignmentContentEvent) event;
       trainRuleOnInstance(assignment.getRuleNumberID(), assignment.getInstance());
     } else if (event instanceof RuleContentEvent) {
       RuleContentEvent ruleEvent = (RuleContentEvent) event;
       if (!ruleEvent.isRemoving()) {
         addRule(ruleEvent.getRule());
       }
     }

     return false;
   }

   /*
    * Process input instances
    */

   /**
    * Trains the first rule in the local list whose ID equals {@code ruleID} on the instance.
    *
    * <p>If that rule no longer covers the instance nothing happens. If change is detected the
    * rule is dropped locally and a remove event is sent; otherwise its statistics are updated
    * and, every {@code gracePeriod} instances, an expansion is attempted.
    *
    * @param ruleID
    *          ID of the rule to train
    * @param instance
    *          the training instance
    */
   private void trainRuleOnInstance(int ruleID, Instance instance) {
     Iterator<ActiveRule> ruleIterator = this.ruleSet.iterator();
     while (ruleIterator.hasNext()) {
       ActiveRule rule = ruleIterator.next();
       if (rule.getRuleNumberID() != ruleID) {
         continue;
       }

       // Check (again) for coverage
       if (rule.isCovering(instance)) {
         double error = rule.computeError(instance); // Use adaptive mode error
         boolean changeDetected = ((RuleActiveRegressionNode) rule.getLearningNode()).updateChangeDetection(error);
         if (changeDetected) {
           // Remove through the iterator so the list is not modified behind its back.
           ruleIterator.remove();
           this.sendRemoveRuleEvent(ruleID);
         } else {
           rule.updateStatistics(instance);
           if (rule.getInstancesSeen() % this.gracePeriod == 0.0) {
             if (rule.tryToExpand(this.splitConfidence, this.tieThreshold)) {
               rule.split();

               // expanded: update Aggregator with new/updated predicate
               this.sendPredicate(rule.getRuleNumberID(), rule.getLastUpdatedRuleSplitNode(),
                   (RuleActiveRegressionNode) rule.getLearningNode());
             }
           }
         }
       }

       // Only the first rule with a matching ID is considered.
       return;
     }
   }

   /**
    * Asks the rule whether the instance is an anomaly, unless anomaly detection is switched off
    * or the rule has seen fewer than {@code anomalyNumInstThreshold} instances. Not called from
    * within this class.
    *
    * @param instance
    *          the instance to test
    * @param rule
    *          the rule to test against
    * @return the rule's verdict, or {@code false} when the check is skipped
    */
   private boolean isAnomaly(Instance instance, LearningRule rule) {
     // AMRUles is equipped with anomaly detection. If on, compute the anomaly
     // value.
     boolean isAnomaly = false;
     if (!this.noAnomalyDetection) {
       if (rule.getInstancesSeen() >= this.anomalyNumInstThreshold) {
         isAnomaly = rule.isAnomaly(instance,
             this.univariateAnomalyprobabilityThreshold,
             this.multivariateAnomalyProbabilityThreshold,
             this.anomalyNumInstThreshold);
       }
     }
     return isAnomaly;
   }

   /** Emits a removing {@link RuleContentEvent} (with a {@code null} rule) for the given ID. */
   private void sendRemoveRuleEvent(int ruleID) {
     RuleContentEvent rce = new RuleContentEvent(ruleID, null, true);
     this.outputStream.put(rce);
   }

   /**
    * Emits a {@link PredicateContentEvent} carrying the split node and a
    * {@link RulePassiveRegressionNode} built from the given learning node.
    */
   private void sendPredicate(int ruleID, RuleSplitNode splitNode, RuleActiveRegressionNode learningNode) {
     this.outputStream.put(new PredicateContentEvent(ruleID, splitNode, new RulePassiveRegressionNode(learningNode)));
   }

   /*
    * Process control message (regarding adding or removing rules)
    */

   /**
    * Appends the rule to the local list.
    *
    * @return always {@code true}
    */
   private boolean addRule(ActiveRule rule) {
     this.ruleSet.add(rule);
     return true;
   }

   /** Initializes the (transient) rule list to an empty list. */
   @Override
   public void onCreate(int id) {
     this.ruleSet = new LinkedList<>();
   }

   /**
    * Creates a new processor with the same settings and the same output stream as {@code p}.
    *
    * @param p
    *          the processor to copy; must be an {@code AMRLearnerProcessor}
    * @return the new processor
    */
   @Override
   public Processor newProcessor(Processor p) {
     AMRLearnerProcessor oldProcessor = (AMRLearnerProcessor) p;
     AMRLearnerProcessor newProcessor =
         new AMRLearnerProcessor.Builder(oldProcessor).build();

     newProcessor.setOutputStream(oldProcessor.outputStream);
     return newProcessor;
   }

   /*
    * Builder
    */

   /** Fluent builder for {@link AMRLearnerProcessor}; unset options keep their Java defaults. */
   public static class Builder {
     private double splitConfidence;
     private double tieThreshold;
     private int gracePeriod;

     private boolean noAnomalyDetection;
     private double multivariateAnomalyProbabilityThreshold;
     private double univariateAnomalyprobabilityThreshold;
     private int anomalyNumInstThreshold;

     // Stored by the Instances constructor; not read anywhere in this class.
     private Instances dataset;

     public Builder(Instances dataset) {
       this.dataset = dataset;
     }

     /**
      * Copies every setting of an existing processor, including the anomaly-detection settings,
      * so that a processor built from this builder is configured identically.
      *
      * @param processor
      *          the processor whose settings are copied
      */
     public Builder(AMRLearnerProcessor processor) {
       this.splitConfidence = processor.splitConfidence;
       this.tieThreshold = processor.tieThreshold;
       this.gracePeriod = processor.gracePeriod;

       // Previously omitted: copies silently fell back to false / 0.0 / 0 for these.
       this.noAnomalyDetection = processor.noAnomalyDetection;
       this.multivariateAnomalyProbabilityThreshold = processor.multivariateAnomalyProbabilityThreshold;
       this.univariateAnomalyprobabilityThreshold = processor.univariateAnomalyprobabilityThreshold;
       this.anomalyNumInstThreshold = processor.anomalyNumInstThreshold;
     }

     public Builder splitConfidence(double splitConfidence) {
       this.splitConfidence = splitConfidence;
       return this;
     }

     public Builder tieThreshold(double tieThreshold) {
       this.tieThreshold = tieThreshold;
       return this;
     }

     public Builder gracePeriod(int gracePeriod) {
       this.gracePeriod = gracePeriod;
       return this;
     }

     public Builder noAnomalyDetection(boolean noAnomalyDetection) {
       this.noAnomalyDetection = noAnomalyDetection;
       return this;
     }

     public Builder multivariateAnomalyProbabilityThreshold(double mAnomalyThreshold) {
       this.multivariateAnomalyProbabilityThreshold = mAnomalyThreshold;
       return this;
     }

     public Builder univariateAnomalyProbabilityThreshold(double uAnomalyThreshold) {
       this.univariateAnomalyprobabilityThreshold = uAnomalyThreshold;
       return this;
     }

     public Builder anomalyNumberOfInstancesThreshold(int anomalyNumInstThreshold) {
       this.anomalyNumInstThreshold = anomalyNumInstThreshold;
       return this;
     }

     /** Builds a processor from the current settings. */
     public AMRLearnerProcessor build() {
       return new AMRLearnerProcessor(this);
     }
   }

   /*
    * Output stream
    */
   public void setOutputStream(Stream stream) {
     this.outputStream = stream;
   }

   public Stream getOutputStream() {
     return this.outputStream;
   }
 }
	package org.apache.samoa.learners.classifiers.rules.distributed;

	/*
	* #%L
	* SAMOA
	* %%
	* Copyright (C) 2014 - 2015 Apache Software Foundation
	* %%
	* Licensed under the Apache License, Version 2.0 (the "License");
	* you may not use this file except in compliance with the License.
	* You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	* #L%
	*/

	import java.util.Iterator;
	import java.util.LinkedList;
	import java.util.List;

	import org.apache.samoa.core.ContentEvent;
	import org.apache.samoa.core.Processor;
	import org.apache.samoa.instances.Instance;
	import org.apache.samoa.instances.Instances;
	import org.apache.samoa.learners.classifiers.rules.common.ActiveRule;
	import org.apache.samoa.learners.classifiers.rules.common.LearningRule;
	import org.apache.samoa.learners.classifiers.rules.common.RuleActiveRegressionNode;
	import org.apache.samoa.learners.classifiers.rules.common.RulePassiveRegressionNode;
	import org.apache.samoa.learners.classifiers.rules.common.RuleSplitNode;
	import org.apache.samoa.topology.Stream;
	import org.slf4j.Logger;
	import org.slf4j.LoggerFactory;

	/**
	 * Learner Processor (HAMR).
	 *
	 * <p>Holds a local list of {@link ActiveRule}s. A non-removing {@link RuleContentEvent} adds a
	 * rule to the list; an {@link AssignmentContentEvent} trains the rule whose ID it carries on the
	 * instance it carries. Rule removals (after change detection) and rule expansions are reported
	 * on the output stream.
	 *
	 * @author Anh Thu Vu
	 *
	 */
	public class AMRLearnerProcessor implements Processor {

	  private static final long serialVersionUID = -2302897295090248013L;

	  private static final Logger logger = LoggerFactory.getLogger(AMRLearnerProcessor.class);

	  /** Rules held by this processor. Transient; (re)created empty in {@link #onCreate(int)}. */
	  private transient List<ActiveRule> ruleSet;

	  /** Stream on which rule-removal and predicate events are emitted. */
	  private Stream outputStream;

	  // Rule expansion settings.
	  private double splitConfidence;
	  private double tieThreshold;
	  // NOTE(review): used as the right operand of % in trainRuleOnInstance; a value of 0 would
	  // throw there if getInstancesSeen() is integral - confirm callers always set it.
	  private int gracePeriod;

	  // Anomaly detection settings (read only by isAnomaly).
	  private boolean noAnomalyDetection;
	  private double multivariateAnomalyProbabilityThreshold;
	  private double univariateAnomalyprobabilityThreshold;
	  private int anomalyNumInstThreshold;

	  /**
	   * Creates a processor configured from the given builder.
	   *
	   * @param builder
	   *          source of all expansion and anomaly-detection settings
	   */
	  public AMRLearnerProcessor(Builder builder) {
	    this.splitConfidence = builder.splitConfidence;
	    this.tieThreshold = builder.tieThreshold;
	    this.gracePeriod = builder.gracePeriod;

	    this.noAnomalyDetection = builder.noAnomalyDetection;
	    this.multivariateAnomalyProbabilityThreshold = builder.multivariateAnomalyProbabilityThreshold;
	    this.univariateAnomalyprobabilityThreshold = builder.univariateAnomalyprobabilityThreshold;
	    this.anomalyNumInstThreshold = builder.anomalyNumInstThreshold;
	  }

	  /**
	   * Dispatches an incoming event: assignment events train a rule, non-removing rule events add
	   * a rule. Any other event (including removing rule events) is ignored.
	   *
	   * @param event
	   *          the incoming event
	   * @return always {@code false}
	   */
	  @Override
	  public boolean process(ContentEvent event) {
	    if (event instanceof AssignmentContentEvent) {
	      AssignmentContentEvent assignment = (AssignmentContentEvent) event;
	      trainRuleOnInstance(assignment.getRuleNumberID(), assignment.getInstance());
	    } else if (event instanceof RuleContentEvent) {
	      RuleContentEvent ruleEvent = (RuleContentEvent) event;
	      if (!ruleEvent.isRemoving()) {
	        addRule(ruleEvent.getRule());
	      }
	    }

	    return false;
	  }

	  /*
	   * Process input instances
	   */

	  /**
	   * Trains the first rule in the local list whose ID equals {@code ruleID} on the instance.
	   *
	   * <p>If that rule no longer covers the instance nothing happens. If change is detected the
	   * rule is dropped locally and a remove event is sent; otherwise its statistics are updated
	   * and, every {@code gracePeriod} instances, an expansion is attempted.
	   *
	   * @param ruleID
	   *          ID of the rule to train
	   * @param instance
	   *          the training instance
	   */
	  private void trainRuleOnInstance(int ruleID, Instance instance) {
	    Iterator<ActiveRule> ruleIterator = this.ruleSet.iterator();
	    while (ruleIterator.hasNext()) {
	      ActiveRule rule = ruleIterator.next();
	      if (rule.getRuleNumberID() != ruleID) {
	        continue;
	      }

	      // Check (again) for coverage
	      if (rule.isCovering(instance)) {
	        double error = rule.computeError(instance); // Use adaptive mode error
	        boolean changeDetected = ((RuleActiveRegressionNode) rule.getLearningNode()).updateChangeDetection(error);
	        if (changeDetected) {
	          // Remove through the iterator so the list is not modified behind its back.
	          ruleIterator.remove();
	          this.sendRemoveRuleEvent(ruleID);
	        } else {
	          rule.updateStatistics(instance);
	          if (rule.getInstancesSeen() % this.gracePeriod == 0.0) {
	            if (rule.tryToExpand(this.splitConfidence, this.tieThreshold)) {
	              rule.split();

	              // expanded: update Aggregator with new/updated predicate
	              this.sendPredicate(rule.getRuleNumberID(), rule.getLastUpdatedRuleSplitNode(),
	                  (RuleActiveRegressionNode) rule.getLearningNode());
	            }
	          }
	        }
	      }

	      // Only the first rule with a matching ID is considered.
	      return;
	    }
	  }

	  /**
	   * Asks the rule whether the instance is an anomaly, unless anomaly detection is switched off
	   * or the rule has seen fewer than {@code anomalyNumInstThreshold} instances. Not called from
	   * within this class.
	   *
	   * @param instance
	   *          the instance to test
	   * @param rule
	   *          the rule to test against
	   * @return the rule's verdict, or {@code false} when the check is skipped
	   */
	  private boolean isAnomaly(Instance instance, LearningRule rule) {
	    // AMRUles is equipped with anomaly detection. If on, compute the anomaly
	    // value.
	    boolean isAnomaly = false;
	    if (!this.noAnomalyDetection) {
	      if (rule.getInstancesSeen() >= this.anomalyNumInstThreshold) {
	        isAnomaly = rule.isAnomaly(instance,
	            this.univariateAnomalyprobabilityThreshold,
	            this.multivariateAnomalyProbabilityThreshold,
	            this.anomalyNumInstThreshold);
	      }
	    }
	    return isAnomaly;
	  }

	  /** Emits a removing {@link RuleContentEvent} (with a {@code null} rule) for the given ID. */
	  private void sendRemoveRuleEvent(int ruleID) {
	    RuleContentEvent rce = new RuleContentEvent(ruleID, null, true);
	    this.outputStream.put(rce);
	  }

	  /**
	   * Emits a {@link PredicateContentEvent} carrying the split node and a
	   * {@link RulePassiveRegressionNode} built from the given learning node.
	   */
	  private void sendPredicate(int ruleID, RuleSplitNode splitNode, RuleActiveRegressionNode learningNode) {
	    this.outputStream.put(new PredicateContentEvent(ruleID, splitNode, new RulePassiveRegressionNode(learningNode)));
	  }

	  /*
	   * Process control message (regarding adding or removing rules)
	   */

	  /**
	   * Appends the rule to the local list.
	   *
	   * @return always {@code true}
	   */
	  private boolean addRule(ActiveRule rule) {
	    this.ruleSet.add(rule);
	    return true;
	  }

	  /** Initializes the (transient) rule list to an empty list. */
	  @Override
	  public void onCreate(int id) {
	    this.ruleSet = new LinkedList<>();
	  }

	  /**
	   * Creates a new processor with the same settings and the same output stream as {@code p}.
	   *
	   * @param p
	   *          the processor to copy; must be an {@code AMRLearnerProcessor}
	   * @return the new processor
	   */
	  @Override
	  public Processor newProcessor(Processor p) {
	    AMRLearnerProcessor oldProcessor = (AMRLearnerProcessor) p;
	    AMRLearnerProcessor newProcessor =
	        new AMRLearnerProcessor.Builder(oldProcessor).build();

	    newProcessor.setOutputStream(oldProcessor.outputStream);
	    return newProcessor;
	  }

	  /*
	   * Builder
	   */

	  /** Fluent builder for {@link AMRLearnerProcessor}; unset options keep their Java defaults. */
	  public static class Builder {
	    private double splitConfidence;
	    private double tieThreshold;
	    private int gracePeriod;

	    private boolean noAnomalyDetection;
	    private double multivariateAnomalyProbabilityThreshold;
	    private double univariateAnomalyprobabilityThreshold;
	    private int anomalyNumInstThreshold;

	    // Stored by the Instances constructor; not read anywhere in this class.
	    private Instances dataset;

	    public Builder(Instances dataset) {
	      this.dataset = dataset;
	    }

	    /**
	     * Copies every setting of an existing processor, including the anomaly-detection settings,
	     * so that a processor built from this builder is configured identically.
	     *
	     * @param processor
	     *          the processor whose settings are copied
	     */
	    public Builder(AMRLearnerProcessor processor) {
	      this.splitConfidence = processor.splitConfidence;
	      this.tieThreshold = processor.tieThreshold;
	      this.gracePeriod = processor.gracePeriod;

	      // Previously omitted: copies silently fell back to false / 0.0 / 0 for these.
	      this.noAnomalyDetection = processor.noAnomalyDetection;
	      this.multivariateAnomalyProbabilityThreshold = processor.multivariateAnomalyProbabilityThreshold;
	      this.univariateAnomalyprobabilityThreshold = processor.univariateAnomalyprobabilityThreshold;
	      this.anomalyNumInstThreshold = processor.anomalyNumInstThreshold;
	    }

	    public Builder splitConfidence(double splitConfidence) {
	      this.splitConfidence = splitConfidence;
	      return this;
	    }

	    public Builder tieThreshold(double tieThreshold) {
	      this.tieThreshold = tieThreshold;
	      return this;
	    }

	    public Builder gracePeriod(int gracePeriod) {
	      this.gracePeriod = gracePeriod;
	      return this;
	    }

	    public Builder noAnomalyDetection(boolean noAnomalyDetection) {
	      this.noAnomalyDetection = noAnomalyDetection;
	      return this;
	    }

	    public Builder multivariateAnomalyProbabilityThreshold(double mAnomalyThreshold) {
	      this.multivariateAnomalyProbabilityThreshold = mAnomalyThreshold;
	      return this;
	    }

	    public Builder univariateAnomalyProbabilityThreshold(double uAnomalyThreshold) {
	      this.univariateAnomalyprobabilityThreshold = uAnomalyThreshold;
	      return this;
	    }

	    public Builder anomalyNumberOfInstancesThreshold(int anomalyNumInstThreshold) {
	      this.anomalyNumInstThreshold = anomalyNumInstThreshold;
	      return this;
	    }

	    /** Builds a processor from the current settings. */
	    public AMRLearnerProcessor build() {
	      return new AMRLearnerProcessor(this);
	    }
	  }

	  /*
	   * Output stream
	   */
	  public void setOutputStream(Stream stream) {
	    this.outputStream = stream;
	  }

	  public Stream getOutputStream() {
	    return this.outputStream;
	  }
	}