Windows Develop

Development Platform:
Java

RuleNode.java：Code Content
							/*
 *    RuleNode.java
 *    Copyright (C) 2000 Mark Hall
 *
 *    This program is free software; you can redistribute it and/or modify
 *    it under the terms of the GNU General Public License as published by
 *    the Free Software Foundation; either version 2 of the License, or
 *    (at your option) any later version.
 *
 *    This program is distributed in the hope that it will be useful,
 *    but WITHOUT ANY WARRANTY; without even the implied warranty of
 *    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *    GNU General Public License for more details.
 *
 *    You should have received a copy of the GNU General Public License
 *    along with this program; if not, write to the Free Software
 *    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
 */
package weka.classifiers.trees.m5;
import java.io.*;
import java.util.*;
import weka.core.*;
import weka.classifiers.*;
import weka.classifiers.functions.LinearRegression;
import weka.filters.unsupervised.attribute.Remove;
import weka.filters.Filter;
/**
 * Constructs a node for use in an m5 tree or rule
 *
 * @author Mark Hall (mhall@cs.waikato.ac.nz)
 * @version $Revision: 1.3 $
 */
public class RuleNode extends Classifier {
  /**
   * instances reaching this node
   */
  private Instances	   m_instances;
  /**
   * the class index
   */
  private int		   m_classIndex;
  /**
   * the number of instances reaching this node
   */
  protected int		   m_numInstances;
  /**
   * the number of attributes
   */
  private int		   m_numAttributes;
  /**
   * Node is a leaf
   */
  private boolean	   m_isLeaf;
  /**
   * attribute this node splits on
   */
  private int		   m_splitAtt;
  /**
   * the value of the split attribute
   */
  private double	   m_splitValue;
  /**
   * the linear model at this node
   */
  private LinearRegression m_nodeModel;
  /**
   * the number of paramters in the chosen model for this node---either
   * the subtree model or the linear model.
   * The constant term is counted as a paramter---this is for pruning
   * purposes
   */
  public int		   m_numParameters;
  /**
   * A copy of the instances containing only the attributes tested
   * below this node---used to construct the linear model for this node
   */
  private Instances	   m_reducedI;
  /**
   * the mean squared error of the model at this node (either linear or
   * subtree)
   */
  private double	   m_rootMeanSquaredError;
  /**
   * the Attribute filter used to remove any attributes not presented to
   * the linear regression model
   */
  private Remove  m_attributeFilter;
  /**
   * child nodes
   */
  protected RuleNode	   m_left;
  protected RuleNode	   m_right;
  /**
   * the parent of this node
   */
  private RuleNode	   m_parent;
  /**
   * a node will not be split if it contains less then m_splitNum isntances
   */
  private double	   m_splitNum = 3.5;
  /**
   * a node will not be split if its class standard deviation is less
   * than 5% of the class standard deviation of all the instances
   */
  private double	   m_devFraction = 0.05;
  private double	   m_pruningMultiplier = 2;
  /**
   * the number assigned to the linear model if this node is a leaf.
   * = 0 if this node is not a leaf
   */
  private int		   m_leafModelNum;
  /**
   * a node will not be split if the class deviation of its
   * instances is less than m_devFraction of the deviation of the
   * global class
   */
  private double	   m_globalDeviation;
  /**
   * the absolute deviation of the global class
   */
  private double	   m_globalAbsDeviation;
  /**
   * Use the original m5 smoothing procedure during prediction of
   * novel test cases
   */
  private boolean	   m_smoothPredictions;
  /**
   * Used to disable smoothing during pruning
   */
  private boolean	   m_smoothingOn;
  /**
   * Indices of the attributes to be used in generating a linear model
   * at this node
   */
  private int [] m_indices;
    
  /**
   * Constant used in original m5 smoothing calculation
   */
  private static final double	   SMOOTHING_CONSTANT = 15.0;
  /**
   * Node id.
   */
  private int m_id;
  /**
   * Save the instances at each node (for visualizing in the
   * Explorer's treevisualizer.
   */
  private boolean m_saveInstances = false;
  /**
   * Make a regression tree instead of a model tree
   */
  private boolean m_regressionTree;
  /**
   * Creates a new <code>RuleNode</code> instance.
   *
   * @param globalDev the global standard deviation of the class
   * @param globalAbsDev the global absolute deviation of the class
   * @param parent the parent of this node
   */
  public RuleNode(double globalDev, double globalAbsDev, RuleNode parent) {
    m_nodeModel = null;
    m_right = null;
    m_left = null;
    m_parent = parent;
    m_globalDeviation = globalDev;
    m_globalAbsDeviation = globalAbsDev;
    m_attributeFilter = null;
    m_smoothPredictions = false;
  }
    
  /**
   * Build this node (find an attribute and split point)
   *
   * @param data the instances on which to build this node
   * @exception Exception if an error occurs
   */
  public void buildClassifier(Instances data) throws Exception {
    m_smoothingOn = false;
    m_rootMeanSquaredError = Double.MAX_VALUE;
    //    m_instances = new Instances(data);
    m_instances = data;
    m_classIndex = m_instances.classIndex();
    m_numInstances = m_instances.numInstances();
    m_numAttributes = m_instances.numAttributes();
    m_nodeModel = null;
    m_right = null;
    m_left = null;
    m_attributeFilter = null;
    if ((m_numInstances < m_splitNum) 
	|| (Rule.stdDev(m_classIndex, m_instances) 
	    < (m_globalDeviation * m_devFraction))) {
      m_isLeaf = true;
    } else {
      m_isLeaf = false;
    } 
    split();
  } 
 
  /**
   * Classify an instance using this node. Recursively calls classifyInstance
   * on child nodes.
   *
   * @param inst the instance to classify
   * @return the prediction for this instance
   * @exception Exception if an error occurs
   */
  public double classifyInstance(Instance inst) throws Exception {
    double   pred;
    double   n = 0;
    Instance tempInst;
    if (m_isLeaf) {
      if (m_nodeModel == null) {
	throw new Exception("Classifier has not been built correctly.");
      } 
      m_attributeFilter.input(inst);
      tempInst = m_attributeFilter.output();
      return m_nodeModel.classifyInstance(tempInst);
    } 
    if (inst.value(m_splitAtt) <= m_splitValue) {
      if (m_left == null) {
	m_attributeFilter.input(inst);
	tempInst = m_attributeFilter.output();
	return m_nodeModel.classifyInstance(tempInst);
      } 
      pred = m_left.classifyInstance(inst);
      n = m_left.m_numInstances;
    } else {
      if (m_right == null) {
	m_attributeFilter.input(inst);
	tempInst = m_attributeFilter.output();
	return m_nodeModel.classifyInstance(tempInst);
      } 
      pred = m_right.classifyInstance(inst);
      n = m_right.m_numInstances;
    } 
    if (m_smoothingOn && m_smoothPredictions) {
      m_attributeFilter.input(inst);
      tempInst = m_attributeFilter.output();
      double supportPred = m_nodeModel.classifyInstance(tempInst);
      pred = smoothingOriginal(n, pred, supportPred);
    } 
    return pred;
  } 
  /**
   * Applies the m5 smoothing procedure to a prediction
   *
   * @param n number of instances in selected child of this node
   * @param pred the prediction so far
   * @param supportPred the prediction of the linear model at this node
   * @return the current prediction smoothed with the prediction of the
   * linear model at this node
   * @exception Exception if an error occurs
   */
  protected static double smoothingOriginal(double n, double pred, 
					    double supportPred) 
    throws Exception {
    double   smoothed;
    smoothed = 
      ((n * pred) + (SMOOTHING_CONSTANT * supportPred)) /
      (n + SMOOTHING_CONSTANT);
    return smoothed;
  } 
  /**
   * Finds an attribute and split point for this node
   *
   * @exception Exception if an error occurs
   */
  public void split() throws Exception {
    int		  i;
    Instances     leftSubset, rightSubset;
    SplitEvaluate bestSplit, currentSplit;
    boolean[]     attsBelow;
    if (!m_isLeaf) {
     
      bestSplit = new YongSplitInfo(0, m_numInstances - 1, -1);
      currentSplit = new YongSplitInfo(0, m_numInstances - 1, -1);
      // find the best attribute to split on
      for (i = 0; i < m_numAttributes; i++) {
	if (i != m_classIndex) {
	  // sort the instances by this attribute
	  m_instances.sort(i);
	  currentSplit.attrSplit(i, m_instances);
	  if ((Math.abs(currentSplit.maxImpurity() - 
			bestSplit.maxImpurity()) > 1.e-6) 
	      && (currentSplit.maxImpurity() 
		  > bestSplit.maxImpurity() + 1.e-6)) {
	    bestSplit = currentSplit.copy();
	  } 
	} 
      } 
      // cant find a good split or split point?
      if (bestSplit.splitAttr() < 0 || bestSplit.position() < 1 
	  || bestSplit.position() > m_numInstances - 1) {
	m_isLeaf = true;
      } else {
	m_splitAtt = bestSplit.splitAttr();
	m_splitValue = bestSplit.splitValue();
	leftSubset = new Instances(m_instances, m_numInstances);
	rightSubset = new Instances(m_instances, m_numInstances);
	for (i = 0; i < m_numInstances; i++) {
	  if (m_instances.instance(i).value(m_splitAtt) <= m_splitValue) {
	    leftSubset.add(m_instances.instance(i));
	  } else {
	    rightSubset.add(m_instances.instance(i));
	  } 
	} 
	leftSubset.compactify();
	rightSubset.compactify();
	// build left and right nodes
	m_left = new RuleNode(m_globalDeviation, m_globalAbsDeviation, this);
	m_left.setRegressionTree(m_regressionTree);
	m_left.setSmoothing(m_smoothPredictions);
	m_left.setSaveInstances(m_saveInstances);
	m_left.buildClassifier(leftSubset);
	m_right = new RuleNode(m_globalDeviation, m_globalAbsDeviation, this);
	
	m_right.setRegressionTree(m_regressionTree);
	m_right.setSmoothing(m_smoothPredictions);
	m_right.setSaveInstances(m_saveInstances);
	m_right.buildClassifier(rightSubset);
	// now find out what attributes are tested in the left and right
	// subtrees and use them to learn a linear model for this node
	if (!m_regressionTree) {
	  attsBelow = attsTestedBelow();
	  attsBelow[m_classIndex] = true;
	  int count = 0, j;
	  for (j = 0; j < m_numAttributes; j++) {
	    if (attsBelow[j]) {
	      count++;
	    } 
	  } 
	  
	  int[] indices = new int[count];
	  count = 0;
	  
	  for (j = 0; j < m_numAttributes; j++) {
	    if (attsBelow[j] && (j != m_classIndex)) {
	      indices[count++] = j;
	    } 
	  } 
	  
	  indices[count] = m_classIndex;
	  m_indices = indices;
	} else {
	  m_indices = new int [1];
	  m_indices[0] = m_classIndex;
	  m_numParameters = 1;
	}
      } 
    } 
    if (m_isLeaf) {
      int [] indices = new int [1];
      indices[0] = m_classIndex;
      m_indices = indices;
      m_numParameters = 1;
     
      // need to evaluate the model here if want correct stats for unpruned
      // tree
    } 
  } 
  /**
   * Build a linear model for this node using those attributes
   * specified in indices.
   *
   * @param indices an array of attribute indices to include in the linear
   * model
   */
  private void buildLinearModel(int [] indices) throws Exception {
    // copy the training instances and remove all but the tested
    // attributes
    m_reducedI = new Instances(m_instances);
    m_attributeFilter = new Remove();
    
    m_attributeFilter.setInvertSelection(true);
    m_attributeFilter.setAttributeIndicesArray(indices);
    m_attributeFilter.setInputFormat(m_reducedI);
    m_reducedI = Filter.useFilter(m_reducedI, m_attributeFilter);
    
    // build a linear regression for the training data using the
    // tested attributes
    m_nodeModel = new LinearRegression();
    
    m_nodeModel.buildClassifier(m_reducedI);
  }
  /**
   * Returns an array containing the indexes of attributes used in tests
   * above this node
   *
   * @return an array of attribute indexes
   */
  private boolean[] attsTestedAbove() {
    boolean[] atts = new boolean[m_numAttributes];
    boolean[] attsAbove = null;
    if (m_parent != null) {
      attsAbove = m_parent.attsTestedAbove();
    } 
    if (attsAbove != null) {
      for (int i = 0; i < m_numAttributes; i++) {
	atts[i] = attsAbove[i];
      } 
    } 
    atts[m_splitAtt] = true;
    return atts;
  } 
  /**
   * Returns an array containing the indexes of attributes used in tests
   * below this node
   *
   * @return an array of attribute indexes
   */
  private boolean[] attsTestedBelow() {
    boolean[] attsBelow = new boolean[m_numAttributes];
    boolean[] attsBelowLeft = null;
    boolean[] attsBelowRight = null;
    if (m_right != null) {
      attsBelowRight = m_right.attsTestedBelow();
    } 
    if (m_left != null) {
      attsBelowLeft = m_left.attsTestedBelow();
    } 
    for (int i = 0; i < m_numAttributes; i++) {
      if (attsBelowLeft != null) {
	attsBelow[i] = (attsBelow[i] || attsBelowLeft[i]);
      } 
      if (attsBelowRight != null) {
	attsBelow[i] = (attsBelow[i] || attsBelowRight[i]);
      } 
    } 
    if (!m_isLeaf) {
      attsBelow[m_splitAtt] = true;
    } 
    return attsBelow;
  } 
  /**
   * Sets the leaves' numbers
   * @param leafCounter the number of leaves counted
   * @return the number of the total leaves under the node
   */
  public int numLeaves(int leafCounter) {
    // turn smoothing on (if requested) once model has been built
    if (m_smoothPredictions) {
      m_smoothingOn = true;
    } 
    if (!m_isLeaf) {
      // node
      m_leafModelNum = 0;
      if (m_left != null) {
	leafCounter = m_left.numLeaves(leafCounter);
      } 
      if (m_right != null) {
	leafCounter = m_right.numLeaves(leafCounter);
      } 
    } else {
      // leaf
      leafCounter++;
      m_leafModelNum = leafCounter;
    } 
    return leafCounter;
  } 
  /**
   * print the linear model at this node
   */
  public String toString() {
    return printNodeLinearModel();
  } 
  /**
   * print the linear model at this node
   */
  public String printNodeLinearModel() {
    return m_nodeModel.toString();
  } 
  /**
   * print all leaf models
   */
  public String printLeafModels() {
    StringBuffer text = new StringBuffer();
    if (m_isLeaf) {
      text.append("nLM num: " + m_leafModelNum);
      text.append(m_nodeModel.toString());
      text.append("n");
    } else {
      text.append(m_left.printLeafModels());
      text.append(m_right.printLeafModels());
    } 
    return text.toString();
  } 
  /**
   * Returns a description of this node (debugging purposes)
   *
   * @return a string describing this node
   */
  public String nodeToString() {
    StringBuffer text = new StringBuffer();
    System.out.println("In to string");
    text.append("Node:ntnum inst: " + m_numInstances);
    if (m_isLeaf) {
      text.append("ntleaf");
    } else {
      text.append("tnode");
    }
    text.append("ntSplit att: " + m_instances.attribute(m_splitAtt).name());
    text.append("ntSplit val: " + Utils.doubleToString(m_splitValue, 1, 3));
    text.append("ntLM num: " + m_leafModelNum);
    text.append("ntLinear modeln" + m_nodeModel.toString());
    text.append("nn");
    if (m_left != null) {
      text.append(m_left.nodeToString());
    } 
    if (m_right != null) {
      text.append(m_right.nodeToString());
    } 
    return text.toString();
  } 
  /**
   * Recursively builds a textual description of the tree
   *
   * @param level the level of this node
   * @return string describing the tree
   */
  public String treeToString(int level) {
    int		 i;
    StringBuffer text = new StringBuffer();
    if (!m_isLeaf) {
      text.append("n");
      for (i = 1; i <= level; i++) {
	text.append("|   ");
      } 
      if (m_instances.attribute(m_splitAtt).name().charAt(0) != '[') {
	text.append(m_instances.attribute(m_splitAtt).name() + " <= " 
		    + Utils.doubleToString(m_splitValue, 1, 3) + " : ");
      } else {
	text.append(m_instances.attribute(m_splitAtt).name() + " false : ");
      } 
      if (m_left != null) {
	text.append(m_left.treeToString(level + 1));
      } else {
	text.append("NULLn");
      }
      for (i = 1; i <= level; i++) {
	text.append("|   ");
      } 
      if (m_instances.attribute(m_splitAtt).name().charAt(0) != '[') {
	text.append(m_instances.attribute(m_splitAtt).name() + " >  " 
		    + Utils.doubleToString(m_splitValue, 1, 3) + " : ");
      } else {
	text.append(m_instances.attribute(m_splitAtt).name() + " true : ");
      } 
      if (m_right != null) {
	text.append(m_right.treeToString(level + 1));
      } else {
	text.append("NULLn");
      }
    } else {
      text.append("LM" + m_leafModelNum);
      if (m_globalDeviation > 0.0) {
	text
	  .append(" (" + m_numInstances + "/" 
		  + Utils.doubleToString((100.0 * m_rootMeanSquaredError /
					     m_globalAbsDeviation), 1, 3) 
		  + "%)n");
      } else {
	text.append(" (" + m_numInstances + ")n");
      } 
    } 
    return text.toString();
  } 
  /**
   * Recursively prune the tree
   *
   * @exception Exception if an error occurs
   */
  public void prune() throws Exception {
    Evaluation nodeModelEval = null;
    if (m_isLeaf) {
      buildLinearModel(m_indices);
      nodeModelEval = new Evaluation(m_reducedI);
      if (m_reducedI == null) {
	throw new Exception("No instances at leaf!");
      } 
      // count the constant term as a paramter for a leaf
      // Evaluate the model
      nodeModelEval.evaluateModel(m_nodeModel, m_reducedI);
      m_rootMeanSquaredError = nodeModelEval.rootMeanSquaredError();
    } else {
      // Prune the left and right subtrees
      if (m_left != null) {
	m_left.prune();
      } 
      if (m_right != null) {
	m_right.prune();	
      } 
      
      buildLinearModel(m_indices);
      nodeModelEval = new Evaluation(m_reducedI);
      double rmsModel;
      double adjustedErrorModel;
      nodeModelEval.evaluateModel(m_nodeModel, m_reducedI);
      rmsModel = nodeModelEval.rootMeanSquaredError();
      adjustedErrorModel = rmsModel 
	* pruningFactor(m_numInstances, 
			m_nodeModel.numParameters() + 1);
      // Evaluate this node (ie its left and right subtrees)
      Evaluation nodeEval = new Evaluation(m_instances);
      double     rmsSubTree;
      double     adjustedErrorNode;
      int	 l_params = 0, r_params = 0;
      nodeEval.evaluateModel(this, m_instances);
      rmsSubTree = nodeEval.rootMeanSquaredError();
      if (m_left != null) {
	l_params = m_left.numParameters();
      } 
      if (m_right != null) {
	r_params = m_right.numParameters();
      } 
      adjustedErrorNode = rmsSubTree 
	* pruningFactor(m_numInstances, 
			(l_params + r_params + 1));
      if ((adjustedErrorModel <= adjustedErrorNode) 
	  || (adjustedErrorModel < (m_globalDeviation * 0.00001))) {
	// Choose linear model for this node rather than subtree model
	m_isLeaf = true;
	m_right = null;
	m_left = null;
	m_numParameters = m_nodeModel.numParameters() + 1;
	m_rootMeanSquaredError = rmsModel;
      } else {
	m_numParameters = (l_params + r_params + 1);
	m_rootMeanSquaredError = rmsSubTree;
      } 
    }
    // save space
    if (!m_saveInstances) {
      m_instances = new Instances(m_instances, 0);
    }
    m_reducedI = new Instances(m_reducedI, 0);
  } 
  /**
   * Compute the pruning factor
   *
   * @param num_instances number of instances
   * @param num_params number of parameters in the model
   * @return the pruning factor
   */
  private double pruningFactor(int num_instances, int num_params) {
    if (num_instances <= num_params) {
      return 10.0;    // Caution says Yong in his code
    } 
    return ((double) (num_instances + m_pruningMultiplier * num_params) 
	    / (double) (num_instances - num_params));
  } 
  /**
   * Find the leaf with greatest coverage
   *
   * @param maxCoverage the greatest coverage found so far
   * @param bestLeaf the leaf with the greatest coverage
   */
  public void findBestLeaf(double[] maxCoverage, RuleNode[] bestLeaf) {
    if (!m_isLeaf) {
      if (m_left != null) {
	m_left.findBestLeaf(maxCoverage, bestLeaf);
      } 
      if (m_right != null) {
	m_right.findBestLeaf(maxCoverage, bestLeaf);
      } 
    } else {
      if (m_numInstances > maxCoverage[0]) {
	maxCoverage[0] = m_numInstances;
	bestLeaf[0] = this;
      } 
    } 
  } 
  /**
   * Return a list containing all the leaves in the tree
   *
   * @param v a single element array containing a vector of leaves
   */
  public void returnLeaves(FastVector[] v) {
    if (m_isLeaf) {
      v[0].addElement(this);
    } else {
      if (m_left != null) {
	m_left.returnLeaves(v);
      } 
      if (m_right != null) {
	m_right.returnLeaves(v);
      } 
    } 
  } 
  /**
   * Get the parent of this node
   *
   * @return the parent of this node
   */
  public RuleNode parentNode() {
    return m_parent;
  } 
  /**
   * Get the left child of this node
   *
   * @return the left child of this node
   */
  public RuleNode leftNode() {
    return m_left;
  } 
  /**
   * Get the right child of this node
   *
   * @return the right child of this node
   */
  public RuleNode rightNode() {
    return m_right;
  } 
  /**
   * Get the index of the splitting attribute for this node
   *
   * @return the index of the splitting attribute
   */
  public int splitAtt() {
    return m_splitAtt;
  } 
  /**
   * Get the split point for this node
   *
   * @return the split point for this node
   */
  public double splitVal() {
    return m_splitValue;
  } 
  /**
   * Get the number of linear models in the tree
   *
   * @return the number of linear models
   */
  public int numberOfLinearModels() {
    if (m_isLeaf) {
      return 1;
    } else {
      return m_left.numberOfLinearModels() + m_right.numberOfLinearModels();
    } 
  } 
  /**
   * Return true if this node is a leaf
   *
   * @return true if this node is a leaf
   */
  private boolean isLeaf() {
    return m_isLeaf;
  } 
  /**
   * Get the root mean squared error at this node
   *
   * @return the root mean squared error
   */
  protected double rootMeanSquaredError() {
    return m_rootMeanSquaredError;
  } 
  /**
   * Get the linear model at this node
   *
   * @return the linear model at this node
   */
  protected LinearRegression getModel() {
    return m_nodeModel;
  } 
  /**
   * Get the number of parameters in the model at this node
   *
   * @return the number of parameters in the model at this node
   */
  private int numParameters() {
    return m_numParameters;
  } 
  /**
   * Get if smoothing is being used
   *
   * @param s true if smoothing is being used
   */
  public void setSmoothing(boolean s) {
    m_smoothPredictions = s;
  } 
  /**
   * Method declaration
   *
   * @return true if smoothing has been selected.
   *
   */
  public boolean getSmoothing() {
    return m_smoothPredictions;
  } 
  
  /**
   * Get the value of regressionTree.
   *
   * @return Value of regressionTree.
   */
  public boolean getRegressionTree() {
    
    return m_regressionTree;
  }
  
  /**
   * Set the value of regressionTree.
   *
   * @param newregressionTree Value to assign to regressionTree.
   */
  public void setRegressionTree(boolean newregressionTree) {
    
    m_regressionTree = newregressionTree;
  }
  
  /**
   * Apply the attribute filter at this node to a set of supplied instances
   *
   * @param inst the instances to apply the filter to
   * @return a filtered set of instances
   * @exception Exception if an error occurs
   */
  protected Instance applyNodeFilter(Instance inst) throws Exception {
    m_attributeFilter.input(inst);
    return m_attributeFilter.output();
  }
							  
  /**
   * Print all the linear models at the learf (debugging purposes)
   */
  public void printAllModels() {
    if (m_isLeaf) {
      System.out.println(m_nodeModel.toString());
    } else {
      System.out.println(m_nodeModel.toString());
      m_left.printAllModels();
      m_right.printAllModels();
    } 
  } 
  /**
   * Assigns a unique identifier to each node in the tree
   *
   * @param lastID last id number used
   * @return ID after processing child nodes
   */
  protected int assignIDs(int lastID) {
    int currLastID = lastID + 1;
    m_id = currLastID;
    if (m_left != null) {
      currLastID = m_left.assignIDs(currLastID);
    }
    if (m_right != null) {
      currLastID = m_right.assignIDs(currLastID);
    }
    return currLastID;
  }
  /**
   * Assign a unique identifier to each node in the tree and then
   * calls graphTree
   *
   * @param text a <code>StringBuffer</code> value
   */
  protected void graph(StringBuffer text) {
    assignIDs(-1);
    graphTree(text);
  }
  /**
   * Return a dotty style string describing the tree
   *
   * @param text a <code>StringBuffer</code> value
   */
  protected void graphTree(StringBuffer text) {
    text.append("N" + m_id
		+ (m_isLeaf 
		   ? " [label="LM " + m_leafModelNum
		   : " [label="" + m_instances.attribute(m_splitAtt).name())
		+ (m_isLeaf
		 ? " (" + ((m_globalDeviation > 0.0) 
			  ?  m_numInstances + "/" 
			     + Utils.doubleToString((100.0 * 
						     m_rootMeanSquaredError /
						     m_globalAbsDeviation), 
						    1, 3) 
			     + "%)"
			   : m_numInstances + ")")
		    + "" shape=box style=filled "
		   : """)
		+ (m_saveInstances
		   ? "data=n" + m_instances + "n,n"
		   : "")
		+ "]n");
		
    if (m_left != null) {
      text.append("N" + m_id + "->" + "N" + m_left.m_id + " [label="<="
		  + Utils.doubleToString(m_splitValue, 1, 3)
		  + ""]n");
      m_left.graphTree(text);
    }
     
    if (m_right != null) {
      text.append("N" + m_id + "->" + "N" + m_right.m_id + " [label=">"
		  + Utils.doubleToString(m_splitValue, 1, 3)
		  + ""]n");
      m_right.graphTree(text);
    }
  }
  /**
   * Set whether to save instances for visualization purposes.
   * Default is to save memory.
   *
   * @param save a <code>boolean</code> value
   */
  protected void setSaveInstances(boolean save) {
    m_saveInstances = save;
  }
}