Context Navigation

source: src/main/java/weka/classifiers/trees/ADTree.java @ 22

Last change on this file since 22 was 4, checked in by gnappo, 14 years ago
Import di weka.
File size: 50.1 KB

Rev	Line
[4]	1	/*
	2	* This program is free software; you can redistribute it and/or modify
	3	* it under the terms of the GNU General Public License as published by
	4	* the Free Software Foundation; either version 2 of the License, or
	5	* (at your option) any later version.
	6	*
	7	* This program is distributed in the hope that it will be useful,
	8	* but WITHOUT ANY WARRANTY; without even the implied warranty of
	9	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
	10	* GNU General Public License for more details.
	11	*
	12	* You should have received a copy of the GNU General Public License
	13	* along with this program; if not, write to the Free Software
	14	* Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
	15	*/
	16
	17	/*
	18	* ADTree.java
	19	* Copyright (C) 2001 University of Waikato, Hamilton, New Zealand
	20	*
	21	*/
	22
	23	package weka.classifiers.trees;
	24
	25	import weka.classifiers.Classifier;
	26	import weka.classifiers.AbstractClassifier;
	27	import weka.classifiers.IterativeClassifier;
	28	import weka.classifiers.trees.adtree.PredictionNode;
	29	import weka.classifiers.trees.adtree.ReferenceInstances;
	30	import weka.classifiers.trees.adtree.Splitter;
	31	import weka.classifiers.trees.adtree.TwoWayNominalSplit;
	32	import weka.classifiers.trees.adtree.TwoWayNumericSplit;
	33	import weka.core.AdditionalMeasureProducer;
	34	import weka.core.Attribute;
	35	import weka.core.Capabilities;
	36	import weka.core.Drawable;
	37	import weka.core.FastVector;
	38	import weka.core.Instance;
	39	import weka.core.Instances;
	40	import weka.core.Option;
	41	import weka.core.OptionHandler;
	42	import weka.core.RevisionUtils;
	43	import weka.core.SelectedTag;
	44	import weka.core.SerializedObject;
	45	import weka.core.Tag;
	46	import weka.core.TechnicalInformation;
	47	import weka.core.TechnicalInformationHandler;
	48	import weka.core.Utils;
	49	import weka.core.WeightedInstancesHandler;
	50	import weka.core.Capabilities.Capability;
	51	import weka.core.TechnicalInformation.Field;
	52	import weka.core.TechnicalInformation.Type;
	53
	54	import java.util.Enumeration;
	55	import java.util.Random;
	56	import java.util.Vector;
	57
	58	/**
	59	<!-- globalinfo-start -->
	60	* Class for generating an alternating decision tree. The basic algorithm is based on:<br/>
	61	* <br/>
	62	* Freund, Y., Mason, L.: The alternating decision tree learning algorithm. In: Proceeding of the Sixteenth International Conference on Machine Learning, Bled, Slovenia, 124-133, 1999.<br/>
	63	* <br/>
	64	* This version currently only supports two-class problems. The number of boosting iterations needs to be manually tuned to suit the dataset and the desired complexity/accuracy tradeoff. Induction of the trees has been optimized, and heuristic search methods have been introduced to speed learning.
	65	* <p/>
	66	<!-- globalinfo-end -->
	67	*
	68	<!-- technical-bibtex-start -->
	69	* BibTeX:
	70	* <pre>
	71	* @inproceedings{Freund1999,
	72	* address = {Bled, Slovenia},
	73	* author = {Freund, Y. and Mason, L.},
	74	* booktitle = {Proceeding of the Sixteenth International Conference on Machine Learning},
	75	* pages = {124-133},
	76	* title = {The alternating decision tree learning algorithm},
	77	* year = {1999}
	78	* }
	79	* </pre>
	80	* <p/>
	81	<!-- technical-bibtex-end -->
	82	*
	83	<!-- options-start -->
	84	* Valid options are: <p/>
	85	*
	86	* <pre> -B <number of boosting iterations>
	87	* Number of boosting iterations.
	88	* (Default = 10)</pre>
	89	*
	90	* <pre> -E <-3|-2|-1|>=0>
	91	* Expand nodes: -3(all), -2(weight), -1(z_pure), >=0 seed for random walk
	92	* (Default = -3)</pre>
	93	*
	94	* <pre> -D
	95	* Save the instance data with the model</pre>
	96	*
	97	<!-- options-end -->
	98	*
	99	* @author Richard Kirkby (rkirkby@cs.waikato.ac.nz)
	100	* @author Bernhard Pfahringer (bernhard@cs.waikato.ac.nz)
	101	* @version $Revision: 5928 $
	102	*/
	103	public class ADTree
	104	extends AbstractClassifier
	105	implements OptionHandler, Drawable, AdditionalMeasureProducer,
	106	WeightedInstancesHandler, IterativeClassifier,
	107	TechnicalInformationHandler {
	108
	109	/** for serialization */
	110	static final long serialVersionUID = -1532264837167690683L;
	111
	112	/**
	113	* Returns a string describing classifier
	114	* @return a description suitable for
	115	* displaying in the explorer/experimenter gui
	116	*/
	117	public String globalInfo() {
	118
	119	return "Class for generating an alternating decision tree. The basic "
	120	+ "algorithm is based on:\n\n"
	121	+ getTechnicalInformation().toString() + "\n\n"
	122	+ "This version currently only supports two-class problems. The number of boosting "
	123	+ "iterations needs to be manually tuned to suit the dataset and the desired "
	124	+ "complexity/accuracy tradeoff. Induction of the trees has been optimized, and heuristic "
	125	+ "search methods have been introduced to speed learning.";
	126	}
	127
	128	/** search mode: Expand all paths */
	129	public static final int SEARCHPATH_ALL = 0;
	130	/** search mode: Expand the heaviest path */
	131	public static final int SEARCHPATH_HEAVIEST = 1;
	132	/** search mode: Expand the best z-pure path */
	133	public static final int SEARCHPATH_ZPURE = 2;
	134	/** search mode: Expand a random path */
	135	public static final int SEARCHPATH_RANDOM = 3;
	136	/** The search modes */
	137	public static final Tag [] TAGS_SEARCHPATH = {
	138	new Tag(SEARCHPATH_ALL, "Expand all paths"),
	139	new Tag(SEARCHPATH_HEAVIEST, "Expand the heaviest path"),
	140	new Tag(SEARCHPATH_ZPURE, "Expand the best z-pure path"),
	141	new Tag(SEARCHPATH_RANDOM, "Expand a random path")
	142	};
	143
	144	/** The instances used to train the tree */
	145	protected Instances m_trainInstances;
	146
	147	/** The root of the tree */
	148	protected PredictionNode m_root = null;
	149
	150	/** The random number generator - used for the random search heuristic */
	151	protected Random m_random = null;
	152
	153	/** The number of the last splitter added to the tree */
	154	protected int m_lastAddedSplitNum = 0;
	155
	156	/** An array containing the indices of the numeric attributes in the data */
	157	protected int[] m_numericAttIndices;
	158
	159	/** An array containing the indices of the nominal attributes in the data */
	160	protected int[] m_nominalAttIndices;
	161
	162	/** The total weight of the instances - used to speed Z calculations */
	163	protected double m_trainTotalWeight;
	164
	165	/** The training instances with positive class - referencing the training dataset */
	166	protected ReferenceInstances m_posTrainInstances;
	167
	168	/** The training instances with negative class - referencing the training dataset */
	169	protected ReferenceInstances m_negTrainInstances;
	170
	171	/** The best node to insert under, as found so far by the latest search */
	172	protected PredictionNode m_search_bestInsertionNode;
	173
	174	/** The best splitter to insert, as found so far by the latest search */
	175	protected Splitter m_search_bestSplitter;
	176
	177	/** The smallest Z value found so far by the latest search */
	178	protected double m_search_smallestZ;
	179
	180	/** The positive instances that apply to the best path found so far */
	181	protected Instances m_search_bestPathPosInstances;
	182
	183	/** The negative instances that apply to the best path found so far */
	184	protected Instances m_search_bestPathNegInstances;
	185
	186	/** Statistics - the number of prediction nodes investigated during search */
	187	protected int m_nodesExpanded = 0;
	188
	189	/** Statistics - the number of instances processed during search */
	190	protected int m_examplesCounted = 0;
	191
	192	/** Option - the number of boosting iterations to perform */
	193	protected int m_boostingIterations = 10;
	194
	195	/** Option - the search mode */
	196	protected int m_searchPath = 0;
	197
	198	/** Option - the seed to use for a random search */
	199	protected int m_randomSeed = 0;
	200
	201	/** Option - whether the tree should remember the instance data */
	202	protected boolean m_saveInstanceData = false;
	203
	204	/**
	205	* Returns an instance of a TechnicalInformation object, containing
	206	* detailed information about the technical background of this class,
	207	* e.g., paper reference or book this class is based on.
	208	*
	209	* @return the technical information about this class
	210	*/
	211	public TechnicalInformation getTechnicalInformation() {
	212	TechnicalInformation result;
	213
	214	result = new TechnicalInformation(Type.INPROCEEDINGS);
	215	result.setValue(Field.AUTHOR, "Freund, Y. and Mason, L.");
	216	result.setValue(Field.YEAR, "1999");
	217	result.setValue(Field.TITLE, "The alternating decision tree learning algorithm");
	218	result.setValue(Field.BOOKTITLE, "Proceeding of the Sixteenth International Conference on Machine Learning");
	219	result.setValue(Field.ADDRESS, "Bled, Slovenia");
	220	result.setValue(Field.PAGES, "124-133");
	221
	222	return result;
	223	}
	224
	225	/**
	226	* Sets up the tree ready to be trained, using two-class optimized method.
	227	*
	228	* @param instances the instances to train the tree with
	229	* @exception Exception if training data is unsuitable
	230	*/
	231	public void initClassifier(Instances instances) throws Exception {
	232
	233	// clear stats
	234	m_nodesExpanded = 0;
	235	m_examplesCounted = 0;
	236	m_lastAddedSplitNum = 0;
	237
	238	// prepare the random generator
	239	m_random = new Random(m_randomSeed);
	240
	241	// create training set
	242	m_trainInstances = new Instances(instances);
	243
	244	// create positive/negative subsets
	245	m_posTrainInstances = new ReferenceInstances(m_trainInstances,
	246	m_trainInstances.numInstances());
	247	m_negTrainInstances = new ReferenceInstances(m_trainInstances,
	248	m_trainInstances.numInstances());
	249	for (Enumeration e = m_trainInstances.enumerateInstances(); e.hasMoreElements(); ) {
	250	Instance inst = (Instance) e.nextElement();
	251	if ((int) inst.classValue() == 0)
	252	m_negTrainInstances.addReference(inst); // belongs in negative class
	253	else
	254	m_posTrainInstances.addReference(inst); // belongs in positive class
	255	}
	256	m_posTrainInstances.compactify();
	257	m_negTrainInstances.compactify();
	258
	259	// create the root prediction node
	260	double rootPredictionValue = calcPredictionValue(m_posTrainInstances,
	261	m_negTrainInstances);
	262	m_root = new PredictionNode(rootPredictionValue);
	263
	264	// pre-adjust weights
	265	updateWeights(m_posTrainInstances, m_negTrainInstances, rootPredictionValue);
	266
	267	// pre-calculate what we can
	268	generateAttributeIndicesSingle();
	269	}
	270
	271	/**
	272	* Performs one iteration.
	273	*
	274	* @param iteration the index of the current iteration (0-based)
	275	* @exception Exception if this iteration fails
	276	*/
	277	public void next(int iteration) throws Exception {
	278
	279	boost();
	280	}
	281
	282	/**
	283	* Performs a single boosting iteration, using two-class optimized method.
	284	* Will add a new splitter node and two prediction nodes to the tree
	285	* (unless merging takes place).
	286	*
	287	* @exception Exception if try to boost without setting up tree first or there are no
	288	* instances to train with
	289	*/
	290	public void boost() throws Exception {
	291
	292	if (m_trainInstances == null \|\| m_trainInstances.numInstances() == 0)
	293	throw new Exception("Trying to boost with no training data");
	294
	295	// perform the search
	296	searchForBestTestSingle();
	297
	298	if (m_search_bestSplitter == null) return; // handle empty instances
	299
	300	// create the new nodes for the tree, updating the weights
	301	for (int i=0; i<2; i++) {
	302	Instances posInstances =
	303	m_search_bestSplitter.instancesDownBranch(i, m_search_bestPathPosInstances);
	304	Instances negInstances =
	305	m_search_bestSplitter.instancesDownBranch(i, m_search_bestPathNegInstances);
	306	double predictionValue = calcPredictionValue(posInstances, negInstances);
	307	PredictionNode newPredictor = new PredictionNode(predictionValue);
	308	updateWeights(posInstances, negInstances, predictionValue);
	309	m_search_bestSplitter.setChildForBranch(i, newPredictor);
	310	}
	311
	312	// insert the new nodes
	313	m_search_bestInsertionNode.addChild((Splitter) m_search_bestSplitter, this);
	314
	315	// free memory
	316	m_search_bestPathPosInstances = null;
	317	m_search_bestPathNegInstances = null;
	318	m_search_bestSplitter = null;
	319	}
	320
	321	/**
	322	* Generates the m_nominalAttIndices and m_numericAttIndices arrays to index
	323	* the respective attribute types in the training data.
	324	*
	325	*/
	326	private void generateAttributeIndicesSingle() {
	327
	328	// insert indices into vectors
	329	FastVector nominalIndices = new FastVector();
	330	FastVector numericIndices = new FastVector();
	331
	332	for (int i=0; i<m_trainInstances.numAttributes(); i++) {
	333	if (i != m_trainInstances.classIndex()) {
	334	if (m_trainInstances.attribute(i).isNumeric())
	335	numericIndices.addElement(new Integer(i));
	336	else
	337	nominalIndices.addElement(new Integer(i));
	338	}
	339	}
	340
	341	// create nominal array
	342	m_nominalAttIndices = new int[nominalIndices.size()];
	343	for (int i=0; i<nominalIndices.size(); i++)
	344	m_nominalAttIndices[i] = ((Integer)nominalIndices.elementAt(i)).intValue();
	345
	346	// create numeric array
	347	m_numericAttIndices = new int[numericIndices.size()];
	348	for (int i=0; i<numericIndices.size(); i++)
	349	m_numericAttIndices[i] = ((Integer)numericIndices.elementAt(i)).intValue();
	350	}
	351
	352	/**
	353	* Performs a search for the best test (splitter) to add to the tree, by aiming to
	354	* minimize the Z value.
	355	*
	356	* @exception Exception if search fails
	357	*/
	358	private void searchForBestTestSingle() throws Exception {
	359
	360	// keep track of total weight for efficient wRemainder calculations
	361	m_trainTotalWeight = m_trainInstances.sumOfWeights();
	362
	363	m_search_smallestZ = Double.POSITIVE_INFINITY;
	364	searchForBestTestSingle(m_root, m_posTrainInstances, m_negTrainInstances);
	365	}
	366
	367	/**
	368	* Recursive function that carries out search for the best test (splitter) to add to
	369	* this part of the tree, by aiming to minimize the Z value. Performs Z-pure cutoff to
	370	* reduce search space.
	371	*
	372	* @param currentNode the root of the subtree to be searched, and the current node
	373	* being considered as parent of a new split
	374	* @param posInstances the positive-class instances that apply at this node
	375	* @param negInstances the negative-class instances that apply at this node
	376	* @exception Exception if search fails
	377	*/
	378	private void searchForBestTestSingle(PredictionNode currentNode,
	379	Instances posInstances, Instances negInstances)
	380	throws Exception {
	381
	382	// don't investigate pure or empty nodes any further
	383	if (posInstances.numInstances() == 0 \|\| negInstances.numInstances() == 0) return;
	384
	385	// do z-pure cutoff
	386	if (calcZpure(posInstances, negInstances) >= m_search_smallestZ) return;
	387
	388	// keep stats
	389	m_nodesExpanded++;
	390	m_examplesCounted += posInstances.numInstances() + negInstances.numInstances();
	391
	392	// evaluate static splitters (nominal)
	393	for (int i=0; i<m_nominalAttIndices.length; i++)
	394	evaluateNominalSplitSingle(m_nominalAttIndices[i], currentNode,
	395	posInstances, negInstances);
	396
	397	// evaluate dynamic splitters (numeric)
	398	if (m_numericAttIndices.length > 0) {
	399
	400	// merge the two sets of instances into one
	401	Instances allInstances = new Instances(posInstances);
	402	for (Enumeration e = negInstances.enumerateInstances(); e.hasMoreElements(); )
	403	allInstances.add((Instance) e.nextElement());
	404
	405	// use method of finding the optimal Z split-point
	406	for (int i=0; i<m_numericAttIndices.length; i++)
	407	evaluateNumericSplitSingle(m_numericAttIndices[i], currentNode,
	408	posInstances, negInstances, allInstances);
	409	}
	410
	411	if (currentNode.getChildren().size() == 0) return;
	412
	413	// keep searching
	414	switch (m_searchPath) {
	415	case SEARCHPATH_ALL:
	416	goDownAllPathsSingle(currentNode, posInstances, negInstances);
	417	break;
	418	case SEARCHPATH_HEAVIEST:
	419	goDownHeaviestPathSingle(currentNode, posInstances, negInstances);
	420	break;
	421	case SEARCHPATH_ZPURE:
	422	goDownZpurePathSingle(currentNode, posInstances, negInstances);
	423	break;
	424	case SEARCHPATH_RANDOM:
	425	goDownRandomPathSingle(currentNode, posInstances, negInstances);
	426	break;
	427	}
	428	}
	429
	430	/**
	431	* Continues single (two-class optimized) search by investigating every node in the
	432	* subtree under currentNode.
	433	*
	434	* @param currentNode the root of the subtree to be searched
	435	* @param posInstances the positive-class instances that apply at this node
	436	* @param negInstances the negative-class instances that apply at this node
	437	* @exception Exception if search fails
	438	*/
	439	private void goDownAllPathsSingle(PredictionNode currentNode,
	440	Instances posInstances, Instances negInstances)
	441	throws Exception {
	442
	443	for (Enumeration e = currentNode.children(); e.hasMoreElements(); ) {
	444	Splitter split = (Splitter) e.nextElement();
	445	for (int i=0; i<split.getNumOfBranches(); i++)
	446	searchForBestTestSingle(split.getChildForBranch(i),
	447	split.instancesDownBranch(i, posInstances),
	448	split.instancesDownBranch(i, negInstances));
	449	}
	450	}
	451
	452	/**
	453	* Continues single (two-class optimized) search by investigating only the path
	454	* with the most heavily weighted instances.
	455	*
	456	* @param currentNode the root of the subtree to be searched
	457	* @param posInstances the positive-class instances that apply at this node
	458	* @param negInstances the negative-class instances that apply at this node
	459	* @exception Exception if search fails
	460	*/
	461	private void goDownHeaviestPathSingle(PredictionNode currentNode,
	462	Instances posInstances, Instances negInstances)
	463	throws Exception {
	464
	465	Splitter heaviestSplit = null;
	466	int heaviestBranch = 0;
	467	double largestWeight = 0.0;
	468	for (Enumeration e = currentNode.children(); e.hasMoreElements(); ) {
	469	Splitter split = (Splitter) e.nextElement();
	470	for (int i=0; i<split.getNumOfBranches(); i++) {
	471	double weight =
	472	split.instancesDownBranch(i, posInstances).sumOfWeights() +
	473	split.instancesDownBranch(i, negInstances).sumOfWeights();
	474	if (weight > largestWeight) {
	475	heaviestSplit = split;
	476	heaviestBranch = i;
	477	largestWeight = weight;
	478	}
	479	}
	480	}
	481	if (heaviestSplit != null)
	482	searchForBestTestSingle(heaviestSplit.getChildForBranch(heaviestBranch),
	483	heaviestSplit.instancesDownBranch(heaviestBranch,
	484	posInstances),
	485	heaviestSplit.instancesDownBranch(heaviestBranch,
	486	negInstances));
	487	}
	488
	489	/**
	490	* Continues single (two-class optimized) search by investigating only the path
	491	* with the best Z-pure value at each branch.
	492	*
	493	* @param currentNode the root of the subtree to be searched
	494	* @param posInstances the positive-class instances that apply at this node
	495	* @param negInstances the negative-class instances that apply at this node
	496	* @exception Exception if search fails
	497	*/
	498	private void goDownZpurePathSingle(PredictionNode currentNode,
	499	Instances posInstances, Instances negInstances)
	500	throws Exception {
	501
	502	double lowestZpure = m_search_smallestZ; // do z-pure cutoff
	503	PredictionNode bestPath = null;
	504	Instances bestPosSplit = null, bestNegSplit = null;
	505
	506	// search for branch with lowest Z-pure
	507	for (Enumeration e = currentNode.children(); e.hasMoreElements(); ) {
	508	Splitter split = (Splitter) e.nextElement();
	509	for (int i=0; i<split.getNumOfBranches(); i++) {
	510	Instances posSplit = split.instancesDownBranch(i, posInstances);
	511	Instances negSplit = split.instancesDownBranch(i, negInstances);
	512	double newZpure = calcZpure(posSplit, negSplit);
	513	if (newZpure < lowestZpure) {
	514	lowestZpure = newZpure;
	515	bestPath = split.getChildForBranch(i);
	516	bestPosSplit = posSplit;
	517	bestNegSplit = negSplit;
	518	}
	519	}
	520	}
	521
	522	if (bestPath != null)
	523	searchForBestTestSingle(bestPath, bestPosSplit, bestNegSplit);
	524	}
	525
	526	/**
	527	* Continues single (two-class optimized) search by investigating a random path.
	528	*
	529	* @param currentNode the root of the subtree to be searched
	530	* @param posInstances the positive-class instances that apply at this node
	531	* @param negInstances the negative-class instances that apply at this node
	532	* @exception Exception if search fails
	533	*/
	534	private void goDownRandomPathSingle(PredictionNode currentNode,
	535	Instances posInstances, Instances negInstances)
	536	throws Exception {
	537
	538	FastVector children = currentNode.getChildren();
	539	Splitter split = (Splitter) children.elementAt(getRandom(children.size()));
	540	int branch = getRandom(split.getNumOfBranches());
	541	searchForBestTestSingle(split.getChildForBranch(branch),
	542	split.instancesDownBranch(branch, posInstances),
	543	split.instancesDownBranch(branch, negInstances));
	544	}
	545
	546	/**
	547	* Investigates the option of introducing a nominal split under currentNode. If it
	548	* finds a split that has a Z-value lower than has already been found it will
	549	* update the search information to record this as the best option so far.
	550	*
	551	* @param attIndex index of a nominal attribute to create a split from
	552	* @param currentNode the parent under which a split is to be considered
	553	* @param posInstances the positive-class instances that apply at this node
	554	* @param negInstances the negative-class instances that apply at this node
	555	*/
	556	private void evaluateNominalSplitSingle(int attIndex, PredictionNode currentNode,
	557	Instances posInstances, Instances negInstances)
	558	{
	559
	560	double[] indexAndZ = findLowestZNominalSplit(posInstances, negInstances, attIndex);
	561
	562	if (indexAndZ[1] < m_search_smallestZ) {
	563	m_search_smallestZ = indexAndZ[1];
	564	m_search_bestInsertionNode = currentNode;
	565	m_search_bestSplitter = new TwoWayNominalSplit(attIndex, (int) indexAndZ[0]);
	566	m_search_bestPathPosInstances = posInstances;
	567	m_search_bestPathNegInstances = negInstances;
	568	}
	569	}
	570
	571	/**
	572	* Investigates the option of introducing a two-way numeric split under currentNode.
	573	* If it finds a split that has a Z-value lower than has already been found it will
	574	* update the search information to record this as the best option so far.
	575	*
	576	* @param attIndex index of a numeric attribute to create a split from
	577	* @param currentNode the parent under which a split is to be considered
	578	* @param posInstances the positive-class instances that apply at this node
	579	* @param negInstances the negative-class instances that apply at this node
	580	* @param allInstances all of the instances the apply at this node (pos+neg combined)
	581	* @throws Exception in case of an error
	582	*/
	583	private void evaluateNumericSplitSingle(int attIndex, PredictionNode currentNode,
	584	Instances posInstances, Instances negInstances,
	585	Instances allInstances)
	586	throws Exception {
	587
	588	double[] splitAndZ = findLowestZNumericSplit(allInstances, attIndex);
	589
	590	if (splitAndZ[1] < m_search_smallestZ) {
	591	m_search_smallestZ = splitAndZ[1];
	592	m_search_bestInsertionNode = currentNode;
	593	m_search_bestSplitter = new TwoWayNumericSplit(attIndex, splitAndZ[0]);
	594	m_search_bestPathPosInstances = posInstances;
	595	m_search_bestPathNegInstances = negInstances;
	596	}
	597	}
	598
	599	/**
	600	* Calculates the prediction value used for a particular set of instances.
	601	*
	602	* @param posInstances the positive-class instances
	603	* @param negInstances the negative-class instances
	604	* @return the prediction value
	605	*/
	606	private double calcPredictionValue(Instances posInstances, Instances negInstances) {
	607
	608	return 0.5 * Math.log( (posInstances.sumOfWeights() + 1.0)
	609	/ (negInstances.sumOfWeights() + 1.0) );
	610	}
	611
	612	/**
	613	* Calculates the Z-pure value for a particular set of instances.
	614	*
	615	* @param posInstances the positive-class instances
	616	* @param negInstances the negative-class instances
	617	* @return the Z-pure value
	618	*/
	619	private double calcZpure(Instances posInstances, Instances negInstances) {
	620
	621	double posWeight = posInstances.sumOfWeights();
	622	double negWeight = negInstances.sumOfWeights();
	623	return (2.0 * (Math.sqrt(posWeight+1.0) + Math.sqrt(negWeight+1.0))) +
	624	(m_trainTotalWeight - (posWeight + negWeight));
	625	}
	626
	627	/**
	628	* Updates the weights of instances that are influenced by a new prediction value.
	629	*
	630	* @param posInstances positive-class instances to which the prediction value applies
	631	* @param negInstances negative-class instances to which the prediction value applies
	632	* @param predictionValue the new prediction value
	633	*/
	634	private void updateWeights(Instances posInstances, Instances negInstances,
	635	double predictionValue) {
	636
	637	// do positives
	638	double weightMultiplier = Math.pow(Math.E, -predictionValue);
	639	for (Enumeration e = posInstances.enumerateInstances(); e.hasMoreElements(); ) {
	640	Instance inst = (Instance) e.nextElement();
	641	inst.setWeight(inst.weight() * weightMultiplier);
	642	}
	643	// do negatives
	644	weightMultiplier = Math.pow(Math.E, predictionValue);
	645	for (Enumeration e = negInstances.enumerateInstances(); e.hasMoreElements(); ) {
	646	Instance inst = (Instance) e.nextElement();
	647	inst.setWeight(inst.weight() * weightMultiplier);
	648	}
	649	}
	650
	651	/**
	652	* Finds the nominal attribute value to split on that results in the lowest Z-value.
	653	*
	654	* @param posInstances the positive-class instances to split
	655	* @param negInstances the negative-class instances to split
	656	* @param attIndex the index of the nominal attribute to find a split for
	657	* @return a double array, index[0] contains the value to split on, index[1] contains
	658	* the Z-value of the split
	659	*/
	660	private double[] findLowestZNominalSplit(Instances posInstances, Instances negInstances,
	661	int attIndex)
	662	{
	663
	664	double lowestZ = Double.MAX_VALUE;
	665	int bestIndex = 0;
	666
	667	// set up arrays
	668	double[] posWeights = attributeValueWeights(posInstances, attIndex);
	669	double[] negWeights = attributeValueWeights(negInstances, attIndex);
	670	double posWeight = Utils.sum(posWeights);
	671	double negWeight = Utils.sum(negWeights);
	672
	673	int maxIndex = posWeights.length;
	674	if (maxIndex == 2) maxIndex = 1; // avoid repeating due to 2-way symmetry
	675
	676	for (int i = 0; i < maxIndex; i++) {
	677	// calculate Z
	678	double w1 = posWeights[i] + 1.0;
	679	double w2 = negWeights[i] + 1.0;
	680	double w3 = posWeight - w1 + 2.0;
	681	double w4 = negWeight - w2 + 2.0;
	682	double wRemainder = m_trainTotalWeight + 4.0 - (w1 + w2 + w3 + w4);
	683	double newZ = (2.0 * (Math.sqrt(w1 * w2) + Math.sqrt(w3 * w4))) + wRemainder;
	684
	685	// record best option
	686	if (newZ < lowestZ) {
	687	lowestZ = newZ;
	688	bestIndex = i;
	689	}
	690	}
	691
	692	// return result
	693	double[] indexAndZ = new double[2];
	694	indexAndZ[0] = (double) bestIndex;
	695	indexAndZ[1] = lowestZ;
	696	return indexAndZ;
	697	}
	698
	699	/**
	700	* Simultanously sum the weights of all attribute values for all instances.
	701	*
	702	* @param instances the instances to get the weights from
	703	* @param attIndex index of the attribute to be evaluated
	704	* @return a double array containing the weight of each attribute value
	705	*/
	706	private double[] attributeValueWeights(Instances instances, int attIndex)
	707	{
	708
	709	double[] weights = new double[instances.attribute(attIndex).numValues()];
	710	for(int i = 0; i < weights.length; i++) weights[i] = 0.0;
	711
	712	for (Enumeration e = instances.enumerateInstances(); e.hasMoreElements(); ) {
	713	Instance inst = (Instance) e.nextElement();
	714	if (!inst.isMissing(attIndex)) weights[(int)inst.value(attIndex)] += inst.weight();
	715	}
	716	return weights;
	717	}
	718
	719	/**
	720	* Finds the numeric split-point that results in the lowest Z-value.
	721	*
	722	* @param instances the instances to find a split for
	723	* @param attIndex the index of the numeric attribute to find a split for
	724	* @return a double array, index[0] contains the split-point, index[1] contains the
	725	* Z-value of the split
	726	* @throws Exception in case of an error
	727	*/
	728	private double[] findLowestZNumericSplit(Instances instances, int attIndex)
	729	throws Exception {
	730
	731	double splitPoint = 0.0;
	732	double bestVal = Double.MAX_VALUE, currVal, currCutPoint;
	733	int numMissing = 0;
	734	double[][] distribution = new double[3][instances.numClasses()];
	735
	736	// compute counts for all the values
	737	for (int i = 0; i < instances.numInstances(); i++) {
	738	Instance inst = instances.instance(i);
	739	if (!inst.isMissing(attIndex)) {
	740	distribution[1][(int)inst.classValue()] += inst.weight();
	741	} else {
	742	distribution[2][(int)inst.classValue()] += inst.weight();
	743	numMissing++;
	744	}
	745	}
	746
	747	// sort instances
	748	instances.sort(attIndex);
	749
	750	// make split counts for each possible split and evaluate
	751	for (int i = 0; i < instances.numInstances() - (numMissing + 1); i++) {
	752	Instance inst = instances.instance(i);
	753	Instance instPlusOne = instances.instance(i + 1);
	754	distribution[0][(int)inst.classValue()] += inst.weight();
	755	distribution[1][(int)inst.classValue()] -= inst.weight();
	756	if (Utils.sm(inst.value(attIndex), instPlusOne.value(attIndex))) {
	757	currCutPoint = (inst.value(attIndex) + instPlusOne.value(attIndex)) / 2.0;
	758	currVal = conditionedZOnRows(distribution);
	759	if (currVal < bestVal) {
	760	splitPoint = currCutPoint;
	761	bestVal = currVal;
	762	}
	763	}
	764	}
	765
	766	double[] splitAndZ = new double[2];
	767	splitAndZ[0] = splitPoint;
	768	splitAndZ[1] = bestVal;
	769	return splitAndZ;
	770	}
	771
	772	/**
	773	* Calculates the Z-value from the rows of a weight distribution array.
	774	*
	775	* @param distribution the weight distribution
	776	* @return the Z-value
	777	*/
	778	private double conditionedZOnRows(double [][] distribution) {
	779
	780	double w1 = distribution[0][0] + 1.0;
	781	double w2 = distribution[0][1] + 1.0;
	782	double w3 = distribution[1][0] + 1.0;
	783	double w4 = distribution[1][1] + 1.0;
	784	double wRemainder = m_trainTotalWeight + 4.0 - (w1 + w2 + w3 + w4);
	785	return (2.0 * (Math.sqrt(w1 * w2) + Math.sqrt(w3 * w4))) + wRemainder;
	786	}
	787
	788	/**
	789	* Returns the class probability distribution for an instance.
	790	*
	791	* @param instance the instance to be classified
	792	* @return the distribution the tree generates for the instance
	793	*/
	794	public double[] distributionForInstance(Instance instance) {
	795
	796	double predVal = predictionValueForInstance(instance, m_root, 0.0);
	797
	798	double[] distribution = new double[2];
	799	distribution[0] = 1.0 / (1.0 + Math.pow(Math.E, predVal));
	800	distribution[1] = 1.0 / (1.0 + Math.pow(Math.E, -predVal));
	801
	802	return distribution;
	803	}
	804
	805	/**
	806	* Returns the class prediction value (vote) for an instance.
	807	*
	808	* @param inst the instance
	809	* @param currentNode the root of the tree to get the values from
	810	* @param currentValue the current value before adding the value contained in the
	811	* subtree
	812	* @return the class prediction value (vote)
	813	*/
	814	protected double predictionValueForInstance(Instance inst, PredictionNode currentNode,
	815	double currentValue) {
	816
	817	currentValue += currentNode.getValue();
	818	for (Enumeration e = currentNode.children(); e.hasMoreElements(); ) {
	819	Splitter split = (Splitter) e.nextElement();
	820	int branch = split.branchInstanceGoesDown(inst);
	821	if (branch >= 0)
	822	currentValue = predictionValueForInstance(inst, split.getChildForBranch(branch),
	823	currentValue);
	824	}
	825	return currentValue;
	826	}
	827
	828	/**
	829	* Returns a description of the classifier.
	830	*
	831	* @return a string containing a description of the classifier
	832	*/
	833	public String toString() {
	834
	835	if (m_root == null)
	836	return ("ADTree not built yet");
	837	else {
	838	return ("Alternating decision tree:\n\n" + toString(m_root, 1) +
	839	"\nLegend: " + legend() +
	840	"\nTree size (total number of nodes): " + numOfAllNodes(m_root) +
	841	"\nLeaves (number of predictor nodes): " + numOfPredictionNodes(m_root)
	842	);
	843	}
	844	}
	845
	846	/**
	847	* Traverses the tree, forming a string that describes it.
	848	*
	849	* @param currentNode the current node under investigation
	850	* @param level the current level in the tree
	851	* @return the string describing the subtree
	852	*/
	853	protected String toString(PredictionNode currentNode, int level) {
	854
	855	StringBuffer text = new StringBuffer();
	856
	857	text.append(": " + Utils.doubleToString(currentNode.getValue(),3));
	858
	859	for (Enumeration e = currentNode.children(); e.hasMoreElements(); ) {
	860	Splitter split = (Splitter) e.nextElement();
	861
	862	for (int j=0; j<split.getNumOfBranches(); j++) {
	863	PredictionNode child = split.getChildForBranch(j);
	864	if (child != null) {
	865	text.append("\n");
	866	for (int k = 0; k < level; k++) {
	867	text.append("\| ");
	868	}
	869	text.append("(" + split.orderAdded + ")");
	870	text.append(split.attributeString(m_trainInstances) + " "
	871	+ split.comparisonString(j, m_trainInstances));
	872	text.append(toString(child, level + 1));
	873	}
	874	}
	875	}
	876	return text.toString();
	877	}
	878
	879	/**
	880	* Returns the type of graph this classifier
	881	* represents.
	882	* @return Drawable.TREE
	883	*/
	884	public int graphType() {
	885	return Drawable.TREE;
	886	}
	887
	888	/**
	889	* Returns graph describing the tree.
	890	*
	891	* @return the graph of the tree in dotty format
	892	* @exception Exception if something goes wrong
	893	*/
	894	public String graph() throws Exception {
	895
	896	StringBuffer text = new StringBuffer();
	897	text.append("digraph ADTree {\n");
	898	graphTraverse(m_root, text, 0, 0, m_trainInstances);
	899	return text.toString() +"}\n";
	900	}
	901
	902	/**
	903	* Traverses the tree, graphing each node.
	904	*
	905	* @param currentNode the currentNode under investigation
	906	* @param text the string built so far
	907	* @param splitOrder the order the parent splitter was added to the tree
	908	* @param predOrder the order this predictor was added to the split
	909	* @param instances the data to work on
	910	* @exception Exception if something goes wrong
	911	*/
	912	protected void graphTraverse(PredictionNode currentNode, StringBuffer text,
	913	int splitOrder, int predOrder, Instances instances)
	914	throws Exception {
	915
	916	text.append("S" + splitOrder + "P" + predOrder + " [label=\"");
	917	text.append(Utils.doubleToString(currentNode.getValue(),3));
	918	if (splitOrder == 0) // show legend in root
	919	text.append(" (" + legend() + ")");
	920	text.append("\" shape=box style=filled");
	921	if (instances.numInstances() > 0) text.append(" data=\n" + instances + "\n,\n");
	922	text.append("]\n");
	923	for (Enumeration e = currentNode.children(); e.hasMoreElements(); ) {
	924	Splitter split = (Splitter) e.nextElement();
	925	text.append("S" + splitOrder + "P" + predOrder + "->" + "S" + split.orderAdded +
	926	" [style=dotted]\n");
	927	text.append("S" + split.orderAdded + " [label=\"" + split.orderAdded + ": " +
	928	split.attributeString(m_trainInstances) + "\"]\n");
	929
	930	for (int i=0; i<split.getNumOfBranches(); i++) {
	931	PredictionNode child = split.getChildForBranch(i);
	932	if (child != null) {
	933	text.append("S" + split.orderAdded + "->" + "S" + split.orderAdded + "P" + i +
	934	" [label=\"" + split.comparisonString(i, m_trainInstances) + "\"]\n");
	935	graphTraverse(child, text, split.orderAdded, i,
	936	split.instancesDownBranch(i, instances));
	937	}
	938	}
	939	}
	940	}
	941
	942	/**
	943	* Returns the legend of the tree, describing how results are to be interpreted.
	944	*
	945	* @return a string containing the legend of the classifier
	946	*/
	947	public String legend() {
	948
	949	Attribute classAttribute = null;
	950	if (m_trainInstances == null) return "";
	951	try {classAttribute = m_trainInstances.classAttribute();} catch (Exception x){};
	952	return ("-ve = " + classAttribute.value(0) +
	953	", +ve = " + classAttribute.value(1));
	954	}
	955
	956	/**
	957	* @return tip text for this property suitable for
	958	* displaying in the explorer/experimenter gui
	959	*/
	960	public String numOfBoostingIterationsTipText() {
	961
	962	return "Sets the number of boosting iterations to perform. You will need to manually "
	963	+ "tune this parameter to suit the dataset and the desired complexity/accuracy "
	964	+ "tradeoff. More boosting iterations will result in larger (potentially more "
	965	+ " accurate) trees, but will make learning slower. Each iteration will add 3 nodes "
	966	+ "(1 split + 2 prediction) to the tree unless merging occurs.";
	967	}
	968
	969	/**
	970	* Gets the number of boosting iterations.
	971	*
	972	* @return the number of boosting iterations
	973	*/
	974	public int getNumOfBoostingIterations() {
	975
	976	return m_boostingIterations;
	977	}
	978
	979	/**
	980	* Sets the number of boosting iterations.
	981	*
	982	* @param b the number of boosting iterations to use
	983	*/
	984	public void setNumOfBoostingIterations(int b) {
	985
	986	m_boostingIterations = b;
	987	}
	988
	989	/**
	990	* @return tip text for this property suitable for
	991	* displaying in the explorer/experimenter gui
	992	*/
	993	public String searchPathTipText() {
	994
	995	return "Sets the type of search to perform when building the tree. The default option"
	996	+ " (Expand all paths) will do an exhaustive search. The other search methods are"
	997	+ " heuristic, so they are not guaranteed to find an optimal solution but they are"
	998	+ " much faster. Expand the heaviest path: searches the path with the most heavily"
	999	+ " weighted instances. Expand the best z-pure path: searches the path determined"
	1000	+ " by the best z-pure estimate. Expand a random path: the fastest method, simply"
	1001	+ " searches down a single random path on each iteration.";
	1002	}
	1003
	1004	/**
	1005	* Gets the method of searching the tree for a new insertion. Will be one of
	1006	* SEARCHPATH_ALL, SEARCHPATH_HEAVIEST, SEARCHPATH_ZPURE, SEARCHPATH_RANDOM.
	1007	*
	1008	* @return the tree searching mode
	1009	*/
	1010	public SelectedTag getSearchPath() {
	1011
	1012	return new SelectedTag(m_searchPath, TAGS_SEARCHPATH);
	1013	}
	1014
	1015	/**
	1016	* Sets the method of searching the tree for a new insertion. Will be one of
	1017	* SEARCHPATH_ALL, SEARCHPATH_HEAVIEST, SEARCHPATH_ZPURE, SEARCHPATH_RANDOM.
	1018	*
	1019	* @param newMethod the new tree searching mode
	1020	*/
	1021	public void setSearchPath(SelectedTag newMethod) {
	1022
	1023	if (newMethod.getTags() == TAGS_SEARCHPATH) {
	1024	m_searchPath = newMethod.getSelectedTag().getID();
	1025	}
	1026	}
	1027
	1028	/**
	1029	* @return tip text for this property suitable for
	1030	* displaying in the explorer/experimenter gui
	1031	*/
	1032	public String randomSeedTipText() {
	1033
	1034	return "Sets the random seed to use for a random search.";
	1035	}
	1036
	1037	/**
	1038	* Gets random seed for a random walk.
	1039	*
	1040	* @return the random seed
	1041	*/
	1042	public int getRandomSeed() {
	1043
	1044	return m_randomSeed;
	1045	}
	1046
	1047	/**
	1048	* Sets random seed for a random walk.
	1049	*
	1050	* @param seed the random seed
	1051	*/
	1052	public void setRandomSeed(int seed) {
	1053
	1054	// the actual random object is created when the tree is initialized
	1055	m_randomSeed = seed;
	1056	}
	1057
	1058	/**
	1059	* @return tip text for this property suitable for
	1060	* displaying in the explorer/experimenter gui
	1061	*/
	1062	public String saveInstanceDataTipText() {
	1063
	1064	return "Sets whether the tree is to save instance data - the model will take up more"
	1065	+ " memory if it does. If enabled you will be able to visualize the instances at"
	1066	+ " the prediction nodes when visualizing the tree.";
	1067	}
	1068
	1069	/**
	1070	* Gets whether the tree is to save instance data.
	1071	*
	1072	* @return the random seed
	1073	*/
	1074	public boolean getSaveInstanceData() {
	1075
	1076	return m_saveInstanceData;
	1077	}
	1078
	1079	/**
	1080	* Sets whether the tree is to save instance data.
	1081	*
	1082	* @param v true then the tree saves instance data
	1083	*/
	1084	public void setSaveInstanceData(boolean v) {
	1085
	1086	m_saveInstanceData = v;
	1087	}
	1088
	1089	/**
	1090	* Returns an enumeration describing the available options..
	1091	*
	1092	* @return an enumeration of all the available options.
	1093	*/
	1094	public Enumeration listOptions() {
	1095
	1096	Vector newVector = new Vector(3);
	1097	newVector.addElement(new Option(
	1098	"\tNumber of boosting iterations.\n"
	1099	+"\t(Default = 10)",
	1100	"B", 1,"-B <number of boosting iterations>"));
	1101	newVector.addElement(new Option(
	1102	"\tExpand nodes: -3(all), -2(weight), -1(z_pure), "
	1103	+">=0 seed for random walk\n"
	1104	+"\t(Default = -3)",
	1105	"E", 1,"-E <-3\|-2\|-1\|>=0>"));
	1106	newVector.addElement(new Option(
	1107	"\tSave the instance data with the model",
	1108	"D", 0,"-D"));
	1109	return newVector.elements();
	1110	}
	1111
	1112	/**
	1113	* Parses a given list of options. Valid options are:<p>
	1114	*
	1115	* -B num <br>
	1116	* Set the number of boosting iterations
	1117	* (default 10) <p>
	1118	*
	1119	* -E num <br>
	1120	* Set the nodes to expand: -3(all), -2(weight), -1(z_pure), >=0 seed for random walk
	1121	* (default -3) <p>
	1122	*
	1123	* -D <br>
	1124	* Save the instance data with the model <p>
	1125	*
	1126	* @param options the list of options as an array of strings
	1127	* @exception Exception if an option is not supported
	1128	*/
	1129	public void setOptions(String[] options) throws Exception {
	1130
	1131	String bString = Utils.getOption('B', options);
	1132	if (bString.length() != 0) setNumOfBoostingIterations(Integer.parseInt(bString));
	1133
	1134	String eString = Utils.getOption('E', options);
	1135	if (eString.length() != 0) {
	1136	int value = Integer.parseInt(eString);
	1137	if (value >= 0) {
	1138	setSearchPath(new SelectedTag(SEARCHPATH_RANDOM, TAGS_SEARCHPATH));
	1139	setRandomSeed(value);
	1140	} else setSearchPath(new SelectedTag(value + 3, TAGS_SEARCHPATH));
	1141	}
	1142
	1143	setSaveInstanceData(Utils.getFlag('D', options));
	1144
	1145	Utils.checkForRemainingOptions(options);
	1146	}
	1147
	1148	/**
	1149	* Gets the current settings of ADTree.
	1150	*
	1151	* @return an array of strings suitable for passing to setOptions()
	1152	*/
	1153	public String[] getOptions() {
	1154
	1155	String[] options = new String[6];
	1156	int current = 0;
	1157	options[current++] = "-B"; options[current++] = "" + getNumOfBoostingIterations();
	1158	options[current++] = "-E"; options[current++] = "" +
	1159	(m_searchPath == SEARCHPATH_RANDOM ?
	1160	m_randomSeed : m_searchPath - 3);
	1161	if (getSaveInstanceData()) options[current++] = "-D";
	1162	while (current < options.length) options[current++] = "";
	1163	return options;
	1164	}
	1165
	1166	/**
	1167	* Calls measure function for tree size - the total number of nodes.
	1168	*
	1169	* @return the tree size
	1170	*/
	1171	public double measureTreeSize() {
	1172
	1173	return numOfAllNodes(m_root);
	1174	}
	1175
	1176	/**
	1177	* Calls measure function for leaf size - the number of prediction nodes.
	1178	*
	1179	* @return the leaf size
	1180	*/
	1181	public double measureNumLeaves() {
	1182
	1183	return numOfPredictionNodes(m_root);
	1184	}
	1185
	1186	/**
	1187	* Calls measure function for prediction leaf size - the number of
	1188	* prediction nodes without children.
	1189	*
	1190	* @return the leaf size
	1191	*/
	1192	public double measureNumPredictionLeaves() {
	1193
	1194	return numOfPredictionLeafNodes(m_root);
	1195	}
	1196
	1197	/**
	1198	* Returns the number of nodes expanded.
	1199	*
	1200	* @return the number of nodes expanded during search
	1201	*/
	1202	public double measureNodesExpanded() {
	1203
	1204	return m_nodesExpanded;
	1205	}
	1206
	1207	/**
	1208	* Returns the number of examples "counted".
	1209	*
	1210	* @return the number of nodes processed during search
	1211	*/
	1212
	1213	public double measureExamplesProcessed() {
	1214
	1215	return m_examplesCounted;
	1216	}
	1217
	1218	/**
	1219	* Returns an enumeration of the additional measure names.
	1220	*
	1221	* @return an enumeration of the measure names
	1222	*/
	1223	public Enumeration enumerateMeasures() {
	1224
	1225	Vector newVector = new Vector(4);
	1226	newVector.addElement("measureTreeSize");
	1227	newVector.addElement("measureNumLeaves");
	1228	newVector.addElement("measureNumPredictionLeaves");
	1229	newVector.addElement("measureNodesExpanded");
	1230	newVector.addElement("measureExamplesProcessed");
	1231	return newVector.elements();
	1232	}
	1233
	1234	/**
	1235	* Returns the value of the named measure.
	1236	*
	1237	* @param additionalMeasureName the name of the measure to query for its value
	1238	* @return the value of the named measure
	1239	* @exception IllegalArgumentException if the named measure is not supported
	1240	*/
	1241	public double getMeasure(String additionalMeasureName) {
	1242
	1243	if (additionalMeasureName.equalsIgnoreCase("measureTreeSize")) {
	1244	return measureTreeSize();
	1245	}
	1246	else if (additionalMeasureName.equalsIgnoreCase("measureNumLeaves")) {
	1247	return measureNumLeaves();
	1248	}
	1249	else if (additionalMeasureName.equalsIgnoreCase("measureNumPredictionLeaves")) {
	1250	return measureNumPredictionLeaves();
	1251	}
	1252	else if (additionalMeasureName.equalsIgnoreCase("measureNodesExpanded")) {
	1253	return measureNodesExpanded();
	1254	}
	1255	else if (additionalMeasureName.equalsIgnoreCase("measureExamplesProcessed")) {
	1256	return measureExamplesProcessed();
	1257	}
	1258	else {throw new IllegalArgumentException(additionalMeasureName
	1259	+ " not supported (ADTree)");
	1260	}
	1261	}
	1262
	1263	/**
	1264	* Returns the total number of nodes in a tree.
	1265	*
	1266	* @param root the root of the tree being measured
	1267	* @return tree size in number of splitter + prediction nodes
	1268	*/
	1269	protected int numOfAllNodes(PredictionNode root) {
	1270
	1271	int numSoFar = 0;
	1272	if (root != null) {
	1273	numSoFar++;
	1274	for (Enumeration e = root.children(); e.hasMoreElements(); ) {
	1275	numSoFar++;
	1276	Splitter split = (Splitter) e.nextElement();
	1277	for (int i=0; i<split.getNumOfBranches(); i++)
	1278	numSoFar += numOfAllNodes(split.getChildForBranch(i));
	1279	}
	1280	}
	1281	return numSoFar;
	1282	}
	1283
	1284	/**
	1285	* Returns the number of prediction nodes in a tree.
	1286	*
	1287	* @param root the root of the tree being measured
	1288	* @return tree size in number of prediction nodes
	1289	*/
	1290	protected int numOfPredictionNodes(PredictionNode root) {
	1291
	1292	int numSoFar = 0;
	1293	if (root != null) {
	1294	numSoFar++;
	1295	for (Enumeration e = root.children(); e.hasMoreElements(); ) {
	1296	Splitter split = (Splitter) e.nextElement();
	1297	for (int i=0; i<split.getNumOfBranches(); i++)
	1298	numSoFar += numOfPredictionNodes(split.getChildForBranch(i));
	1299	}
	1300	}
	1301	return numSoFar;
	1302	}
	1303
	1304	/**
	1305	* Returns the number of leaf nodes in a tree - prediction nodes without
	1306	* children.
	1307	*
	1308	* @param root the root of the tree being measured
	1309	* @return tree leaf size in number of prediction nodes
	1310	*/
	1311	protected int numOfPredictionLeafNodes(PredictionNode root) {
	1312
	1313	int numSoFar = 0;
	1314	if (root.getChildren().size() > 0) {
	1315	for (Enumeration e = root.children(); e.hasMoreElements(); ) {
	1316	Splitter split = (Splitter) e.nextElement();
	1317	for (int i=0; i<split.getNumOfBranches(); i++)
	1318	numSoFar += numOfPredictionLeafNodes(split.getChildForBranch(i));
	1319	}
	1320	} else numSoFar = 1;
	1321	return numSoFar;
	1322	}
	1323
	1324	/**
	1325	* Gets the next random value.
	1326	*
	1327	* @param max the maximum value (+1) to be returned
	1328	* @return the next random value (between 0 and max-1)
	1329	*/
	1330	protected int getRandom(int max) {
	1331
	1332	return m_random.nextInt(max);
	1333	}
	1334
	1335	/**
	1336	* Returns the next number in the order that splitter nodes have been added to
	1337	* the tree, and records that a new splitter has been added.
	1338	*
	1339	* @return the next number in the order
	1340	*/
	1341	public int nextSplitAddedOrder() {
	1342
	1343	return ++m_lastAddedSplitNum;
	1344	}
	1345
	1346	/**
	1347	* Returns default capabilities of the classifier.
	1348	*
	1349	* @return the capabilities of this classifier
	1350	*/
	1351	public Capabilities getCapabilities() {
	1352	Capabilities result = super.getCapabilities();
	1353	result.disableAll();
	1354
	1355	// attributes
	1356	result.enable(Capability.NOMINAL_ATTRIBUTES);
	1357	result.enable(Capability.NUMERIC_ATTRIBUTES);
	1358	result.enable(Capability.DATE_ATTRIBUTES);
	1359	result.enable(Capability.MISSING_VALUES);
	1360
	1361	// class
	1362	result.enable(Capability.BINARY_CLASS);
	1363	result.enable(Capability.MISSING_CLASS_VALUES);
	1364
	1365	return result;
	1366	}
	1367
	1368	/**
	1369	* Builds a classifier for a set of instances.
	1370	*
	1371	* @param instances the instances to train the classifier with
	1372	* @exception Exception if something goes wrong
	1373	*/
	1374	public void buildClassifier(Instances instances) throws Exception {
	1375
	1376	// can classifier handle the data?
	1377	getCapabilities().testWithFail(instances);
	1378
	1379	// remove instances with missing class
	1380	instances = new Instances(instances);
	1381	instances.deleteWithMissingClass();
	1382
	1383	// set up the tree
	1384	initClassifier(instances);
	1385
	1386	// build the tree
	1387	for (int T = 0; T < m_boostingIterations; T++) boost();
	1388
	1389	// clean up if desired
	1390	if (!m_saveInstanceData) done();
	1391	}
	1392
	1393	/**
	1394	* Frees memory that is no longer needed for a final model - will no longer be able
	1395	* to increment the classifier after calling this.
	1396	*
	1397	*/
	1398	public void done() {
	1399
	1400	m_trainInstances = new Instances(m_trainInstances, 0);
	1401	m_random = null;
	1402	m_numericAttIndices = null;
	1403	m_nominalAttIndices = null;
	1404	m_posTrainInstances = null;
	1405	m_negTrainInstances = null;
	1406	}
	1407
	1408	/**
	1409	* Creates a clone that is identical to the current tree, but is independent.
	1410	* Deep copies the essential elements such as the tree nodes, and the instances
	1411	* (because the weights change.) Reference copies several elements such as the
	1412	* potential splitter sets, assuming that such elements should never differ between
	1413	* clones.
	1414	*
	1415	* @return the clone
	1416	*/
	1417	public Object clone() {
	1418
	1419	ADTree clone = new ADTree();
	1420
	1421	if (m_root != null) { // check for initialization first
	1422	clone.m_root = (PredictionNode) m_root.clone(); // deep copy the tree
	1423
	1424	clone.m_trainInstances = new Instances(m_trainInstances); // copy training instances
	1425
	1426	// deep copy the random object
	1427	if (m_random != null) {
	1428	SerializedObject randomSerial = null;
	1429	try {
	1430	randomSerial = new SerializedObject(m_random);
	1431	} catch (Exception ignored) {} // we know that Random is serializable
	1432	clone.m_random = (Random) randomSerial.getObject();
	1433	}
	1434
	1435	clone.m_lastAddedSplitNum = m_lastAddedSplitNum;
	1436	clone.m_numericAttIndices = m_numericAttIndices;
	1437	clone.m_nominalAttIndices = m_nominalAttIndices;
	1438	clone.m_trainTotalWeight = m_trainTotalWeight;
	1439
	1440	// reconstruct pos/negTrainInstances references
	1441	if (m_posTrainInstances != null) {
	1442	clone.m_posTrainInstances =
	1443	new ReferenceInstances(m_trainInstances, m_posTrainInstances.numInstances());
	1444	clone.m_negTrainInstances =
	1445	new ReferenceInstances(m_trainInstances, m_negTrainInstances.numInstances());
	1446	for (Enumeration e = clone.m_trainInstances.enumerateInstances();
	1447	e.hasMoreElements(); ) {
	1448	Instance inst = (Instance) e.nextElement();
	1449	try { // ignore classValue() exception
	1450	if ((int) inst.classValue() == 0)
	1451	clone.m_negTrainInstances.addReference(inst); // belongs in negative class
	1452	else
	1453	clone.m_posTrainInstances.addReference(inst); // belongs in positive class
	1454	} catch (Exception ignored) {}
	1455	}
	1456	}
	1457	}
	1458	clone.m_nodesExpanded = m_nodesExpanded;
	1459	clone.m_examplesCounted = m_examplesCounted;
	1460	clone.m_boostingIterations = m_boostingIterations;
	1461	clone.m_searchPath = m_searchPath;
	1462	clone.m_randomSeed = m_randomSeed;
	1463
	1464	return clone;
	1465	}
	1466
	1467	/**
	1468	* Merges two trees together. Modifies the tree being acted on, leaving tree passed
	1469	* as a parameter untouched (cloned). Does not check to see whether training instances
	1470	* are compatible - strange things could occur if they are not.
	1471	*
	1472	* @param mergeWith the tree to merge with
	1473	* @exception Exception if merge could not be performed
	1474	*/
	1475	public void merge(ADTree mergeWith) throws Exception {
	1476
	1477	if (m_root == null \|\| mergeWith.m_root == null)
	1478	throw new Exception("Trying to merge an uninitialized tree");
	1479	m_root.merge(mergeWith.m_root, this);
	1480	}
	1481
	1482	/**
	1483	* Returns the revision string.
	1484	*
	1485	* @return the revision
	1486	*/
	1487	public String getRevision() {
	1488	return RevisionUtils.extract("$Revision: 5928 $");
	1489	}
	1490
	1491	/**
	1492	* Main method for testing this class.
	1493	*
	1494	* @param argv the options
	1495	*/
	1496	public static void main(String [] argv) {
	1497	runClassifier(new ADTree(), argv);
	1498	}
	1499	}

Note: See TracBrowser for help on using the repository browser.

Download in other formats: