source: src/main/java/weka/classifiers/mi/MIBoost.java @ 15

Last change on this file since 15 was 4, checked in by gnappo, 14 years ago

Import of weka.

File size: 20.4 KB
/*
 *    This program is free software; you can redistribute it and/or modify
 *    it under the terms of the GNU General Public License as published by
 *    the Free Software Foundation; either version 2 of the License, or
 *    (at your option) any later version.
 *
 *    This program is distributed in the hope that it will be useful,
 *    but WITHOUT ANY WARRANTY; without even the implied warranty of
 *    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *    GNU General Public License for more details.
 *
 *    You should have received a copy of the GNU General Public License
 *    along with this program; if not, write to the Free Software
 *    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
 */

/*
 * MIBoost.java
 * Copyright (C) 2005 University of Waikato, Hamilton, New Zealand
 *
 */

package weka.classifiers.mi;

import weka.classifiers.Classifier;
import weka.classifiers.AbstractClassifier;
import weka.classifiers.SingleClassifierEnhancer;
import weka.core.Capabilities;
import weka.core.Instance;
import weka.core.Instances;
import weka.core.MultiInstanceCapabilitiesHandler;
import weka.core.Optimization;
import weka.core.Option;
import weka.core.OptionHandler;
import weka.core.RevisionUtils;
import weka.core.TechnicalInformation;
import weka.core.TechnicalInformationHandler;
import weka.core.Utils;
import weka.core.WeightedInstancesHandler;
import weka.core.Capabilities.Capability;
import weka.core.TechnicalInformation.Field;
import weka.core.TechnicalInformation.Type;
import weka.filters.Filter;
import weka.filters.unsupervised.attribute.Discretize;
import weka.filters.unsupervised.attribute.MultiInstanceToPropositional;

import java.util.Enumeration;
import java.util.Vector;

/**
 <!-- globalinfo-start -->
 * MI AdaBoost method: considers the geometric mean of the posteriors of the instances inside a bag (arithmetic mean of the log-posteriors); the expectation for a bag is taken inside the loss function.<br/>
 * <br/>
 * For more information about AdaBoost, see:<br/>
 * <br/>
 * Yoav Freund, Robert E. Schapire: Experiments with a new boosting algorithm. In: Thirteenth International Conference on Machine Learning, San Francisco, 148-156, 1996.
 * <p/>
 <!-- globalinfo-end -->
 *
 <!-- technical-bibtex-start -->
 * BibTeX:
 * <pre>
 * &#64;inproceedings{Freund1996,
 *    address = {San Francisco},
 *    author = {Yoav Freund and Robert E. Schapire},
 *    booktitle = {Thirteenth International Conference on Machine Learning},
 *    pages = {148-156},
 *    publisher = {Morgan Kaufmann},
 *    title = {Experiments with a new boosting algorithm},
 *    year = {1996}
 * }
 * </pre>
 * <p/>
 <!-- technical-bibtex-end -->
 *
 <!-- options-start -->
 * Valid options are: <p/>
 *
 * <pre> -D
 *  Turn on debugging output.</pre>
 *
 * <pre> -B &lt;num&gt;
 *  The number of bins in discretization
 *  (default 0, no discretization)</pre>
 *
 * <pre> -R &lt;num&gt;
 *  Maximum number of boost iterations.
 *  (default 10)</pre>
 *
 * <pre> -W &lt;class name&gt;
 *  Full name of classifier to boost.
 *  eg: weka.classifiers.bayes.NaiveBayes</pre>
 *
 * <pre> -D
 *  If set, classifier is run in debug mode and
 *  may output additional info to the console</pre>
 *
 <!-- options-end -->
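 *
 * A typical command line (the dataset name below is illustrative; any
 * multi-instance ARFF file will do) boosts naive Bayes for ten iterations
 * with five discretization bins:
 * <pre>
 * java weka.classifiers.mi.MIBoost -t musk1.arff -R 10 -B 5 \
 *   -W weka.classifiers.bayes.NaiveBayes
 * </pre>
 * <p/>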
 *
 * @author Eibe Frank (eibe@cs.waikato.ac.nz)
 * @author Xin Xu (xx5@cs.waikato.ac.nz)
 * @version $Revision: 5928 $
 */
public class MIBoost
  extends SingleClassifierEnhancer
  implements OptionHandler, MultiInstanceCapabilitiesHandler,
             TechnicalInformationHandler {

  /** for serialization */
  static final long serialVersionUID = -3808427225599279539L;

  /** the models for the iterations */
  protected Classifier[] m_Models;

  /** The number of the class labels */
  protected int m_NumClasses;

  /** Class labels for each bag */
  protected int[] m_Classes;

  /** attribute names for the new dataset used to build the model */
  protected Instances m_Attributes;

  /** Number of iterations */
  private int m_NumIterations = 100;

  /** Voting weights of models */
  protected double[] m_Beta;

  /** the maximum number of boost iterations */
  protected int m_MaxIterations = 10;

  /** the number of discretization bins */
  protected int m_DiscretizeBin = 0;

  /** filter used for discretization */
  protected Discretize m_Filter = null;

  /** filter used to convert the MI dataset into single-instance dataset */
  protected MultiInstanceToPropositional m_ConvertToSI = new MultiInstanceToPropositional();

  /**
   * Returns a string describing this classifier
   *
   * @return a description of the classifier suitable for
   * displaying in the explorer/experimenter gui
   */
  public String globalInfo() {
    return
        "MI AdaBoost method: considers the geometric mean of the posteriors "
      + "of the instances inside a bag (arithmetic mean of the log-posteriors); "
      + "the expectation for a bag is taken inside the loss function.\n\n"
      + "For more information about AdaBoost, see:\n\n"
      + getTechnicalInformation().toString();
  }

  /**
   * Returns an instance of a TechnicalInformation object, containing
   * detailed information about the technical background of this class,
   * e.g., paper reference or book this class is based on.
   *
   * @return the technical information about this class
   */
  public TechnicalInformation getTechnicalInformation() {
    TechnicalInformation result;

    result = new TechnicalInformation(Type.INPROCEEDINGS);
    result.setValue(Field.AUTHOR, "Yoav Freund and Robert E. Schapire");
    result.setValue(Field.TITLE, "Experiments with a new boosting algorithm");
    result.setValue(Field.BOOKTITLE, "Thirteenth International Conference on Machine Learning");
    result.setValue(Field.YEAR, "1996");
    result.setValue(Field.PAGES, "148-156");
    result.setValue(Field.PUBLISHER, "Morgan Kaufmann");
    result.setValue(Field.ADDRESS, "San Francisco");

    return result;
  }

  /**
   * Returns an enumeration describing the available options
   *
   * @return an enumeration of all the available options
   */
  public Enumeration listOptions() {
    Vector result = new Vector();

    result.addElement(new Option(
          "\tTurn on debugging output.",
          "D", 0, "-D"));

    result.addElement(new Option(
          "\tThe number of bins in discretization\n"
          + "\t(default 0, no discretization)",
          "B", 1, "-B <num>"));

    result.addElement(new Option(
          "\tMaximum number of boost iterations.\n"
          + "\t(default 10)",
          "R", 1, "-R <num>"));

    result.addElement(new Option(
          "\tFull name of classifier to boost.\n"
          + "\teg: weka.classifiers.bayes.NaiveBayes",
          "W", 1, "-W <class name>"));

    Enumeration enu = ((OptionHandler)m_Classifier).listOptions();
    while (enu.hasMoreElements()) {
      result.addElement(enu.nextElement());
    }

    return result.elements();
  }

  /**
   * Parses a given list of options. <p/>
   *
   <!-- options-start -->
   * Valid options are: <p/>
   *
   * <pre> -D
   *  Turn on debugging output.</pre>
   *
   * <pre> -B &lt;num&gt;
   *  The number of bins in discretization
   *  (default 0, no discretization)</pre>
   *
   * <pre> -R &lt;num&gt;
   *  Maximum number of boost iterations.
   *  (default 10)</pre>
   *
   * <pre> -W &lt;class name&gt;
   *  Full name of classifier to boost.
   *  eg: weka.classifiers.bayes.NaiveBayes</pre>
   *
   * <pre> -D
   *  If set, classifier is run in debug mode and
   *  may output additional info to the console</pre>
   *
   <!-- options-end -->
   *
   * @param options the list of options as an array of strings
   * @throws Exception if an option is not supported
   */
  public void setOptions(String[] options) throws Exception {
    setDebug(Utils.getFlag('D', options));

    String bin = Utils.getOption('B', options);
    if (bin.length() != 0) {
      setDiscretizeBin(Integer.parseInt(bin));
    } else {
      setDiscretizeBin(0);
    }

    String boostIterations = Utils.getOption('R', options);
    if (boostIterations.length() != 0) {
      setMaxIterations(Integer.parseInt(boostIterations));
    } else {
      setMaxIterations(10);
    }

    super.setOptions(options);
  }

  /**
   * Gets the current settings of the classifier.
   *
   * @return an array of strings suitable for passing to setOptions
   */
  public String[] getOptions() {
    Vector        result;
    String[]      options;
    int           i;

    result = new Vector();

    result.add("-R");
    result.add("" + getMaxIterations());

    result.add("-B");
    result.add("" + getDiscretizeBin());

    options = super.getOptions();
    for (i = 0; i < options.length; i++)
      result.add(options[i]);

    return (String[]) result.toArray(new String[result.size()]);
  }

  /**
   * Returns the tip text for this property
   *
   * @return tip text for this property suitable for
   * displaying in the explorer/experimenter gui
   */
  public String maxIterationsTipText() {
    return "The maximum number of boost iterations.";
  }

  /**
   * Set the maximum number of boost iterations
   *
   * @param maxIterations the maximum number of boost iterations
   */
  public void setMaxIterations(int maxIterations) {
    m_MaxIterations = maxIterations;
  }

  /**
   * Get the maximum number of boost iterations
   *
   * @return the maximum number of boost iterations
   */
  public int getMaxIterations() {
    return m_MaxIterations;
  }

  /**
   * Returns the tip text for this property
   *
   * @return tip text for this property suitable for
   * displaying in the explorer/experimenter gui
   */
  public String discretizeBinTipText() {
    return "The number of bins in discretization.";
  }

  /**
   * Set the number of bins in discretization
   *
   * @param bin the number of bins in discretization
   */
  public void setDiscretizeBin(int bin) {
    m_DiscretizeBin = bin;
  }

  /**
   * Get the number of bins in discretization
   *
   * @return the number of bins in discretization
   */
  public int getDiscretizeBin() {
    return m_DiscretizeBin;
  }

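  /*
   * One-dimensional line search used to pick the boosting weight c of the
   * current iteration.  With w_i the weight of bag i and e_i its
   * instance-level error rate, objectiveFunction() below evaluates
   *
   *   J(c) = sum_i w_i * exp(c * (2 * e_i - 1))
   *
   * and evaluateGradient() its derivative dJ/dc; findArgmin() from
   * weka.core.Optimization minimizes J over c.
   */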
  private class OptEng
    extends Optimization {

    private double[] weights, errs;

    public void setWeights(double[] w){
      weights = w;
    }

    public void setErrs(double[] e){
      errs = e;
    }

    /**
     * Evaluate objective function
     * @param x the current values of variables
     * @return the value of the objective function
     * @throws Exception if result is NaN
     */
    protected double objectiveFunction(double[] x) throws Exception{
      double obj=0;
      for(int i=0; i<weights.length; i++){
        obj += weights[i]*Math.exp(x[0]*(2.0*errs[i]-1.0));
        if(Double.isNaN(obj))
          throw new Exception("Objective function value is NaN!");
      }
      return obj;
    }

    /**
     * Evaluate the gradient vector
     * @param x the current values of variables
     * @return the gradient vector
     * @throws Exception if gradient is NaN
     */
    protected double[] evaluateGradient(double[] x) throws Exception{
      double[] grad = new double[1];
      for(int i=0; i<weights.length; i++){
        grad[0] += weights[i]*(2.0*errs[i]-1.0)*Math.exp(x[0]*(2.0*errs[i]-1.0));
        if(Double.isNaN(grad[0]))
          throw new Exception("Gradient is NaN!");
      }
      return grad;
    }

    /**
     * Returns the revision string.
     *
     * @return          the revision
     */
    public String getRevision() {
      return RevisionUtils.extract("$Revision: 5928 $");
    }
  }

  /**
   * Returns default capabilities of the classifier.
   *
   * @return      the capabilities of this classifier
   */
  public Capabilities getCapabilities() {
    Capabilities result = super.getCapabilities();

    // attributes
    result.enable(Capability.NOMINAL_ATTRIBUTES);
    result.enable(Capability.RELATIONAL_ATTRIBUTES);
    result.enable(Capability.MISSING_VALUES);

    // class
    result.disableAllClasses();
    result.disableAllClassDependencies();
    if (super.getCapabilities().handles(Capability.BINARY_CLASS))
      result.enable(Capability.BINARY_CLASS);
    result.enable(Capability.MISSING_CLASS_VALUES);

    // other
    result.enable(Capability.ONLY_MULTIINSTANCE);

    return result;
  }

  /**
   * Returns the capabilities of this multi-instance classifier for the
   * relational data.
   *
   * @return            the capabilities of this object
   * @see               Capabilities
   */
  public Capabilities getMultiInstanceCapabilities() {
    Capabilities result = super.getCapabilities();

    // class
    result.disableAllClasses();
    result.enable(Capability.NO_CLASS);

    return result;
  }

  /**
   * Builds the classifier
   *
   * @param exps the training data to be used for generating the
   * boosted classifier.
   * @throws Exception if the classifier could not be built successfully
   */
  public void buildClassifier(Instances exps) throws Exception {

    // can classifier handle the data?
    getCapabilities().testWithFail(exps);

    // remove instances with missing class
    Instances train = new Instances(exps);
    train.deleteWithMissingClass();

    m_NumClasses = train.numClasses();
    m_NumIterations = m_MaxIterations;

    if (m_Classifier == null)
      throw new Exception("A base classifier has not been specified!");
    if(!(m_Classifier instanceof WeightedInstancesHandler))
      throw new Exception("Base classifier cannot handle weighted instances!");

    m_Models = AbstractClassifier.makeCopies(m_Classifier, getMaxIterations());
    if(m_Debug)
      System.err.println("Base classifier: "+m_Classifier.getClass().getName());

    m_Beta = new double[m_NumIterations];

    /* modified by Lin Dong. (use MIToSingleInstance filter to convert the MI datasets) */

    // Initialize the bags' weights
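    // (each bag starts with weight sumNi/N, so the bag weights sum to
    // sumNi, the total number of instances over all bags)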
    double N = (double)train.numInstances(), sumNi=0;
    for(int i=0; i<N; i++)
      sumNi += train.instance(i).relationalValue(1).numInstances();
    for(int i=0; i<N; i++){
      train.instance(i).setWeight(sumNi/N);
    }

    // convert the training dataset into a single-instance dataset
    m_ConvertToSI.setInputFormat(train);
    Instances data = Filter.useFilter(train, m_ConvertToSI);
    data.deleteAttributeAt(0); // remove the bagIndex attribute

    // Assume the order of the instances is preserved in the Discretize filter
    if(m_DiscretizeBin > 0){
      m_Filter = new Discretize();
      m_Filter.setInputFormat(new Instances(data, 0));
      m_Filter.setBins(m_DiscretizeBin);
      data = Filter.useFilter(data, m_Filter);
    }
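    // (m_Filter is kept in a field so that the same bin boundaries are
    // applied again to test bags in distributionForInstance())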

    // Main algorithm
    int dataIdx;
iterations:
    for(int m=0; m < m_MaxIterations; m++){
      if(m_Debug)
        System.err.println("\nIteration "+m);

      // Build a model
      m_Models[m].buildClassifier(data);

      // Prediction of each bag
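      // (err[n] below ends up as the fraction of instances in bag n that
      // the current model misclassifies, i.e. an instance-level 0-1 error
      // averaged over the bag)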
      double[] err=new double[(int)N], weights=new double[(int)N];
      boolean perfect = true, tooWrong=true;
      dataIdx = 0;
      for(int n=0; n<N; n++){
        Instance exn = train.instance(n);
        // Prediction of each instance and the predicted class distribution
        // of the bag
        double nn = (double)exn.relationalValue(1).numInstances();
        for(int p=0; p<nn; p++){
          Instance testIns = data.instance(dataIdx++);
          if((int)m_Models[m].classifyInstance(testIns)
              != (int)exn.classValue()) // Weighted instance-wise 0-1 errors
            err[n]++;
        }
        weights[n] = exn.weight();
        err[n] /= nn;
        if(err[n] > 0.5)
          perfect = false;
        if(err[n] < 0.5)
          tooWrong = false;
      }

      if(perfect || tooWrong){ // all bag errors on one side of 0.5: no finite beta can be found
        if (m == 0)
          m_Beta[m] = 1.0;
        else
          m_Beta[m] = 0;
        m_NumIterations = m+1;
        if(m_Debug) System.err.println("No errors");
        break iterations;
      }

      double[] x = new double[1];
      x[0] = 0;
      double[][] b = new double[2][x.length];
      b[0][0] = Double.NaN;
      b[1][0] = Double.NaN;

      OptEng opt = new OptEng();
      opt.setWeights(weights);
      opt.setErrs(err);
      //opt.setDebug(m_Debug);
      if (m_Debug)
        System.out.println("Start searching for c... ");
      x = opt.findArgmin(x, b);
      while(x==null){
        x = opt.getVarbValues();
        if (m_Debug)
          System.out.println("200 iterations finished, not enough!");
        x = opt.findArgmin(x, b);
      }
      if (m_Debug)
        System.out.println("Finished.");
      m_Beta[m] = x[0];

      if(m_Debug)
        System.err.println("c = "+m_Beta[m]);

      // Stop if the error is too small or too big, and ignore this model
      if (Double.isInfinite(m_Beta[m])
          || Utils.smOrEq(m_Beta[m], 0)) {
        if (m == 0)
          m_Beta[m] = 1.0;
        else
          m_Beta[m] = 0;
        m_NumIterations = m+1;
        if(m_Debug)
          System.err.println("Errors out of range!");
        break iterations;
      }

      // Update the weights of the bags and of the single-instance data
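      // (a bag with instance-level error e has its weight multiplied by
      // exp(c*(2e-1)); since c > 0 at this point, bags with e > 0.5 are
      // up-weighted, as in standard AdaBoost)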
      dataIdx=0;
      double totWeights=0;
      for(int r=0; r<N; r++){
        Instance exr = train.instance(r);
        exr.setWeight(weights[r]*Math.exp(m_Beta[m]*(2.0*err[r]-1.0)));
        totWeights += exr.weight();
      }

      if(m_Debug)
        System.err.println("Total weights = "+totWeights);

      for(int r=0; r<N; r++){
        Instance exr = train.instance(r);
        double num = (double)exr.relationalValue(1).numInstances();
        exr.setWeight(sumNi*exr.weight()/totWeights);
        //if(m_Debug)
        //  System.err.print("\nExemplar "+r+"="+exr.weight()+": \t");
        for(int s=0; s<num; s++){
          Instance inss = data.instance(dataIdx);
          inss.setWeight(exr.weight()/num);
          //if(m_Debug)
          //  System.err.print("instance "+s+"="+inss.weight()+
          //                   "|ew*iw*sumNi="+data.instance(dataIdx).weight()+"\t");
          if(Double.isNaN(inss.weight()))
            throw new Exception("instance "+s+" in bag "+r+" has weight NaN!");
          dataIdx++;
        }
        //if(m_Debug)
        //  System.err.println();
      }
    }
  }

  /**
   * Computes the distribution for a given exemplar
   *
   * @param exmp the exemplar for which the distribution is computed
   * @return the classification
   * @throws Exception if the distribution can't be computed successfully
   */
  public double[] distributionForInstance(Instance exmp)
    throws Exception {

    double[] rt = new double[m_NumClasses];

    Instances insts = new Instances(exmp.dataset(), 0);
    insts.add(exmp);

    // convert the test exemplar into a single-instance dataset
    insts = Filter.useFilter(insts, m_ConvertToSI);
    insts.deleteAttributeAt(0); // remove the bagIndex attribute

    double n = insts.numInstances();

    if(m_DiscretizeBin > 0)
      insts = Filter.useFilter(insts, m_Filter);

    for(int y=0; y<n; y++){
      Instance ins = insts.instance(y);
      for(int x=0; x<m_NumIterations; x++){
        rt[(int)m_Models[x].classifyInstance(ins)] += m_Beta[x]/n;
      }
    }

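    // rt now holds, per class, the model weights beta averaged over the
    // n instances of the bag; exponentiating and normalizing turns these
    // log-domain votes into the bag-level distribution (the geometric-mean
    // combination described in globalInfo())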
    for(int i=0; i<rt.length; i++)
      rt[i] = Math.exp(rt[i]);

    Utils.normalize(rt);
    return rt;
  }

  /**
   * Gets a string describing the classifier.
   *
   * @return a string describing the classifier built.
   */
  public String toString() {

    if (m_Models == null) {
      return "No model built yet!";
    }
    StringBuffer text = new StringBuffer();
    text.append("MIBoost: number of bins in discretization = "+m_DiscretizeBin+"\n");
    if (m_NumIterations == 0) {
      text.append("No model built yet.\n");
    } else if (m_NumIterations == 1) {
      text.append("No boosting possible, one classifier used: Weight = "
          + Utils.roundDouble(m_Beta[0], 2)+"\n");
      text.append("Base classifier:\n"+m_Models[0].toString());
    } else {
      text.append("Base classifiers and their weights: \n");
      for (int i = 0; i < m_NumIterations; i++) {
        text.append("\n\n"+i+": Weight = " + Utils.roundDouble(m_Beta[i], 2)
            +"\nBase classifier:\n"+m_Models[i].toString());
      }
    }

    text.append("\n\nNumber of performed iterations: "
        + m_NumIterations + "\n");

    return text.toString();
  }

  /**
   * Returns the revision string.
   *
   * @return            the revision
   */
  public String getRevision() {
    return RevisionUtils.extract("$Revision: 5928 $");
  }

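  /*
   * Sketch of programmatic use (assuming "train" is a multi-instance
   * dataset with the usual bag id, relational attribute and class, and
   * with its class index already set; variable names are illustrative):
   *
   *   MIBoost boost = new MIBoost();
   *   boost.setClassifier(new weka.classifiers.bayes.NaiveBayes());
   *   boost.setMaxIterations(10);
   *   boost.setDiscretizeBin(5);
   *   boost.buildClassifier(train);
   *   double[] dist = boost.distributionForInstance(train.instance(0));
   */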
  /**
   * Main method for testing this class.
   *
   * @param argv should contain the command line arguments to the
   * scheme (see Evaluation)
   */
  public static void main(String[] argv) {
    runClassifier(new MIBoost(), argv);
  }
}