Context Navigation

CrossValidationResultProducer.java

Last change on this file was 29, checked in by gnappo, 14 years ago
Taggata versione per la demo e aggiunto branch.
File size: 25.6 KB

Line
1	/*
2	* This program is free software; you can redistribute it and/or modify
3	* it under the terms of the GNU General Public License as published by
4	* the Free Software Foundation; either version 2 of the License, or
5	* (at your option) any later version.
6	*
7	* This program is distributed in the hope that it will be useful,
8	* but WITHOUT ANY WARRANTY; without even the implied warranty of
9	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
10	* GNU General Public License for more details.
11	*
12	* You should have received a copy of the GNU General Public License
13	* along with this program; if not, write to the Free Software
14	* Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
15	*/
16
17	/*
18	* CrossValidationResultProducer.java
19	* Copyright (C) 1999 University of Waikato, Hamilton, New Zealand
20	*
21	*/
22
23
24	package weka.experiment;
25
26	import weka.core.AdditionalMeasureProducer;
27	import weka.core.Instances;
28	import weka.core.Option;
29	import weka.core.OptionHandler;
30	import weka.core.RevisionHandler;
31	import weka.core.RevisionUtils;
32	import weka.core.Utils;
33
34	import java.io.File;
35	import java.util.Calendar;
36	import java.util.Enumeration;
37	import java.util.Random;
38	import java.util.TimeZone;
39	import java.util.Vector;
40
41
42	/**
43	<!-- globalinfo-start -->
44	* Generates for each run, carries out an n-fold cross-validation, using the set SplitEvaluator to generate some results. If the class attribute is nominal, the dataset is stratified. Results for each fold are generated, so you may wish to use this in addition with an AveragingResultProducer to obtain averages for each run.
45	* <p/>
46	<!-- globalinfo-end -->
47	*
48	<!-- options-start -->
49	* Valid options are: <p/>
50	*
51	* <pre> -X <number of folds>
52	* The number of folds to use for the cross-validation.
53	* (default 10)</pre>
54	*
55	* <pre> -D
56	* Save raw split evaluator output.</pre>
57	*
58	* <pre> -O <file/directory name/path>
59	* The filename where raw output will be stored.
60	* If a directory name is specified then then individual
61	* outputs will be gzipped, otherwise all output will be
62	* zipped to the named file. Use in conjuction with -D. (default splitEvalutorOut.zip)</pre>
63	*
64	* <pre> -W <class name>
65	* The full class name of a SplitEvaluator.
66	* eg: weka.experiment.ClassifierSplitEvaluator</pre>
67	*
68	* <pre>
69	* Options specific to split evaluator weka.experiment.ClassifierSplitEvaluator:
70	* </pre>
71	*
72	* <pre> -W <class name>
73	* The full class name of the classifier.
74	* eg: weka.classifiers.bayes.NaiveBayes</pre>
75	*
76	* <pre> -C <index>
77	* The index of the class for which IR statistics
78	* are to be output. (default 1)</pre>
79	*
80	* <pre> -I <index>
81	* The index of an attribute to output in the
82	* results. This attribute should identify an
83	* instance in order to know which instances are
84	* in the test set of a cross validation. if 0
85	* no output (default 0).</pre>
86	*
87	* <pre> -P
88	* Add target and prediction columns to the result
89	* for each fold.</pre>
90	*
91	* <pre>
92	* Options specific to classifier weka.classifiers.rules.ZeroR:
93	* </pre>
94	*
95	* <pre> -D
96	* If set, classifier is run in debug mode and
97	* may output additional info to the console</pre>
98	*
99	<!-- options-end -->
100	*
101	* All options after -- will be passed to the split evaluator.
102	*
103	* @author Len Trigg (trigg@cs.waikato.ac.nz)
104	* @version $Revision: 1.17 $
105	*/
106	public class CrossValidationResultProducer
107	implements ResultProducer, OptionHandler, AdditionalMeasureProducer,
108	RevisionHandler {
109
110	/** for serialization */
111	static final long serialVersionUID = -1580053925080091917L;
112
113	/** The dataset of interest */
114	protected Instances m_Instances;
115
116	/** The ResultListener to send results to */
117	protected ResultListener m_ResultListener = new CSVResultListener();
118
119	/** The number of folds in the cross-validation */
120	protected int m_NumFolds = 10;
121
122	/** Save raw output of split evaluators --- for debugging purposes */
123	protected boolean m_debugOutput = false;
124
125	/** The output zipper to use for saving raw splitEvaluator output */
126	protected OutputZipper m_ZipDest = null;
127
128	/** The destination output file/directory for raw output */
129	protected File m_OutputFile = new File(
130	new File(System.getProperty("user.dir")),
131	"splitEvalutorOut.zip");
132
133	/** The SplitEvaluator used to generate results */
134	protected SplitEvaluator m_SplitEvaluator = new ClassifierSplitEvaluator();
135
136	/** The names of any additional measures to look for in SplitEvaluators */
137	protected String [] m_AdditionalMeasures = null;
138
139	/** The name of the key field containing the dataset name */
140	public static String DATASET_FIELD_NAME = "Dataset";
141
142	/** The name of the key field containing the run number */
143	public static String RUN_FIELD_NAME = "Run";
144
145	/** The name of the key field containing the fold number */
146	public static String FOLD_FIELD_NAME = "Fold";
147
148	/** The name of the result field containing the timestamp */
149	public static String TIMESTAMP_FIELD_NAME = "Date_time";
150
151	/**
152	* Returns a string describing this result producer
153	* @return a description of the result producer suitable for
154	* displaying in the explorer/experimenter gui
155	*/
156	public String globalInfo() {
157	return
158	"Generates for each run, carries out an n-fold cross-validation, "
159	+ "using the set SplitEvaluator to generate some results. If the class "
160	+ "attribute is nominal, the dataset is stratified. Results for each fold "
161	+ "are generated, so you may wish to use this in addition with an "
162	+ "AveragingResultProducer to obtain averages for each run.";
163	}
164
165	/**
166	* Sets the dataset that results will be obtained for.
167	*
168	* @param instances a value of type 'Instances'.
169	*/
170	public void setInstances(Instances instances) {
171
172	m_Instances = instances;
173	}
174
175	/**
176	* Sets the object to send results of each run to.
177	*
178	* @param listener a value of type 'ResultListener'
179	*/
180	public void setResultListener(ResultListener listener) {
181
182	m_ResultListener = listener;
183	}
184
185	/**
186	* Set a list of method names for additional measures to look for
187	* in SplitEvaluators. This could contain many measures (of which only a
188	* subset may be produceable by the current SplitEvaluator) if an experiment
189	* is the type that iterates over a set of properties.
190	* @param additionalMeasures an array of measure names, null if none
191	*/
192	public void setAdditionalMeasures(String [] additionalMeasures) {
193	m_AdditionalMeasures = additionalMeasures;
194
195	if (m_SplitEvaluator != null) {
196	System.err.println("CrossValidationResultProducer: setting additional "
197	+"measures for "
198	+"split evaluator");
199	m_SplitEvaluator.setAdditionalMeasures(m_AdditionalMeasures);
200	}
201	}
202
203	/**
204	* Returns an enumeration of any additional measure names that might be
205	* in the SplitEvaluator
206	* @return an enumeration of the measure names
207	*/
208	public Enumeration enumerateMeasures() {
209	Vector newVector = new Vector();
210	if (m_SplitEvaluator instanceof AdditionalMeasureProducer) {
211	Enumeration en = ((AdditionalMeasureProducer)m_SplitEvaluator).
212	enumerateMeasures();
213	while (en.hasMoreElements()) {
214	String mname = (String)en.nextElement();
215	newVector.addElement(mname);
216	}
217	}
218	return newVector.elements();
219	}
220
221	/**
222	* Returns the value of the named measure
223	* @param additionalMeasureName the name of the measure to query for its value
224	* @return the value of the named measure
225	* @throws IllegalArgumentException if the named measure is not supported
226	*/
227	public double getMeasure(String additionalMeasureName) {
228	if (m_SplitEvaluator instanceof AdditionalMeasureProducer) {
229	return ((AdditionalMeasureProducer)m_SplitEvaluator).
230	getMeasure(additionalMeasureName);
231	} else {
232	throw new IllegalArgumentException("CrossValidationResultProducer: "
233	+"Can't return value for : "+additionalMeasureName
234	+". "+m_SplitEvaluator.getClass().getName()+" "
235	+"is not an AdditionalMeasureProducer");
236	}
237	}
238
239	/**
240	* Gets a Double representing the current date and time.
241	* eg: 1:46pm on 20/5/1999 -> 19990520.1346
242	*
243	* @return a value of type Double
244	*/
245	public static Double getTimestamp() {
246
247	Calendar now = Calendar.getInstance(TimeZone.getTimeZone("UTC"));
248	double timestamp = now.get(Calendar.YEAR) * 10000
249	+ (now.get(Calendar.MONTH) + 1) * 100
250	+ now.get(Calendar.DAY_OF_MONTH)
251	+ now.get(Calendar.HOUR_OF_DAY) / 100.0
252	+ now.get(Calendar.MINUTE) / 10000.0;
253	return new Double(timestamp);
254	}
255
256	/**
257	* Prepare to generate results.
258	*
259	* @throws Exception if an error occurs during preprocessing.
260	*/
261	public void preProcess() throws Exception {
262
263	if (m_SplitEvaluator == null) {
264	throw new Exception("No SplitEvalutor set");
265	}
266	if (m_ResultListener == null) {
267	throw new Exception("No ResultListener set");
268	}
269	m_ResultListener.preProcess(this);
270	}
271
272	/**
273	* Perform any postprocessing. When this method is called, it indicates
274	* that no more requests to generate results for the current experiment
275	* will be sent.
276	*
277	* @throws Exception if an error occurs
278	*/
279	public void postProcess() throws Exception {
280
281	m_ResultListener.postProcess(this);
282
283	if (m_debugOutput) {
284	if (m_ZipDest != null) {
285	m_ZipDest.finished();
286	m_ZipDest = null;
287	}
288	}
289	}
290
291	/**
292	* Gets the keys for a specified run number. Different run
293	* numbers correspond to different randomizations of the data. Keys
294	* produced should be sent to the current ResultListener
295	*
296	* @param run the run number to get keys for.
297	* @throws Exception if a problem occurs while getting the keys
298	*/
299	public void doRunKeys(int run) throws Exception {
300	if (m_Instances == null) {
301	throw new Exception("No Instances set");
302	}
303	/* // Randomize on a copy of the original dataset
304	Instances runInstances = new Instances(m_Instances);
305	runInstances.randomize(new Random(run));
306	if (runInstances.classAttribute().isNominal()) {
307	runInstances.stratify(m_NumFolds);
308	} */
309	for (int fold = 0; fold < m_NumFolds; fold++) {
310	// Add in some fields to the key like run and fold number, dataset name
311	Object [] seKey = m_SplitEvaluator.getKey();
312	Object [] key = new Object [seKey.length + 3];
313	key[0] = Utils.backQuoteChars(m_Instances.relationName());
314	key[1] = "" + run;
315	key[2] = "" + (fold + 1);
316	System.arraycopy(seKey, 0, key, 3, seKey.length);
317	if (m_ResultListener.isResultRequired(this, key)) {
318	try {
319	m_ResultListener.acceptResult(this, key, null);
320	} catch (Exception ex) {
321	// Save the train and test datasets for debugging purposes?
322	throw ex;
323	}
324	}
325	}
326	}
327
328
329	/**
330	* Gets the results for a specified run number. Different run
331	* numbers correspond to different randomizations of the data. Results
332	* produced should be sent to the current ResultListener
333	*
334	* @param run the run number to get results for.
335	* @throws Exception if a problem occurs while getting the results
336	*/
337	public void doRun(int run) throws Exception {
338
339	if (getRawOutput()) {
340	if (m_ZipDest == null) {
341	m_ZipDest = new OutputZipper(m_OutputFile);
342	}
343	}
344
345	if (m_Instances == null) {
346	throw new Exception("No Instances set");
347	}
348	// Randomize on a copy of the original dataset
349	Instances runInstances = new Instances(m_Instances);
350	Random random = new Random(run);
351	runInstances.randomize(random);
352	if (runInstances.classAttribute().isNominal()) {
353	runInstances.stratify(m_NumFolds);
354	}
355	for (int fold = 0; fold < m_NumFolds; fold++) {
356	// Add in some fields to the key like run and fold number, dataset name
357	Object [] seKey = m_SplitEvaluator.getKey();
358	Object [] key = new Object [seKey.length + 3];
359	key[0] = Utils.backQuoteChars(m_Instances.relationName());
360	key[1] = "" + run;
361	key[2] = "" + (fold + 1);
362	System.arraycopy(seKey, 0, key, 3, seKey.length);
363	if (m_ResultListener.isResultRequired(this, key)) {
364	Instances train = runInstances.trainCV(m_NumFolds, fold, random);
365	Instances test = runInstances.testCV(m_NumFolds, fold);
366	try {
367	Object [] seResults = m_SplitEvaluator.getResult(train, test);
368	Object [] results = new Object [seResults.length + 1];
369	results[0] = getTimestamp();
370	System.arraycopy(seResults, 0, results, 1,
371	seResults.length);
372	if (m_debugOutput) {
373	String resultName = (""+run+"."+(fold+1)+"."
374	+ Utils.backQuoteChars(runInstances.relationName())
375	+"."
376	+m_SplitEvaluator.toString()).replace(' ','_');
377	resultName = Utils.removeSubstring(resultName,
378	"weka.classifiers.");
379	resultName = Utils.removeSubstring(resultName,
380	"weka.filters.");
381	resultName = Utils.removeSubstring(resultName,
382	"weka.attributeSelection.");
383	m_ZipDest.zipit(m_SplitEvaluator.getRawResultOutput(), resultName);
384	}
385	m_ResultListener.acceptResult(this, key, results);
386	} catch (Exception ex) {
387	// Save the train and test datasets for debugging purposes?
388	throw ex;
389	}
390	}
391	}
392	}
393
394	/**
395	* Gets the names of each of the columns produced for a single run.
396	* This method should really be static.
397	*
398	* @return an array containing the name of each column
399	*/
400	public String [] getKeyNames() {
401
402	String [] keyNames = m_SplitEvaluator.getKeyNames();
403	// Add in the names of our extra key fields
404	String [] newKeyNames = new String [keyNames.length + 3];
405	newKeyNames[0] = DATASET_FIELD_NAME;
406	newKeyNames[1] = RUN_FIELD_NAME;
407	newKeyNames[2] = FOLD_FIELD_NAME;
408	System.arraycopy(keyNames, 0, newKeyNames, 3, keyNames.length);
409	return newKeyNames;
410	}
411
412	/**
413	* Gets the data types of each of the columns produced for a single run.
414	* This method should really be static.
415	*
416	* @return an array containing objects of the type of each column. The
417	* objects should be Strings, or Doubles.
418	*/
419	public Object [] getKeyTypes() {
420
421	Object [] keyTypes = m_SplitEvaluator.getKeyTypes();
422	// Add in the types of our extra fields
423	Object [] newKeyTypes = new String [keyTypes.length + 3];
424	newKeyTypes[0] = new String();
425	newKeyTypes[1] = new String();
426	newKeyTypes[2] = new String();
427	System.arraycopy(keyTypes, 0, newKeyTypes, 3, keyTypes.length);
428	return newKeyTypes;
429	}
430
431	/**
432	* Gets the names of each of the columns produced for a single run.
433	* This method should really be static.
434	*
435	* @return an array containing the name of each column
436	*/
437	public String [] getResultNames() {
438
439	String [] resultNames = m_SplitEvaluator.getResultNames();
440	// Add in the names of our extra Result fields
441	String [] newResultNames = new String [resultNames.length + 1];
442	newResultNames[0] = TIMESTAMP_FIELD_NAME;
443	System.arraycopy(resultNames, 0, newResultNames, 1, resultNames.length);
444	return newResultNames;
445	}
446
447	/**
448	* Gets the data types of each of the columns produced for a single run.
449	* This method should really be static.
450	*
451	* @return an array containing objects of the type of each column. The
452	* objects should be Strings, or Doubles.
453	*/
454	public Object [] getResultTypes() {
455
456	Object [] resultTypes = m_SplitEvaluator.getResultTypes();
457	// Add in the types of our extra Result fields
458	Object [] newResultTypes = new Object [resultTypes.length + 1];
459	newResultTypes[0] = new Double(0);
460	System.arraycopy(resultTypes, 0, newResultTypes, 1, resultTypes.length);
461	return newResultTypes;
462	}
463
464	/**
465	* Gets a description of the internal settings of the result
466	* producer, sufficient for distinguishing a ResultProducer
467	* instance from another with different settings (ignoring
468	* those settings set through this interface). For example,
469	* a cross-validation ResultProducer may have a setting for the
470	* number of folds. For a given state, the results produced should
471	* be compatible. Typically if a ResultProducer is an OptionHandler,
472	* this string will represent the command line arguments required
473	* to set the ResultProducer to that state.
474	*
475	* @return the description of the ResultProducer state, or null
476	* if no state is defined
477	*/
478	public String getCompatibilityState() {
479
480	String result = "-X " + m_NumFolds + " " ;
481	if (m_SplitEvaluator == null) {
482	result += "<null SplitEvaluator>";
483	} else {
484	result += "-W " + m_SplitEvaluator.getClass().getName();
485	}
486	return result + " --";
487	}
488
489	/**
490	* Returns the tip text for this property
491	* @return tip text for this property suitable for
492	* displaying in the explorer/experimenter gui
493	*/
494	public String outputFileTipText() {
495	return "Set the destination for saving raw output. If the rawOutput "
496	+"option is selected, then output from the splitEvaluator for "
497	+"individual folds is saved. If the destination is a directory, "
498	+"then each output is saved to an individual gzip file; if the "
499	+"destination is a file, then each output is saved as an entry "
500	+"in a zip file.";
501	}
502
503	/**
504	* Get the value of OutputFile.
505	*
506	* @return Value of OutputFile.
507	*/
508	public File getOutputFile() {
509
510	return m_OutputFile;
511	}
512
513	/**
514	* Set the value of OutputFile.
515	*
516	* @param newOutputFile Value to assign to OutputFile.
517	*/
518	public void setOutputFile(File newOutputFile) {
519
520	m_OutputFile = newOutputFile;
521	}
522
523	/**
524	* Returns the tip text for this property
525	* @return tip text for this property suitable for
526	* displaying in the explorer/experimenter gui
527	*/
528	public String numFoldsTipText() {
529	return "Number of folds to use in cross validation.";
530	}
531
532	/**
533	* Get the value of NumFolds.
534	*
535	* @return Value of NumFolds.
536	*/
537	public int getNumFolds() {
538
539	return m_NumFolds;
540	}
541
542	/**
543	* Set the value of NumFolds.
544	*
545	* @param newNumFolds Value to assign to NumFolds.
546	*/
547	public void setNumFolds(int newNumFolds) {
548
549	m_NumFolds = newNumFolds;
550	}
551
552	/**
553	* Returns the tip text for this property
554	* @return tip text for this property suitable for
555	* displaying in the explorer/experimenter gui
556	*/
557	public String rawOutputTipText() {
558	return "Save raw output (useful for debugging). If set, then output is "
559	+"sent to the destination specified by outputFile";
560	}
561
562	/**
563	* Get if raw split evaluator output is to be saved
564	* @return true if raw split evalutor output is to be saved
565	*/
566	public boolean getRawOutput() {
567	return m_debugOutput;
568	}
569
570	/**
571	* Set to true if raw split evaluator output is to be saved
572	* @param d true if output is to be saved
573	*/
574	public void setRawOutput(boolean d) {
575	m_debugOutput = d;
576	}
577
578	/**
579	* Returns the tip text for this property
580	* @return tip text for this property suitable for
581	* displaying in the explorer/experimenter gui
582	*/
583	public String splitEvaluatorTipText() {
584	return "The evaluator to apply to the cross validation folds. "
585	+"This may be a classifier, regression scheme etc.";
586	}
587
588	/**
589	* Get the SplitEvaluator.
590	*
591	* @return the SplitEvaluator.
592	*/
593	public SplitEvaluator getSplitEvaluator() {
594
595	return m_SplitEvaluator;
596	}
597
598	/**
599	* Set the SplitEvaluator.
600	*
601	* @param newSplitEvaluator new SplitEvaluator to use.
602	*/
603	public void setSplitEvaluator(SplitEvaluator newSplitEvaluator) {
604
605	m_SplitEvaluator = newSplitEvaluator;
606	m_SplitEvaluator.setAdditionalMeasures(m_AdditionalMeasures);
607	}
608
609	/**
610	* Returns an enumeration describing the available options..
611	*
612	* @return an enumeration of all the available options.
613	*/
614	public Enumeration listOptions() {
615
616	Vector newVector = new Vector(4);
617
618	newVector.addElement(new Option(
619	"\tThe number of folds to use for the cross-validation.\n"
620	+"\t(default 10)",
621	"X", 1,
622	"-X <number of folds>"));
623
624	newVector.addElement(new Option(
625	"Save raw split evaluator output.",
626	"D",0,"-D"));
627
628	newVector.addElement(new Option(
629	"\tThe filename where raw output will be stored.\n"
630	+"\tIf a directory name is specified then then individual\n"
631	+"\toutputs will be gzipped, otherwise all output will be\n"
632	+"\tzipped to the named file. Use in conjuction with -D."
633	+"\t(default splitEvalutorOut.zip)",
634	"O", 1,
635	"-O <file/directory name/path>"));
636
637	newVector.addElement(new Option(
638	"\tThe full class name of a SplitEvaluator.\n"
639	+"\teg: weka.experiment.ClassifierSplitEvaluator",
640	"W", 1,
641	"-W <class name>"));
642
643	if ((m_SplitEvaluator != null) &&
644	(m_SplitEvaluator instanceof OptionHandler)) {
645	newVector.addElement(new Option(
646	"",
647	"", 0, "\nOptions specific to split evaluator "
648	+ m_SplitEvaluator.getClass().getName() + ":"));
649	Enumeration enu = ((OptionHandler)m_SplitEvaluator).listOptions();
650	while (enu.hasMoreElements()) {
651	newVector.addElement(enu.nextElement());
652	}
653	}
654	return newVector.elements();
655	}
656
657	/**
658	* Parses a given list of options. <p/>
659	*
660	<!-- options-start -->
661	* Valid options are: <p/>
662	*
663	* <pre> -X <number of folds>
664	* The number of folds to use for the cross-validation.
665	* (default 10)</pre>
666	*
667	* <pre> -D
668	* Save raw split evaluator output.</pre>
669	*
670	* <pre> -O <file/directory name/path>
671	* The filename where raw output will be stored.
672	* If a directory name is specified then then individual
673	* outputs will be gzipped, otherwise all output will be
674	* zipped to the named file. Use in conjuction with -D. (default splitEvalutorOut.zip)</pre>
675	*
676	* <pre> -W <class name>
677	* The full class name of a SplitEvaluator.
678	* eg: weka.experiment.ClassifierSplitEvaluator</pre>
679	*
680	* <pre>
681	* Options specific to split evaluator weka.experiment.ClassifierSplitEvaluator:
682	* </pre>
683	*
684	* <pre> -W <class name>
685	* The full class name of the classifier.
686	* eg: weka.classifiers.bayes.NaiveBayes</pre>
687	*
688	* <pre> -C <index>
689	* The index of the class for which IR statistics
690	* are to be output. (default 1)</pre>
691	*
692	* <pre> -I <index>
693	* The index of an attribute to output in the
694	* results. This attribute should identify an
695	* instance in order to know which instances are
696	* in the test set of a cross validation. if 0
697	* no output (default 0).</pre>
698	*
699	* <pre> -P
700	* Add target and prediction columns to the result
701	* for each fold.</pre>
702	*
703	* <pre>
704	* Options specific to classifier weka.classifiers.rules.ZeroR:
705	* </pre>
706	*
707	* <pre> -D
708	* If set, classifier is run in debug mode and
709	* may output additional info to the console</pre>
710	*
711	<!-- options-end -->
712	*
713	* All options after -- will be passed to the split evaluator.
714	*
715	* @param options the list of options as an array of strings
716	* @throws Exception if an option is not supported
717	*/
718	public void setOptions(String[] options) throws Exception {
719
720	setRawOutput(Utils.getFlag('D', options));
721
722	String fName = Utils.getOption('O', options);
723	if (fName.length() != 0) {
724	setOutputFile(new File(fName));
725	}
726
727	String numFolds = Utils.getOption('X', options);
728	if (numFolds.length() != 0) {
729	setNumFolds(Integer.parseInt(numFolds));
730	} else {
731	setNumFolds(10);
732	}
733
734	String seName = Utils.getOption('W', options);
735	if (seName.length() == 0) {
736	throw new Exception("A SplitEvaluator must be specified with"
737	+ " the -W option.");
738	}
739	// Do it first without options, so if an exception is thrown during
740	// the option setting, listOptions will contain options for the actual
741	// SE.
742	setSplitEvaluator((SplitEvaluator)Utils.forName(
743	SplitEvaluator.class,
744	seName,
745	null));
746	if (getSplitEvaluator() instanceof OptionHandler) {
747	((OptionHandler) getSplitEvaluator())
748	.setOptions(Utils.partitionOptions(options));
749	}
750	}
751
752	/**
753	* Gets the current settings of the result producer.
754	*
755	* @return an array of strings suitable for passing to setOptions
756	*/
757	public String [] getOptions() {
758
759	String [] seOptions = new String [0];
760	if ((m_SplitEvaluator != null) &&
761	(m_SplitEvaluator instanceof OptionHandler)) {
762	seOptions = ((OptionHandler)m_SplitEvaluator).getOptions();
763	}
764
765	String [] options = new String [seOptions.length + 8];
766	int current = 0;
767
768	options[current++] = "-X"; options[current++] = "" + getNumFolds();
769
770	if (getRawOutput()) {
771	options[current++] = "-D";
772	}
773
774	options[current++] = "-O";
775	options[current++] = getOutputFile().getName();
776
777	if (getSplitEvaluator() != null) {
778	options[current++] = "-W";
779	options[current++] = getSplitEvaluator().getClass().getName();
780	}
781	options[current++] = "--";
782
783	System.arraycopy(seOptions, 0, options, current,
784	seOptions.length);
785	current += seOptions.length;
786	while (current < options.length) {
787	options[current++] = "";
788	}
789	return options;
790	}
791
792	/**
793	* Gets a text descrption of the result producer.
794	*
795	* @return a text description of the result producer.
796	*/
797	public String toString() {
798
799	String result = "CrossValidationResultProducer: ";
800	result += getCompatibilityState();
801	if (m_Instances == null) {
802	result += ": <null Instances>";
803	} else {
804	result += ": " + Utils.backQuoteChars(m_Instances.relationName());
805	}
806	return result;
807	}
808
809	/**
810	* Returns the revision string.
811	*
812	* @return the revision
813	*/
814	public String getRevision() {
815	return RevisionUtils.extract("$Revision: 1.17 $");
816	}
817
818	/**
819	* Quick test of timestamp
820	*
821	* @param args the commandline options
822	*/
823	public static void main(String [] args) {
824
825	System.err.println(Utils.doubleToString(getTimestamp().doubleValue(), 4));
826	}
827	} // CrossValidationResultProducer

Note: See TracBrowser for help on using the repository browser.

Context Navigation

source: branches/MetisMQI/src/main/java/weka/experiment/CrossValidationResultProducer.java

Download in other formats: