Context Navigation

source: src/main/java/weka/experiment/RemoteExperiment.java @ 17

Last change on this file since 17 was 4, checked in by gnappo, 14 years ago
Import di weka.
File size: 29.3 KB

Line
1	/*
2	* This program is free software; you can redistribute it and/or modify
3	* it under the terms of the GNU General Public License as published by
4	* the Free Software Foundation; either version 2 of the License, or
5	* (at your option) any later version.
6	*
7	* This program is distributed in the hope that it will be useful,
8	* but WITHOUT ANY WARRANTY; without even the implied warranty of
9	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
10	* GNU General Public License for more details.
11	*
12	* You should have received a copy of the GNU General Public License
13	* along with this program; if not, write to the Free Software
14	* Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
15	*/
16
17	/*
18	* RemoteExperiment.java
19	* Copyright (C) 2000 University of Waikato, Hamilton, New Zealand
20	*
21	*/
22
23
24	package weka.experiment;
25
26	import weka.core.FastVector;
27	import weka.core.Option;
28	import weka.core.OptionHandler;
29	import weka.core.Queue;
30	import weka.core.RevisionUtils;
31	import weka.core.SerializedObject;
32	import weka.core.Utils;
33	import weka.core.xml.KOML;
34	import weka.core.xml.XMLOptions;
35	import weka.experiment.xml.XMLExperiment;
36
37	import java.io.BufferedInputStream;
38	import java.io.BufferedOutputStream;
39	import java.io.File;
40	import java.io.FileInputStream;
41	import java.io.FileOutputStream;
42	import java.io.ObjectInputStream;
43	import java.io.ObjectOutputStream;
44	import java.rmi.Naming;
45	import java.util.Enumeration;
46
47	import javax.swing.DefaultListModel;
48
49	/**
50	* Holds all the necessary configuration information for a distributed
51	* experiment. This object is able to be serialized for storage on disk.<p>
52	*
53	* This class is experimental at present. Has been tested using
54	* CSVResultListener (sending results to standard out) and
55	* DatabaseResultListener (InstantDB + RmiJdbc bridge). <p>
56	*
57	* Getting started:<p>
58	*
59	* Start InstantDB (with the RMI bridge) on some machine. If using java2
60	* then specify -Djava.security.policy=db.policy to the
61	* virtual machine. Where db.policy is as follows: <br>
62	* <pre>
63	* grant {
64	* permission java.security.AllPermission;
65	* };
66	* </pre><p>
67	*
68	* Start RemoteEngine servers on x machines as per the instructions in the
69	* README_Experiment_Gui file. There must be a
70	* DatabaseUtils.props in either the HOME or current directory of each
71	* machine, listing all necessary jdbc drivers.<p>
72	*
73	* The machine where a RemoteExperiment is started must also have a copy
74	* of DatabaseUtils.props listing the URL to the machine where the
75	* database server is running (RmiJdbc + InstantDB). <p>
76	*
77	* Here is an example of starting a RemoteExperiment: <p>
78	*
79	* <pre>
80	*
81	* java -Djava.rmi.server.codebase=file:/path to weka classes/ \
82	* weka.experiment.RemoteExperiment -L 1 -U 10 \
83	* -T /home/ml/datasets/UCI/iris.arff \
84	* -D "weka.experiment.DatabaseResultListener" \
85	* -P "weka.experiment.RandomSplitResultProducer" \
86	* -h rosebud.cs.waikato.ac.nz -h blackbird.cs.waikato.ac.nz -r -- \
87	* -W weka.experiment.ClassifierSplitEvaluator -- \
88	* -W weka.classifiers.bayes.NaiveBayes
89	*
90	* </pre> <p>
91	* The "codebase" property tells rmi where to serve up weka classes from.
92	* This can either be a file url (as long as a shared file system is being
93	* used that is accessible by the remoteEngine servers), or http url (which
94	* of course supposes that a web server is running and you have put your
95	* weka classes somewhere that is web accessible). If using a file url the
96	* trailing "/" is most important unless the weka classes are in a jar
97	* file. <p>
98	*
99	<!-- options-start -->
100	* Valid options are: <p/>
101	*
102	* <pre> -L <num>
103	* The lower run number to start the experiment from.
104	* (default 1)</pre>
105	*
106	* <pre> -U <num>
107	* The upper run number to end the experiment at (inclusive).
108	* (default 10)</pre>
109	*
110	* <pre> -T <arff file>
111	* The dataset to run the experiment on.
112	* (required, may be specified multiple times)</pre>
113	*
114	* <pre> -P <class name>
115	* The full class name of a ResultProducer (required).
116	* eg: weka.experiment.RandomSplitResultProducer</pre>
117	*
118	* <pre> -D <class name>
119	* The full class name of a ResultListener (required).
120	* eg: weka.experiment.CSVResultListener</pre>
121	*
122	* <pre> -N <string>
123	* A string containing any notes about the experiment.
124	* (default none)</pre>
125	*
126	* <pre>
127	* Options specific to result producer weka.experiment.RandomSplitResultProducer:
128	* </pre>
129	*
130	* <pre> -P <percent>
131	* The percentage of instances to use for training.
132	* (default 66)</pre>
133	*
134	* <pre> -D
135	* Save raw split evaluator output.</pre>
136	*
137	* <pre> -O <file/directory name/path>
138	* The filename where raw output will be stored.
139	* If a directory name is specified then the individual
140	* outputs will be gzipped, otherwise all output will be
141	* zipped to the named file. Use in conjunction with -D. (default splitEvalutorOut.zip)</pre>
142	*
143	* <pre> -W <class name>
144	* The full class name of a SplitEvaluator.
145	* eg: weka.experiment.ClassifierSplitEvaluator</pre>
146	*
147	* <pre> -R
148	* Set when data is not to be randomized and the data sets' size.
149	* Is not to be determined via probabilistic rounding.</pre>
150	*
151	* <pre>
152	* Options specific to split evaluator weka.experiment.ClassifierSplitEvaluator:
153	* </pre>
154	*
155	* <pre> -W <class name>
156	* The full class name of the classifier.
157	* eg: weka.classifiers.bayes.NaiveBayes</pre>
158	*
159	* <pre> -C <index>
160	* The index of the class for which IR statistics
161	* are to be output. (default 1)</pre>
162	*
163	* <pre> -I <index>
164	* The index of an attribute to output in the
165	* results. This attribute should identify an
166	* instance in order to know which instances are
167	* in the test set of a cross validation. if 0
168	* no output (default 0).</pre>
169	*
170	* <pre> -P
171	* Add target and prediction columns to the result
172	* for each fold.</pre>
173	*
174	* <pre>
175	* Options specific to classifier weka.classifiers.rules.ZeroR:
176	* </pre>
177	*
178	* <pre> -D
179	* If set, classifier is run in debug mode and
180	* may output additional info to the console</pre>
181	*
182	<!-- options-end -->
183	*
184	* @author Mark Hall (mhall@cs.waikato.ac.nz)
185	* @version $Revision: 1.16 $
186	*/
187	public class RemoteExperiment
188	extends Experiment {
189
190	/** for serialization */
191	static final long serialVersionUID = -7357668825635314937L;
192
193	/** The list of objects listening for remote experiment events */
194	private FastVector m_listeners = new FastVector();
195
196	/** Holds the names of machines with remoteEngine servers running */
197	protected DefaultListModel m_remoteHosts = new DefaultListModel();
198
199	/** The queue of available hosts */
200	private Queue m_remoteHostsQueue = new Queue();
201
202	/** The status of each of the remote hosts */
203	private int [] m_remoteHostsStatus;
204
205	/** The number of times tasks have failed on each remote host */
206	private int [] m_remoteHostFailureCounts;
207
208	/** status of the remote host: available */
209	protected static final int AVAILABLE=0;
210	/** status of the remote host: in use */
211	protected static final int IN_USE=1;
212	/** status of the remote host: connection failed */
213	protected static final int CONNECTION_FAILED=2;
214	/** status of the remote host: some other failure */
215	protected static final int SOME_OTHER_FAILURE=3;
216
217	// protected static final int TO_BE_RUN=0;
218	// protected static final int PROCESSING=1;
219	// protected static final int FAILED=2;
220	// protected static final int FINISHED=3;
221
222	/** allow at most 3 failures on a host before it is removed from the list
223	of usable hosts */
224	protected static final int MAX_FAILURES=3;
225
226	/** Set to true if MAX_FAILURES exceeded on all hosts or connections fail
227	on all hosts or user aborts experiment (via gui) */
228	private boolean m_experimentAborted = false;
229
230	/** The number of hosts removed due to exceeding max failures */
231	private int m_removedHosts;
232
233	/** The count of failed sub-experiments */
234	private int m_failedCount;
235
236	/** The count of successfully completed sub-experiments */
237	private int m_finishedCount;
238
239	/** The base experiment to split up into sub experiments for remote
240	execution */
241	private Experiment m_baseExperiment = null;
242
243	/** The sub experiments */
244	protected Experiment [] m_subExperiments;
245
246	/** The queue of sub experiments waiting to be processed */
247	private Queue m_subExpQueue = new Queue();
248
249	/** The status of each of the sub-experiments */
250	protected int [] m_subExpComplete;
251
252	/**
253	* If true, then sub experiments are created on the basis of data sets
254	* rather than run number.
255	*/
256	protected boolean m_splitByDataSet = true;
257
258
259	/**
260	* Returns true if sub experiments are to be created on the basis of
261	* data set..
262	*
263	* @return a <code>boolean</code> value indicating whether sub
264	* experiments are to be created on the basis of data set (true) or
265	* run number (false).
266	*/
267	public boolean getSplitByDataSet() {
268	return m_splitByDataSet;
269	}
270
271	/**
272	* Set whether sub experiments are to be created on the basis of
273	* data set.
274	*
275	* @param sd true if sub experiments are to be created on the basis
276	* of data set. Otherwise sub experiments are created on the basis of
277	* run number.
278	*/
279	public void setSplitByDataSet(boolean sd) {
280	m_splitByDataSet = sd;
281	}
282
/**
 * Creates a RemoteExperiment whose base experiment is a freshly
 * constructed, empty Experiment.
 *
 * @throws Exception declared because the delegated constructor rejects a
 * null base experiment
 */
public RemoteExperiment() throws Exception {
  this(new Experiment());
}
291
/**
 * Creates a RemoteExperiment that wraps the supplied base experiment.
 *
 * @param base the experiment to split up and run remotely
 * @throws Exception if <code>base</code> is null
 */
public RemoteExperiment(Experiment base) throws Exception {
  this.setBaseExperiment(base);
}
300
301	/**
302	* Add an object to the list of those interested in recieving update
303	* information from the RemoteExperiment
304	* @param r a listener
305	*/
306	public void addRemoteExperimentListener(RemoteExperimentListener r) {
307	m_listeners.addElement(r);
308	}
309
310	/**
311	* Get the base experiment used by this remote experiment
312	* @return the base experiment
313	*/
314	public Experiment getBaseExperiment() {
315	return m_baseExperiment;
316	}
317
318	/**
319	* Set the base experiment. A sub experiment will be created for each
320	* run in the base experiment.
321	* @param base the base experiment to use.
322	* @throws Exception if supplied base experiment is null
323	*/
324	public void setBaseExperiment(Experiment base) throws Exception {
325	if (base == null) {
326	throw new Exception("Base experiment is null!");
327	}
328	m_baseExperiment = base;
329	setRunLower(m_baseExperiment.getRunLower());
330	setRunUpper(m_baseExperiment.getRunUpper());
331	setResultListener(m_baseExperiment.getResultListener());
332	setResultProducer(m_baseExperiment.getResultProducer());
333	setDatasets(m_baseExperiment.getDatasets());
334	setUsePropertyIterator(m_baseExperiment.getUsePropertyIterator());
335	setPropertyPath(m_baseExperiment.getPropertyPath());
336	setPropertyArray(m_baseExperiment.getPropertyArray());
337	setNotes(m_baseExperiment.getNotes());
338	m_ClassFirst = m_baseExperiment.m_ClassFirst;
339	m_AdvanceDataSetFirst = m_baseExperiment.m_AdvanceDataSetFirst;
340	}
341
342	/**
343	* Set the user notes.
344	*
345	* @param newNotes New user notes.
346	*/
347	public void setNotes(String newNotes) {
348
349	super.setNotes(newNotes);
350	m_baseExperiment.setNotes(newNotes);
351	}
352
353	/**
354	* Set the lower run number for the experiment.
355	*
356	* @param newRunLower the lower run number for the experiment.
357	*/
358	public void setRunLower(int newRunLower) {
359
360	super.setRunLower(newRunLower);
361	m_baseExperiment.setRunLower(newRunLower);
362	}
363
364	/**
365	* Set the upper run number for the experiment.
366	*
367	* @param newRunUpper the upper run number for the experiment.
368	*/
369	public void setRunUpper(int newRunUpper) {
370
371	super.setRunUpper(newRunUpper);
372	m_baseExperiment.setRunUpper(newRunUpper);
373	}
374
375	/**
376	* Sets the result listener where results will be sent.
377	*
378	* @param newResultListener the result listener where results will be sent.
379	*/
380	public void setResultListener(ResultListener newResultListener) {
381
382	super.setResultListener(newResultListener);
383	m_baseExperiment.setResultListener(newResultListener);
384	}
385
386	/**
387	* Set the result producer used for the current experiment.
388	*
389	* @param newResultProducer result producer to use for the current
390	* experiment.
391	*/
392	public void setResultProducer(ResultProducer newResultProducer) {
393
394	super.setResultProducer(newResultProducer);
395	m_baseExperiment.setResultProducer(newResultProducer);
396	}
397
398	/**
399	* Set the datasets to use in the experiment
400	* @param ds the list of datasets to use
401	*/
402	public void setDatasets(DefaultListModel ds) {
403	super.setDatasets(ds);
404	m_baseExperiment.setDatasets(ds);
405	}
406
407	/**
408	* Sets whether the custom property iterator should be used.
409	*
410	* @param newUsePropertyIterator true if so
411	*/
412	public void setUsePropertyIterator(boolean newUsePropertyIterator) {
413
414	super.setUsePropertyIterator(newUsePropertyIterator);
415	m_baseExperiment.setUsePropertyIterator(newUsePropertyIterator);
416	}
417
418	/**
419	* Sets the path of properties taken to get to the custom property
420	* to iterate over.
421	*
422	* @param newPropertyPath an array of PropertyNodes
423	*/
424	public void setPropertyPath(PropertyNode [] newPropertyPath) {
425
426	super.setPropertyPath(newPropertyPath);
427	m_baseExperiment.setPropertyPath(newPropertyPath);
428	}
429
430	/**
431	* Sets the array of values to set the custom property to.
432	*
433	* @param newPropArray a value of type Object which should be an
434	* array of the appropriate values.
435	*/
436	public void setPropertyArray(Object newPropArray) {
437	super.setPropertyArray(newPropArray);
438	m_baseExperiment.setPropertyArray(newPropArray);
439	}
440
441
442	/**
443	* Prepares a remote experiment for running, creates sub experiments
444	*
445	* @throws Exception if an error occurs
446	*/
447	public void initialize() throws Exception {
448	if (m_baseExperiment == null) {
449	throw new Exception("No base experiment specified!");
450	}
451
452	m_experimentAborted = false;
453	m_finishedCount = 0;
454	m_failedCount = 0;
455	m_RunNumber = getRunLower();
456	m_DatasetNumber = 0;
457	m_PropertyNumber = 0;
458	m_CurrentProperty = -1;
459	m_CurrentInstances = null;
460	m_Finished = false;
461
462	if (m_remoteHosts.size() == 0) {
463	throw new Exception("No hosts specified!");
464	}
465	// initialize all remote hosts to available
466	m_remoteHostsStatus = new int [m_remoteHosts.size()];
467	m_remoteHostFailureCounts = new int [m_remoteHosts.size()];
468
469	m_remoteHostsQueue = new Queue();
470	// prime the hosts queue
471	for (int i=0;i<m_remoteHosts.size();i++) {
472	m_remoteHostsQueue.push(new Integer(i));
473	}
474
475	// set up sub experiments
476	m_subExpQueue = new Queue();
477	int numExps;
478	if (getSplitByDataSet()) {
479	numExps = m_baseExperiment.getDatasets().size();
480	} else {
481	numExps = getRunUpper() - getRunLower() + 1;
482	}
483	m_subExperiments = new Experiment[numExps];
484	m_subExpComplete = new int[numExps];
485	// create copy of base experiment
486	SerializedObject so = new SerializedObject(m_baseExperiment);
487
488	if (getSplitByDataSet()) {
489	for (int i = 0; i < m_baseExperiment.getDatasets().size(); i++) {
490	m_subExperiments[i] = (Experiment)so.getObject();
491	// one for each data set
492	DefaultListModel temp = new DefaultListModel();
493	temp.addElement(m_baseExperiment.getDatasets().elementAt(i));
494	m_subExperiments[i].setDatasets(temp);
495	m_subExpQueue.push(new Integer(i));
496	}
497	} else {
498	for (int i = getRunLower(); i <= getRunUpper(); i++) {
499	m_subExperiments[i-getRunLower()] = (Experiment)so.getObject();
500	// one run for each sub experiment
501	m_subExperiments[i-getRunLower()].setRunLower(i);
502	m_subExperiments[i-getRunLower()].setRunUpper(i);
503
504	m_subExpQueue.push(new Integer(i-getRunLower()));
505	}
506	}
507	}
508
509	/**
510	* Inform all listeners of progress
511	* @param status true if this is a status type of message
512	* @param log true if this is a log type of message
513	* @param finished true if the remote experiment has finished
514	* @param message the message.
515	*/
516	private synchronized void notifyListeners(boolean status,
517	boolean log,
518	boolean finished,
519	String message) {
520	if (m_listeners.size() > 0) {
521	for (int i=0;i<m_listeners.size();i++) {
522	RemoteExperimentListener r =
523	(RemoteExperimentListener)(m_listeners.elementAt(i));
524	r.remoteExperimentStatus(new RemoteExperimentEvent(status,
525	log,
526	finished,
527	message));
528	}
529	} else {
530	System.err.println(message);
531	}
532	}
533
534	/**
535	* Set the abort flag
536	*/
537	public void abortExperiment() {
538	m_experimentAborted = true;
539	}
540
541	/**
542	* Increment the number of successfully completed sub experiments
543	*/
544	protected synchronized void incrementFinished() {
545	m_finishedCount++;
546	}
547
548	/**
549	* Increment the overall number of failures and the number of failures for
550	* a particular host
551	* @param hostNum the index of the host to increment failure count
552	*/
553	protected synchronized void incrementFailed(int hostNum) {
554	m_failedCount++;
555	m_remoteHostFailureCounts[hostNum]++;
556	}
557
558	/**
559	* Push an experiment back on the queue of waiting experiments
560	* @param expNum the index of the experiment to push onto the queue
561	*/
562	protected synchronized void waitingExperiment(int expNum) {
563	m_subExpQueue.push(new Integer(expNum));
564	}
565
566	/**
567	* Check to see if we have failed to connect to all hosts
568	*
569	* @return true if failed to connect to all hosts
570	*/
571	private boolean checkForAllFailedHosts() {
572	boolean allbad = true;
573	for (int i = 0; i < m_remoteHostsStatus.length; i++) {
574	if (m_remoteHostsStatus[i] != CONNECTION_FAILED) {
575	allbad = false;
576	break;
577	}
578	}
579	if (allbad) {
580	abortExperiment();
581	notifyListeners(false,true,true,"Experiment aborted! All connections "
582	+"to remote hosts failed.");
583	}
584	return allbad;
585	}
586
587	/**
588	* Returns some post experiment information.
589	* @return a String containing some post experiment info
590	*/
591	private String postExperimentInfo() {
592	StringBuffer text = new StringBuffer();
593	text.append(m_finishedCount+(m_splitByDataSet
594	? " data sets"
595	: " runs") + " completed successfully. "
596	+m_failedCount+" failures during running.\n");
597	System.err.print(text.toString());
598	return text.toString();
599	}
600
601	/**
602	* Pushes a host back onto the queue of available hosts and attempts to
603	* launch a waiting experiment (if any).
604	* @param hostNum the index of the host to push back onto the queue of
605	* available hosts
606	*/
607	protected synchronized void availableHost(int hostNum) {
608	if (hostNum >= 0) {
609	if (m_remoteHostFailureCounts[hostNum] < MAX_FAILURES) {
610	m_remoteHostsQueue.push(new Integer(hostNum));
611	} else {
612	notifyListeners(false,true,false,"Max failures exceeded for host "
613	+((String)m_remoteHosts.elementAt(hostNum))
614	+". Removed from host list.");
615	m_removedHosts++;
616	}
617	}
618
619	// check for all sub exp complete or all hosts failed or failed count
620	// exceeded
621	if (m_failedCount == (MAX_FAILURES * m_remoteHosts.size())) {
622	abortExperiment();
623	notifyListeners(false,true,true,"Experiment aborted! Max failures "
624	+"exceeded on all remote hosts.");
625	return;
626	}
627
628	if ((getSplitByDataSet() &&
629	(m_baseExperiment.getDatasets().size() == m_finishedCount)) \|\|
630	(!getSplitByDataSet() &&
631	((getRunUpper() - getRunLower() + 1) == m_finishedCount))) {
632	notifyListeners(false,true,false,"Experiment completed successfully.");
633	notifyListeners(false,true,true,postExperimentInfo());
634	return;
635	}
636
637	if (checkForAllFailedHosts()) {
638	return;
639	}
640
641	if (m_experimentAborted &&
642	(m_remoteHostsQueue.size() + m_removedHosts) == m_remoteHosts.size()) {
643	notifyListeners(false,true,true,"Experiment aborted. All remote tasks "
644	+"finished.");
645	}
646
647	if (!m_subExpQueue.empty() && !m_experimentAborted) {
648	if (!m_remoteHostsQueue.empty()) {
649	int availHost, waitingExp;
650	try {
651	availHost = ((Integer)m_remoteHostsQueue.pop()).intValue();
652	waitingExp = ((Integer)m_subExpQueue.pop()).intValue();
653	launchNext(waitingExp, availHost);
654	} catch (Exception ex) {
655	ex.printStackTrace();
656	}
657	}
658	}
659	}
660
661	/**
662	* Launch a sub experiment on a remote host
663	* @param wexp the index of the sub experiment to launch
664	* @param ah the index of the available host to launch on
665	*/
666	public void launchNext(final int wexp, final int ah) {
667
668	Thread subExpThread;
669	subExpThread = new Thread() {
670	public void run() {
671	m_remoteHostsStatus[ah] = IN_USE;
672	m_subExpComplete[wexp] = TaskStatusInfo.PROCESSING;
673	RemoteExperimentSubTask expSubTsk = new RemoteExperimentSubTask();
674	expSubTsk.setExperiment(m_subExperiments[wexp]);
675	String subTaskType = (getSplitByDataSet())
676	? "dataset :" + ((File)m_subExperiments[wexp].getDatasets().
677	elementAt(0)).getName()
678	: "run :" + m_subExperiments[wexp].getRunLower();
679	try {
680	String name = "//"
681	+((String)m_remoteHosts.elementAt(ah))
682	+"/RemoteEngine";
683	Compute comp = (Compute) Naming.lookup(name);
684	// assess the status of the sub-exp
685	notifyListeners(false,true,false,"Starting "
686	+subTaskType
687	+" on host "
688	+((String)m_remoteHosts.elementAt(ah)));
689	Object subTaskId = comp.executeTask(expSubTsk);
690	boolean finished = false;
691	TaskStatusInfo is = null;
692	while (!finished) {
693	try {
694	Thread.sleep(2000);
695
696	TaskStatusInfo cs = (TaskStatusInfo)comp.
697	checkStatus(subTaskId);
698	if (cs.getExecutionStatus() == TaskStatusInfo.FINISHED) {
699	// push host back onto queue and try launching any waiting
700	// sub-experiments
701	notifyListeners(false, true, false, cs.getStatusMessage());
702	m_remoteHostsStatus[ah] = AVAILABLE;
703	incrementFinished();
704	availableHost(ah);
705	finished = true;
706	} else if (cs.getExecutionStatus() == TaskStatusInfo.FAILED) {
707	// a non connection related error---possibly host doesn't have
708	// access to data sets or security policy is not set up
709	// correctly or classifier(s) failed for some reason
710	notifyListeners(false, true, false, cs.getStatusMessage());
711	m_remoteHostsStatus[ah] = SOME_OTHER_FAILURE;
712	m_subExpComplete[wexp] = TaskStatusInfo.FAILED;
713	notifyListeners(false,true,false,subTaskType
714	+" "+cs.getStatusMessage()
715	+". Scheduling for execution on another host.");
716	incrementFailed(ah);
717	// push experiment back onto queue
718	waitingExperiment(wexp);
719	// push host back onto queue and try launching any waiting
720	// sub-experiments. Host is pushed back on the queue as the
721	// failure may be temporary---eg. with InstantDB using the
722	// RMI bridge, two or more threads may try to create the
723	// experiment index or results table simultaneously; all but
724	// one will throw an exception. These hosts are still usable
725	// however.
726	availableHost(ah);
727	finished = true;
728	} else {
729	if (is == null) {
730	is = cs;
731	notifyListeners(false, true, false, cs.getStatusMessage());
732	} else {
733	if (cs.getStatusMessage().
734	compareTo(is.getStatusMessage()) != 0) {
735
736	notifyListeners(false, true, false,
737	cs.getStatusMessage());
738	}
739	is = cs;
740	}
741	}
742	} catch (InterruptedException ie) {
743	}
744	}
745
746	} catch (Exception ce) {
747	m_remoteHostsStatus[ah] = CONNECTION_FAILED;
748	m_subExpComplete[wexp] = TaskStatusInfo.TO_BE_RUN;
749	System.err.println(ce);
750	ce.printStackTrace();
751	notifyListeners(false,true,false,"Connection to "
752	+((String)m_remoteHosts.elementAt(ah))
753	+" failed. Scheduling "
754	+subTaskType
755	+" for execution on another host.");
756	checkForAllFailedHosts();
757	waitingExperiment(wexp);
758	} finally {
759	if (isInterrupted()) {
760	System.err.println("Sub exp Interupted!");
761	}
762	}
763	}
764	};
765	subExpThread.setPriority(Thread.MIN_PRIORITY);
766	subExpThread.start();
767	}
768
769	/**
770	* Overides the one in Experiment
771	* @throws Exception never throws an exception
772	*/
773	public void nextIteration() throws Exception {
774
775	}
776
777	/**
778	* overides the one in Experiment
779	*/
780	public void advanceCounters() {
781
782	}
783
784	/**
785	* overides the one in Experiment
786	*/
787	public void postProcess() {
788
789	}
790
791	/**
792	* Add a host name to the list of remote hosts
793	* @param hostname the host name to add to the list
794	*/
795	public void addRemoteHost(String hostname) {
796	m_remoteHosts.addElement(hostname);
797	}
798
799	/**
800	* Get the list of remote host names
801	* @return the list of remote host names
802	*/
803	public DefaultListModel getRemoteHosts() {
804	return m_remoteHosts;
805	}
806
807	/**
808	* Set the list of remote host names
809	* @param list the list of remote host names
810	*/
811	public void setRemoteHosts(DefaultListModel list) {
812	m_remoteHosts = list;
813	}
814
815	/**
816	* Overides toString in Experiment
817	* @return a description of this remote experiment
818	*/
819	public String toString() {
820	String result = m_baseExperiment.toString();
821
822	result += "\nRemote Hosts:\n";
823	for (int i=0;i<m_remoteHosts.size();i++) {
824	result += ((String)m_remoteHosts.elementAt(i)) +'\n';
825	}
826	return result;
827	}
828
829	/**
830	* Overides runExperiment in Experiment
831	*/
832	public void runExperiment() {
833	int totalHosts = m_remoteHostsQueue.size();
834	// Try to launch sub experiments on all available hosts
835	for (int i = 0; i < totalHosts; i++) {
836	availableHost(-1);
837	}
838	}
839
840	/**
841	* Returns the revision string.
842	*
843	* @return the revision
844	*/
845	public String getRevision() {
846	return RevisionUtils.extract("$Revision: 1.16 $");
847	}
848
849	/**
850	* Configures/Runs the Experiment from the command line.
851	*
852	* @param args command line arguments to the Experiment.
853	*/
854	public static void main(String[] args) {
855
856	try {
857	RemoteExperiment exp = null;
858
859	// get options from XML?
860	String xmlOption = Utils.getOption("xml", args);
861	if (!xmlOption.equals(""))
862	args = new XMLOptions(xmlOption).toArray();
863
864	Experiment base = null;
865	String expFile = Utils.getOption('l', args);
866	String saveFile = Utils.getOption('s', args);
867	boolean runExp = Utils.getFlag('r', args);
868	FastVector remoteHosts = new FastVector();
869	String runHost = " ";
870	while (runHost.length() != 0) {
871	runHost = Utils.getOption('h', args);
872	if (runHost.length() != 0) {
873	remoteHosts.addElement(runHost);
874	}
875	}
876	if (expFile.length() == 0) {
877	base = new Experiment();
878	try {
879	base.setOptions(args);
880	Utils.checkForRemainingOptions(args);
881	} catch (Exception ex) {
882	ex.printStackTrace();
883	String result = "Usage:\n\n"
884	+ "-l <exp file>\n"
885	+ "\tLoad experiment from file (default use cli options)\n"
886	+ "-s <exp file>\n"
887	+ "\tSave experiment to file after setting other options\n"
888	+ "\t(default don't save)\n"
889	+ "-h <remote host name>\n"
890	+ "\tHost to run experiment on (may be specified more than once\n"
891	+ "\tfor multiple remote hosts)\n"
892	+ "-r \n"
893	+ "\tRun experiment on (default don't run)\n"
894	+ "-xml <filename \| xml-string>\n"
895	+ "\tget options from XML-Data instead from parameters\n"
896	+ "\n";
897	Enumeration enm = ((OptionHandler)base).listOptions();
898	while (enm.hasMoreElements()) {
899	Option option = (Option) enm.nextElement();
900	result += option.synopsis() + "\n";
901	result += option.description() + "\n";
902	}
903	throw new Exception(result + "\n" + ex.getMessage());
904	}
905	} else {
906	Object tmp;
907
908	// KOML?
909	if ( (KOML.isPresent()) && (expFile.toLowerCase().endsWith(KOML.FILE_EXTENSION)) ) {
910	tmp = KOML.read(expFile);
911	}
912	else
913	// XML?
914	if (expFile.toLowerCase().endsWith(".xml")) {
915	XMLExperiment xml = new XMLExperiment();
916	tmp = xml.read(expFile);
917	}
918	// binary
919	else {
920	FileInputStream fi = new FileInputStream(expFile);
921	ObjectInputStream oi = new ObjectInputStream(
922	new BufferedInputStream(fi));
923	tmp = oi.readObject();
924	oi.close();
925	}
926	if (tmp instanceof RemoteExperiment) {
927	exp = (RemoteExperiment)tmp;
928	} else {
929	base = (Experiment)tmp;
930	}
931	}
932	if (base != null) {
933	exp = new RemoteExperiment(base);
934	}
935	for (int i=0;i<remoteHosts.size();i++) {
936	exp.addRemoteHost((String)remoteHosts.elementAt(i));
937	}
938	System.err.println("Experiment:\n" + exp.toString());
939
940	if (saveFile.length() != 0) {
941	// KOML?
942	if ( (KOML.isPresent()) && (saveFile.toLowerCase().endsWith(KOML.FILE_EXTENSION)) ) {
943	KOML.write(saveFile, exp);
944	}
945	else
946	// XML?
947	if (saveFile.toLowerCase().endsWith(".xml")) {
948	XMLExperiment xml = new XMLExperiment();
949	xml.write(saveFile, exp);
950	}
951	// binary
952	else {
953	FileOutputStream fo = new FileOutputStream(saveFile);
954	ObjectOutputStream oo = new ObjectOutputStream(
955	new BufferedOutputStream(fo));
956	oo.writeObject(exp);
957	oo.close();
958	}
959	}
960
961	if (runExp) {
962	System.err.println("Initializing...");
963	exp.initialize();
964	System.err.println("Iterating...");
965	exp.runExperiment();
966	System.err.println("Postprocessing...");
967	exp.postProcess();
968	}
969	} catch (Exception ex) {
970	ex.printStackTrace();
971	System.err.println(ex.getMessage());
972	}
973	}
974	}

Note: See TracBrowser for help on using the repository browser.

Download in other formats: