1 | /* |
---|
2 | * This program is free software; you can redistribute it and/or modify |
---|
3 | * it under the terms of the GNU General Public License as published by |
---|
4 | * the Free Software Foundation; either version 2 of the License, or |
---|
5 | * (at your option) any later version. |
---|
6 | * |
---|
7 | * This program is distributed in the hope that it will be useful, |
---|
8 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
---|
9 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
---|
10 | * GNU General Public License for more details. |
---|
11 | * |
---|
12 | * You should have received a copy of the GNU General Public License |
---|
13 | * along with this program; if not, write to the Free Software |
---|
14 | * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. |
---|
15 | */ |
---|
16 | |
---|
17 | /* |
---|
18 | * ParallelMultipleClassifiersCombiner.java |
---|
19 | * Copyright (C) 2009 University of Waikato, Hamilton, New Zealand |
---|
20 | * |
---|
21 | */ |
---|
22 | |
---|
23 | package weka.classifiers; |
---|
24 | |
---|
25 | import java.util.Enumeration; |
---|
26 | import java.util.Vector; |
---|
27 | import java.util.concurrent.LinkedBlockingQueue; |
---|
28 | import java.util.concurrent.ThreadPoolExecutor; |
---|
29 | import java.util.concurrent.TimeUnit; |
---|
30 | |
---|
31 | import weka.core.Instances; |
---|
32 | import weka.core.Option; |
---|
33 | import weka.core.Utils; |
---|
34 | |
---|
35 | /** |
---|
36 | * Abstract utility class for handling settings common to |
---|
37 | * meta classifiers that build an ensemble in parallel using multiple |
---|
38 | * classifiers. |
---|
39 | * |
---|
40 | * @author Mark Hall (mhall{[at]}pentaho{[dot]}com) |
---|
41 | * @version $Revision: 6041 $ |
---|
42 | */ |
---|
43 | public abstract class ParallelMultipleClassifiersCombiner extends |
---|
44 | MultipleClassifiersCombiner { |
---|
45 | |
---|
46 | /** For serialization */ |
---|
47 | private static final long serialVersionUID = 728109028953726626L; |
---|
48 | |
---|
49 | /** The number of threads to have executing at any one time */ |
---|
50 | protected int m_numExecutionSlots = 1; |
---|
51 | |
---|
52 | /** Pool of threads to train models with */ |
---|
53 | protected transient ThreadPoolExecutor m_executorPool; |
---|
54 | |
---|
55 | /** The number of classifiers completed so far */ |
---|
56 | protected int m_completed; |
---|
57 | |
---|
58 | /** |
---|
59 | * The number of classifiers that experienced a failure of some sort |
---|
60 | * during construction |
---|
61 | */ |
---|
62 | protected int m_failed; |
---|
63 | |
---|
64 | /** |
---|
65 | * Returns an enumeration describing the available options. |
---|
66 | * |
---|
67 | * @return an enumeration of all the available options. |
---|
68 | */ |
---|
69 | public Enumeration listOptions() { |
---|
70 | |
---|
71 | Vector newVector = new Vector(2); |
---|
72 | |
---|
73 | newVector.addElement(new Option( |
---|
74 | "\tNumber of execution slots.\n" |
---|
75 | + "\t(default 1 - i.e. no parallelism)", |
---|
76 | "num-slots", 1, "-num-slots <num>")); |
---|
77 | |
---|
78 | Enumeration enu = super.listOptions(); |
---|
79 | while (enu.hasMoreElements()) { |
---|
80 | newVector.addElement(enu.nextElement()); |
---|
81 | } |
---|
82 | return newVector.elements(); |
---|
83 | } |
---|
84 | |
---|
85 | /** |
---|
86 | * Parses a given list of options. Valid options are:<p> |
---|
87 | * |
---|
88 | * -Z num <br> |
---|
89 | * Set the number of execution slots to use (default 1 - i.e. no parallelism). <p> |
---|
90 | * |
---|
91 | * Options after -- are passed to the designated classifier.<p> |
---|
92 | * |
---|
93 | * @param options the list of options as an array of strings |
---|
94 | * @exception Exception if an option is not supported |
---|
95 | */ |
---|
96 | public void setOptions(String[] options) throws Exception { |
---|
97 | |
---|
98 | String iterations = Utils.getOption("num-slots", options); |
---|
99 | if (iterations.length() != 0) { |
---|
100 | setNumExecutionSlots(Integer.parseInt(iterations)); |
---|
101 | } else { |
---|
102 | setNumExecutionSlots(1); |
---|
103 | } |
---|
104 | |
---|
105 | super.setOptions(options); |
---|
106 | } |
---|
107 | |
---|
108 | /** |
---|
109 | * Gets the current settings of the classifier. |
---|
110 | * |
---|
111 | * @return an array of strings suitable for passing to setOptions |
---|
112 | */ |
---|
113 | public String [] getOptions() { |
---|
114 | |
---|
115 | String [] superOptions = super.getOptions(); |
---|
116 | String [] options = new String [superOptions.length + 2]; |
---|
117 | |
---|
118 | int current = 0; |
---|
119 | options[current++] = "-num-slots"; |
---|
120 | options[current++] = "" + getNumExecutionSlots(); |
---|
121 | |
---|
122 | System.arraycopy(superOptions, 0, options, current, |
---|
123 | superOptions.length); |
---|
124 | |
---|
125 | return options; |
---|
126 | } |
---|
127 | |
---|
128 | /** |
---|
129 | * Set the number of execution slots (threads) to use for building the |
---|
130 | * members of the ensemble. |
---|
131 | * |
---|
132 | * @param numSlots the number of slots to use. |
---|
133 | */ |
---|
134 | public void setNumExecutionSlots(int numSlots) { |
---|
135 | m_numExecutionSlots = numSlots; |
---|
136 | } |
---|
137 | |
---|
138 | /** |
---|
139 | * Get the number of execution slots (threads) to use for building |
---|
140 | * the members of the ensemble. |
---|
141 | * |
---|
142 | * @return the number of slots to use |
---|
143 | */ |
---|
144 | public int getNumExecutionSlots() { |
---|
145 | return m_numExecutionSlots; |
---|
146 | } |
---|
147 | |
---|
148 | /** |
---|
149 | * Returns the tip text for this property |
---|
150 | * @return tip text for this property suitable for |
---|
151 | * displaying in the explorer/experimenter gui |
---|
152 | */ |
---|
153 | public String numExecutionSlotsTipText() { |
---|
154 | return "The number of execution slots (threads) to use for " + |
---|
155 | "constructing the ensemble."; |
---|
156 | } |
---|
157 | |
---|
158 | /** |
---|
159 | * Stump method for building the classifiers |
---|
160 | * |
---|
161 | * @param data the training data to be used for generating the ensemble |
---|
162 | * @exception Exception if the classifier could not be built successfully |
---|
163 | */ |
---|
164 | public void buildClassifier(Instances data) throws Exception { |
---|
165 | |
---|
166 | if (m_numExecutionSlots < 1) { |
---|
167 | throw new Exception("Number of execution slots needs to be >= 1!"); |
---|
168 | } |
---|
169 | |
---|
170 | if (m_numExecutionSlots > 1) { |
---|
171 | if (m_Debug) { |
---|
172 | System.out.println("Starting executor pool with " + m_numExecutionSlots |
---|
173 | + " slots..."); |
---|
174 | } |
---|
175 | startExecutorPool(); |
---|
176 | } |
---|
177 | m_completed = 0; |
---|
178 | m_failed = 0; |
---|
179 | } |
---|
180 | |
---|
181 | /** |
---|
182 | * Start the pool of execution threads |
---|
183 | */ |
---|
184 | protected void startExecutorPool() { |
---|
185 | if (m_executorPool != null) { |
---|
186 | m_executorPool.shutdownNow(); |
---|
187 | } |
---|
188 | |
---|
189 | m_executorPool = new ThreadPoolExecutor(m_numExecutionSlots, m_numExecutionSlots, |
---|
190 | 120, TimeUnit.SECONDS, new LinkedBlockingQueue<Runnable>()); |
---|
191 | } |
---|
192 | |
---|
193 | private synchronized void block(boolean tf) { |
---|
194 | if (tf) { |
---|
195 | try { |
---|
196 | wait(); |
---|
197 | } catch (InterruptedException ex) { |
---|
198 | } |
---|
199 | } else { |
---|
200 | notifyAll(); |
---|
201 | } |
---|
202 | } |
---|
203 | |
---|
204 | /** |
---|
205 | * Does the actual construction of the ensemble |
---|
206 | * |
---|
207 | * @throws Exception if something goes wrong during the training |
---|
208 | * process |
---|
209 | */ |
---|
210 | protected synchronized void buildClassifiers(final Instances data) throws Exception { |
---|
211 | |
---|
212 | for (int i = 0; i < m_Classifiers.length; i++) { |
---|
213 | if (m_numExecutionSlots > 1) { |
---|
214 | final Classifier currentClassifier = m_Classifiers[i]; |
---|
215 | final int iteration = i; |
---|
216 | Runnable newTask = new Runnable() { |
---|
217 | public void run() { |
---|
218 | try { |
---|
219 | if (m_Debug) { |
---|
220 | System.out.println("Training classifier (" + (iteration +1) + ")"); |
---|
221 | } |
---|
222 | currentClassifier.buildClassifier(data); |
---|
223 | if (m_Debug) { |
---|
224 | System.out.println("Finished classifier (" + (iteration +1) + ")"); |
---|
225 | } |
---|
226 | completedClassifier(iteration, true); |
---|
227 | } catch (Exception ex) { |
---|
228 | ex.printStackTrace(); |
---|
229 | completedClassifier(iteration, false); |
---|
230 | } |
---|
231 | } |
---|
232 | }; |
---|
233 | |
---|
234 | // launch this task |
---|
235 | m_executorPool.execute(newTask); |
---|
236 | } else { |
---|
237 | m_Classifiers[i].buildClassifier(data); |
---|
238 | } |
---|
239 | } |
---|
240 | |
---|
241 | if (m_numExecutionSlots > 1 && m_completed + m_failed < m_Classifiers.length) { |
---|
242 | block(true); |
---|
243 | } |
---|
244 | } |
---|
245 | |
---|
246 | /** |
---|
247 | * Records the completion of the training of a single classifier. Unblocks if |
---|
248 | * all classifiers have been trained. |
---|
249 | * |
---|
250 | * @param iteration the iteration that has completed |
---|
251 | * @param success whether the classifier trained successfully |
---|
252 | */ |
---|
253 | protected synchronized void completedClassifier(int iteration, |
---|
254 | boolean success) { |
---|
255 | m_completed++; |
---|
256 | |
---|
257 | if (!success) { |
---|
258 | m_failed++; |
---|
259 | if (m_Debug) { |
---|
260 | System.err.println("Iteration " + iteration + " failed!"); |
---|
261 | } |
---|
262 | } |
---|
263 | |
---|
264 | if (m_completed + m_failed == m_Classifiers.length) { |
---|
265 | if (m_failed > 0) { |
---|
266 | if (m_Debug) { |
---|
267 | System.err.println("Problem building classifiers - some iterations failed."); |
---|
268 | } |
---|
269 | } |
---|
270 | |
---|
271 | // have to shut the pool down or program executes as a server |
---|
272 | // and when running from the command line does not return to the |
---|
273 | // prompt |
---|
274 | m_executorPool.shutdown(); |
---|
275 | block(false); |
---|
276 | } |
---|
277 | } |
---|
278 | } |
---|