/* * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. */ /* * Evaluation.java * Copyright (C) 1999 University of Waikato, Hamilton, New Zealand * */ package weka.classifiers; import weka.classifiers.evaluation.NominalPrediction; import weka.classifiers.evaluation.NumericPrediction; import weka.classifiers.evaluation.ThresholdCurve; import weka.classifiers.evaluation.output.prediction.AbstractOutput; import weka.classifiers.evaluation.output.prediction.PlainText; import weka.classifiers.pmml.consumer.PMMLClassifier; import weka.classifiers.xml.XMLClassifier; import weka.core.Drawable; import weka.core.FastVector; import weka.core.Instance; import weka.core.Instances; import weka.core.Option; import weka.core.OptionHandler; import weka.core.RevisionHandler; import weka.core.RevisionUtils; import weka.core.Summarizable; import weka.core.Utils; import weka.core.Version; import weka.core.converters.ConverterUtils.DataSink; import weka.core.converters.ConverterUtils.DataSource; import weka.core.pmml.PMMLFactory; import weka.core.pmml.PMMLModel; import weka.core.xml.KOML; import weka.core.xml.XMLOptions; import weka.core.xml.XMLSerialization; import weka.estimators.UnivariateKernelEstimator; import java.beans.BeanInfo; import java.beans.Introspector; import java.beans.MethodDescriptor; import java.io.BufferedInputStream; import 
java.io.BufferedOutputStream; import java.io.BufferedReader; import java.io.FileInputStream; import java.io.FileOutputStream; import java.io.FileReader; import java.io.InputStream; import java.io.ObjectInputStream; import java.io.ObjectOutputStream; import java.io.OutputStream; import java.io.Reader; import java.lang.reflect.Method; import java.util.Date; import java.util.Enumeration; import java.util.Random; import java.util.zip.GZIPInputStream; import java.util.zip.GZIPOutputStream; /** * Class for evaluating machine learning models.

* * -------------------------------------------------------------------

* * General options when evaluating a learning scheme from the command-line:

* * -t filename
* Name of the file with the training data. (required)

* * -T filename
* Name of the file with the test data. If missing, a cross-validation * is performed.

* * -c index
* Index of the class attribute (1, 2, ...; default: last).

* * -x number
* The number of folds for the cross-validation (default: 10).

* * -no-cv
* No cross validation. If no test file is provided, no evaluation * is done.

* * -split-percentage percentage
* Sets the percentage for the train/test set split, e.g., 66.

* * -preserve-order
* Preserves the order in the percentage split instead of randomizing * the data first with the seed value ('-s').

* * -s seed
* Random number seed for the cross-validation and percentage split * (default: 1).

* * -m filename
* The name of a file containing a cost matrix.

* * -l filename
* Loads classifier from the given file. In case the filename ends with ".xml", * a PMML file is loaded or, if that fails, options are loaded from XML.

* * -d filename
* Saves classifier built from the training data into the given file. In case * the filename ends with ".xml" the options are saved as XML, not the model.

* * -v
* Outputs no statistics for the training data.

* * -o
* Outputs statistics only, not the classifier.

* * -i
* Outputs information-retrieval statistics per class.

* * -k
* Outputs information-theoretic statistics.

* * -classifications "weka.classifiers.evaluation.output.prediction.AbstractOutput + options"
* Uses the specified class for generating the classification output. * E.g.: weka.classifiers.evaluation.output.prediction.PlainText * or : weka.classifiers.evaluation.output.prediction.CSV * * -p range
* Outputs predictions for test instances (or the train instances if no test * instances provided and -no-cv is used), along with the attributes in the specified range * (and nothing else). Use '-p 0' if no attributes are desired.

* Deprecated: use "-classifications ..." instead.

* * -distribution
* Outputs the distribution instead of only the prediction * in conjunction with the '-p' option (only nominal classes).

* Deprecated: use "-classifications ..." instead.

* * -r
* Outputs cumulative margin distribution (and nothing else).

* * -g
* Only for classifiers that implement "Graphable." Outputs * the graph representation of the classifier (and nothing * else).

* * -xml filename | xml-string
* Retrieves the options from the XML-data instead of the command line.

* * -threshold-file file
* The file to save the threshold data to. * The format is determined by the extensions, e.g., '.arff' for ARFF * format or '.csv' for CSV.

* * -threshold-label label
* The class label to determine the threshold data for * (default is the first label)

* * -------------------------------------------------------------------

* * Example usage as the main of a classifier (called FunkyClassifier): *

 * public static void main(String [] args) {
 *   runClassifier(new FunkyClassifier(), args);
 * }
 *

* * ------------------------------------------------------------------

* * Example usage from within an application: *

 * Instances trainInstances = ... instances got from somewhere
 * Instances testInstances = ... instances got from somewhere
 * Classifier scheme = ... scheme got from somewhere
 *
 * Evaluation evaluation = new Evaluation(trainInstances);
 * evaluation.evaluateModel(scheme, testInstances);
 * System.out.println(evaluation.toSummaryString());
 *

* * * @author Eibe Frank (eibe@cs.waikato.ac.nz) * @author Len Trigg (trigg@cs.waikato.ac.nz) * @version $Revision: 6041 $ */ public class Evaluation implements Summarizable, RevisionHandler { /** The number of classes. */ protected int m_NumClasses; /** The number of folds for a cross-validation. */ protected int m_NumFolds; /** The weight of all incorrectly classified instances. */ protected double m_Incorrect; /** The weight of all correctly classified instances. */ protected double m_Correct; /** The weight of all unclassified instances. */ protected double m_Unclassified; /** The weight of all instances that had no class assigned to them. */ protected double m_MissingClass; /** The weight of all instances that had a class assigned to them. */ protected double m_WithClass; /** Array for storing the confusion matrix (only allocated by the constructor when the class is nominal). */ protected double [][] m_ConfusionMatrix; /** The names of the classes (only filled in by the constructor when the class is nominal). */ protected String [] m_ClassNames; /** Is the class nominal or numeric? */ protected boolean m_ClassIsNominal; /** The prior probabilities of the classes. */ protected double [] m_ClassPriors; /** The sum of counts for priors. */ protected double m_ClassPriorsSum; /** The cost matrix (if given). */ protected CostMatrix m_CostMatrix; /** The total cost of predictions (includes instance weights). */ protected double m_TotalCost; /** Sum of errors. */ protected double m_SumErr; /** Sum of absolute errors. */ protected double m_SumAbsErr; /** Sum of squared errors. */ protected double m_SumSqrErr; /** Sum of class values. */ protected double m_SumClass; /** Sum of squared class values. */ protected double m_SumSqrClass; /** Sum of predicted values. */ protected double m_SumPredicted; /** Sum of squared predicted values. */ protected double m_SumSqrPredicted; /** Sum of the products (predicted value * class value). */ protected double m_SumClassPredicted; /** Sum of absolute errors of the prior. */ protected double m_SumPriorAbsErr; /** Sum of squared errors of the prior.
*/ protected double m_SumPriorSqrErr; /** Total Kononenko and Bratko information. */ protected double m_SumKBInfo; /** Resolution of the margin histogram. */ protected static int k_MarginResolution = 500; /** Cumulative margin distribution. */ protected double m_MarginCounts []; /** Number of non-missing class training instances seen. */ protected int m_NumTrainClassVals; /** Array containing all numeric training class values seen. */ protected double [] m_TrainClassVals; /** Array containing all numeric training class weights. */ protected double [] m_TrainClassWeights; /** Numeric class estimator for prior. */ protected UnivariateKernelEstimator m_PriorEstimator; /** Whether complexity statistics are available. */ protected boolean m_ComplexityStatisticsAvailable = true; /** * The minimum probability accepted from an estimator to avoid * taking log(0) in Sf calculations. */ protected static final double MIN_SF_PROB = Double.MIN_VALUE; /** Total entropy of prior predictions. */ protected double m_SumPriorEntropy; /** Total entropy of scheme predictions. */ protected double m_SumSchemeEntropy; /** Whether coverage statistics are available. */ protected boolean m_CoverageStatisticsAvailable = true; /** The confidence level used for coverage statistics. */ protected double m_ConfLevel = 0.95; /** Total size of predicted regions at the given confidence level. */ protected double m_TotalSizeOfRegions; /** Total coverage of test cases at the given confidence level. */ protected double m_TotalCoverage; /** Minimum target value. */ protected double m_MinTarget; /** Maximum target value. */ protected double m_MaxTarget; /** The list of predictions that have been generated (for computing AUC). */ protected FastVector m_Predictions; /** Enables/disables the use of priors, e.g., if no training set is * present in case of de-serialized schemes. */ protected boolean m_NoPriors = false; /** The header of the training set.
*/ protected Instances m_Header; /** * Initializes all the counters for the evaluation. * Use useNoPriors() if the dataset is the test set and you * can't initialize with the priors from the training set via * setPriors(Instances). * * @param data set of training instances, to get some header * information and prior class distribution information * @throws Exception if the class is not defined * @see #useNoPriors() * @see #setPriors(Instances) */ public Evaluation(Instances data) throws Exception { this(data, null); } /** * Initializes all the counters for the evaluation and also takes a * cost matrix as parameter. * Use useNoPriors() if the dataset is the test set and you * can't initialize with the priors from the training set via * setPriors(Instances). * * @param data set of training instances, to get some header * information and prior class distribution information * @param costMatrix the cost matrix---if null, default costs will be used * @throws Exception if cost matrix is not compatible with * data, the class is not defined or the class is numeric * @see #useNoPriors() * @see #setPriors(Instances) */ public Evaluation(Instances data, CostMatrix costMatrix) throws Exception { m_Header = new Instances(data, 0); m_NumClasses = data.numClasses(); m_NumFolds = 1; m_ClassIsNominal = data.classAttribute().isNominal(); if (m_ClassIsNominal) { m_ConfusionMatrix = new double [m_NumClasses][m_NumClasses]; m_ClassNames = new String [m_NumClasses]; for(int i = 0; i < m_NumClasses; i++) { m_ClassNames[i] = data.classAttribute().value(i); } } m_CostMatrix = costMatrix; if (m_CostMatrix != null) { if (!m_ClassIsNominal) { throw new Exception("Class has to be nominal if cost matrix given!"); } if (m_CostMatrix.size() != m_NumClasses) { throw new Exception("Cost matrix not compatible with data!"); } } m_ClassPriors = new double [m_NumClasses]; setPriors(data); m_MarginCounts = new double [k_MarginResolution + 1]; } /** * Returns the header of the underlying dataset. 
* * @return the header information */ public Instances getHeader() { return m_Header; } /** * Returns the area under ROC for those predictions that have been collected * in the evaluateClassifier(Classifier, Instances) method. Returns * Utils.missingValue() if the area is not available. * * @param classIndex the index of the class to consider as "positive" * @return the area under the ROC curve or not a number */ public double areaUnderROC(int classIndex) { // Check if any predictions have been collected if (m_Predictions == null) { return Utils.missingValue(); } else { ThresholdCurve tc = new ThresholdCurve(); Instances result = tc.getCurve(m_Predictions, classIndex); return ThresholdCurve.getROCArea(result); } } /** * Calculates the weighted (by class size) AUC. * * @return the weighted AUC. */ public double weightedAreaUnderROC() { double[] classCounts = new double[m_NumClasses]; double classCountSum = 0; for (int i = 0; i < m_NumClasses; i++) { for (int j = 0; j < m_NumClasses; j++) { classCounts[i] += m_ConfusionMatrix[i][j]; } classCountSum += classCounts[i]; } double aucTotal = 0; for(int i = 0; i < m_NumClasses; i++) { double temp = areaUnderROC(i); if (!Utils.isMissingValue(temp)) { aucTotal += (temp * classCounts[i]); } } return aucTotal / classCountSum; } /** * Returns a copy of the confusion matrix. * * @return a copy of the confusion matrix as a two-dimensional array */ public double[][] confusionMatrix() { double[][] newMatrix = new double[m_ConfusionMatrix.length][0]; for (int i = 0; i < m_ConfusionMatrix.length; i++) { newMatrix[i] = new double[m_ConfusionMatrix[i].length]; System.arraycopy(m_ConfusionMatrix[i], 0, newMatrix[i], 0, m_ConfusionMatrix[i].length); } return newMatrix; } /** * Performs a (stratified if class is nominal) cross-validation * for a classifier on a set of instances. Now performs * a deep copy of the classifier before each call to * buildClassifier() (just in case the classifier is not * initialized properly). 
* * @param classifier the classifier with any options set. * @param data the data on which the cross-validation is to be * performed * @param numFolds the number of folds for the cross-validation * @param random random number generator for randomization * @param forPredictionsPrinting varargs parameter that, if supplied, is * expected to hold a weka.classifiers.evaluation.output.prediction.AbstractOutput * object * @throws Exception if a classifier could not be generated * successfully or the class is not defined */ public void crossValidateModel(Classifier classifier, Instances data, int numFolds, Random random, Object... forPredictionsPrinting) throws Exception { // Make a copy of the data we can reorder data = new Instances(data); data.randomize(random); if (data.classAttribute().isNominal()) { data.stratify(numFolds); } // We assume that the first element is a // weka.classifiers.evaluation.output.prediction.AbstractOutput object AbstractOutput classificationOutput = null; if (forPredictionsPrinting.length > 0) { // print the header first classificationOutput = (AbstractOutput) forPredictionsPrinting[0]; classificationOutput.setHeader(data); classificationOutput.printHeader(); } // Do the folds for (int i = 0; i < numFolds; i++) { Instances train = data.trainCV(numFolds, i, random); setPriors(train); Classifier copiedClassifier = AbstractClassifier.makeCopy(classifier); copiedClassifier.buildClassifier(train); Instances test = data.testCV(numFolds, i); evaluateModel(copiedClassifier, test, forPredictionsPrinting); } m_NumFolds = numFolds; if (classificationOutput != null) classificationOutput.printFooter(); } /** * Performs a (stratified if class is nominal) cross-validation * for a classifier on a set of instances. 
* * @param classifierString a string naming the class of the classifier * @param data the data on which the cross-validation is to be * performed * @param numFolds the number of folds for the cross-validation * @param options the options to the classifier. Any options * @param random the random number generator for randomizing the data * accepted by the classifier will be removed from this array. * @throws Exception if a classifier could not be generated * successfully or the class is not defined */ public void crossValidateModel(String classifierString, Instances data, int numFolds, String[] options, Random random) throws Exception { crossValidateModel(AbstractClassifier.forName(classifierString, options), data, numFolds, random); } /** * Evaluates a classifier with the options given in an array of * strings.

* * Valid options are: