Java Machine Learning Library Source code

Status: Beta
Brought to you by: thomasabeel
[572a65]: / src / libsvm / LibSVM.java Maximize Restore History
271 lines (238 with data), 7.1 kB

/**
 * %SVN.HEADER%
 */
package libsvm;

import java.util.SortedSet;

import net.sf.javaml.classification.AbstractClassifier;
import net.sf.javaml.core.Dataset;
import net.sf.javaml.core.Instance;
import net.sf.javaml.core.exception.TrainingRequiredException;

/**
 * Wrapper for the libSVM library by Chih-Chung Chang and Chih-Jen Lin. This
 * class allows you to use the power of libSVM in Java-ML.
 * 
 * <pre>
 * Chih-Chung Chang and Chih-Jen Lin, LIBSVM : a library for support vector
 * machines, 2001. Software available at
 * http://www.csie.ntu.edu.tw/&tilde;cjlin/libsvm
 * </pre>
 * 
 * @author Thomas Abeel
 * 
 */
public class LibSVM extends AbstractClassifier {

	public static svm_print_interface svm_print_console = null;
	public static svm_print_interface svm_print_null = new svm_print_interface() {
		public void print(String s) {
		}
	};
	/* By default console output is turned off. */
	static {
		svm.svm_set_print_string_function(svm_print_null);
	}

	private static final long serialVersionUID = -8901871714620581945L;

	/**
	 * Create a new instance of libsvm.
	 */
	public LibSVM() {
		param = new svm_parameter();
		// default values
		param.svm_type = svm_parameter.C_SVC;
		param.C = 1;
		param.kernel_type = svm_parameter.LINEAR;
		param.degree = 1;
		param.gamma = 0; // 1/k
		param.coef0 = 0;
		param.nu = 0.5;
		param.cache_size = 100;
		param.eps = 1e-3;
		param.p = 0.1;
		param.shrinking = 1;
		param.probability = 0;
		param.nr_weight = 0;
		param.weight_label = new int[0];
		param.weight = new double[0];
	}

	/**
	 * Returns a reference to the parameter configuration of the SVM
	 * 
	 * @return the current configuration
	 */
	public svm_parameter getParameters() {
		return param;
	}

	private static svm_problem transformDataset(Dataset data, boolean regression) {
		svm_problem p = new svm_problem();
		p.l = data.size();
		p.y = new double[data.size()];
		p.x = new svm_node[data.size()][];
		int tmpIndex = 0;
		for (int j = 0; j < data.size(); j++) {
			Instance tmp = data.instance(j);
			if (regression)
				p.y[tmpIndex] = Double.parseDouble(tmp.classValue().toString());
			else
				p.y[tmpIndex] = data.classIndex(tmp.classValue());
			p.x[tmpIndex] = new svm_node[tmp.keySet().size()];
			int i = 0;
			SortedSet<Integer> tmpSet = tmp.keySet();
			for (int index : tmpSet) {
				p.x[tmpIndex][i] = new svm_node();
				p.x[tmpIndex][i].index = index;
				p.x[tmpIndex][i].value = tmp.value(index);
				i++;
			}
			tmpIndex++;
		}
		return p;
	}

	private svm_parameter param;
	private Dataset data;
	private svm_model model;

	/**
	 * Set the parameters that will be used for training.
	 * 
	 * @param param
	 *            a set of parameters
	 */
	public void setParameters(svm_parameter param) {
		this.param = param;
	}

	/**
	 * Set the print interface that will be used for training. print a print
	 * interface. If <code>LibSVM.svm_print_console</code> is provided then
	 * output will be printed to standard out. If
	 * <code>LibSVM.svm_print_null</code> is provided then no output will be
	 * printed.
	 * 
	 * By default this the printmode is set to
	 * <code>LibSVM.svm_print_null</code>
	 */
	public static void setPrintInterface(svm_print_interface print) {
		svm.svm_set_print_string_function(print);
	}

	@Override
	public void buildClassifier(Dataset data) {
		super.buildClassifier(data);
		this.data = data;

		svm_problem p = null;
		if (param.svm_type == svm_parameter.EPSILON_SVR) {
			System.out.println("Using regression transformation");
			p = transformDataset(data, true);
		} else
			p = transformDataset(data, false);

		model = svm.svm_train(p, param);

		double[][] coef = model.sv_coef;

		assert model.SV != null;
		assert model.SV.length > 0;

		double[][] prob = new double[model.SV.length][data.noAttributes()];
		for (int i = 0; i < model.SV.length; i++) {
			for (int j = 0; j < data.noAttributes(); j++) {
				prob[i][j] = 0;
			}
		}
		for (int i = 0; i < model.SV.length; i++) {
			for (int j = 0; j < model.SV[i].length; j++) {
				prob[i][model.SV[i][j].index] = model.SV[i][j].value;
			}
		}
		/* Weights are only available for linear SVMs */
		if (param.svm_type == svm_parameter.C_SVC) {
			double w_list[][][] = new double[model.nr_class][model.nr_class - 1][data
					.noAttributes()];

			for (int i = 0; i < data.noAttributes(); ++i) {
				for (int j = 0; j < model.nr_class - 1; ++j) {
					int index = 0;
					int end = 0;
					double acc;
					for (int k = 0; k < model.nr_class; ++k) {
						acc = 0.0;
						index += (k == 0) ? 0 : model.nSV[k - 1];
						end = index + model.nSV[k];
						for (int m = index; m < end; ++m) {
							acc += coef[j][m] * prob[m][i];
						}
						w_list[k][j][i] = acc;
					}
				}
			}

			weights = new double[data.noAttributes()];
			for (int i = 0; i < model.nr_class - 1; ++i) {
				for (int j = i + 1, k = i; j < model.nr_class; ++j, ++k) {
					for (int m = 0; m < data.noAttributes(); ++m) {
						weights[m] = (w_list[i][k][m] + w_list[j][i][m]);

					}
				}
			}
		} else {
			weights = null;
		}

	}

	private double[] weights;

	/**
	 * Provides access to the weights the support vectors obtained during
	 * training.
	 * 
	 * @return weight vector
	 */
	public double[] getWeights() {
		return weights;
	}

	public double[] rawDecisionValues(Instance i) {
		return svm_predict_raw(model, convert(i));
	}

	/* Method to get raw decision values */
	private double[] svm_predict_raw(svm_model model, svm_node[] x) {
		if (model.param.svm_type == svm_parameter.ONE_CLASS
				|| model.param.svm_type == svm_parameter.EPSILON_SVR
				|| model.param.svm_type == svm_parameter.NU_SVR) {
			double[] res = new double[1];
			svm.svm_predict_values(model, x, res);
			return res;
		} else {
			int nr_class = model.nr_class;
			double[] dec_values = new double[nr_class * (nr_class - 1) / 2];
			svm.svm_predict_values(model, x, dec_values);
			return dec_values;
		}
	}

	private svm_node[] convert(Instance instance) {
		svm_node[] x = new svm_node[instance.noAttributes()];
		// TODO implement sparseness
		for (int i = 0; i < instance.noAttributes(); i++) {
			x[i] = new svm_node();
			x[i].index = i;
			x[i].value = instance.value(i);
		}
		return x;
	}

	@Override
	public Object classify(Instance instance) {
		svm_node[] x = convert(instance);
		double d = svm.svm_predict(model, x);
		Object out = data.classValue((int) d);
		return out;
	}
	
	
	// public double regress(Instance instance){
	// svm_node[] x = convert(instance);
	// svm.svm
	// double d = svm.svm_predict_values(model, x);
	// svm.svm
	// return d;
	// }

	public double[] probability(Instance instance) {
		if (param.probability == 1) {
			svm_node[] x = convert(instance);
			double[] classProb = new double[2];
			double d = svm.svm_predict_probability(model, x, classProb);
			return classProb;
		} else
			throw new TrainingRequiredException(
					"You need to set svm.param.probability = 1 during training");
	}

	public int[] getLabels() {
		int res[] = new int[model.nr_class];
		svm.svm_get_labels(model, res);
		return res;
	}

}
Java Machine Learning Library Source code

Branches

[572a65]: / src / libsvm / LibSVM.java Maximize Restore History

271 lines (238 with data), 7.1 kB