RubyGems - numo-liblinear - Versions diffs - 0.5.0 → 1.0.0 - Mend

numo-liblinear 0.5.0 → 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (20) hide show

checksums.yaml +4 -4
data/.gitmodules +3 -0
data/.travis.yml +0 -1
data/CHANGELOG.md +5 -0
data/README.md +1 -9
data/ext/numo/liblinear/extconf.rb +7 -8
data/ext/numo/liblinear/liblinear/blas/blas.h +25 -0
data/ext/numo/liblinear/liblinear/blas/blasp.h +438 -0
data/ext/numo/liblinear/liblinear/blas/daxpy.c +57 -0
data/ext/numo/liblinear/liblinear/blas/ddot.c +58 -0
data/ext/numo/liblinear/liblinear/blas/dnrm2.c +70 -0
data/ext/numo/liblinear/liblinear/blas/dscal.c +52 -0
data/ext/numo/liblinear/liblinear/linear.cpp +3203 -0
data/ext/numo/liblinear/liblinear/linear.h +83 -0
data/ext/numo/liblinear/liblinear/tron.cpp +288 -0
data/ext/numo/liblinear/liblinear/tron.h +36 -0
data/ext/numo/liblinear/liblinearext.c +3 -0
data/lib/numo/liblinear/version.rb +1 -1
data/numo-liblinear.gemspec +8 -0
metadata +13 -2

data/ext/numo/liblinear/liblinear/linear.h ADDED

@@ -0,0 +1,83 @@
+#ifndef _LIBLINEAR_H
+#define _LIBLINEAR_H
+#define LIBLINEAR_VERSION 230 /* integer version tag of these bundled sources; NOTE(review): presumably means 2.30 -- confirm upstream */
+#ifdef __cplusplus
+extern "C" { /* everything below gets C linkage when this header is compiled as C++ */
+#endif
+extern int liblinear_version; /* defined outside this header; NOTE(review): presumably holds LIBLINEAR_VERSION -- confirm in linear.cpp */
+struct feature_node /* one (index, value) pair; problem.x and the predict functions take pointers to these */
+{
+	int index;
+	double value;
+};
+struct problem /* training data passed to train(), cross_validation(), find_parameters() and check_parameter() */
+{
+	int l, n; /* NOTE(review): presumably l = number of instances and n = number of features -- confirm */
+	double *y; /* NOTE(review): presumably one target value per instance -- confirm */
+	struct feature_node **x; /* NOTE(review): presumably one feature_node array per instance -- confirm */
+	double bias;            /* < 0 if no bias term */
+};
+enum { L2R_LR, L2R_L2LOSS_SVC_DUAL, L2R_L2LOSS_SVC, L2R_L1LOSS_SVC_DUAL, MCSVM_CS, L1R_L2LOSS_SVC, L1R_LR, L2R_LR_DUAL, L2R_L2LOSS_SVR = 11, L2R_L2LOSS_SVR_DUAL, L2R_L1LOSS_SVR_DUAL }; /* solver_type: values run 0..7 and then resume at 11, so 8..10 are not assigned here */
+struct parameter /* solver selection plus training options; embedded by value in struct model */
+{
+	int solver_type; /* NOTE(review): presumably one of the solver_type enum values above -- confirm */
+	/* these are for training only */
+	double eps;	        /* stopping criteria */
+	double C;
+	int nr_weight; /* NOTE(review): presumably the length of weight_label and weight -- confirm */
+	int *weight_label;
+	double* weight;
+	double p;
+	double *init_sol;
+};
+struct model /* returned by train() and load_model(); consumed by the predict, save and accessor functions below */
+{
+	struct parameter param;
+	int nr_class;		/* number of classes */
+	int nr_feature;
+	double *w;
+	int *label;		/* label of each class */
+	double bias;
+}; /* Public API follows. Only prototypes are visible in this header; see linear.cpp for the exact semantics. */
+struct model* train(const struct problem *prob, const struct parameter *param);
+void cross_validation(const struct problem *prob, const struct parameter *param, int nr_fold, double *target); /* target is an output array */
+void find_parameters(const struct problem *prob, const struct parameter *param, int nr_fold, double start_C, double start_p, double *best_C, double *best_p, double *best_score); /* best_C, best_p and best_score are outputs */
+double predict_values(const struct model *model_, const struct feature_node *x, double* dec_values); /* dec_values is an output array */
+double predict(const struct model *model_, const struct feature_node *x);
+double predict_probability(const struct model *model_, const struct feature_node *x, double* prob_estimates); /* prob_estimates is an output array */
+int save_model(const char *model_file_name, const struct model *model_);
+struct model *load_model(const char *model_file_name);
+int get_nr_feature(const struct model *model_);
+int get_nr_class(const struct model *model_);
+void get_labels(const struct model *model_, int* label); /* label is an output array */
+double get_decfun_coef(const struct model *model_, int feat_idx, int label_idx);
+double get_decfun_bias(const struct model *model_, int label_idx);
+void free_model_content(struct model *model_ptr);
+void free_and_destroy_model(struct model **model_ptr_ptr); /* takes the address of the caller's model pointer */
+void destroy_param(struct parameter *param);
+const char *check_parameter(const struct problem *prob, const struct parameter *param); /* NOTE(review): presumably NULL when the parameters are acceptable, otherwise an error message -- confirm */
+int check_probability_model(const struct model *model);
+int check_regression_model(const struct model *model);
+void set_print_string_function(void (*print_func) (const char*)); /* NOTE(review): presumably installs print_func as the sink for library output -- confirm */
+#ifdef __cplusplus
+}
+#endif
+#endif /* _LIBLINEAR_H */

data/ext/numo/liblinear/liblinear/tron.cpp ADDED

@@ -0,0 +1,288 @@
+#include <math.h>
+#include <stdio.h>
+#include <string.h>
+#include <stdarg.h>
+#include "tron.h"
+#ifndef min // define the template only when no macro named min is already in effect
+template <class T> static inline T min(T x,T y) { return (x<y)?x:y; } // x when x<y, otherwise y
+#endif
+#ifndef max // same guard for max
+template <class T> static inline T max(T x,T y) { return (x>y)?x:y; } // x when x>y, otherwise y
+#endif
+#ifdef __cplusplus
+extern "C" { // the four routines below are declared with C linkage
+#endif
+extern double dnrm2_(int *, double *, int *); // called below as dnrm2_(&n, x, &inc); BLAS dnrm2 (Euclidean norm)
+extern double ddot_(int *, double *, int *, double *, int *); // called below as ddot_(&n, x, &inc, y, &inc); BLAS ddot (dot product)
+extern int daxpy_(int *, double *, double *, int *, double *, int *); // called below as daxpy_(&n, &a, x, &inc, y, &inc); BLAS daxpy (y += a*x)
+extern int dscal_(int *, double *, double *, int *); // called below as dscal_(&n, &a, x, &inc); BLAS dscal (x *= a)
+#ifdef __cplusplus
+}
+#endif
+/* Default output callback installed by the TRON constructor: writes buf to
+ * stdout and flushes the stream immediately. */
+static void default_print(const char *buf)
+{
+	FILE *out = stdout;
+	fputs(buf, out);
+	fflush(out);
+}
+static double uTMv(int n, double *u, double *M, double *v) /*
+ * Returns the sum over i in [0, n) of u[i]*M[i]*v[i], that is u^T diag(M) v
+ * where M holds only the diagonal entries.
+ *
+ * n       : number of elements read from each array.
+ * u, M, v : input arrays of at least n doubles; none is modified.
+ */
+{
+	const int m = n-4; // i < m guarantees that i+4 is still a valid index
+	double res = 0;
+	int i;
+	for (i=0; i<m; i+=5) // main loop, unrolled by hand: five elements per pass
+		res += u[i]*M[i]*v[i]+u[i+1]*M[i+1]*v[i+1]+u[i+2]*M[i+2]*v[i+2]+
+			u[i+3]*M[i+3]*v[i+3]+u[i+4]*M[i+4]*v[i+4];
+	for (; i<n; i++) // leftover elements that did not fill a group of five
+		res += u[i]*M[i]*v[i];
+	return res;
+}
+/*
+ * Formats a printf-style message and passes the resulting string to the
+ * currently installed tron_print_string callback.
+ *
+ * fmt, ... : printf-style format string followed by its arguments.
+ *
+ * The text is built in a stack buffer of BUFSIZ bytes. vsnprintf is used so
+ * that a message longer than the buffer is truncated rather than written past
+ * the end of buf.
+ */
+void TRON::info(const char *fmt,...)
+{
+	char buf[BUFSIZ];
+	va_list ap;
+	va_start(ap,fmt);
+	vsnprintf(buf,sizeof(buf),fmt,ap);
+	va_end(ap);
+	(*tron_print_string)(buf);
+}
+/*
+ * Stores the objective object and the solver settings, and installs
+ * default_print as the output callback.
+ *
+ * fun_obj  : objective to minimize; kept as a non-const pointer internally.
+ * eps      : tolerance used by tron() in its gradient-norm stopping test.
+ * eps_cg   : tolerance used by trpcg() to set its CG stopping threshold.
+ * max_iter : upper bound on the iteration counter in tron().
+ */
+TRON::TRON(const function *fun_obj, double eps, double eps_cg, int max_iter)
+	: eps(eps),
+	  eps_cg(eps_cg),
+	  max_iter(max_iter),
+	  fun_obj(const_cast<function *>(fun_obj)),
+	  tron_print_string(default_print)
+{
+}
+TRON::~TRON() // empty: nothing is released here, and fun_obj in particular is not deleted
+{
+}
+void TRON::tron(double *w) /*
+ * Iteratively updates w in place to reduce fun_obj->fun(w). Each pass asks
+ * trpcg() for a step s bounded by the trust region size delta, compares the
+ * actual reduction with the predicted one, resizes delta accordingly and
+ * accepts the step only when the reduction is sufficient.
+ *
+ * w : array of fun_obj->get_nr_variable() doubles; read as the starting point
+ *     and overwritten every time a step is accepted.
+ *
+ * The loop ends when the gradient norm drops to eps times the gradient norm
+ * at w = 0, when iter exceeds max_iter (iter only advances on accepted
+ * steps), or when one of the WARNING conditions at the bottom of the loop
+ * triggers.
+ */
+{
+	// Parameters for updating the iterates.
+	double eta0 = 1e-4, eta1 = 0.25, eta2 = 0.75;
+	// Parameters for updating the trust region size delta.
+	double sigma1 = 0.25, sigma2 = 0.5, sigma3 = 4;
+	int n = fun_obj->get_nr_variable();
+	int i, cg_iter;
+	double delta=0, sMnorm, one=1.0;
+	double alpha, f, fnew, prered, actred, gs;
+	int search = 1, iter = 1, inc = 1;
+	double *s = new double[n]; // step returned by trpcg
+	double *r = new double[n]; // residual returned by trpcg
+	double *g = new double[n]; // gradient at the current w
+	const double alpha_pcg = 0.01; // weight of the diagonal preconditioner in the blend below
+	double *M = new double[n];
+	// calculate gradient norm at w=0 for stopping condition.
+	double *w0 = new double[n];
+	for (i=0; i<n; i++)
+		w0[i] = 0;
+	fun_obj->fun(w0); // return value unused; NOTE(review): presumably called so that grad() works on state for w0 -- confirm
+	fun_obj->grad(w0, g);
+	double gnorm0 = dnrm2_(&n, g, &inc);
+	delete [] w0;
+	f = fun_obj->fun(w);
+	fun_obj->grad(w, g);
+	double gnorm = dnrm2_(&n, g, &inc);
+	if (gnorm <= eps*gnorm0) // starting point already meets the stopping test: skip the loop
+		search = 0;
+	fun_obj->get_diag_preconditioner(M);
+	for(i=0; i<n; i++)
+		M[i] = (1-alpha_pcg) + alpha_pcg*M[i]; // blend: 99% identity, 1% of the value supplied by fun_obj
+	delta = sqrt(uTMv(n, g, M, g)); // initial trust region size: M-weighted norm of the gradient
+	double *w_new = new double[n];
+	bool reach_boundary;
+	bool delta_adjusted = false;
+	while (iter <= max_iter && search)
+	{
+		cg_iter = trpcg(delta, g, M, s, r, &reach_boundary);
+		memcpy(w_new, w, sizeof(double)*n);
+		daxpy_(&n, &one, s, &inc, w_new, &inc); // w_new = w + s
+		gs = ddot_(&n, g, &inc, s, &inc);
+		prered = -0.5*(gs-ddot_(&n, s, &inc, r, &inc)); // predicted reduction; trpcg keeps r = -g - H*s, so this is -(g.s + 0.5*s.H*s)
+		fnew = fun_obj->fun(w_new);
+		// Compute the actual reduction.
+		actred = f - fnew;
+		// On the first iteration, adjust the initial step bound.
+		sMnorm = sqrt(uTMv(n, s, M, s));
+		if (iter == 1 && !delta_adjusted) // the flag makes this run once even if iter stays at 1 after a rejected step
+		{
+			delta = min(delta, sMnorm);
+			delta_adjusted = true;
+		}
+		// Compute prediction alpha*sMnorm of the step.
+		if (fnew - f - gs <= 0)
+			alpha = sigma3;
+		else
+			alpha = max(sigma1, -0.5*(gs/(fnew - f - gs)));
+		// Update the trust region bound according to the ratio of actual to predicted reduction.
+		if (actred < eta0*prered)
+			delta = min(alpha*sMnorm, sigma2*delta);
+		else if (actred < eta1*prered)
+			delta = max(sigma1*delta, min(alpha*sMnorm, sigma2*delta));
+		else if (actred < eta2*prered)
+			delta = max(sigma1*delta, min(alpha*sMnorm, sigma3*delta));
+		else
+		{
+			if (reach_boundary)
+				delta = sigma3*delta;
+			else
+				delta = max(delta, min(alpha*sMnorm, sigma3*delta));
+		}
+		info("iter %2d act %5.3e pre %5.3e delta %5.3e f %5.3e |g| %5.3e CG %3d\n", iter, actred, prered, delta, f, gnorm, cg_iter); // f and gnorm still describe w before this step
+		if (actred > eta0*prered) // sufficient reduction: accept the step
+		{
+			iter++;
+			memcpy(w, w_new, sizeof(double)*n);
+			f = fnew;
+			fun_obj->grad(w, g);
+			fun_obj->get_diag_preconditioner(M);
+			for(i=0; i<n; i++)
+				M[i] = (1-alpha_pcg) + alpha_pcg*M[i]; // same blend as before the loop
+			gnorm = dnrm2_(&n, g, &inc);
+			if (gnorm <= eps*gnorm0) // converged
+				break;
+		}
+		if (f < -1.0e+32)
+		{
+			info("WARNING: f < -1.0e+32\n");
+			break;
+		}
+		if (prered <= 0)
+		{
+			info("WARNING: prered <= 0\n");
+			break;
+		}
+		if (fabs(actred) <= 1.0e-12*fabs(f) &&
+		    fabs(prered) <= 1.0e-12*fabs(f))
+		{
+			info("WARNING: actred and prered too small\n");
+			break;
+		}
+	}
+	delete[] g;
+	delete[] r;
+	delete[] w_new;
+	delete[] s;
+	delete[] M;
+}
+int TRON::trpcg(double delta, double *g, double *M, double *s, double *r, bool *reach_boundary) /*
+ * Preconditioned conjugate gradient loop that builds a step s, using
+ * fun_obj->Hv for the matrix-vector products and M as a diagonal
+ * preconditioner. The step is cut so that sqrt(s^T diag(M) s) does not
+ * exceed delta.
+ *
+ * delta          : trust region size.
+ * g              : gradient; only read here.
+ * M              : diagonal preconditioner entries; only read here.
+ * s              : output, the step; set to zero on entry.
+ * r              : output, the residual; starts as -g and is updated
+ *                  alongside every change to s.
+ * reach_boundary : output, true when the step was cut at the boundary.
+ *
+ * Returns the number of CG iterations performed.
+ */
+{
+	int i, inc = 1;
+	int n = fun_obj->get_nr_variable();
+	double one = 1;
+	double *d = new double[n]; // search direction
+	double *Hd = new double[n]; // result of fun_obj->Hv(d, Hd)
+	double zTr, znewTrnew, alpha, beta, cgtol;
+	double *z = new double[n]; // preconditioned residual, r[i] / M[i]
+	*reach_boundary = false;
+	for (i=0; i<n; i++)
+	{
+		s[i] = 0;
+		r[i] = -g[i];
+		z[i] = r[i] / M[i];
+		d[i] = z[i];
+	}
+	zTr = ddot_(&n, z, &inc, r, &inc);
+	cgtol = eps_cg*sqrt(zTr); // stopping threshold, relative to the initial sqrt(z.r)
+	int cg_iter = 0;
+	int max_cg_iter = max(n, 5);
+	while (cg_iter < max_cg_iter)
+	{
+		if (sqrt(zTr) <= cgtol)
+			break;
+		cg_iter++;
+		fun_obj->Hv(d, Hd);
+		alpha = zTr/ddot_(&n, d, &inc, Hd, &inc);
+		daxpy_(&n, &alpha, d, &inc, s, &inc); // s += alpha*d
+		double sMnorm = sqrt(uTMv(n, s, M, s));
+		if (sMnorm > delta)
+		{
+			info("cg reaches trust region boundary\n");
+			*reach_boundary = true;
+			alpha = -alpha;
+			daxpy_(&n, &alpha, d, &inc, s, &inc); // undo the update of s that crossed the boundary
+			double sTMd = uTMv(n, s, M, d);
+			double sTMs = uTMv(n, s, M, s);
+			double dTMd = uTMv(n, d, M, d);
+			double dsq = delta*delta;
+			double rad = sqrt(sTMd*sTMd + dTMd*(dsq-sTMs));
+			if (sTMd >= 0) // both branches give the positive root of dTMd*a^2 + 2*sTMd*a + sTMs - dsq = 0
+				alpha = (dsq - sTMs)/(sTMd + rad);
+			else
+				alpha = (rad - sTMd)/dTMd;
+			daxpy_(&n, &alpha, d, &inc, s, &inc); // s += alpha*d, which places s on the boundary
+			alpha = -alpha;
+			daxpy_(&n, &alpha, Hd, &inc, r, &inc); // r -= alpha*Hd, keeping r consistent with the new s
+			break;
+		}
+		alpha = -alpha;
+		daxpy_(&n, &alpha, Hd, &inc, r, &inc); // r -= alpha*Hd
+		for (i=0; i<n; i++)
+			z[i] = r[i] / M[i];
+		znewTrnew = ddot_(&n, z, &inc, r, &inc);
+		beta = znewTrnew/zTr;
+		dscal_(&n, &beta, d, &inc);
+		daxpy_(&n, &one, z, &inc, d, &inc); // together with the dscal_ above: d = z + beta*d
+		zTr = znewTrnew;
+	}
+	if (cg_iter == max_cg_iter) // also true when the boundary break happened on the last allowed iteration
+		info("WARNING: reaching maximal number of CG steps\n");
+	delete[] d;
+	delete[] Hd;
+	delete[] z;
+	return(cg_iter);
+}
+/*
+ * Returns the largest absolute value among x[0] .. x[n-1].
+ *
+ * n : number of elements in x.
+ * x : input array; not modified.
+ *
+ * Returns 0 when n <= 0, so x is never read for an empty range.
+ */
+double TRON::norm_inf(int n, double *x)
+{
+	if (n <= 0)
+		return 0;
+	double dmax = fabs(x[0]);
+	for (int i=1; i<n; i++)
+		if (fabs(x[i]) >= dmax)
+			dmax = fabs(x[i]);
+	return(dmax);
+}
+/* Replaces the callback that info() uses to emit its formatted messages. */
+void TRON::set_print_string(void (*print_string) (const char *buf))
+{
+	this->tron_print_string = print_string;
+}

data/ext/numo/liblinear/liblinear/tron.h ADDED

@@ -0,0 +1,36 @@
+#ifndef _TRON_H
+#define _TRON_H
+class function // abstract interface through which TRON evaluates the problem it minimizes
+{
+public:
+	virtual double fun(double *w) = 0 ; // objective value for w
+	virtual void grad(double *w, double *g) = 0 ; // writes the gradient into g
+	virtual void Hv(double *s, double *Hs) = 0 ; // writes the product H*s into Hs; NOTE(review): H is presumably the Hessian at the current point -- confirm
+	virtual int get_nr_variable(void) = 0 ; // number of variables; TRON sizes its work arrays with this value
+	virtual void get_diag_preconditioner(double *M) = 0 ; // fills M with one preconditioner entry per variable
+	virtual ~function(void){}
+};
+class TRON // minimizer driven through the `function` interface; the caller supplies fun_obj
+{
+public:
+	TRON(const function *fun_obj, double eps = 0.1, double eps_cg = 0.1, int max_iter = 1000); // the defaults apply when the caller omits the trailing arguments
+	~TRON();
+	void tron(double *w); // runs the minimization; w is both the starting point and the result
+	void set_print_string(void (*i_print) (const char *buf)); // installs the callback that receives log text
+private:
+	int trpcg(double delta, double *g, double *M, double *s, double *r, bool *reach_boundary); // inner solver that computes the step s
+	double norm_inf(int n, double *x); // largest absolute value in x
+	double eps; // tolerance for the gradient-norm stopping test
+	double eps_cg; // tolerance for the inner solver
+	int max_iter; // bound on the iteration counter in tron()
+	function *fun_obj; // objective being minimized
+	void info(const char *fmt,...); // printf-style logging routed through tron_print_string
+	void (*tron_print_string)(const char *buf); // current log callback
+};
+#endif

data/ext/numo/liblinear/liblinearext.c CHANGED

@@ -545,6 +545,9 @@ void Init_liblinearext()
    */
   mLiblinear = rb_define_module_under(mNumo, "Liblinear");
+  /* The version of LIBLINEAR used in background library. */
+  rb_define_const(mLiblinear, "LIBLINEAR_VERSION", INT2NUM(LIBLINEAR_VERSION));
   rb_define_module_function(mLiblinear, "train", numo_liblinear_train, 3);
   rb_define_module_function(mLiblinear, "cv", numo_liblinear_cross_validation, 4);
   rb_define_module_function(mLiblinear, "predict", numo_liblinear_predict, 3);

data/lib/numo/liblinear/version.rb CHANGED

@@ -3,6 +3,6 @@
 module Numo
   module Liblinear
     # The version of Numo::Liblinear you are using.
-    VERSION = '0.5.0'
+    VERSION = '1.0.0'
   end
 end

data/numo-liblinear.gemspec CHANGED

@@ -27,6 +27,13 @@ Gem::Specification.new do |spec|
   spec.files         = Dir.chdir(File.expand_path(__dir__)) do
     `git ls-files -z`.split("\x0").reject { |f| f.match(%r{^(test|spec|features)/}) }
   end
+  gem_dir = File.expand_path(__dir__) + '/'
+  submodule_path = `git submodule --quiet foreach pwd`.split($OUTPUT_RECORD_SEPARATOR).first
+  submodule_relative_path = submodule_path.sub gem_dir, ''
+  liblinear_files = %w[linear.cpp linear.h tron.cpp tron.h blas/blas.h blas/blasp.h blas/daxpy.c blas/ddot.c blas/dnrm2.c blas/dscal.c]
+  liblinear_files.each { |liblinf| spec.files << "#{submodule_relative_path}/#{liblinf}" }
   spec.bindir        = 'exe'
   spec.executables   = spec.files.grep(%r{^exe/}) { |f| File.basename(f) }
   spec.require_paths = ['lib']
@@ -39,6 +46,7 @@ Gem::Specification.new do |spec|
   }
   spec.add_runtime_dependency 'numo-narray', '~> 0.9.1'
   spec.add_development_dependency 'bundler', '~> 2.0'
   spec.add_development_dependency 'rake', '~> 10.0'
   spec.add_development_dependency 'rake-compiler', '~> 1.0'