alglib 0.1.1
- data/History.txt +7 -0
- data/Manifest.txt +253 -0
- data/README.txt +33 -0
- data/Rakefile +27 -0
- data/ext/Rakefile +24 -0
- data/ext/alglib.i +24 -0
- data/ext/alglib/Makefile +157 -0
- data/ext/alglib/airyf.cpp +372 -0
- data/ext/alglib/airyf.h +81 -0
- data/ext/alglib/alglib.cpp +8558 -0
- data/ext/alglib/alglib_util.cpp +19 -0
- data/ext/alglib/alglib_util.h +14 -0
- data/ext/alglib/ap.cpp +877 -0
- data/ext/alglib/ap.english.html +364 -0
- data/ext/alglib/ap.h +666 -0
- data/ext/alglib/ap.russian.html +442 -0
- data/ext/alglib/apvt.h +754 -0
- data/ext/alglib/bdss.cpp +1500 -0
- data/ext/alglib/bdss.h +251 -0
- data/ext/alglib/bdsvd.cpp +1339 -0
- data/ext/alglib/bdsvd.h +164 -0
- data/ext/alglib/bessel.cpp +1226 -0
- data/ext/alglib/bessel.h +331 -0
- data/ext/alglib/betaf.cpp +105 -0
- data/ext/alglib/betaf.h +74 -0
- data/ext/alglib/bidiagonal.cpp +1328 -0
- data/ext/alglib/bidiagonal.h +350 -0
- data/ext/alglib/binomialdistr.cpp +247 -0
- data/ext/alglib/binomialdistr.h +153 -0
- data/ext/alglib/blas.cpp +576 -0
- data/ext/alglib/blas.h +132 -0
- data/ext/alglib/cblas.cpp +226 -0
- data/ext/alglib/cblas.h +57 -0
- data/ext/alglib/cdet.cpp +138 -0
- data/ext/alglib/cdet.h +92 -0
- data/ext/alglib/chebyshev.cpp +216 -0
- data/ext/alglib/chebyshev.h +76 -0
- data/ext/alglib/chisquaredistr.cpp +157 -0
- data/ext/alglib/chisquaredistr.h +144 -0
- data/ext/alglib/cholesky.cpp +285 -0
- data/ext/alglib/cholesky.h +86 -0
- data/ext/alglib/cinverse.cpp +298 -0
- data/ext/alglib/cinverse.h +111 -0
- data/ext/alglib/clu.cpp +337 -0
- data/ext/alglib/clu.h +120 -0
- data/ext/alglib/correlation.cpp +280 -0
- data/ext/alglib/correlation.h +77 -0
- data/ext/alglib/correlationtests.cpp +726 -0
- data/ext/alglib/correlationtests.h +134 -0
- data/ext/alglib/crcond.cpp +826 -0
- data/ext/alglib/crcond.h +148 -0
- data/ext/alglib/creflections.cpp +310 -0
- data/ext/alglib/creflections.h +165 -0
- data/ext/alglib/csolve.cpp +312 -0
- data/ext/alglib/csolve.h +99 -0
- data/ext/alglib/ctrinverse.cpp +387 -0
- data/ext/alglib/ctrinverse.h +98 -0
- data/ext/alglib/ctrlinsolve.cpp +297 -0
- data/ext/alglib/ctrlinsolve.h +81 -0
- data/ext/alglib/dawson.cpp +234 -0
- data/ext/alglib/dawson.h +74 -0
- data/ext/alglib/descriptivestatistics.cpp +436 -0
- data/ext/alglib/descriptivestatistics.h +112 -0
- data/ext/alglib/det.cpp +140 -0
- data/ext/alglib/det.h +94 -0
- data/ext/alglib/dforest.cpp +1819 -0
- data/ext/alglib/dforest.h +316 -0
- data/ext/alglib/elliptic.cpp +497 -0
- data/ext/alglib/elliptic.h +217 -0
- data/ext/alglib/estnorm.cpp +429 -0
- data/ext/alglib/estnorm.h +107 -0
- data/ext/alglib/expintegrals.cpp +422 -0
- data/ext/alglib/expintegrals.h +108 -0
- data/ext/alglib/faq.english.html +258 -0
- data/ext/alglib/faq.russian.html +272 -0
- data/ext/alglib/fdistr.cpp +202 -0
- data/ext/alglib/fdistr.h +163 -0
- data/ext/alglib/fresnel.cpp +211 -0
- data/ext/alglib/fresnel.h +91 -0
- data/ext/alglib/gammaf.cpp +338 -0
- data/ext/alglib/gammaf.h +104 -0
- data/ext/alglib/gqgengauss.cpp +235 -0
- data/ext/alglib/gqgengauss.h +92 -0
- data/ext/alglib/gqgenhermite.cpp +268 -0
- data/ext/alglib/gqgenhermite.h +63 -0
- data/ext/alglib/gqgenjacobi.cpp +297 -0
- data/ext/alglib/gqgenjacobi.h +72 -0
- data/ext/alglib/gqgenlaguerre.cpp +265 -0
- data/ext/alglib/gqgenlaguerre.h +69 -0
- data/ext/alglib/gqgenlegendre.cpp +300 -0
- data/ext/alglib/gqgenlegendre.h +62 -0
- data/ext/alglib/gqgenlobatto.cpp +305 -0
- data/ext/alglib/gqgenlobatto.h +97 -0
- data/ext/alglib/gqgenradau.cpp +232 -0
- data/ext/alglib/gqgenradau.h +95 -0
- data/ext/alglib/hbisinv.cpp +480 -0
- data/ext/alglib/hbisinv.h +183 -0
- data/ext/alglib/hblas.cpp +228 -0
- data/ext/alglib/hblas.h +64 -0
- data/ext/alglib/hcholesky.cpp +339 -0
- data/ext/alglib/hcholesky.h +91 -0
- data/ext/alglib/hermite.cpp +114 -0
- data/ext/alglib/hermite.h +49 -0
- data/ext/alglib/hessenberg.cpp +370 -0
- data/ext/alglib/hessenberg.h +152 -0
- data/ext/alglib/hevd.cpp +247 -0
- data/ext/alglib/hevd.h +107 -0
- data/ext/alglib/hsschur.cpp +1316 -0
- data/ext/alglib/hsschur.h +108 -0
- data/ext/alglib/htridiagonal.cpp +734 -0
- data/ext/alglib/htridiagonal.h +180 -0
- data/ext/alglib/ialglib.cpp +6 -0
- data/ext/alglib/ialglib.h +9 -0
- data/ext/alglib/ibetaf.cpp +960 -0
- data/ext/alglib/ibetaf.h +125 -0
- data/ext/alglib/igammaf.cpp +430 -0
- data/ext/alglib/igammaf.h +157 -0
- data/ext/alglib/inv.cpp +274 -0
- data/ext/alglib/inv.h +115 -0
- data/ext/alglib/inverseupdate.cpp +480 -0
- data/ext/alglib/inverseupdate.h +185 -0
- data/ext/alglib/jacobianelliptic.cpp +164 -0
- data/ext/alglib/jacobianelliptic.h +94 -0
- data/ext/alglib/jarquebera.cpp +2271 -0
- data/ext/alglib/jarquebera.h +80 -0
- data/ext/alglib/kmeans.cpp +356 -0
- data/ext/alglib/kmeans.h +76 -0
- data/ext/alglib/laguerre.cpp +94 -0
- data/ext/alglib/laguerre.h +48 -0
- data/ext/alglib/lbfgs.cpp +1167 -0
- data/ext/alglib/lbfgs.h +218 -0
- data/ext/alglib/lda.cpp +434 -0
- data/ext/alglib/lda.h +133 -0
- data/ext/alglib/ldlt.cpp +1130 -0
- data/ext/alglib/ldlt.h +124 -0
- data/ext/alglib/leastsquares.cpp +1252 -0
- data/ext/alglib/leastsquares.h +290 -0
- data/ext/alglib/legendre.cpp +107 -0
- data/ext/alglib/legendre.h +49 -0
- data/ext/alglib/linreg.cpp +1185 -0
- data/ext/alglib/linreg.h +380 -0
- data/ext/alglib/logit.cpp +1523 -0
- data/ext/alglib/logit.h +333 -0
- data/ext/alglib/lq.cpp +399 -0
- data/ext/alglib/lq.h +160 -0
- data/ext/alglib/lu.cpp +462 -0
- data/ext/alglib/lu.h +119 -0
- data/ext/alglib/mannwhitneyu.cpp +4490 -0
- data/ext/alglib/mannwhitneyu.h +115 -0
- data/ext/alglib/minlm.cpp +918 -0
- data/ext/alglib/minlm.h +312 -0
- data/ext/alglib/mlpbase.cpp +3375 -0
- data/ext/alglib/mlpbase.h +589 -0
- data/ext/alglib/mlpe.cpp +1369 -0
- data/ext/alglib/mlpe.h +552 -0
- data/ext/alglib/mlptrain.cpp +1056 -0
- data/ext/alglib/mlptrain.h +283 -0
- data/ext/alglib/nearunityunit.cpp +91 -0
- data/ext/alglib/nearunityunit.h +17 -0
- data/ext/alglib/normaldistr.cpp +377 -0
- data/ext/alglib/normaldistr.h +175 -0
- data/ext/alglib/nsevd.cpp +1869 -0
- data/ext/alglib/nsevd.h +140 -0
- data/ext/alglib/pca.cpp +168 -0
- data/ext/alglib/pca.h +87 -0
- data/ext/alglib/poissondistr.cpp +143 -0
- data/ext/alglib/poissondistr.h +130 -0
- data/ext/alglib/polinterpolation.cpp +685 -0
- data/ext/alglib/polinterpolation.h +206 -0
- data/ext/alglib/psif.cpp +173 -0
- data/ext/alglib/psif.h +88 -0
- data/ext/alglib/qr.cpp +414 -0
- data/ext/alglib/qr.h +168 -0
- data/ext/alglib/ratinterpolation.cpp +134 -0
- data/ext/alglib/ratinterpolation.h +72 -0
- data/ext/alglib/rcond.cpp +705 -0
- data/ext/alglib/rcond.h +140 -0
- data/ext/alglib/reflections.cpp +504 -0
- data/ext/alglib/reflections.h +165 -0
- data/ext/alglib/rotations.cpp +473 -0
- data/ext/alglib/rotations.h +128 -0
- data/ext/alglib/rsolve.cpp +221 -0
- data/ext/alglib/rsolve.h +99 -0
- data/ext/alglib/sbisinv.cpp +217 -0
- data/ext/alglib/sbisinv.h +171 -0
- data/ext/alglib/sblas.cpp +185 -0
- data/ext/alglib/sblas.h +64 -0
- data/ext/alglib/schur.cpp +156 -0
- data/ext/alglib/schur.h +102 -0
- data/ext/alglib/sdet.cpp +193 -0
- data/ext/alglib/sdet.h +101 -0
- data/ext/alglib/sevd.cpp +116 -0
- data/ext/alglib/sevd.h +99 -0
- data/ext/alglib/sinverse.cpp +672 -0
- data/ext/alglib/sinverse.h +138 -0
- data/ext/alglib/spddet.cpp +138 -0
- data/ext/alglib/spddet.h +96 -0
- data/ext/alglib/spdgevd.cpp +842 -0
- data/ext/alglib/spdgevd.h +200 -0
- data/ext/alglib/spdinverse.cpp +509 -0
- data/ext/alglib/spdinverse.h +122 -0
- data/ext/alglib/spdrcond.cpp +421 -0
- data/ext/alglib/spdrcond.h +118 -0
- data/ext/alglib/spdsolve.cpp +275 -0
- data/ext/alglib/spdsolve.h +105 -0
- data/ext/alglib/spline2d.cpp +1192 -0
- data/ext/alglib/spline2d.h +301 -0
- data/ext/alglib/spline3.cpp +1264 -0
- data/ext/alglib/spline3.h +290 -0
- data/ext/alglib/srcond.cpp +595 -0
- data/ext/alglib/srcond.h +127 -0
- data/ext/alglib/ssolve.cpp +895 -0
- data/ext/alglib/ssolve.h +139 -0
- data/ext/alglib/stdafx.h +0 -0
- data/ext/alglib/stest.cpp +131 -0
- data/ext/alglib/stest.h +94 -0
- data/ext/alglib/studenttdistr.cpp +222 -0
- data/ext/alglib/studenttdistr.h +115 -0
- data/ext/alglib/studentttests.cpp +377 -0
- data/ext/alglib/studentttests.h +178 -0
- data/ext/alglib/svd.cpp +620 -0
- data/ext/alglib/svd.h +126 -0
- data/ext/alglib/tdbisinv.cpp +2608 -0
- data/ext/alglib/tdbisinv.h +228 -0
- data/ext/alglib/tdevd.cpp +1229 -0
- data/ext/alglib/tdevd.h +115 -0
- data/ext/alglib/tridiagonal.cpp +594 -0
- data/ext/alglib/tridiagonal.h +171 -0
- data/ext/alglib/trigintegrals.cpp +490 -0
- data/ext/alglib/trigintegrals.h +131 -0
- data/ext/alglib/trinverse.cpp +345 -0
- data/ext/alglib/trinverse.h +98 -0
- data/ext/alglib/trlinsolve.cpp +926 -0
- data/ext/alglib/trlinsolve.h +73 -0
- data/ext/alglib/tsort.cpp +405 -0
- data/ext/alglib/tsort.h +54 -0
- data/ext/alglib/variancetests.cpp +245 -0
- data/ext/alglib/variancetests.h +134 -0
- data/ext/alglib/wsr.cpp +6285 -0
- data/ext/alglib/wsr.h +96 -0
- data/ext/ap.i +97 -0
- data/ext/correlation.i +24 -0
- data/ext/extconf.rb +6 -0
- data/ext/logit.i +89 -0
- data/lib/alglib.rb +71 -0
- data/lib/alglib/correlation.rb +26 -0
- data/lib/alglib/linearregression.rb +63 -0
- data/lib/alglib/logit.rb +42 -0
- data/test/test_alglib.rb +52 -0
- data/test/test_correlation.rb +44 -0
- data/test/test_correlationtest.rb +45 -0
- data/test/test_linreg.rb +35 -0
- data/test/test_logit.rb +43 -0
- data/test/test_pca.rb +27 -0
- metadata +326 -0
data/ext/alglib/mlptrain.cpp
@@ -0,0 +1,1056 @@
/*************************************************************************
Copyright (c) 2007-2008, Sergey Bochkanov (ALGLIB project).

Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are
met:

- Redistributions of source code must retain the above copyright
  notice, this list of conditions and the following disclaimer.

- Redistributions in binary form must reproduce the above copyright
  notice, this list of conditions and the following disclaimer listed
  in this license in the documentation and/or other materials
  provided with the distribution.

- Neither the name of the copyright holders nor the names of its
  contributors may be used to endorse or promote products derived from
  this software without specific prior written permission.

THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*************************************************************************/

#include <stdafx.h>
#include "mlptrain.h"

static const double mindecay = 0.001;

static void mlpkfoldcvgeneral(const multilayerperceptron& n,
     const ap::real_2d_array& xy,
     int npoints,
     double decay,
     int restarts,
     int foldscount,
     bool lmalgorithm,
     double wstep,
     int maxits,
     int& info,
     mlpreport& rep,
     mlpcvreport& cvrep);
static void mlpkfoldsplit(const ap::real_2d_array& xy,
     int npoints,
     int nclasses,
     int foldscount,
     bool stratifiedsplits,
     ap::integer_1d_array& folds);

/*************************************************************************
Neural network training using modified Levenberg-Marquardt with exact
Hessian calculation and regularization. Subroutine trains neural network
with restarts from random positions. Algorithm is well suited for small
and medium scale problems (hundreds of weights).

INPUT PARAMETERS:
    Network     -   neural network with initialized geometry
    XY          -   training set
    NPoints     -   training set size
    Decay       -   weight decay constant, >=0.001.
                    Decay term 'Decay*||Weights||^2' is added to error
                    function.
                    If you don't know what Decay to choose, use 0.001.
    Restarts    -   number of restarts from random position, >0.
                    If you don't know what Restarts to choose, use 2.

OUTPUT PARAMETERS:
    Network     -   trained neural network.
    Info        -   return code:
                    * -9, if internal matrix inverse subroutine failed
                    * -2, if there is a point with class number
                          outside of [0..NOut-1].
                    * -1, if wrong parameters specified
                          (NPoints<0, Restarts<1).
                    *  2, if task has been solved.
    Rep         -   training report

  -- ALGLIB --
     Copyright 10.03.2009 by Bochkanov Sergey
*************************************************************************/
void mlptrainlm(multilayerperceptron& network,
     const ap::real_2d_array& xy,
     int npoints,
     double decay,
     int restarts,
     int& info,
     mlpreport& rep)
{
    int nin;
    int nout;
    int wcount;
    double lmftol;
    double lmsteptol;
    int i;
    int j;
    int k;
    int mx;
    double v;
    double e;
    double enew;
    double xnorm2;
    double stepnorm;
    ap::real_1d_array g;
    ap::real_1d_array d;
    ap::real_2d_array h;
    ap::real_2d_array hmod;
    ap::real_2d_array z;
    bool spd;
    double nu;
    double lambda;
    double lambdaup;
    double lambdadown;
    int cvcnt;
    double cvrelcnt;
    lbfgsreport internalrep;
    lbfgsstate state;
    ap::real_1d_array x;
    ap::real_1d_array y;
    ap::real_1d_array wbase;
    double wstep;
    ap::real_1d_array wdir;
    ap::real_1d_array wt;
    ap::real_1d_array wx;
    int pass;
    ap::real_1d_array wbest;
    double ebest;

    mlpproperties(network, nin, nout, wcount);
    lambdaup = 10;
    lambdadown = 0.3;
    lmftol = 0.001;
    lmsteptol = 0.001;

    //
    // Test for inputs
    //
    if( npoints<=0||restarts<1 )
    {
        info = -1;
        return;
    }
    if( mlpissoftmax(network) )
    {
        for(i = 0; i <= npoints-1; i++)
        {
            if( ap::round(xy(i,nin))<0||ap::round(xy(i,nin))>=nout )
            {
                info = -2;
                return;
            }
        }
    }
    decay = ap::maxreal(decay, mindecay);
    info = 2;

    //
    // Initialize data
    //
    rep.ngrad = 0;
    rep.nhess = 0;
    rep.ncholesky = 0;

    //
    // General case.
    // Prepare task and network. Allocate space.
    //
    mlpinitpreprocessor(network, xy, npoints);
    g.setbounds(0, wcount-1);
    h.setbounds(0, wcount-1, 0, wcount-1);
    hmod.setbounds(0, wcount-1, 0, wcount-1);
    wbase.setbounds(0, wcount-1);
    wdir.setbounds(0, wcount-1);
    wbest.setbounds(0, wcount-1);
    wt.setbounds(0, wcount-1);
    wx.setbounds(0, wcount-1);
    ebest = ap::maxrealnumber;

    //
    // Multiple passes
    //
    for(pass = 1; pass <= restarts; pass++)
    {

        //
        // Initialize weights
        //
        mlprandomize(network);

        //
        // First stage of the hybrid algorithm: LBFGS
        //
        ap::vmove(&wbase(0), &network.weights(0), ap::vlen(0,wcount-1));
        minlbfgs(wcount, ap::minint(wcount, 5), wbase, 0.0, 0.0, 0.0, ap::maxint(25, wcount), 0, state);
        while(minlbfgsiteration(state))
        {

            //
            // gradient
            //
            ap::vmove(&network.weights(0), &state.x(0), ap::vlen(0,wcount-1));
            mlpgradbatch(network, xy, npoints, state.f, state.g);

            //
            // weight decay
            //
            v = ap::vdotproduct(&network.weights(0), &network.weights(0), ap::vlen(0,wcount-1));
            state.f = state.f+0.5*decay*v;
            ap::vadd(&state.g(0), &network.weights(0), ap::vlen(0,wcount-1), decay);

            //
            // next iteration
            //
            rep.ngrad = rep.ngrad+1;
        }
        minlbfgsresults(state, wbase, internalrep);
        ap::vmove(&network.weights(0), &wbase(0), ap::vlen(0,wcount-1));

        //
        // Second stage of the hybrid algorithm: LM
        //
        // Initialize H with identity matrix,
        // G with gradient,
        // E with regularized error.
        //
        mlphessianbatch(network, xy, npoints, e, g, h);
        v = ap::vdotproduct(&network.weights(0), &network.weights(0), ap::vlen(0,wcount-1));
        e = e+0.5*decay*v;
        ap::vadd(&g(0), &network.weights(0), ap::vlen(0,wcount-1), decay);
        for(k = 0; k <= wcount-1; k++)
        {
            h(k,k) = h(k,k)+decay;
        }
        rep.nhess = rep.nhess+1;
        lambda = 0.001;
        nu = 2;
        while(true)
        {

            //
            // 1. HMod = H+lambda*I
            // 2. Try to solve (H+Lambda*I)*dx = -g.
            //    Increase lambda if left part is not positive definite.
            //
            for(i = 0; i <= wcount-1; i++)
            {
                ap::vmove(&hmod(i, 0), &h(i, 0), ap::vlen(0,wcount-1));
                hmod(i,i) = hmod(i,i)+lambda;
            }
            spd = spdmatrixcholesky(hmod, wcount, true);
            rep.ncholesky = rep.ncholesky+1;
            if( !spd )
            {
                lambda = lambda*lambdaup*nu;
                nu = nu*2;
                continue;
            }
            if( !spdmatrixcholeskysolve(hmod, g, wcount, true, wdir) )
            {
                lambda = lambda*lambdaup*nu;
                nu = nu*2;
                continue;
            }
            ap::vmul(&wdir(0), ap::vlen(0,wcount-1), -1);

            //
            // Lambda found.
            // 1. Save old w in WBase
            // 2. Test some stopping criteria
            // 3. If error(w+wdir)>error(w), increase lambda
            //
            ap::vadd(&network.weights(0), &wdir(0), ap::vlen(0,wcount-1));
            xnorm2 = ap::vdotproduct(&network.weights(0), &network.weights(0), ap::vlen(0,wcount-1));
            stepnorm = ap::vdotproduct(&wdir(0), &wdir(0), ap::vlen(0,wcount-1));
            stepnorm = sqrt(stepnorm);
            enew = mlperror(network, xy, npoints)+0.5*decay*xnorm2;
            if( stepnorm<lmsteptol*(1+sqrt(xnorm2)) )
            {
                break;
            }
            if( enew>e )
            {
                lambda = lambda*lambdaup*nu;
                nu = nu*2;
                continue;
            }

            //
            // Optimize using inv(cholesky(H)) as preconditioner
            //
            if( !rmatrixtrinverse(hmod, wcount, true, false) )
            {

                //
                // if matrix can't be inverted then exit with errors
                // TODO: make WCount steps in direction suggested by HMod
                //
                info = -9;
                return;
            }
            ap::vmove(&wbase(0), &network.weights(0), ap::vlen(0,wcount-1));
            for(i = 0; i <= wcount-1; i++)
            {
                wt(i) = 0;
            }
            minlbfgs(wcount, wcount, wt, 0.0, 0.0, 0.0, 5, 0, state);
            while(minlbfgsiteration(state))
            {

                //
                // gradient
                //
                for(i = 0; i <= wcount-1; i++)
                {
                    v = ap::vdotproduct(&state.x(i), &hmod(i, i), ap::vlen(i,wcount-1));
                    network.weights(i) = wbase(i)+v;
                }
                mlpgradbatch(network, xy, npoints, state.f, g);
                for(i = 0; i <= wcount-1; i++)
                {
                    state.g(i) = 0;
                }
                for(i = 0; i <= wcount-1; i++)
                {
                    v = g(i);
                    ap::vadd(&state.g(i), &hmod(i, i), ap::vlen(i,wcount-1), v);
                }

                //
                // weight decay
                // grad(x'*x) = A'*(x0+A*t)
                //
                v = ap::vdotproduct(&network.weights(0), &network.weights(0), ap::vlen(0,wcount-1));
                state.f = state.f+0.5*decay*v;
                for(i = 0; i <= wcount-1; i++)
                {
                    v = decay*network.weights(i);
                    ap::vadd(&state.g(i), &hmod(i, i), ap::vlen(i,wcount-1), v);
                }

                //
                // next iteration
                //
                rep.ngrad = rep.ngrad+1;
            }
            minlbfgsresults(state, wt, internalrep);

            //
            // Accept new position.
            // Calculate Hessian
            //
            for(i = 0; i <= wcount-1; i++)
            {
                v = ap::vdotproduct(&wt(i), &hmod(i, i), ap::vlen(i,wcount-1));
                network.weights(i) = wbase(i)+v;
            }
            mlphessianbatch(network, xy, npoints, e, g, h);
            v = ap::vdotproduct(&network.weights(0), &network.weights(0), ap::vlen(0,wcount-1));
            e = e+0.5*decay*v;
            ap::vadd(&g(0), &network.weights(0), ap::vlen(0,wcount-1), decay);
            for(k = 0; k <= wcount-1; k++)
            {
                h(k,k) = h(k,k)+decay;
            }
            rep.nhess = rep.nhess+1;

            //
            // Update lambda
            //
            lambda = lambda*lambdadown;
            nu = 2;
        }

        //
        // update WBest
        //
        v = ap::vdotproduct(&network.weights(0), &network.weights(0), ap::vlen(0,wcount-1));
        e = 0.5*decay*v+mlperror(network, xy, npoints);
        if( e<ebest )
        {
            ebest = e;
            ap::vmove(&wbest(0), &network.weights(0), ap::vlen(0,wcount-1));
        }
    }

    //
    // copy WBest to output
    //
    ap::vmove(&network.weights(0), &wbest(0), ap::vlen(0,wcount-1));
}

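/*************************************************************************
Editorial note - an illustrative usage sketch, not part of the original
ALGLIB source. It assumes mlpcreate1() from mlpbase.h builds a network
with one hidden layer and linear outputs; treat that name and signature
as an assumption if your ALGLIB version differs.

    // Fit y = 2*x with a tiny 1-3-1 network using the LM trainer.
    ap::real_2d_array xy;
    xy.setbounds(0, 9, 0, 1);         // 10 rows, NIn+NOut = 2 columns
    for(int i = 0; i <= 9; i++)
    {
        xy(i,0) = i;                  // input
        xy(i,1) = 2*i;                // target
    }
    multilayerperceptron net;
    mlpcreate1(1, 3, 1, net);         // 1 input, 3 hidden, 1 output
    int info;
    mlpreport rep;
    mlptrainlm(net, xy, 10, 0.001, 2, info, rep);
    // info==2 on success; rep.ngrad, rep.nhess and rep.ncholesky report
    // how much work the hybrid LBFGS+LM procedure performed.
*************************************************************************/
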
/*************************************************************************
Neural network training using L-BFGS algorithm with regularization.
Subroutine trains neural network with restarts from random positions.
Algorithm is well suited for problems of any dimensionality (memory
requirements and step complexity are linear in the number of weights).

INPUT PARAMETERS:
    Network     -   neural network with initialized geometry
    XY          -   training set
    NPoints     -   training set size
    Decay       -   weight decay constant, >=0.001.
                    Decay term 'Decay*||Weights||^2' is added to error
                    function.
                    If you don't know what Decay to choose, use 0.001.
    Restarts    -   number of restarts from random position, >0.
                    If you don't know what Restarts to choose, use 2.
    WStep       -   stopping criterion. Algorithm stops if step size is
                    less than WStep. Recommended value - 0.01. Zero step
                    size means stopping after MaxIts iterations.
    MaxIts      -   stopping criterion. Algorithm stops after MaxIts
                    iterations (NOT gradient calculations). Zero MaxIts
                    means stopping when step is sufficiently small.

OUTPUT PARAMETERS:
    Network     -   trained neural network.
    Info        -   return code:
                    * -8, if both WStep=0 and MaxIts=0
                    * -2, if there is a point with class number
                          outside of [0..NOut-1].
                    * -1, if wrong parameters specified
                          (NPoints<0, Restarts<1).
                    *  2, if task has been solved.
    Rep         -   training report

  -- ALGLIB --
     Copyright 09.12.2007 by Bochkanov Sergey
*************************************************************************/
void mlptrainlbfgs(multilayerperceptron& network,
     const ap::real_2d_array& xy,
     int npoints,
     double decay,
     int restarts,
     double wstep,
     int maxits,
     int& info,
     mlpreport& rep)
{
    int i;
    int j;
    int pass;
    int nin;
    int nout;
    int wcount;
    ap::real_1d_array w;
    ap::real_1d_array wbest;
    double e;
    double v;
    double ebest;
    lbfgsreport internalrep;
    lbfgsstate state;

    //
    // Test inputs, parse flags, read network geometry
    //
    if( wstep==0&&maxits==0 )
    {
        info = -8;
        return;
    }
    if( npoints<=0||restarts<1||wstep<0||maxits<0 )
    {
        info = -1;
        return;
    }
    mlpproperties(network, nin, nout, wcount);
    if( mlpissoftmax(network) )
    {
        for(i = 0; i <= npoints-1; i++)
        {
            if( ap::round(xy(i,nin))<0||ap::round(xy(i,nin))>=nout )
            {
                info = -2;
                return;
            }
        }
    }
    decay = ap::maxreal(decay, mindecay);
    info = 2;

    //
    // Prepare
    //
    mlpinitpreprocessor(network, xy, npoints);
    w.setbounds(0, wcount-1);
    wbest.setbounds(0, wcount-1);
    ebest = ap::maxrealnumber;

    //
    // Multiple starts
    //
    rep.ncholesky = 0;
    rep.nhess = 0;
    rep.ngrad = 0;
    for(pass = 1; pass <= restarts; pass++)
    {

        //
        // Process
        //
        mlprandomize(network);
        ap::vmove(&w(0), &network.weights(0), ap::vlen(0,wcount-1));
        minlbfgs(wcount, ap::minint(wcount, 50), w, 0.0, 0.0, wstep, maxits, 0, state);
        while(minlbfgsiteration(state))
        {
            ap::vmove(&network.weights(0), &state.x(0), ap::vlen(0,wcount-1));
            mlpgradnbatch(network, xy, npoints, state.f, state.g);
            v = ap::vdotproduct(&network.weights(0), &network.weights(0), ap::vlen(0,wcount-1));
            state.f = state.f+0.5*decay*v;
            ap::vadd(&state.g(0), &network.weights(0), ap::vlen(0,wcount-1), decay);
            rep.ngrad = rep.ngrad+1;
        }
        minlbfgsresults(state, w, internalrep);
        ap::vmove(&network.weights(0), &w(0), ap::vlen(0,wcount-1));

        //
        // Compare with best
        //
        v = ap::vdotproduct(&network.weights(0), &network.weights(0), ap::vlen(0,wcount-1));
        e = mlperrorn(network, xy, npoints)+0.5*decay*v;
        if( e<ebest )
        {
            ap::vmove(&wbest(0), &network.weights(0), ap::vlen(0,wcount-1));
            ebest = e;
        }
    }

    //
    // The best network
    //
    ap::vmove(&network.weights(0), &wbest(0), ap::vlen(0,wcount-1));
}

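/*************************************************************************
Editorial note - a hedged sketch of the two stopping modes documented
above; not part of the original source. 'net', 'xy' and 'npoints' are
assumed to be prepared as in the earlier example.

    int info;
    mlpreport rep;
    // Stop when the step falls below 0.01, no iteration cap:
    mlptrainlbfgs(net, xy, npoints, 0.001, 2, 0.01, 0, info, rep);
    // Or run up to 500 iterations regardless of step size:
    mlptrainlbfgs(net, xy, npoints, 0.001, 2, 0.0, 500, info, rep);
    // Passing WStep=0 AND MaxIts=0 is rejected with info==-8.
*************************************************************************/
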
/*************************************************************************
Neural network training using early stopping (base algorithm - L-BFGS with
regularization).

INPUT PARAMETERS:
    Network     -   neural network with initialized geometry
    TrnXY       -   training set
    TrnSize     -   training set size
    ValXY       -   validation set
    ValSize     -   validation set size
    Decay       -   weight decay constant, >=0.001.
                    Decay term 'Decay*||Weights||^2' is added to error
                    function.
                    If you don't know what Decay to choose, use 0.001.
    Restarts    -   number of restarts from random position, >0.
                    If you don't know what Restarts to choose, use 2.

OUTPUT PARAMETERS:
    Network     -   trained neural network.
    Info        -   return code:
                    * -2, if there is a point with class number
                          outside of [0..NOut-1].
                    * -1, if wrong parameters specified
                          (NPoints<0, Restarts<1, ...).
                    *  2, task has been solved, stopping criterion met -
                          sufficiently small step size. Not expected (we
                          use EARLY stopping) but possible and not an
                          error.
                    *  6, task has been solved, stopping criterion met -
                          increasing of validation set error.
    Rep         -   training report

NOTE:

Algorithm stops if the validation set error increases for long enough or
if the step size becomes small enough (there are tasks where the
validation set error may decrease for eternity). In any case the solution
returned corresponds to the minimum of the validation set error.

  -- ALGLIB --
     Copyright 10.03.2009 by Bochkanov Sergey
*************************************************************************/
void mlptraines(multilayerperceptron& network,
     const ap::real_2d_array& trnxy,
     int trnsize,
     const ap::real_2d_array& valxy,
     int valsize,
     double decay,
     int restarts,
     int& info,
     mlpreport& rep)
{
    int i;
    int j;
    int pass;
    int nin;
    int nout;
    int wcount;
    ap::real_1d_array w;
    ap::real_1d_array wbest;
    double e;
    double v;
    double ebest;
    ap::real_1d_array wfinal;
    double efinal;
    int itbest;
    lbfgsreport internalrep;
    lbfgsstate state;
    double wstep;

    wstep = 0.001;

    //
    // Test inputs, parse flags, read network geometry
    //
    if( trnsize<=0||valsize<=0||restarts<1||decay<0 )
    {
        info = -1;
        return;
    }
    mlpproperties(network, nin, nout, wcount);
    if( mlpissoftmax(network) )
    {
        for(i = 0; i <= trnsize-1; i++)
        {
            if( ap::round(trnxy(i,nin))<0||ap::round(trnxy(i,nin))>=nout )
            {
                info = -2;
                return;
            }
        }
        for(i = 0; i <= valsize-1; i++)
        {
            if( ap::round(valxy(i,nin))<0||ap::round(valxy(i,nin))>=nout )
            {
                info = -2;
                return;
            }
        }
    }
    info = 2;

    //
    // Prepare
    //
    mlpinitpreprocessor(network, trnxy, trnsize);
    w.setbounds(0, wcount-1);
    wbest.setbounds(0, wcount-1);
    wfinal.setbounds(0, wcount-1);
    efinal = ap::maxrealnumber;
    for(i = 0; i <= wcount-1; i++)
    {
        wfinal(i) = 0;
    }

    //
    // Multiple starts
    //
    rep.ncholesky = 0;
    rep.nhess = 0;
    rep.ngrad = 0;
    for(pass = 1; pass <= restarts; pass++)
    {

        //
        // Process
        //
        mlprandomize(network);
        ebest = mlperror(network, valxy, valsize);
        ap::vmove(&wbest(0), &network.weights(0), ap::vlen(0,wcount-1));
        itbest = 0;
        ap::vmove(&w(0), &network.weights(0), ap::vlen(0,wcount-1));
        minlbfgs(wcount, ap::minint(wcount, 50), w, 0.0, 0.0, wstep, 0, 0, state);
        while(minlbfgsiteration(state))
        {

            //
            // Calculate gradient
            //
            ap::vmove(&network.weights(0), &state.x(0), ap::vlen(0,wcount-1));
            mlpgradnbatch(network, trnxy, trnsize, state.f, state.g);
            v = ap::vdotproduct(&network.weights(0), &network.weights(0), ap::vlen(0,wcount-1));
            state.f = state.f+0.5*decay*v;
            ap::vadd(&state.g(0), &network.weights(0), ap::vlen(0,wcount-1), decay);
            rep.ngrad = rep.ngrad+1;

            //
            // Validation set
            //
            if( state.xupdated )
            {
                ap::vmove(&network.weights(0), &w(0), ap::vlen(0,wcount-1));
                e = mlperror(network, valxy, valsize);
                if( e<ebest )
                {
                    ebest = e;
                    ap::vmove(&wbest(0), &network.weights(0), ap::vlen(0,wcount-1));
                    itbest = internalrep.iterationscount;
                }
                if( internalrep.iterationscount>30&&internalrep.iterationscount>1.5*itbest )
                {
                    info = 6;
                    break;
                }
            }
        }
        minlbfgsresults(state, w, internalrep);

        //
        // Compare with final answer
        //
        if( ebest<efinal )
        {
            ap::vmove(&wfinal(0), &wbest(0), ap::vlen(0,wcount-1));
            efinal = ebest;
        }
    }

    //
    // The best network
    //
    ap::vmove(&network.weights(0), &wfinal(0), ap::vlen(0,wcount-1));
}

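/*************************************************************************
Editorial note - a hedged sketch of early-stopping training; not part of
the original source. It assumes the caller has already divided the data
into disjoint training and validation matrices (the split shown here is
hypothetical).

    // trnxy: first 70 rows, valxy: remaining 30 rows of a 100-row set.
    int info;
    mlpreport rep;
    mlptraines(net, trnxy, 70, valxy, 30, 0.001, 2, info, rep);
    // info==6: stopped because validation error grew (the normal case);
    // info==2: stopped on small step size, also acceptable. Either way
    // the returned weights minimize the observed validation error.
*************************************************************************/
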
/*************************************************************************
Cross-validation estimate of generalization error.

Base algorithm - L-BFGS.

INPUT PARAMETERS:
    Network     -   neural network with initialized geometry. Network is
                    not changed during cross-validation - it is used only
                    as a representative of its architecture.
    XY          -   training set.
    SSize       -   training set size
    Decay       -   weight decay, same as in MLPTrainLBFGS
    Restarts    -   number of restarts, >0.
                    restarts are counted for each partition separately, so
                    total number of restarts will be Restarts*FoldsCount.
    WStep       -   stopping criterion, same as in MLPTrainLBFGS
    MaxIts      -   stopping criterion, same as in MLPTrainLBFGS
    FoldsCount  -   number of folds in k-fold cross-validation,
                    2<=FoldsCount<=SSize.
                    recommended value: 10.

OUTPUT PARAMETERS:
    Info        -   return code, same as in MLPTrainLBFGS
    Rep         -   report, same as in MLPTrainLM/MLPTrainLBFGS
    CVRep       -   generalization error estimates

  -- ALGLIB --
     Copyright 09.12.2007 by Bochkanov Sergey
*************************************************************************/
void mlpkfoldcvlbfgs(const multilayerperceptron& network,
     const ap::real_2d_array& xy,
     int npoints,
     double decay,
     int restarts,
     double wstep,
     int maxits,
     int foldscount,
     int& info,
     mlpreport& rep,
     mlpcvreport& cvrep)
{

    mlpkfoldcvgeneral(network, xy, npoints, decay, restarts, foldscount, false, wstep, maxits, info, rep, cvrep);
}

/*************************************************************************
Cross-validation estimate of generalization error.

Base algorithm - Levenberg-Marquardt.

INPUT PARAMETERS:
    Network     -   neural network with initialized geometry. Network is
                    not changed during cross-validation - it is used only
                    as a representative of its architecture.
    XY          -   training set.
    SSize       -   training set size
    Decay       -   weight decay, same as in MLPTrainLBFGS
    Restarts    -   number of restarts, >0.
                    restarts are counted for each partition separately, so
                    total number of restarts will be Restarts*FoldsCount.
    FoldsCount  -   number of folds in k-fold cross-validation,
                    2<=FoldsCount<=SSize.
                    recommended value: 10.

OUTPUT PARAMETERS:
    Info        -   return code, same as in MLPTrainLBFGS
    Rep         -   report, same as in MLPTrainLM/MLPTrainLBFGS
    CVRep       -   generalization error estimates

  -- ALGLIB --
     Copyright 09.12.2007 by Bochkanov Sergey
*************************************************************************/
void mlpkfoldcvlm(const multilayerperceptron& network,
     const ap::real_2d_array& xy,
     int npoints,
     double decay,
     int restarts,
     int foldscount,
     int& info,
     mlpreport& rep,
     mlpcvreport& cvrep)
{

    mlpkfoldcvgeneral(network, xy, npoints, decay, restarts, foldscount, true, 0.0, 0, info, rep, cvrep);
}

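/*************************************************************************
Editorial note - a hedged sketch of a 10-fold CV run; not part of the
original source. 'net' serves only as an architecture template here -
its weights are not modified by the call.

    int info;
    mlpreport rep;
    mlpcvreport cvrep;
    mlpkfoldcvlm(net, xy, npoints, 0.001, 2, 10, info, rep, cvrep);
    // cvrep.rmserror / cvrep.avgerror / cvrep.avgrelerror estimate
    // out-of-sample regression error; cvrep.relclserror and cvrep.avgce
    // are filled for classification (softmax) networks only.
*************************************************************************/
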
/*************************************************************************
Internal cross-validation subroutine
*************************************************************************/
static void mlpkfoldcvgeneral(const multilayerperceptron& n,
     const ap::real_2d_array& xy,
     int npoints,
     double decay,
     int restarts,
     int foldscount,
     bool lmalgorithm,
     double wstep,
     int maxits,
     int& info,
     mlpreport& rep,
     mlpcvreport& cvrep)
{
    int i;
    int fold;
    int j;
    int k;
    multilayerperceptron network;
    int nin;
    int nout;
    int rowlen;
    int wcount;
    int nclasses;
    int tssize;
    int cvssize;
    ap::real_2d_array cvset;
    ap::real_2d_array testset;
    ap::integer_1d_array folds;
    int relcnt;
    mlpreport internalrep;
    ap::real_1d_array x;
    ap::real_1d_array y;

    //
    // Read network geometry, test parameters
    //
    mlpproperties(n, nin, nout, wcount);
    if( mlpissoftmax(n) )
    {
        nclasses = nout;
        rowlen = nin+1;
    }
    else
    {
        nclasses = -nout;
        rowlen = nin+nout;
    }
    if( npoints<=0||foldscount<2||foldscount>npoints )
    {
        info = -1;
        return;
    }
    mlpcopy(n, network);

    //
    // K-fold cross-validation.
    // First, estimate generalization error
    //
    testset.setbounds(0, npoints-1, 0, rowlen-1);
    cvset.setbounds(0, npoints-1, 0, rowlen-1);
    x.setbounds(0, nin-1);
    y.setbounds(0, nout-1);
    mlpkfoldsplit(xy, npoints, nclasses, foldscount, false, folds);
    cvrep.relclserror = 0;
    cvrep.avgce = 0;
    cvrep.rmserror = 0;
    cvrep.avgerror = 0;
    cvrep.avgrelerror = 0;
    rep.ngrad = 0;
    rep.nhess = 0;
    rep.ncholesky = 0;
    relcnt = 0;
    for(fold = 0; fold <= foldscount-1; fold++)
    {

        //
        // Separate set
        //
        tssize = 0;
        cvssize = 0;
        for(i = 0; i <= npoints-1; i++)
        {
            if( folds(i)==fold )
            {
                ap::vmove(&testset(tssize, 0), &xy(i, 0), ap::vlen(0,rowlen-1));
                tssize = tssize+1;
            }
            else
            {
                ap::vmove(&cvset(cvssize, 0), &xy(i, 0), ap::vlen(0,rowlen-1));
                cvssize = cvssize+1;
            }
        }

        //
        // Train on CV training set
        //
        if( lmalgorithm )
        {
            mlptrainlm(network, cvset, cvssize, decay, restarts, info, internalrep);
        }
        else
        {
            mlptrainlbfgs(network, cvset, cvssize, decay, restarts, wstep, maxits, info, internalrep);
        }
        if( info<0 )
        {
            cvrep.relclserror = 0;
            cvrep.avgce = 0;
            cvrep.rmserror = 0;
            cvrep.avgerror = 0;
            cvrep.avgrelerror = 0;
            return;
        }
        rep.ngrad = rep.ngrad+internalrep.ngrad;
        rep.nhess = rep.nhess+internalrep.nhess;
        rep.ncholesky = rep.ncholesky+internalrep.ncholesky;

        //
        // Estimate error using CV test set
        //
        if( mlpissoftmax(network) )
        {

            //
            // classification-only code
            //
            cvrep.relclserror = cvrep.relclserror+mlpclserror(network, testset, tssize);
            cvrep.avgce = cvrep.avgce+mlperrorn(network, testset, tssize);
        }
        for(i = 0; i <= tssize-1; i++)
        {
            ap::vmove(&x(0), &testset(i, 0), ap::vlen(0,nin-1));
            mlpprocess(network, x, y);
            if( mlpissoftmax(network) )
            {

                //
                // Classification-specific code
                //
                k = ap::round(testset(i,nin));
                for(j = 0; j <= nout-1; j++)
                {
                    if( j==k )
                    {
                        cvrep.rmserror = cvrep.rmserror+ap::sqr(y(j)-1);
                        cvrep.avgerror = cvrep.avgerror+fabs(y(j)-1);
                        cvrep.avgrelerror = cvrep.avgrelerror+fabs(y(j)-1);
                        relcnt = relcnt+1;
                    }
                    else
                    {
                        cvrep.rmserror = cvrep.rmserror+ap::sqr(y(j));
                        cvrep.avgerror = cvrep.avgerror+fabs(y(j));
                    }
                }
            }
            else
            {

                //
                // Regression-specific code
                //
                for(j = 0; j <= nout-1; j++)
                {
                    cvrep.rmserror = cvrep.rmserror+ap::sqr(y(j)-testset(i,nin+j));
                    cvrep.avgerror = cvrep.avgerror+fabs(y(j)-testset(i,nin+j));
                    if( testset(i,nin+j)!=0 )
                    {
                        cvrep.avgrelerror = cvrep.avgrelerror+fabs((y(j)-testset(i,nin+j))/testset(i,nin+j));
                        relcnt = relcnt+1;
                    }
                }
            }
        }
    }
    if( mlpissoftmax(network) )
    {
        cvrep.relclserror = cvrep.relclserror/npoints;
        cvrep.avgce = cvrep.avgce/(log(double(2))*npoints);
    }
    cvrep.rmserror = sqrt(cvrep.rmserror/(npoints*nout));
    cvrep.avgerror = cvrep.avgerror/(npoints*nout);
    cvrep.avgrelerror = cvrep.avgrelerror/relcnt;
    info = 1;
}

/*************************************************************************
Subroutine prepares K-fold split of the training set.

NOTES:
    "NClasses>0" means that we have classification task.
    "NClasses<0" means regression task with -NClasses real outputs.
*************************************************************************/
static void mlpkfoldsplit(const ap::real_2d_array& xy,
     int npoints,
     int nclasses,
     int foldscount,
     bool stratifiedsplits,
     ap::integer_1d_array& folds)
{
    int i;
    int j;
    int k;

    //
    // test parameters
    //
    ap::ap_error::make_assertion(npoints>0, "MLPKFoldSplit: wrong NPoints!");
    ap::ap_error::make_assertion(nclasses>1||nclasses<0, "MLPKFoldSplit: wrong NClasses!");
    ap::ap_error::make_assertion(foldscount>=2&&foldscount<=npoints, "MLPKFoldSplit: wrong FoldsCount!");
    ap::ap_error::make_assertion(!stratifiedsplits, "MLPKFoldSplit: stratified splits are not supported!");

    //
    // Folds
    //
    folds.setbounds(0, npoints-1);
    for(i = 0; i <= npoints-1; i++)
    {
        folds(i) = i*foldscount/npoints;
    }
    for(i = 0; i <= npoints-2; i++)
    {
        j = i+ap::randominteger(npoints-i);
        if( j!=i )
        {
            k = folds(i);
            folds(i) = folds(j);
            folds(j) = k;
        }
    }
}

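/*************************************************************************
Editorial note - a worked example of the split above, not part of the
original source. For NPoints=10 and FoldsCount=3, the first loop assigns
folds(i) = i*3/10 (integer division), i.e. {0,0,0,0,1,1,1,2,2,2}, so fold
sizes differ by at most one. The second loop is a Fisher-Yates shuffle,
so fold membership becomes a uniformly random permutation of that
multiset.
*************************************************************************/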