RubyGems - scs - Versions diffs - 0.2.2 → 0.3.2 - Mend

scs 0.2.2 → 0.3.2

Files changed (103) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +16 -0
data/LICENSE.txt +18 -18
data/README.md +19 -14
data/lib/scs/ffi.rb +31 -20
data/lib/scs/solver.rb +32 -9
data/lib/scs/version.rb +1 -1
data/vendor/scs/CITATION.cff +39 -0
data/vendor/scs/CMakeLists.txt +320 -0
data/vendor/scs/Makefile +32 -23
data/vendor/scs/README.md +9 -218
data/vendor/scs/include/aa.h +67 -23
data/vendor/scs/include/cones.h +22 -19
data/vendor/scs/include/glbopts.h +107 -79
data/vendor/scs/include/linalg.h +3 -4
data/vendor/scs/include/linsys.h +58 -44
data/vendor/scs/include/normalize.h +6 -5
data/vendor/scs/include/rw.h +8 -2
data/vendor/scs/include/scs.h +257 -141
data/vendor/scs/include/scs_types.h +34 -0
data/vendor/scs/include/scs_work.h +83 -0
data/vendor/scs/include/util.h +3 -15
data/vendor/scs/linsys/cpu/direct/private.c +241 -232
data/vendor/scs/linsys/cpu/direct/private.h +13 -7
data/vendor/scs/linsys/cpu/indirect/private.c +194 -118
data/vendor/scs/linsys/cpu/indirect/private.h +7 -4
data/vendor/scs/linsys/csparse.c +87 -0
data/vendor/scs/linsys/csparse.h +34 -0
data/vendor/scs/linsys/external/amd/SuiteSparse_config.c +6 -6
data/vendor/scs/linsys/external/amd/SuiteSparse_config.h +6 -1
data/vendor/scs/linsys/external/amd/amd_internal.h +1 -1
data/vendor/scs/linsys/external/amd/amd_order.c +5 -5
data/vendor/scs/linsys/external/qdldl/changes +2 -0
data/vendor/scs/linsys/external/qdldl/qdldl.c +29 -46
data/vendor/scs/linsys/external/qdldl/qdldl.h +33 -41
data/vendor/scs/linsys/external/qdldl/qdldl_types.h +11 -3
data/vendor/scs/linsys/gpu/gpu.c +58 -21
data/vendor/scs/linsys/gpu/gpu.h +70 -35
data/vendor/scs/linsys/gpu/indirect/private.c +394 -157
data/vendor/scs/linsys/gpu/indirect/private.h +27 -12
data/vendor/scs/linsys/scs_matrix.c +478 -0
data/vendor/scs/linsys/scs_matrix.h +70 -0
data/vendor/scs/scs.mk +14 -10
data/vendor/scs/src/aa.c +394 -110
data/vendor/scs/src/cones.c +497 -359
data/vendor/scs/src/ctrlc.c +15 -5
data/vendor/scs/src/linalg.c +107 -26
data/vendor/scs/src/normalize.c +30 -72
data/vendor/scs/src/rw.c +202 -27
data/vendor/scs/src/scs.c +769 -571
data/vendor/scs/src/scs_version.c +11 -3
data/vendor/scs/src/util.c +37 -106
data/vendor/scs/test/minunit.h +22 -8
data/vendor/scs/test/problem_utils.h +180 -25
data/vendor/scs/test/problems/degenerate.h +130 -0
data/vendor/scs/test/problems/hs21_tiny_qp.h +124 -0
data/vendor/scs/test/problems/hs21_tiny_qp_rw.h +116 -0
data/vendor/scs/test/problems/infeasible_tiny_qp.h +100 -0
data/vendor/scs/test/problems/qafiro_tiny_qp.h +199 -0
data/vendor/scs/test/problems/random_prob +0 -0
data/vendor/scs/test/problems/random_prob.h +45 -0
data/vendor/scs/test/problems/rob_gauss_cov_est.h +188 -31
data/vendor/scs/test/problems/small_lp.h +14 -13
data/vendor/scs/test/problems/small_qp.h +352 -0
data/vendor/scs/test/problems/test_validation.h +43 -0
data/vendor/scs/test/problems/unbounded_tiny_qp.h +82 -0
data/vendor/scs/test/random_socp_prob.c +54 -53
data/vendor/scs/test/rng.h +109 -0
data/vendor/scs/test/run_from_file.c +20 -11
data/vendor/scs/test/run_tests.c +35 -2
metadata +29 -98
data/vendor/scs/linsys/amatrix.c +0 -305
data/vendor/scs/linsys/amatrix.h +0 -36
data/vendor/scs/linsys/amatrix.o +0 -0
data/vendor/scs/linsys/cpu/direct/private.o +0 -0
data/vendor/scs/linsys/cpu/indirect/private.o +0 -0
data/vendor/scs/linsys/external/amd/SuiteSparse_config.o +0 -0
data/vendor/scs/linsys/external/amd/amd_1.o +0 -0
data/vendor/scs/linsys/external/amd/amd_2.o +0 -0
data/vendor/scs/linsys/external/amd/amd_aat.o +0 -0
data/vendor/scs/linsys/external/amd/amd_control.o +0 -0
data/vendor/scs/linsys/external/amd/amd_defaults.o +0 -0
data/vendor/scs/linsys/external/amd/amd_dump.o +0 -0
data/vendor/scs/linsys/external/amd/amd_global.o +0 -0
data/vendor/scs/linsys/external/amd/amd_info.o +0 -0
data/vendor/scs/linsys/external/amd/amd_order.o +0 -0
data/vendor/scs/linsys/external/amd/amd_post_tree.o +0 -0
data/vendor/scs/linsys/external/amd/amd_postorder.o +0 -0
data/vendor/scs/linsys/external/amd/amd_preprocess.o +0 -0
data/vendor/scs/linsys/external/amd/amd_valid.o +0 -0
data/vendor/scs/linsys/external/qdldl/qdldl.o +0 -0
data/vendor/scs/src/aa.o +0 -0
data/vendor/scs/src/cones.o +0 -0
data/vendor/scs/src/ctrlc.o +0 -0
data/vendor/scs/src/linalg.o +0 -0
data/vendor/scs/src/normalize.o +0 -0
data/vendor/scs/src/rw.o +0 -0
data/vendor/scs/src/scs.o +0 -0
data/vendor/scs/src/scs_version.o +0 -0
data/vendor/scs/src/util.o +0 -0
data/vendor/scs/test/data/small_random_socp +0 -0
data/vendor/scs/test/problems/small_random_socp.h +0 -33
data/vendor/scs/test/run_tests +0 -2

data/vendor/scs/linsys/gpu/indirect/private.h CHANGED Viewed

@@ -5,29 +5,44 @@
 extern "C" {
 #endif
-#include "gpu.h"
+#include "csparse.h"
 #include "glbopts.h"
+#include "gpu.h"
 #include "linalg.h"
 #include "scs.h"
 struct SCS_LIN_SYS_WORK {
+  scs_int n, m; /* linear system dimensions */
   /* reporting */
   scs_int tot_cg_its;
-  scs_float total_solve_time;
+  scs_float *M; /* preconditioner on cpu */
   /* ALL BELOW HOSTED ON THE GPU */
-  scs_float *p;     /* cg iterate, n  */
-  scs_float *r;     /* cg residual, n */
-  scs_float *Gp;    /* G * p, n */
-  scs_float *bg;    /* b, n */
-  scs_float *tmp_m; /* m, used in mat_vec */
-  scs_float *z;     /* preconditioned */
-  scs_float *M;     /* preconditioner */
-  ScsGpuMatrix *Ag;    /* A matrix on GPU */
-  ScsGpuMatrix *Agt;   /* A trans matrix on GPU */
+  scs_float *p;       /* cg iterate, n  */
+  scs_float *r;       /* cg residual, n */
+  scs_float *Gp;      /* G * p, n */
+  scs_float *bg;      /* b, n */
+  scs_float *tmp_m;   /* m, used in mat_vec */
+  scs_float *z;       /* preconditioned */
+  scs_float *M_gpu;   /* preconditioner */
+  const ScsMatrix *A; /* does *not* own this memory */
+  const ScsMatrix *P; /* does *not* own this memory */
+  ScsGpuMatrix *Ag;   /* A matrix on GPU */
+  ScsGpuMatrix *Agt;  /* A trans matrix on GPU */
+  ScsGpuMatrix *Pg;   /* P matrix on GPU */
   /* CUDA */
   cublasHandle_t cublas_handle;
   cusparseHandle_t cusparse_handle;
+  /* CUSPARSE */
+  size_t buffer_size;
+  void *buffer;
+  cusparseDnVecDescr_t dn_vec_m;   /* Dense vector of length m */
+  cusparseDnVecDescr_t dn_vec_n;   /* Dense vector of length n */
+  cusparseDnVecDescr_t dn_vec_n_p; /* Dense vector of length n */
+  /* rho terms */
+  scs_float *r_x_gpu;
+  scs_float *inv_r_y;     /* inverse R_y */
+  scs_float *inv_r_y_gpu; /* inverse R_y on GPU */
 };
 #ifdef __cplusplus

data/vendor/scs/linsys/scs_matrix.c ADDED Viewed

@@ -0,0 +1,478 @@
+/* contains routines common to direct and indirect sparse solvers */
+#include "scs_matrix.h"
+#include "linalg.h"
+#include "linsys.h"
+#include "util.h"
+/* Limits applied to every norm before it is inverted (see apply_limit):
+ * norms below MIN_NORMALIZATION_FACTOR are replaced by 1.0 and norms above
+ * MAX_NORMALIZATION_FACTOR are clipped to MAX_NORMALIZATION_FACTOR. */
+#define MIN_NORMALIZATION_FACTOR (1e-4)
+#define MAX_NORMALIZATION_FACTOR (1e4)
+#define NUM_RUIZ_PASSES (25) /* additional passes don't help much */
+#define NUM_L2_PASSES (1)    /* do one or zero, not more since not stable */
+/* Deep-copies `src` into a freshly allocated ScsMatrix and stores it in
+ * `*dstp`.
+ *
+ * Returns 1 on success and 0 on allocation failure. On failure every partial
+ * allocation is released and `*dstp` is left untouched, so the caller has
+ * nothing to clean up. */
+scs_int SCS(copy_matrix)(ScsMatrix **dstp, const ScsMatrix *src) {
+  scs_int Anz = src->p[src->n];
+  ScsMatrix *A = (ScsMatrix *)scs_calloc(1, sizeof(ScsMatrix));
+  if (!A) {
+    return 0;
+  }
+  A->n = src->n;
+  A->m = src->m;
+  /* A values, size: NNZ A */
+  A->x = (scs_float *)scs_calloc(Anz, sizeof(scs_float));
+  /* A row index, size: NNZ A */
+  A->i = (scs_int *)scs_calloc(Anz, sizeof(scs_int));
+  /* A column pointer, size: n+1 */
+  A->p = (scs_int *)scs_calloc(src->n + 1, sizeof(scs_int));
+  if (!A->x || !A->i || !A->p) {
+    /* release the struct and whichever arrays did get allocated; the
+     * original code returned here and leaked all of them */
+    SCS(free_scs_matrix)(A);
+    return 0;
+  }
+  memcpy(A->x, src->x, sizeof(scs_float) * Anz);
+  memcpy(A->i, src->i, sizeof(scs_int) * Anz);
+  memcpy(A->p, src->p, sizeof(scs_int) * (src->n + 1));
+  *dstp = A;
+  return 1;
+}
+/* Sanity-checks the compressed-column inputs A and (optional) P.
+ *
+ * Returns 0 when the data looks consistent, and -1 after printing a
+ * diagnostic otherwise. Checks performed:
+ *   - A's three arrays are present,
+ *   - A's column pointers are non-decreasing (empty columns only warn),
+ *   - the nonzero count of A is within [0, m * n],
+ *   - every row index of A lies in [0, m - 1],
+ *   - if P is given: P is n x n, its arrays are present, its row indices are
+ *     non-negative and it only has entries on or above the diagonal.
+ */
+scs_int SCS(validate_lin_sys)(const ScsMatrix *A, const ScsMatrix *P) {
+  scs_int i, j, r_max, Anz;
+  if (!A->x || !A->i || !A->p) {
+    scs_printf("data incompletely specified\n");
+    return -1;
+  }
+  /* detects some errors in A col ptrs: */
+  Anz = A->p[A->n];
+  if (Anz > 0) {
+    for (i = 0; i < A->n; ++i) {
+      if (A->p[i] == A->p[i + 1]) {
+        scs_printf("WARN: A->p (column pointers) not strictly increasing, "
+                   "column %li empty\n",
+                   (long)i);
+      } else if (A->p[i] > A->p[i + 1]) {
+        scs_printf("ERROR: A->p (column pointers) decreasing\n");
+        return -1;
+      }
+    }
+  }
+  if (((scs_float)Anz / A->m > A->n) || (Anz < 0)) {
+    scs_printf("Anz (nonzeros in A) = %li, outside of valid range\n",
+               (long)Anz);
+    return -1;
+  }
+  r_max = 0;
+  for (i = 0; i < Anz; ++i) {
+    /* a negative row index would otherwise slip through the r_max test and
+     * be used to index out of bounds later on */
+    if (A->i[i] < 0) {
+      scs_printf("ERROR: negative row index in A\n");
+      return -1;
+    }
+    if (A->i[i] > r_max) {
+      r_max = A->i[i];
+    }
+  }
+  if (r_max > A->m - 1) {
+    scs_printf("number of rows in A inconsistent with input dimension\n");
+    return -1;
+  }
+  if (P) {
+    if (P->n != A->n) {
+      scs_printf("P dimension = %li, inconsistent with n = %li\n", (long)P->n,
+                 (long)A->n);
+      return -1;
+    }
+    if (P->m != P->n) {
+      scs_printf("P is not square\n");
+      return -1;
+    }
+    /* the column pointers are always needed; values / row indices only when
+     * P actually stores entries */
+    if (!P->p || (P->p[P->n] > 0 && (!P->x || !P->i))) {
+      scs_printf("P data incompletely specified\n");
+      return -1;
+    }
+    for (j = 0; j < P->n; j++) { /* cols */
+      for (i = P->p[j]; i < P->p[j + 1]; i++) {
+        if (P->i[i] < 0) {
+          scs_printf("ERROR: negative row index in P\n");
+          return -1;
+        }
+        if (P->i[i] > j) { /* if row > */
+          scs_printf("P is not upper triangular\n");
+          return -1;
+        }
+      }
+    }
+  }
+  return 0;
+}
+/* Releases the three arrays of a ScsMatrix and then the struct itself.
+ * Passing a null matrix is a no-op. */
+void SCS(free_scs_matrix)(ScsMatrix *A) {
+  if (!A) {
+    return;
+  }
+  scs_free(A->x);
+  scs_free(A->i);
+  scs_free(A->p);
+  scs_free(A);
+}
+/* Clamps a norm before it gets inverted: values under
+ * MIN_NORMALIZATION_FACTOR become 1.0 (so all-zero rows/cols do not blow up
+ * the scaling) and values over MAX_NORMALIZATION_FACTOR are clipped to it. */
+static inline scs_float apply_limit(scs_float x) {
+  if (x < MIN_NORMALIZATION_FACTOR) {
+    x = 1.0;
+  }
+  if (x > MAX_NORMALIZATION_FACTOR) {
+    x = MAX_NORMALIZATION_FACTOR;
+  }
+  return x;
+}
+/* Computes the scaling factors for one infinity-norm (Ruiz) pass.
+ *
+ * P (may be null), A, b, c: current problem data; only read here.
+ * Dt (length A->m): on return holds, per row, 1 / sqrt of the limited
+ *   inf-norm of that row of [A b], after SCS(enforce_cone_boundaries) has
+ *   been applied to the raw norms.
+ * Et (length A->n): on return holds, per column, 1 / sqrt of the limited
+ *   inf-norm of that column of [P; A; c'].
+ * s: on return holds 1 / sqrt of the limited max(|c|_inf, |b|_inf).
+ * cone: forwarded to SCS(enforce_cone_boundaries).
+ */
+static void compute_ruiz_mats(ScsMatrix *P, ScsMatrix *A, scs_float *b,
+                              scs_float *c, scs_float *Dt, scs_float *Et,
+                              scs_float *s, ScsConeWork *cone) {
+  scs_int i, j, kk;
+  scs_float wrk;
+  /****************************  D  ****************************/
+  /* initialize D with |b| so that b counts as an extra column of A */
+  for (i = 0; i < A->m; ++i) {
+    /* Dt[i] = 0.; */
+    Dt[i] = ABS(b[i]);
+  }
+  /* calculate row norms: running max of |A(r, col)| for each row r */
+  for (i = 0; i < A->n; ++i) {
+    for (j = A->p[i]; j < A->p[i + 1]; ++j) {
+      Dt[A->i[j]] = MAX(Dt[A->i[j]], ABS(A->x[j]));
+    }
+  }
+  /* accumulate D across each cone  */
+  SCS(enforce_cone_boundaries)(cone, Dt, &SCS(norm_inf));
+  /* invert temporary vec to form D */
+  for (i = 0; i < A->m; ++i) {
+    Dt[i] = SAFEDIV_POS(1.0, SQRTF(apply_limit(Dt[i])));
+  }
+  /****************************  E  ****************************/
+  /* initialize E with |c| so that c' counts as an extra row */
+  for (i = 0; i < A->n; ++i) {
+    /* Et[i] = 0.; */
+    Et[i] = ABS(c[i]);
+  }
+  /* TODO: test not using P to determine scaling  */
+  if (P) {
+    /* compute norm of cols of P (symmetric upper triangular) */
+    /* E = norm of cols of P */
+    /* Compute maximum across columns */
+    /* P(i, j) contributes to col j and col i (row i) due to symmetry */
+    for (j = 0; j < P->n; j++) { /* cols */
+      for (kk = P->p[j]; kk < P->p[j + 1]; kk++) {
+        i = P->i[kk]; /* row */
+        wrk = ABS(P->x[kk]);
+        Et[j] = MAX(wrk, Et[j]);
+        if (i != j) {
+          Et[i] = MAX(wrk, Et[i]);
+        }
+      }
+    }
+  }
+  /* calculate col norms, E: fold in the inf-norm of each column of A, then
+   * limit and invert */
+  for (i = 0; i < A->n; ++i) {
+    Et[i] = MAX(Et[i], SCS(norm_inf)(&(A->x[A->p[i]]), A->p[i + 1] - A->p[i]));
+    Et[i] = SAFEDIV_POS(1.0, SQRTF(apply_limit(Et[i])));
+  }
+  /* calculate s value */
+  *s = MAX(SCS(norm_inf)(c, A->n), SCS(norm_inf)(b, A->m));
+  *s = SAFEDIV_POS(1.0, SQRTF(apply_limit(*s)));
+}
+/* Computes the scaling factors for one l2-norm pass.
+ *
+ * P (may be null), A, b, c: current problem data; only read here.
+ * Dt (length A->m): on return holds, per row, 1 / sqrt of the limited l2-norm
+ *   of that row of [A b], after SCS(enforce_cone_boundaries) has been applied
+ *   to the raw norms with SCS(mean).
+ * Et (length A->n): on return holds, per column, 1 / sqrt of the limited
+ *   l2-norm of that column of [P; A; c'].
+ * s: on return holds 1 / sqrt of the limited l2-norm of the stacked (c, b).
+ * cone: forwarded to SCS(enforce_cone_boundaries).
+ */
+static void compute_l2_mats(ScsMatrix *P, ScsMatrix *A, scs_float *b,
+                            scs_float *c, scs_float *Dt, scs_float *Et,
+                            scs_float *s, ScsConeWork *cone) {
+  scs_int i, j, kk;
+  scs_float wrk, norm_c, norm_b;
+  /****************************  D  ****************************/
+  /* initialize D with b^2 so that b counts as an extra column of A */
+  for (i = 0; i < A->m; ++i) {
+    /* Dt[i] = 0.; */
+    Dt[i] = b[i] * b[i];
+  }
+  /* calculate row norms: accumulate squared entries of A per row */
+  for (i = 0; i < A->n; ++i) {
+    for (j = A->p[i]; j < A->p[i + 1]; ++j) {
+      Dt[A->i[j]] += A->x[j] * A->x[j];
+    }
+  }
+  for (i = 0; i < A->m; ++i) {
+    Dt[i] = SQRTF(Dt[i]); /* l2 norm of rows */
+  }
+  /* accumulate D across each cone  */
+  SCS(enforce_cone_boundaries)(cone, Dt, &SCS(mean));
+  /* limit and invert to form D */
+  for (i = 0; i < A->m; ++i) {
+    Dt[i] = SAFEDIV_POS(1.0, SQRTF(apply_limit(Dt[i])));
+  }
+  /****************************  E  ****************************/
+  /* initialize E with c^2 so that c' counts as an extra row */
+  for (i = 0; i < A->n; ++i) {
+    /* Et[i] = 0.; */
+    Et[i] = c[i] * c[i];
+  }
+  /* TODO: test not using P to determine scaling  */
+  if (P) {
+    /* compute norm of cols of P (symmetric upper triangular) */
+    /* E = norm of cols of P */
+    /* Accumulate squared entries across columns */
+    /* P(i, j) contributes to col j and col i (row i) due to symmetry */
+    for (j = 0; j < P->n; j++) { /* cols */
+      for (kk = P->p[j]; kk < P->p[j + 1]; kk++) {
+        i = P->i[kk]; /* row */
+        wrk = P->x[kk] * P->x[kk];
+        Et[j] += wrk;
+        if (i != j) {
+          Et[i] += wrk;
+        }
+      }
+    }
+  }
+  /* calculate col norms, E: add the squared norm of each column of A, take
+   * the square root to get the l2 norm, then limit and invert */
+  for (i = 0; i < A->n; ++i) {
+    Et[i] += SCS(norm_sq)(&(A->x[A->p[i]]), A->p[i + 1] - A->p[i]);
+    Et[i] = SAFEDIV_POS(1.0, SQRTF(apply_limit(SQRTF(Et[i]))));
+  }
+  /* calculate s value */
+  norm_c = SCS(norm_2)(c, A->n);
+  norm_b = SCS(norm_2)(b, A->m);
+  *s = SQRTF(norm_c * norm_c + norm_b * norm_b);
+  *s = SAFEDIV_POS(1.0, SQRTF(apply_limit(*s)));
+}
+/* Applies one pass of scaling in place and folds it into `scal`:
+ *   A -> D A E,  P -> E P E (if present),  c -> s E c,  b -> s D b,
+ * where D = diag(Dt), E = diag(Et). `scal->D`, `scal->E`,
+ * `scal->primal_scale` and `scal->dual_scale` are multiplied by the factors
+ * used in this pass. `cone` is accepted but not used here. */
+static void rescale(ScsMatrix *P, ScsMatrix *A, scs_float *b, scs_float *c,
+                    scs_float *Dt, scs_float *Et, scs_float s, ScsScaling *scal,
+                    ScsConeWork *cone) {
+  scs_int col, k, idx;
+  /* A <- D * A: each entry is multiplied by the factor of its row */
+  for (col = 0; col < A->n; ++col) {
+    for (k = A->p[col]; k < A->p[col + 1]; ++k) {
+      A->x[k] *= Dt[A->i[k]];
+    }
+  }
+  /* A <- A * E: each column is multiplied by its own factor */
+  for (col = 0; col < A->n; ++col) {
+    SCS(scale_array)(&(A->x[A->p[col]]), Et[col], A->p[col + 1] - A->p[col]);
+  }
+  if (P) {
+    /* P <- E * P */
+    for (col = 0; col < P->n; ++col) {
+      for (k = P->p[col]; k < P->p[col + 1]; ++k) {
+        P->x[k] *= Et[P->i[k]];
+      }
+    }
+    /* P <- P * E */
+    for (col = 0; col < P->n; ++col) {
+      SCS(scale_array)(&(P->x[P->p[col]]), Et[col], P->p[col + 1] - P->p[col]);
+    }
+  }
+  /* c <- E c, and remember E in the accumulated scaling */
+  for (idx = 0; idx < A->n; ++idx) {
+    c[idx] *= Et[idx];
+    scal->E[idx] *= Et[idx];
+  }
+  /* b <- D b, and remember D in the accumulated scaling */
+  for (idx = 0; idx < A->m; ++idx) {
+    b[idx] *= Dt[idx];
+    scal->D[idx] *= Dt[idx];
+  }
+  /* apply the scalar factor s to both vectors */
+  SCS(scale_array)(c, s, A->n);
+  SCS(scale_array)(b, s, A->m);
+  /* no need to scale P since primal_scale = dual_scale */
+  /*
+  if (P) {
+    SCS(scale_array)(P->x, primal_scale, P->p[P->n]);
+    SCS(scale_array)(P->x, 1.0 / dual_scale, P->p[P->n]);
+  }
+  */
+  /* fold s into the accumulated primal / dual scale */
+  scal->primal_scale *= s;
+  scal->dual_scale *= s;
+}
+/* Will rescale as P -> EPE, A -> DAE, c -> sEc, b -> sDb, in-place.
+ * Essentially trying to rescale this matrix:
+ *
+ * [P  A' c]   with   [E  0  0] on both sides (D, E diagonal)
+ * [A  0  b]          [0  D  0]
+ * [c' b' 0]          [0  0  s]
+ *
+ * which results in:
+ *
+ * [ EPE   EA'D  sEc ]
+ * [ DAE    0    sDb ]
+ * [ sc'E  sb'D   0  ]
+ *
+ * In other words D rescales the rows of A, b
+ *                E rescales the cols of A and rows/cols of P, c'
+ *
+ * will repeatedly set: D^-1 ~ norm of rows of [ A  b ]
+ *
+ *                      E^-1 ~ norm of cols of [ P ]
+ *                                             [ A ]
+ *                                             [ c']
+ *
+ * `s` is incorporated into dual_scale and primal_scale
+ *
+ * The main complication is that D has to respect cone boundaries.
+ *
+ */
+/* Runs NUM_RUIZ_PASSES infinity-norm passes followed by NUM_L2_PASSES l2
+ * passes, rescaling P (may be null), A, b and c in place each time.
+ *
+ * Returns a newly allocated ScsScaling holding the accumulated D (length
+ * A->m), E (length A->n), primal_scale and dual_scale; the caller owns it.
+ * Returns a null pointer, with the problem data untouched and nothing
+ * leaked, if a workspace allocation fails. */
+ScsScaling *SCS(normalize_a_p)(ScsMatrix *P, ScsMatrix *A, scs_float *b,
+                               scs_float *c, ScsConeWork *cone) {
+  scs_int i;
+  scs_float s;
+  ScsScaling *scal = (ScsScaling *)scs_calloc(1, sizeof(ScsScaling));
+  scs_float *Dt = (scs_float *)scs_calloc(A->m, sizeof(scs_float));
+  scs_float *Et = (scs_float *)scs_calloc(A->n, sizeof(scs_float));
+#if VERBOSITY > 5
+  SCS(timer) normalize_timer;
+#endif
+  if (scal) {
+    scal->D = (scs_float *)scs_calloc(A->m, sizeof(scs_float));
+    scal->E = (scs_float *)scs_calloc(A->n, sizeof(scs_float));
+  }
+  /* a zero-length request may legitimately yield a null pointer, so null is
+   * only treated as failure when the matching dimension is positive */
+  if (!scal || (A->m > 0 && (!Dt || !scal->D)) ||
+      (A->n > 0 && (!Et || !scal->E))) {
+    scs_free(Dt);
+    scs_free(Et);
+    if (scal) {
+      scs_free(scal->D);
+      scs_free(scal->E);
+      scs_free(scal);
+    }
+    return (ScsScaling *)0;
+  }
+#if VERBOSITY > 5
+  SCS(tic)(&normalize_timer);
+  scs_printf("normalizing A and P\n");
+#endif
+  /* init D, E */
+  scal->m = A->m;
+  for (i = 0; i < A->m; ++i) {
+    scal->D[i] = 1.;
+  }
+  scal->n = A->n;
+  for (i = 0; i < A->n; ++i) {
+    scal->E[i] = 1.;
+  }
+  scal->primal_scale = 1.;
+  scal->dual_scale = 1.;
+  for (i = 0; i < NUM_RUIZ_PASSES; ++i) {
+    compute_ruiz_mats(P, A, b, c, Dt, Et, &s, cone);
+    rescale(P, A, b, c, Dt, Et, s, scal, cone);
+  }
+  for (i = 0; i < NUM_L2_PASSES; ++i) {
+    compute_l2_mats(P, A, b, c, Dt, Et, &s, cone);
+    rescale(P, A, b, c, Dt, Et, s, scal, cone);
+  }
+  /* Dt / Et are per-pass scratch; only the accumulated scaling survives */
+  scs_free(Dt);
+  scs_free(Et);
+#if VERBOSITY > 5
+  scs_printf("finished normalizing A and P, time: %1.2es\n",
+             SCS(tocq)(&normalize_timer) / 1e3);
+  scs_printf("inf norm A %1.2e\n", SCS(norm_inf)(A->x, A->p[A->n]));
+  if (P) {
+    scs_printf("inf norm P %1.2e\n", SCS(norm_inf)(P->x, P->p[P->n]));
+  }
+  scs_printf("primal_scale %g\n", scal->primal_scale);
+  scs_printf("dual_scale %g\n", scal->dual_scale);
+  scs_printf("norm_b %g\n", SCS(norm_inf)(b, A->m));
+  scs_printf("norm_c %g\n", SCS(norm_inf)(c, A->n));
+  scs_printf("norm D %g\n", SCS(norm_inf)(scal->D, A->m));
+  scs_printf("norm E %g\n", SCS(norm_inf)(scal->E, A->n));
+#endif
+  return scal;
+}
+/* Undoes the scaling recorded in `scal` in place: every column of A is
+ * multiplied by 1 / E[col] and every entry divided by D[row]; if P is given,
+ * every column of P is multiplied by 1 / E[col] and every entry divided by
+ * E[row]. */
+void SCS(un_normalize_a_p)(ScsMatrix *A, ScsMatrix *P, const ScsScaling *scal) {
+  scs_int col, k;
+  scs_float *row_scale = scal->D;
+  scs_float *col_scale = scal->E;
+  /* columns of A */
+  for (col = 0; col < A->n; ++col) {
+    SCS(scale_array)
+    (&(A->x[A->p[col]]), 1. / col_scale[col], A->p[col + 1] - A->p[col]);
+  }
+  /* rows of A */
+  for (col = 0; col < A->n; ++col) {
+    for (k = A->p[col]; k < A->p[col + 1]; ++k) {
+      A->x[k] /= row_scale[A->i[k]];
+    }
+  }
+  if (!P) {
+    return;
+  }
+  /* columns of P */
+  for (col = 0; col < P->n; ++col) {
+    SCS(scale_array)
+    (&(P->x[P->p[col]]), 1. / col_scale[col], P->p[col + 1] - P->p[col]);
+  }
+  /* rows of P (P is scaled by E on both sides) */
+  for (col = 0; col < P->n; ++col) {
+    for (k = P->p[col]; k < P->p[col + 1]; ++k) {
+      P->x[k] /= col_scale[P->i[k]];
+    }
+  }
+}
+/* Accumulates y += A' * x for A stored in compressed-column form.
+ *
+ * A: matrix whose n columns are walked via A->p / A->i / A->x.
+ * x: input vector, indexed by the row indices stored in A->i.
+ * y: output vector, indexed by column (0 .. A->n - 1); updated in place.
+ */
+void SCS(accum_by_atrans)(const ScsMatrix *A, const scs_float *x,
+                          scs_float *y) {
+  /* y += A'*x
+     A in column compressed format
+     parallelizes over columns (rows of A')
+   */
+  scs_int p, j;
+  scs_int c1, c2;
+  scs_float yj;
+  scs_int n = A->n;
+  scs_int *Ap = A->p;
+  scs_int *Ai = A->i;
+  scs_float *Ax = A->x;
+  /* each iteration j reads and writes only y[j], so the per-iteration
+   * temporaries are the only state that has to be made thread-private */
+#ifdef _OPENMP
+#pragma omp parallel for private(p, c1, c2, yj)
+#endif
+  for (j = 0; j < n; j++) {
+    yj = y[j];
+    c1 = Ap[j];
+    c2 = Ap[j + 1];
+    /* dot product of column j of A with x, added on top of y[j] */
+    for (p = c1; p < c2; p++) {
+      yj += Ax[p] * x[Ai[p]];
+    }
+    y[j] = yj;
+  }
+}
+/* Accumulates y += A * x for A stored in compressed-column form: every
+ * stored entry A(row, col) adds A(row, col) * x[col] to y[row]. */
+void SCS(accum_by_a)(const ScsMatrix *A, const scs_float *x, scs_float *y) {
+  const scs_int ncols = A->n;
+  const scs_int *col_ptr = A->p;
+  const scs_int *row_idx = A->i;
+  const scs_float *val = A->x;
+  scs_int col, k;
+  for (col = 0; col < ncols; ++col) {
+    for (k = col_ptr[col]; k < col_ptr[col + 1]; ++k) {
+      y[row_idx[k]] += val[k] * x[col];
+    }
+  }
+}
+/* Accumulates y += P * x where only the upper triangle of the symmetric P is
+ * stored. Done in two sweeps: the strictly-upper entries are applied as they
+ * are stored, then the transpose (which also covers the diagonal) is applied
+ * through SCS(accum_by_atrans). */
+void SCS(accum_by_p)(const ScsMatrix *P, const scs_float *x, scs_float *y) {
+  const scs_int ncols = P->n;
+  const scs_int *col_ptr = P->p;
+  const scs_int *row_idx = P->i;
+  const scs_float *val = P->x;
+  scs_int col, k, row;
+  /* strictly-upper part: the diagonal is left for the transpose sweep so it
+   * is not counted twice */
+  for (col = 0; col < ncols; ++col) {
+    for (k = col_ptr[col]; k < col_ptr[col + 1]; ++k) {
+      row = row_idx[k];
+      if (row == col) {
+        continue;
+      }
+      y[row] += val[k] * x[col];
+    }
+  }
+  /* lower part plus diagonal: y += P_upper' x */
+  SCS(accum_by_atrans)(P, x, y);
+}

data/vendor/scs/linsys/scs_matrix.h ADDED Viewed

@@ -0,0 +1,70 @@
+#ifndef SCS_MATRIX_H_GUARD
+#define SCS_MATRIX_H_GUARD
+#ifdef __cplusplus
+extern "C" {
+#endif
+#include "glbopts.h"
+#include "scs.h"
+#include "scs_work.h"
+/* Normalization routines */
+/* Normalizes the problem data in place (P -> E*P*E, A -> D*A*E, b and c are
+ * rescaled as well) and returns a newly allocated ScsScaling holding the
+ * diagonal scalings scal->D and scal->E. D and E must be all positive
+ * entries, D must satisfy cone boundaries. P may be null. */
+ScsScaling *SCS(normalize_a_p)(ScsMatrix *P, ScsMatrix *A, scs_float *b,
+                               scs_float *c, ScsConeWork *cone);
+/* Unnormalizes A (and P, if non-null) in place using scal->D and scal->E.
+ * Note the argument order (A, P) is the reverse of normalize_a_p's (P, A). */
+void SCS(un_normalize_a_p)(ScsMatrix *A, ScsMatrix *P, const ScsScaling *scal);
+/* to free the memory allocated in a ScsMatrix (called on A and P at finish) */
+void SCS(free_scs_matrix)(ScsMatrix *A);
+/* copies src (instead of in-place normalization), returns 1 on success and
+ * 0 for failure, allocates memory for *dstp */
+scs_int SCS(copy_matrix)(ScsMatrix **dstp, const ScsMatrix *src);
+/* NOTE(review): declared here but not defined in scs_matrix.c; presumably
+ * implemented with the csparse helpers -- confirm, and confirm that the
+ * scs_float return type is intended. */
+scs_float SCS(cumsum)(scs_int *p, scs_int *c, scs_int n);
+/**
+ * Validate the linear system inputs, returns < 0 if not valid inputs.
+ *
+ *  @param  A    A data matrix
+ *  @param  P    P data matrix (may be null)
+ *  @return status < 0 indicates failure
+ */
+scs_int SCS(validate_lin_sys)(const ScsMatrix *A, const ScsMatrix *P);
+/**
+ * Forms y += A^T * x
+ *
+ *  @param  A    A data matrix
+ *  @param  x    Input
+ *  @param  y    Output
+ */
+void SCS(accum_by_atrans)(const ScsMatrix *A, const scs_float *x, scs_float *y);
+/**
+ * Forms y += A * x
+ *
+ *  @param  A           Data matrix
+ *  @param  x           Input
+ *  @param  y           Output
+ */
+void SCS(accum_by_a)(const ScsMatrix *A, const scs_float *x, scs_float *y);
+/**
+ * Forms y += P * x, where only the upper triangle of the symmetric P is
+ * stored
+ *
+ *  @param  P    P data matrix
+ *  @param  x    Input
+ *  @param  y    Output
+ */
+void SCS(accum_by_p)(const ScsMatrix *P, const scs_float *x, scs_float *y);
+#ifdef __cplusplus
+}
+#endif
+#endif

data/vendor/scs/scs.mk CHANGED Viewed

@@ -99,10 +99,6 @@ SFLOAT = 0
 ifneq ($(SFLOAT), 0)
 OPT_FLAGS += -DSFLOAT=$(SFLOAT) # use floats rather than doubles
 endif
-NOVALIDATE = 0
-ifneq ($(NOVALIDATE), 0)
-OPT_FLAGS += -DNOVALIDATE=$(NOVALIDATE)$ # remove data validation step
-endif
 NOTIMER = 0
 ifneq ($(NOTIMER), 0)
 OPT_FLAGS += -DNOTIMER=$(NOTIMER) # no timing, times reported as nan
@@ -115,12 +111,20 @@ GPU_TRANSPOSE_MAT = 1
 ifneq ($(GPU_TRANSPOSE_MAT), 0)
 OPT_FLAGS += -DGPU_TRANSPOSE_MAT=$(GPU_TRANSPOSE_MAT) # tranpose A mat in GPU memory
 endif
-### VERBOSITY LEVELS: 0,1,2
-EXTRA_VERBOSE = 0
-ifneq ($(EXTRA_VERBOSE), 0)
-OPT_FLAGS += -DEXTRA_VERBOSE=$(EXTRA_VERBOSE) # extra verbosity level
+NOVALIDATE = 0
+ifneq ($(NOVALIDATE), 0)
+OPT_FLAGS += -DNOVALIDATE=$(NOVALIDATE) # perform problem validation or skip
+endif
+### VERBOSITY LEVELS: 0,1,2,...
+VERBOSITY = 0
+ifneq ($(VERBOSITY), 0)
+OPT_FLAGS += -DVERBOSITY=$(VERBOSITY) # verbosity level
 endif
+COVERAGE = 0
+ifneq ($(COVERAGE), 0)
+override CFLAGS += --coverage # generate test coverage data
+endif
 ############ OPENMP: ############
 # set USE_OPENMP = 1 to allow openmp (multi-threaded matrix multiplies):
@@ -141,7 +145,7 @@ endif
 USE_LAPACK = 1
 ifneq ($(USE_LAPACK), 0)
   # edit these for your setup:
-  BLASLDFLAGS = -lblas -llapack #-lgfortran
+  BLASLDFLAGS = -llapack -lblas # -lgfortran
   LDFLAGS += $(BLASLDFLAGS)
   OPT_FLAGS += -DUSE_LAPACK