nysol-take 3.0.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (161) hide show
  1. checksums.yaml +7 -0
  2. data/bin/mbiclique.rb +317 -0
  3. data/bin/mbipolish.rb +362 -0
  4. data/bin/mccomp.rb +235 -0
  5. data/bin/mclique.rb +295 -0
  6. data/bin/mclique2g.rb +105 -0
  7. data/bin/mcliqueInfo.rb +203 -0
  8. data/bin/mfriends.rb +202 -0
  9. data/bin/mgdiff.rb +252 -0
  10. data/bin/mhifriend.rb +456 -0
  11. data/bin/mhipolish.rb +465 -0
  12. data/bin/mitemset.rb +168 -0
  13. data/bin/mpal.rb +410 -0
  14. data/bin/mpolishing.rb +399 -0
  15. data/bin/msequence.rb +165 -0
  16. data/bin/mtra2g.rb +476 -0
  17. data/bin/mtra2gc.rb +360 -0
  18. data/ext/grhfilrun/extconf.rb +12 -0
  19. data/ext/grhfilrun/grhfilrun.c +85 -0
  20. data/ext/grhfilrun/src/_sspc.c +358 -0
  21. data/ext/grhfilrun/src/aheap.c +545 -0
  22. data/ext/grhfilrun/src/aheap.h +251 -0
  23. data/ext/grhfilrun/src/base.c +92 -0
  24. data/ext/grhfilrun/src/base.h +59 -0
  25. data/ext/grhfilrun/src/fstar.c +497 -0
  26. data/ext/grhfilrun/src/fstar.h +80 -0
  27. data/ext/grhfilrun/src/grhfil.c +214 -0
  28. data/ext/grhfilrun/src/itemset.c +713 -0
  29. data/ext/grhfilrun/src/itemset.h +170 -0
  30. data/ext/grhfilrun/src/problem.c +415 -0
  31. data/ext/grhfilrun/src/problem.h +179 -0
  32. data/ext/grhfilrun/src/queue.c +533 -0
  33. data/ext/grhfilrun/src/queue.h +182 -0
  34. data/ext/grhfilrun/src/sample.c +19 -0
  35. data/ext/grhfilrun/src/sspc.c +597 -0
  36. data/ext/grhfilrun/src/sspc2.c +491 -0
  37. data/ext/grhfilrun/src/stdlib2.c +1482 -0
  38. data/ext/grhfilrun/src/stdlib2.h +892 -0
  39. data/ext/grhfilrun/src/trsact.c +817 -0
  40. data/ext/grhfilrun/src/trsact.h +160 -0
  41. data/ext/grhfilrun/src/vec.c +745 -0
  42. data/ext/grhfilrun/src/vec.h +172 -0
  43. data/ext/lcmrun/extconf.rb +20 -0
  44. data/ext/lcmrun/lcmrun.cpp +99 -0
  45. data/ext/lcmrun/src/aheap.c +216 -0
  46. data/ext/lcmrun/src/aheap.h +111 -0
  47. data/ext/lcmrun/src/base.c +92 -0
  48. data/ext/lcmrun/src/base.h +59 -0
  49. data/ext/lcmrun/src/itemset.c +496 -0
  50. data/ext/lcmrun/src/itemset.h +157 -0
  51. data/ext/lcmrun/src/lcm.c +427 -0
  52. data/ext/lcmrun/src/problem.c +349 -0
  53. data/ext/lcmrun/src/problem.h +177 -0
  54. data/ext/lcmrun/src/queue.c +528 -0
  55. data/ext/lcmrun/src/queue.h +176 -0
  56. data/ext/lcmrun/src/sgraph.c +359 -0
  57. data/ext/lcmrun/src/sgraph.h +173 -0
  58. data/ext/lcmrun/src/stdlib2.c +1282 -0
  59. data/ext/lcmrun/src/stdlib2.h +823 -0
  60. data/ext/lcmrun/src/trsact.c +747 -0
  61. data/ext/lcmrun/src/trsact.h +159 -0
  62. data/ext/lcmrun/src/vec.c +731 -0
  63. data/ext/lcmrun/src/vec.h +171 -0
  64. data/ext/lcmseq0run/extconf.rb +20 -0
  65. data/ext/lcmseq0run/lcmseq0run.cpp +59 -0
  66. data/ext/lcmseq0run/src/aheap.c +216 -0
  67. data/ext/lcmseq0run/src/aheap.h +111 -0
  68. data/ext/lcmseq0run/src/base.c +92 -0
  69. data/ext/lcmseq0run/src/base.h +59 -0
  70. data/ext/lcmseq0run/src/itemset.c +518 -0
  71. data/ext/lcmseq0run/src/itemset.h +157 -0
  72. data/ext/lcmseq0run/src/itemset_zero.c +522 -0
  73. data/ext/lcmseq0run/src/lcm_seq.c +446 -0
  74. data/ext/lcmseq0run/src/lcm_seq_zero.c +446 -0
  75. data/ext/lcmseq0run/src/problem.c +439 -0
  76. data/ext/lcmseq0run/src/problem.h +179 -0
  77. data/ext/lcmseq0run/src/problem_zero.c +439 -0
  78. data/ext/lcmseq0run/src/queue.c +533 -0
  79. data/ext/lcmseq0run/src/queue.h +182 -0
  80. data/ext/lcmseq0run/src/stdlib2.c +1350 -0
  81. data/ext/lcmseq0run/src/stdlib2.h +864 -0
  82. data/ext/lcmseq0run/src/trsact.c +747 -0
  83. data/ext/lcmseq0run/src/trsact.h +159 -0
  84. data/ext/lcmseq0run/src/vec.c +779 -0
  85. data/ext/lcmseq0run/src/vec.h +172 -0
  86. data/ext/lcmseqrun/extconf.rb +20 -0
  87. data/ext/lcmseqrun/lcmseqrun.cpp +101 -0
  88. data/ext/lcmseqrun/src/aheap.c +216 -0
  89. data/ext/lcmseqrun/src/aheap.h +111 -0
  90. data/ext/lcmseqrun/src/base.c +92 -0
  91. data/ext/lcmseqrun/src/base.h +59 -0
  92. data/ext/lcmseqrun/src/itemset.c +518 -0
  93. data/ext/lcmseqrun/src/itemset.h +157 -0
  94. data/ext/lcmseqrun/src/itemset_zero.c +522 -0
  95. data/ext/lcmseqrun/src/lcm_seq.c +447 -0
  96. data/ext/lcmseqrun/src/lcm_seq_zero.c +446 -0
  97. data/ext/lcmseqrun/src/problem.c +439 -0
  98. data/ext/lcmseqrun/src/problem.h +179 -0
  99. data/ext/lcmseqrun/src/problem_zero.c +439 -0
  100. data/ext/lcmseqrun/src/queue.c +533 -0
  101. data/ext/lcmseqrun/src/queue.h +182 -0
  102. data/ext/lcmseqrun/src/stdlib2.c +1350 -0
  103. data/ext/lcmseqrun/src/stdlib2.h +864 -0
  104. data/ext/lcmseqrun/src/trsact.c +747 -0
  105. data/ext/lcmseqrun/src/trsact.h +159 -0
  106. data/ext/lcmseqrun/src/vec.c +779 -0
  107. data/ext/lcmseqrun/src/vec.h +172 -0
  108. data/ext/lcmtransrun/extconf.rb +18 -0
  109. data/ext/lcmtransrun/lcmtransrun.cpp +264 -0
  110. data/ext/macerun/extconf.rb +20 -0
  111. data/ext/macerun/macerun.cpp +57 -0
  112. data/ext/macerun/src/aheap.c +217 -0
  113. data/ext/macerun/src/aheap.h +112 -0
  114. data/ext/macerun/src/itemset.c +491 -0
  115. data/ext/macerun/src/itemset.h +158 -0
  116. data/ext/macerun/src/mace.c +503 -0
  117. data/ext/macerun/src/problem.c +346 -0
  118. data/ext/macerun/src/problem.h +174 -0
  119. data/ext/macerun/src/queue.c +529 -0
  120. data/ext/macerun/src/queue.h +177 -0
  121. data/ext/macerun/src/sgraph.c +360 -0
  122. data/ext/macerun/src/sgraph.h +174 -0
  123. data/ext/macerun/src/stdlib2.c +993 -0
  124. data/ext/macerun/src/stdlib2.h +811 -0
  125. data/ext/macerun/src/vec.c +634 -0
  126. data/ext/macerun/src/vec.h +170 -0
  127. data/ext/sspcrun/extconf.rb +20 -0
  128. data/ext/sspcrun/src/_sspc.c +358 -0
  129. data/ext/sspcrun/src/aheap.c +545 -0
  130. data/ext/sspcrun/src/aheap.h +251 -0
  131. data/ext/sspcrun/src/base.c +92 -0
  132. data/ext/sspcrun/src/base.h +59 -0
  133. data/ext/sspcrun/src/fstar.c +496 -0
  134. data/ext/sspcrun/src/fstar.h +80 -0
  135. data/ext/sspcrun/src/grhfil.c +213 -0
  136. data/ext/sspcrun/src/itemset.c +713 -0
  137. data/ext/sspcrun/src/itemset.h +170 -0
  138. data/ext/sspcrun/src/problem.c +415 -0
  139. data/ext/sspcrun/src/problem.h +179 -0
  140. data/ext/sspcrun/src/queue.c +533 -0
  141. data/ext/sspcrun/src/queue.h +182 -0
  142. data/ext/sspcrun/src/sample.c +19 -0
  143. data/ext/sspcrun/src/sspc.c +598 -0
  144. data/ext/sspcrun/src/sspc2.c +491 -0
  145. data/ext/sspcrun/src/stdlib2.c +1482 -0
  146. data/ext/sspcrun/src/stdlib2.h +892 -0
  147. data/ext/sspcrun/src/trsact.c +817 -0
  148. data/ext/sspcrun/src/trsact.h +160 -0
  149. data/ext/sspcrun/src/vec.c +745 -0
  150. data/ext/sspcrun/src/vec.h +172 -0
  151. data/ext/sspcrun/sspcrun.cpp +54 -0
  152. data/lib/nysol/enumLcmEp.rb +338 -0
  153. data/lib/nysol/enumLcmEsp.rb +284 -0
  154. data/lib/nysol/enumLcmIs.rb +275 -0
  155. data/lib/nysol/enumLcmSeq.rb +143 -0
  156. data/lib/nysol/items.rb +201 -0
  157. data/lib/nysol/seqDB.rb +256 -0
  158. data/lib/nysol/take.rb +39 -0
  159. data/lib/nysol/taxonomy.rb +113 -0
  160. data/lib/nysol/traDB.rb +257 -0
  161. metadata +239 -0
@@ -0,0 +1,634 @@
1
+ /* library for vector and sparse vector, and matrix */
2
+ /* Takeaki Uno 27/Dec/2008 */
3
+
4
+ #ifndef _vec_c_
5
+ #define _vec_c_
6
+
7
+ #include"vec.h"
8
+ #include"stdlib2.c"
9
+ #include"queue.c"
10
+
11
+ MAT INIT_MAT = {TYPE_MAT,NULL,0,NULL,0,0,NULL,NULL,0,0};
12
+ SVEC INIT_SVEC_ELE = {0,0};
13
+ SVEC INIT_SVEC = {TYPE_SVEC,NULL,0,0};
14
+ SMAT INIT_SMAT = {TYPE_SMAT,NULL,0,NULL,0,0,NULL,NULL,0,0,0};
15
+ SETFAMILY INIT_SETFAMILY = INIT_SETFAMILY_;
16
+
17
+ QSORT_TYPE (SVEC_VAL, SVEC_VAL)
18
+ QSORT_TYPE (SVEC_VAL2, SVEC_VAL2)
19
+
20
+ /* allocate memory according to rows and rowt */
21
+ void VEC_alloc (VEC *V, VEC_ID clms){
22
+ *V = INIT_VEC;
23
+ V->end = clms;
24
+ calloc2 (V->v, clms+1, EXIT);
25
+ }
26
+
27
+ /* terminate routine for VEC */
28
+ void VEC_end (VEC *V){
29
+ free2 (V->v);
30
+ *V = INIT_VEC;
31
+ }
32
+
33
+ /* allocate memory according to rows and rowt */
34
+ void MAT_alloc (MAT *M, VEC_ID rows, VEC_ID clms){
35
+ VEC_ID i;
36
+ calloc2 (M->v, rows+1, EXIT);
37
+ calloc2 (M->buf, (clms+1) * (rows+1), {free(M->v);EXIT;});
38
+ M->end = rows;
39
+ M->clms = clms;
40
+ FLOOP (i, 0, rows){
41
+ M->v[i].end = M->v[i].t = clms;
42
+ M->v[i].v = M->buf + i*(clms+1);
43
+ }
44
+ }
45
+
46
+ /* terminate routine for MAT */
47
+ void MAT_end (MAT *M){
48
+ free2 (M->buf);
49
+ free2 (M->buf2);
50
+ free2 (M->v);
51
+ *M = INIT_MAT;
52
+ }
53
+
54
+ /* allocate memory */
55
+ void SVEC_alloc (SVEC *V, VEC_ID end){
56
+ *V = INIT_SVEC;
57
+ calloc2 (V->v, end+1, EXIT);
58
+ V->end = end;
59
+ V->t = 0;
60
+ }
61
+
62
+ /* terminate routine for SVEC */
63
+ void SVEC_end (SVEC *V){
64
+ free2 (V->v);
65
+ *V = INIT_SVEC;
66
+ }
67
+
68
+ /* allocate memory according to rows and rowt */
69
+ void SMAT_alloc (SMAT *M, VEC_ID rows, VEC_ID *rowt, VEC_ID clms, size_t eles){
70
+ VEC_ID i;
71
+ if ( eles == 0 ) ARY_SUM (M->ele_end, rowt, 0, rows); else M->ele_end = eles;
72
+ calloc2 (M->buf, M->ele_end*((M->flag&LOAD_DBLBUF)?2:1) +rows +2, EXIT);
73
+ malloc2 (M->v, rows+1, {free(M->buf);EXIT;});
74
+ ARY_FILL (M->v, 0, rows, INIT_SVEC);
75
+ M->end = rows;
76
+ M->clms = clms;
77
+ if ( rowt ){
78
+ FLOOP (i, 0, rows){
79
+ M->v[i].v = i? M->v[i-1].v + rowt[i-1] +1: M->buf;
80
+ M->v[i].end = rowt[i];
81
+ }
82
+ }
83
+ }
84
+
85
+ /* terminate routine for MAT */
86
+ void SMAT_end (SMAT *M){
87
+ free2 (M->buf);
88
+ free2 (M->buf2);
89
+ free2 (M->v);
90
+ *M = INIT_SMAT;
91
+ }
92
+
93
+
94
+
95
+ /* allocate memory according to rows and rowt */
96
+ /* if eles == 0, compute eles from rowt and rows */
97
+ void SETFAMILY_alloc (SETFAMILY *M, VEC_ID rows, VEC_ID *rowt, VEC_ID clms, size_t eles){
98
+ VEC_ID i;
99
+ char *buf;
100
+ if ( eles == 0 ) ARY_SUM (M->ele_end, rowt, 0, rows); else M->ele_end = eles;
101
+ calloc2 (buf, (M->ele_end*((M->flag&LOAD_DBLBUF)?2:1) +((M->flag&LOAD_DBLBUF)?MAX(rows,clms):rows)+2)*M->unit, EXIT);
102
+ M->buf = (QUEUE_INT *)buf;
103
+ malloc2 (M->v, rows+1, {free(M->buf);EXIT;});
104
+ ARY_FILL (M->v, 0, rows, INIT_QUEUE);
105
+ M->end = rows;
106
+ M->clms = clms;
107
+ if ( rowt ){
108
+ FLOOP (i, 0, rows){
109
+ M->v[i].v = (QUEUE_INT *)buf;
110
+ buf += (rowt[i] +1)*M->unit;
111
+ M->v[i].end = rowt[i]+1;
112
+ }
113
+ }
114
+ }
115
+
116
+ /* allocate memory according to rows and rowt */
117
+ /* if eles == 0, compute eles from rowt and rows */
118
+ void SETFAMILY_alloc_weight (SETFAMILY *M){
119
+ VEC_ID i;
120
+ calloc2 (M->w, M->end +1, EXIT);
121
+ calloc2 (M->wbuf, M->ele_end*((M->flag&LOAD_DBLBUF)?2:1)+1, {free(M->w);EXIT;});
122
+ FLOOP (i, 1, M->t) M->w[i] = i? M->w[i-1] + M->v[i-1].t: M->wbuf;
123
+ }
124
+
125
+ /* terminate routine for MAT */
126
+ void SETFAMILY_end (SETFAMILY *M){
127
+ mfree (M->buf, M->buf2, M->v, M->rw, M->cw, M->wbuf, M->w);
128
+ *M = INIT_SETFAMILY;
129
+ }
130
+
131
+ /****************************************************************/
132
+ /****************************************************************/
133
+ /****************************************************************/
134
+
135
+ /* read binary file for MAT */
136
+ /* each unit-byte will be one number. if unit<0, the sign of unit is flipped, and each value is minesed the half of the maximum */
137
+ void MAT_load_bin (MAT *M, FILE2 *fp, int unit){
138
+ VEC_ID flag=0, i, j, jj;
139
+ size_t siz=0;
140
+ VEC_VAL z, neg=0;
141
+
142
+ if ( unit < 0 ){
143
+ unit = -unit; flag = 1; neg=128;
144
+ FLOOP (jj, 0, unit-1) neg *= 256;
145
+ }
146
+ if ( M->t == 0 ){ // determine #rows if M->t is 0 (not specified)
147
+ fseek(fp->fp, 0, SEEK_END);
148
+ siz = ftell(fp->fp);
149
+ fseek(fp->fp, 0, SEEK_SET);
150
+ M->t = (VEC_ID)(siz / unit / M->clms);
151
+ if ( M->flag & LOAD_TPOSE ) SWAP_VEC_ID (M->t, M->clms);
152
+ }
153
+ MAT_alloc (M, M->t, M->clms); if (ERROR_MES) return;
154
+ M->end = M->t;
155
+ FLOOP (i, 0, M->t){
156
+ FLOOP (j, 0, M->clms){
157
+ z=0; FLOOP (jj, 0, unit){ z *= 256; z += FILE2_getc (fp); }
158
+ if ( flag ) z -= neg;
159
+ if ( M->flag & LOAD_TPOSE ) M->v[j].v[i] = z;
160
+ else M->v[i].v[j] = z;
161
+ }
162
+ }
163
+ }
164
+
165
+ /* segmentation fault for illegal files */
166
+ /* count/read the number in file for MAT */
167
+ /* if *rows>0, only read count the numbers in a row, for the first scan. */
168
+ void MAT_file_load (MAT *M, FILE2 *fp){
169
+ QUEUE_ID c;
170
+ VEC_ID t=0;
171
+ double p;
172
+
173
+ for ( t=0 ; (FILE_err&2)==0 ; t++){
174
+ ARY_SCAN (c, double, *fp, 0);
175
+ if ( M->flag & LOAD_TPOSE ){
176
+ if ( M->t == 0 ){ M->t = c; if ( M->clms>0 ) break; }
177
+ } else if ( M->clms == 0 ){ M->clms = c; if ( M->t>0 ) break; }
178
+ }
179
+ if ( M->flag & LOAD_TPOSE ){ if ( M->clms==0 ) M->clms = t;} else if ( M->t==0 ) M->t = t;
180
+ FILE2_reset (fp);
181
+ M->end = M->t;
182
+ MAT_alloc (M, M->t, M->clms); if (ERROR_MES) return;
183
+ FLOOP (t, 0, M->t ){
184
+ FLOOP (c, 0, M->clms){
185
+ p = FILE2_read_double(fp);
186
+ if ( M->flag&LOAD_TPOSE ) M->v[c].v[t] = p;
187
+ else M->v[t].v[c] = p;
188
+ if ( c>= ((M->flag&LOAD_TPOSE)? M->t: M->clms) ) break;
189
+ }
190
+ if ( !FILE_err ) FILE2_read_until_newline (fp);
191
+ if ( c>= ((M->flag&LOAD_TPOSE)? M->clms: M->t) ) break;
192
+ }
193
+ }
194
+
195
+ /* load file with switching the format according to the flag */
196
+ void MAT_load (MAT *M){
197
+ FILE2 fp = INIT_FILE2;
198
+ int unit=0;
199
+ #ifdef USE_MATH
200
+ VEC_ID i;
201
+ #endif
202
+ if ( M->flag & VEC_LOAD_BIN ) unit = 1;
203
+ else if ( M->flag & VEC_LOAD_BIN2 ) unit = 2;
204
+ else if ( M->flag & VEC_LOAD_BIN4 ) unit = 4;
205
+ if ( M->flag & VEC_LOAD_CENTERIZE ) unit = -unit;
206
+
207
+ FILE2_open (fp, M->fname, "rb", EXIT);
208
+ if ( unit ) MAT_load_bin (M, &fp, unit);
209
+ else MAT_file_load (M, &fp);
210
+ FILE2_close (&fp); if (ERROR_MES) EXIT;
211
+ #ifdef USE_MATH
212
+ if ( M->flag&VEC_NORMALIZE ) FLOOP (i, 0, M->t) ARY_NORMALIZE (M->v[i].v,M->v[i].t);
213
+ #endif
214
+ print_mes (M, "mat: %s ,#rows %d ,#clms %d\n", M->fname, M->t, M->clms);
215
+ }
216
+
217
+
218
+ /* scan file and read the numbers for SMAT */
219
+ /* flag&1? SMAT, SETFAMILY, flag&2? tuple list format: array list :*/
220
+ void SMAT_file_load (SMAT *M, FILE2 *fp){
221
+ SVEC_VAL z=0;
222
+ VEC_ID flag= (M->type==TYPE_SMAT), t, x, y;
223
+ FILE_COUNT C;
224
+
225
+ C = FILE2_count (fp, (M->flag&(LOAD_ELE+LOAD_TPOSE)) | FILE_COUNT_ROWT, 0, 0, 0, 0, 0);
226
+ if ( M->clms == 0 ) M->clms = C.clms;
227
+ if ( M->t == 0 ) M->t = C.rows;
228
+ if ( flag ) SMAT_alloc (M, M->t, C.rowt, M->clms, 0);
229
+ else SETFAMILY_alloc ((SETFAMILY *)M, M->t, C.rowt, M->clms, 0);
230
+ free2 (C.rowt);
231
+ if ( ERROR_MES ) return;
232
+ FILE2_reset (fp);
233
+ t=0;
234
+ do {
235
+ if ( M->flag&LOAD_ELE ){
236
+ x = (VEC_ID)FILE2_read_int (fp);
237
+ y = (VEC_ID)FILE2_read_int (fp);
238
+ if ( flag ) z = FILE2_read_double (fp);
239
+ if ( FILE_err&4 ) goto LOOP_END2;
240
+ FILE2_read_until_newline (fp);
241
+ } else {
242
+ x = t;
243
+ y = (VEC_ID)FILE2_read_int (fp);
244
+ if ( FILE_err&4 ) goto LOOP_END2;
245
+ if ( flag ) z = FILE2_read_double (fp);
246
+ }
247
+ if ( M->flag&LOAD_TPOSE ) SWAP_VEC_ID (x, y);
248
+ // printf ("%d %d %d %d\n", x, M->t, y, M->clms);
249
+ if ( y >= M->clms || x >= M->t ) goto LOOP_END2;
250
+ // printf ("## %d %d\n", x, y);
251
+ if ( flag ){
252
+ M->v[x].v[M->v[x].t].i = y;
253
+ M->v[x].v[M->v[x].t].a = z;
254
+ M->v[x].t++;
255
+ } else ARY_INS (((SETFAMILY *)M)->v[x], y);
256
+ LOOP_END2:;
257
+ if ( !(M->flag&LOAD_ELE) && (FILE_err&3) ){ t++; if ( t >= M->t ) break; }
258
+ } while ( (FILE_err&2)==0 );
259
+ }
260
+
261
+ /* scan file and read the numbers for SMAT */
262
+ /* flag&1? SMAT, SETFAMILY, flag&2? tuple list format: array list :*/
263
+ void SETFAMILY_load_weight (SETFAMILY *M){
264
+ FILE2 fp = INIT_FILE2;
265
+ VEC_ID i;
266
+ QUEUE_ID j;
267
+ if ( M->flag&LOAD_TPOSE ) error ("transope and weight can't be specified simultaneously", EXIT);
268
+ FILE2_open (fp, M->wfname, "r", EXIT);
269
+ SETFAMILY_alloc_weight (M);
270
+ FLOOP (i, 0, M->t){
271
+ FLOOP (j, 0, M->v[i].t)
272
+ M->w[i][j] = (WEIGHT)FILE2_read_double (&fp);
273
+ FILE2_read_until_newline (&fp);
274
+ }
275
+ }
276
+
277
+ void SETFAMILY_load_column_weight (SETFAMILY *M){
278
+ int i;
279
+ #ifdef WEIGHT_DOUBLE
280
+ ARY_LOAD (M->cw, double, i, M->cwfname, 1, EXIT);
281
+ #else
282
+ ARY_LOAD (M->cw, int, i, M->cwfname, 1, EXIT);
283
+ #endif
284
+ if ( i < M->clms ){ realloc2 (M->cw, M->clms+1, EXIT); ARY_FILL (M->cw, i, M->clms+1, 0); }
285
+ }
286
+
287
+ void SETFAMILY_load_row_weight (SETFAMILY *M){
288
+ int i;
289
+ #ifdef WEIGHT_DOUBLE
290
+ ARY_LOAD (M->rw, double, i, M->rwfname, 1, EXIT);
291
+ #else
292
+ ARY_LOAD (M->rw, int, i, M->rwfname, 1, EXIT);
293
+ #endif
294
+ if ( i < M->t ){ realloc2 (M->rw, M->t+1, EXIT); ARY_FILL (M->rw, i, M->t+1, 0); }
295
+ }
296
+
297
+
298
+ /* load file with switching the format according to the flag */
299
+ void SMAT_load (SMAT *M){
300
+ FILE2 fp = INIT_FILE2;
301
+ VEC_ID i;
302
+ M->type = TYPE_SMAT;
303
+ FILE2_open (fp, M->fname, "r", EXIT);
304
+ SMAT_file_load (M, &fp);
305
+ FILE2_close (&fp); if (ERROR_MES) EXIT;
306
+ FLOOP (i, 0, M->t) M->v[i].v[M->v[i].t].i = M->clms; // end mark
307
+
308
+ #ifdef USE_MATH
309
+ if ( M->flag&VEC_NORMALIZE ) FLOOP (i, 0, M->t) SVEC_normalize (&M->v[i]); // normalize
310
+ #endif
311
+ if (M->flag&LOAD_INCSORT)
312
+ FLOOP (i, 0, M->t) qsort_VEC_ID ((VEC_ID *)(M->v[i].v), M->v[i].t, sizeof(SVEC_ELE));
313
+ if (M->flag&LOAD_DECSORT)
314
+ FLOOP (i, 0, M->t) qsort_VEC_ID ((VEC_ID *)(M->v[i].v), M->v[i].t, -(int)sizeof(SVEC_ELE));
315
+ if (M->flag&LOAD_RM_DUP)
316
+ FLOOP (i, 0, M->t) MQUE_UNIFY (M->v[i], SVEC_VAL);
317
+ M->eles = M->ele_end;
318
+ print_mes (M, "smat: %s ,#rows %d ,#clms %d ,#eles %zd\n", M->fname, M->t, M->clms, M->eles);
319
+
320
+ }
321
+
322
+ /* sort and duplication check */
323
+ void SETFAMILY_sort (SETFAMILY *M){
324
+ VEC_ID i;
325
+ PERM *p;
326
+ WEIGHT *ww;
327
+ QUEUE Q;
328
+ int flag = (M->flag&LOAD_INCSORT)? 1: ((M->flag&LOAD_DECSORT)? -1: 0);
329
+ if ( flag ){ // sort items in each row
330
+ malloc2 (p, M->clms, EXIT);
331
+ FLOOP (i, 0, M->t)
332
+ QUEUE_perm_WEIGHT (&M->v[i], M->w?M->w[i]:NULL, p, flag);
333
+ free (p);
334
+ }
335
+ flag = ((M->flag&LOAD_SIZSORT)? ((M->flag&LOAD_DECROWSORT)? -1: 1): 0) *sizeof(QUEUE);
336
+ if ( flag ){ // sort the rows
337
+ p = qsort_perm_VECt ((VEC *)M->v, M->t, flag);
338
+ if ( M->w ) ARY_INVPERMUTE_ (M->w, p, ww, M->t);
339
+ ARY_INVPERMUTE (M->v, p, Q, M->t, EXIT);
340
+ free (p);
341
+ }
342
+ if (M->flag&LOAD_RM_DUP){ // unify the duplicated edges
343
+ FLOOP (i, 0, M->t)
344
+ QUEUE_rm_dup_WEIGHT (&M->v[i], M->w?M->w[i]:NULL);
345
+ }
346
+ }
347
+
348
+ /* scan file and load the data from file to SMAT structure */
349
+ void SETFAMILY_load (SETFAMILY *M){
350
+ FILE2 fp = INIT_FILE2;
351
+ VEC_ID i;
352
+ M->type = TYPE_SETFAMILY;
353
+ FILE2_open (fp, M->fname, "r", EXIT);
354
+ SMAT_file_load ((SMAT *)M, &fp);
355
+ FILE2_close (&fp); if(ERROR_MES) EXIT;
356
+ FLOOP (i, 0, M->t) M->v[i].v[M->v[i].t] = M->clms; // end mark
357
+ print_mes (M, "setfamily: %s ,#rows %d ,#clms %d ,#eles %zd", M->fname, M->t, M->clms, M->eles);
358
+ if ( !(M->flag&LOAD_ELE) && M->wfname ){
359
+ SETFAMILY_load_weight (M); if ( ERROR_MES ){ SETFAMILY_end (M); EXIT; }
360
+ print_mes (M, " ,weightfile %s", M->wfname);
361
+ }
362
+ print_mes (M, "\n");
363
+
364
+ SETFAMILY_sort (M);
365
+ M->eles = M->ele_end;
366
+
367
+ }
368
+
369
+ /* print routines */
370
+ void MAT_print (FILE *fp, MAT *M){
371
+ VEC *V;
372
+ MQUE_FLOOP (*M, V) ARY_FPRINT (fp, V->v, 0, V->t, VEC_VALF" ");
373
+ }
374
+ void SVEC_print (FILE *fp, SVEC *V){
375
+ SVEC_ELE *x;
376
+ MQUE_FLOOP (*V, x) fprintf (fp, "("QUEUE_IDF","SVEC_VALF") ", (*x).i, (*x).a);
377
+ fputc ('\n', fp);
378
+ }
379
+ void SMAT_print (FILE *fp, SMAT *M){
380
+ SVEC *V;
381
+ MQUE_FLOOP (*M, V) SVEC_print (fp, V);
382
+ }
383
+ void SETFAMILY_print (FILE *fp, SETFAMILY *M){
384
+ QUEUE *V;
385
+ MQUE_FLOOP (*M, V) ARY_FPRINT (fp, V->v, 0, V->t, QUEUE_INTF" ");
386
+ }
387
+
388
+ /*
389
+ void SETFAMILY_print_WEIGHT (FILE *fp, SETFAMILY *M){
390
+ if ( M->w ){
391
+ printf (","); fprint_WEIGHT (stdout, M->w[i][j]); }
392
+ printf ("\n");
393
+ }
394
+ */
395
+
396
+ /****************************************************************/
397
+ /** Inner product routines **************************************/
398
+ /****************************************************************/
399
+ SVEC_VAL2 SVEC_inpro (SVEC *V1, SVEC *V2){
400
+ VEC_ID i1, i2=0;
401
+ SVEC_VAL2 sum=0;
402
+ FLOOP (i1, 0, V1->t){
403
+ while (V2->v[i2].i < V1->v[i1].i) i2++;
404
+ if (V2->v[i2].i == V1->v[i1].i) sum += ((SVEC_VAL2)V2->v[i2].a)*V1->v[i1].a;
405
+ }
406
+ return (sum);
407
+ }
408
+
409
+
410
+ /* get ith vector */
411
+ void *MVEC_getvec (void *M, int i, int flag){
412
+ MAT *MM = (MAT *)M;
413
+ if (MM->type==TYPE_MAT) return (&MM->v[i]);
414
+ if (MM->type==TYPE_SMAT) return (&((SVEC *)M)->v[i]);
415
+ if (MM->type==TYPE_SETFAMILY) return (&((QUEUE *)M)->v[i]);
416
+ return (NULL);
417
+ }
418
+
419
+ #ifdef USE_MATH
420
+
421
+ /****************************************************************/
422
+ /** Norm computation and normalization ************************/
423
+ /****************************************************************/
424
+ double SVEC_norm (SVEC *V){
425
+ SVEC_ELE *v;
426
+ double sum=0;
427
+ MQUE_FLOOP (*V, v) sum += ((double)(v->a)) * (v->a);
428
+ return (sqrt(sum));
429
+ }
430
+ void SVEC_normalize (SVEC *V){
431
+ SVEC_ELE *v;
432
+ double norm = SVEC_norm (V);
433
+ MQUE_FLOOP (*V, v) v->a /= norm;
434
+ }
435
+
436
+ /****************************************************************/
437
+ /** Euclidean distance routines *********************************/
438
+ /****************************************************************/
439
+
440
+ /* compute the inner product of two vectors */
441
+ double VEC_eucdist (VEC *V1, VEC *V2){
442
+ VEC_ID i, end=MIN(V1->end,V2->end);
443
+ double sum=0, a0, a1, a2, a3;
444
+ for (i=0 ; i<end ; i+=4){
445
+ a0 = ((double)V1->v[i])- ((double)V2->v[i]);
446
+ a1 = ((double)V1->v[i+1])- ((double)V2->v[i+1]);
447
+ a2 = ((double)V1->v[i+2])- ((double)V2->v[i+2]);
448
+ a3 = ((double)V1->v[i+3])- ((double)V2->v[i+3]);
449
+ sum += a0*a0 + a1*a1 + a2*a2 + a3*a3;
450
+ }
451
+ if ( i+1<end ){
452
+ a0 = ((double)V1->v[i])- ((double)V2->v[i]);
453
+ a1 = ((double)V1->v[i+1])- ((double)V2->v[i+1]);
454
+ sum += a0*a0 + a1*a1;
455
+ if ( i+2<end ){ a2 = ((double)V1->v[i+2])- ((double)V2->v[i+2]); sum += a2*a2; }
456
+ } else if ( i<end ){ a0 = ((double)V1->v[i])- ((double)V2->v[i]); sum += a0*a0; }
457
+ return (sqrt(sum));
458
+ }
459
+
460
+ /* compute the inner product of two vectors */
461
+ double SVEC_eucdist (SVEC *V1, SVEC *V2){
462
+ VEC_ID i1, i2;
463
+ double sum=0, a;
464
+ for ( i1=i2=0 ; i1<V1->t && i2<V2->t ; ){
465
+ if (V2->v[i2].i > V1->v[i1].i) a = V1->v[i1].a;
466
+ else if (V2->v[i2].i < V1->v[i1].i) a = V2->v[i2].a;
467
+ else a = ((double)V2->v[i2].a) - ((double)V1->v[i1].a);
468
+ sum += a*a;
469
+ }
470
+ return (sqrt(sum));
471
+ }
472
+
473
+ /* compute the inner product of two vectors */
474
+ double VEC_SVEC_eucdist (VEC *V1, SVEC *V2){
475
+ VEC_ID i, i2=0;
476
+ double sum=0, a;
477
+ FLOOP (i, 0, V1->end){
478
+ if ( i < V2->v[i2].i ) a = V1->v[i];
479
+ else { a = ((double)V1->v[i]) - ((double)V2->v[i2].a); i2++; }
480
+ sum += a*a;
481
+ }
482
+ return (sqrt(sum));
483
+ }
484
+
485
+ /**********************************************************/
486
+ /* Euclidean distance of vector and set */
487
+ double VEC_QUEUE_eucdist (VEC *V, QUEUE *Q){
488
+ VEC_ID i;
489
+ QUEUE_ID i2=0;
490
+ double sum=0, a;
491
+ FLOOP (i, 0, V->end){
492
+ if ( i < Q->v[i2] ) a = V->v[i];
493
+ else { a = ((double)V->v[i]) - 1.0; i2++; }
494
+ sum += a*a;
495
+ }
496
+ return (sqrt(sum));
497
+ }
498
+
499
+ /* compute Euclidean distance of two sets */
500
+ double QUEUE_eucdist (QUEUE *Q1, QUEUE *Q2){
501
+ double f;
502
+ MQUE_UNION(f, *Q1, *Q2);
503
+ return (sqrt(f));
504
+ }
505
+
506
+ double MVEC_norm (void *V){
507
+ VEC *VV = (VEC *)V;
508
+ double p;
509
+ if (VV->type==TYPE_VEC){ ARY_NORM (p, VV->v, VV->t); return (p); }
510
+ if (VV->type==TYPE_SVEC) return (SVEC_norm ((SVEC *)V));
511
+ if (VV->type==TYPE_QUEUE) return (sqrt(((QUEUE*)V)->t));
512
+ return (0.0);
513
+ }
514
+
515
+ double MMAT_norm_i (void *M, int i){
516
+ MAT *MM = (MAT *)M;
517
+ double p;
518
+ if (MM->type==TYPE_MAT){ ARY_NORM (p, MM->v[i].v, MM->v[i].t); return (p); }
519
+ if (MM->type==TYPE_SMAT) return (SVEC_norm (&((SMAT *)M)->v[i]));
520
+ if (MM->type==TYPE_SETFAMILY) return (sqrt (((SETFAMILY *)M)->v[i].t));
521
+ return (0.0);
522
+ }
523
+
524
+ double MVEC_eucdist (void *V, void *U){
525
+ VEC *VV = (VEC *)V;
526
+ double p;
527
+ if (VV->type==TYPE_VEC) return (VEC_eucdist ((VEC *)V, (VEC *)U));
528
+ if (VV->type==TYPE_SVEC) return (SVEC_eucdist ((SVEC *)V, (SVEC *)U));
529
+ if (VV->type==TYPE_QUEUE){ MQUE_DIF (p, *((QUEUE *)V), *((QUEUE *)U)); return (sqrt(p));}
530
+ return (0.0);
531
+ }
532
+
533
+ double MMAT_eucdist_ij (void *M, int i, int j){
534
+ MAT *MM=(MAT *)M;
535
+ double p;
536
+ if (MM->type==TYPE_MAT) return (VEC_eucdist ( &MM->v[i], &MM->v[j] ));
537
+ if (MM->type==TYPE_SMAT) return (SVEC_eucdist ( &((SMAT *)M)->v[i], &((SMAT *)M)->v[j]));
538
+ if (MM->type==TYPE_SETFAMILY){ MQUE_DIF (p, ((SETFAMILY *)M)->v[i], ((SETFAMILY *)M)->v[j]); return (sqrt(p)); }
539
+ return (0.0);
540
+ }
541
+
542
+
543
+ #endif
544
+
545
+ /* compute the inner product of two vectors */
546
+ double VEC_linfdist (VEC *V1, VEC *V2){
547
+ VEC_ID i, end=MIN(V1->end,V2->end);
548
+ double max=0, a0, a1, a2, a3;
549
+ for (i=0 ; i<end ; i+=4){
550
+ a0 = fabs(((double)V1->v[i])- ((double)V2->v[i]));
551
+ a1 = fabs(((double)V1->v[i+1])- ((double)V2->v[i+1]));
552
+ a2 = fabs(((double)V1->v[i+2])- ((double)V2->v[i+2]));
553
+ a3 = fabs(((double)V1->v[i+3])- ((double)V2->v[i+3]));
554
+ ENMAX (a0, a1); ENMAX (a2, a3); ENMAX (a0, a2); ENMAX (max, a0);
555
+ }
556
+ if ( i+1<end ){
557
+ a0 = fabs(((double)V1->v[i])- ((double)V2->v[i]));
558
+ a1 = fabs(((double)V1->v[i+1])- ((double)V2->v[i+1]));
559
+ ENMAX (a0, a1); ENMAX (max, a0);
560
+ if ( i+2<end ){ a2 = fabs(((double)V1->v[i+2])- ((double)V2->v[i+2])); ENMAX (max, a2); }
561
+ } else if ( i<end ){ a0 = fabs(((double)V1->v[i])- ((double)V2->v[i])); ENMAX (max, a0); }
562
+ return (max);
563
+ }
564
+
565
+ /**********************************************************/
566
+ /** multi-vector routines ******************************/
567
+ /**********************************************************/
568
+
569
+ /* compute the inner product, Euclidean distance for multi vector */
570
+ double MVEC_inpro (void *V, void *U){
571
+ VEC *VV = (VEC *)V, *UU = (VEC *)U;
572
+ double p;
573
+ if (VV->type==TYPE_VEC){
574
+ if (UU->type==TYPE_VEC){ ARY_INPRO (p, VV->v, UU->v, VV->t); return (p); }
575
+ if (UU->type==TYPE_SVEC){ ARY_SVEC_INPRO (p, *((SVEC *)U), VV->v); return (p); }
576
+ if (UU->type==TYPE_QUEUE){ ARY_QUEUE_INPRO (p, *((QUEUE *)U), VV->v); return (p); }
577
+ }
578
+ if (VV->type==TYPE_SVEC){
579
+ if (UU->type==TYPE_VEC){ ARY_SVEC_INPRO (p, *((SVEC *)V), UU->v); return (p);}
580
+ if (UU->type==TYPE_SVEC) return (SVEC_inpro ((SVEC *)V, (SVEC *)U));
581
+ // if (UU->type==TYPE_QUEUE) return (VEC_QUEUE_inpro (V, U));
582
+ }
583
+ if (VV->type==TYPE_QUEUE){
584
+ if (UU->type==TYPE_VEC){ ARY_QUEUE_INPRO (p, *((QUEUE *)V), UU->v); return (p); }
585
+ // else if (UU->type==TYPE_SVEC) return (SVEC_inpro (V, U));
586
+ if (UU->type==TYPE_QUEUE){ MQUE_INTSEC (p, *((QUEUE *)V), *((QUEUE *)U)); return (p);}
587
+ }
588
+ return (0.0);
589
+ }
590
+
591
+ double MVEC_double_inpro (void *V, double *w){
592
+ VEC *VV = (VEC *)V;
593
+ double p;
594
+ if (VV->type==TYPE_VEC){ ARY_INPRO (p, VV->v, w, VV->t); return (p); }
595
+ if (VV->type==TYPE_SVEC){ ARY_SVEC_INPRO (p, *((SVEC *)V), w); return (p); }
596
+ if (VV->type==TYPE_QUEUE){ ARY_QUEUE_INPRO (p, *((QUEUE *)V), w); return (p); }
597
+ return (0.0);
598
+ }
599
+
600
+ /* compute the inner product, euclidean distance for i,jth vector */
601
+ double MMAT_inpro_ij (void *M, int i, int j){
602
+ MAT *MM = (MAT *)M;
603
+ double p;
604
+ if (MM->type==TYPE_MAT){ ARY_INPRO (p, MM->v[i].v, MM->v[j].v, MM->v[j].t); return (p); }
605
+ if (MM->type==TYPE_SMAT) return (SVEC_inpro (&((SMAT *)M)->v[i], &((SMAT *)M)->v[j]));
606
+ if (MM->type==TYPE_SETFAMILY){
607
+ p = QUEUE_intsec_ (&((SETFAMILY *)M)->v[i], &((SETFAMILY *)M)->v[j]); return (p); }
608
+ return (0.0);
609
+ }
610
+
611
+ double MMAT_double_inpro_i (void *M, int i, double *w){
612
+ MAT *MM = (MAT *)M;
613
+ double p;
614
+ if (MM->type==TYPE_MAT){ ARY_INPRO (p, MM->v[i].v, w, MM->v[i].t); return (p); }
615
+ if (MM->type==TYPE_SMAT){ ARY_SVEC_INPRO (p, ((SMAT *)M)->v[i], w); return (p); }
616
+ if (MM->type==TYPE_SETFAMILY){ ARY_QUEUE_INPRO (p, ((SETFAMILY *)M)->v[i], w); return (p); }
617
+ return (0.0);
618
+ }
619
+
620
+ #ifdef _barray_h_
621
+ void SETFAMILY_to_BARRAY (BARRAY *A, SETFAMILY *F){
622
+ VEC_ID t;
623
+ size_t i=0;
624
+ BARRAY_init (A, F->clms, F->t);
625
+ FLOOP (t, 0, F->t){
626
+ BARRAY_set_subset (&A->v[i], &F->v[t]);
627
+ i += A->xend;
628
+ }
629
+ }
630
+ #endif
631
+
632
+ #endif
633
+
634
+