cumo 0.2.4 → 0.2.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +6 -0
- data/README.md +23 -24
- data/bench/cumo_bench.rb +1 -0
- data/ext/cumo/cuda/memory_pool.cpp +9 -1
- data/ext/cumo/cuda/memory_pool_impl.cpp +2 -13
- data/ext/cumo/cumo.c +4 -4
- data/ext/cumo/depend.erb +1 -1
- data/ext/cumo/extconf.rb +2 -0
- data/ext/cumo/include/cumo.h +4 -4
- data/ext/cumo/include/cumo/indexer.h +50 -0
- data/ext/cumo/include/cumo/intern.h +1 -0
- data/ext/cumo/include/cumo/narray.h +20 -1
- data/ext/cumo/include/cumo/narray_kernel.h +10 -0
- data/ext/cumo/include/cumo/ndloop.h +1 -1
- data/ext/cumo/narray/array.c +8 -2
- data/ext/cumo/narray/gen/tmpl/store_array.c +15 -3
- data/ext/cumo/narray/gen/tmpl_bit/store_array.c +10 -2
- data/ext/cumo/narray/index.c +77 -43
- data/ext/cumo/narray/narray.c +11 -2
- data/ext/cumo/narray/ndloop.c +49 -1
- data/ext/cumo/narray/ndloop_kernel.cu +97 -0
- data/ext/cumo/narray/step.c +56 -250
- data/lib/cumo/narray/extra.rb +50 -1
- metadata +4 -4
data/ext/cumo/narray/step.c
CHANGED
@@ -24,164 +24,10 @@
|
|
24
24
|
#define DBL_EPSILON 2.2204460492503131e-16
|
25
25
|
#endif
|
26
26
|
|
27
|
-
static ID cumo_id_beg, cumo_id_end, cumo_id_len, cumo_id_step
|
27
|
+
static ID cumo_id_beg, cumo_id_end, cumo_id_len, cumo_id_step;
|
28
28
|
|
29
|
-
//#define EXCL(r) RTEST(rb_ivar_get((r), cumo_id_excl))
|
30
|
-
#define EXCL(r) RTEST(rb_funcall((r), rb_intern("exclude_end?"), 0))
|
31
|
-
|
32
|
-
#define SET_EXCL(r,v) rb_ivar_set((r), cumo_id_excl, (v) ? Qtrue : Qfalse)
|
33
|
-
|
34
|
-
static void
|
35
|
-
step_init(
|
36
|
-
VALUE self,
|
37
|
-
VALUE beg,
|
38
|
-
VALUE end,
|
39
|
-
VALUE step,
|
40
|
-
VALUE len,
|
41
|
-
VALUE excl
|
42
|
-
)
|
43
|
-
{
|
44
|
-
if (RTEST(len)) {
|
45
|
-
if (!(FIXNUM_P(len) || TYPE(len)==T_BIGNUM)) {
|
46
|
-
rb_raise(rb_eArgError, "length must be Integer");
|
47
|
-
}
|
48
|
-
if (RTEST(rb_funcall(len,rb_intern("<"),1,INT2FIX(0)))) {
|
49
|
-
rb_raise(rb_eRangeError,"length must be non negative");
|
50
|
-
}
|
51
|
-
}
|
52
|
-
rb_ivar_set(self, cumo_id_beg, beg);
|
53
|
-
rb_ivar_set(self, cumo_id_end, end);
|
54
|
-
rb_ivar_set(self, cumo_id_len, len);
|
55
|
-
rb_ivar_set(self, cumo_id_step, step);
|
56
|
-
SET_EXCL(self, excl);
|
57
|
-
}
|
58
|
-
|
59
|
-
static VALUE
|
60
|
-
cumo_na_step_new2(
|
61
|
-
VALUE range,
|
62
|
-
VALUE step,
|
63
|
-
VALUE len
|
64
|
-
)
|
65
|
-
{
|
66
|
-
VALUE beg, end, excl;
|
67
|
-
VALUE self = rb_obj_alloc(cumo_na_cStep);
|
68
|
-
|
69
|
-
//beg = rb_ivar_get(range, cumo_id_beg);
|
70
|
-
beg = rb_funcall(range, cumo_id_beg, 0);
|
71
|
-
//end = rb_ivar_get(range, cumo_id_end);
|
72
|
-
end = rb_funcall(range, cumo_id_end, 0);
|
73
|
-
excl = rb_funcall(range, rb_intern("exclude_end?"), 0);
|
74
|
-
|
75
|
-
step_init(self, beg, end, step, len, excl);
|
76
|
-
return self;
|
77
|
-
}
|
78
|
-
|
79
|
-
|
80
|
-
/*
|
81
|
-
* call-seq:
|
82
|
-
* Step.new(start, end, step=nil, length=nil) => step
|
83
|
-
* Step.new(range, step=nil, length=nil) => step
|
84
|
-
*
|
85
|
-
* Constructs a step using three parameters among <i>start</i>,
|
86
|
-
* <i>end</i>, <i>step</i> and <i>length</i>. <i>start</i>,
|
87
|
-
* <i>end</i> parameters can be replaced with <i>range</i>. If the
|
88
|
-
* <i>step</i> is omitted (or supplied with nil), then calculated
|
89
|
-
* from <i>length</i> or definded as 1.
|
90
|
-
*/
|
91
|
-
|
92
|
-
static VALUE
|
93
|
-
step_initialize( int argc, VALUE *argv, VALUE self )
|
94
|
-
{
|
95
|
-
VALUE a, b=Qnil, c=Qnil, d=Qnil, e=Qnil;
|
96
|
-
|
97
|
-
rb_scan_args(argc, argv, "13", &a, &b, &c, &d);
|
98
|
-
/* Selfs are immutable, so that they should be initialized only once. */
|
99
|
-
if (rb_ivar_defined(self, cumo_id_beg)) {
|
100
|
-
rb_name_error(rb_intern("initialize"), "`initialize' called twice");
|
101
|
-
}
|
102
|
-
if (rb_obj_is_kind_of(a,rb_cRange)) {
|
103
|
-
if (argc>3) {
|
104
|
-
rb_raise(rb_eArgError, "extra argument");
|
105
|
-
}
|
106
|
-
d = c;
|
107
|
-
c = b;
|
108
|
-
e = rb_funcall(a, rb_intern("exclude_end?"), 0);
|
109
|
-
//b = rb_ivar_get(a, cumo_id_end);
|
110
|
-
b = rb_funcall(a, cumo_id_end, 0);
|
111
|
-
//a = rb_ivar_get(a, cumo_id_beg);
|
112
|
-
a = rb_funcall(a, cumo_id_beg, 0);
|
113
|
-
}
|
114
|
-
step_init(self, a, b, c, d, e);
|
115
|
-
return Qnil;
|
116
|
-
}
|
117
|
-
|
118
|
-
/*
|
119
|
-
* call-seq:
|
120
|
-
* step.begin => obj
|
121
|
-
* step.first => obj
|
122
|
-
*
|
123
|
-
* Returns the start of <i>step</i>.
|
124
|
-
*/
|
125
|
-
|
126
|
-
static VALUE
|
127
|
-
step_first( VALUE self )
|
128
|
-
{
|
129
|
-
return rb_ivar_get(self, cumo_id_beg);
|
130
|
-
}
|
131
|
-
|
132
|
-
/*
|
133
|
-
* call-seq:
|
134
|
-
* step.end => obj
|
135
|
-
* step.last => obj
|
136
|
-
*
|
137
|
-
* Returns the object that defines the end of <i>step</i>.
|
138
|
-
*/
|
139
|
-
|
140
|
-
static VALUE
|
141
|
-
step_last( VALUE self )
|
142
|
-
{
|
143
|
-
return rb_ivar_get(self, cumo_id_end);
|
144
|
-
}
|
145
|
-
|
146
|
-
/*
|
147
|
-
* call-seq:
|
148
|
-
* step.length => obj
|
149
|
-
* step.size => obj
|
150
|
-
*
|
151
|
-
* Returns the length of <i>step</i>.
|
152
|
-
*/
|
153
|
-
|
154
|
-
static VALUE
|
155
|
-
step_length( VALUE self )
|
156
|
-
{
|
157
|
-
return rb_ivar_get(self, cumo_id_len);
|
158
|
-
}
|
159
|
-
|
160
|
-
/*
|
161
|
-
* call-seq:
|
162
|
-
* step.step => obj
|
163
|
-
*
|
164
|
-
* Returns the step of <i>step</i>.
|
165
|
-
*/
|
166
|
-
|
167
|
-
static VALUE
|
168
|
-
step_step( VALUE self )
|
169
|
-
{
|
170
|
-
return rb_ivar_get(self, cumo_id_step);
|
171
|
-
}
|
172
|
-
|
173
|
-
/*
|
174
|
-
* call-seq:
|
175
|
-
* step.exclude_end? => true or false
|
176
|
-
*
|
177
|
-
* Returns <code>true</code> if <i>step</i> excludes its end value.
|
178
|
-
*/
|
179
|
-
static VALUE
|
180
|
-
step_exclude_end_p(VALUE self)
|
181
|
-
{
|
182
|
-
return RTEST(rb_ivar_get(self, cumo_id_excl)) ? Qtrue : Qfalse;
|
183
|
-
}
|
184
29
|
|
30
|
+
#define EXCL(r) RTEST(rb_funcall((r), rb_intern("exclude_end?"), 0))
|
185
31
|
|
186
32
|
/*
|
187
33
|
* call-seq:
|
@@ -192,7 +38,7 @@ step_exclude_end_p(VALUE self)
|
|
192
38
|
*/
|
193
39
|
|
194
40
|
void
|
195
|
-
cumo_na_step_array_index(VALUE
|
41
|
+
cumo_na_step_array_index(VALUE obj, size_t ary_size,
|
196
42
|
size_t *plen, ssize_t *pbeg, ssize_t *pstep)
|
197
43
|
{
|
198
44
|
size_t len;
|
@@ -200,14 +46,28 @@ cumo_na_step_array_index(VALUE self, size_t ary_size,
|
|
200
46
|
VALUE vbeg, vend, vstep, vlen;
|
201
47
|
ssize_t end=ary_size;
|
202
48
|
|
203
|
-
|
204
|
-
|
205
|
-
|
206
|
-
|
207
|
-
|
208
|
-
|
209
|
-
|
210
|
-
|
49
|
+
#ifdef HAVE_RB_ARITHMETIC_SEQUENCE_EXTRACT
|
50
|
+
rb_arithmetic_sequence_components_t x;
|
51
|
+
rb_arithmetic_sequence_extract(obj, &x);
|
52
|
+
|
53
|
+
vstep = x.step;
|
54
|
+
vbeg = x.begin;
|
55
|
+
vend = x.end;
|
56
|
+
#else
|
57
|
+
cumo_enumerator_t *e;
|
58
|
+
|
59
|
+
if (rb_obj_is_kind_of(obj, rb_cRange)) {
|
60
|
+
vstep = rb_ivar_get(obj, cumo_id_step);
|
61
|
+
} else { // Enumerator
|
62
|
+
cumo_na_parse_enumerator_step(obj, &vstep);
|
63
|
+
e = (cumo_enumerator_t *)DATA_PTR(obj);
|
64
|
+
obj = e->obj; // Range
|
65
|
+
}
|
66
|
+
|
67
|
+
vbeg = rb_funcall(obj, cumo_id_beg, 0);
|
68
|
+
vend = rb_funcall(obj, cumo_id_end, 0);
|
69
|
+
#endif
|
70
|
+
vlen = rb_ivar_get(obj, cumo_id_len);
|
211
71
|
|
212
72
|
if (RTEST(vbeg)) {
|
213
73
|
beg = NUM2SSIZET(vbeg);
|
@@ -237,7 +97,7 @@ cumo_na_step_array_index(VALUE self, size_t ary_size,
|
|
237
97
|
}
|
238
98
|
} else {
|
239
99
|
if (RTEST(vend)) {
|
240
|
-
if (EXCL(
|
100
|
+
if (EXCL(obj)) {
|
241
101
|
if (step>0) end--;
|
242
102
|
if (step<0) end++;
|
243
103
|
}
|
@@ -251,7 +111,7 @@ cumo_na_step_array_index(VALUE self, size_t ary_size,
|
|
251
111
|
step = 1;
|
252
112
|
if (RTEST(vbeg)) {
|
253
113
|
if (RTEST(vend)) {
|
254
|
-
if (EXCL(
|
114
|
+
if (EXCL(obj)) {
|
255
115
|
if (beg<end) end--;
|
256
116
|
if (beg>end) end++;
|
257
117
|
}
|
@@ -262,7 +122,7 @@ cumo_na_step_array_index(VALUE self, size_t ary_size,
|
|
262
122
|
}
|
263
123
|
} else {
|
264
124
|
if (RTEST(vend)) {
|
265
|
-
if (EXCL(
|
125
|
+
if (EXCL(obj)) {
|
266
126
|
end--;
|
267
127
|
}
|
268
128
|
beg = end - (len-1);
|
@@ -286,7 +146,7 @@ cumo_na_step_array_index(VALUE self, size_t ary_size,
|
|
286
146
|
if (!RTEST(vend)) {
|
287
147
|
end = ary_size-1;
|
288
148
|
}
|
289
|
-
else if (EXCL(
|
149
|
+
else if (EXCL(obj)) {
|
290
150
|
end--;
|
291
151
|
}
|
292
152
|
if (beg<=end) {
|
@@ -301,7 +161,7 @@ cumo_na_step_array_index(VALUE self, size_t ary_size,
|
|
301
161
|
if (!RTEST(vend)) {
|
302
162
|
end = 0;
|
303
163
|
}
|
304
|
-
else if (EXCL(
|
164
|
+
else if (EXCL(obj)) {
|
305
165
|
end++;
|
306
166
|
}
|
307
167
|
if (beg>=end) {
|
@@ -327,25 +187,35 @@ cumo_na_step_array_index(VALUE self, size_t ary_size,
|
|
327
187
|
if (pstep) *pstep = step;
|
328
188
|
}
|
329
189
|
|
330
|
-
|
331
190
|
void
|
332
|
-
cumo_na_step_sequence( VALUE
|
191
|
+
cumo_na_step_sequence( VALUE obj, size_t *plen, double *pbeg, double *pstep )
|
333
192
|
{
|
334
|
-
VALUE
|
193
|
+
VALUE vend, vstep, vlen;
|
335
194
|
double dbeg, dend, dstep=1, dsize, err;
|
336
195
|
size_t size, n;
|
337
196
|
|
338
|
-
|
339
|
-
|
340
|
-
|
341
|
-
|
342
|
-
|
343
|
-
|
197
|
+
#ifdef HAVE_RB_ARITHMETIC_SEQUENCE_EXTRACT
|
198
|
+
rb_arithmetic_sequence_components_t x;
|
199
|
+
rb_arithmetic_sequence_extract(obj, &x);
|
200
|
+
|
201
|
+
vstep = x.step;
|
202
|
+
dbeg = NUM2DBL(x.begin);
|
203
|
+
vend = x.end;
|
204
|
+
#else
|
205
|
+
cumo_enumerator_t *e;
|
206
|
+
|
207
|
+
if (rb_obj_is_kind_of(obj, rb_cRange)) {
|
208
|
+
vstep = rb_ivar_get(obj, cumo_id_step);
|
209
|
+
} else { // Enumerator
|
210
|
+
cumo_na_parse_enumerator_step(obj, &vstep);
|
211
|
+
e = (cumo_enumerator_t *)DATA_PTR(obj);
|
212
|
+
obj = e->obj; // Range
|
213
|
+
}
|
344
214
|
|
345
|
-
|
346
|
-
|
347
|
-
|
348
|
-
|
215
|
+
dbeg = NUM2DBL(rb_funcall(obj, cumo_id_beg, 0));
|
216
|
+
vend = rb_funcall(obj, cumo_id_end, 0);
|
217
|
+
#endif
|
218
|
+
vlen = rb_ivar_get(obj, cumo_id_len);
|
349
219
|
|
350
220
|
if (RTEST(vlen)) {
|
351
221
|
size = NUM2SIZET(vlen);
|
@@ -353,7 +223,7 @@ cumo_na_step_sequence( VALUE self, size_t *plen, double *pbeg, double *pstep )
|
|
353
223
|
if (!RTEST(vstep)) {
|
354
224
|
if (RTEST(vend)) {
|
355
225
|
dend = NUM2DBL(vend);
|
356
|
-
if (EXCL(
|
226
|
+
if (EXCL(obj)) {
|
357
227
|
n = size;
|
358
228
|
} else {
|
359
229
|
n = size-1;
|
@@ -378,7 +248,7 @@ cumo_na_step_sequence( VALUE self, size_t *plen, double *pbeg, double *pstep )
|
|
378
248
|
err = (fabs(dbeg)+fabs(dend)+fabs(dend-dbeg))/fabs(dstep)*DBL_EPSILON;
|
379
249
|
if (err>0.5) err=0.5;
|
380
250
|
dsize = (dend-dbeg)/dstep;
|
381
|
-
if (EXCL(
|
251
|
+
if (EXCL(obj))
|
382
252
|
dsize -= err;
|
383
253
|
else
|
384
254
|
dsize += err;
|
@@ -398,77 +268,13 @@ cumo_na_step_sequence( VALUE self, size_t *plen, double *pbeg, double *pstep )
|
|
398
268
|
if (pstep) *pstep = dstep;
|
399
269
|
}
|
400
270
|
|
401
|
-
/*
|
402
|
-
static VALUE
|
403
|
-
step_each( VALUE self )
|
404
|
-
{
|
405
|
-
VALUE a;
|
406
|
-
double beg, step;
|
407
|
-
size_t i, size;
|
408
|
-
|
409
|
-
a = cumo_na_step_parameters( self, Qnil );
|
410
|
-
beg = NUM2DBL(RARRAY_PTR(a)[0]);
|
411
|
-
step = NUM2DBL(RARRAY_PTR(a)[1]);
|
412
|
-
size = NUM2SIZET(RARRAY_PTR(a)[2]);
|
413
|
-
|
414
|
-
for (i=0; i<size; i++) {
|
415
|
-
rb_yield(rb_float_new(beg+i*step));
|
416
|
-
}
|
417
|
-
return self;
|
418
|
-
}
|
419
|
-
*/
|
420
|
-
|
421
|
-
static VALUE
|
422
|
-
range_with_step( VALUE range, VALUE step )
|
423
|
-
{
|
424
|
-
return cumo_na_step_new2( range, step, Qnil );
|
425
|
-
}
|
426
|
-
|
427
|
-
static VALUE
|
428
|
-
range_with_length( VALUE range, VALUE len )
|
429
|
-
{
|
430
|
-
return cumo_na_step_new2( range, Qnil, len );
|
431
|
-
}
|
432
|
-
|
433
|
-
|
434
|
-
static VALUE
|
435
|
-
cumo_na_s_step( int argc, VALUE *argv, VALUE mod )
|
436
|
-
{
|
437
|
-
VALUE self = rb_obj_alloc(cumo_na_cStep);
|
438
|
-
step_initialize(argc, argv, self);
|
439
|
-
return self;
|
440
|
-
}
|
441
|
-
|
442
|
-
|
443
271
|
void
|
444
272
|
Init_cumo_na_step()
|
445
273
|
{
|
446
|
-
|
447
|
-
rb_include_module(cumo_na_cStep, rb_mEnumerable);
|
448
|
-
rb_define_method(cumo_na_cStep, "initialize", step_initialize, -1);
|
449
|
-
|
450
|
-
//rb_define_method(cumo_na_cStep, "each", step_each, 0);
|
451
|
-
|
452
|
-
rb_define_method(cumo_na_cStep, "first", step_first, 0);
|
453
|
-
rb_define_method(cumo_na_cStep, "last", step_last, 0);
|
454
|
-
rb_define_method(cumo_na_cStep, "begin", step_first, 0);
|
455
|
-
rb_define_method(cumo_na_cStep, "end", step_last, 0);
|
456
|
-
rb_define_method(cumo_na_cStep, "step", step_step, 0);
|
457
|
-
rb_define_method(cumo_na_cStep, "length", step_length, 0);
|
458
|
-
rb_define_method(cumo_na_cStep, "size", step_length, 0);
|
459
|
-
rb_define_method(cumo_na_cStep, "exclude_end?", step_exclude_end_p, 0);
|
460
|
-
//rb_define_method(cumo_na_cStep, "to_s", step_to_s, 0);
|
461
|
-
//rb_define_method(cumo_na_cStep, "inspect", step_inspect, 0);
|
462
|
-
//rb_define_method(cumo_na_cStep, "parameters", cumo_na_step_parameters, 1);
|
463
|
-
|
464
|
-
rb_define_method(rb_cRange, "%", range_with_step, 1);
|
465
|
-
rb_define_method(rb_cRange, "*", range_with_length, 1);
|
466
|
-
|
467
|
-
rb_define_singleton_method(cNArray, "step", cumo_na_s_step, -1);
|
274
|
+
rb_define_alias(rb_cRange, "%", "step");
|
468
275
|
|
469
276
|
cumo_id_beg = rb_intern("begin");
|
470
277
|
cumo_id_end = rb_intern("end");
|
471
278
|
cumo_id_len = rb_intern("length");
|
472
279
|
cumo_id_step = rb_intern("step");
|
473
|
-
cumo_id_excl = rb_intern("excl");
|
474
280
|
}
|
data/lib/cumo/narray/extra.rb
CHANGED
@@ -208,6 +208,55 @@ module Cumo
|
|
208
208
|
end
|
209
209
|
end
|
210
210
|
|
211
|
+
|
212
|
+
# Iterate over an axis
|
213
|
+
# @ example
|
214
|
+
# > a = Cumo::DFloat.new(2,2,2).seq
|
215
|
+
# > p a
|
216
|
+
# Cumo::DFloat#shape=[2,2,2]
|
217
|
+
# [[[0, 1],
|
218
|
+
# [2, 3]],
|
219
|
+
# [[4, 5],
|
220
|
+
# [6, 7]]]
|
221
|
+
#
|
222
|
+
# > a.each_over_axis{|i| p i}
|
223
|
+
# Cumo::DFloat(view)#shape=[2,2]
|
224
|
+
# [[0, 1],
|
225
|
+
# [2, 3]]
|
226
|
+
# Cumo::DFloat(view)#shape=[2,2]
|
227
|
+
# [[4, 5],
|
228
|
+
# [6, 7]]
|
229
|
+
#
|
230
|
+
# > a.each_over_axis(1){|i| p i}
|
231
|
+
# Cumo::DFloat(view)#shape=[2,2]
|
232
|
+
# [[0, 1],
|
233
|
+
# [4, 5]]
|
234
|
+
# Cumo::DFloat(view)#shape=[2,2]
|
235
|
+
# [[2, 3],
|
236
|
+
# [6, 7]]
|
237
|
+
|
238
|
+
def each_over_axis(axis=0)
|
239
|
+
unless block_given?
|
240
|
+
return to_enum(:each_over_axis,axis)
|
241
|
+
end
|
242
|
+
if ndim == 0
|
243
|
+
if axis != 0
|
244
|
+
raise ArgumentError,"axis=#{axis} is invalid"
|
245
|
+
end
|
246
|
+
niter = 1
|
247
|
+
else
|
248
|
+
axis = check_axis(axis)
|
249
|
+
niter = shape[axis]
|
250
|
+
end
|
251
|
+
idx = [true]*ndim
|
252
|
+
niter.times do |i|
|
253
|
+
idx[axis] = i
|
254
|
+
yield(self[*idx])
|
255
|
+
end
|
256
|
+
self
|
257
|
+
end
|
258
|
+
|
259
|
+
|
211
260
|
# Append values to the end of an narray.
|
212
261
|
# @example
|
213
262
|
# a = Cumo::DFloat[1, 2, 3]
|
@@ -987,7 +1036,7 @@ module Cumo
|
|
987
1036
|
raise NArray::ShapeError, "must be >= 2-dimensional array"
|
988
1037
|
end
|
989
1038
|
m,n = shape[-2..-1]
|
990
|
-
NArray.triu_indices(m,n,k
|
1039
|
+
NArray.triu_indices(m,n,k)
|
991
1040
|
end
|
992
1041
|
|
993
1042
|
# Return the indices for the uppler-triangle on and above the k-th diagonal.
|