big_ml 0.1.2 → 0.1.3

Sign up to get free protection for your applications and to get access to all the features.
Files changed (52) hide show
  1. checksums.yaml +7 -0
  2. data/.rspec +1 -1
  3. data/.rvmrc.example +1 -1
  4. data/.travis.yml +1 -1
  5. data/README.md +6 -5
  6. data/lib/big_ml.rb +5 -0
  7. data/lib/big_ml/base.rb +31 -0
  8. data/lib/big_ml/batch_prediction.rb +39 -0
  9. data/lib/big_ml/ensemble.rb +32 -0
  10. data/lib/big_ml/evaluation.rb +31 -0
  11. data/lib/big_ml/prediction.rb +2 -2
  12. data/lib/big_ml/util/client.rb +1 -0
  13. data/lib/big_ml/util/config.rb +4 -1
  14. data/lib/big_ml/util/request.rb +9 -4
  15. data/lib/big_ml/version.rb +1 -1
  16. data/spec/integration/dataset_spec.rb +21 -23
  17. data/spec/integration/ensemble_spec.rb +73 -0
  18. data/spec/integration/evaluation_spec.rb +64 -0
  19. data/spec/integration/model_spec.rb +23 -25
  20. data/spec/integration/prediction_spec.rb +20 -22
  21. data/spec/integration/source_spec.rb +22 -24
  22. data/spec/spec_helper.rb +4 -3
  23. data/spec/units/client_spec.rb +58 -26
  24. data/spec/units/source_spec.rb +3 -3
  25. data/spec/vcr_cassettes/BigML_Dataset/one_dataset/can_be_converted_in_a_model.yml +180 -99
  26. data/spec/vcr_cassettes/BigML_Dataset/one_dataset/must_be_able_to_be_find_using_the_reference.yml +144 -163
  27. data/spec/vcr_cassettes/BigML_Ensemble/no_ensemble/_all/must_be_empty.yml +223 -0
  28. data/spec/vcr_cassettes/BigML_Ensemble/one_ensemble/can_be_converted_in_a_prediction.yml +1074 -0
  29. data/spec/vcr_cassettes/BigML_Ensemble/one_ensemble/must_be_able_to_be_deleted_using_the_destroy_method.yml +1082 -0
  30. data/spec/vcr_cassettes/BigML_Ensemble/one_ensemble/must_be_able_to_be_find_using_the_reference.yml +734 -0
  31. data/spec/vcr_cassettes/BigML_Ensemble/one_ensemble/must_be_able_to_remove_the_ensemble.yml +1215 -0
  32. data/spec/vcr_cassettes/BigML_Ensemble/one_ensemble/must_be_able_to_set_number_of_models.yml +853 -0
  33. data/spec/vcr_cassettes/BigML_Ensemble/one_ensemble/must_be_able_to_update_the_name.yml +1226 -0
  34. data/spec/vcr_cassettes/BigML_Ensemble/one_ensemble/must_be_able_to_update_the_name_from_the_instance.yml +1226 -0
  35. data/spec/vcr_cassettes/BigML_Ensemble/one_ensemble/must_have_only_one_item.yml +686 -0
  36. data/spec/vcr_cassettes/BigML_Ensemble/one_ensemble/must_have_the_same_size.yml +732 -0
  37. data/spec/vcr_cassettes/BigML_Ensemble/one_ensemble/was_created_successfully.yml +495 -0
  38. data/spec/vcr_cassettes/BigML_Evaluation/no_evaluation/_all/must_be_empty.yml +600 -0
  39. data/spec/vcr_cassettes/BigML_Evaluation/one_evaluation/must_be_able_to_be_deleted_using_the_destroy_method.yml +1127 -0
  40. data/spec/vcr_cassettes/BigML_Evaluation/one_evaluation/must_be_able_to_be_find_using_the_reference.yml +1151 -0
  41. data/spec/vcr_cassettes/BigML_Evaluation/one_evaluation/must_be_able_to_remove_the_evaluation.yml +1203 -0
  42. data/spec/vcr_cassettes/BigML_Evaluation/one_evaluation/must_be_able_to_update_the_name.yml +1374 -0
  43. data/spec/vcr_cassettes/BigML_Evaluation/one_evaluation/must_be_able_to_update_the_name_from_the_instance.yml +1373 -0
  44. data/spec/vcr_cassettes/BigML_Evaluation/one_evaluation/must_have_only_one_item.yml +1103 -0
  45. data/spec/vcr_cassettes/BigML_Evaluation/one_evaluation/must_have_the_same_name.yml +1108 -0
  46. data/spec/vcr_cassettes/BigML_Evaluation/one_evaluation/was_created_successfully.yml +922 -0
  47. data/spec/vcr_cassettes/BigML_Model/one_model/must_be_able_to_be_find_using_the_reference.yml +269 -282
  48. data/spec/vcr_cassettes/BigML_Prediction/one_prediction/must_be_able_to_be_find_using_the_reference.yml +360 -312
  49. data/spec/vcr_cassettes/BigML_Source/one_source/must_be_able_to_be_find_using_the_reference.yml +75 -72
  50. data/spec/vcr_cassettes/BigML_Util_Client/response_handling/debug_mode/raises_on_bad_request.yml +38 -0
  51. data/spec/vcr_cassettes/BigML_Util_Client/response_handling/normal_mode/does_not_raise_on_bad_request.yml +38 -0
  52. metadata +74 -43
@@ -0,0 +1,732 @@
1
+ ---
2
+ http_interactions:
3
+ - request:
4
+ method: get
5
+ uri: https://bigml.io/dev/andromeda/source?username=<USERNAME>&api_key=<API_KEY>
6
+ body:
7
+ encoding: US-ASCII
8
+ string: ''
9
+ headers: {}
10
+ response:
11
+ status:
12
+ code: 200
13
+ message: OK
14
+ headers:
15
+ access-control-allow-methods:
16
+ - POST,GET,PUT,DELETE
17
+ access-control-allow-origin:
18
+ - "*"
19
+ content-type:
20
+ - application/json
21
+ date:
22
+ - Wed, 25 Jun 2014 15:02:13 GMT
23
+ server:
24
+ - nginx/1.0.12
25
+ vary:
26
+ - Accept-Encoding
27
+ content-length:
28
+ - '1002'
29
+ connection:
30
+ - Close
31
+ body:
32
+ encoding: UTF-8
33
+ string: '{"meta": {"limit": 20, "next": null, "offset": 0, "previous": null,
34
+ "total_count": 1}, "objects": [{"category": 0, "code": 200, "content_type":
35
+ "application/octet-stream", "created": "2014-06-25T15:02:09.117000", "credits":
36
+ 0.0, "description": "", "dev": true, "file_name": "iris.csv", "md5": "d1175c032e1042bec7f974c91e4a65ae",
37
+ "name": "iris.csv", "number_of_datasets": 1, "number_of_ensembles": 1, "number_of_models":
38
+ 0, "number_of_predictions": 0, "private": true, "resource": "source/53aae4710af5e815350010c8",
39
+ "shared": false, "size": 4608, "source_parser": {"header": true, "locale":
40
+ "en_US", "missing_tokens": ["", "NaN", "NULL", "N/A", "null", "-", "#REF!",
41
+ "#VALUE!", "?", "#NULL!", "#NUM!", "#DIV/0", "n/a", "#NAME?", "NIL", "nil",
42
+ "na", "#N/A", "NA"], "quote": "\"", "separator": ","}, "status": {"code":
43
+ 5, "elapsed": 781, "message": "The source has been created"}, "subscription":
44
+ false, "tags": [], "term_analysis": {"enabled": true}, "type": 0, "updated":
45
+ "2014-06-25T15:02:12.618000"}]}'
46
+ http_version: '1.1'
47
+ recorded_at: Wed, 25 Jun 2014 15:02:14 GMT
48
+ - request:
49
+ method: delete
50
+ uri: https://bigml.io/dev/andromeda/source/53aae4710af5e815350010c8?username=<USERNAME>&api_key=<API_KEY>
51
+ body:
52
+ encoding: US-ASCII
53
+ string: ''
54
+ headers: {}
55
+ response:
56
+ status:
57
+ code: 204
58
+ message: NO CONTENT
59
+ headers:
60
+ access-control-allow-methods:
61
+ - POST,GET,PUT,DELETE
62
+ access-control-allow-origin:
63
+ - "*"
64
+ content-length:
65
+ - '0'
66
+ content-type:
67
+ - text/html; charset=utf-8
68
+ date:
69
+ - Wed, 25 Jun 2014 15:02:14 GMT
70
+ server:
71
+ - nginx/1.0.12
72
+ connection:
73
+ - Close
74
+ body:
75
+ encoding: US-ASCII
76
+ string: ''
77
+ http_version: '1.1'
78
+ recorded_at: Wed, 25 Jun 2014 15:02:14 GMT
79
+ - request:
80
+ method: get
81
+ uri: https://bigml.io/dev/andromeda/dataset?username=<USERNAME>&api_key=<API_KEY>
82
+ body:
83
+ encoding: US-ASCII
84
+ string: ''
85
+ headers: {}
86
+ response:
87
+ status:
88
+ code: 200
89
+ message: OK
90
+ headers:
91
+ access-control-allow-methods:
92
+ - POST,GET,PUT,DELETE
93
+ access-control-allow-origin:
94
+ - "*"
95
+ content-type:
96
+ - application/json
97
+ date:
98
+ - Wed, 25 Jun 2014 15:02:14 GMT
99
+ server:
100
+ - nginx/1.0.12
101
+ vary:
102
+ - Accept-Encoding
103
+ transfer-encoding:
104
+ - chunked
105
+ connection:
106
+ - Close
107
+ body:
108
+ encoding: UTF-8
109
+ string: '{"meta": {"limit": 20, "next": null, "offset": 0, "previous": null,
110
+ "total_count": 2}, "objects": [{"all_fields": true, "category": 0, "cluster":
111
+ null, "cluster_status": true, "code": 200, "columns": 5, "created": "2014-06-25T15:02:10.895000",
112
+ "credits": 0.00439453125, "description": "", "dev": true, "field_types": {"categorical":
113
+ 1, "datetime": 0, "numeric": 4, "preferred": 5, "text": 0, "total": 5}, "locale":
114
+ "en_US", "missing_numeric_rows": 0, "name": "iris'' dataset", "number_of_batchcentroids":
115
+ 0, "number_of_batchpredictions": 0, "number_of_clusters": 0, "number_of_ensembles":
116
+ 1, "number_of_evaluations": 0, "number_of_models": 0, "number_of_predictions":
117
+ 0, "objective_field": {"column_number": 4, "datatype": "string", "id": "000004",
118
+ "name": "species", "optype": "categorical", "order": 4, "term_analysis": {"enabled":
119
+ true}}, "price": 0.0, "private": true, "ranges": null, "replacements": null,
120
+ "resource": "dataset/53aae472ffa04408550019ff", "rows": 150, "sample_rates":
121
+ null, "seeds": null, "shared": false, "size": 4608, "source": "source/53aae4710af5e815350010c8",
122
+ "source_status": false, "status": {"bytes": 4608, "code": 5, "elapsed": 449,
123
+ "field_errors": [], "message": "The dataset has been created", "row_format_errors":
124
+ [], "serialized_rows": 150}, "subscription": false, "tags": [], "term_limit":
125
+ 32, "updated": "2014-06-25T15:02:12.632000"}, {"all_fields": true, "category":
126
+ 0, "cluster": null, "cluster_status": true, "code": 200, "columns": 5, "created":
127
+ "2014-06-25T15:02:05.759000", "credits": 0.00439453125, "description": "",
128
+ "dev": true, "field_types": {"categorical": 1, "datetime": 0, "numeric": 4,
129
+ "preferred": 5, "text": 0, "total": 5}, "locale": "en_US", "missing_numeric_rows":
130
+ 0, "name": "iris'' dataset", "number_of_batchcentroids": 0, "number_of_batchpredictions":
131
+ 0, "number_of_clusters": 0, "number_of_ensembles": 0, "number_of_evaluations":
132
+ 0, "number_of_models": 0, "number_of_predictions": 0, "objective_field": {"column_number":
133
+ 4, "datatype": "string", "id": "000004", "name": "species", "optype": "categorical",
134
+ "order": 4, "term_analysis": {"enabled": true}}, "price": 0.0, "private":
135
+ true, "ranges": null, "replacements": null, "resource": "dataset/53aae46d0af5e815350010bf",
136
+ "rows": 150, "sample_rates": null, "seeds": null, "shared": false, "size":
137
+ 4608, "source": "source/53aae46cffa04408550019e1", "source_status": false,
138
+ "status": {"bytes": 4608, "code": 5, "elapsed": 370, "field_errors": [], "message":
139
+ "The dataset has been created", "row_format_errors": [], "serialized_rows":
140
+ 150}, "subscription": false, "tags": [], "term_limit": 32, "updated": "2014-06-25T15:02:08.944000"}]}'
141
+ http_version: '1.1'
142
+ recorded_at: Wed, 25 Jun 2014 15:02:14 GMT
143
+ - request:
144
+ method: delete
145
+ uri: https://bigml.io/dev/andromeda/dataset/53aae472ffa04408550019ff?username=<USERNAME>&api_key=<API_KEY>
146
+ body:
147
+ encoding: US-ASCII
148
+ string: ''
149
+ headers: {}
150
+ response:
151
+ status:
152
+ code: 404
153
+ message: NOT FOUND
154
+ headers:
155
+ access-control-allow-methods:
156
+ - POST,GET,PUT,DELETE
157
+ access-control-allow-origin:
158
+ - "*"
159
+ content-type:
160
+ - application/json
161
+ date:
162
+ - Wed, 25 Jun 2014 15:02:14 GMT
163
+ server:
164
+ - nginx/1.0.12
165
+ transfer-encoding:
166
+ - chunked
167
+ connection:
168
+ - Close
169
+ body:
170
+ encoding: UTF-8
171
+ string: '{"code": 404, "status": {"code": -1201, "extra": ["Couldn''t find an
172
+ instance of ''Model'' which matched ''id=53aae4740af5e81537000871''."], "message":
173
+ "Id does not exist"}}'
174
+ http_version: '1.1'
175
+ recorded_at: Wed, 25 Jun 2014 15:02:14 GMT
176
+ - request:
177
+ method: delete
178
+ uri: https://bigml.io/dev/andromeda/dataset/53aae46d0af5e815350010bf?username=<USERNAME>&api_key=<API_KEY>
179
+ body:
180
+ encoding: US-ASCII
181
+ string: ''
182
+ headers: {}
183
+ response:
184
+ status:
185
+ code: 204
186
+ message: NO CONTENT
187
+ headers:
188
+ access-control-allow-methods:
189
+ - POST,GET,PUT,DELETE
190
+ access-control-allow-origin:
191
+ - "*"
192
+ content-length:
193
+ - '0'
194
+ content-type:
195
+ - text/html; charset=utf-8
196
+ date:
197
+ - Wed, 25 Jun 2014 15:02:14 GMT
198
+ server:
199
+ - nginx/1.0.12
200
+ connection:
201
+ - Close
202
+ body:
203
+ encoding: US-ASCII
204
+ string: ''
205
+ http_version: '1.1'
206
+ recorded_at: Wed, 25 Jun 2014 15:02:15 GMT
207
+ - request:
208
+ method: get
209
+ uri: https://bigml.io/dev/andromeda/ensemble?username=<USERNAME>&api_key=<API_KEY>
210
+ body:
211
+ encoding: US-ASCII
212
+ string: ''
213
+ headers: {}
214
+ response:
215
+ status:
216
+ code: 200
217
+ message: OK
218
+ headers:
219
+ access-control-allow-methods:
220
+ - POST,GET,PUT,DELETE
221
+ access-control-allow-origin:
222
+ - "*"
223
+ content-type:
224
+ - application/json
225
+ date:
226
+ - Wed, 25 Jun 2014 15:02:15 GMT
227
+ server:
228
+ - nginx/1.0.12
229
+ vary:
230
+ - Accept-Encoding
231
+ transfer-encoding:
232
+ - chunked
233
+ connection:
234
+ - Close
235
+ body:
236
+ encoding: UTF-8
237
+ string: '{"meta": {"limit": 20, "next": null, "offset": 0, "previous": null,
238
+ "total_count": 1}, "objects": [{"balance_objective": false, "category": 0,
239
+ "code": 200, "columns": 5, "created": "2014-06-25T15:02:12.607000", "credits":
240
+ 0.03515625, "credits_per_prediction": 0.0, "dataset": "dataset/53aae472ffa04408550019ff",
241
+ "dataset_field_types": {"categorical": 1, "datetime": 0, "numeric": 4, "preferred":
242
+ 5, "text": 0, "total": 5}, "dataset_status": true, "datasets": [], "description":
243
+ "", "dev": true, "error_models": 0, "fields_maps": null, "finished_models":
244
+ 0, "locale": "en-US", "max_columns": 5, "max_rows": 150, "name": "iris'' dataset
245
+ ensemble", "node_threshold": 512, "number_of_batchpredictions": 0, "number_of_evaluations":
246
+ 0, "number_of_models": 2, "number_of_predictions": 0, "number_of_public_predictions":
247
+ 0, "objective_field": "000004", "ordering": 0, "out_of_bag": false, "price":
248
+ 0.0, "private": true, "randomize": false, "range": [1, 150], "replacement":
249
+ true, "resource": "ensemble/53aae4740af5e81537000871", "rows": 150, "sample_rate":
250
+ 1.0, "shared": false, "size": 9216, "source": "source/53aae4710af5e815350010c8",
251
+ "source_status": false, "stat_pruning": false, "status": {"code": 3, "elapsed":
252
+ 39.0, "message": "The ensemble creation has been started", "progress": 0.0},
253
+ "subscription": false, "tags": ["species"], "tlp": 1, "updated": "2014-06-25T15:02:12.646000"}]}'
254
+ http_version: '1.1'
255
+ recorded_at: Wed, 25 Jun 2014 15:02:15 GMT
256
+ - request:
257
+ method: delete
258
+ uri: https://bigml.io/dev/andromeda/ensemble/53aae4740af5e81537000871?username=<USERNAME>&api_key=<API_KEY>
259
+ body:
260
+ encoding: US-ASCII
261
+ string: ''
262
+ headers: {}
263
+ response:
264
+ status:
265
+ code: 204
266
+ message: NO CONTENT
267
+ headers:
268
+ access-control-allow-methods:
269
+ - POST,GET,PUT,DELETE
270
+ access-control-allow-origin:
271
+ - "*"
272
+ content-length:
273
+ - '0'
274
+ content-type:
275
+ - text/html; charset=utf-8
276
+ date:
277
+ - Wed, 25 Jun 2014 15:02:15 GMT
278
+ server:
279
+ - nginx/1.0.12
280
+ connection:
281
+ - Close
282
+ body:
283
+ encoding: US-ASCII
284
+ string: ''
285
+ http_version: '1.1'
286
+ recorded_at: Wed, 25 Jun 2014 15:02:15 GMT
287
+ - request:
288
+ method: post
289
+ uri: https://bigml.io/dev/andromeda/source
290
+ body:
291
+ encoding: US-ASCII
292
+ string: ''
293
+ headers:
294
+ content-type:
295
+ - multipart/form-data; boundary=-----------RubyMultipartPost
296
+ content-length:
297
+ - '5150'
298
+ response:
299
+ status:
300
+ code: 201
301
+ message: CREATED
302
+ headers:
303
+ access-control-allow-methods:
304
+ - POST,GET,PUT,DELETE
305
+ access-control-allow-origin:
306
+ - "*"
307
+ content-type:
308
+ - application/json
309
+ date:
310
+ - Wed, 25 Jun 2014 15:02:15 GMT
311
+ location:
312
+ - http://bigml.io/andromeda/source/53aae477ffa0440852000936
313
+ server:
314
+ - nginx/1.0.12
315
+ transfer-encoding:
316
+ - chunked
317
+ connection:
318
+ - Close
319
+ body:
320
+ encoding: UTF-8
321
+ string: '{"category": 0, "code": 201, "content_type": "application/octet-stream",
322
+ "created": "2014-06-25T15:02:15.629919", "credits": 0.0, "description": "",
323
+ "dev": true, "fields_meta": {"count": 0, "limit": 1000, "offset": 0, "total":
324
+ 0}, "file_name": "iris.csv", "md5": "d1175c032e1042bec7f974c91e4a65ae", "name":
325
+ "iris.csv", "number_of_datasets": 0, "number_of_ensembles": 0, "number_of_models":
326
+ 0, "number_of_predictions": 0, "private": true, "resource": "source/53aae477ffa0440852000936",
327
+ "shared": false, "size": 4608, "source_parser": {}, "status": {"code": 1,
328
+ "message": "The request has been queued and will be processed soon"}, "subscription":
329
+ false, "tags": [], "term_analysis": {}, "type": 0, "updated": "2014-06-25T15:02:15.629969"}'
330
+ http_version: '1.1'
331
+ recorded_at: Wed, 25 Jun 2014 15:02:15 GMT
332
+ - request:
333
+ method: get
334
+ uri: https://bigml.io/dev/andromeda/source/53aae477ffa0440852000936?username=<USERNAME>&api_key=<API_KEY>
335
+ body:
336
+ encoding: US-ASCII
337
+ string: ''
338
+ headers: {}
339
+ response:
340
+ status:
341
+ code: 200
342
+ message: OK
343
+ headers:
344
+ access-control-allow-methods:
345
+ - POST,GET,PUT,DELETE
346
+ access-control-allow-origin:
347
+ - "*"
348
+ content-type:
349
+ - application/json
350
+ date:
351
+ - Wed, 25 Jun 2014 15:02:15 GMT
352
+ server:
353
+ - nginx/1.0.12
354
+ vary:
355
+ - Accept-Encoding
356
+ content-length:
357
+ - '761'
358
+ connection:
359
+ - Close
360
+ body:
361
+ encoding: UTF-8
362
+ string: '{"category": 0, "code": 200, "content_type": "application/octet-stream",
363
+ "created": "2014-06-25T15:02:15.629000", "credits": 0.0, "description": "",
364
+ "dev": true, "fields_meta": {"count": 0, "limit": 1000, "offset": 0, "query_total":
365
+ 0, "total": 0}, "file_name": "iris.csv", "md5": "d1175c032e1042bec7f974c91e4a65ae",
366
+ "name": "iris.csv", "number_of_datasets": 0, "number_of_ensembles": 0, "number_of_models":
367
+ 0, "number_of_predictions": 0, "private": true, "resource": "source/53aae477ffa0440852000936",
368
+ "shared": false, "size": 4608, "source_parser": {"missing_tokens": []}, "status":
369
+ {"code": 3, "elapsed": 0, "message": "The source is being created"}, "subscription":
370
+ false, "tags": [], "term_analysis": {}, "type": 0, "updated": "2014-06-25T15:02:15.832000"}'
371
+ http_version: '1.1'
372
+ recorded_at: Wed, 25 Jun 2014 15:02:16 GMT
373
+ - request:
374
+ method: get
375
+ uri: https://bigml.io/dev/andromeda/source/53aae477ffa0440852000936?username=<USERNAME>&api_key=<API_KEY>
376
+ body:
377
+ encoding: US-ASCII
378
+ string: ''
379
+ headers: {}
380
+ response:
381
+ status:
382
+ code: 200
383
+ message: OK
384
+ headers:
385
+ access-control-allow-methods:
386
+ - POST,GET,PUT,DELETE
387
+ access-control-allow-origin:
388
+ - "*"
389
+ content-type:
390
+ - application/json
391
+ date:
392
+ - Wed, 25 Jun 2014 15:02:17 GMT
393
+ server:
394
+ - nginx/1.0.12
395
+ vary:
396
+ - Accept-Encoding
397
+ content-length:
398
+ - '1478'
399
+ connection:
400
+ - Close
401
+ body:
402
+ encoding: UTF-8
403
+ string: '{"category": 0, "code": 200, "content_type": "application/octet-stream",
404
+ "created": "2014-06-25T15:02:15.629000", "credits": 0.0, "description": "",
405
+ "dev": true, "fields": {"000000": {"column_number": 0, "name": "sepal length",
406
+ "optype": "numeric", "order": 0}, "000001": {"column_number": 1, "name": "sepal
407
+ width", "optype": "numeric", "order": 1}, "000002": {"column_number": 2, "name":
408
+ "petal length", "optype": "numeric", "order": 2}, "000003": {"column_number":
409
+ 3, "name": "petal width", "optype": "numeric", "order": 3}, "000004": {"column_number":
410
+ 4, "name": "species", "optype": "categorical", "order": 4, "term_analysis":
411
+ {"enabled": true}}}, "fields_meta": {"count": 5, "limit": 1000, "offset":
412
+ 0, "query_total": 5, "total": 5}, "file_name": "iris.csv", "md5": "d1175c032e1042bec7f974c91e4a65ae",
413
+ "name": "iris.csv", "number_of_datasets": 0, "number_of_ensembles": 0, "number_of_models":
414
+ 0, "number_of_predictions": 0, "private": true, "resource": "source/53aae477ffa0440852000936",
415
+ "shared": false, "size": 4608, "source_parser": {"header": true, "locale":
416
+ "en_US", "missing_tokens": ["", "NaN", "NULL", "N/A", "null", "-", "#REF!",
417
+ "#VALUE!", "?", "#NULL!", "#NUM!", "#DIV/0", "n/a", "#NAME?", "NIL", "nil",
418
+ "na", "#N/A", "NA"], "quote": "\"", "separator": ","}, "status": {"code":
419
+ 5, "elapsed": 355, "message": "The source has been created"}, "subscription":
420
+ false, "tags": [], "term_analysis": {"enabled": true}, "type": 0, "updated":
421
+ "2014-06-25T15:02:16.182000"}'
422
+ http_version: '1.1'
423
+ recorded_at: Wed, 25 Jun 2014 15:02:17 GMT
424
+ - request:
425
+ method: post
426
+ uri: https://bigml.io/dev/andromeda/dataset?username=<USERNAME>&api_key=<API_KEY>
427
+ body:
428
+ encoding: UTF-8
429
+ string: '{"source":"source/53aae477ffa0440852000936"}'
430
+ headers:
431
+ content-type:
432
+ - application/json
433
+ response:
434
+ status:
435
+ code: 201
436
+ message: CREATED
437
+ headers:
438
+ access-control-allow-methods:
439
+ - POST,GET,PUT,DELETE
440
+ access-control-allow-origin:
441
+ - "*"
442
+ content-type:
443
+ - application/json
444
+ date:
445
+ - Wed, 25 Jun 2014 15:02:17 GMT
446
+ location:
447
+ - http://bigml.io/andromeda/dataset/53aae479ffa0440855001a12
448
+ server:
449
+ - nginx/1.0.12
450
+ content-length:
451
+ - '1294'
452
+ connection:
453
+ - Close
454
+ body:
455
+ encoding: UTF-8
456
+ string: '{"all_fields": true, "category": 0, "cluster": null, "cluster_status":
457
+ true, "code": 201, "columns": 0, "created": "2014-06-25T15:02:17.233172",
458
+ "credits": 0.00439453125, "description": "", "dev": true, "download": {"code":
459
+ 0, "excluded_input_fields": [], "header": true, "input_fields": [], "message":
460
+ "", "preview": [], "separator": ","}, "excluded_fields": [], "field_types":
461
+ {"categorical": 0, "datetime": 0, "numeric": 0, "preferred": 0, "text": 0,
462
+ "total": 0}, "fields_meta": {"count": 0, "limit": 1000, "offset": 0, "total":
463
+ 0}, "locale": "en-US", "missing_numeric_rows": 0, "missing_tokens": [], "name":
464
+ "iris'' dataset", "number_of_batchcentroids": 0, "number_of_batchpredictions":
465
+ 0, "number_of_clusters": 0, "number_of_ensembles": 0, "number_of_evaluations":
466
+ 0, "number_of_models": 0, "number_of_predictions": 0, "price": 0.0, "private":
467
+ true, "ranges": null, "replacements": null, "resource": "dataset/53aae479ffa0440855001a12",
468
+ "rows": 0, "sample_rates": null, "seeds": null, "shared": false, "size": 4608,
469
+ "source": "source/53aae477ffa0440852000936", "source_status": true, "status":
470
+ {"code": 1, "message": "The dataset is being processed and will be created
471
+ soon"}, "subscription": false, "tags": [], "term_limit": 32, "updated": "2014-06-25T15:02:17.233208",
472
+ "user_metadata": {}}'
473
+ http_version: '1.1'
474
+ recorded_at: Wed, 25 Jun 2014 15:02:17 GMT
475
+ - request:
476
+ method: get
477
+ uri: https://bigml.io/dev/andromeda/dataset/53aae479ffa0440855001a12?username=<USERNAME>&api_key=<API_KEY>
478
+ body:
479
+ encoding: US-ASCII
480
+ string: ''
481
+ headers: {}
482
+ response:
483
+ status:
484
+ code: 200
485
+ message: OK
486
+ headers:
487
+ access-control-allow-methods:
488
+ - POST,GET,PUT,DELETE
489
+ access-control-allow-origin:
490
+ - "*"
491
+ content-type:
492
+ - application/json
493
+ date:
494
+ - Wed, 25 Jun 2014 15:02:17 GMT
495
+ server:
496
+ - nginx/1.0.12
497
+ vary:
498
+ - Accept-Encoding
499
+ transfer-encoding:
500
+ - chunked
501
+ connection:
502
+ - Close
503
+ body:
504
+ encoding: UTF-8
505
+ string: '{"all_fields": true, "category": 0, "cluster": null, "cluster_status":
506
+ true, "code": 200, "columns": 5, "created": "2014-06-25T15:02:17.233000",
507
+ "credits": 0.00439453125, "description": "", "dev": true, "download": {"code":
508
+ 0, "excluded_input_fields": [], "header": true, "input_fields": [], "message":
509
+ "", "preview": [], "separator": ","}, "excluded_fields": [], "field_types":
510
+ {"categorical": 0, "datetime": 0, "numeric": 0, "preferred": 0, "text": 0,
511
+ "total": 5}, "fields": {"000000": {"column_number": 0, "name": "sepal length",
512
+ "optype": "numeric", "order": 0}, "000001": {"column_number": 1, "name": "sepal
513
+ width", "optype": "numeric", "order": 1}, "000002": {"column_number": 2, "name":
514
+ "petal length", "optype": "numeric", "order": 2}, "000003": {"column_number":
515
+ 3, "name": "petal width", "optype": "numeric", "order": 3}, "000004": {"column_number":
516
+ 4, "name": "species", "optype": "categorical", "order": 4, "term_analysis":
517
+ {"enabled": true}}}, "fields_meta": {"count": 5, "limit": 1000, "offset":
518
+ 0, "query_total": 5, "total": 5}, "locale": "en_US", "missing_numeric_rows":
519
+ 0, "missing_tokens": ["", "NaN", "NULL", "N/A", "null", "-", "#REF!", "#VALUE!",
520
+ "?", "#NULL!", "#NUM!", "#DIV/0", "n/a", "#NAME?", "NIL", "nil", "na", "#N/A",
521
+ "NA"], "name": "iris'' dataset", "number_of_batchcentroids": 0, "number_of_batchpredictions":
522
+ 0, "number_of_clusters": 0, "number_of_ensembles": 0, "number_of_evaluations":
523
+ 0, "number_of_models": 0, "number_of_predictions": 0, "price": 0.0, "private":
524
+ true, "ranges": null, "replacements": null, "resource": "dataset/53aae479ffa0440855001a12",
525
+ "rows": 0, "sample_rates": null, "seeds": null, "shared": false, "size": 4608,
526
+ "source": "source/53aae477ffa0440852000936", "source_status": true, "status":
527
+ {"bytes": 0, "code": 2, "elapsed": 0, "field_errors": [], "message": "The
528
+ dataset creation has been started. No partial summary yet", "row_format_errors":
529
+ [], "serialized_rows": 0}, "subscription": false, "tags": [], "term_limit":
530
+ 32, "updated": "2014-06-25T15:02:17.464000", "user_metadata": {}}'
531
+ http_version: '1.1'
532
+ recorded_at: Wed, 25 Jun 2014 15:02:17 GMT
533
+ - request:
534
+ method: get
535
+ uri: https://bigml.io/dev/andromeda/dataset/53aae479ffa0440855001a12?username=<USERNAME>&api_key=<API_KEY>
536
+ body:
537
+ encoding: US-ASCII
538
+ string: ''
539
+ headers: {}
540
+ response:
541
+ status:
542
+ code: 200
543
+ message: OK
544
+ headers:
545
+ access-control-allow-methods:
546
+ - POST,GET,PUT,DELETE
547
+ access-control-allow-origin:
548
+ - "*"
549
+ content-type:
550
+ - application/json
551
+ date:
552
+ - Wed, 25 Jun 2014 15:02:18 GMT
553
+ server:
554
+ - nginx/1.0.12
555
+ vary:
556
+ - Accept-Encoding
557
+ transfer-encoding:
558
+ - chunked
559
+ connection:
560
+ - Close
561
+ body:
562
+ encoding: UTF-8
563
+ string: '{"all_fields": true, "category": 0, "cluster": null, "cluster_status":
564
+ true, "code": 200, "columns": 5, "created": "2014-06-25T15:02:17.233000",
565
+ "credits": 0.00439453125, "description": "", "dev": true, "download": {"code":
566
+ 0, "excluded_input_fields": [], "header": true, "input_fields": [], "message":
567
+ "", "preview": [], "separator": ","}, "excluded_fields": [], "field_types":
568
+ {"categorical": 1, "datetime": 0, "numeric": 4, "preferred": 5, "text": 0,
569
+ "total": 5}, "fields": {"000000": {"column_number": 0, "datatype": "double",
570
+ "name": "sepal length", "optype": "numeric", "order": 0, "preferred": true,
571
+ "summary": {"bins": [[4.3, 1], [4.425, 4], [4.6, 4], [4.77143, 7], [4.9625,
572
+ 16], [5.1, 9], [5.2, 4], [5.3, 1], [5.4, 6], [5.5, 7], [5.6, 6], [5.7, 8],
573
+ [5.8, 7], [5.9, 3], [6, 6], [6.1, 6], [6.2, 4], [6.3, 9], [6.4, 7], [6.5,
574
+ 5], [6.6, 2], [6.7, 8], [6.8, 3], [6.9, 4], [7, 1], [7.1, 1], [7.2, 3], [7.3,
575
+ 1], [7.4, 1], [7.6, 1], [7.7, 4], [7.9, 1]], "maximum": 7.9, "mean": 5.84333,
576
+ "median": 5.77889, "minimum": 4.3, "missing_count": 0, "population": 150,
577
+ "splits": [4.51526, 4.67252, 4.81113, 4.89582, 4.96139, 5.01131, 5.05992,
578
+ 5.11148, 5.18177, 5.35681, 5.44129, 5.5108, 5.58255, 5.65532, 5.71658, 5.77889,
579
+ 5.85381, 5.97078, 6.05104, 6.13074, 6.23023, 6.29578, 6.35078, 6.41459, 6.49383,
580
+ 6.63013, 6.70719, 6.79218, 6.92597, 7.20423, 7.64746], "standard_deviation":
581
+ 0.82807, "sum": 876.5, "sum_squares": 5223.85, "variance": 0.68569}}, "000001":
582
+ {"column_number": 1, "datatype": "double", "name": "sepal width", "optype":
583
+ "numeric", "order": 1, "preferred": true, "summary": {"counts": [[2, 1], [2.2,
584
+ 3], [2.3, 4], [2.4, 3], [2.5, 8], [2.6, 5], [2.7, 9], [2.8, 14], [2.9, 10],
585
+ [3, 26], [3.1, 11], [3.2, 13], [3.3, 6], [3.4, 12], [3.5, 6], [3.6, 4], [3.7,
586
+ 3], [3.8, 6], [3.9, 2], [4, 1], [4.1, 1], [4.2, 1], [4.4, 1]], "maximum":
587
+ 4.4, "mean": 3.05733, "median": 3.02044, "minimum": 2, "missing_count": 0,
588
+ "population": 150, "standard_deviation": 0.43587, "sum": 458.6, "sum_squares":
589
+ 1430.4, "variance": 0.18998}}, "000002": {"column_number": 2, "datatype":
590
+ "double", "name": "petal length", "optype": "numeric", "order": 2, "preferred":
591
+ true, "summary": {"bins": [[1, 1], [1.16667, 3], [1.3, 7], [1.4, 13], [1.5,
592
+ 13], [1.6, 7], [1.7, 4], [1.9, 2], [3, 1], [3.3, 2], [3.5, 2], [3.6, 1], [3.75,
593
+ 2], [3.9, 3], [4.0375, 8], [4.23333, 6], [4.46667, 12], [4.6, 3], [4.74444,
594
+ 9], [4.94444, 9], [5.1, 8], [5.25, 4], [5.46, 5], [5.6, 6], [5.75, 6], [5.95,
595
+ 4], [6.1, 3], [6.3, 1], [6.4, 1], [6.6, 1], [6.7, 2], [6.9, 1]], "maximum":
596
+ 6.9, "mean": 3.758, "median": 4.34142, "minimum": 1, "missing_count": 0, "population":
597
+ 150, "splits": [1.25138, 1.32426, 1.37171, 1.40962, 1.44567, 1.48173, 1.51859,
598
+ 1.56301, 1.6255, 1.74645, 3.23033, 3.675, 3.94203, 4.0469, 4.18243, 4.34142,
599
+ 4.45309, 4.51823, 4.61771, 4.72566, 4.83445, 4.93363, 5.03807, 5.1064, 5.20938,
600
+ 5.43979, 5.5744, 5.6646, 5.81496, 6.02913, 6.38125], "standard_deviation":
601
+ 1.7653, "sum": 563.7, "sum_squares": 2582.71, "variance": 3.11628}}, "000003":
602
+ {"column_number": 3, "datatype": "double", "name": "petal width", "optype":
603
+ "numeric", "order": 3, "preferred": true, "summary": {"counts": [[0.1, 5],
604
+ [0.2, 29], [0.3, 7], [0.4, 7], [0.5, 1], [0.6, 1], [1, 7], [1.1, 3], [1.2,
605
+ 5], [1.3, 13], [1.4, 8], [1.5, 12], [1.6, 4], [1.7, 2], [1.8, 12], [1.9, 5],
606
+ [2, 6], [2.1, 6], [2.2, 3], [2.3, 8], [2.4, 3], [2.5, 3]], "maximum": 2.5,
607
+ "mean": 1.19933, "median": 1.32848, "minimum": 0.1, "missing_count": 0, "population":
608
+ 150, "standard_deviation": 0.76224, "sum": 179.9, "sum_squares": 302.33, "variance":
609
+ 0.58101}}, "000004": {"column_number": 4, "datatype": "string", "name": "species",
610
+ "optype": "categorical", "order": 4, "preferred": true, "summary": {"categories":
611
+ [["Iris-setosa", 50], ["Iris-versicolor", 50], ["Iris-virginica", 50]], "missing_count":
612
+ 0}, "term_analysis": {"enabled": true}}}, "fields_meta": {"count": 5, "limit":
613
+ 1000, "offset": 0, "query_total": 5, "total": 5}, "locale": "en_US", "missing_numeric_rows":
614
+ 0, "missing_tokens": ["", "NaN", "NULL", "N/A", "null", "-", "#REF!", "#VALUE!",
615
+ "?", "#NULL!", "#NUM!", "#DIV/0", "n/a", "#NAME?", "NIL", "nil", "na", "#N/A",
616
+ "NA"], "name": "iris'' dataset", "number_of_batchcentroids": 0, "number_of_batchpredictions":
617
+ 0, "number_of_clusters": 0, "number_of_ensembles": 0, "number_of_evaluations":
618
+ 0, "number_of_models": 0, "number_of_predictions": 0, "objective_field": {"column_number":
619
+ 4, "datatype": "string", "id": "000004", "name": "species", "optype": "categorical",
620
+ "order": 4, "term_analysis": {"enabled": true}}, "price": 0.0, "private":
621
+ true, "ranges": null, "replacements": null, "resource": "dataset/53aae479ffa0440855001a12",
622
+ "rows": 150, "sample_rates": null, "seeds": null, "shared": false, "size":
623
+ 4608, "source": "source/53aae477ffa0440852000936", "source_status": true,
624
+ "status": {"bytes": 4608, "code": 5, "elapsed": 480, "field_errors": [], "message":
625
+ "The dataset has been created", "row_format_errors": [], "serialized_rows":
626
+ 150}, "subscription": false, "tags": [], "term_limit": 32, "updated": "2014-06-25T15:02:17.952000",
627
+ "user_metadata": {}}'
628
+ http_version: '1.1'
629
+ recorded_at: Wed, 25 Jun 2014 15:02:18 GMT
630
+ - request:
631
+ method: post
632
+ uri: https://bigml.io/dev/andromeda/ensemble?username=<USERNAME>&api_key=<API_KEY>
633
+ body:
634
+ encoding: UTF-8
635
+ string: '{"dataset":"dataset/53aae479ffa0440855001a12","number_of_models":2}'
636
+ headers:
637
+ content-type:
638
+ - application/json
639
+ response:
640
+ status:
641
+ code: 201
642
+ message: CREATED
643
+ headers:
644
+ access-control-allow-methods:
645
+ - POST,GET,PUT,DELETE
646
+ access-control-allow-origin:
647
+ - "*"
648
+ content-type:
649
+ - application/json
650
+ date:
651
+ - Wed, 25 Jun 2014 15:02:19 GMT
652
+ location:
653
+ - http://bigml.io/andromeda/ensemble/53aae47bffa044085200093d
654
+ server:
655
+ - nginx/1.0.12
656
+ transfer-encoding:
657
+ - chunked
658
+ connection:
659
+ - Close
660
+ body:
661
+ encoding: UTF-8
662
+ string: '{"balance_objective": false, "category": 0, "code": 201, "columns":
663
+ 5, "created": "2014-06-25T15:02:19.010775", "credits": 0.03515625, "credits_per_prediction":
664
+ 0.0, "dataset": "dataset/53aae479ffa0440855001a12", "dataset_field_types":
665
+ {"categorical": 1, "datetime": 0, "numeric": 4, "preferred": 5, "text": 0,
666
+ "total": 5}, "dataset_status": true, "datasets": [], "description": "", "dev":
667
+ true, "distributions": [{"importance": [], "predictions": {}, "training":
668
+ {}}, {"importance": [], "predictions": {}, "training": {}}], "error_models":
669
+ 0, "fields_maps": null, "finished_models": 0, "locale": "en-US", "max_columns":
670
+ 5, "max_rows": 150, "models": ["model/53aae47bffa0440852000940"], "name":
671
+ "iris'' dataset ensemble", "node_threshold": 512, "number_of_batchpredictions":
672
+ 0, "number_of_evaluations": 0, "number_of_models": 2, "number_of_predictions":
673
+ 0, "number_of_public_predictions": 0, "objective_field": "000004", "ordering":
674
+ 0, "out_of_bag": false, "price": 0.0, "private": true, "randomize": false,
675
+ "range": [1, 150], "replacement": true, "resource": "ensemble/53aae47bffa044085200093d",
676
+ "rows": 150, "sample_rate": 1.0, "shared": false, "size": 9216, "source":
677
+ "source/53aae477ffa0440852000936", "source_status": true, "stat_pruning":
678
+ false, "status": {"code": 3, "elapsed": 0.036000000000000004, "message": "The
679
+ ensemble creation has been started", "progress": 0.0}, "subscription": false,
680
+ "tags": ["species"], "tlp": 1, "updated": "2014-06-25T15:02:19.010811"}'
681
+ http_version: '1.1'
682
+ recorded_at: Wed, 25 Jun 2014 15:02:19 GMT
683
+ - request:
684
+ method: get
685
+ uri: https://bigml.io/dev/andromeda/ensemble?username=<USERNAME>&api_key=<API_KEY>
686
+ body:
687
+ encoding: US-ASCII
688
+ string: ''
689
+ headers: {}
690
+ response:
691
+ status:
692
+ code: 200
693
+ message: OK
694
+ headers:
695
+ access-control-allow-methods:
696
+ - POST,GET,PUT,DELETE
697
+ access-control-allow-origin:
698
+ - "*"
699
+ content-type:
700
+ - application/json
701
+ date:
702
+ - Wed, 25 Jun 2014 15:02:19 GMT
703
+ server:
704
+ - nginx/1.0.12
705
+ vary:
706
+ - Accept-Encoding
707
+ transfer-encoding:
708
+ - chunked
709
+ connection:
710
+ - Close
711
+ body:
712
+ encoding: UTF-8
713
+ string: '{"meta": {"limit": 20, "next": null, "offset": 0, "previous": null,
714
+ "total_count": 1}, "objects": [{"balance_objective": false, "category": 0,
715
+ "code": 200, "columns": 5, "created": "2014-06-25T15:02:19.010000", "credits":
716
+ 0.03515625, "credits_per_prediction": 0.0, "dataset": "dataset/53aae479ffa0440855001a12",
717
+ "dataset_field_types": {"categorical": 1, "datetime": 0, "numeric": 4, "preferred":
718
+ 5, "text": 0, "total": 5}, "dataset_status": true, "datasets": [], "description":
719
+ "", "dev": true, "error_models": 0, "fields_maps": null, "finished_models":
720
+ 0, "locale": "en-US", "max_columns": 5, "max_rows": 150, "name": "iris'' dataset
721
+ ensemble", "node_threshold": 512, "number_of_batchpredictions": 0, "number_of_evaluations":
722
+ 0, "number_of_models": 2, "number_of_predictions": 0, "number_of_public_predictions":
723
+ 0, "objective_field": "000004", "ordering": 0, "out_of_bag": false, "price":
724
+ 0.0, "private": true, "randomize": false, "range": [1, 150], "replacement":
725
+ true, "resource": "ensemble/53aae47bffa044085200093d", "rows": 150, "sample_rate":
726
+ 1.0, "shared": false, "size": 9216, "source": "source/53aae477ffa0440852000936",
727
+ "source_status": true, "stat_pruning": false, "status": {"code": 3, "elapsed":
728
+ 48.0, "message": "The ensemble creation has been started", "progress": 0.0},
729
+ "subscription": false, "tags": ["species"], "tlp": 1, "updated": "2014-06-25T15:02:19.058000"}]}'
730
+ http_version: '1.1'
731
+ recorded_at: Wed, 25 Jun 2014 15:02:19 GMT
732
+ recorded_with: VCR 2.9.2