nexosis_api 2.0.1 → 2.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (43) hide show
  1. checksums.yaml +4 -4
  2. data/lib/nexosis_api.rb +11 -11
  3. data/lib/nexosis_api/algorithm.rb +22 -22
  4. data/lib/nexosis_api/algorithm_contestant.rb +43 -43
  5. data/lib/nexosis_api/anomaly_scores.rb +19 -0
  6. data/lib/nexosis_api/calendar_jointarget.rb +35 -35
  7. data/lib/nexosis_api/classifier_result.rb +25 -25
  8. data/lib/nexosis_api/classifier_scores.rb +26 -0
  9. data/lib/nexosis_api/client.rb +120 -118
  10. data/lib/nexosis_api/client/contest.rb +66 -66
  11. data/lib/nexosis_api/client/datasets.rb +155 -155
  12. data/lib/nexosis_api/client/imports.rb +141 -141
  13. data/lib/nexosis_api/client/models.rb +121 -108
  14. data/lib/nexosis_api/client/sessions.rb +308 -213
  15. data/lib/nexosis_api/client/views.rb +105 -105
  16. data/lib/nexosis_api/column.rb +50 -50
  17. data/lib/nexosis_api/column_options.rb +38 -38
  18. data/lib/nexosis_api/column_role.rb +19 -19
  19. data/lib/nexosis_api/column_type.rb +23 -23
  20. data/lib/nexosis_api/dataset_data.rb +22 -22
  21. data/lib/nexosis_api/dataset_jointarget.rb +18 -18
  22. data/lib/nexosis_api/dataset_model.rb +26 -26
  23. data/lib/nexosis_api/dataset_summary.rb +33 -33
  24. data/lib/nexosis_api/http_exception.rb +28 -28
  25. data/lib/nexosis_api/impact_metric.rb +22 -22
  26. data/lib/nexosis_api/imports_response.rb +74 -74
  27. data/lib/nexosis_api/join.rb +63 -63
  28. data/lib/nexosis_api/link.rb +18 -18
  29. data/lib/nexosis_api/message.rb +19 -19
  30. data/lib/nexosis_api/metric.rb +16 -16
  31. data/lib/nexosis_api/model_summary.rb +66 -66
  32. data/lib/nexosis_api/paged_array.rb +35 -35
  33. data/lib/nexosis_api/predict_response.rb +35 -35
  34. data/lib/nexosis_api/session.rb +122 -118
  35. data/lib/nexosis_api/session_contest.rb +30 -30
  36. data/lib/nexosis_api/session_response.rb +29 -33
  37. data/lib/nexosis_api/session_result.rb +27 -27
  38. data/lib/nexosis_api/session_selection_metrics.rb +20 -20
  39. data/lib/nexosis_api/time_interval.rb +15 -15
  40. data/lib/nexosis_api/view_data.rb +14 -14
  41. data/lib/nexosis_api/view_definition.rb +64 -64
  42. data/nexosisapi.gemspec +20 -20
  43. metadata +5 -3
@@ -1,108 +1,121 @@
1
- module NexosisApi
2
- class Client
3
- # class to operate on model endpoint in Nexosis API
4
- # @since 1.3.0
5
- module Models
6
- # List all models created in your company, optionally filtered by query parameters
7
- #
8
- # @param datasource_name [String] optionally limit to those
9
- # models created for this data source name.
10
- # @param query_options [Hash] limit by dates: begin_date and/or end_date
11
- # @note - query options dates can either be ISO 8601 compliant strings or Date objects
12
- # @return [NexosisApi::PagedArray of NexosisApi::ModelSummary] - all models available within the query parameters
13
- def list_models(datasource_name = nil, page = 0, page_size = 50, query_options = {})
14
- model_url = '/models'
15
- query = {
16
- page: page,
17
- pageSize: page_size
18
- }
19
- unless query_options.empty?
20
- query.store('createdBeforeDate', query_options['end_date']) unless query_options['end_date'].nil?
21
- query.store('createdAfterDate', query_options['begin_date']) unless query_options['begin_date'].nil?
22
- end
23
- query.store(dataSourceName: datasource_name) unless datasource_name.nil?
24
- response = self.class.get(model_url, headers: @headers, query: query)
25
- raise HttpException.new("There was a problem listing models: #{response.code}.",
26
- "listing models with data source name #{datasource_name}",
27
- response) unless response.success?
28
- NexosisApi::PagedArray.new(response.parsed_response,
29
- response.parsed_response['items']
30
- .map { |item| NexosisApi::ModelSummary.new(item) })
31
- end
32
-
33
- # Get the details of the particular model requested by id
34
- #
35
- # @param model_id [String] The unique identifier for the model returned by a create-model session
36
- # @return [NexosisApi::ModelSummary]
37
- def get_model(model_id)
38
- raise ArgumentError, 'Retrieving a model requires that model_id be specified and it is currently null.' if model_id.nil?
39
- model_url = "/models/#{model_id}"
40
- response = self.class.get(model_url, @options)
41
- if (response.success?)
42
- NexosisApi::ModelSummary.new(response.parsed_response)
43
- else
44
- raise HttpException.new("There was a problem getting your model: #{response.code}.", "Could not get model #{model_id}", response)
45
- end
46
- end
47
-
48
- # Run a feature set through the model to get predictions
49
- #
50
- # @param model_id [String] unique identifier of model to use
51
- # @param feature_data [Array of Hash] feature columns with values to predict from
52
- # @return [NexosisApi::PredictResponse]
53
- # @note The feature data shape should match that of the dataset used to create the model.
54
- # Any missing features in this request will reduce the quality of the predictions.
55
- def predict(model_id, feature_data)
56
- raise ArgumentError, 'Running predictions requires that model_id be specified and it is currently empty.' if model_id.empty?
57
- raise ArgumentError, 'Running predictions requires that feature_data be specified and it is currently empty.' if feature_data.empty?
58
- predict_url = "/models/#{model_id}/predict"
59
- response = self.class.post(predict_url, headers: @headers, body: { "data": feature_data }.to_json)
60
- if (response.success?)
61
- NexosisApi::PredictResponse.new(model_id, response.parsed_response)
62
- else
63
- raise HttpException.new("There was a problem predicting from your model: #{response.code}.",
64
- "Could not start predict for #{model_id}",
65
- response)
66
- end
67
- end
68
-
69
- # Remove an existing model
70
- #
71
- # @param model_id [String] the unique id of the model to remove.
72
- def remove_model(model_id)
73
- raise ArgumentError, 'Deleting a model requires that model_id be specified and it is currently empty.' if model_id.empty?
74
- delete_url = "/models/#{model_id}"
75
- response = self.class.delete(delete_url, @options)
76
- unless (response.success?)
77
- raise HttpException.new("There was a problem deleting your model: #{response.code}.",
78
- "Could not delete #{model_id}",
79
- response)
80
- end
81
- end
82
-
83
- # Deletes multiple models based on the provided filter criteria.
84
- # @param datasource_name [String] remove all models created by this datasource
85
- # @param begin_date [DateTime] remove all models created after this date/time - inclusive. May be a ISO 8601 compliant string.
86
- # @param end_date [DateTime] remove all models created before this date/time - inclusive. May be a ISO 8601 compliant string.
87
- # @note - Use with great care. This permanently removes trained models.
88
- # All parameters are indepdently optional, but one must be sent.
89
- def remove_models(datasource_name = nil, begin_date = nil, end_date = nil)
90
- params_unset = datasource_name.nil?
91
- params_unset &= begin_date.nil?
92
- params_unset &= end_date.nil?
93
- raise ArgumentError, 'Must set one of the method parameters.' if params_unset
94
- delete_url = '/models'
95
- query = {}
96
- query.store('dataSourceName', datasource_name) unless datasource_name.nil?
97
- query.store('createdAfterDate', begin_date) unless begin_date.nil?
98
- query.store('createdBeforeDate', end_date) unless end_date.nil?
99
- response = self.class.delete(delete_url, headers: @headers, query: query)
100
- unless (response.success?)
101
- raise HttpException.new("There was a problem deleting your models: #{response.code}.",
102
- 'Could not delete models',
103
- response)
104
- end
105
- end
106
- end
107
- end
108
- end
1
+ module NexosisApi
2
+ class Client
3
+ # class to operate on model endpoint in Nexosis API
4
+ # @since 1.3.0
5
+ module Models
6
+ # List all models created in your company, optionally filtered by query parameters
7
+ #
8
+ # @param datasource_name [String] optionally limit to those
9
+ # models created for this data source name.
10
+ # @param query_options [Hash] limit by dates: begin_date and/or end_date
11
+ # @note - query options dates can either be ISO 8601 compliant strings or Date objects.
12
+ # @return [NexosisApi::PagedArray of NexosisApi::ModelSummary] - all models available within the query parameters
13
+ # @raise [NexosisApi::HttpException]
14
+ def list_models(datasource_name = nil, page = 0, page_size = 50, query_options = {})
15
+ model_url = '/models'
16
+ query = {
17
+ page: page,
18
+ pageSize: page_size
19
+ }
20
+ unless query_options.empty?
21
+ query.store('createdBeforeDate', query_options['end_date']) unless query_options['end_date'].nil?
22
+ query.store('createdAfterDate', query_options['begin_date']) unless query_options['begin_date'].nil?
23
+ end
24
+ query.store('dataSourceName', datasource_name) unless datasource_name.nil?
25
+ response = self.class.get(model_url, headers: @headers, query: query)
26
+ raise HttpException.new("There was a problem listing models: #{response.code}.",
27
+ "listing models with data source name #{datasource_name}",
28
+ response) unless response.success?
29
+ NexosisApi::PagedArray.new(response.parsed_response,
30
+ response.parsed_response['items']
31
+ .map { |item| NexosisApi::ModelSummary.new(item) })
32
+ end
33
+
34
+ # Get the details of the particular model requested by id
35
+ #
36
+ # @param model_id [String] The unique identifier for the model returned by a create-model session
37
+ # @return [NexosisApi::ModelSummary]
38
+ # @raise [NexosisApi::HttpException]
39
+ # @raise [ArgumentError]
40
+ def get_model(model_id)
41
+ raise ArgumentError, 'Retrieving a model requires that model_id be specified and it is currently null.' if model_id.nil?
42
+ model_url = "/models/#{model_id}"
43
+ response = self.class.get(model_url, @options)
44
+ if (response.success?)
45
+ NexosisApi::ModelSummary.new(response.parsed_response)
46
+ else
47
+ raise HttpException.new("There was a problem getting your model: #{response.code}.", "Could not get model #{model_id}", response)
48
+ end
49
+ end
50
+
51
+ # Run a feature set through the model to get predictions
52
+ #
53
+ # @param model_id [String] unique identifier of model to use
54
+ # @param feature_data [Array of Hash] feature columns with values to predict from
55
+ # @param extra_parameters [Hash] name value pairs which should be included in the extraParameters property of the json body of the request.
56
+ # @return [NexosisApi::PredictResponse]
57
+ # @raise [NexosisApi::HttpException]
58
+ # @raise [ArgumentError]
59
+ # @note The feature data shape should match that of the dataset used to create the model.
60
+ # Any missing features in this request will reduce the quality of the predictions.
61
+ # @note For a classification model you may include the extra parameter 'includeClassScores' to
62
+ # get scores back for each class, not just the chosen class.
63
+ def predict(model_id, feature_data, extra_parameters = {})
64
+ raise ArgumentError, 'Running predictions requires that model_id be specified and it is currently empty.' if model_id.empty?
65
+ raise ArgumentError, 'Running predictions requires that feature_data be specified and it is currently empty.' if feature_data.empty?
66
+ predict_url = "/models/#{model_id}/predict"
67
+ feature_data = [feature_data] unless feature_data.kind_of?(Array)
68
+ response = self.class.post(predict_url, headers: @headers, body: { 'data': feature_data, 'extraParameters': extra_parameters }.to_json)
69
+ if (response.success?)
70
+ NexosisApi::PredictResponse.new(model_id, response.parsed_response)
71
+ else
72
+ raise HttpException.new("There was a problem predicting from your model: #{response.code}.",
73
+ "Could not start predict for #{model_id}",
74
+ response)
75
+ end
76
+ end
77
+
78
+ # Remove an existing model
79
+ #
80
+ # @param model_id [String] the unique id of the model to remove.
81
+ # @raise [NexosisApi::HttpException]
82
+ # @raise [ArgumentError]
83
+ def remove_model(model_id)
84
+ raise ArgumentError, 'Deleting a model requires that model_id be specified and it is currently empty.' if model_id.empty?
85
+ delete_url = "/models/#{model_id}"
86
+ response = self.class.delete(delete_url, @options)
87
+ unless (response.success?)
88
+ raise HttpException.new("There was a problem deleting your model: #{response.code}.",
89
+ "Could not delete #{model_id}",
90
+ response)
91
+ end
92
+ end
93
+
94
+ # Deletes multiple models based on the provided filter criteria.
95
+ # @param datasource_name [String] remove all models created by this datasource
96
+ # @param begin_date [DateTime] remove all models created after this date/time - inclusive. May be a ISO 8601 compliant string.
97
+ # @param end_date [DateTime] remove all models created before this date/time - inclusive. May be a ISO 8601 compliant string.
98
+ # @raise [NexosisApi::HttpException]
99
+ # @raise [ArgumentError]
100
+ # @note - Use with great care. This permanently removes trained models.
101
+ # All parameters are indepdently optional, but one must be sent.
102
+ def remove_models(datasource_name = nil, begin_date = nil, end_date = nil)
103
+ params_unset = datasource_name.nil?
104
+ params_unset &= begin_date.nil?
105
+ params_unset &= end_date.nil?
106
+ raise ArgumentError, 'Must set one of the method parameters.' if params_unset
107
+ delete_url = '/models'
108
+ query = {}
109
+ query.store('dataSourceName', datasource_name) unless datasource_name.nil?
110
+ query.store('createdAfterDate', begin_date) unless begin_date.nil?
111
+ query.store('createdBeforeDate', end_date) unless end_date.nil?
112
+ response = self.class.delete(delete_url, headers: @headers, query: query)
113
+ unless (response.success?)
114
+ raise HttpException.new("There was a problem deleting your models: #{response.code}.",
115
+ 'Could not delete models',
116
+ response)
117
+ end
118
+ end
119
+ end
120
+ end
121
+ end
@@ -1,213 +1,308 @@
1
- require 'csv'
2
- require 'json'
3
-
4
- module NexosisApi
5
- class Client
6
- # Session-based API operations
7
- #
8
- # @see http://docs.nexosis.com/
9
- module Sessions
10
-
11
- # List sessions previously submitted
12
- #
13
- # @param query_options [Hash] optionally provide query parameters to limit the search of sessions.
14
- # @param page [Integer] optionally provide a page number for paging. Defaults to 0 (first page).
15
- # @param pageSize [Integer] optionally provide a page size to limit the total number of results. Defaults to 50, max 1000
16
- # @return [NexosisApi::PagedArray of NexosisApi::SessionResponse] with all sessions matching the query or all if no query
17
- # @note query parameters hash members are dataset_name, event_name, requested_before_date, and requested_after_date.
18
- # After and before dates refer to the session requested date.
19
- # @example query for just one dataset
20
- # sessions = NexosisApi.client.list_sessions :dataset_name => 'MyDataset'
21
- def list_sessions(query_options = {}, page = 0, pageSize = 50)
22
- sessions_url = '/sessions'
23
- query = {
24
- 'dataSetName' => query_options[:dataset_name],
25
- 'eventName' => query_options[:event_name],
26
- 'requestedAfterDate' => query_options[:requested_after_date],
27
- 'requestedBeforeDate' => query_options[:requested_before_date],
28
- 'type' => query_options[:type],
29
- 'page' => page,
30
- 'pageSize' => pageSize
31
- }
32
- response = self.class.get(sessions_url, headers: @headers, query: query)
33
- raise HttpException.new('Could not retrieve sessions',
34
- "Get all sessions with query #{query_options}",
35
- response) unless response.success?
36
- NexosisApi::PagedArray.new(response.parsed_response, response.parsed_response['items'].map do |session_hash|
37
- response_hash = { 'session' => session_hash }.merge(response.headers)
38
- NexosisApi::SessionResponse.new(response_hash)
39
- end)
40
- end
41
-
42
- # Remove a session
43
- # @param session_id [String] required session identifier
44
- def remove_session(session_id)
45
- if (session_id.to_s.empty?)
46
- raise ArgumentError 'session_id cannot be empty or nil'
47
- end
48
- session_url = "/sessions/#{session_id}"
49
- response = self.class.delete(session_url, headers: @headers)
50
- return if response.success?
51
- raise HttpException.new('Could not delete session with given id', "remove session with id #{session_id}", response)
52
- end
53
-
54
- # Remove sessions that have been run. All query options are optional and will be used to limit the sessions removed.
55
- # @param query_options [Hash] optionally provide query parametes to limit the set of sessions removed.
56
- # @note query parameters hash members are type, dataset_name, event_name, start_date, and end_date.
57
- # Start and end dates refer to the session requested date.
58
- # Results are not removed but then can only be accessed by dataset name
59
- # @example Remove all sessions based on a dataset by name
60
- # NexosisApi.client.remove_sessions :dataset_name => 'existing_dataset'
61
- def remove_sessions(query_options = {})
62
- sessions_url = '/sessions'
63
- response = self.class.delete(sessions_url, :headers => @headers, :query => get_query_from_options(query_options))
64
- return if response.success?
65
- raise HttpException.new('Could not remove sessions', "Remove sessions with query #{query_options.to_s}",response)
66
- end
67
-
68
- # Initiate a new forecast session based on a named dataset.
69
- #
70
- # @param dataset_name [String] The name of the saved data set that has the data to forecast on.
71
- # @param start_date [DateTime] The starting date of the forecast period. Can be ISO 8601 string.
72
- # @param end_date [DateTime] The ending date of the forecast period. Can be ISO 8601 string.
73
- # @param target_column [String] The name of the column for which you want predictions. Nil if defined in dataset.
74
- # @param result_interval [NexosisApi::TimeInterval] (optional) - The date/time interval (e.g. Day, Hour) at which predictions should be generated. So, if Hour is specified for this parameter you will get a Result record for each hour between startDate and endDate. If unspecified, we’ll generate predictions at a Day interval.
75
- # @param column_metadata [Array of NexosisApi::Column] (optional) - specification for how to handle columns if different from existing metadata on dataset
76
- # @return [NexosisApi::SessionResponse] providing information about the sesssion
77
- # @note The time interval selected must be greater than or equal to the finest granularity of the data provided.
78
- # For instance if your data includes many recoreds per hour, then you could request hour, day, or any other result interval.
79
- # However, if your data includes only a few records per day or fewer, then a request for an hourly result interval will produce poor results.
80
- def create_forecast_session(dataset_name, start_date, end_date, target_column = nil, result_interval = NexosisApi::TimeInterval::DAY, column_metadata = nil)
81
- create_session(dataset_name, start_date, end_date, target_column, nil, 'forecast', result_interval, column_metadata)
82
- end
83
-
84
- # Analyze impact for an event with data already saved to the API.
85
- #
86
- # @param dataset_name [String] The name of the saved data set that has the data to forecast on.
87
- # @param start_date [DateTime] The starting date of the impactful event. Can be ISO 8601 string.
88
- # @param end_date [DateTime] The ending date of the impactful event. Can be ISO 8601 string.
89
- # @param event_name [String] The name of the event.
90
- # @param target_column [String] The name of the column for which you want predictions. Nil if defined in datatset.
91
- # @param result_interval [NexosisApi::TimeInterval] (optional) - The date/time interval (e.g. Day, Hour) at which predictions should be generated. So, if Hour is specified for this parameter you will get a Result record for each hour between startDate and endDate. If unspecified, we’ll generate predictions at a Day interval.
92
- # @param column_metadata [Array of NexosisApi::Column] (optional) - specification for how to handle columns if different from existing metadata on dataset
93
- # @return [NexosisApi::SessionResponse] providing information about the sesssion
94
- def create_impact_session(dataset_name, start_date, end_date, event_name, target_column = nil, result_interval = NexosisApi::TimeInterval::DAY, column_metadata = nil)
95
- create_session(dataset_name, start_date, end_date, target_column, event_name, 'impact', result_interval, column_metadata)
96
- end
97
-
98
- # Get the results of the session.
99
- #
100
- # @param session_id [String] the Guid string returned in a previous session request
101
- # @param as_csv [Boolean] indicate whether results should be returned in csv format
102
- # @param prediction_interval [Float] one of the available prediction intervals for the session.
103
- # @return [NexosisApi::SessionResult] SessionResult if parsed, String of csv data otherwise
104
- def get_session_results(session_id, as_csv = false, prediction_interval = nil)
105
- session_result_url = "/sessions/#{session_id}/results"
106
- @headers['Accept'] = 'text/csv' if as_csv
107
- query = { predictionInterval: prediction_interval } unless prediction_interval.nil?
108
- response = self.class.get(session_result_url, headers: @headers, query: query)
109
- @headers.delete('Accept')
110
-
111
- if (response.success?)
112
- return response.body if as_csv
113
- NexosisApi::SessionResult.new(response.parsed_response)
114
- else
115
- raise HttpException.new("There was a problem getting the session: #{response.code}.", "get results for session #{session_id}" ,response)
116
- end
117
- end
118
-
119
- # Get a specific session by id.
120
- #
121
- # @param session_id [String] the Guid string returned in a previous session request
122
- # @return [NexosisApi::Session] a Session object populated with the session's data
123
- def get_session(session_id)
124
- session_url = "/sessions/#{session_id}"
125
- response = self.class.get(session_url, @options)
126
- return NexosisApi::Session.new(response.parsed_response) if response.success?
127
- raise HttpException.new("There was a problem getting the session: #{response.code}.", "getting session #{session_id}" ,response)
128
- end
129
-
130
- # Create a new model based on a data source
131
- #
132
- # @param datasource_name [String] The datasource from which to build the model
133
- # @param target_column [String] The column which will be predicted when using the model
134
- # @param columns [Hash] column metadata to modify roles, imputation, or target.
135
- # @param options [Hash] prediction_domain and or balance (true or false) indicator for classification
136
- # @note - classifcation assumes balanced classes. The use of a 'balanced=false' option
137
- # indicates that no attempt should be made to sample the classes in balanced fashion.
138
- # @since 1.3.0
139
- def create_model(datasource_name, target_column, columns = {}, options = { prediction_domain: 'regression' })
140
- model_url = '/sessions/model'
141
- body = {
142
- dataSourceName: datasource_name,
143
- targetColumn: target_column,
144
- predictionDomain: options[:prediction_domain].downcase
145
- }
146
- body.store(:extraParameters, { balance: options[:balance] }) if options.include?(:balance) && body[:predictionDomain] == 'classification'
147
- body.store(columns: columns) unless columns.empty?
148
- response = self.class.post(model_url, headers: @headers, body: body.to_json)
149
- if response.success?
150
- session_hash = { 'session' => response.parsed_response }.merge(response.headers)
151
- NexosisApi::SessionResponse.new(session_hash)
152
- else
153
- raise HttpException.new("There was a problem creating the model session: #{response.code}.", 'creating model session' ,response)
154
- end
155
- end
156
-
157
- # Get the confusion matrix for a completed classification session
158
- # @param session_id [String] The unique id of the completed classification session
159
- # @return [NexosisApi::ClassifierResult] a confusion matrix along with class labels and other session information.
160
- # @since 1.4.1
161
- # @note - This endpoint returns a 404 for requests of non-classification sessions
162
- def get_confusion_matrix(session_id)
163
- result_url = "/sessions/#{session_id}/results/confusionmatrix"
164
- response = self.class.get(result_url, headers: @headers)
165
- raise HttpException.new("There was a problem getting a confusion matrix for session #{session_id}", 'getting confusion matrix', response) unless response.success?
166
- NexosisApi::ClassifierResult.new(response.parsed_response)
167
- end
168
-
169
- private
170
-
171
- # @private
172
- def create_session(dataset_name, start_date, end_date, target_column = nil, event_name = nil, type = 'forecast', result_interval = NexosisApi::TimeInterval::DAY, column_metadata = nil)
173
- session_url = "/sessions/#{type}"
174
- query = {
175
- 'targetColumn' => target_column.to_s,
176
- 'startDate' => start_date.to_s,
177
- 'endDate' => end_date.to_s,
178
- 'resultInterval' => result_interval.to_s
179
- }
180
- query['dataSetName'] = dataset_name.to_s unless dataset_name.to_s.empty?
181
- if (event_name.nil? == false)
182
- query['eventName'] = event_name
183
- end
184
- body = ''
185
- if (column_metadata.nil? == false)
186
- column_json = Column.to_json(column_metadata)
187
- body = {
188
- 'dataSetName' => dataset_name,
189
- 'columns' => column_json
190
- }
191
- end
192
- response = self.class.post(session_url, headers: @headers, query: query, body: body.to_json)
193
- if (response.success?)
194
- session_hash = { 'session' => response.parsed_response }.merge(response.headers)
195
- NexosisApi::SessionResponse.new(session_hash)
196
- else
197
- raise HttpException.new("Unable to create new #{type} session", "Create session for dataset #{dataset_name}", response)
198
- end
199
- end
200
-
201
- def get_query_from_options(options)
202
- query = {
203
- 'dataSetName' => options[:dataset_name],
204
- 'eventName' => options[:event_name],
205
- 'startDate' => options[:start_date],
206
- 'endDate' => options[:end_date],
207
- 'type' => options[:type]
208
- }
209
- query
210
- end
211
- end
212
- end
213
- end
1
+ require 'csv'
2
+ require 'json'
3
+
4
+ module NexosisApi
5
+ class Client
6
+ # Session-based API operations
7
+ #
8
+ # @see http://docs.nexosis.com/
9
+ module Sessions
10
+
11
+ # List sessions previously submitted
12
+ #
13
+ # @param query_options [Hash] optionally provide query parameters to limit the search of sessions.
14
+ # @param page [Integer] optionally provide a page number for paging. Defaults to 0 (first page).
15
+ # @param pageSize [Integer] optionally provide a page size to limit the total number of results. Defaults to 50, max 1000
16
+ # @return [NexosisApi::PagedArray of NexosisApi::SessionResponse] with all sessions matching the query or all if no query
17
+ # @raise [NexosisApi::HttpException]
18
+ # @note query parameters hash members are dataset_name, event_name, requested_before_date, and requested_after_date.
19
+ # After and before dates refer to the session requested date.
20
+ # @example query for just one dataset
21
+ # sessions = NexosisApi.client.list_sessions :dataset_name => 'MyDataset'
22
+ def list_sessions(query_options = {}, page = 0, pageSize = 50)
23
+ sessions_url = '/sessions'
24
+ query = {
25
+ 'dataSetName' => query_options[:dataset_name],
26
+ 'eventName' => query_options[:event_name],
27
+ 'requestedAfterDate' => query_options[:requested_after_date],
28
+ 'requestedBeforeDate' => query_options[:requested_before_date],
29
+ 'type' => query_options[:type],
30
+ 'page' => page,
31
+ 'pageSize' => pageSize
32
+ }
33
+ response = self.class.get(sessions_url, headers: @headers, query: query)
34
+ raise HttpException.new('Could not retrieve sessions',
35
+ "Get all sessions with query #{query_options}",
36
+ response) unless response.success?
37
+ NexosisApi::PagedArray.new(response.parsed_response, response.parsed_response['items'].map do |session_hash|
38
+ response_hash = { 'session' => session_hash }.merge(response.headers)
39
+ NexosisApi::SessionResponse.new(response_hash)
40
+ end)
41
+ end
42
+
43
+ # Remove a session
44
+ # @param session_id [String] required session identifier
45
+ # @raise [NexosisApi::HttpException]
46
+ # @raise [ArgumentError]
47
+ def remove_session(session_id)
48
+ if (session_id.to_s.empty?)
49
+ raise ArgumentError 'session_id cannot be empty or nil'
50
+ end
51
+ session_url = "/sessions/#{session_id}"
52
+ response = self.class.delete(session_url, headers: @headers)
53
+ return if response.success?
54
+ raise HttpException.new('Could not delete session with given id', "remove session with id #{session_id}", response)
55
+ end
56
+
57
+ # Remove sessions that have been run. All query options are optional and will be used to limit the sessions removed.
58
+ # @param query_options [Hash] optionally provide query parametes to limit the set of sessions removed.
59
+ # @raise [NexosisApi::HttpException]
60
+ # @note query parameters hash members are type, dataset_name, event_name, start_date, and end_date.
61
+ # Start and end dates refer to the session requested date.
62
+ # Results are not removed but then can only be accessed by dataset name
63
+ # @example Remove all sessions based on a dataset by name
64
+ # NexosisApi.client.remove_sessions :dataset_name => 'existing_dataset'
65
+ def remove_sessions(query_options = {})
66
+ sessions_url = '/sessions'
67
+ response = self.class.delete(sessions_url, :headers => @headers, :query => get_query_from_options(query_options))
68
+ return if response.success?
69
+ raise HttpException.new('Could not remove sessions', "Remove sessions with query #{query_options.to_s}",response)
70
+ end
71
+
72
+ # Initiate a new forecast session based on a named dataset.
73
+ #
74
+ # @param dataset_name [String] The name of the saved data set that has the data to forecast on.
75
+ # @param start_date [DateTime] The starting date of the forecast period. Can be ISO 8601 string.
76
+ # @param end_date [DateTime] The ending date of the forecast period. Can be ISO 8601 string.
77
+ # @param target_column [String] The name of the column for which you want predictions. Nil if defined in dataset.
78
+ # @param result_interval [NexosisApi::TimeInterval] (optional) - The date/time interval (e.g. Day, Hour) at which predictions should be generated. So, if Hour is specified for this parameter you will get a Result record for each hour between startDate and endDate. If unspecified, we’ll generate predictions at a Day interval.
79
+ # @param column_metadata [Array of NexosisApi::Column] (optional) - specification for how to handle columns if different from existing metadata on dataset
80
+ # @return [NexosisApi::SessionResponse] providing information about the sesssion
81
+ # @note The time interval selected must be greater than or equal to the finest granularity of the data provided.
82
+ # For instance if your data includes many recoreds per hour, then you could request hour, day, or any other result interval.
83
+ # However, if your data includes only a few records per day or fewer, then a request for an hourly result interval will produce poor results.
84
+ def create_forecast_session(dataset_name, start_date, end_date, target_column = nil, result_interval = NexosisApi::TimeInterval::DAY, column_metadata = nil)
85
+ create_session(dataset_name, start_date, end_date, target_column, nil, 'forecast', result_interval, column_metadata)
86
+ end
87
+
88
+ # Analyze impact for an event with data already saved to the API.
89
+ #
90
+ # @param dataset_name [String] The name of the saved data set that has the data to forecast on.
91
+ # @param start_date [DateTime] The starting date of the impactful event. Can be ISO 8601 string.
92
+ # @param end_date [DateTime] The ending date of the impactful event. Can be ISO 8601 string.
93
+ # @param event_name [String] The name of the event.
94
+ # @param target_column [String] The name of the column for which you want predictions. Nil if defined in datatset.
95
+ # @param result_interval [NexosisApi::TimeInterval] (optional) - The date/time interval (e.g. Day, Hour) at which predictions should be generated. So, if Hour is specified for this parameter you will get a Result record for each hour between startDate and endDate. If unspecified, we’ll generate predictions at a Day interval.
96
+ # @param column_metadata [Array of NexosisApi::Column] (optional) - specification for how to handle columns if different from existing metadata on dataset
97
+ # @return [NexosisApi::SessionResponse] providing information about the sesssion
98
+ def create_impact_session(dataset_name, start_date, end_date, event_name, target_column = nil, result_interval = NexosisApi::TimeInterval::DAY, column_metadata = nil)
99
+ create_session(dataset_name, start_date, end_date, target_column, event_name, 'impact', result_interval, column_metadata)
100
+ end
101
+
102
+ # Get the results of the session.
103
+ #
104
+ # @param session_id [String] the Guid string returned in a previous session request
105
+ # @param as_csv [Boolean] indicate whether results should be returned in csv format
106
+ # @param prediction_interval [Float] one of the available prediction intervals for the session.
107
+ # @return [NexosisApi::SessionResult] SessionResult if parsed, String of csv data otherwise
108
+ # @raise [NexosisApi::HttpException]
109
+ # @deprecated
110
+ def get_session_results(session_id, as_csv = false, prediction_interval = nil)
111
+ get_session_result_data(session_id, 0, 50, {as_csv: as_csv, prediction_interval: prediction_interval})
112
+ end
113
+
114
+ # Get the results of the session.
115
+ #
116
+ # @param session_id [String] the Guid string returned in a previous session request
117
+ # @param page [Integer] optionally provide a page number for paging. Defaults to 0 (first page).
118
+ # @param pageSize [Integer] optionally provide a page size to limit the total number of results. Defaults to 50, max 1000
119
+ # @param options [Hash] as_csv [Boolean] to indicate whether results should be returned in csv format; prediction_interval [Float] one of the available prediction intervals for the session.
120
+ # @return [NexosisApi::SessionResult] SessionResult if parsed, String of csv data otherwise
121
+ # @raise [NexosisApi::HttpException]
122
+ # @since 2.1.0
123
+ def get_session_result_data(session_id, page = 0, page_size = 50, options = {})
124
+ session_result_url = "/sessions/#{session_id}/results"
125
+ @headers['Accept'] = 'text/csv' if options[:as_csv]
126
+ query = { 'page' => page, 'pageSize' => page_size }
127
+ query.store('predictionInterval', options[:prediction_interval]) unless options[:prediction_interval].nil?
128
+ response = self.class.get(session_result_url, headers: @headers, query: query)
129
+ @headers.delete('Accept')
130
+ if (response.success?)
131
+ return response.body if options[:as_csv]
132
+ NexosisApi::SessionResult.new(response.parsed_response)
133
+ else
134
+ raise HttpException.new("There was a problem getting the session: #{response.code}.", "get results for session #{session_id}" ,response)
135
+ end
136
+ end
137
+
138
+ # Get a specific session by id.
139
+ #
140
+ # @param session_id [String] the Guid string returned in a previous session request
141
+ # @return [NexosisApi::Session] a Session object populated with the session's data
142
+ # @raise [NexosisApi::HttpException]
143
+ def get_session(session_id)
144
+ session_url = "/sessions/#{session_id}"
145
+ response = self.class.get(session_url, @options)
146
+ return NexosisApi::Session.new(response.parsed_response) if response.success?
147
+ raise HttpException.new("There was a problem getting the session: #{response.code}.", "getting session #{session_id}" ,response)
148
+ end
149
+
150
+ # Create a new model based on a data source
151
+ #
152
+ # @param datasource_name [String] The datasource from which to build the model
153
+ # @param target_column [String] The column which will be predicted when using the model
154
+ # @param columns [Hash] column metadata to modify roles, imputation, or target.
155
+ # @param options [Hash] prediction_domain and or balance (true or false) indicator for classification
156
+ # @return [NexosisApi::SessionResponse]
157
+ # @raise [NexosisApi::HttpException]
158
+ # @note - classifcation assumes balanced classes. The use of a 'balance=false' option
159
+ # indicates that no attempt should be made to sample the classes in balanced fashion.
160
+ # @since 1.3.0
161
+ def create_model(datasource_name, target_column, columns = {}, options = { prediction_domain: 'regression' })
162
+ model_url = '/sessions/model'
163
+ body = {
164
+ dataSourceName: datasource_name,
165
+ targetColumn: target_column,
166
+ predictionDomain: options[:prediction_domain].downcase
167
+ }
168
+ body.store(:extraParameters, { balance: options[:balance] }) if options.include?(:balance) && body[:predictionDomain] == 'classification'
169
+ body.store(columns: columns) unless columns.empty?
170
+ response = self.class.post(model_url, headers: @headers, body: body.to_json)
171
+ if response.success?
172
+ session_hash = { 'session' => response.parsed_response }.merge(response.headers)
173
+ NexosisApi::SessionResponse.new(session_hash)
174
+ else
175
+ raise HttpException.new("There was a problem creating the model session: #{response.code}.", 'creating model session' ,response)
176
+ end
177
+ end
178
+
179
+ # Create a new model based on a data source
180
+ #
181
+ # @param datasource_name [String] The datasource from which to build the model
182
+ # @param columns [Hash] column metadata to modify roles, imputation, or target.
183
+ # @param data_contains_anomalies [Boolean] Whether or not the source dataset contains anomalies (default is true)
184
+ # @return [NexosisApi::SessionResponse]
185
+ # @raise [NexosisApi::HttpException]
186
+ # @since 2.1.0
187
+ # @note The anomalies model session results will contain the anomalous observations when the session is complete.
188
+ def create_anomalies_model(datasource_name, columns = {}, data_contains_anomalies = true)
189
+ model_url = '/sessions/model'
190
+ body = {
191
+ dataSourceName: datasource_name,
192
+ predictionDomain: 'anomalies',
193
+ extraParameters: {
194
+ 'containsAnomalies': data_contains_anomalies
195
+ },
196
+ columns: columns
197
+ }
198
+ response = self.class.post(model_url, headers: @headers, body: body.to_json)
199
+ raise HttpException.new("There was a problem creating the model session: #{response.code}.", 'creating anomaly model session' ,response) unless response.success?
200
+ NexosisApi::SessionResponse.new(response.parsed_response.merge(response.headers))
201
+ end
202
+
203
+ # Create a new model based on a data source
204
+ #
205
+ # @param datasource_name [String] The datasource from which to build the model
206
+ # @param target_column [String] The column which will be predicted when using the model
207
+ # @param columns [Hash] column metadata to modify roles, imputation, or target.
208
+ # @param balance [Boolean] Whether or not to balance classes during model building (default is true)
209
+ # @return [NexosisApi::SessionResponse]
210
+ # @raise [NexosisApi::HttpException]
211
+ # @since 2.1.0
212
+ # @note The anomalies model session results will contain the anomalous observations when the session is complete.
213
+ def create_classification_model(datasource_name, target_column, columns = {}, balance = true)
214
+ return create_model(datasource_name, target_column, columns, prediction_domain: 'classification', balance: balance)
215
+ end
216
+
217
+ # Get the confusion matrix for a completed classification session
218
+ # @param session_id [String] The unique id of the completed classification session
219
+ # @return [NexosisApi::ClassifierResult] a confusion matrix along with class labels and other session information.
220
+ # @raise [NexosisApi::HttpException]
221
+ # @since 1.4.1
222
+ # @note - This endpoint returns a 404 for requests of non-classification sessions
223
+ def get_confusion_matrix(session_id)
224
+ result_url = "/sessions/#{session_id}/results/confusionmatrix"
225
+ response = self.class.get(result_url, headers: @headers)
226
+ raise HttpException.new("There was a problem getting a confusion matrix for session #{session_id}", 'getting confusion matrix', response) unless response.success?
227
+ NexosisApi::ClassifierResult.new(response.parsed_response.merge(response.headers))
228
+ end
229
+
230
+ # Get the observation anomaly score for a completed anomalies session
231
+ # @param session_id [String] The unique id of the completed anomalies session
232
+ # @return [NexosisApi::ScoreResult] A session result with a list of each observation and score per column.
233
+ # @raise [NexosisApi::HttpException]
234
+ # @since 2.1.0
235
+ # @note - This endpoint returns a 404 for requests of non-anomalies sessions
236
+ def get_anomaly_scores(session_id, page = 0, page_size = 50)
237
+ score_url = "/sessions/#{session_id}/results/anomalyScores"
238
+ query = {
239
+ page: page,
240
+ pageSize: page_size
241
+ }
242
+ response = self.class.get(score_url, headers: @headers, query: query)
243
+ raise HttpException.new("There was a problem getting the anomaly scores for session #{session_id}", 'getting anomaly scores', response) unless response.success?
244
+ NexosisApi::AnomalyScores.new(response.parsed_response.merge(response.headers))
245
+ end
246
+
247
+ # Get the observation class score for a completed classification session
248
+ # @param session_id [String] The unique id of the completed classification session
249
+ # @return [NexosisApi::ScoreResult] A session result with a list of each observation and score per column.
250
+ # @raise [NexosisApi::HttpException]
251
+ # @since 2.1.0
252
+ # @note - This endpoint returns a 404 for requests of non-classification sessions
253
+ def get_class_scores(session_id, page = 0, page_size = 50)
254
+ score_url = "/sessions/#{session_id}/results/classScores"
255
+ query = {
256
+ page: page,
257
+ pageSize: page_size
258
+ }
259
+ response = self.class.get(score_url, headers: @headers, query: query)
260
+ raise HttpException.new("There was a problem getting the class scores for session #{session_id}", 'getting class scores', response) unless response.success?
261
+ NexosisApi::ClassifierScores.new(response.parsed_response.merge(response.headers))
262
+ end
263
+
264
+ private
265
+
266
+ # @private
267
+ def create_session(dataset_name, start_date, end_date, target_column = nil, event_name = nil, type = 'forecast', result_interval = NexosisApi::TimeInterval::DAY, column_metadata = nil)
268
+ session_url = "/sessions/#{type}"
269
+ query = {
270
+ 'targetColumn' => target_column.to_s,
271
+ 'startDate' => start_date.to_s,
272
+ 'endDate' => end_date.to_s,
273
+ 'resultInterval' => result_interval.to_s
274
+ }
275
+ query['dataSetName'] = dataset_name.to_s unless dataset_name.to_s.empty?
276
+ if (event_name.nil? == false)
277
+ query['eventName'] = event_name
278
+ end
279
+ body = ''
280
+ if (column_metadata.nil? == false)
281
+ column_json = Column.to_json(column_metadata)
282
+ body = {
283
+ 'dataSetName' => dataset_name,
284
+ 'columns' => column_json
285
+ }
286
+ end
287
+ response = self.class.post(session_url, headers: @headers, query: query, body: body.to_json)
288
+ if (response.success?)
289
+ session_hash = { 'session' => response.parsed_response }.merge(response.headers)
290
+ NexosisApi::SessionResponse.new(session_hash)
291
+ else
292
+ raise HttpException.new("Unable to create new #{type} session", "Create session for dataset #{dataset_name}", response)
293
+ end
294
+ end
295
+
296
+ def get_query_from_options(options)
297
+ query = {
298
+ 'dataSetName' => options[:dataset_name],
299
+ 'eventName' => options[:event_name],
300
+ 'startDate' => options[:start_date],
301
+ 'endDate' => options[:end_date],
302
+ 'type' => options[:type]
303
+ }
304
+ query
305
+ end
306
+ end
307
+ end
308
+ end