@iblai/iblai-api 4.253.3-ai → 4.254.0-ai
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/index.cjs.js +653 -381
- package/dist/index.cjs.js.map +1 -1
- package/dist/index.esm.js +653 -382
- package/dist/index.esm.js.map +1 -1
- package/dist/index.umd.js +653 -381
- package/dist/index.umd.js.map +1 -1
- package/dist/types/index.d.ts +28 -0
- package/dist/types/models/DataTypeEnum.d.ts +10 -0
- package/dist/types/models/Dataset.d.ts +12 -0
- package/dist/types/models/DatasetCreate.d.ts +8 -0
- package/dist/types/models/DatasetItem.d.ts +20 -0
- package/dist/types/models/DatasetItemBulkCreateResponse.d.ts +5 -0
- package/dist/types/models/DatasetItemCreate.d.ts +10 -0
- package/dist/types/models/DatasetItemInput.d.ts +7 -0
- package/dist/types/models/DatasetItemUpdate.d.ts +10 -0
- package/dist/types/models/DatasetItemUpdateStatusEnum.d.ts +8 -0
- package/dist/types/models/DatasetRunItem.d.ts +16 -0
- package/dist/types/models/ExperimentCreate.d.ts +8 -0
- package/dist/types/models/JudgeRecord.d.ts +18 -0
- package/dist/types/models/LLMJudge.d.ts +10 -0
- package/dist/types/models/PaginatedDatasetItemList.d.ts +7 -0
- package/dist/types/models/PaginatedDatasetList.d.ts +7 -0
- package/dist/types/models/PaginatedJudgeList.d.ts +7 -0
- package/dist/types/models/PaginatedRunList.d.ts +7 -0
- package/dist/types/models/PaginatedScoreConfigList.d.ts +7 -0
- package/dist/types/models/PaginatedScoreList.d.ts +7 -0
- package/dist/types/models/Run.d.ts +19 -0
- package/dist/types/models/RunDetailResponse.d.ts +19 -0
- package/dist/types/models/Score.d.ts +17 -0
- package/dist/types/models/ScoreConfig.d.ts +12 -0
- package/dist/types/models/ScoreConfigCategory.d.ts +7 -0
- package/dist/types/models/ScoreConfigCreate.d.ts +13 -0
- package/dist/types/models/ScoreCreate.d.ts +14 -0
- package/dist/types/models/ScoreCreateResponse.d.ts +7 -0
- package/dist/types/services/AiMentorService.d.ts +0 -171
- package/dist/types/services/EvaluationsService.d.ts +353 -0
- package/package.json +1 -1
- package/sdk_schema.yml +1512 -299
- package/src/core/OpenAPI.ts +1 -1
- package/src/index.ts +28 -0
- package/src/models/DataTypeEnum.ts +14 -0
- package/src/models/Dataset.ts +17 -0
- package/src/models/DatasetCreate.ts +13 -0
- package/src/models/DatasetItem.ts +25 -0
- package/src/models/DatasetItemBulkCreateResponse.ts +10 -0
- package/src/models/DatasetItemCreate.ts +15 -0
- package/src/models/DatasetItemInput.ts +12 -0
- package/src/models/DatasetItemUpdate.ts +15 -0
- package/src/models/DatasetItemUpdateStatusEnum.ts +12 -0
- package/src/models/DatasetRunItem.ts +21 -0
- package/src/models/ExperimentCreate.ts +13 -0
- package/src/models/JudgeRecord.ts +23 -0
- package/src/models/LLMJudge.ts +15 -0
- package/src/models/PaginatedDatasetItemList.ts +12 -0
- package/src/models/PaginatedDatasetList.ts +12 -0
- package/src/models/PaginatedJudgeList.ts +12 -0
- package/src/models/PaginatedRunList.ts +12 -0
- package/src/models/PaginatedScoreConfigList.ts +12 -0
- package/src/models/PaginatedScoreList.ts +12 -0
- package/src/models/Run.ts +24 -0
- package/src/models/RunDetailResponse.ts +24 -0
- package/src/models/Score.ts +22 -0
- package/src/models/ScoreConfig.ts +17 -0
- package/src/models/ScoreConfigCategory.ts +12 -0
- package/src/models/ScoreConfigCreate.ts +18 -0
- package/src/models/ScoreCreate.ts +19 -0
- package/src/models/ScoreCreateResponse.ts +12 -0
- package/src/services/AiMentorService.ts +0 -456
- package/src/services/EvaluationsService.ts +851 -0
package/dist/index.cjs.js
CHANGED
|
@@ -110,7 +110,7 @@ class CancelablePromise {
|
|
|
110
110
|
|
|
111
111
|
const OpenAPI = {
|
|
112
112
|
BASE: 'https://base.manager.iblai.app',
|
|
113
|
-
VERSION: '4.253.3-ai-plus',
|
|
113
|
+
VERSION: '4.254.0-ai-plus',
|
|
114
114
|
WITH_CREDENTIALS: false,
|
|
115
115
|
CREDENTIALS: 'include',
|
|
116
116
|
TOKEN: undefined,
|
|
@@ -405,6 +405,36 @@ exports.CreditTransactionHistoryStatusEnum = void 0;
|
|
|
405
405
|
CreditTransactionHistoryStatusEnum["CANCELLED"] = "cancelled";
|
|
406
406
|
})(exports.CreditTransactionHistoryStatusEnum || (exports.CreditTransactionHistoryStatusEnum = {}));
|
|
407
407
|
|
|
408
|
+
/* generated using openapi-typescript-codegen -- do not edit */
|
|
409
|
+
/* istanbul ignore file */
|
|
410
|
+
/* tslint:disable */
|
|
411
|
+
/* eslint-disable */
|
|
412
|
+
/**
|
|
413
|
+
* * `ACTIVE` - ACTIVE
|
|
414
|
+
* * `ARCHIVED` - ARCHIVED
|
|
415
|
+
*/
|
|
416
|
+
exports.DatasetItemUpdateStatusEnum = void 0;
|
|
417
|
+
(function (DatasetItemUpdateStatusEnum) {
|
|
418
|
+
DatasetItemUpdateStatusEnum["ACTIVE"] = "ACTIVE";
|
|
419
|
+
DatasetItemUpdateStatusEnum["ARCHIVED"] = "ARCHIVED";
|
|
420
|
+
})(exports.DatasetItemUpdateStatusEnum || (exports.DatasetItemUpdateStatusEnum = {}));
|
|
421
|
+
|
|
422
|
+
/* generated using openapi-typescript-codegen -- do not edit */
|
|
423
|
+
/* istanbul ignore file */
|
|
424
|
+
/* tslint:disable */
|
|
425
|
+
/* eslint-disable */
|
|
426
|
+
/**
|
|
427
|
+
* * `NUMERIC` - NUMERIC
|
|
428
|
+
* * `BOOLEAN` - BOOLEAN
|
|
429
|
+
* * `CATEGORICAL` - CATEGORICAL
|
|
430
|
+
*/
|
|
431
|
+
exports.DataTypeEnum = void 0;
|
|
432
|
+
(function (DataTypeEnum) {
|
|
433
|
+
DataTypeEnum["NUMERIC"] = "NUMERIC";
|
|
434
|
+
DataTypeEnum["BOOLEAN"] = "BOOLEAN";
|
|
435
|
+
DataTypeEnum["CATEGORICAL"] = "CATEGORICAL";
|
|
436
|
+
})(exports.DataTypeEnum || (exports.DataTypeEnum = {}));
|
|
437
|
+
|
|
408
438
|
/* generated using openapi-typescript-codegen -- do not edit */
|
|
409
439
|
/* istanbul ignore file */
|
|
410
440
|
/* tslint:disable */
|
|
@@ -19899,386 +19929,6 @@ class AiMentorService {
|
|
|
19899
19929
|
}
|
|
19900
19930
|
});
|
|
19901
19931
|
}
|
|
19902
|
-
/**
|
|
19903
|
-
* List datasets belonging to the tenant.
|
|
19904
|
-
* @returns any No response body
|
|
19905
|
-
* @throws ApiError
|
|
19906
|
-
*/
|
|
19907
|
-
static aiMentorOrgsUsersEvaluationsDatasetsRetrieve({
|
|
19908
|
-
org,
|
|
19909
|
-
userId
|
|
19910
|
-
}) {
|
|
19911
|
-
return request(OpenAPI, {
|
|
19912
|
-
method: 'GET',
|
|
19913
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/',
|
|
19914
|
-
path: {
|
|
19915
|
-
'org': org,
|
|
19916
|
-
'user_id': userId
|
|
19917
|
-
}
|
|
19918
|
-
});
|
|
19919
|
-
}
|
|
19920
|
-
/**
|
|
19921
|
-
* Create a new dataset.
|
|
19922
|
-
* @returns any No response body
|
|
19923
|
-
* @throws ApiError
|
|
19924
|
-
*/
|
|
19925
|
-
static aiMentorOrgsUsersEvaluationsDatasetsCreate({
|
|
19926
|
-
org,
|
|
19927
|
-
userId
|
|
19928
|
-
}) {
|
|
19929
|
-
return request(OpenAPI, {
|
|
19930
|
-
method: 'POST',
|
|
19931
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/',
|
|
19932
|
-
path: {
|
|
19933
|
-
'org': org,
|
|
19934
|
-
'user_id': userId
|
|
19935
|
-
}
|
|
19936
|
-
});
|
|
19937
|
-
}
|
|
19938
|
-
/**
|
|
19939
|
-
* Get a single dataset by name.
|
|
19940
|
-
* @returns any No response body
|
|
19941
|
-
* @throws ApiError
|
|
19942
|
-
*/
|
|
19943
|
-
static aiMentorOrgsUsersEvaluationsDatasetsRetrieve2({
|
|
19944
|
-
datasetName,
|
|
19945
|
-
org,
|
|
19946
|
-
userId
|
|
19947
|
-
}) {
|
|
19948
|
-
return request(OpenAPI, {
|
|
19949
|
-
method: 'GET',
|
|
19950
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/',
|
|
19951
|
-
path: {
|
|
19952
|
-
'dataset_name': datasetName,
|
|
19953
|
-
'org': org,
|
|
19954
|
-
'user_id': userId
|
|
19955
|
-
}
|
|
19956
|
-
});
|
|
19957
|
-
}
|
|
19958
|
-
/**
|
|
19959
|
-
* List items in a dataset.
|
|
19960
|
-
* @returns any No response body
|
|
19961
|
-
* @throws ApiError
|
|
19962
|
-
*/
|
|
19963
|
-
static aiMentorOrgsUsersEvaluationsDatasetsItemsRetrieve({
|
|
19964
|
-
datasetName,
|
|
19965
|
-
org,
|
|
19966
|
-
userId
|
|
19967
|
-
}) {
|
|
19968
|
-
return request(OpenAPI, {
|
|
19969
|
-
method: 'GET',
|
|
19970
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/',
|
|
19971
|
-
path: {
|
|
19972
|
-
'dataset_name': datasetName,
|
|
19973
|
-
'org': org,
|
|
19974
|
-
'user_id': userId
|
|
19975
|
-
}
|
|
19976
|
-
});
|
|
19977
|
-
}
|
|
19978
|
-
/**
|
|
19979
|
-
* Add items to a dataset from direct input or trace IDs.
|
|
19980
|
-
* @returns any No response body
|
|
19981
|
-
* @throws ApiError
|
|
19982
|
-
*/
|
|
19983
|
-
static aiMentorOrgsUsersEvaluationsDatasetsItemsCreate({
|
|
19984
|
-
datasetName,
|
|
19985
|
-
org,
|
|
19986
|
-
userId
|
|
19987
|
-
}) {
|
|
19988
|
-
return request(OpenAPI, {
|
|
19989
|
-
method: 'POST',
|
|
19990
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/',
|
|
19991
|
-
path: {
|
|
19992
|
-
'dataset_name': datasetName,
|
|
19993
|
-
'org': org,
|
|
19994
|
-
'user_id': userId
|
|
19995
|
-
}
|
|
19996
|
-
});
|
|
19997
|
-
}
|
|
19998
|
-
/**
|
|
19999
|
-
* Update a dataset item.
|
|
20000
|
-
* @returns any No response body
|
|
20001
|
-
* @throws ApiError
|
|
20002
|
-
*/
|
|
20003
|
-
static aiMentorOrgsUsersEvaluationsDatasetsItemsUpdate({
|
|
20004
|
-
datasetName,
|
|
20005
|
-
itemId,
|
|
20006
|
-
org,
|
|
20007
|
-
userId
|
|
20008
|
-
}) {
|
|
20009
|
-
return request(OpenAPI, {
|
|
20010
|
-
method: 'PUT',
|
|
20011
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/{item_id}/',
|
|
20012
|
-
path: {
|
|
20013
|
-
'dataset_name': datasetName,
|
|
20014
|
-
'item_id': itemId,
|
|
20015
|
-
'org': org,
|
|
20016
|
-
'user_id': userId
|
|
20017
|
-
}
|
|
20018
|
-
});
|
|
20019
|
-
}
|
|
20020
|
-
/**
|
|
20021
|
-
* Delete a dataset item.
|
|
20022
|
-
* @returns void
|
|
20023
|
-
* @throws ApiError
|
|
20024
|
-
*/
|
|
20025
|
-
static aiMentorOrgsUsersEvaluationsDatasetsItemsDestroy({
|
|
20026
|
-
datasetName,
|
|
20027
|
-
itemId,
|
|
20028
|
-
org,
|
|
20029
|
-
userId
|
|
20030
|
-
}) {
|
|
20031
|
-
return request(OpenAPI, {
|
|
20032
|
-
method: 'DELETE',
|
|
20033
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/{item_id}/',
|
|
20034
|
-
path: {
|
|
20035
|
-
'dataset_name': datasetName,
|
|
20036
|
-
'item_id': itemId,
|
|
20037
|
-
'org': org,
|
|
20038
|
-
'user_id': userId
|
|
20039
|
-
}
|
|
20040
|
-
});
|
|
20041
|
-
}
|
|
20042
|
-
/**
|
|
20043
|
-
* Upload a CSV file to create dataset items.
|
|
20044
|
-
* @returns any No response body
|
|
20045
|
-
* @throws ApiError
|
|
20046
|
-
*/
|
|
20047
|
-
static aiMentorOrgsUsersEvaluationsDatasetsItemsUploadCreate({
|
|
20048
|
-
datasetName,
|
|
20049
|
-
org,
|
|
20050
|
-
userId
|
|
20051
|
-
}) {
|
|
20052
|
-
return request(OpenAPI, {
|
|
20053
|
-
method: 'POST',
|
|
20054
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/upload/',
|
|
20055
|
-
path: {
|
|
20056
|
-
'dataset_name': datasetName,
|
|
20057
|
-
'org': org,
|
|
20058
|
-
'user_id': userId
|
|
20059
|
-
}
|
|
20060
|
-
});
|
|
20061
|
-
}
|
|
20062
|
-
/**
|
|
20063
|
-
* List experiment runs for a dataset.
|
|
20064
|
-
* @returns any No response body
|
|
20065
|
-
* @throws ApiError
|
|
20066
|
-
*/
|
|
20067
|
-
static aiMentorOrgsUsersEvaluationsDatasetsRunsRetrieve({
|
|
20068
|
-
datasetName,
|
|
20069
|
-
org,
|
|
20070
|
-
userId
|
|
20071
|
-
}) {
|
|
20072
|
-
return request(OpenAPI, {
|
|
20073
|
-
method: 'GET',
|
|
20074
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/',
|
|
20075
|
-
path: {
|
|
20076
|
-
'dataset_name': datasetName,
|
|
20077
|
-
'org': org,
|
|
20078
|
-
'user_id': userId
|
|
20079
|
-
}
|
|
20080
|
-
});
|
|
20081
|
-
}
|
|
20082
|
-
/**
|
|
20083
|
-
* Start an experiment — dispatches a Celery task.
|
|
20084
|
-
* @returns any No response body
|
|
20085
|
-
* @throws ApiError
|
|
20086
|
-
*/
|
|
20087
|
-
static aiMentorOrgsUsersEvaluationsDatasetsRunsCreate({
|
|
20088
|
-
datasetName,
|
|
20089
|
-
org,
|
|
20090
|
-
userId
|
|
20091
|
-
}) {
|
|
20092
|
-
return request(OpenAPI, {
|
|
20093
|
-
method: 'POST',
|
|
20094
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/',
|
|
20095
|
-
path: {
|
|
20096
|
-
'dataset_name': datasetName,
|
|
20097
|
-
'org': org,
|
|
20098
|
-
'user_id': userId
|
|
20099
|
-
}
|
|
20100
|
-
});
|
|
20101
|
-
}
|
|
20102
|
-
/**
|
|
20103
|
-
* Get experiment run details.
|
|
20104
|
-
* @returns any No response body
|
|
20105
|
-
* @throws ApiError
|
|
20106
|
-
*/
|
|
20107
|
-
static aiMentorOrgsUsersEvaluationsDatasetsRunsRetrieve2({
|
|
20108
|
-
datasetName,
|
|
20109
|
-
org,
|
|
20110
|
-
runName,
|
|
20111
|
-
userId
|
|
20112
|
-
}) {
|
|
20113
|
-
return request(OpenAPI, {
|
|
20114
|
-
method: 'GET',
|
|
20115
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/{run_name}/',
|
|
20116
|
-
path: {
|
|
20117
|
-
'dataset_name': datasetName,
|
|
20118
|
-
'org': org,
|
|
20119
|
-
'run_name': runName,
|
|
20120
|
-
'user_id': userId
|
|
20121
|
-
}
|
|
20122
|
-
});
|
|
20123
|
-
}
|
|
20124
|
-
/**
|
|
20125
|
-
* Delete an experiment run.
|
|
20126
|
-
* @returns void
|
|
20127
|
-
* @throws ApiError
|
|
20128
|
-
*/
|
|
20129
|
-
static aiMentorOrgsUsersEvaluationsDatasetsRunsDestroy({
|
|
20130
|
-
datasetName,
|
|
20131
|
-
org,
|
|
20132
|
-
runName,
|
|
20133
|
-
userId
|
|
20134
|
-
}) {
|
|
20135
|
-
return request(OpenAPI, {
|
|
20136
|
-
method: 'DELETE',
|
|
20137
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/{run_name}/',
|
|
20138
|
-
path: {
|
|
20139
|
-
'dataset_name': datasetName,
|
|
20140
|
-
'org': org,
|
|
20141
|
-
'run_name': runName,
|
|
20142
|
-
'user_id': userId
|
|
20143
|
-
}
|
|
20144
|
-
});
|
|
20145
|
-
}
|
|
20146
|
-
/**
|
|
20147
|
-
* Trigger LLM-as-Judge evaluation on a completed experiment run.
|
|
20148
|
-
* @returns any No response body
|
|
20149
|
-
* @throws ApiError
|
|
20150
|
-
*/
|
|
20151
|
-
static aiMentorOrgsUsersEvaluationsDatasetsRunsEvaluateCreate({
|
|
20152
|
-
datasetName,
|
|
20153
|
-
org,
|
|
20154
|
-
runName,
|
|
20155
|
-
userId
|
|
20156
|
-
}) {
|
|
20157
|
-
return request(OpenAPI, {
|
|
20158
|
-
method: 'POST',
|
|
20159
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/{run_name}/evaluate/',
|
|
20160
|
-
path: {
|
|
20161
|
-
'dataset_name': datasetName,
|
|
20162
|
-
'org': org,
|
|
20163
|
-
'run_name': runName,
|
|
20164
|
-
'user_id': userId
|
|
20165
|
-
}
|
|
20166
|
-
});
|
|
20167
|
-
}
|
|
20168
|
-
/**
|
|
20169
|
-
* Export experiment results as CSV.
|
|
20170
|
-
* @returns any No response body
|
|
20171
|
-
* @throws ApiError
|
|
20172
|
-
*/
|
|
20173
|
-
static aiMentorOrgsUsersEvaluationsDatasetsRunsExportRetrieve({
|
|
20174
|
-
datasetName,
|
|
20175
|
-
org,
|
|
20176
|
-
runName,
|
|
20177
|
-
userId
|
|
20178
|
-
}) {
|
|
20179
|
-
return request(OpenAPI, {
|
|
20180
|
-
method: 'GET',
|
|
20181
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/{run_name}/export/',
|
|
20182
|
-
path: {
|
|
20183
|
-
'dataset_name': datasetName,
|
|
20184
|
-
'org': org,
|
|
20185
|
-
'run_name': runName,
|
|
20186
|
-
'user_id': userId
|
|
20187
|
-
}
|
|
20188
|
-
});
|
|
20189
|
-
}
|
|
20190
|
-
/**
|
|
20191
|
-
* List score configurations.
|
|
20192
|
-
* @returns any No response body
|
|
20193
|
-
* @throws ApiError
|
|
20194
|
-
*/
|
|
20195
|
-
static aiMentorOrgsUsersEvaluationsScoreConfigsRetrieve({
|
|
20196
|
-
org,
|
|
20197
|
-
userId
|
|
20198
|
-
}) {
|
|
20199
|
-
return request(OpenAPI, {
|
|
20200
|
-
method: 'GET',
|
|
20201
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/score-configs/',
|
|
20202
|
-
path: {
|
|
20203
|
-
'org': org,
|
|
20204
|
-
'user_id': userId
|
|
20205
|
-
}
|
|
20206
|
-
});
|
|
20207
|
-
}
|
|
20208
|
-
/**
|
|
20209
|
-
* Create a score configuration.
|
|
20210
|
-
* @returns any No response body
|
|
20211
|
-
* @throws ApiError
|
|
20212
|
-
*/
|
|
20213
|
-
static aiMentorOrgsUsersEvaluationsScoreConfigsCreate({
|
|
20214
|
-
org,
|
|
20215
|
-
userId
|
|
20216
|
-
}) {
|
|
20217
|
-
return request(OpenAPI, {
|
|
20218
|
-
method: 'POST',
|
|
20219
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/score-configs/',
|
|
20220
|
-
path: {
|
|
20221
|
-
'org': org,
|
|
20222
|
-
'user_id': userId
|
|
20223
|
-
}
|
|
20224
|
-
});
|
|
20225
|
-
}
|
|
20226
|
-
/**
|
|
20227
|
-
* List scores with optional filters.
|
|
20228
|
-
* @returns any No response body
|
|
20229
|
-
* @throws ApiError
|
|
20230
|
-
*/
|
|
20231
|
-
static aiMentorOrgsUsersEvaluationsScoresRetrieve({
|
|
20232
|
-
org,
|
|
20233
|
-
userId
|
|
20234
|
-
}) {
|
|
20235
|
-
return request(OpenAPI, {
|
|
20236
|
-
method: 'GET',
|
|
20237
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/scores/',
|
|
20238
|
-
path: {
|
|
20239
|
-
'org': org,
|
|
20240
|
-
'user_id': userId
|
|
20241
|
-
}
|
|
20242
|
-
});
|
|
20243
|
-
}
|
|
20244
|
-
/**
|
|
20245
|
-
* Create a score (human annotation).
|
|
20246
|
-
* @returns any No response body
|
|
20247
|
-
* @throws ApiError
|
|
20248
|
-
*/
|
|
20249
|
-
static aiMentorOrgsUsersEvaluationsScoresCreate({
|
|
20250
|
-
org,
|
|
20251
|
-
userId
|
|
20252
|
-
}) {
|
|
20253
|
-
return request(OpenAPI, {
|
|
20254
|
-
method: 'POST',
|
|
20255
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/scores/',
|
|
20256
|
-
path: {
|
|
20257
|
-
'org': org,
|
|
20258
|
-
'user_id': userId
|
|
20259
|
-
}
|
|
20260
|
-
});
|
|
20261
|
-
}
|
|
20262
|
-
/**
|
|
20263
|
-
* Delete a score.
|
|
20264
|
-
* @returns void
|
|
20265
|
-
* @throws ApiError
|
|
20266
|
-
*/
|
|
20267
|
-
static aiMentorOrgsUsersEvaluationsScoresDestroy({
|
|
20268
|
-
org,
|
|
20269
|
-
scoreId,
|
|
20270
|
-
userId
|
|
20271
|
-
}) {
|
|
20272
|
-
return request(OpenAPI, {
|
|
20273
|
-
method: 'DELETE',
|
|
20274
|
-
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/scores/{score_id}/',
|
|
20275
|
-
path: {
|
|
20276
|
-
'org': org,
|
|
20277
|
-
'score_id': scoreId,
|
|
20278
|
-
'user_id': userId
|
|
20279
|
-
}
|
|
20280
|
-
});
|
|
20281
|
-
}
|
|
20282
19932
|
/**
|
|
20283
19933
|
* Retrieve the count of free usage credits available to a user.
|
|
20284
19934
|
*
|
|
@@ -44210,6 +43860,627 @@ class CustomDomainsService {
|
|
|
44210
43860
|
}
|
|
44211
43861
|
}
|
|
44212
43862
|
|
|
43863
|
+
class EvaluationsService {
|
|
43864
|
+
/**
|
|
43865
|
+
* List datasets
|
|
43866
|
+
* List datasets belonging to the tenant. Supports server-side filtering by name substring and creator email (matched against the cached `created_by_email` in Langfuse metadata).
|
|
43867
|
+
* @returns PaginatedDatasetList
|
|
43868
|
+
* @throws ApiError
|
|
43869
|
+
*/
|
|
43870
|
+
static evaluationsDatasetsList({
|
|
43871
|
+
org,
|
|
43872
|
+
userId,
|
|
43873
|
+
limit,
|
|
43874
|
+
name,
|
|
43875
|
+
page,
|
|
43876
|
+
userEmail
|
|
43877
|
+
}) {
|
|
43878
|
+
return request(OpenAPI, {
|
|
43879
|
+
method: 'GET',
|
|
43880
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/',
|
|
43881
|
+
path: {
|
|
43882
|
+
'org': org,
|
|
43883
|
+
'user_id': userId
|
|
43884
|
+
},
|
|
43885
|
+
query: {
|
|
43886
|
+
'limit': limit,
|
|
43887
|
+
'name': name,
|
|
43888
|
+
'page': page,
|
|
43889
|
+
'user_email': userEmail
|
|
43890
|
+
}
|
|
43891
|
+
});
|
|
43892
|
+
}
|
|
43893
|
+
/**
|
|
43894
|
+
* Create a dataset
|
|
43895
|
+
* Create a Langfuse dataset under the tenant. The creator's `username` and `user_email` are captured into metadata so future list responses can attribute the row without an extra DB lookup.
|
|
43896
|
+
* @returns Dataset
|
|
43897
|
+
* @throws ApiError
|
|
43898
|
+
*/
|
|
43899
|
+
static aiMentorOrgsUsersEvaluationsDatasetsCreate({
|
|
43900
|
+
org,
|
|
43901
|
+
userId,
|
|
43902
|
+
requestBody
|
|
43903
|
+
}) {
|
|
43904
|
+
return request(OpenAPI, {
|
|
43905
|
+
method: 'POST',
|
|
43906
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/',
|
|
43907
|
+
path: {
|
|
43908
|
+
'org': org,
|
|
43909
|
+
'user_id': userId
|
|
43910
|
+
},
|
|
43911
|
+
body: requestBody,
|
|
43912
|
+
mediaType: 'application/json',
|
|
43913
|
+
errors: {
|
|
43914
|
+
400: `Validation error.`
|
|
43915
|
+
}
|
|
43916
|
+
});
|
|
43917
|
+
}
|
|
43918
|
+
/**
|
|
43919
|
+
* Retrieve a dataset
|
|
43920
|
+
* Get a single dataset by name.
|
|
43921
|
+
* @returns Dataset
|
|
43922
|
+
* @throws ApiError
|
|
43923
|
+
*/
|
|
43924
|
+
static aiMentorOrgsUsersEvaluationsDatasetsRetrieve({
|
|
43925
|
+
datasetName,
|
|
43926
|
+
org,
|
|
43927
|
+
userId
|
|
43928
|
+
}) {
|
|
43929
|
+
return request(OpenAPI, {
|
|
43930
|
+
method: 'GET',
|
|
43931
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/',
|
|
43932
|
+
path: {
|
|
43933
|
+
'dataset_name': datasetName,
|
|
43934
|
+
'org': org,
|
|
43935
|
+
'user_id': userId
|
|
43936
|
+
},
|
|
43937
|
+
errors: {
|
|
43938
|
+
403: `Authenticated, but the resource belongs to another tenant.`,
|
|
43939
|
+
404: `Not found within the tenant.`
|
|
43940
|
+
}
|
|
43941
|
+
});
|
|
43942
|
+
}
|
|
43943
|
+
/**
|
|
43944
|
+
* List dataset items
|
|
43945
|
+
* List items in a dataset. Pass `?include_trace=true` to attach `trace_input` / `trace_output` for items linked to a source trace (one bulk ClickHouse query for the page — no per-row fan-out).
|
|
43946
|
+
* @returns PaginatedDatasetItemList
|
|
43947
|
+
* @throws ApiError
|
|
43948
|
+
*/
|
|
43949
|
+
static evaluationsDatasetItemsList({
|
|
43950
|
+
datasetName,
|
|
43951
|
+
org,
|
|
43952
|
+
userId,
|
|
43953
|
+
includeTrace,
|
|
43954
|
+
limit,
|
|
43955
|
+
page
|
|
43956
|
+
}) {
|
|
43957
|
+
return request(OpenAPI, {
|
|
43958
|
+
method: 'GET',
|
|
43959
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/',
|
|
43960
|
+
path: {
|
|
43961
|
+
'dataset_name': datasetName,
|
|
43962
|
+
'org': org,
|
|
43963
|
+
'user_id': userId
|
|
43964
|
+
},
|
|
43965
|
+
query: {
|
|
43966
|
+
'include_trace': includeTrace,
|
|
43967
|
+
'limit': limit,
|
|
43968
|
+
'page': page
|
|
43969
|
+
},
|
|
43970
|
+
errors: {
|
|
43971
|
+
404: `Not found within the tenant.`
|
|
43972
|
+
}
|
|
43973
|
+
});
|
|
43974
|
+
}
|
|
43975
|
+
/**
|
|
43976
|
+
* Add dataset items
|
|
43977
|
+
* Add items to a dataset. Provide either an `items` array of `{input, expected_output}` objects OR a `trace_ids` array to seed items from existing traces (input/expected are then copied from the trace). Exactly one of the two must be present.
|
|
43978
|
+
* @returns DatasetItemBulkCreateResponse
|
|
43979
|
+
* @throws ApiError
|
|
43980
|
+
*/
|
|
43981
|
+
static aiMentorOrgsUsersEvaluationsDatasetsItemsCreate({
|
|
43982
|
+
datasetName,
|
|
43983
|
+
org,
|
|
43984
|
+
userId,
|
|
43985
|
+
requestBody
|
|
43986
|
+
}) {
|
|
43987
|
+
return request(OpenAPI, {
|
|
43988
|
+
method: 'POST',
|
|
43989
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/',
|
|
43990
|
+
path: {
|
|
43991
|
+
'dataset_name': datasetName,
|
|
43992
|
+
'org': org,
|
|
43993
|
+
'user_id': userId
|
|
43994
|
+
},
|
|
43995
|
+
body: requestBody,
|
|
43996
|
+
mediaType: 'application/json',
|
|
43997
|
+
errors: {
|
|
43998
|
+
400: `Validation error.`,
|
|
43999
|
+
404: `Not found within the tenant.`
|
|
44000
|
+
}
|
|
44001
|
+
});
|
|
44002
|
+
}
|
|
44003
|
+
/**
|
|
44004
|
+
* Retrieve a dataset item
|
|
44005
|
+
* Retrieve a single dataset item. `trace_input` / `trace_output` are always populated when the item has a `source_trace_id` (single-row case, no fan-out concern).
|
|
44006
|
+
* @returns DatasetItem
|
|
44007
|
+
* @throws ApiError
|
|
44008
|
+
*/
|
|
44009
|
+
static aiMentorOrgsUsersEvaluationsDatasetsItemsRetrieve({
|
|
44010
|
+
datasetName,
|
|
44011
|
+
itemId,
|
|
44012
|
+
org,
|
|
44013
|
+
userId
|
|
44014
|
+
}) {
|
|
44015
|
+
return request(OpenAPI, {
|
|
44016
|
+
method: 'GET',
|
|
44017
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/{item_id}/',
|
|
44018
|
+
path: {
|
|
44019
|
+
'dataset_name': datasetName,
|
|
44020
|
+
'item_id': itemId,
|
|
44021
|
+
'org': org,
|
|
44022
|
+
'user_id': userId
|
|
44023
|
+
},
|
|
44024
|
+
errors: {
|
|
44025
|
+
404: `Not found within the tenant.`
|
|
44026
|
+
}
|
|
44027
|
+
});
|
|
44028
|
+
}
|
|
44029
|
+
/**
|
|
44030
|
+
* Update a dataset item
|
|
44031
|
+
* Update any subset of `input`, `expected_output`, `metadata`, or `status` on a dataset item. Uses Langfuse's id-based upsert.
|
|
44032
|
+
* @returns DatasetItem
|
|
44033
|
+
* @throws ApiError
|
|
44034
|
+
*/
|
|
44035
|
+
static aiMentorOrgsUsersEvaluationsDatasetsItemsUpdate({
|
|
44036
|
+
datasetName,
|
|
44037
|
+
itemId,
|
|
44038
|
+
org,
|
|
44039
|
+
userId,
|
|
44040
|
+
requestBody
|
|
44041
|
+
}) {
|
|
44042
|
+
return request(OpenAPI, {
|
|
44043
|
+
method: 'PUT',
|
|
44044
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/{item_id}/',
|
|
44045
|
+
path: {
|
|
44046
|
+
'dataset_name': datasetName,
|
|
44047
|
+
'item_id': itemId,
|
|
44048
|
+
'org': org,
|
|
44049
|
+
'user_id': userId
|
|
44050
|
+
},
|
|
44051
|
+
body: requestBody,
|
|
44052
|
+
mediaType: 'application/json',
|
|
44053
|
+
errors: {
|
|
44054
|
+
400: `Validation error.`,
|
|
44055
|
+
404: `Not found within the tenant.`
|
|
44056
|
+
}
|
|
44057
|
+
});
|
|
44058
|
+
}
|
|
44059
|
+
/**
|
|
44060
|
+
* Delete a dataset item
|
|
44061
|
+
* Delete a dataset item.
|
|
44062
|
+
* @returns void
|
|
44063
|
+
* @throws ApiError
|
|
44064
|
+
*/
|
|
44065
|
+
static aiMentorOrgsUsersEvaluationsDatasetsItemsDestroy({
|
|
44066
|
+
datasetName,
|
|
44067
|
+
itemId,
|
|
44068
|
+
org,
|
|
44069
|
+
userId
|
|
44070
|
+
}) {
|
|
44071
|
+
return request(OpenAPI, {
|
|
44072
|
+
method: 'DELETE',
|
|
44073
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/{item_id}/',
|
|
44074
|
+
path: {
|
|
44075
|
+
'dataset_name': datasetName,
|
|
44076
|
+
'item_id': itemId,
|
|
44077
|
+
'org': org,
|
|
44078
|
+
'user_id': userId
|
|
44079
|
+
},
|
|
44080
|
+
errors: {
|
|
44081
|
+
404: `Not found within the tenant.`
|
|
44082
|
+
}
|
|
44083
|
+
});
|
|
44084
|
+
}
|
|
44085
|
+
/**
|
|
44086
|
+
* Upload a CSV of dataset items
|
|
44087
|
+
* Bulk-create items from a CSV (multipart `file` field). The CSV must have an `input` column; `expected_output` is optional. Rows with empty `input` are skipped.
|
|
44088
|
+
* @returns DatasetItemBulkCreateResponse
|
|
44089
|
+
* @throws ApiError
|
|
44090
|
+
*/
|
|
44091
|
+
static aiMentorOrgsUsersEvaluationsDatasetsItemsUploadCreate({
|
|
44092
|
+
datasetName,
|
|
44093
|
+
org,
|
|
44094
|
+
userId,
|
|
44095
|
+
formData
|
|
44096
|
+
}) {
|
|
44097
|
+
return request(OpenAPI, {
|
|
44098
|
+
method: 'POST',
|
|
44099
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/upload/',
|
|
44100
|
+
path: {
|
|
44101
|
+
'dataset_name': datasetName,
|
|
44102
|
+
'org': org,
|
|
44103
|
+
'user_id': userId
|
|
44104
|
+
},
|
|
44105
|
+
formData: formData,
|
|
44106
|
+
mediaType: 'multipart/form-data',
|
|
44107
|
+
errors: {
|
|
44108
|
+
400: `Validation error.`,
|
|
44109
|
+
404: `Not found within the tenant.`
|
|
44110
|
+
}
|
|
44111
|
+
});
|
|
44112
|
+
}
|
|
44113
|
+
/**
|
|
44114
|
+
* List experiment runs
|
|
44115
|
+
* List runs for a dataset. The response merges Langfuse-persisted runs with in-flight `EvaluationTaskRecord` rows (status `pending` / `in_progress`), deduplicated by `run_name`. `pending_count` reports how many pending entries are in the page so the UI can badge in-flight work.
|
|
44116
|
+
* @returns PaginatedRunList
|
|
44117
|
+
* @throws ApiError
|
|
44118
|
+
*/
|
|
44119
|
+
static evaluationsRunsList({
|
|
44120
|
+
datasetName,
|
|
44121
|
+
org,
|
|
44122
|
+
userId,
|
|
44123
|
+
limit,
|
|
44124
|
+
page,
|
|
44125
|
+
userEmail
|
|
44126
|
+
}) {
|
|
44127
|
+
return request(OpenAPI, {
|
|
44128
|
+
method: 'GET',
|
|
44129
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/',
|
|
44130
|
+
path: {
|
|
44131
|
+
'dataset_name': datasetName,
|
|
44132
|
+
'org': org,
|
|
44133
|
+
'user_id': userId
|
|
44134
|
+
},
|
|
44135
|
+
query: {
|
|
44136
|
+
'limit': limit,
|
|
44137
|
+
'page': page,
|
|
44138
|
+
'user_email': userEmail
|
|
44139
|
+
},
|
|
44140
|
+
errors: {
|
|
44141
|
+
404: `Not found within the tenant.`
|
|
44142
|
+
}
|
|
44143
|
+
});
|
|
44144
|
+
}
|
|
44145
|
+
/**
|
|
44146
|
+
* Start an experiment run
|
|
44147
|
+
* Dispatch a Celery task that runs the chosen mentor against every item in the dataset. Returns immediately (HTTP 202) with the new task record. Poll the list endpoint (or the run-detail endpoint once Langfuse persists the run) to watch the `pending → in_progress → completed` transition.
|
|
44148
|
+
* @returns Run
|
|
44149
|
+
* @throws ApiError
|
|
44150
|
+
*/
|
|
44151
|
+
static aiMentorOrgsUsersEvaluationsDatasetsRunsCreate({
|
|
44152
|
+
datasetName,
|
|
44153
|
+
org,
|
|
44154
|
+
userId,
|
|
44155
|
+
requestBody
|
|
44156
|
+
}) {
|
|
44157
|
+
return request(OpenAPI, {
|
|
44158
|
+
method: 'POST',
|
|
44159
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/',
|
|
44160
|
+
path: {
|
|
44161
|
+
'dataset_name': datasetName,
|
|
44162
|
+
'org': org,
|
|
44163
|
+
'user_id': userId
|
|
44164
|
+
},
|
|
44165
|
+
body: requestBody,
|
|
44166
|
+
mediaType: 'application/json',
|
|
44167
|
+
errors: {
|
|
44168
|
+
400: `Validation error.`,
|
|
44169
|
+
404: `Dataset or mentor not found within the tenant.`
|
|
44170
|
+
}
|
|
44171
|
+
});
|
|
44172
|
+
}
|
|
44173
|
+
/**
|
|
44174
|
+
* Retrieve experiment run details
|
|
44175
|
+
* Returns the run header plus every `dataset_run_item` fully expanded with `input`, `expected_output`, `actual_output`, `trace_id`, and per-item `scores`. Also embeds a `pending_judges` array for any in-flight LLM-as-Judge evaluations against this run.
|
|
44176
|
+
*
|
|
44177
|
+
* Cost: 1 PG query + 2 ClickHouse queries + 1 score query regardless of run size.
|
|
44178
|
+
* @returns RunDetailResponse
|
|
44179
|
+
* @throws ApiError
|
|
44180
|
+
*/
|
|
44181
|
+
static aiMentorOrgsUsersEvaluationsDatasetsRunsRetrieve({
|
|
44182
|
+
datasetName,
|
|
44183
|
+
org,
|
|
44184
|
+
runName,
|
|
44185
|
+
userId
|
|
44186
|
+
}) {
|
|
44187
|
+
return request(OpenAPI, {
|
|
44188
|
+
method: 'GET',
|
|
44189
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/{run_name}/',
|
|
44190
|
+
path: {
|
|
44191
|
+
'dataset_name': datasetName,
|
|
44192
|
+
'org': org,
|
|
44193
|
+
'run_name': runName,
|
|
44194
|
+
'user_id': userId
|
|
44195
|
+
},
|
|
44196
|
+
errors: {
|
|
44197
|
+
403: `Authenticated, but the resource belongs to another tenant.`,
|
|
44198
|
+
404: `Not found within the tenant.`
|
|
44199
|
+
}
|
|
44200
|
+
});
|
|
44201
|
+
}
|
|
44202
|
+
/**
|
|
44203
|
+
* Delete an experiment run
|
|
44204
|
+
* Delete an experiment run.
|
|
44205
|
+
* @returns void
|
|
44206
|
+
* @throws ApiError
|
|
44207
|
+
*/
|
|
44208
|
+
static aiMentorOrgsUsersEvaluationsDatasetsRunsDestroy({
|
|
44209
|
+
datasetName,
|
|
44210
|
+
org,
|
|
44211
|
+
runName,
|
|
44212
|
+
userId
|
|
44213
|
+
}) {
|
|
44214
|
+
return request(OpenAPI, {
|
|
44215
|
+
method: 'DELETE',
|
|
44216
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/{run_name}/',
|
|
44217
|
+
path: {
|
|
44218
|
+
'dataset_name': datasetName,
|
|
44219
|
+
'org': org,
|
|
44220
|
+
'run_name': runName,
|
|
44221
|
+
'user_id': userId
|
|
44222
|
+
},
|
|
44223
|
+
errors: {
|
|
44224
|
+
403: `Authenticated, but the resource belongs to another tenant.`,
|
|
44225
|
+
404: `Not found within the tenant.`
|
|
44226
|
+
}
|
|
44227
|
+
});
|
|
44228
|
+
}
|
|
44229
|
+
/**
|
|
44230
|
+
* List LLM-as-Judge evaluations for a run
|
|
44231
|
+
* Returns every judge task record (any status) targeting this run. Useful for showing an 'Evaluations' history on a run-detail view, including failed and pending ones.
|
|
44232
|
+
* @returns PaginatedJudgeList
|
|
44233
|
+
* @throws ApiError
|
|
44234
|
+
*/
|
|
44235
|
+
static evaluationsRunJudgesList({
|
|
44236
|
+
datasetName,
|
|
44237
|
+
org,
|
|
44238
|
+
runName,
|
|
44239
|
+
userId,
|
|
44240
|
+
limit,
|
|
44241
|
+
page,
|
|
44242
|
+
status,
|
|
44243
|
+
userEmail
|
|
44244
|
+
}) {
|
|
44245
|
+
return request(OpenAPI, {
|
|
44246
|
+
method: 'GET',
|
|
44247
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/{run_name}/evaluate/',
|
|
44248
|
+
path: {
|
|
44249
|
+
'dataset_name': datasetName,
|
|
44250
|
+
'org': org,
|
|
44251
|
+
'run_name': runName,
|
|
44252
|
+
'user_id': userId
|
|
44253
|
+
},
|
|
44254
|
+
query: {
|
|
44255
|
+
'limit': limit,
|
|
44256
|
+
'page': page,
|
|
44257
|
+
'status': status,
|
|
44258
|
+
'user_email': userEmail
|
|
44259
|
+
}
|
|
44260
|
+
});
|
|
44261
|
+
}
|
|
44262
|
+
/**
|
|
44263
|
+
* Start an LLM-as-Judge evaluation
|
|
44264
|
+
* Dispatch a Celery task that runs a separate LLM over every item in the run, scoring the actual output against the input + expected output using the provided criteria. The judge's score lands in Langfuse with `score_name`, and its reasoning is stored in the score's `comment`.
|
|
44265
|
+
*
|
|
44266
|
+
* Returns immediately (HTTP 202) with the new task record. The task transitions through `pending → in_progress → completed` (or `failed`); poll the list endpoint or the run-detail endpoint to watch.
|
|
44267
|
+
* @returns JudgeRecord
|
|
44268
|
+
* @throws ApiError
|
|
44269
|
+
*/
|
|
44270
|
+
static evaluationsRunJudgeCreate({
|
|
44271
|
+
datasetName,
|
|
44272
|
+
org,
|
|
44273
|
+
runName,
|
|
44274
|
+
userId,
|
|
44275
|
+
requestBody
|
|
44276
|
+
}) {
|
|
44277
|
+
return request(OpenAPI, {
|
|
44278
|
+
method: 'POST',
|
|
44279
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/{run_name}/evaluate/',
|
|
44280
|
+
path: {
|
|
44281
|
+
'dataset_name': datasetName,
|
|
44282
|
+
'org': org,
|
|
44283
|
+
'run_name': runName,
|
|
44284
|
+
'user_id': userId
|
|
44285
|
+
},
|
|
44286
|
+
body: requestBody,
|
|
44287
|
+
mediaType: 'application/json',
|
|
44288
|
+
errors: {
|
|
44289
|
+
400: `Empty run or invalid input.`,
|
|
44290
|
+
404: `Not found within the tenant.`
|
|
44291
|
+
}
|
|
44292
|
+
});
|
|
44293
|
+
}
|
|
44294
|
+
/**
|
|
44295
|
+
* Export experiment results as CSV
|
|
44296
|
+
* Download the run as a CSV. Columns: `item_id`, `input`, `expected_output`, `trace_id`, `actual_output`, and one `score_<name>` column per distinct score name in the run.
|
|
44297
|
+
* @returns binary CSV file download.
|
|
44298
|
+
* @throws ApiError
|
|
44299
|
+
*/
|
|
44300
|
+
static aiMentorOrgsUsersEvaluationsDatasetsRunsExportRetrieve({
|
|
44301
|
+
datasetName,
|
|
44302
|
+
org,
|
|
44303
|
+
runName,
|
|
44304
|
+
userId
|
|
44305
|
+
}) {
|
|
44306
|
+
return request(OpenAPI, {
|
|
44307
|
+
method: 'GET',
|
|
44308
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/{run_name}/export/',
|
|
44309
|
+
path: {
|
|
44310
|
+
'dataset_name': datasetName,
|
|
44311
|
+
'org': org,
|
|
44312
|
+
'run_name': runName,
|
|
44313
|
+
'user_id': userId
|
|
44314
|
+
},
|
|
44315
|
+
errors: {
|
|
44316
|
+
403: `Authenticated, but the resource belongs to another tenant.`,
|
|
44317
|
+
404: `Not found within the tenant.`
|
|
44318
|
+
}
|
|
44319
|
+
});
|
|
44320
|
+
}
|
|
44321
|
+
/**
|
|
44322
|
+
* List LLM-as-Judge evaluations (tenant-wide)
|
|
44323
|
+
* Returns every judge task record in the tenant, across all datasets and runs. Useful for a tenant-wide 'Evaluations' inbox.
|
|
44324
|
+
* @returns PaginatedJudgeList
|
|
44325
|
+
* @throws ApiError
|
|
44326
|
+
*/
|
|
44327
|
+
static evaluationsJudgesGlobalList({
|
|
44328
|
+
org,
|
|
44329
|
+
userId,
|
|
44330
|
+
datasetName,
|
|
44331
|
+
limit,
|
|
44332
|
+
page,
|
|
44333
|
+
status,
|
|
44334
|
+
userEmail
|
|
44335
|
+
}) {
|
|
44336
|
+
return request(OpenAPI, {
|
|
44337
|
+
method: 'GET',
|
|
44338
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/judges/',
|
|
44339
|
+
path: {
|
|
44340
|
+
'org': org,
|
|
44341
|
+
'user_id': userId
|
|
44342
|
+
},
|
|
44343
|
+
query: {
|
|
44344
|
+
'dataset_name': datasetName,
|
|
44345
|
+
'limit': limit,
|
|
44346
|
+
'page': page,
|
|
44347
|
+
'status': status,
|
|
44348
|
+
'user_email': userEmail
|
|
44349
|
+
}
|
|
44350
|
+
});
|
|
44351
|
+
}
|
|
44352
|
+
/**
|
|
44353
|
+
* List score configurations
|
|
44354
|
+
* Score configurations define reusable rubrics (numeric ranges, boolean, or categorical labels). They are optional — scores work without one — but useful for enforcing consistent grading.
|
|
44355
|
+
* @returns PaginatedScoreConfigList
|
|
44356
|
+
* @throws ApiError
|
|
44357
|
+
*/
|
|
44358
|
+
static aiMentorOrgsUsersEvaluationsScoreConfigsRetrieve({
|
|
44359
|
+
org,
|
|
44360
|
+
userId,
|
|
44361
|
+
limit,
|
|
44362
|
+
page
|
|
44363
|
+
}) {
|
|
44364
|
+
return request(OpenAPI, {
|
|
44365
|
+
method: 'GET',
|
|
44366
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/score-configs/',
|
|
44367
|
+
path: {
|
|
44368
|
+
'org': org,
|
|
44369
|
+
'user_id': userId
|
|
44370
|
+
},
|
|
44371
|
+
query: {
|
|
44372
|
+
'limit': limit,
|
|
44373
|
+
'page': page
|
|
44374
|
+
}
|
|
44375
|
+
});
|
|
44376
|
+
}
|
|
44377
|
+
/**
|
|
44378
|
+
* Create a score configuration
|
|
44379
|
+
* Create a score configuration.
|
|
44380
|
+
* @returns ScoreConfig
|
|
44381
|
+
* @throws ApiError
|
|
44382
|
+
*/
|
|
44383
|
+
static aiMentorOrgsUsersEvaluationsScoreConfigsCreate({
|
|
44384
|
+
org,
|
|
44385
|
+
userId,
|
|
44386
|
+
requestBody
|
|
44387
|
+
}) {
|
|
44388
|
+
return request(OpenAPI, {
|
|
44389
|
+
method: 'POST',
|
|
44390
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/score-configs/',
|
|
44391
|
+
path: {
|
|
44392
|
+
'org': org,
|
|
44393
|
+
'user_id': userId
|
|
44394
|
+
},
|
|
44395
|
+
body: requestBody,
|
|
44396
|
+
mediaType: 'application/json',
|
|
44397
|
+
errors: {
|
|
44398
|
+
400: `Validation error.`
|
|
44399
|
+
}
|
|
44400
|
+
});
|
|
44401
|
+
}
|
|
44402
|
+
/**
|
|
44403
|
+
* List scores
|
|
44404
|
+
* List scores (human annotations and LLM-judge results) with optional filters. Pair `dataset_run_id` with a run id to scope to one experiment; pass `trace_id` to scope to a single chat turn or mentor invocation.
|
|
44405
|
+
* @returns PaginatedScoreList
|
|
44406
|
+
* @throws ApiError
|
|
44407
|
+
*/
|
|
44408
|
+
static aiMentorOrgsUsersEvaluationsScoresRetrieve({
|
|
44409
|
+
org,
|
|
44410
|
+
userId,
|
|
44411
|
+
datasetRunId,
|
|
44412
|
+
limit,
|
|
44413
|
+
name,
|
|
44414
|
+
page,
|
|
44415
|
+
traceId
|
|
44416
|
+
}) {
|
|
44417
|
+
return request(OpenAPI, {
|
|
44418
|
+
method: 'GET',
|
|
44419
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/scores/',
|
|
44420
|
+
path: {
|
|
44421
|
+
'org': org,
|
|
44422
|
+
'user_id': userId
|
|
44423
|
+
},
|
|
44424
|
+
query: {
|
|
44425
|
+
'dataset_run_id': datasetRunId,
|
|
44426
|
+
'limit': limit,
|
|
44427
|
+
'name': name,
|
|
44428
|
+
'page': page,
|
|
44429
|
+
'trace_id': traceId
|
|
44430
|
+
}
|
|
44431
|
+
});
|
|
44432
|
+
}
|
|
44433
|
+
/**
|
|
44434
|
+
* Create a score
|
|
44435
|
+
* Create a score on a trace or observation. Use this to record human grading of a single chat message (pass the chat frame's `generation_id` as `trace_id`) or to score an experiment-run item (also pass `dataset_run_id` so the score shows up in the run's CSV export).
|
|
44436
|
+
* @returns ScoreCreateResponse
|
|
44437
|
+
* @throws ApiError
|
|
44438
|
+
*/
|
|
44439
|
+
static aiMentorOrgsUsersEvaluationsScoresCreate({
|
|
44440
|
+
org,
|
|
44441
|
+
userId,
|
|
44442
|
+
requestBody
|
|
44443
|
+
}) {
|
|
44444
|
+
return request(OpenAPI, {
|
|
44445
|
+
method: 'POST',
|
|
44446
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/scores/',
|
|
44447
|
+
path: {
|
|
44448
|
+
'org': org,
|
|
44449
|
+
'user_id': userId
|
|
44450
|
+
},
|
|
44451
|
+
body: requestBody,
|
|
44452
|
+
mediaType: 'application/json',
|
|
44453
|
+
errors: {
|
|
44454
|
+
400: `Validation error.`
|
|
44455
|
+
}
|
|
44456
|
+
});
|
|
44457
|
+
}
|
|
44458
|
+
/**
|
|
44459
|
+
* Delete a score
|
|
44460
|
+
* Delete a score.
|
|
44461
|
+
* @returns void
|
|
44462
|
+
* @throws ApiError
|
|
44463
|
+
*/
|
|
44464
|
+
static aiMentorOrgsUsersEvaluationsScoresDestroy({
|
|
44465
|
+
org,
|
|
44466
|
+
scoreId,
|
|
44467
|
+
userId
|
|
44468
|
+
}) {
|
|
44469
|
+
return request(OpenAPI, {
|
|
44470
|
+
method: 'DELETE',
|
|
44471
|
+
url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/scores/{score_id}/',
|
|
44472
|
+
path: {
|
|
44473
|
+
'org': org,
|
|
44474
|
+
'score_id': scoreId,
|
|
44475
|
+
'user_id': userId
|
|
44476
|
+
},
|
|
44477
|
+
errors: {
|
|
44478
|
+
404: `Not found within the tenant.`
|
|
44479
|
+
}
|
|
44480
|
+
});
|
|
44481
|
+
}
|
|
44482
|
+
}
|
|
44483
|
+
|
|
44213
44484
|
class FeaturesService {
|
|
44214
44485
|
/**
|
|
44215
44486
|
* Returns a list of the apps that the user has access to.
|
|
@@ -48097,6 +48368,7 @@ exports.CoreService = CoreService;
|
|
|
48097
48368
|
exports.CredentialsService = CredentialsService;
|
|
48098
48369
|
exports.CreditsService = CreditsService;
|
|
48099
48370
|
exports.CustomDomainsService = CustomDomainsService;
|
|
48371
|
+
exports.EvaluationsService = EvaluationsService;
|
|
48100
48372
|
exports.FeaturesService = FeaturesService;
|
|
48101
48373
|
exports.ItemsService = ItemsService;
|
|
48102
48374
|
exports.MediaService = MediaService;
|