@iblai/iblai-api 4.253.3-ai → 4.254.0-ai

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (69)
  1. package/dist/index.cjs.js +653 -381
  2. package/dist/index.cjs.js.map +1 -1
  3. package/dist/index.esm.js +653 -382
  4. package/dist/index.esm.js.map +1 -1
  5. package/dist/index.umd.js +653 -381
  6. package/dist/index.umd.js.map +1 -1
  7. package/dist/types/index.d.ts +28 -0
  8. package/dist/types/models/DataTypeEnum.d.ts +10 -0
  9. package/dist/types/models/Dataset.d.ts +12 -0
  10. package/dist/types/models/DatasetCreate.d.ts +8 -0
  11. package/dist/types/models/DatasetItem.d.ts +20 -0
  12. package/dist/types/models/DatasetItemBulkCreateResponse.d.ts +5 -0
  13. package/dist/types/models/DatasetItemCreate.d.ts +10 -0
  14. package/dist/types/models/DatasetItemInput.d.ts +7 -0
  15. package/dist/types/models/DatasetItemUpdate.d.ts +10 -0
  16. package/dist/types/models/DatasetItemUpdateStatusEnum.d.ts +8 -0
  17. package/dist/types/models/DatasetRunItem.d.ts +16 -0
  18. package/dist/types/models/ExperimentCreate.d.ts +8 -0
  19. package/dist/types/models/JudgeRecord.d.ts +18 -0
  20. package/dist/types/models/LLMJudge.d.ts +10 -0
  21. package/dist/types/models/PaginatedDatasetItemList.d.ts +7 -0
  22. package/dist/types/models/PaginatedDatasetList.d.ts +7 -0
  23. package/dist/types/models/PaginatedJudgeList.d.ts +7 -0
  24. package/dist/types/models/PaginatedRunList.d.ts +7 -0
  25. package/dist/types/models/PaginatedScoreConfigList.d.ts +7 -0
  26. package/dist/types/models/PaginatedScoreList.d.ts +7 -0
  27. package/dist/types/models/Run.d.ts +19 -0
  28. package/dist/types/models/RunDetailResponse.d.ts +19 -0
  29. package/dist/types/models/Score.d.ts +17 -0
  30. package/dist/types/models/ScoreConfig.d.ts +12 -0
  31. package/dist/types/models/ScoreConfigCategory.d.ts +7 -0
  32. package/dist/types/models/ScoreConfigCreate.d.ts +13 -0
  33. package/dist/types/models/ScoreCreate.d.ts +14 -0
  34. package/dist/types/models/ScoreCreateResponse.d.ts +7 -0
  35. package/dist/types/services/AiMentorService.d.ts +0 -171
  36. package/dist/types/services/EvaluationsService.d.ts +353 -0
  37. package/package.json +1 -1
  38. package/sdk_schema.yml +1512 -299
  39. package/src/core/OpenAPI.ts +1 -1
  40. package/src/index.ts +28 -0
  41. package/src/models/DataTypeEnum.ts +14 -0
  42. package/src/models/Dataset.ts +17 -0
  43. package/src/models/DatasetCreate.ts +13 -0
  44. package/src/models/DatasetItem.ts +25 -0
  45. package/src/models/DatasetItemBulkCreateResponse.ts +10 -0
  46. package/src/models/DatasetItemCreate.ts +15 -0
  47. package/src/models/DatasetItemInput.ts +12 -0
  48. package/src/models/DatasetItemUpdate.ts +15 -0
  49. package/src/models/DatasetItemUpdateStatusEnum.ts +12 -0
  50. package/src/models/DatasetRunItem.ts +21 -0
  51. package/src/models/ExperimentCreate.ts +13 -0
  52. package/src/models/JudgeRecord.ts +23 -0
  53. package/src/models/LLMJudge.ts +15 -0
  54. package/src/models/PaginatedDatasetItemList.ts +12 -0
  55. package/src/models/PaginatedDatasetList.ts +12 -0
  56. package/src/models/PaginatedJudgeList.ts +12 -0
  57. package/src/models/PaginatedRunList.ts +12 -0
  58. package/src/models/PaginatedScoreConfigList.ts +12 -0
  59. package/src/models/PaginatedScoreList.ts +12 -0
  60. package/src/models/Run.ts +24 -0
  61. package/src/models/RunDetailResponse.ts +24 -0
  62. package/src/models/Score.ts +22 -0
  63. package/src/models/ScoreConfig.ts +17 -0
  64. package/src/models/ScoreConfigCategory.ts +12 -0
  65. package/src/models/ScoreConfigCreate.ts +18 -0
  66. package/src/models/ScoreCreate.ts +19 -0
  67. package/src/models/ScoreCreateResponse.ts +12 -0
  68. package/src/services/AiMentorService.ts +0 -456
  69. package/src/services/EvaluationsService.ts +851 -0
package/dist/index.cjs.js CHANGED
@@ -110,7 +110,7 @@ class CancelablePromise {
110
110
 
111
111
  const OpenAPI = {
112
112
  BASE: 'https://base.manager.iblai.app',
113
- VERSION: '4.253.3-ai-plus',
113
+ VERSION: '4.254.0-ai-plus',
114
114
  WITH_CREDENTIALS: false,
115
115
  CREDENTIALS: 'include',
116
116
  TOKEN: undefined,
@@ -405,6 +405,36 @@ exports.CreditTransactionHistoryStatusEnum = void 0;
405
405
  CreditTransactionHistoryStatusEnum["CANCELLED"] = "cancelled";
406
406
  })(exports.CreditTransactionHistoryStatusEnum || (exports.CreditTransactionHistoryStatusEnum = {}));
407
407
 
408
+ /* generated using openapi-typescript-codegen -- do not edit */
409
+ /* istanbul ignore file */
410
+ /* tslint:disable */
411
+ /* eslint-disable */
412
+ /**
413
+ * * `ACTIVE` - ACTIVE
414
+ * * `ARCHIVED` - ARCHIVED
415
+ */
416
+ exports.DatasetItemUpdateStatusEnum = void 0;
417
+ (function (DatasetItemUpdateStatusEnum) {
418
+ DatasetItemUpdateStatusEnum["ACTIVE"] = "ACTIVE";
419
+ DatasetItemUpdateStatusEnum["ARCHIVED"] = "ARCHIVED";
420
+ })(exports.DatasetItemUpdateStatusEnum || (exports.DatasetItemUpdateStatusEnum = {}));
421
+
422
+ /* generated using openapi-typescript-codegen -- do not edit */
423
+ /* istanbul ignore file */
424
+ /* tslint:disable */
425
+ /* eslint-disable */
426
+ /**
427
+ * * `NUMERIC` - NUMERIC
428
+ * * `BOOLEAN` - BOOLEAN
429
+ * * `CATEGORICAL` - CATEGORICAL
430
+ */
431
+ exports.DataTypeEnum = void 0;
432
+ (function (DataTypeEnum) {
433
+ DataTypeEnum["NUMERIC"] = "NUMERIC";
434
+ DataTypeEnum["BOOLEAN"] = "BOOLEAN";
435
+ DataTypeEnum["CATEGORICAL"] = "CATEGORICAL";
436
+ })(exports.DataTypeEnum || (exports.DataTypeEnum = {}));
437
+
408
438
  /* generated using openapi-typescript-codegen -- do not edit */
409
439
  /* istanbul ignore file */
410
440
  /* tslint:disable */
@@ -19899,386 +19929,6 @@ class AiMentorService {
19899
19929
  }
19900
19930
  });
19901
19931
  }
19902
- /**
19903
- * List datasets belonging to the tenant.
19904
- * @returns any No response body
19905
- * @throws ApiError
19906
- */
19907
- static aiMentorOrgsUsersEvaluationsDatasetsRetrieve({
19908
- org,
19909
- userId
19910
- }) {
19911
- return request(OpenAPI, {
19912
- method: 'GET',
19913
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/',
19914
- path: {
19915
- 'org': org,
19916
- 'user_id': userId
19917
- }
19918
- });
19919
- }
19920
- /**
19921
- * Create a new dataset.
19922
- * @returns any No response body
19923
- * @throws ApiError
19924
- */
19925
- static aiMentorOrgsUsersEvaluationsDatasetsCreate({
19926
- org,
19927
- userId
19928
- }) {
19929
- return request(OpenAPI, {
19930
- method: 'POST',
19931
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/',
19932
- path: {
19933
- 'org': org,
19934
- 'user_id': userId
19935
- }
19936
- });
19937
- }
19938
- /**
19939
- * Get a single dataset by name.
19940
- * @returns any No response body
19941
- * @throws ApiError
19942
- */
19943
- static aiMentorOrgsUsersEvaluationsDatasetsRetrieve2({
19944
- datasetName,
19945
- org,
19946
- userId
19947
- }) {
19948
- return request(OpenAPI, {
19949
- method: 'GET',
19950
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/',
19951
- path: {
19952
- 'dataset_name': datasetName,
19953
- 'org': org,
19954
- 'user_id': userId
19955
- }
19956
- });
19957
- }
19958
- /**
19959
- * List items in a dataset.
19960
- * @returns any No response body
19961
- * @throws ApiError
19962
- */
19963
- static aiMentorOrgsUsersEvaluationsDatasetsItemsRetrieve({
19964
- datasetName,
19965
- org,
19966
- userId
19967
- }) {
19968
- return request(OpenAPI, {
19969
- method: 'GET',
19970
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/',
19971
- path: {
19972
- 'dataset_name': datasetName,
19973
- 'org': org,
19974
- 'user_id': userId
19975
- }
19976
- });
19977
- }
19978
- /**
19979
- * Add items to a dataset from direct input or trace IDs.
19980
- * @returns any No response body
19981
- * @throws ApiError
19982
- */
19983
- static aiMentorOrgsUsersEvaluationsDatasetsItemsCreate({
19984
- datasetName,
19985
- org,
19986
- userId
19987
- }) {
19988
- return request(OpenAPI, {
19989
- method: 'POST',
19990
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/',
19991
- path: {
19992
- 'dataset_name': datasetName,
19993
- 'org': org,
19994
- 'user_id': userId
19995
- }
19996
- });
19997
- }
19998
- /**
19999
- * Update a dataset item.
20000
- * @returns any No response body
20001
- * @throws ApiError
20002
- */
20003
- static aiMentorOrgsUsersEvaluationsDatasetsItemsUpdate({
20004
- datasetName,
20005
- itemId,
20006
- org,
20007
- userId
20008
- }) {
20009
- return request(OpenAPI, {
20010
- method: 'PUT',
20011
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/{item_id}/',
20012
- path: {
20013
- 'dataset_name': datasetName,
20014
- 'item_id': itemId,
20015
- 'org': org,
20016
- 'user_id': userId
20017
- }
20018
- });
20019
- }
20020
- /**
20021
- * Delete a dataset item.
20022
- * @returns void
20023
- * @throws ApiError
20024
- */
20025
- static aiMentorOrgsUsersEvaluationsDatasetsItemsDestroy({
20026
- datasetName,
20027
- itemId,
20028
- org,
20029
- userId
20030
- }) {
20031
- return request(OpenAPI, {
20032
- method: 'DELETE',
20033
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/{item_id}/',
20034
- path: {
20035
- 'dataset_name': datasetName,
20036
- 'item_id': itemId,
20037
- 'org': org,
20038
- 'user_id': userId
20039
- }
20040
- });
20041
- }
20042
- /**
20043
- * Upload a CSV file to create dataset items.
20044
- * @returns any No response body
20045
- * @throws ApiError
20046
- */
20047
- static aiMentorOrgsUsersEvaluationsDatasetsItemsUploadCreate({
20048
- datasetName,
20049
- org,
20050
- userId
20051
- }) {
20052
- return request(OpenAPI, {
20053
- method: 'POST',
20054
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/upload/',
20055
- path: {
20056
- 'dataset_name': datasetName,
20057
- 'org': org,
20058
- 'user_id': userId
20059
- }
20060
- });
20061
- }
20062
- /**
20063
- * List experiment runs for a dataset.
20064
- * @returns any No response body
20065
- * @throws ApiError
20066
- */
20067
- static aiMentorOrgsUsersEvaluationsDatasetsRunsRetrieve({
20068
- datasetName,
20069
- org,
20070
- userId
20071
- }) {
20072
- return request(OpenAPI, {
20073
- method: 'GET',
20074
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/',
20075
- path: {
20076
- 'dataset_name': datasetName,
20077
- 'org': org,
20078
- 'user_id': userId
20079
- }
20080
- });
20081
- }
20082
- /**
20083
- * Start an experiment — dispatches a Celery task.
20084
- * @returns any No response body
20085
- * @throws ApiError
20086
- */
20087
- static aiMentorOrgsUsersEvaluationsDatasetsRunsCreate({
20088
- datasetName,
20089
- org,
20090
- userId
20091
- }) {
20092
- return request(OpenAPI, {
20093
- method: 'POST',
20094
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/',
20095
- path: {
20096
- 'dataset_name': datasetName,
20097
- 'org': org,
20098
- 'user_id': userId
20099
- }
20100
- });
20101
- }
20102
- /**
20103
- * Get experiment run details.
20104
- * @returns any No response body
20105
- * @throws ApiError
20106
- */
20107
- static aiMentorOrgsUsersEvaluationsDatasetsRunsRetrieve2({
20108
- datasetName,
20109
- org,
20110
- runName,
20111
- userId
20112
- }) {
20113
- return request(OpenAPI, {
20114
- method: 'GET',
20115
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/{run_name}/',
20116
- path: {
20117
- 'dataset_name': datasetName,
20118
- 'org': org,
20119
- 'run_name': runName,
20120
- 'user_id': userId
20121
- }
20122
- });
20123
- }
20124
- /**
20125
- * Delete an experiment run.
20126
- * @returns void
20127
- * @throws ApiError
20128
- */
20129
- static aiMentorOrgsUsersEvaluationsDatasetsRunsDestroy({
20130
- datasetName,
20131
- org,
20132
- runName,
20133
- userId
20134
- }) {
20135
- return request(OpenAPI, {
20136
- method: 'DELETE',
20137
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/{run_name}/',
20138
- path: {
20139
- 'dataset_name': datasetName,
20140
- 'org': org,
20141
- 'run_name': runName,
20142
- 'user_id': userId
20143
- }
20144
- });
20145
- }
20146
- /**
20147
- * Trigger LLM-as-Judge evaluation on a completed experiment run.
20148
- * @returns any No response body
20149
- * @throws ApiError
20150
- */
20151
- static aiMentorOrgsUsersEvaluationsDatasetsRunsEvaluateCreate({
20152
- datasetName,
20153
- org,
20154
- runName,
20155
- userId
20156
- }) {
20157
- return request(OpenAPI, {
20158
- method: 'POST',
20159
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/{run_name}/evaluate/',
20160
- path: {
20161
- 'dataset_name': datasetName,
20162
- 'org': org,
20163
- 'run_name': runName,
20164
- 'user_id': userId
20165
- }
20166
- });
20167
- }
20168
- /**
20169
- * Export experiment results as CSV.
20170
- * @returns any No response body
20171
- * @throws ApiError
20172
- */
20173
- static aiMentorOrgsUsersEvaluationsDatasetsRunsExportRetrieve({
20174
- datasetName,
20175
- org,
20176
- runName,
20177
- userId
20178
- }) {
20179
- return request(OpenAPI, {
20180
- method: 'GET',
20181
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/{run_name}/export/',
20182
- path: {
20183
- 'dataset_name': datasetName,
20184
- 'org': org,
20185
- 'run_name': runName,
20186
- 'user_id': userId
20187
- }
20188
- });
20189
- }
20190
- /**
20191
- * List score configurations.
20192
- * @returns any No response body
20193
- * @throws ApiError
20194
- */
20195
- static aiMentorOrgsUsersEvaluationsScoreConfigsRetrieve({
20196
- org,
20197
- userId
20198
- }) {
20199
- return request(OpenAPI, {
20200
- method: 'GET',
20201
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/score-configs/',
20202
- path: {
20203
- 'org': org,
20204
- 'user_id': userId
20205
- }
20206
- });
20207
- }
20208
- /**
20209
- * Create a score configuration.
20210
- * @returns any No response body
20211
- * @throws ApiError
20212
- */
20213
- static aiMentorOrgsUsersEvaluationsScoreConfigsCreate({
20214
- org,
20215
- userId
20216
- }) {
20217
- return request(OpenAPI, {
20218
- method: 'POST',
20219
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/score-configs/',
20220
- path: {
20221
- 'org': org,
20222
- 'user_id': userId
20223
- }
20224
- });
20225
- }
20226
- /**
20227
- * List scores with optional filters.
20228
- * @returns any No response body
20229
- * @throws ApiError
20230
- */
20231
- static aiMentorOrgsUsersEvaluationsScoresRetrieve({
20232
- org,
20233
- userId
20234
- }) {
20235
- return request(OpenAPI, {
20236
- method: 'GET',
20237
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/scores/',
20238
- path: {
20239
- 'org': org,
20240
- 'user_id': userId
20241
- }
20242
- });
20243
- }
20244
- /**
20245
- * Create a score (human annotation).
20246
- * @returns any No response body
20247
- * @throws ApiError
20248
- */
20249
- static aiMentorOrgsUsersEvaluationsScoresCreate({
20250
- org,
20251
- userId
20252
- }) {
20253
- return request(OpenAPI, {
20254
- method: 'POST',
20255
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/scores/',
20256
- path: {
20257
- 'org': org,
20258
- 'user_id': userId
20259
- }
20260
- });
20261
- }
20262
- /**
20263
- * Delete a score.
20264
- * @returns void
20265
- * @throws ApiError
20266
- */
20267
- static aiMentorOrgsUsersEvaluationsScoresDestroy({
20268
- org,
20269
- scoreId,
20270
- userId
20271
- }) {
20272
- return request(OpenAPI, {
20273
- method: 'DELETE',
20274
- url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/scores/{score_id}/',
20275
- path: {
20276
- 'org': org,
20277
- 'score_id': scoreId,
20278
- 'user_id': userId
20279
- }
20280
- });
20281
- }
20282
19932
  /**
20283
19933
  * Retrieve the count of free usage credits available to a user.
20284
19934
  *
@@ -44210,6 +43860,627 @@ class CustomDomainsService {
44210
43860
  }
44211
43861
  }
44212
43862
 
43863
+ class EvaluationsService {
43864
+ /**
43865
+ * List datasets
43866
+ * List datasets belonging to the tenant. Supports server-side filtering by name substring and creator email (matched against the cached `created_by_email` in Langfuse metadata).
43867
+ * @returns PaginatedDatasetList
43868
+ * @throws ApiError
43869
+ */
43870
+ static evaluationsDatasetsList({
43871
+ org,
43872
+ userId,
43873
+ limit,
43874
+ name,
43875
+ page,
43876
+ userEmail
43877
+ }) {
43878
+ return request(OpenAPI, {
43879
+ method: 'GET',
43880
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/',
43881
+ path: {
43882
+ 'org': org,
43883
+ 'user_id': userId
43884
+ },
43885
+ query: {
43886
+ 'limit': limit,
43887
+ 'name': name,
43888
+ 'page': page,
43889
+ 'user_email': userEmail
43890
+ }
43891
+ });
43892
+ }
43893
+ /**
43894
+ * Create a dataset
43895
+ * Create a Langfuse dataset under the tenant. The creator's `username` and `user_email` are captured into metadata so future list responses can attribute the row without an extra DB lookup.
43896
+ * @returns Dataset
43897
+ * @throws ApiError
43898
+ */
43899
+ static aiMentorOrgsUsersEvaluationsDatasetsCreate({
43900
+ org,
43901
+ userId,
43902
+ requestBody
43903
+ }) {
43904
+ return request(OpenAPI, {
43905
+ method: 'POST',
43906
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/',
43907
+ path: {
43908
+ 'org': org,
43909
+ 'user_id': userId
43910
+ },
43911
+ body: requestBody,
43912
+ mediaType: 'application/json',
43913
+ errors: {
43914
+ 400: `Validation error.`
43915
+ }
43916
+ });
43917
+ }
43918
+ /**
43919
+ * Retrieve a dataset
43920
+ * Get a single dataset by name.
43921
+ * @returns Dataset
43922
+ * @throws ApiError
43923
+ */
43924
+ static aiMentorOrgsUsersEvaluationsDatasetsRetrieve({
43925
+ datasetName,
43926
+ org,
43927
+ userId
43928
+ }) {
43929
+ return request(OpenAPI, {
43930
+ method: 'GET',
43931
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/',
43932
+ path: {
43933
+ 'dataset_name': datasetName,
43934
+ 'org': org,
43935
+ 'user_id': userId
43936
+ },
43937
+ errors: {
43938
+ 403: `Authenticated, but the resource belongs to another tenant.`,
43939
+ 404: `Not found within the tenant.`
43940
+ }
43941
+ });
43942
+ }
43943
+ /**
43944
+ * List dataset items
43945
+ * List items in a dataset. Pass `?include_trace=true` to attach `trace_input` / `trace_output` for items linked to a source trace (one bulk ClickHouse query for the page — no per-row fan-out).
43946
+ * @returns PaginatedDatasetItemList
43947
+ * @throws ApiError
43948
+ */
43949
+ static evaluationsDatasetItemsList({
43950
+ datasetName,
43951
+ org,
43952
+ userId,
43953
+ includeTrace,
43954
+ limit,
43955
+ page
43956
+ }) {
43957
+ return request(OpenAPI, {
43958
+ method: 'GET',
43959
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/',
43960
+ path: {
43961
+ 'dataset_name': datasetName,
43962
+ 'org': org,
43963
+ 'user_id': userId
43964
+ },
43965
+ query: {
43966
+ 'include_trace': includeTrace,
43967
+ 'limit': limit,
43968
+ 'page': page
43969
+ },
43970
+ errors: {
43971
+ 404: `Not found within the tenant.`
43972
+ }
43973
+ });
43974
+ }
43975
+ /**
43976
+ * Add dataset items
43977
+ * Add items to a dataset. Provide either an `items` array of `{input, expected_output}` objects OR a `trace_ids` array to seed items from existing traces (input/expected are then copied from the trace). Exactly one of the two must be present.
43978
+ * @returns DatasetItemBulkCreateResponse
43979
+ * @throws ApiError
43980
+ */
43981
+ static aiMentorOrgsUsersEvaluationsDatasetsItemsCreate({
43982
+ datasetName,
43983
+ org,
43984
+ userId,
43985
+ requestBody
43986
+ }) {
43987
+ return request(OpenAPI, {
43988
+ method: 'POST',
43989
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/',
43990
+ path: {
43991
+ 'dataset_name': datasetName,
43992
+ 'org': org,
43993
+ 'user_id': userId
43994
+ },
43995
+ body: requestBody,
43996
+ mediaType: 'application/json',
43997
+ errors: {
43998
+ 400: `Validation error.`,
43999
+ 404: `Not found within the tenant.`
44000
+ }
44001
+ });
44002
+ }
44003
+ /**
44004
+ * Retrieve a dataset item
44005
+ * Retrieve a single dataset item. `trace_input` / `trace_output` are always populated when the item has a `source_trace_id` (single-row case, no fan-out concern).
44006
+ * @returns DatasetItem
44007
+ * @throws ApiError
44008
+ */
44009
+ static aiMentorOrgsUsersEvaluationsDatasetsItemsRetrieve({
44010
+ datasetName,
44011
+ itemId,
44012
+ org,
44013
+ userId
44014
+ }) {
44015
+ return request(OpenAPI, {
44016
+ method: 'GET',
44017
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/{item_id}/',
44018
+ path: {
44019
+ 'dataset_name': datasetName,
44020
+ 'item_id': itemId,
44021
+ 'org': org,
44022
+ 'user_id': userId
44023
+ },
44024
+ errors: {
44025
+ 404: `Not found within the tenant.`
44026
+ }
44027
+ });
44028
+ }
44029
+ /**
44030
+ * Update a dataset item
44031
+ * Update any subset of `input`, `expected_output`, `metadata`, or `status` on a dataset item. Uses Langfuse's id-based upsert.
44032
+ * @returns DatasetItem
44033
+ * @throws ApiError
44034
+ */
44035
+ static aiMentorOrgsUsersEvaluationsDatasetsItemsUpdate({
44036
+ datasetName,
44037
+ itemId,
44038
+ org,
44039
+ userId,
44040
+ requestBody
44041
+ }) {
44042
+ return request(OpenAPI, {
44043
+ method: 'PUT',
44044
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/{item_id}/',
44045
+ path: {
44046
+ 'dataset_name': datasetName,
44047
+ 'item_id': itemId,
44048
+ 'org': org,
44049
+ 'user_id': userId
44050
+ },
44051
+ body: requestBody,
44052
+ mediaType: 'application/json',
44053
+ errors: {
44054
+ 400: `Validation error.`,
44055
+ 404: `Not found within the tenant.`
44056
+ }
44057
+ });
44058
+ }
44059
+ /**
44060
+ * Delete a dataset item
44061
+ * Delete a dataset item.
44062
+ * @returns void
44063
+ * @throws ApiError
44064
+ */
44065
+ static aiMentorOrgsUsersEvaluationsDatasetsItemsDestroy({
44066
+ datasetName,
44067
+ itemId,
44068
+ org,
44069
+ userId
44070
+ }) {
44071
+ return request(OpenAPI, {
44072
+ method: 'DELETE',
44073
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/{item_id}/',
44074
+ path: {
44075
+ 'dataset_name': datasetName,
44076
+ 'item_id': itemId,
44077
+ 'org': org,
44078
+ 'user_id': userId
44079
+ },
44080
+ errors: {
44081
+ 404: `Not found within the tenant.`
44082
+ }
44083
+ });
44084
+ }
44085
+ /**
44086
+ * Upload a CSV of dataset items
44087
+ * Bulk-create items from a CSV (multipart `file` field). The CSV must have an `input` column; `expected_output` is optional. Rows with empty `input` are skipped.
44088
+ * @returns DatasetItemBulkCreateResponse
44089
+ * @throws ApiError
44090
+ */
44091
+ static aiMentorOrgsUsersEvaluationsDatasetsItemsUploadCreate({
44092
+ datasetName,
44093
+ org,
44094
+ userId,
44095
+ formData
44096
+ }) {
44097
+ return request(OpenAPI, {
44098
+ method: 'POST',
44099
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/items/upload/',
44100
+ path: {
44101
+ 'dataset_name': datasetName,
44102
+ 'org': org,
44103
+ 'user_id': userId
44104
+ },
44105
+ formData: formData,
44106
+ mediaType: 'multipart/form-data',
44107
+ errors: {
44108
+ 400: `Validation error.`,
44109
+ 404: `Not found within the tenant.`
44110
+ }
44111
+ });
44112
+ }
44113
+ /**
44114
+ * List experiment runs
44115
+ * List runs for a dataset. The response merges Langfuse-persisted runs with in-flight `EvaluationTaskRecord` rows (status `pending` / `in_progress`), deduplicated by `run_name`. `pending_count` reports how many pending entries are in the page so the UI can badge in-flight work.
44116
+ * @returns PaginatedRunList
44117
+ * @throws ApiError
44118
+ */
44119
+ static evaluationsRunsList({
44120
+ datasetName,
44121
+ org,
44122
+ userId,
44123
+ limit,
44124
+ page,
44125
+ userEmail
44126
+ }) {
44127
+ return request(OpenAPI, {
44128
+ method: 'GET',
44129
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/',
44130
+ path: {
44131
+ 'dataset_name': datasetName,
44132
+ 'org': org,
44133
+ 'user_id': userId
44134
+ },
44135
+ query: {
44136
+ 'limit': limit,
44137
+ 'page': page,
44138
+ 'user_email': userEmail
44139
+ },
44140
+ errors: {
44141
+ 404: `Not found within the tenant.`
44142
+ }
44143
+ });
44144
+ }
44145
+ /**
44146
+ * Start an experiment run
44147
+ * Dispatch a Celery task that runs the chosen mentor against every item in the dataset. Returns immediately (HTTP 202) with the new task record. Poll the list endpoint (or the run-detail endpoint once Langfuse persists the run) to watch the `pending → in_progress → completed` transition.
44148
+ * @returns Run
44149
+ * @throws ApiError
44150
+ */
44151
+ static aiMentorOrgsUsersEvaluationsDatasetsRunsCreate({
44152
+ datasetName,
44153
+ org,
44154
+ userId,
44155
+ requestBody
44156
+ }) {
44157
+ return request(OpenAPI, {
44158
+ method: 'POST',
44159
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/',
44160
+ path: {
44161
+ 'dataset_name': datasetName,
44162
+ 'org': org,
44163
+ 'user_id': userId
44164
+ },
44165
+ body: requestBody,
44166
+ mediaType: 'application/json',
44167
+ errors: {
44168
+ 400: `Validation error.`,
44169
+ 404: `Dataset or mentor not found within the tenant.`
44170
+ }
44171
+ });
44172
+ }
44173
+ /**
44174
+ * Retrieve experiment run details
44175
+ * Returns the run header plus every `dataset_run_item` fully expanded with `input`, `expected_output`, `actual_output`, `trace_id`, and per-item `scores`. Also embeds a `pending_judges` array for any in-flight LLM-as-Judge evaluations against this run.
44176
+ *
44177
+ * Cost: 1 PG query + 2 ClickHouse queries + 1 score query regardless of run size.
44178
+ * @returns RunDetailResponse
44179
+ * @throws ApiError
44180
+ */
44181
+ static aiMentorOrgsUsersEvaluationsDatasetsRunsRetrieve({
44182
+ datasetName,
44183
+ org,
44184
+ runName,
44185
+ userId
44186
+ }) {
44187
+ return request(OpenAPI, {
44188
+ method: 'GET',
44189
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/{run_name}/',
44190
+ path: {
44191
+ 'dataset_name': datasetName,
44192
+ 'org': org,
44193
+ 'run_name': runName,
44194
+ 'user_id': userId
44195
+ },
44196
+ errors: {
44197
+ 403: `Authenticated, but the resource belongs to another tenant.`,
44198
+ 404: `Not found within the tenant.`
44199
+ }
44200
+ });
44201
+ }
44202
+ /**
44203
+ * Delete an experiment run
44204
+ * Delete an experiment run.
44205
+ * @returns void
44206
+ * @throws ApiError
44207
+ */
44208
+ static aiMentorOrgsUsersEvaluationsDatasetsRunsDestroy({
44209
+ datasetName,
44210
+ org,
44211
+ runName,
44212
+ userId
44213
+ }) {
44214
+ return request(OpenAPI, {
44215
+ method: 'DELETE',
44216
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/{run_name}/',
44217
+ path: {
44218
+ 'dataset_name': datasetName,
44219
+ 'org': org,
44220
+ 'run_name': runName,
44221
+ 'user_id': userId
44222
+ },
44223
+ errors: {
44224
+ 403: `Authenticated, but the resource belongs to another tenant.`,
44225
+ 404: `Not found within the tenant.`
44226
+ }
44227
+ });
44228
+ }
44229
+ /**
44230
+ * List LLM-as-Judge evaluations for a run
44231
+ * Returns every judge task record (any status) targeting this run. Useful for showing an 'Evaluations' history on a run-detail view, including failed and pending ones.
44232
+ * @returns PaginatedJudgeList
44233
+ * @throws ApiError
44234
+ */
44235
+ static evaluationsRunJudgesList({
44236
+ datasetName,
44237
+ org,
44238
+ runName,
44239
+ userId,
44240
+ limit,
44241
+ page,
44242
+ status,
44243
+ userEmail
44244
+ }) {
44245
+ return request(OpenAPI, {
44246
+ method: 'GET',
44247
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/{run_name}/evaluate/',
44248
+ path: {
44249
+ 'dataset_name': datasetName,
44250
+ 'org': org,
44251
+ 'run_name': runName,
44252
+ 'user_id': userId
44253
+ },
44254
+ query: {
44255
+ 'limit': limit,
44256
+ 'page': page,
44257
+ 'status': status,
44258
+ 'user_email': userEmail
44259
+ }
44260
+ });
44261
+ }
44262
+ /**
44263
+ * Start an LLM-as-Judge evaluation
44264
+ * Dispatch a Celery task that runs a separate LLM over every item in the run, scoring the actual output against the input + expected output using the provided criteria. The judge's score lands in Langfuse with `score_name`, and its reasoning is stored in the score's `comment`.
44265
+ *
44266
+ * Returns immediately (HTTP 202) with the new task record. The task transitions through `pending → in_progress → completed` (or `failed`); poll the list endpoint or the run-detail endpoint to watch.
44267
+ * @returns JudgeRecord
44268
+ * @throws ApiError
44269
+ */
44270
+ static evaluationsRunJudgeCreate({
44271
+ datasetName,
44272
+ org,
44273
+ runName,
44274
+ userId,
44275
+ requestBody
44276
+ }) {
44277
+ return request(OpenAPI, {
44278
+ method: 'POST',
44279
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/{run_name}/evaluate/',
44280
+ path: {
44281
+ 'dataset_name': datasetName,
44282
+ 'org': org,
44283
+ 'run_name': runName,
44284
+ 'user_id': userId
44285
+ },
44286
+ body: requestBody,
44287
+ mediaType: 'application/json',
44288
+ errors: {
44289
+ 400: `Empty run or invalid input.`,
44290
+ 404: `Not found within the tenant.`
44291
+ }
44292
+ });
44293
+ }
44294
+ /**
44295
+ * Export experiment results as CSV
44296
+ * Download the run as a CSV. Columns: `item_id`, `input`, `expected_output`, `trace_id`, `actual_output`, and one `score_<name>` column per distinct score name in the run.
44297
+ * @returns binary CSV file download.
44298
+ * @throws ApiError
44299
+ */
44300
+ static aiMentorOrgsUsersEvaluationsDatasetsRunsExportRetrieve({
44301
+ datasetName,
44302
+ org,
44303
+ runName,
44304
+ userId
44305
+ }) {
44306
+ return request(OpenAPI, {
44307
+ method: 'GET',
44308
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/datasets/{dataset_name}/runs/{run_name}/export/',
44309
+ path: {
44310
+ 'dataset_name': datasetName,
44311
+ 'org': org,
44312
+ 'run_name': runName,
44313
+ 'user_id': userId
44314
+ },
44315
+ errors: {
44316
+ 403: `Authenticated, but the resource belongs to another tenant.`,
44317
+ 404: `Not found within the tenant.`
44318
+ }
44319
+ });
44320
+ }
44321
+ /**
44322
+ * List LLM-as-Judge evaluations (tenant-wide)
44323
+ * Returns every judge task record in the tenant, across all datasets and runs. Useful for a tenant-wide 'Evaluations' inbox.
+ * Issues a GET through the shared `request(OpenAPI, ...)` helper. `org` and `userId` fill the URL placeholders; the remaining five arguments are forwarded as query values, so the listing can apparently be narrowed and paged despite the "tenant-wide" summary (presumably all five are optional; confirm against the API schema).
+ * @param options single argument object, destructured in the signature
+ * @param options.org value for the `org` path placeholder
+ * @param options.userId value for the `user_id` path placeholder
+ * @param options.datasetName sent as the `dataset_name` query value
+ * @param options.limit sent as the `limit` query value
+ * @param options.page sent as the `page` query value
+ * @param options.status sent as the `status` query value
+ * @param options.userEmail sent as the `user_email` query value
44324
+ * @returns PaginatedJudgeList
44325
+ * @throws ApiError presumably raised inside `request`; this call passes no `errors` map of its own.
44326
+ */
44327
+ static evaluationsJudgesGlobalList({
44328
+ org,
44329
+ userId,
44330
+ datasetName,
44331
+ limit,
44332
+ page,
44333
+ status,
44334
+ userEmail
44335
+ }) {
44336
+ return request(OpenAPI, {
44337
+ method: 'GET',
44338
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/judges/',
44339
+ path: {
44340
+ 'org': org,
44341
+ 'user_id': userId
44342
+ },
44343
+ query: {
44344
+ 'dataset_name': datasetName,
44345
+ 'limit': limit,
44346
+ 'page': page,
44347
+ 'status': status,
44348
+ 'user_email': userEmail
44349
+ }
44350
+ });
44351
+ }
44352
+ /**
44353
+ * List score configurations
44354
+ * Score configurations define reusable rubrics (numeric ranges, boolean, or categorical labels). They are optional — scores work without one — but useful for enforcing consistent grading.
+ * Issues a GET through the shared `request(OpenAPI, ...)` helper. Note that although the method name ends in `Retrieve`, the documented result is a paginated list.
+ * @param options single argument object, destructured in the signature
+ * @param options.org value for the `org` path placeholder
+ * @param options.userId value for the `user_id` path placeholder
+ * @param options.limit sent as the `limit` query value
+ * @param options.page sent as the `page` query value
44355
+ * @returns PaginatedScoreConfigList
44356
+ * @throws ApiError presumably raised inside `request`; this call passes no `errors` map of its own.
44357
+ */
44358
+ static aiMentorOrgsUsersEvaluationsScoreConfigsRetrieve({
44359
+ org,
44360
+ userId,
44361
+ limit,
44362
+ page
44363
+ }) {
44364
+ return request(OpenAPI, {
44365
+ method: 'GET',
44366
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/score-configs/',
44367
+ path: {
44368
+ 'org': org,
44369
+ 'user_id': userId
44370
+ },
44371
+ query: {
44372
+ 'limit': limit,
44373
+ 'page': page
44374
+ }
44375
+ });
44376
+ }
44377
+ /**
44378
+ * Create a score configuration
44379
+ * Issues a POST through the shared `request(OpenAPI, ...)` helper, sending `requestBody` as the body with media type `application/json`.
+ * @param options single argument object, destructured in the signature
+ * @param options.org value for the `org` path placeholder
+ * @param options.userId value for the `user_id` path placeholder
+ * @param options.requestBody payload passed unchanged as `body` (its schema is not visible in this block)
44380
+ * @returns ScoreConfig
44381
+ * @throws ApiError presumably raised inside `request`; the `errors` map below supplies the description for HTTP 400 (confirm against the `request` helper).
44382
+ */
44383
+ static aiMentorOrgsUsersEvaluationsScoreConfigsCreate({
44384
+ org,
44385
+ userId,
44386
+ requestBody
44387
+ }) {
44388
+ return request(OpenAPI, {
44389
+ method: 'POST',
44390
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/score-configs/',
44391
+ path: {
44392
+ 'org': org,
44393
+ 'user_id': userId
44394
+ },
44395
+ body: requestBody,
44396
+ mediaType: 'application/json',
44397
+ errors: {
44398
+ 400: `Validation error.`
44399
+ }
44400
+ });
44401
+ }
44402
+ /**
44403
+ * List scores
44404
+ * List scores (human annotations and LLM-judge results) with optional filters. Pair `dataset_run_id` with a run id to scope to one experiment; pass `trace_id` to scope to a single chat turn or mentor invocation.
+ * Issues a GET through the shared `request(OpenAPI, ...)` helper. Note that although the method name ends in `Retrieve`, the documented result is a paginated list.
+ * @param options single argument object, destructured in the signature
+ * @param options.org value for the `org` path placeholder
+ * @param options.userId value for the `user_id` path placeholder
+ * @param options.datasetRunId sent as the `dataset_run_id` query value
+ * @param options.limit sent as the `limit` query value
+ * @param options.name sent as the `name` query value
+ * @param options.page sent as the `page` query value
+ * @param options.traceId sent as the `trace_id` query value
44405
+ * @returns PaginatedScoreList
44406
+ * @throws ApiError presumably raised inside `request`; this call passes no `errors` map of its own.
44407
+ */
44408
+ static aiMentorOrgsUsersEvaluationsScoresRetrieve({
44409
+ org,
44410
+ userId,
44411
+ datasetRunId,
44412
+ limit,
44413
+ name,
44414
+ page,
44415
+ traceId
44416
+ }) {
44417
+ return request(OpenAPI, {
44418
+ method: 'GET',
44419
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/scores/',
44420
+ path: {
44421
+ 'org': org,
44422
+ 'user_id': userId
44423
+ },
44424
+ query: {
44425
+ 'dataset_run_id': datasetRunId,
44426
+ 'limit': limit,
44427
+ 'name': name,
44428
+ 'page': page,
44429
+ 'trace_id': traceId
44430
+ }
44431
+ });
44432
+ }
44433
+ /**
44434
+ * Create a score
44435
+ * Create a score on a trace or observation. Use this to record human grading of a single chat message (pass the chat frame's `generation_id` as `trace_id`) or to score an experiment-run item (also pass `dataset_run_id` so the score shows up in the run's CSV export).
+ * Issues a POST through the shared `request(OpenAPI, ...)` helper, sending `requestBody` as the body with media type `application/json`. The `trace_id` and `dataset_run_id` fields mentioned above are presumably members of `requestBody`; this method does not read them itself.
+ * @param options single argument object, destructured in the signature
+ * @param options.org value for the `org` path placeholder
+ * @param options.userId value for the `user_id` path placeholder
+ * @param options.requestBody payload passed unchanged as `body` (its schema is not visible in this block)
44436
+ * @returns ScoreCreateResponse
44437
+ * @throws ApiError presumably raised inside `request`; the `errors` map below supplies the description for HTTP 400 (confirm against the `request` helper).
44438
+ */
44439
+ static aiMentorOrgsUsersEvaluationsScoresCreate({
44440
+ org,
44441
+ userId,
44442
+ requestBody
44443
+ }) {
44444
+ return request(OpenAPI, {
44445
+ method: 'POST',
44446
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/scores/',
44447
+ path: {
44448
+ 'org': org,
44449
+ 'user_id': userId
44450
+ },
44451
+ body: requestBody,
44452
+ mediaType: 'application/json',
44453
+ errors: {
44454
+ 400: `Validation error.`
44455
+ }
44456
+ });
44457
+ }
44458
+ /**
44459
+ * Delete a score
44460
+ * Issues a DELETE through the shared `request(OpenAPI, ...)` helper for the score identified by `scoreId`; no query string or body is sent.
+ * @param options single argument object, destructured in the signature
+ * @param options.org value for the `org` path placeholder
+ * @param options.scoreId value for the `score_id` path placeholder
+ * @param options.userId value for the `user_id` path placeholder
44461
+ * @returns void
44462
+ * @throws ApiError presumably raised inside `request`; the `errors` map below supplies the description for HTTP 404 (confirm against the `request` helper).
44463
+ */
44464
+ static aiMentorOrgsUsersEvaluationsScoresDestroy({
44465
+ org,
44466
+ scoreId,
44467
+ userId
44468
+ }) {
44469
+ return request(OpenAPI, {
44470
+ method: 'DELETE',
44471
+ url: '/api/ai-mentor/orgs/{org}/users/{user_id}/evaluations/scores/{score_id}/',
44472
+ path: {
44473
+ 'org': org,
44474
+ 'score_id': scoreId,
44475
+ 'user_id': userId
44476
+ },
44477
+ errors: {
44478
+ 404: `Not found within the tenant.`
44479
+ }
44480
+ });
44481
+ }
44482
+ }
44483
+
44213
44484
  class FeaturesService {
44214
44485
  /**
44215
44486
  * Returns a list of the apps that the user has access to.
@@ -48097,6 +48368,7 @@ exports.CoreService = CoreService;
48097
48368
  exports.CredentialsService = CredentialsService;
48098
48369
  exports.CreditsService = CreditsService;
48099
48370
  exports.CustomDomainsService = CustomDomainsService;
48371
+ exports.EvaluationsService = EvaluationsService;
48100
48372
  exports.FeaturesService = FeaturesService;
48101
48373
  exports.ItemsService = ItemsService;
48102
48374
  exports.MediaService = MediaService;