@oro-ai/sdk 1.0.20 → 1.0.22
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/index.d.mts +35 -1
- package/dist/index.d.ts +35 -1
- package/dist/index.js +8 -0
- package/dist/index.mjs +7 -0
- package/package.json +1 -1
- package/src/generated/sdk.gen.ts +12 -1
- package/src/generated/types.gen.ts +33 -0
package/dist/index.d.mts
CHANGED
|
@@ -581,6 +581,10 @@ type AgentVersionStatus = {
|
|
|
581
581
|
* Final score if eligible
|
|
582
582
|
*/
|
|
583
583
|
final_score?: (number | null);
|
|
584
|
+
/**
|
|
585
|
+
* Average reasoning coefficient from included successful runs
|
|
586
|
+
*/
|
|
587
|
+
reasoning_coefficient?: (number | null);
|
|
584
588
|
/**
|
|
585
589
|
* Whether artifacts are released
|
|
586
590
|
*/
|
|
@@ -1155,6 +1159,12 @@ type EvaluationRunDetail = {
|
|
|
1155
1159
|
sandbox_metadata?: ({
|
|
1156
1160
|
[key: string]: unknown;
|
|
1157
1161
|
} | null);
|
|
1162
|
+
/**
|
|
1163
|
+
* Score breakdown including reasoning details
|
|
1164
|
+
*/
|
|
1165
|
+
score_components_summary?: ({
|
|
1166
|
+
[key: string]: unknown;
|
|
1167
|
+
} | null);
|
|
1158
1168
|
};
|
|
1159
1169
|
/**
|
|
1160
1170
|
* Public representation of an evaluation run.
|
|
@@ -1967,6 +1977,15 @@ type RunningEvaluation = {
|
|
|
1967
1977
|
*/
|
|
1968
1978
|
progress_percent?: number;
|
|
1969
1979
|
};
|
|
1980
|
+
/**
|
|
1981
|
+
* Problems for an evaluation run.
|
|
1982
|
+
*/
|
|
1983
|
+
type RunProblemsResponse = {
|
|
1984
|
+
/**
|
|
1985
|
+
* Problems to evaluate against
|
|
1986
|
+
*/
|
|
1987
|
+
problems: Array<ProblemPublic>;
|
|
1988
|
+
};
|
|
1970
1989
|
/**
|
|
1971
1990
|
* 400 - Candidate score does not exceed the challenge threshold.
|
|
1972
1991
|
*/
|
|
@@ -2764,6 +2783,16 @@ type CompleteRunData = {
|
|
|
2764
2783
|
};
|
|
2765
2784
|
type CompleteRunResponse2 = (CompleteRunResponse);
|
|
2766
2785
|
type CompleteRunError = ((MissingScoreError | ValidationError) | EvalRunNotFoundError | (NotRunOwnerError | RunAlreadyCompleteError) | HTTPValidationError);
|
|
2786
|
+
type GetRunProblemsData = {
|
|
2787
|
+
path: {
|
|
2788
|
+
/**
|
|
2789
|
+
* Evaluation run ID
|
|
2790
|
+
*/
|
|
2791
|
+
eval_run_id: string;
|
|
2792
|
+
};
|
|
2793
|
+
};
|
|
2794
|
+
type GetRunProblemsResponse = (RunProblemsResponse);
|
|
2795
|
+
type GetRunProblemsError = (EvalRunNotFoundError | HTTPValidationError);
|
|
2767
2796
|
type BanMinerData = {
|
|
2768
2797
|
body: BanRequest;
|
|
2769
2798
|
path: {
|
|
@@ -3285,6 +3314,11 @@ declare const presignUpload: <ThrowOnError extends boolean = false>(options: Opt
|
|
|
3285
3314
|
* Finalize an evaluation run with terminal status and score.
|
|
3286
3315
|
*/
|
|
3287
3316
|
declare const completeRun: <ThrowOnError extends boolean = false>(options: OptionsLegacyParser<CompleteRunData, ThrowOnError>) => _hey_api_client_fetch.RequestResult<CompleteRunResponse, CompleteRunError, ThrowOnError>;
|
|
3317
|
+
/**
|
|
3318
|
+
* Get problems for an evaluation run
|
|
3319
|
+
* Returns the problems that should be evaluated for a given run.
|
|
3320
|
+
*/
|
|
3321
|
+
declare const getRunProblems: <ThrowOnError extends boolean = false>(options: OptionsLegacyParser<GetRunProblemsData, ThrowOnError>) => _hey_api_client_fetch.RequestResult<RunProblemsResponse, GetRunProblemsError, ThrowOnError>;
|
|
3288
3322
|
/**
|
|
3289
3323
|
* Ban a miner
|
|
3290
3324
|
* Ban a miner from submitting agents.
|
|
@@ -3775,4 +3809,4 @@ declare class SessionAuthManager {
|
|
|
3775
3809
|
*/
|
|
3776
3810
|
declare function configureSessionAuth(baseUrl: string, config: SessionAuthConfig): SessionAuthManager;
|
|
3777
3811
|
|
|
3778
|
-
export { type ActivateSuiteData, type ActivateSuiteError, type ActivateSuiteResponse, type ActivateSuiteResponse2, type AdminAgentCodeResponse, type AdminAgentVersionEntry, type AdminAgentVersionsResponse, type AdminEvaluationRunEntry, type AdminEvaluationRunsResponse, type AdminMinerEntry, type AdminMinersResponse, type AdminValidatorEntry, type AdminValidatorsResponse, type AdmissionReason, type AdmissionStatus, type AgentLatestVersion, type AgentNotFoundError, type AgentPublic, type AgentVersionHistoryEntry, type AgentVersionNotFoundError, type AgentVersionProblemsResponse, type AgentVersionPublic, type AgentVersionScoreEntry, type AgentVersionState, type AgentVersionStatus, type AgentVersionVariance, type AgentVersionVarianceResponse, type AlreadyInvalidatedError, type ArtifactDownloadRequest, type ArtifactDownloadResponse, type ArtifactNotFoundError, type ArtifactNotReleasedError, type ArtifactReleaseState, type ArtifactType, type AtCapacityError, type AuditEventEntry, type AuditEventsResponse, type BanMinerData, type BanMinerError, type BanMinerResponse, type BanRequest, type BanResponse, type BanValidatorData, type BanValidatorError, type BanValidatorResponse, type BittensorAuthConfig, type Body_submit_agent, type CachedSession, type CancelAgentVersionData, type CancelAgentVersionError, type CancelAgentVersionResponse, type CancelRequest, type CancelResponse, type ChallengeRequest, type ChallengeResponse, type ChutesAuthStatusResponse, type ClaimWorkData, type ClaimWorkError, type ClaimWorkResponse, type ClaimWorkResponse2, type ClearMinerCooldownData, type ClearMinerCooldownError, type ClearMinerCooldownResponse, type CodeAnalysisError, type CompleteRunData, type CompleteRunError, type CompleteRunRequest, type CompleteRunResponse, type CompleteRunResponse2, type CooldownActiveError, type CreateSessionEndpointData, type CreateSessionEndpointError, type CreateSessionEndpointResponse, type CreateSuiteData, type CreateSuiteError, type CreateSuiteRequest, type CreateSuiteResponse, type CreateSuiteResponse2, type DiscardAgentVersionData, type DiscardAgentVersionError, type DiscardAgentVersionResponse, type DiscardRequest, type DiscardResponse, type ErrorCategory, type EvalRunNotFoundError, type EvaluationRunDetail, type EvaluationRunPublic, type EvaluationRunStatus, type EvaluationRunStatusPublic, type FileTooLargeError, type GetAgentVersionCodeData, type GetAgentVersionCodeError, type GetAgentVersionCodeResponse, type GetAgentVersionData, type GetAgentVersionError, type GetAgentVersionProblemsData, type GetAgentVersionProblemsError, type GetAgentVersionProblemsResponse, type GetAgentVersionResponse, type GetAgentVersionRunsData, type GetAgentVersionRunsError, type GetAgentVersionRunsResponse, type GetAgentVersionStatusData, type GetAgentVersionStatusError, type GetAgentVersionStatusResponse, type GetAgentVersionVarianceData, type GetAgentVersionVarianceError, type GetAgentVersionVarianceResponse, type GetArtifactDownloadUrlData, type GetArtifactDownloadUrlError, type GetArtifactDownloadUrlResponse, type GetAuditEventsData, type GetAuditEventsError, type GetAuditEventsResponse, type GetChutesAuthStatusError, type GetChutesAuthStatusResponse, type GetCurrentSuiteError, type GetCurrentSuiteResponse, type GetEvaluationRunData, type GetEvaluationRunError, type GetEvaluationRunResponse, type GetLeaderboardData, type GetLeaderboardError, type GetLeaderboardResponse, type GetOwnedAgentVersionStatusData, type GetOwnedAgentVersionStatusError, type GetOwnedAgentVersionStatusResponse, type GetPendingEvaluationsData, type GetPendingEvaluationsError, type GetPendingEvaluationsResponse, type GetReaperStatsError, type GetReaperStatsResponse, type GetRunningEvaluationsError, type GetRunningEvaluationsResponse, type GetSuiteProblemsData, type GetSuiteProblemsError, type GetSuiteProblemsResponse, type GetTopAgentError, type GetTopAgentResponse, type GetTopHistoryData, type GetTopHistoryError, type GetTopHistoryResponse, type GetValidatorScoresData, type GetValidatorScoresError, type GetValidatorScoresResponse, type GetValidatorsError, type GetValidatorsResponse, type HTTPValidationError, type HealthCheckError, type HealthCheckResponse, type HeartbeatData, type HeartbeatError, type HeartbeatRequest, type HeartbeatResponse, type HeartbeatResponse2, type InvalidAgentNameError, type InvalidArtifactTypeError, type InvalidFileError, type InvalidProblemIdError, type InvalidateEvaluationRunData, type InvalidateEvaluationRunError, type InvalidateEvaluationRunResponse, type InvalidateRunRequest, type JoinWaitlistData, type JoinWaitlistError, type JoinWaitlistResponse, type LeaderboardEntry, type LeaderboardResponse, type LeaseExpiredError, type ListAgentVersions1Data, type ListAgentVersions1Error, type ListAgentVersions1Response, type ListAgentVersionsData, type ListAgentVersionsError, type ListAgentVersionsResponse, type ListEvaluationRunsData, type ListEvaluationRunsError, type ListEvaluationRunsResponse, type ListMinerAgentsError, type ListMinerAgentsResponse, type ListMinersData, type ListMinersError, type ListMinersResponse, type ListSuitesError, type ListSuitesResponse, type ListValidatorsData, type ListValidatorsError, type ListValidatorsResponse, type LogoutData, type LogoutError, type LogoutResponse, type LogoutResponse2, type MinerAgentsResponse, type MinerNotFoundError, type MissingParameterError, type MissingScoreError, type NoActiveSuiteError, type NotRunOwnerError, type OroErrorCode, type PendingEvaluation, type PendingEvaluationSummary, type PendingEvaluationsResponse, type PresignUploadData, type PresignUploadError, type PresignUploadRequest, type PresignUploadResponse, type PresignUploadResponse2, type ProblemNotFoundError, type ProblemProgressEntry, type ProblemProgressUpdate, type ProblemPublic, type ProblemStatus, type ProgressUpdateRequest, type ProgressUpdateResponse, type RateLimitExceededError, type ReaperStatsResponse, type ReevaluateAgentVersionData, type ReevaluateAgentVersionError, type ReevaluateAgentVersionResponse, type ReevaluateRequest, type ReevaluateResponse, type ReinstateAgentVersionData, type ReinstateAgentVersionError, type ReinstateAgentVersionResponse, type ReinstateRequest, type RequestChallengeData, type RequestChallengeError, type RequestChallengeResponse, type RetryConfig, type RetryContext, type RunAlreadyCompleteError, type RunningEvaluation, type ScoreBelowThresholdError, type SessionAuthConfig, SessionAuthManager, type SessionInfo, type SessionRequest, type SessionResponse, type SetTopAgentData, type SetTopAgentError, type SetTopAgentResponse, type SetTopRequest, type SetTopResponse, type StoreChutesTokenData, type StoreChutesTokenError, type StoreChutesTokenRequest, type StoreChutesTokenResponse, type SubmitAgentData, type SubmitAgentError, type SubmitAgentResponse, type SubmitAgentResponse2, type SuiteNotFoundError, type SuitePublic, type SuiteWithProblemsResponse, type TerminalStatus, type TopAgentResponse, type TopHistoryEntry, type TopHistoryResponse, type UnbanMinerData, type UnbanMinerError, type UnbanMinerResponse, type UnbanValidatorData, type UnbanValidatorError, type UnbanValidatorResponse, type UpdateProgressData, type UpdateProgressError, type UpdateProgressResponse, type ValidationError, type ValidatorCurrentAgent, type ValidatorNotFoundError, type ValidatorProblemResult, type ValidatorPublic, type ValidatorScoreSummary, type ValidatorScoresResponse, type ValidatorStatus, type WaitlistSignupRequest, type WaitlistSignupResponse, type WorkItemStatus, activateSuite, banMiner, banValidator, cancelAgentVersion, claimWork, classifyError, classifyStatus, clearMinerCooldown, client, completeRun, computeDelay, configureBittensorAuth, configurePublicClient, configureSessionAuth, createRetryFetch, createSessionEndpoint, createSuite, discardAgentVersion, generateAuthHeaders, getAgentVersion, getAgentVersionCode, getAgentVersionProblems, getAgentVersionRuns, getAgentVersionStatus, getAgentVersionVariance, getArtifactDownloadUrl, getAuditEvents, getChutesAuthStatus, getCurrentSuite, getErrorCode, getErrorDetail, getEvaluationRun, getLeaderboard, getOwnedAgentVersionStatus, getPendingEvaluations, getReaperStats, getRunningEvaluations, getSuiteProblems, getTopAgent, getTopHistory, getValidatorScores, getValidators, hasDetail, hasErrorCode, healthCheck, heartbeat, invalidateEvaluationRun, isTransient, isTransientError, joinWaitlist, listAgentVersions, listAgentVersions1, listEvaluationRuns, listMinerAgents, listMiners, listSuites, listValidators, logout, parseRetryAfter, presignUpload, reevaluateAgentVersion, reinstateAgentVersion, requestChallenge, setTopAgent, storeChutesToken, submitAgent, unbanMiner, unbanValidator, updateProgress };
|
|
3812
|
+
export { type ActivateSuiteData, type ActivateSuiteError, type ActivateSuiteResponse, type ActivateSuiteResponse2, type AdminAgentCodeResponse, type AdminAgentVersionEntry, type AdminAgentVersionsResponse, type AdminEvaluationRunEntry, type AdminEvaluationRunsResponse, type AdminMinerEntry, type AdminMinersResponse, type AdminValidatorEntry, type AdminValidatorsResponse, type AdmissionReason, type AdmissionStatus, type AgentLatestVersion, type AgentNotFoundError, type AgentPublic, type AgentVersionHistoryEntry, type AgentVersionNotFoundError, type AgentVersionProblemsResponse, type AgentVersionPublic, type AgentVersionScoreEntry, type AgentVersionState, type AgentVersionStatus, type AgentVersionVariance, type AgentVersionVarianceResponse, type AlreadyInvalidatedError, type ArtifactDownloadRequest, type ArtifactDownloadResponse, type ArtifactNotFoundError, type ArtifactNotReleasedError, type ArtifactReleaseState, type ArtifactType, type AtCapacityError, type AuditEventEntry, type AuditEventsResponse, type BanMinerData, type BanMinerError, type BanMinerResponse, type BanRequest, type BanResponse, type BanValidatorData, type BanValidatorError, type BanValidatorResponse, type BittensorAuthConfig, type Body_submit_agent, type CachedSession, type CancelAgentVersionData, type CancelAgentVersionError, type CancelAgentVersionResponse, type CancelRequest, type CancelResponse, type ChallengeRequest, type ChallengeResponse, type ChutesAuthStatusResponse, type ClaimWorkData, type ClaimWorkError, type ClaimWorkResponse, type ClaimWorkResponse2, type ClearMinerCooldownData, type ClearMinerCooldownError, type ClearMinerCooldownResponse, type CodeAnalysisError, type CompleteRunData, type CompleteRunError, type CompleteRunRequest, type CompleteRunResponse, type CompleteRunResponse2, type CooldownActiveError, type CreateSessionEndpointData, type CreateSessionEndpointError, type CreateSessionEndpointResponse, type CreateSuiteData, type CreateSuiteError, type CreateSuiteRequest, type CreateSuiteResponse, type CreateSuiteResponse2, type DiscardAgentVersionData, type DiscardAgentVersionError, type DiscardAgentVersionResponse, type DiscardRequest, type DiscardResponse, type ErrorCategory, type EvalRunNotFoundError, type EvaluationRunDetail, type EvaluationRunPublic, type EvaluationRunStatus, type EvaluationRunStatusPublic, type FileTooLargeError, type GetAgentVersionCodeData, type GetAgentVersionCodeError, type GetAgentVersionCodeResponse, type GetAgentVersionData, type GetAgentVersionError, type GetAgentVersionProblemsData, type GetAgentVersionProblemsError, type GetAgentVersionProblemsResponse, type GetAgentVersionResponse, type GetAgentVersionRunsData, type GetAgentVersionRunsError, type GetAgentVersionRunsResponse, type GetAgentVersionStatusData, type GetAgentVersionStatusError, type GetAgentVersionStatusResponse, type GetAgentVersionVarianceData, type GetAgentVersionVarianceError, type GetAgentVersionVarianceResponse, type GetArtifactDownloadUrlData, type GetArtifactDownloadUrlError, type GetArtifactDownloadUrlResponse, type GetAuditEventsData, type GetAuditEventsError, type GetAuditEventsResponse, type GetChutesAuthStatusError, type GetChutesAuthStatusResponse, type GetCurrentSuiteError, type GetCurrentSuiteResponse, type GetEvaluationRunData, type GetEvaluationRunError, type GetEvaluationRunResponse, type GetLeaderboardData, type GetLeaderboardError, type GetLeaderboardResponse, type GetOwnedAgentVersionStatusData, type GetOwnedAgentVersionStatusError, type GetOwnedAgentVersionStatusResponse, type GetPendingEvaluationsData, type GetPendingEvaluationsError, type GetPendingEvaluationsResponse, type GetReaperStatsError, type GetReaperStatsResponse, type GetRunProblemsData, type GetRunProblemsError, type GetRunProblemsResponse, type GetRunningEvaluationsError, type GetRunningEvaluationsResponse, type GetSuiteProblemsData, type GetSuiteProblemsError, type GetSuiteProblemsResponse, type GetTopAgentError, type GetTopAgentResponse, type GetTopHistoryData, type GetTopHistoryError, type GetTopHistoryResponse, type GetValidatorScoresData, type GetValidatorScoresError, type GetValidatorScoresResponse, type GetValidatorsError, type GetValidatorsResponse, type HTTPValidationError, type HealthCheckError, type HealthCheckResponse, type HeartbeatData, type HeartbeatError, type HeartbeatRequest, type HeartbeatResponse, type HeartbeatResponse2, type InvalidAgentNameError, type InvalidArtifactTypeError, type InvalidFileError, type InvalidProblemIdError, type InvalidateEvaluationRunData, type InvalidateEvaluationRunError, type InvalidateEvaluationRunResponse, type InvalidateRunRequest, type JoinWaitlistData, type JoinWaitlistError, type JoinWaitlistResponse, type LeaderboardEntry, type LeaderboardResponse, type LeaseExpiredError, type ListAgentVersions1Data, type ListAgentVersions1Error, type ListAgentVersions1Response, type ListAgentVersionsData, type ListAgentVersionsError, type ListAgentVersionsResponse, type ListEvaluationRunsData, type ListEvaluationRunsError, type ListEvaluationRunsResponse, type ListMinerAgentsError, type ListMinerAgentsResponse, type ListMinersData, type ListMinersError, type ListMinersResponse, type ListSuitesError, type ListSuitesResponse, type ListValidatorsData, type ListValidatorsError, type ListValidatorsResponse, type LogoutData, type LogoutError, type LogoutResponse, type LogoutResponse2, type MinerAgentsResponse, type MinerNotFoundError, type MissingParameterError, type MissingScoreError, type NoActiveSuiteError, type NotRunOwnerError, type OroErrorCode, type PendingEvaluation, type PendingEvaluationSummary, type PendingEvaluationsResponse, type PresignUploadData, type PresignUploadError, type PresignUploadRequest, type PresignUploadResponse, type PresignUploadResponse2, type ProblemNotFoundError, type ProblemProgressEntry, type ProblemProgressUpdate, type ProblemPublic, type ProblemStatus, type ProgressUpdateRequest, type ProgressUpdateResponse, type RateLimitExceededError, type ReaperStatsResponse, type ReevaluateAgentVersionData, type ReevaluateAgentVersionError, type ReevaluateAgentVersionResponse, type ReevaluateRequest, type ReevaluateResponse, type ReinstateAgentVersionData, type ReinstateAgentVersionError, type ReinstateAgentVersionResponse, type ReinstateRequest, type RequestChallengeData, type RequestChallengeError, type RequestChallengeResponse, type RetryConfig, type RetryContext, type RunAlreadyCompleteError, type RunProblemsResponse, type RunningEvaluation, type ScoreBelowThresholdError, type SessionAuthConfig, SessionAuthManager, type SessionInfo, type SessionRequest, type SessionResponse, type SetTopAgentData, type SetTopAgentError, type SetTopAgentResponse, type SetTopRequest, type SetTopResponse, type StoreChutesTokenData, type StoreChutesTokenError, type StoreChutesTokenRequest, type StoreChutesTokenResponse, type SubmitAgentData, type SubmitAgentError, type SubmitAgentResponse, type SubmitAgentResponse2, type SuiteNotFoundError, type SuitePublic, type SuiteWithProblemsResponse, type TerminalStatus, type TopAgentResponse, type TopHistoryEntry, type TopHistoryResponse, type UnbanMinerData, type UnbanMinerError, type UnbanMinerResponse, type UnbanValidatorData, type UnbanValidatorError, type UnbanValidatorResponse, type UpdateProgressData, type UpdateProgressError, type UpdateProgressResponse, type ValidationError, type ValidatorCurrentAgent, type ValidatorNotFoundError, type ValidatorProblemResult, type ValidatorPublic, type ValidatorScoreSummary, type ValidatorScoresResponse, type ValidatorStatus, type WaitlistSignupRequest, type WaitlistSignupResponse, type WorkItemStatus, activateSuite, banMiner, banValidator, cancelAgentVersion, claimWork, classifyError, classifyStatus, clearMinerCooldown, client, completeRun, computeDelay, configureBittensorAuth, configurePublicClient, configureSessionAuth, createRetryFetch, createSessionEndpoint, createSuite, discardAgentVersion, generateAuthHeaders, getAgentVersion, getAgentVersionCode, getAgentVersionProblems, getAgentVersionRuns, getAgentVersionStatus, getAgentVersionVariance, getArtifactDownloadUrl, getAuditEvents, getChutesAuthStatus, getCurrentSuite, getErrorCode, getErrorDetail, getEvaluationRun, getLeaderboard, getOwnedAgentVersionStatus, getPendingEvaluations, getReaperStats, getRunProblems, getRunningEvaluations, getSuiteProblems, getTopAgent, getTopHistory, getValidatorScores, getValidators, hasDetail, hasErrorCode, healthCheck, heartbeat, invalidateEvaluationRun, isTransient, isTransientError, joinWaitlist, listAgentVersions, listAgentVersions1, listEvaluationRuns, listMinerAgents, listMiners, listSuites, listValidators, logout, parseRetryAfter, presignUpload, reevaluateAgentVersion, reinstateAgentVersion, requestChallenge, setTopAgent, storeChutesToken, submitAgent, unbanMiner, unbanValidator, updateProgress };
|
package/dist/index.d.ts
CHANGED
|
@@ -581,6 +581,10 @@ type AgentVersionStatus = {
|
|
|
581
581
|
* Final score if eligible
|
|
582
582
|
*/
|
|
583
583
|
final_score?: (number | null);
|
|
584
|
+
/**
|
|
585
|
+
* Average reasoning coefficient from included successful runs
|
|
586
|
+
*/
|
|
587
|
+
reasoning_coefficient?: (number | null);
|
|
584
588
|
/**
|
|
585
589
|
* Whether artifacts are released
|
|
586
590
|
*/
|
|
@@ -1155,6 +1159,12 @@ type EvaluationRunDetail = {
|
|
|
1155
1159
|
sandbox_metadata?: ({
|
|
1156
1160
|
[key: string]: unknown;
|
|
1157
1161
|
} | null);
|
|
1162
|
+
/**
|
|
1163
|
+
* Score breakdown including reasoning details
|
|
1164
|
+
*/
|
|
1165
|
+
score_components_summary?: ({
|
|
1166
|
+
[key: string]: unknown;
|
|
1167
|
+
} | null);
|
|
1158
1168
|
};
|
|
1159
1169
|
/**
|
|
1160
1170
|
* Public representation of an evaluation run.
|
|
@@ -1967,6 +1977,15 @@ type RunningEvaluation = {
|
|
|
1967
1977
|
*/
|
|
1968
1978
|
progress_percent?: number;
|
|
1969
1979
|
};
|
|
1980
|
+
/**
|
|
1981
|
+
* Problems for an evaluation run.
|
|
1982
|
+
*/
|
|
1983
|
+
type RunProblemsResponse = {
|
|
1984
|
+
/**
|
|
1985
|
+
* Problems to evaluate against
|
|
1986
|
+
*/
|
|
1987
|
+
problems: Array<ProblemPublic>;
|
|
1988
|
+
};
|
|
1970
1989
|
/**
|
|
1971
1990
|
* 400 - Candidate score does not exceed the challenge threshold.
|
|
1972
1991
|
*/
|
|
@@ -2764,6 +2783,16 @@ type CompleteRunData = {
|
|
|
2764
2783
|
};
|
|
2765
2784
|
type CompleteRunResponse2 = (CompleteRunResponse);
|
|
2766
2785
|
type CompleteRunError = ((MissingScoreError | ValidationError) | EvalRunNotFoundError | (NotRunOwnerError | RunAlreadyCompleteError) | HTTPValidationError);
|
|
2786
|
+
type GetRunProblemsData = {
|
|
2787
|
+
path: {
|
|
2788
|
+
/**
|
|
2789
|
+
* Evaluation run ID
|
|
2790
|
+
*/
|
|
2791
|
+
eval_run_id: string;
|
|
2792
|
+
};
|
|
2793
|
+
};
|
|
2794
|
+
type GetRunProblemsResponse = (RunProblemsResponse);
|
|
2795
|
+
type GetRunProblemsError = (EvalRunNotFoundError | HTTPValidationError);
|
|
2767
2796
|
type BanMinerData = {
|
|
2768
2797
|
body: BanRequest;
|
|
2769
2798
|
path: {
|
|
@@ -3285,6 +3314,11 @@ declare const presignUpload: <ThrowOnError extends boolean = false>(options: Opt
|
|
|
3285
3314
|
* Finalize an evaluation run with terminal status and score.
|
|
3286
3315
|
*/
|
|
3287
3316
|
declare const completeRun: <ThrowOnError extends boolean = false>(options: OptionsLegacyParser<CompleteRunData, ThrowOnError>) => _hey_api_client_fetch.RequestResult<CompleteRunResponse, CompleteRunError, ThrowOnError>;
|
|
3317
|
+
/**
|
|
3318
|
+
* Get problems for an evaluation run
|
|
3319
|
+
* Returns the problems that should be evaluated for a given run.
|
|
3320
|
+
*/
|
|
3321
|
+
declare const getRunProblems: <ThrowOnError extends boolean = false>(options: OptionsLegacyParser<GetRunProblemsData, ThrowOnError>) => _hey_api_client_fetch.RequestResult<RunProblemsResponse, GetRunProblemsError, ThrowOnError>;
|
|
3288
3322
|
/**
|
|
3289
3323
|
* Ban a miner
|
|
3290
3324
|
* Ban a miner from submitting agents.
|
|
@@ -3775,4 +3809,4 @@ declare class SessionAuthManager {
|
|
|
3775
3809
|
*/
|
|
3776
3810
|
declare function configureSessionAuth(baseUrl: string, config: SessionAuthConfig): SessionAuthManager;
|
|
3777
3811
|
|
|
3778
|
-
export { type ActivateSuiteData, type ActivateSuiteError, type ActivateSuiteResponse, type ActivateSuiteResponse2, type AdminAgentCodeResponse, type AdminAgentVersionEntry, type AdminAgentVersionsResponse, type AdminEvaluationRunEntry, type AdminEvaluationRunsResponse, type AdminMinerEntry, type AdminMinersResponse, type AdminValidatorEntry, type AdminValidatorsResponse, type AdmissionReason, type AdmissionStatus, type AgentLatestVersion, type AgentNotFoundError, type AgentPublic, type AgentVersionHistoryEntry, type AgentVersionNotFoundError, type AgentVersionProblemsResponse, type AgentVersionPublic, type AgentVersionScoreEntry, type AgentVersionState, type AgentVersionStatus, type AgentVersionVariance, type AgentVersionVarianceResponse, type AlreadyInvalidatedError, type ArtifactDownloadRequest, type ArtifactDownloadResponse, type ArtifactNotFoundError, type ArtifactNotReleasedError, type ArtifactReleaseState, type ArtifactType, type AtCapacityError, type AuditEventEntry, type AuditEventsResponse, type BanMinerData, type BanMinerError, type BanMinerResponse, type BanRequest, type BanResponse, type BanValidatorData, type BanValidatorError, type BanValidatorResponse, type BittensorAuthConfig, type Body_submit_agent, type CachedSession, type CancelAgentVersionData, type CancelAgentVersionError, type CancelAgentVersionResponse, type CancelRequest, type CancelResponse, type ChallengeRequest, type ChallengeResponse, type ChutesAuthStatusResponse, type ClaimWorkData, type ClaimWorkError, type ClaimWorkResponse, type ClaimWorkResponse2, type ClearMinerCooldownData, type ClearMinerCooldownError, type ClearMinerCooldownResponse, type CodeAnalysisError, type CompleteRunData, type CompleteRunError, type CompleteRunRequest, type CompleteRunResponse, type CompleteRunResponse2, type CooldownActiveError, type CreateSessionEndpointData, type CreateSessionEndpointError, type CreateSessionEndpointResponse, type CreateSuiteData, type CreateSuiteError, type CreateSuiteRequest, type CreateSuiteResponse, type CreateSuiteResponse2, type DiscardAgentVersionData, type DiscardAgentVersionError, type DiscardAgentVersionResponse, type DiscardRequest, type DiscardResponse, type ErrorCategory, type EvalRunNotFoundError, type EvaluationRunDetail, type EvaluationRunPublic, type EvaluationRunStatus, type EvaluationRunStatusPublic, type FileTooLargeError, type GetAgentVersionCodeData, type GetAgentVersionCodeError, type GetAgentVersionCodeResponse, type GetAgentVersionData, type GetAgentVersionError, type GetAgentVersionProblemsData, type GetAgentVersionProblemsError, type GetAgentVersionProblemsResponse, type GetAgentVersionResponse, type GetAgentVersionRunsData, type GetAgentVersionRunsError, type GetAgentVersionRunsResponse, type GetAgentVersionStatusData, type GetAgentVersionStatusError, type GetAgentVersionStatusResponse, type GetAgentVersionVarianceData, type GetAgentVersionVarianceError, type GetAgentVersionVarianceResponse, type GetArtifactDownloadUrlData, type GetArtifactDownloadUrlError, type GetArtifactDownloadUrlResponse, type GetAuditEventsData, type GetAuditEventsError, type GetAuditEventsResponse, type GetChutesAuthStatusError, type GetChutesAuthStatusResponse, type GetCurrentSuiteError, type GetCurrentSuiteResponse, type GetEvaluationRunData, type GetEvaluationRunError, type GetEvaluationRunResponse, type GetLeaderboardData, type GetLeaderboardError, type GetLeaderboardResponse, type GetOwnedAgentVersionStatusData, type GetOwnedAgentVersionStatusError, type GetOwnedAgentVersionStatusResponse, type GetPendingEvaluationsData, type GetPendingEvaluationsError, type GetPendingEvaluationsResponse, type GetReaperStatsError, type GetReaperStatsResponse, type GetRunningEvaluationsError, type GetRunningEvaluationsResponse, type GetSuiteProblemsData, type GetSuiteProblemsError, type GetSuiteProblemsResponse, type GetTopAgentError, type GetTopAgentResponse, type GetTopHistoryData, type GetTopHistoryError, type GetTopHistoryResponse, type GetValidatorScoresData, type GetValidatorScoresError, type GetValidatorScoresResponse, type GetValidatorsError, type GetValidatorsResponse, type HTTPValidationError, type HealthCheckError, type HealthCheckResponse, type HeartbeatData, type HeartbeatError, type HeartbeatRequest, type HeartbeatResponse, type HeartbeatResponse2, type InvalidAgentNameError, type InvalidArtifactTypeError, type InvalidFileError, type InvalidProblemIdError, type InvalidateEvaluationRunData, type InvalidateEvaluationRunError, type InvalidateEvaluationRunResponse, type InvalidateRunRequest, type JoinWaitlistData, type JoinWaitlistError, type JoinWaitlistResponse, type LeaderboardEntry, type LeaderboardResponse, type LeaseExpiredError, type ListAgentVersions1Data, type ListAgentVersions1Error, type ListAgentVersions1Response, type ListAgentVersionsData, type ListAgentVersionsError, type ListAgentVersionsResponse, type ListEvaluationRunsData, type ListEvaluationRunsError, type ListEvaluationRunsResponse, type ListMinerAgentsError, type ListMinerAgentsResponse, type ListMinersData, type ListMinersError, type ListMinersResponse, type ListSuitesError, type ListSuitesResponse, type ListValidatorsData, type ListValidatorsError, type ListValidatorsResponse, type LogoutData, type LogoutError, type LogoutResponse, type LogoutResponse2, type MinerAgentsResponse, type MinerNotFoundError, type MissingParameterError, type MissingScoreError, type NoActiveSuiteError, type NotRunOwnerError, type OroErrorCode, type PendingEvaluation, type PendingEvaluationSummary, type PendingEvaluationsResponse, type PresignUploadData, type PresignUploadError, type PresignUploadRequest, type PresignUploadResponse, type PresignUploadResponse2, type ProblemNotFoundError, type ProblemProgressEntry, type ProblemProgressUpdate, type ProblemPublic, type ProblemStatus, type ProgressUpdateRequest, type ProgressUpdateResponse, type RateLimitExceededError, type ReaperStatsResponse, type ReevaluateAgentVersionData, type ReevaluateAgentVersionError, type ReevaluateAgentVersionResponse, type ReevaluateRequest, type ReevaluateResponse, type ReinstateAgentVersionData, type ReinstateAgentVersionError, type ReinstateAgentVersionResponse, type ReinstateRequest, type RequestChallengeData, type RequestChallengeError, type RequestChallengeResponse, type RetryConfig, type RetryContext, type RunAlreadyCompleteError, type RunningEvaluation, type ScoreBelowThresholdError, type SessionAuthConfig, SessionAuthManager, type SessionInfo, type SessionRequest, type SessionResponse, type SetTopAgentData, type SetTopAgentError, type SetTopAgentResponse, type SetTopRequest, type SetTopResponse, type StoreChutesTokenData, type StoreChutesTokenError, type StoreChutesTokenRequest, type StoreChutesTokenResponse, type SubmitAgentData, type SubmitAgentError, type SubmitAgentResponse, type SubmitAgentResponse2, type SuiteNotFoundError, type SuitePublic, type SuiteWithProblemsResponse, type TerminalStatus, type TopAgentResponse, type TopHistoryEntry, type TopHistoryResponse, type UnbanMinerData, type UnbanMinerError, type UnbanMinerResponse, type UnbanValidatorData, type UnbanValidatorError, type UnbanValidatorResponse, type UpdateProgressData, type UpdateProgressError, type UpdateProgressResponse, type ValidationError, type ValidatorCurrentAgent, type ValidatorNotFoundError, type ValidatorProblemResult, type ValidatorPublic, type ValidatorScoreSummary, type ValidatorScoresResponse, type ValidatorStatus, type WaitlistSignupRequest, type WaitlistSignupResponse, type WorkItemStatus, activateSuite, banMiner, banValidator, cancelAgentVersion, claimWork, classifyError, classifyStatus, clearMinerCooldown, client, completeRun, computeDelay, configureBittensorAuth, configurePublicClient, configureSessionAuth, createRetryFetch, createSessionEndpoint, createSuite, discardAgentVersion, generateAuthHeaders, getAgentVersion, getAgentVersionCode, getAgentVersionProblems, getAgentVersionRuns, getAgentVersionStatus, getAgentVersionVariance, getArtifactDownloadUrl, getAuditEvents, getChutesAuthStatus, getCurrentSuite, getErrorCode, getErrorDetail, getEvaluationRun, getLeaderboard, getOwnedAgentVersionStatus, getPendingEvaluations, getReaperStats, getRunningEvaluations, getSuiteProblems, getTopAgent, getTopHistory, getValidatorScores, getValidators, hasDetail, hasErrorCode, healthCheck, heartbeat, invalidateEvaluationRun, isTransient, isTransientError, joinWaitlist, listAgentVersions, listAgentVersions1, listEvaluationRuns, listMinerAgents, listMiners, listSuites, listValidators, logout, parseRetryAfter, presignUpload, reevaluateAgentVersion, reinstateAgentVersion, requestChallenge, setTopAgent, storeChutesToken, submitAgent, unbanMiner, unbanValidator, updateProgress };
|
|
3812
|
+
export { type ActivateSuiteData, type ActivateSuiteError, type ActivateSuiteResponse, type ActivateSuiteResponse2, type AdminAgentCodeResponse, type AdminAgentVersionEntry, type AdminAgentVersionsResponse, type AdminEvaluationRunEntry, type AdminEvaluationRunsResponse, type AdminMinerEntry, type AdminMinersResponse, type AdminValidatorEntry, type AdminValidatorsResponse, type AdmissionReason, type AdmissionStatus, type AgentLatestVersion, type AgentNotFoundError, type AgentPublic, type AgentVersionHistoryEntry, type AgentVersionNotFoundError, type AgentVersionProblemsResponse, type AgentVersionPublic, type AgentVersionScoreEntry, type AgentVersionState, type AgentVersionStatus, type AgentVersionVariance, type AgentVersionVarianceResponse, type AlreadyInvalidatedError, type ArtifactDownloadRequest, type ArtifactDownloadResponse, type ArtifactNotFoundError, type ArtifactNotReleasedError, type ArtifactReleaseState, type ArtifactType, type AtCapacityError, type AuditEventEntry, type AuditEventsResponse, type BanMinerData, type BanMinerError, type BanMinerResponse, type BanRequest, type BanResponse, type BanValidatorData, type BanValidatorError, type BanValidatorResponse, type BittensorAuthConfig, type Body_submit_agent, type CachedSession, type CancelAgentVersionData, type CancelAgentVersionError, type CancelAgentVersionResponse, type CancelRequest, type CancelResponse, type ChallengeRequest, type ChallengeResponse, type ChutesAuthStatusResponse, type ClaimWorkData, type ClaimWorkError, type ClaimWorkResponse, type ClaimWorkResponse2, type ClearMinerCooldownData, type ClearMinerCooldownError, type ClearMinerCooldownResponse, type CodeAnalysisError, type CompleteRunData, type CompleteRunError, type CompleteRunRequest, type CompleteRunResponse, type CompleteRunResponse2, type CooldownActiveError, type CreateSessionEndpointData, type CreateSessionEndpointError, type CreateSessionEndpointResponse, type CreateSuiteData, type CreateSuiteError, type CreateSuiteRequest, type CreateSuiteResponse, type CreateSuiteResponse2, type DiscardAgentVersionData, type DiscardAgentVersionError, type DiscardAgentVersionResponse, type DiscardRequest, type DiscardResponse, type ErrorCategory, type EvalRunNotFoundError, type EvaluationRunDetail, type EvaluationRunPublic, type EvaluationRunStatus, type EvaluationRunStatusPublic, type FileTooLargeError, type GetAgentVersionCodeData, type GetAgentVersionCodeError, type GetAgentVersionCodeResponse, type GetAgentVersionData, type GetAgentVersionError, type GetAgentVersionProblemsData, type GetAgentVersionProblemsError, type GetAgentVersionProblemsResponse, type GetAgentVersionResponse, type GetAgentVersionRunsData, type GetAgentVersionRunsError, type GetAgentVersionRunsResponse, type GetAgentVersionStatusData, type GetAgentVersionStatusError, type GetAgentVersionStatusResponse, type GetAgentVersionVarianceData, type GetAgentVersionVarianceError, type GetAgentVersionVarianceResponse, type GetArtifactDownloadUrlData, type GetArtifactDownloadUrlError, type GetArtifactDownloadUrlResponse, type GetAuditEventsData, type GetAuditEventsError, type GetAuditEventsResponse, type GetChutesAuthStatusError, type GetChutesAuthStatusResponse, type GetCurrentSuiteError, type GetCurrentSuiteResponse, type GetEvaluationRunData, type GetEvaluationRunError, type GetEvaluationRunResponse, type GetLeaderboardData, type GetLeaderboardError, type GetLeaderboardResponse, type GetOwnedAgentVersionStatusData, type GetOwnedAgentVersionStatusError, type GetOwnedAgentVersionStatusResponse, type GetPendingEvaluationsData, type GetPendingEvaluationsError, type GetPendingEvaluationsResponse, type GetReaperStatsError, type GetReaperStatsResponse, type GetRunProblemsData, type GetRunProblemsError, type GetRunProblemsResponse, type GetRunningEvaluationsError, type GetRunningEvaluationsResponse, type GetSuiteProblemsData, type GetSuiteProblemsError, type GetSuiteProblemsResponse, type GetTopAgentError, type GetTopAgentResponse, type GetTopHistoryData, type GetTopHistoryError, type GetTopHistoryResponse, type GetValidatorScoresData, type GetValidatorScoresError, type GetValidatorScoresResponse, type GetValidatorsError, type GetValidatorsResponse, type HTTPValidationError, type HealthCheckError, type HealthCheckResponse, type HeartbeatData, type HeartbeatError, type HeartbeatRequest, type HeartbeatResponse, type HeartbeatResponse2, type InvalidAgentNameError, type InvalidArtifactTypeError, type InvalidFileError, type InvalidProblemIdError, type InvalidateEvaluationRunData, type InvalidateEvaluationRunError, type InvalidateEvaluationRunResponse, type InvalidateRunRequest, type JoinWaitlistData, type JoinWaitlistError, type JoinWaitlistResponse, type LeaderboardEntry, type LeaderboardResponse, type LeaseExpiredError, type ListAgentVersions1Data, type ListAgentVersions1Error, type ListAgentVersions1Response, type ListAgentVersionsData, type ListAgentVersionsError, type ListAgentVersionsResponse, type ListEvaluationRunsData, type ListEvaluationRunsError, type ListEvaluationRunsResponse, type ListMinerAgentsError, type ListMinerAgentsResponse, type ListMinersData, type ListMinersError, type ListMinersResponse, type ListSuitesError, type ListSuitesResponse, type ListValidatorsData, type ListValidatorsError, type ListValidatorsResponse, type LogoutData, type LogoutError, type LogoutResponse, type LogoutResponse2, type MinerAgentsResponse, type MinerNotFoundError, type MissingParameterError, type MissingScoreError, type NoActiveSuiteError, type NotRunOwnerError, type OroErrorCode, type PendingEvaluation, type PendingEvaluationSummary, type PendingEvaluationsResponse, type PresignUploadData, type PresignUploadError, type PresignUploadRequest, type PresignUploadResponse, type PresignUploadResponse2, type ProblemNotFoundError, type ProblemProgressEntry, type ProblemProgressUpdate, type ProblemPublic, type ProblemStatus, type ProgressUpdateRequest, type ProgressUpdateResponse, type RateLimitExceededError, type ReaperStatsResponse, type ReevaluateAgentVersionData, type ReevaluateAgentVersionError, type ReevaluateAgentVersionResponse, type ReevaluateRequest, type ReevaluateResponse, type ReinstateAgentVersionData, type ReinstateAgentVersionError, type ReinstateAgentVersionResponse, type ReinstateRequest, type RequestChallengeData, type RequestChallengeError, type RequestChallengeResponse, type RetryConfig, type RetryContext, type RunAlreadyCompleteError, type RunProblemsResponse, type RunningEvaluation, type ScoreBelowThresholdError, type SessionAuthConfig, SessionAuthManager, type SessionInfo, type SessionRequest, type SessionResponse, type SetTopAgentData, type SetTopAgentError, type SetTopAgentResponse, type SetTopRequest, type SetTopResponse, type StoreChutesTokenData, type StoreChutesTokenError, type StoreChutesTokenRequest, type StoreChutesTokenResponse, type SubmitAgentData, type SubmitAgentError, type SubmitAgentResponse, type SubmitAgentResponse2, type SuiteNotFoundError, type SuitePublic, type SuiteWithProblemsResponse, type TerminalStatus, type TopAgentResponse, type TopHistoryEntry, type TopHistoryResponse, type UnbanMinerData, type UnbanMinerError, type UnbanMinerResponse, type UnbanValidatorData, type UnbanValidatorError, type UnbanValidatorResponse, type UpdateProgressData, type UpdateProgressError, type UpdateProgressResponse, type ValidationError, type ValidatorCurrentAgent, type ValidatorNotFoundError, type ValidatorProblemResult, type ValidatorPublic, type ValidatorScoreSummary, type ValidatorScoresResponse, type ValidatorStatus, type WaitlistSignupRequest, type WaitlistSignupResponse, type WorkItemStatus, activateSuite, banMiner, banValidator, cancelAgentVersion, claimWork, classifyError, classifyStatus, clearMinerCooldown, client, completeRun, computeDelay, configureBittensorAuth, configurePublicClient, configureSessionAuth, createRetryFetch, createSessionEndpoint, createSuite, discardAgentVersion, generateAuthHeaders, getAgentVersion, getAgentVersionCode, getAgentVersionProblems, getAgentVersionRuns, getAgentVersionStatus, getAgentVersionVariance, getArtifactDownloadUrl, getAuditEvents, getChutesAuthStatus, getCurrentSuite, getErrorCode, getErrorDetail, getEvaluationRun, getLeaderboard, getOwnedAgentVersionStatus, getPendingEvaluations, getReaperStats, getRunProblems, getRunningEvaluations, getSuiteProblems, getTopAgent, getTopHistory, getValidatorScores, getValidators, hasDetail, hasErrorCode, healthCheck, heartbeat, invalidateEvaluationRun, isTransient, isTransientError, joinWaitlist, listAgentVersions, listAgentVersions1, listEvaluationRuns, listMinerAgents, listMiners, listSuites, listValidators, logout, parseRetryAfter, presignUpload, reevaluateAgentVersion, reinstateAgentVersion, requestChallenge, setTopAgent, storeChutesToken, submitAgent, unbanMiner, unbanValidator, updateProgress };
|
package/dist/index.js
CHANGED
|
@@ -67,6 +67,7 @@ __export(index_exports, {
|
|
|
67
67
|
getOwnedAgentVersionStatus: () => getOwnedAgentVersionStatus,
|
|
68
68
|
getPendingEvaluations: () => getPendingEvaluations,
|
|
69
69
|
getReaperStats: () => getReaperStats,
|
|
70
|
+
getRunProblems: () => getRunProblems,
|
|
70
71
|
getRunningEvaluations: () => getRunningEvaluations,
|
|
71
72
|
getSuiteProblems: () => getSuiteProblems,
|
|
72
73
|
getTopAgent: () => getTopAgent,
|
|
@@ -297,6 +298,12 @@ var completeRun = (options) => {
|
|
|
297
298
|
url: "/v1/validator/evaluation-runs/{eval_run_id}/complete"
|
|
298
299
|
});
|
|
299
300
|
};
|
|
301
|
+
var getRunProblems = (options) => {
|
|
302
|
+
return (options?.client ?? client).get({
|
|
303
|
+
...options,
|
|
304
|
+
url: "/v1/validator/evaluation-runs/{eval_run_id}/problems"
|
|
305
|
+
});
|
|
306
|
+
};
|
|
300
307
|
var banMiner = (options) => {
|
|
301
308
|
return (options?.client ?? client).post({
|
|
302
309
|
...options,
|
|
@@ -828,6 +835,7 @@ function configureSessionAuth(baseUrl, config) {
|
|
|
828
835
|
getOwnedAgentVersionStatus,
|
|
829
836
|
getPendingEvaluations,
|
|
830
837
|
getReaperStats,
|
|
838
|
+
getRunProblems,
|
|
831
839
|
getRunningEvaluations,
|
|
832
840
|
getSuiteProblems,
|
|
833
841
|
getTopAgent,
|
package/dist/index.mjs
CHANGED
|
@@ -192,6 +192,12 @@ var completeRun = (options) => {
|
|
|
192
192
|
url: "/v1/validator/evaluation-runs/{eval_run_id}/complete"
|
|
193
193
|
});
|
|
194
194
|
};
|
|
195
|
+
var getRunProblems = (options) => {
|
|
196
|
+
return (options?.client ?? client).get({
|
|
197
|
+
...options,
|
|
198
|
+
url: "/v1/validator/evaluation-runs/{eval_run_id}/problems"
|
|
199
|
+
});
|
|
200
|
+
};
|
|
195
201
|
var banMiner = (options) => {
|
|
196
202
|
return (options?.client ?? client).post({
|
|
197
203
|
...options,
|
|
@@ -722,6 +728,7 @@ export {
|
|
|
722
728
|
getOwnedAgentVersionStatus,
|
|
723
729
|
getPendingEvaluations,
|
|
724
730
|
getReaperStats,
|
|
731
|
+
getRunProblems,
|
|
725
732
|
getRunningEvaluations,
|
|
726
733
|
getSuiteProblems,
|
|
727
734
|
getTopAgent,
|
package/package.json
CHANGED
package/src/generated/sdk.gen.ts
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
// This file is auto-generated by @hey-api/openapi-ts
|
|
2
2
|
|
|
3
3
|
import { createClient, createConfig, type OptionsLegacyParser, formDataBodySerializer } from '@hey-api/client-fetch';
|
|
4
|
-
import type { HealthCheckError, HealthCheckResponse, ListSuitesError, ListSuitesResponse, GetCurrentSuiteError, GetCurrentSuiteResponse, GetSuiteProblemsData, GetSuiteProblemsError, GetSuiteProblemsResponse, GetLeaderboardData, GetLeaderboardError, GetLeaderboardResponse, GetTopAgentError, GetTopAgentResponse, GetTopHistoryData, GetTopHistoryError, GetTopHistoryResponse, GetAgentVersionStatusData, GetAgentVersionStatusError, GetAgentVersionStatusResponse, GetAgentVersionRunsData, GetAgentVersionRunsError, GetAgentVersionRunsResponse, GetAgentVersionProblemsData, GetAgentVersionProblemsError, GetAgentVersionProblemsResponse, GetAgentVersionData, GetAgentVersionError, GetAgentVersionResponse, GetArtifactDownloadUrlData, GetArtifactDownloadUrlError, GetArtifactDownloadUrlResponse, GetEvaluationRunData, GetEvaluationRunError, GetEvaluationRunResponse, GetValidatorsError, GetValidatorsResponse, GetRunningEvaluationsError, GetRunningEvaluationsResponse, GetPendingEvaluationsData, GetPendingEvaluationsError, GetPendingEvaluationsResponse, JoinWaitlistData, JoinWaitlistError, JoinWaitlistResponse, RequestChallengeData, RequestChallengeError, RequestChallengeResponse, CreateSessionEndpointData, CreateSessionEndpointError, CreateSessionEndpointResponse, LogoutData, LogoutError, LogoutResponse2, SubmitAgentData, SubmitAgentError, SubmitAgentResponse2, StoreChutesTokenData, StoreChutesTokenError, StoreChutesTokenResponse, GetChutesAuthStatusError, GetChutesAuthStatusResponse, ListMinerAgentsError, ListMinerAgentsResponse, ListAgentVersionsData, ListAgentVersionsError, ListAgentVersionsResponse, GetOwnedAgentVersionStatusData, GetOwnedAgentVersionStatusError, GetOwnedAgentVersionStatusResponse, ClaimWorkData, ClaimWorkError, ClaimWorkResponse2, HeartbeatData, HeartbeatError, HeartbeatResponse2, UpdateProgressData, UpdateProgressError, UpdateProgressResponse, PresignUploadData, PresignUploadError, PresignUploadResponse2, CompleteRunData, CompleteRunError, CompleteRunResponse2, BanMinerData, BanMinerError, BanMinerResponse, UnbanMinerData, UnbanMinerError, UnbanMinerResponse, BanValidatorData, BanValidatorError, BanValidatorResponse, UnbanValidatorData, UnbanValidatorError, UnbanValidatorResponse, DiscardAgentVersionData, DiscardAgentVersionError, DiscardAgentVersionResponse, ReinstateAgentVersionData, ReinstateAgentVersionError, ReinstateAgentVersionResponse, SetTopAgentData, SetTopAgentError, SetTopAgentResponse, InvalidateEvaluationRunData, InvalidateEvaluationRunError, InvalidateEvaluationRunResponse, ReevaluateAgentVersionData, ReevaluateAgentVersionError, ReevaluateAgentVersionResponse, CancelAgentVersionData, CancelAgentVersionError, CancelAgentVersionResponse, CreateSuiteData, CreateSuiteError, CreateSuiteResponse2, ActivateSuiteData, ActivateSuiteError, ActivateSuiteResponse2, GetAuditEventsData, GetAuditEventsError, GetAuditEventsResponse, GetReaperStatsError, GetReaperStatsResponse, ClearMinerCooldownData, ClearMinerCooldownError, ClearMinerCooldownResponse, ListMinersData, ListMinersError, ListMinersResponse, ListValidatorsData, ListValidatorsError, ListValidatorsResponse, ListAgentVersions1Data, ListAgentVersions1Error, ListAgentVersions1Response, ListEvaluationRunsData, ListEvaluationRunsError, ListEvaluationRunsResponse, GetValidatorScoresData, GetValidatorScoresError, GetValidatorScoresResponse, GetAgentVersionVarianceData, GetAgentVersionVarianceError, GetAgentVersionVarianceResponse, GetAgentVersionCodeData, GetAgentVersionCodeError, GetAgentVersionCodeResponse } from './types.gen';
|
|
4
|
+
import type { HealthCheckError, HealthCheckResponse, ListSuitesError, ListSuitesResponse, GetCurrentSuiteError, GetCurrentSuiteResponse, GetSuiteProblemsData, GetSuiteProblemsError, GetSuiteProblemsResponse, GetLeaderboardData, GetLeaderboardError, GetLeaderboardResponse, GetTopAgentError, GetTopAgentResponse, GetTopHistoryData, GetTopHistoryError, GetTopHistoryResponse, GetAgentVersionStatusData, GetAgentVersionStatusError, GetAgentVersionStatusResponse, GetAgentVersionRunsData, GetAgentVersionRunsError, GetAgentVersionRunsResponse, GetAgentVersionProblemsData, GetAgentVersionProblemsError, GetAgentVersionProblemsResponse, GetAgentVersionData, GetAgentVersionError, GetAgentVersionResponse, GetArtifactDownloadUrlData, GetArtifactDownloadUrlError, GetArtifactDownloadUrlResponse, GetEvaluationRunData, GetEvaluationRunError, GetEvaluationRunResponse, GetValidatorsError, GetValidatorsResponse, GetRunningEvaluationsError, GetRunningEvaluationsResponse, GetPendingEvaluationsData, GetPendingEvaluationsError, GetPendingEvaluationsResponse, JoinWaitlistData, JoinWaitlistError, JoinWaitlistResponse, RequestChallengeData, RequestChallengeError, RequestChallengeResponse, CreateSessionEndpointData, CreateSessionEndpointError, CreateSessionEndpointResponse, LogoutData, LogoutError, LogoutResponse2, SubmitAgentData, SubmitAgentError, SubmitAgentResponse2, StoreChutesTokenData, StoreChutesTokenError, StoreChutesTokenResponse, GetChutesAuthStatusError, GetChutesAuthStatusResponse, ListMinerAgentsError, ListMinerAgentsResponse, ListAgentVersionsData, ListAgentVersionsError, ListAgentVersionsResponse, GetOwnedAgentVersionStatusData, GetOwnedAgentVersionStatusError, GetOwnedAgentVersionStatusResponse, ClaimWorkData, ClaimWorkError, ClaimWorkResponse2, HeartbeatData, HeartbeatError, HeartbeatResponse2, UpdateProgressData, UpdateProgressError, UpdateProgressResponse, PresignUploadData, PresignUploadError, PresignUploadResponse2, CompleteRunData, CompleteRunError, CompleteRunResponse2, GetRunProblemsData, GetRunProblemsError, GetRunProblemsResponse, BanMinerData, BanMinerError, BanMinerResponse, UnbanMinerData, UnbanMinerError, UnbanMinerResponse, BanValidatorData, BanValidatorError, BanValidatorResponse, UnbanValidatorData, UnbanValidatorError, UnbanValidatorResponse, DiscardAgentVersionData, DiscardAgentVersionError, DiscardAgentVersionResponse, ReinstateAgentVersionData, ReinstateAgentVersionError, ReinstateAgentVersionResponse, SetTopAgentData, SetTopAgentError, SetTopAgentResponse, InvalidateEvaluationRunData, InvalidateEvaluationRunError, InvalidateEvaluationRunResponse, ReevaluateAgentVersionData, ReevaluateAgentVersionError, ReevaluateAgentVersionResponse, CancelAgentVersionData, CancelAgentVersionError, CancelAgentVersionResponse, CreateSuiteData, CreateSuiteError, CreateSuiteResponse2, ActivateSuiteData, ActivateSuiteError, ActivateSuiteResponse2, GetAuditEventsData, GetAuditEventsError, GetAuditEventsResponse, GetReaperStatsError, GetReaperStatsResponse, ClearMinerCooldownData, ClearMinerCooldownError, ClearMinerCooldownResponse, ListMinersData, ListMinersError, ListMinersResponse, ListValidatorsData, ListValidatorsError, ListValidatorsResponse, ListAgentVersions1Data, ListAgentVersions1Error, ListAgentVersions1Response, ListEvaluationRunsData, ListEvaluationRunsError, ListEvaluationRunsResponse, GetValidatorScoresData, GetValidatorScoresError, GetValidatorScoresResponse, GetAgentVersionVarianceData, GetAgentVersionVarianceError, GetAgentVersionVarianceResponse, GetAgentVersionCodeData, GetAgentVersionCodeError, GetAgentVersionCodeResponse } from './types.gen';
|
|
5
5
|
|
|
6
6
|
export const client = createClient(createConfig());
|
|
7
7
|
|
|
@@ -364,6 +364,17 @@ export const completeRun = <ThrowOnError extends boolean = false>(options: Optio
|
|
|
364
364
|
});
|
|
365
365
|
};
|
|
366
366
|
|
|
367
|
+
/**
|
|
368
|
+
* Get problems for an evaluation run
|
|
369
|
+
* Returns the problems that should be evaluated for a given run.
|
|
370
|
+
*/
|
|
371
|
+
export const getRunProblems = <ThrowOnError extends boolean = false>(options: OptionsLegacyParser<GetRunProblemsData, ThrowOnError>) => {
|
|
372
|
+
return (options?.client ?? client).get<GetRunProblemsResponse, GetRunProblemsError, ThrowOnError>({
|
|
373
|
+
...options,
|
|
374
|
+
url: '/v1/validator/evaluation-runs/{eval_run_id}/problems'
|
|
375
|
+
});
|
|
376
|
+
};
|
|
377
|
+
|
|
367
378
|
/**
|
|
368
379
|
* Ban a miner
|
|
369
380
|
* Ban a miner from submitting agents.
|
|
@@ -601,6 +601,10 @@ export type AgentVersionStatus = {
|
|
|
601
601
|
* Final score if eligible
|
|
602
602
|
*/
|
|
603
603
|
final_score?: (number | null);
|
|
604
|
+
/**
|
|
605
|
+
* Average reasoning coefficient from included successful runs
|
|
606
|
+
*/
|
|
607
|
+
reasoning_coefficient?: (number | null);
|
|
604
608
|
/**
|
|
605
609
|
* Whether artifacts are released
|
|
606
610
|
*/
|
|
@@ -1205,6 +1209,12 @@ export type EvaluationRunDetail = {
|
|
|
1205
1209
|
*/
|
|
1206
1210
|
sandbox_metadata?: ({
|
|
1207
1211
|
[key: string]: unknown;
|
|
1212
|
+
} | null);
|
|
1213
|
+
/**
|
|
1214
|
+
* Score breakdown including reasoning details
|
|
1215
|
+
*/
|
|
1216
|
+
score_components_summary?: ({
|
|
1217
|
+
[key: string]: unknown;
|
|
1208
1218
|
} | null);
|
|
1209
1219
|
};
|
|
1210
1220
|
|
|
@@ -2060,6 +2070,16 @@ export type RunningEvaluation = {
|
|
|
2060
2070
|
progress_percent?: number;
|
|
2061
2071
|
};
|
|
2062
2072
|
|
|
2073
|
+
/**
|
|
2074
|
+
* Problems for an evaluation run.
|
|
2075
|
+
*/
|
|
2076
|
+
export type RunProblemsResponse = {
|
|
2077
|
+
/**
|
|
2078
|
+
* Problems to evaluate against
|
|
2079
|
+
*/
|
|
2080
|
+
problems: Array<ProblemPublic>;
|
|
2081
|
+
};
|
|
2082
|
+
|
|
2063
2083
|
/**
|
|
2064
2084
|
* 400 - Candidate score does not exceed the challenge threshold.
|
|
2065
2085
|
*/
|
|
@@ -2967,6 +2987,19 @@ export type CompleteRunResponse2 = (CompleteRunResponse);
|
|
|
2967
2987
|
|
|
2968
2988
|
export type CompleteRunError = ((MissingScoreError | ValidationError) | EvalRunNotFoundError | (NotRunOwnerError | RunAlreadyCompleteError) | HTTPValidationError);
|
|
2969
2989
|
|
|
2990
|
+
export type GetRunProblemsData = {
|
|
2991
|
+
path: {
|
|
2992
|
+
/**
|
|
2993
|
+
* Evaluation run ID
|
|
2994
|
+
*/
|
|
2995
|
+
eval_run_id: string;
|
|
2996
|
+
};
|
|
2997
|
+
};
|
|
2998
|
+
|
|
2999
|
+
export type GetRunProblemsResponse = (RunProblemsResponse);
|
|
3000
|
+
|
|
3001
|
+
export type GetRunProblemsError = (EvalRunNotFoundError | HTTPValidationError);
|
|
3002
|
+
|
|
2970
3003
|
export type BanMinerData = {
|
|
2971
3004
|
body: BanRequest;
|
|
2972
3005
|
path: {
|