@salesforce/lds-adapters-service-einsteinllm 1.414.1 → 1.415.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/src/raml/api.raml CHANGED
@@ -435,6 +435,10 @@ types:
435
435
  description: Additional configuration to fine tune model parameters
436
436
  type: EinsteinLlmAdditionalConfigInputRepresentation # Hand-rolled update from 'object'
437
437
  required: false # TODO Hand-rolled W-9314597
438
+ includeMetrics:
439
+ description: Whether to return metrics
440
+ type: boolean
441
+ required: false
438
442
  inputParams:
439
443
  description: Dictionary of input parameters to generate prompt from prompt
440
444
  template.
@@ -481,6 +485,11 @@ types:
481
485
  description: Any provider specific attributes will be included as part of
482
486
  this object
483
487
  type: WrappedMap | nil # Hand-rolled union 'nil'
488
+ performance:
489
+ description: Performance metrics including overall latency and detailed execution
490
+ breakdown
491
+ required: false
492
+ type: EinsteinPromptTemplatePerformanceRepresentation
484
493
  prompt:
485
494
  description: Prompt used for the generation
486
495
  type: string | nil # Hand-rolled union 'nil'
@@ -520,6 +529,10 @@ types:
520
529
  required: false # TODO Hand-rolled W-17552098
521
530
  items:
522
531
  type: EinsteinPromptTemplateAttachmentRepresentation
532
+ tokenUsage:
533
+ description: Token usage information
534
+ required: false
535
+ type: EinsteinPromptTemplateTokenUsageRepresentation
523
536
  EinsteinLlmGenerationCitationRepresentation:
524
537
  description: Output of an Einstein LLM Generation Citation
525
538
  type: object
@@ -984,6 +997,121 @@ types:
984
997
  versionId:
985
998
  description: Prompt Template Version Id
986
999
  type: string
1000
+ EinsteinPromptTemplatePerformanceRepresentation:
1001
+ description: Performance metrics including overall latency and detailed execution
1002
+ breakdown
1003
+ type: object
1004
+ properties:
1005
+ execution:
1006
+ description: Detailed latency breakdown for all execution steps
1007
+ type: EinsteinPromptTemplateLatencyExecutionRepresentation
1008
+ latency:
1009
+ description: Overall latency metrics for the entire operation
1010
+ type: EinsteinPromptTemplateLatencyRepresentation
1011
+ EinsteinPromptTemplateLatencyBreakdownItemRepresentation:
1012
+ description: Latency breakdown item with reference name and latency metrics
1013
+ type: object
1014
+ properties:
1015
+ latency:
1016
+ description: Latency information for this breakdown item
1017
+ type: EinsteinPromptTemplateLatencyRepresentation
1018
+ referenceName:
1019
+ description: Reference name for the breakdown item
1020
+ type: string
1021
+ EinsteinPromptTemplateLatencyExecutionRepresentation:
1022
+ description: Latency execution breakdown with metrics for all execution steps
1023
+ type: object
1024
+ properties:
1025
+ generation:
1026
+ description: Latency metrics for generation step
1027
+ type: EinsteinPromptTemplateLatencyStepRepresentation
1028
+ required: false
1029
+ hydration:
1030
+ description: Latency metrics for hydration step
1031
+ type: EinsteinPromptTemplateLatencyStepRepresentation
1032
+ required: false
1033
+ loadTemplate:
1034
+ description: Latency metrics for loading the template
1035
+ type: EinsteinPromptTemplateLatencyStepRepresentation
1036
+ mask:
1037
+ description: Latency metrics for masking step
1038
+ type: EinsteinPromptTemplateLatencyStepRepresentation
1039
+ required: false
1040
+ resolveData:
1041
+ description: Latency metrics for resolving all data (inputs and data providers)
1042
+ with breakdown
1043
+ type: EinsteinPromptTemplateLatencyStepRepresentation
1044
+ required: false
1045
+ summarize:
1046
+ description: Latency metrics for summarization step
1047
+ type: EinsteinPromptTemplateLatencyStepRepresentation
1048
+ required: false
1049
+ EinsteinPromptTemplateLatencyRepresentation:
1050
+ description: Latency information with duration and start time
1051
+ type: object
1052
+ properties:
1053
+ duration:
1054
+ description: Duration of the operation in milliseconds
1055
+ type: integer
1056
+ startTime:
1057
+ description: Start time of the operation in milliseconds
1058
+ type: integer
1059
+ EinsteinPromptTemplateLatencyStepRepresentation:
1060
+ description: Latency step information with latency metrics and breakdown
1061
+ type: object
1062
+ properties:
1063
+ breakdown:
1064
+ description: Breakdown of latency by reference name
1065
+ type: array
1066
+ required: false
1067
+ items:
1068
+ type: EinsteinPromptTemplateLatencyBreakdownItemRepresentation
1069
+ latency:
1070
+ description: Latency information for this step
1071
+ type: EinsteinPromptTemplateLatencyRepresentation
1072
+ EinsteinPromptTemplatePromptTokenUsageRepresentation:
1073
+ description: Output representation for prompt token usage with breakdown
1074
+ type: object
1075
+ properties:
1076
+ breakdown:
1077
+ description: Breakdown of token usage by source (text expressions, files,
1078
+ etc.)
1079
+ required: false
1080
+ type: array
1081
+ items:
1082
+ type: EinsteinPromptTemplateTokenBreakdownRepresentation
1083
+ total:
1084
+ description: Total number of tokens used in the prompt
1085
+ type: integer
1086
+ EinsteinPromptTemplateTokenUsageRepresentation:
1087
+ description: Output representation for token usage and its breakdown
1088
+ type: object
1089
+ properties:
1090
+ completion:
1091
+ description: Number of tokens used for completion
1092
+ type: integer
1093
+ prompt:
1094
+ description: Prompt token usage details including breakdown by source
1095
+ type: EinsteinPromptTemplatePromptTokenUsageRepresentation
1096
+ total:
1097
+ description: Total number of tokens used in the request
1098
+ type: integer
1099
+ EinsteinPromptTemplateTokenBreakdownRepresentation:
1100
+ description: Output representation for a single token breakdown item by source
1101
+ type: object
1102
+ properties:
1103
+ occurrences:
1104
+ description: Number of times this expression appears in the prompt
1105
+ type: integer
1106
+ role:
1107
+ description: Role associated with source of token.
1108
+ type: string
1109
+ source:
1110
+ description: Specific part of prompt that contributed to tokens.
1111
+ type: string
1112
+ tokens:
1113
+ description: Number of tokens contributed by this source
1114
+ type: integer
987
1115
  WrappedListString:
988
1116
  description: Wrapped list of String for use in Apex.
989
1117
  type: object