npm - @salesforce/lds-adapters-sfap-einstein-ai-gateway - Versions diffs - 0.1.0-dev1 - Mend

@salesforce/lds-adapters-sfap-einstein-ai-gateway 0.1.0-dev1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (50) hide show

package/src/raml/api.raml ADDED Viewed

@@ -0,0 +1,1003 @@
+#%RAML 1.0
+types:
+  # Array payload with one LLMProviderResponse entry per supported provider.
+  LLMProvidersResponse:
+    type: array
+    items: LLMProviderResponse
+    description: List of LLM providers supported in the gateway.
+  # Success payload of POST /ai/gpt/v1/generations ('200' response).
+  GenerationResponse:
+    type: object
+    properties:
+      id:
+        type: string
+        required: true
+        description: ID of the generation request.
+      generations:
+        type: array
+        items: GenerationResponseGenerations
+        required: true
+        description: List of generated text items.
+      prompt?:
+        type: string | nil
+        (nullable): true
+        description: Prompt used for the generation. Can be `null`.
+      input_safety_score?:
+        type: SafetyScoreRepresentation | nil
+        (nullable): true
+      parameters?:
+        type: object
+        (nullable): true
+        description: Any provider-specific attributes included as part of this object. Can be `null`.
+        additionalProperties: true
+        properties:
+          # Pattern property with an empty pattern: accepts any key with any value.
+          //:
+            type: any
+        example:
+          strict: false
+          value:
+            model: text-davinci-003
+            object: text_completion
+            usage:
+              completion_tokens: 235
+              prompt_tokens: 91
+              total_tokens: 326
+  # Single link target; used as the value type of each entry in Links.
+  HyperLink:
+    type: object
+    description: Hyperlink object included in the Links schema.
+    properties:
+      href?:
+        type: string
+        description: Link to the endpoint.
+        example:
+          strict: false
+          value: https://bot-svc-llm.sfproxy.einstein.aws-prod1-useast1.aws.sfdc.cl/v1.0/chat/session/
+  # Generic error payload: a required `message` plus any additional fields.
+  Error:
+    type: object
+    additionalProperties: true
+    properties:
+      message:
+        type: string
+        required: true
+        description: Exception error message.
+        example:
+          strict: false
+          value: Something went wrong
+    # Non-strict sample payloads, each carrying a different message text.
+    examples:
+      generated_1:
+        strict: false
+        value:
+          message: Bad Request
+      generated_2:
+        strict: false
+        value:
+          message: Access bearer token is missing or invalid
+      generated_3:
+        strict: false
+        value:
+          message: User forbidden from accessing the resource
+      generated_4:
+        strict: false
+        value:
+          message: Server is busy and cannot process the request at this time
+      generated_5:
+        strict: false
+        value:
+          message: Too many requests for the server to handle
+      generated_6:
+        strict: false
+        value:
+          message: Internal server error
+      generated_7:
+        strict: false
+        value:
+          message: Service is unavailable
+      generated_8:
+        strict: false
+        value:
+          message: List models not supported for this provider
+  # Tunable knobs for a generation; every property is optional.
+  GenerationSettings:
+    type: object
+    description: Settings that can be configured for a generation.
+    properties:
+      num_generations?:
+        type: integer
+        default: 1
+        description: Number of completions to be generated for a prompt.
+      max_tokens?:
+        type: integer
+        default: 16
+        description: Maximum number of tokens to be generated.
+      temperature?:
+        type: number
+        default: 0.5
+        description: Sampling temperature to be used. Higher values mean more random token choices. Lower values mean less random token choices. Min value of 0; max value of 1.0.
+      stop_sequences?:
+        type: array
+        items: string
+        description: An array of stop sequences to be used. The generated text is cut at the end of the earliest occurrence of a stop sequence.
+      frequency_penalty?:
+        type: number
+        default: 0.0
+        description: The frequency penalty to be used. Min value is 0.0; max value is 1.0. Can reduce the repetitiveness of generated tokens. The higher the value, the stronger a penalty is applied to previously present tokens, proportional to how many times they have already appeared in the prompt or prior generation.
+      presence_penalty?:
+        type: number
+        default: 0.0
+        description: The presence penalty to be used. Min value is 0.0; max value is 1.0. Can reduce the repetitiveness of generated tokens. Behaves similarly to `frequency_penalty`, except that this penalty is applied equally to all tokens that have already appeared, regardless of their exact frequencies.
+      parameters?:
+        type: object
+        description: Dictionary of any other parameters that are required by the specified provider. Values are passed as is to the provider so that the request can include parameters that are unique to a provider.
+        additionalProperties: true
+        properties:
+          # Pattern property with an empty pattern: accepts any key with any value.
+          //:
+            type: any
+        example:
+          strict: false
+          value:
+            top_p: 0.5
+            logProbs: 3
+            echo: false
+  # Providers selectable for a chat session; currently a single-value enum.
+  ChatSupportedProviders:
+    description: Provider used in the session.
+    # Declared as `string` rather than `any`: every enum member is a string,
+    # which matches how the other provider enums in this file are typed.
+    type: string
+    enum:
+      - OpenAI
+  # Closed object (no extra keys allowed) holding up to three HyperLink entries.
+  Links:
+    type: object
+    description: List of Einstein GPT API endpoints for HATEOAS compliance.
+    additionalProperties: false
+    properties:
+      # `self` is the only mandatory link.
+      self:
+        type: HyperLink
+        required: true
+      session?:
+        type: HyperLink
+      messages?:
+        type: HyperLink
+  # Capability flags and token limit reported for one provider; all fields are required.
+  LLMProviderDetails:
+    type: object
+    description: Dictionary of properties for the provider.
+    properties:
+      provider_type:
+        type: string
+        required: true
+        enum:
+          - internal
+          - external
+        description: Type of LLM provider (internal or external).
+      provider_description:
+        type: string
+        required: true
+        description: Short description of the provider.
+      supports_generate:
+        type: boolean
+        required: true
+        description: Indicates whether the provider supports the `generate` operation.
+      supports_models:
+        type: boolean
+        required: true
+        description: Indicates whether the provider supports the `models` operation.
+      supports_embeddings:
+        type: boolean
+        required: true
+        description: Indicates whether the provider supports the `embeddings` operation.
+      max_tokens:
+        type: integer
+        required: true
+        description: The maximum number of tokens allowed by the provider.
+  # Array payload with one ModelResponse entry per model.
+  ModelsResponse:
+    type: array
+    items: ModelResponse
+    description: List of models for the specified provider.
+  # Plain-string alias for the text a user sends to the LLM.
+  UserMessage:
+    type: string
+    description: The message from the user to the LLM.
+    example:
+      strict: false
+      value: Write a product description for a new phone.
+  # Open-ended object: no declared properties, any keys accepted.
+  PluginGenerationRequest:
+    type: object
+    additionalProperties: true
+    description: Generic plug-in generation request
+  # One provider entry: its enum-constrained name plus optional detail block.
+  LLMProviderResponse:
+    type: object
+    description: LLM provider properties.
+    properties:
+      name:
+        type: string
+        required: true
+        enum:
+          - OpenAI
+          - Cohere
+          - InternalTextGeneration
+          - InternalCodeGeneration
+        description: Name of the provider.
+      details?:
+        type: LLMProviderDetails
+  # Chat-style generation result: a list of ChatMessage items plus optional provider extras.
+  GenerationDetails:
+    type: object
+    description: Details for a generation request.
+    properties:
+      generations:
+        type: array
+        items: ChatMessage
+        required: true
+        description: Generated responses from the LLM.
+      parameters?:
+        type: object
+        additionalProperties: true
+        description: Any provider-specific attributes included as part of this object.
+        example:
+          strict: false
+          value:
+            model: text-davinci-003
+            object: text_completion
+            usage:
+              completion_tokens: 235
+              prompt_tokens: 91
+              total_tokens: 326
+  # Plain-string alias for a response identifier.
+  ResponseId:
+    type: string
+    description: Identifier for a response.
+    example:
+      strict: false
+      value: 014DFFD2-04B5-4765-8EA7-507585268CD3
+  # One conversation turn: `role` and `content` are mandatory, everything else optional.
+  ChatMessage:
+    type: object
+    description: Representation of a message in a conversation.
+    properties:
+      id?:
+        type: string
+        description: Generation ID. This value is required to register feedback.
+      role:
+        type: string
+        required: true
+        enum:
+          - system
+          - user
+          - assistant
+        description: Persona that sent the message.
+      content:
+        type: string
+        required: true
+        description: The content of the message.
+        example:
+          strict: false
+          value: Can you give me a recipe for chocolate brownies?
+      timestamp?:
+        type: number
+        description: Timestamp when the message was sent.
+        example:
+          strict: false
+          value: 1682536893
+      parameters?:
+        type: object
+        (nullable): true
+        additionalProperties: true
+        description: Any provider-specific attributes included as part of this object.
+        example:
+          strict: false
+          value:
+            finish_reason: stop
+            index: 0
+            logprobs: null
+      generation_safety_score?:
+        type: SafetyScoreRepresentation
+      generation_content_quality?:
+        type: ContentQualityRepresentation
+  # Item type of GenerationResponse.generations: the generated text plus optional metadata.
+  GenerationResponseGenerations:
+    type: object
+    description: Generated text that is part of the generated response.
+    properties:
+      id?:
+        type: string
+        description: Generation ID. This value is required to register feedback.
+      text:
+        type: string
+        required: true
+        description: The generated text.
+      parameters?:
+        type: object
+        (nullable): true
+        description: Any provider-specific attributes included as part of this object. Can be `null`.
+        additionalProperties: true
+        properties:
+          # Pattern property with an empty pattern: accepts any key with any value.
+          //:
+            type: any
+        example:
+          strict: false
+          value:
+            finish_reason: stop
+            index: 0
+            logprobs: null
+      generation_safety_score?:
+        type: SafetyScoreRepresentation | nil
+        (nullable): true
+      generation_content_quality?:
+        type: ContentQualityRepresentation | nil
+        (nullable): true
+  # Per-category scores; each is an optional number in [0, 1] defaulting to 0.0.
+  SafetyCategoryScores:
+    type: object
+    description: Probability for each category. A higher probability indicates a more toxic content.
+    properties:
+      toxicity?:
+        type: number
+        minimum: 0
+        maximum: 1
+        default: 0.0
+      hate?:
+        type: number
+        minimum: 0
+        maximum: 1
+        default: 0.0
+      identity?:
+        type: number
+        minimum: 0
+        maximum: 1
+        default: 0.0
+      violence?:
+        type: number
+        minimum: 0
+        maximum: 1
+        default: 0.0
+      physical?:
+        type: number
+        minimum: 0
+        maximum: 1
+        default: 0.0
+      sexual?:
+        type: number
+        minimum: 0
+        maximum: 1
+        default: 0.0
+      profanity?:
+        type: number
+        minimum: 0
+        maximum: 1
+        default: 0.0
+      biased?:
+        type: number
+        minimum: 0
+        maximum: 1
+        default: 0.0
+  # Open-ended object: no declared properties, any keys accepted.
+  PluginGenerationResponse:
+    type: object
+    additionalProperties: true
+    description: Generic plug-in generation response
+  # Request body of POST /ai/gpt/v1/generations. Only `prompt` is mandatory.
+  GenerationRequest:
+    type: object
+    properties:
+      prompt:
+        description: The prompt or text to be completed.
+        type: string
+        required: true
+      num_generations?:
+        description: Number of completions to be generated for the prompt.
+        default: 1
+        type: integer
+      max_tokens?:
+        description: Maximum number of tokens to be generated.
+        type: integer
+      enable_pii_masking?:
+        description: Indicates whether to mask personally identifiable information (PII) in the prompt. Defaults to `false`.
+        # The documented default is now declared as a facet, like the sibling properties.
+        default: false
+        type: boolean
+      temperature?:
+        description: Sampling temperature to be used. Higher values mean more random token choices. Lower values mean less random token choices. Min value of 0; max value of 1.0.
+        default: 0.5
+        type: number
+      stop_sequences?:
+        description: An array of stop sequences. The generated text is cut at the end of the earliest occurrence of a stop sequence.
+        type: array
+        items:
+          type: string
+      frequency_penalty?:
+        description: The frequency penalty. Min value is 0.0; max value is 1.0. Can reduce the repetitiveness of generated tokens. The higher the value, the stronger a penalty is applied to previously present tokens, proportional to how many times they have already appeared in the prompt or prior generation.
+        default: 0.0
+        type: number
+      presence_penalty?:
+        description: The presence penalty. Min value is 0.0; max value is 1.0. Can reduce the repetitiveness of generated tokens. Behaves similarly to `frequency_penalty`, except that this penalty is applied equally to all tokens that have already appeared, regardless of their exact frequencies.
+        default: 0.0
+        type: number
+      model?:
+        description: The model to be used for generating responses. Defaults to a provider-specific model.
+        example:
+          strict: false
+          value: text-davinci-003
+        type: string
+      parameters?:
+        description: Dictionary of any other parameters that are required by the provider. Values are passed as is to the provider so that the request can include parameters that are unique to a provider.
+        type: object
+        properties:
+          # Pattern property with an empty pattern: accepts any key with any value.
+          //:
+            type: any
+        example:
+          strict: false
+          value:
+            top_p: 0.5
+            logProbs: 3
+            echo: false
+        additionalProperties: true
+      tags?:
+        description: Dictionary of any other information relevant to the gateway client.
+        type: object
+        properties:
+          # Pattern property with an empty pattern: accepts any key with any value.
+          //:
+            type: any
+        example:
+          strict: false
+          value:
+            node-id: node-53p98pwse5i39ququ4
+            node-53p98pwse5i39ququ4: gateway-request-id
+        additionalProperties: true
+  # Content-quality signals attached to a generation.
+  ContentQualityRepresentation:
+    description: Data generated by the Trust Layer for content safety and quality (e.g., scores, explanations)
+    type: object
+    properties:
+      is_toxicity_detected?:
+        description: True if the overall safety score exceeds threshold, false otherwise. Null value indicates safety score call failed
+        # Nullable because the description documents `null` as the "call failed"
+        # signal; a plain `boolean` type would reject that documented value.
+        (nullable): true
+        type: boolean | nil
+  # Overall safety score in [0, 1] plus an optional, nullable per-category breakdown.
+  SafetyScoreRepresentation:
+    description: Overall score and category score
+    type: object
+    properties:
+      safety_score?:
+        description: A higher score implies safer content
+        type: number
+        minimum: 0
+        maximum: 1
+      category_scores?:
+        # Carries the `(nullable)` annotation like every other `| nil` union in
+        # this file. NOTE(review): confirm downstream tooling reads the annotation.
+        (nullable): true
+        type: SafetyCategoryScores | nil
+  # One model entry: a required id plus an optional free-form properties object.
+  ModelResponse:
+    type: object
+    description: Model properties.
+    properties:
+      id:
+        type: string
+        required: true
+        description: ID of the model.
+      properties?:
+        type: object
+        description: Dictionary of properties for the model. Values are specific to each provider.
+        example:
+          strict: false
+          value:
+            permission:
+              - allow_fine_tuning: true
+  # Error payload used by every non-200 response of /ai/gpt/v1/generations.
+  GenerationsErrorRepresentation:
+    type: object
+    description: Error response representation
+    additionalProperties: true
+    properties:
+      message:
+        type: string
+        required: true
+        description: Exception error message
+  # Controls how much prior conversation is included; both properties are optional.
+  ConversationalMemorySettings:
+    type: object
+    description: Settings that can be configured for conversational memory
+    properties:
+      strategy?:
+        type: string
+        enum:
+          - last_n_turns
+        default: last_n_turns
+        description: The strategy to use when providing conversational context to the LLM.
+      max_turns?:
+        type: integer
+        default: 5
+        description: Maximum number of turns to be included in the context provided to the LLM. To be used with last_n_turns strategy.
+  # `any`-typed wrapper whose `(amf-and)` annotation lists GenerationSettings.
+  # NOTE(review): presumably an allOf composition kept by a spec converter — confirm.
+  GenerationSettingsResponse:
+    type: any
+    (amf-and):
+      - GenerationSettings
+  # Request body of POST /ai/gpt/v1/feedback. Only `id` is mandatory.
+  FeedbackRequest:
+    type: object
+    properties:
+      id:
+        description: A unique ID for the feedback object.
+        type: string
+        # Made explicit; RAML properties are required by default, so behavior is unchanged.
+        required: true
+      generation_id?:
+        description: The ID of the gateway's generation response. For example, `GenerationResponseGenerations.id`.
+        type: string
+      turn_id?:
+        description: The unique ID of a batch of generations, used to capture a single feedback for multiple generations.
+        type: string
+      app_generation_id?:
+        description: The app-specific generation ID to support cases where the client further splits a generation into multiple generations.
+        type: string
+      app_generation?:
+        description: The app-specific generation text to support cases where the client further splits a generation into multiple generations.
+        type: string
+      feedback?:
+        description: The feedback sentiment. Can be `null`.
+        enum:
+          - GOOD
+          - BAD
+        (nullable): true
+        type: string | nil
+      feedback_text?:
+        description: The textual representation of the feedback as provided by the user.
+        type: string
+      source?:
+        description: The source of the feedback. For example, `human` or `app`.
+        type: string
+      app_feedback?:
+        description: Dictionary of any app-level feedback and any other free-form parameters.
+        type: object
+        properties:
+          //:
+            type: any # Fix for W-14390785
+        additionalProperties: true
+  # Body of the '200' response of POST /ai/gpt/v1/feedback.
+  FeedbackResponseRepresentation:
+    description: Output of an Einstein LLM feedback call
+    type: object
+    properties:
+      message:
+        description: Response text of the feedback API
+        type: string
+  # Body of the '202' (Accepted) response of POST /ai/gpt/v1/feedback; extra keys are allowed.
+  FeedbackResponse202Representation:
+    description: Output of an Einstein LLM feedback call
+    type: object
+    additionalProperties: true
+    properties:
+      message:
+        description: Response text of the feedback API
+        type: string
+  # Error payload used by the 4xx/5xx responses of /ai/gpt/v1/feedback.
+  FeedbackErrorRepresentation:
+    type: object
+    description: Feedback Error Representation
+    additionalProperties: true
+    properties:
+      message:
+        type: string
+        description: Exception error message
+  # Request body of POST /ai/gpt/v1/embeddings. Only `input` is mandatory.
+  EmbeddingRequest:
+    type: object
+    properties:
+      input:
+        description: Input text used for generating an embedding. Data is encoded as an array of strings.
+        type: array
+        items:
+          type: string
+        required: true
+      model?:
+        description: The model to be used for generating the embedding. Defaults to a provider-specific model.
+        example:
+          strict: false
+          value: text-embedding-ada-002
+        type: string
+      enable_pii_masking?:
+        description: Indicates whether to mask personally identifiable information (PII) in the prompt. Defaults to `false`.
+        # The documented default is now declared as a facet instead of living only in prose.
+        default: false
+        type: boolean
+      localization?: Localization
+      parameters?:
+        description: Dictionary of any other parameters that are required by the specified provider. Values are passed as is to the provider so that the request can include parameters that are unique to a provider.
+        type: object
+        properties:
+          //:
+            type: any # Fix for W-14390785
+        example:
+          strict: false
+          value:
+            logprobs: 5
+        additionalProperties: true
+  # Locale hints for a request: a required default plus optional input/expected locale lists.
+  Localization:
+    type: object
+    description: Localization
+    properties:
+      defaultLocale:
+        type: string
+        required: true
+        description: Language and region code.
+      inputLocales?:
+        type: array
+        items: ProbableLocale
+        description: Locales contained in the prompt text.
+      expectedLocales?:
+        type: array
+        items:
+          type: string
+        description: Expected output languages of the generations. Derived from output language instructions of the prompt.
+  # Item type of Localization.inputLocales.
+  ProbableLocale:
+    description: Locale paired with an optional probability between 0 and 1. Used for the entries of `Localization.inputLocales`.
+    type: object
+    properties:
+      locale:
+        type: string
+        description: Language and region code.
+        required: true
+      probability?:
+        type: number
+        minimum: 0
+        maximum: 1
+  # Success payload of POST /ai/gpt/v1/embeddings ('200' response).
+  EmbeddingResponse:
+    type: object
+    properties:
+      embeddings?:
+        type: array
+        items: Embeddings
+        description: Array of `Embeddings` in the response.
+      parameters?:
+        type: object
+        description: Any provider-specific attributes are included as part of this object.
+        additionalProperties: true
+        properties:
+          //:
+            type: any # Fix for W-14390785
+        example:
+          strict: false
+          value:
+            texts:
+              - input
+  # One embedding vector together with the index of the input it belongs to.
+  Embeddings:
+    type: object
+    description: Embedding of the text.
+    properties:
+      embedding?:
+        type: array
+        items: number
+        description: Embedding of the text. Data is specified as an array of numbers.
+      index?:
+        type: integer
+        description: Index of the input text to which the embedding belongs.
+  # Structured error payload used by every non-200 response of /ai/gpt/v1/embeddings.
+  EmbeddingErrorRepresentation:
+    type: object
+    additionalProperties: true
+    properties:
+      error_code:
+        type: string
+        required: true
+        description: Error code to map the error message
+        example:
+          strict: false
+          value: INTERNAL_ERROR
+      # NOTE(review): the description says `messageCode` but the key is `message_code` — confirm which is intended.
+      message_code:
+        type: string
+        required: true
+        description: The messageCode field is a specification of the error and uniquely identifies an error message.
+        example:
+          strict: false
+          value: E00001
+      message:
+        type: string
+        required: true
+        description: Exception error message.
+        example:
+          strict: false
+          value: A generic error emitted by the API platform and mapped to the 500 HTTP status code
+      # NOTE(review): the description says `targets` but the key is `target` — confirm which is intended.
+      target?:
+        type: array
+        description: The targets field is a collection of references that represent the specific occurrence of the problem.
+        items:
+          type: object
+          properties:
+            type:
+              type: string
+              required: false
+              description: FIELD | QUERY_PARAMETER | HTTP_HEADER
+              example:
+                strict: false
+                value: FIELD
+            reference:
+              type: string
+              required: false
+              example:
+                strict: false
+                value: $['order']['payment']['billingAddress']['postalCode']
+      parameters?:
+        type: array
+        description: The parameters field is a collection of name-value pairs where each item in the collection represents a parameter leveraged in the error message.
+        items:
+          type: object
+          properties:
+            name:
+              type: string
+              required: false
+              example:
+                strict: false
+                value: postalCode
+            value:
+              type: string
+              required: false
+              example:
+                strict: false
+                value: '123456789'
+# Annotation declarations; each one accepts a value of any type.
+# Written with the type-expression shorthand (`name: any`).
+annotationTypes:
+  amf-serverDescription: any
+  amf-exclusiveMinimum: any
+  amf-binding: any
+  nullable: any
+  amf-pattern: any
+  amf-payloads: any
+  amf-exclusiveMaximum: any
+  amf-consumes: any
+  amf-additionalProperties: any
+  amf-or: any
+  amf-url: any
+  amf-externalDocs: any
+  amf-flow: any
+  amf-oasDeprecated: any
+  amf-contact: any
+  amf-multipleOf: any
+  amf-xor: any
+  amf-not: any
+  amf-callbacks: any
+  amf-produces: any
+  amf-format: any
+  amf-license: any
+  amf-summary: any
+  amf-responses: any
+  amf-maximum: any
+  amf-tags: any
+  amf-dependencies: any
+  amf-readOnly: any
+  amf-tuple: any
+  amf-examples: any
+  amf-collectionFormat: any
+  amf-termsOfService: any
+  amf-servers: any
+  amf-xone: any
+  amf-defaultResponse: any
+  amf-baseUriParameters: any
+  amf-parameters: any
+  amf-minimum: any
+  amf-recursive: any
+  amf-and: any
+securitySchemes:  # Schemes that the resources below reference through `securedBy`.
+  bearerAuth:  # NOTE(review): named "bearer" while the description specifies a `C2C <C2C Token>` format — confirm the intended scheme.
+    type: http  # NOTE(review): RAML 1.0 defines OAuth 1.0, OAuth 2.0, Basic Authentication, Digest Authentication, Pass Through and x-<other>; confirm the toolchain accepts `http`.
+    description: HTTP C2C (cloud-to-cloud) authentication scheme. Must be in the format `C2C <C2C Token>`.
+    settings: {}  # Explicitly empty: no scheme-specific settings are declared.
+title: Generative AI Gateway API  # Root-level API metadata starts here.
+baseUri: api.salesforce.com  # NOTE(review): no URI scheme here and no `protocols` node is visible — confirm consumers supply the protocol.
+description: |
+  The Generative AI Gateway API connects your Einstein GPT application to large language models (LLMs) from Salesforce-approved providers.
+  To learn more about developing Einstein GPT applications, see the [developer guides](https://gpt-sfdocs.herokuapp.com/docs/platform/foundations/guide/) and the [Confluence space](https://www.sfdc.co/ai).
+version: v1  # Same version token as the `v1` segment of the resource paths below.
+# POST resource that generates text for a prompt.
+# Body and response types use the `mediaType: TypeName` shorthand.
+/ai/gpt/v1/generations:
+  post:
+    displayName: generations
+    (amf-summary): Generate response
+    description: Generate a response based on the provided prompt and model parameters.
+    headers:
+      # No `required` facet, so this header is mandatory by RAML default.
+      x-client-feature-id:
+        type: string
+        description: Client Feature Id.
+      x-sfdc-app-context:
+        type: string
+        required: false
+        default: EinsteinGPT
+        description: SFDC app context.
+      x-LLM-Provider:
+        type: string
+        required: false
+        enum:
+          - OpenAI
+          - Cohere
+          - InternalTextGeneration
+          - InternalCodeGeneration
+        description: Provider to use.
+        example:
+          strict: false
+          value: OpenAI
+    body:
+      application/json: GenerationRequest
+    responses:
+      '200':
+        description: OK
+        body:
+          application/json: GenerationResponse
+      # Every status below returns the same error payload type.
+      '400':
+        description: Bad Request
+        body:
+          application/json: GenerationsErrorRepresentation
+      '401':
+        description: Access bearer token is missing or invalid
+        body:
+          application/json: GenerationsErrorRepresentation
+      '403':
+        description: User forbidden from accessing the resource
+        body:
+          application/json: GenerationsErrorRepresentation
+      '423':
+        description: Server is busy and cannot process the request at this time
+        body:
+          application/json: GenerationsErrorRepresentation
+      '429':
+        description: Too many requests for the server to handle
+        body:
+          application/json: GenerationsErrorRepresentation
+      '500':
+        description: Internal server error.
+        body:
+          application/json: GenerationsErrorRepresentation
+      '503':
+        description: Service is unavailable
+        body:
+          application/json: GenerationsErrorRepresentation
+      '501':
+        description: Something went wrong
+        body:
+          application/json: GenerationsErrorRepresentation
+    securedBy:
+      - bearerAuth
+# POST resource that records feedback for an earlier generation.
+# Body and response types use the `mediaType: TypeName` shorthand.
+/ai/gpt/v1/feedback:
+  post:
+    displayName: feedback
+    (amf-summary): Register feedback
+    description: Register feedback for a generation.
+    headers:
+      # No `required` facet, so this header is mandatory by RAML default.
+      x-client-feature-id:
+        type: string
+        description: Client Feature Id.
+      x-sfdc-app-context:
+        type: string
+        required: false
+        default: EinsteinGPT
+        description: SFDC app context.
+    body:
+      application/json: FeedbackRequest
+    responses:
+      '202':
+        description: Accepted
+        body:
+          application/json: FeedbackResponse202Representation
+      '200':
+        description: Something went wrong
+        body:
+          application/json: FeedbackResponseRepresentation # Use FeedbackErrorRepresentation as it's an error if luvio key is relaxed
+      # Every status below returns FeedbackErrorRepresentation.
+      '400':
+        description: Bad Request
+        body:
+          application/json: FeedbackErrorRepresentation
+      '401':
+        description: Access bearer token is missing or invalid
+        body:
+          application/json: FeedbackErrorRepresentation
+      '403':
+        description: User forbidden from accessing the resource
+        body:
+          application/json: FeedbackErrorRepresentation
+      '423':
+        description: Server is busy and cannot process the request at this time
+        body:
+          application/json: FeedbackErrorRepresentation
+      '429':
+        description: Too many requests for the server to handle
+        body:
+          application/json: FeedbackErrorRepresentation
+      '503':
+        description: Service is unavailable
+        body:
+          application/json: FeedbackErrorRepresentation
+    securedBy:
+      - bearerAuth
+# POST resource that turns input text into embedding vectors.
+# Body and response types use the `mediaType: TypeName` shorthand.
+/ai/gpt/v1/embeddings:
+  post:
+    displayName: embeddings
+    (amf-summary): Create embedding
+    description: Create an embedding vector representing the input text.
+    headers:
+      # No `required` facet, so this header is mandatory by RAML default.
+      x-client-feature-id:
+        type: string
+        description: Client Feature Id.
+      x-sfdc-app-context:
+        type: string
+        required: false
+        default: EinsteinGPT
+        description: SFDC app context.
+      x-LLM-Provider:
+        type: string
+        required: false
+        enum:
+          - AzureOpenAI
+          - OpenAI
+          - InternalTextGeneration
+          - InternalCodeGeneration
+        description: Provider to use.
+        example:
+          strict: false
+          value: OpenAI
+    body:
+      application/json: EmbeddingRequest
+    responses:
+      '200':
+        description: OK
+        body:
+          application/json: EmbeddingResponse
+      # Every status below returns the same error payload type.
+      '400':
+        description: Bad Request
+        body:
+          application/json: EmbeddingErrorRepresentation
+      '401':
+        description: Access bearer token is missing or invalid
+        body:
+          application/json: EmbeddingErrorRepresentation
+      '403':
+        description: User forbidden from accessing the resource
+        body:
+          application/json: EmbeddingErrorRepresentation
+      '423':
+        description: Server is busy and cannot process the request at this time
+        body:
+          application/json: EmbeddingErrorRepresentation
+      '429':
+        description: Too many requests for the server to handle
+        body:
+          application/json: EmbeddingErrorRepresentation
+      '500':
+        description: Internal server error
+        body:
+          application/json: EmbeddingErrorRepresentation
+      '503':
+        description: Service is unavailable
+        body:
+          application/json: EmbeddingErrorRepresentation
+      '501':
+        description: Something went wrong
+        body:
+          application/json: EmbeddingErrorRepresentation
+    securedBy:
+      - bearerAuth