@alquimia-ai/tools 1.2.0 → 1.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -43,13 +43,20 @@ declare class StabilityProvider extends StableDiffusionProvider {
43
43
  generateImage(query: string): Promise<string>;
44
44
  }
45
45
 
46
+ interface ElevenLabsConfig {
47
+ baseURL: string;
48
+ apiKey: string;
49
+ voiceId: string;
50
+ voiceSettings?: {
51
+ stability?: number;
52
+ similarity_boost?: number;
53
+ style?: number;
54
+ };
55
+ }
46
56
  declare class ElevenLabsWhisperProvider extends WhisperProvider {
47
57
  private client;
48
- constructor(config: {
49
- apiKey: string;
50
- voiceId: string;
51
- baseURL: string;
52
- });
58
+ private requestSpecs;
59
+ constructor(config: ElevenLabsConfig);
53
60
  speechToText(audio: string): Promise<string>;
54
61
  textToSpeech(text: string): Promise<any>;
55
62
  }
@@ -43,13 +43,20 @@ declare class StabilityProvider extends StableDiffusionProvider {
43
43
  generateImage(query: string): Promise<string>;
44
44
  }
45
45
 
46
+ interface ElevenLabsConfig {
47
+ baseURL: string;
48
+ apiKey: string;
49
+ voiceId: string;
50
+ voiceSettings?: {
51
+ stability?: number;
52
+ similarity_boost?: number;
53
+ style?: number;
54
+ };
55
+ }
46
56
  declare class ElevenLabsWhisperProvider extends WhisperProvider {
47
57
  private client;
48
- constructor(config: {
49
- apiKey: string;
50
- voiceId: string;
51
- baseURL: string;
52
- });
58
+ private requestSpecs;
59
+ constructor(config: ElevenLabsConfig);
53
60
  speechToText(audio: string): Promise<string>;
54
61
  textToSpeech(text: string): Promise<any>;
55
62
  }
@@ -2063,20 +2063,27 @@ var StabilityProvider = class extends StableDiffusionProvider {
2063
2063
  // src/providers/eleven-labs.ts
2064
2064
  var import_elevenlabs = require("elevenlabs");
2065
2065
  var import_axios3 = __toESM(require("axios"));
2066
- var requestSpecs = {
2066
+ var defaultVoiceSettings = {
2067
+ stability: 0.7,
2068
+ similarity_boost: 0.3,
2069
+ style: 0.2
2070
+ };
2071
+ var defaultRequestSpecs = {
2067
2072
  optimize_streaming_latency: import_elevenlabs.ElevenLabs.OptimizeStreamingLatency.Zero,
2068
2073
  output_format: import_elevenlabs.ElevenLabs.OutputFormat.Mp344100128,
2069
- model_id: "eleven_multilingual_v1",
2070
- language: "es",
2071
- voice_settings: {
2072
- stability: 0.1,
2073
- similarity_boost: 0.15,
2074
- style: 0.2
2075
- }
2074
+ model_id: "eleven_multilingual_v2",
2075
+ language: "es"
2076
2076
  };
2077
2077
  var ElevenLabsWhisperProvider = class extends WhisperProvider {
2078
2078
  constructor(config) {
2079
2079
  super(config);
2080
+ this.requestSpecs = {
2081
+ ...defaultRequestSpecs,
2082
+ voice_settings: {
2083
+ ...defaultVoiceSettings,
2084
+ ...config.voiceSettings
2085
+ }
2086
+ };
2080
2087
  this.client = new import_elevenlabs.ElevenLabsClient(config);
2081
2088
  }
2082
2089
  async speechToText(audio) {
@@ -2117,7 +2124,7 @@ var ElevenLabsWhisperProvider = class extends WhisperProvider {
2117
2124
  `/v1/text-to-speech/${this.config.voiceId}`,
2118
2125
  {
2119
2126
  text,
2120
- ...requestSpecs
2127
+ ...this.requestSpecs
2121
2128
  },
2122
2129
  { responseType: "blob" }
2123
2130
  );