garriga 1.0.9 → 1.0.10
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/index.js +36 -5
- package/package.json +1 -1
package/index.js
CHANGED
@@ -214,20 +214,51 @@ class localLLM {
       );

       if (userToken === "modeloLocalOllama") {
-
+        try {
+          // --- DYNAMIC CONTEXT CALCULATION ---
+          // 1. Estimate the prompt's tokens:
+          // In Spanish and in JSON, one token is roughly 2.7 - 3 characters.
+          // We divide by 2.7 to be conservative (estimate on the high side) and avoid cut-offs.
+          const estimatedPromptTokens = Math.ceil(prompt.length / 2.7);
+
+          // 2. Tokens reserved for the response (output):
+          const numPredict = +(process.env.MAX_TOKENS_FRAUD || 2500);
+
+          // 3. Safety buffer (just in case):
+          const buffer = 1000;
+
+          // 4. Calculate the total needed:
+          // 4. Calculate the total needed:
+          let neededCtx = estimatedPromptTokens + numPredict + buffer;
+
+          // --- IMPROVEMENT: BUCKETING (ROUNDING) ---
+          // Round up to the next multiple of 1024 or 2048.
+          // This avoids reloads when the prompt size changes only slightly.
+          const blockSize = 2048;
+          neededCtx = Math.ceil(neededCtx / blockSize) * blockSize;
+
+          // 5. Apply limits (clamping):
+          const maxServerLimit = +(process.env.MAX_CONTEXT_FRAUD || 65536);
+          const minLimit = 4096;
+
+          const finalCtx = Math.min(Math.max(neededCtx, minLimit), maxServerLimit);
+
+          // (Optional) Log for debugging, to see how much it is actually requesting
+          console.log(`[Ollama] Dynamic Context -> Prompt Chars: ${prompt.length}, Calculated: ${neededCtx}, Used: ${finalCtx}`);
+
         const ollamaPayload = {
           prompt,
           model: source,
           stream: false,
           format: "json",
-
           keep_alive: -1,
           options: {
-            num_ctx:
-            temperature: process.env.TEMPERATURE_FRAUD || 0.1,
-            num_predict:
+            num_ctx: finalCtx, // Dynamically calculated value
+            temperature: +(process.env.TEMPERATURE_FRAUD || 0.1),
+            num_predict: numPredict,
           },
         };
+
         const response = await axios.post(this.apiUrlOllama, ollamaPayload, {
           headers: {
             "Content-Type": "application/json",
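To make the sizing arithmetic above easier to follow, here is a standalone sketch that mirrors the same steps: a character-based token estimate, 2048-token bucketing, then clamping between 4096 and the server limit. The estimateContext helper, its default values, and the sample prompt length are illustrative only; they are not part of the garriga package.

// Illustrative sketch only: it mirrors the sizing math added in 1.0.10.
// estimateContext() is a hypothetical helper, not an export of garriga.
function estimateContext(promptLength, {
  numPredict = 2500,      // default of MAX_TOKENS_FRAUD in the diff
  buffer = 1000,          // safety buffer
  blockSize = 2048,       // bucketing granularity
  minLimit = 4096,        // lower clamp
  maxServerLimit = 65536, // default of MAX_CONTEXT_FRAUD in the diff
} = {}) {
  // ~2.7 characters per token for Spanish/JSON text (conservative estimate)
  const estimatedPromptTokens = Math.ceil(promptLength / 2.7);
  let neededCtx = estimatedPromptTokens + numPredict + buffer;
  // Round up to the next multiple of blockSize (bucketing)
  neededCtx = Math.ceil(neededCtx / blockSize) * blockSize;
  // Clamp between the minimum and the server limit
  return Math.min(Math.max(neededCtx, minLimit), maxServerLimit);
}

// Worked example: a 27,000-character prompt.
// ceil(27000 / 2.7) = 10000 tokens; 10000 + 2500 + 1000 = 13500;
// rounded up to the next 2048 multiple = 14336; already within [4096, 65536].
console.log(estimateContext(27000)); // 14336

Because the payload keeps keep_alive: -1, the bucketing step is what makes the dynamic num_ctx practical: prompts whose sizes differ only slightly land in the same bucket, so the loaded model does not have to be reloaded on every request, as the diff's own comments note.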