PyPI - lemonade-sdk - Versions diffs - 8.0.3__py3-none-any.whl → 8.0.5__py3-none-any.whl - Mend

lemonade-sdk 8.0.3__py3-none-any.whl → 8.0.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of lemonade-sdk might be problematic. Click here for more details.

Files changed (27) hide show

lemonade/api.py +50 -0
lemonade/common/inference_engines.py +415 -0
lemonade/common/system_info.py +493 -47
lemonade/tools/humaneval.py +1 -1
lemonade/tools/management_tools.py +53 -7
lemonade/tools/mmlu.py +1 -1
lemonade/tools/oga/load.py +1 -1
lemonade/tools/perplexity.py +2 -2
lemonade/tools/quark/quark_load.py +1 -1
lemonade/tools/quark/quark_quantize.py +2 -2
lemonade/tools/server/llamacpp.py +130 -9
lemonade/tools/server/serve.py +102 -0
lemonade/tools/server/static/styles.css +458 -55
lemonade/tools/server/static/webapp.html +322 -35
lemonade/version.py +1 -1
lemonade_sdk-8.0.5.dist-info/METADATA +295 -0
{lemonade_sdk-8.0.3.dist-info → lemonade_sdk-8.0.5.dist-info}/RECORD +26 -25
lemonade_server/cli.py +168 -22
lemonade_server/model_manager.py +12 -2
lemonade_server/pydantic_models.py +25 -1
lemonade_server/server_models.json +46 -44
lemonade_sdk-8.0.3.dist-info/METADATA +0 -183
{lemonade_sdk-8.0.3.dist-info → lemonade_sdk-8.0.5.dist-info}/WHEEL +0 -0
{lemonade_sdk-8.0.3.dist-info → lemonade_sdk-8.0.5.dist-info}/entry_points.txt +0 -0
{lemonade_sdk-8.0.3.dist-info → lemonade_sdk-8.0.5.dist-info}/licenses/LICENSE +0 -0
{lemonade_sdk-8.0.3.dist-info → lemonade_sdk-8.0.5.dist-info}/licenses/NOTICE.md +0 -0
{lemonade_sdk-8.0.3.dist-info → lemonade_sdk-8.0.5.dist-info}/top_level.txt +0 -0

lemonade/tools/server/static/webapp.html CHANGED Viewed

@@ -33,7 +33,47 @@
                         <input type="text" id="chat-input" placeholder="Type your message..." />
                         <button id="send-btn">Send</button>
                     </div>
-                </div>
+                </div>
+                <!-- App Suggestions Section: links to apps that can be used with Lemonade.
+                     Every link opens in a new tab, so rel="noopener noreferrer" is set to keep
+                     the opened page from getting a window.opener handle back to this page. -->
+                <div class="app-suggestions-section">
+                    <div class="suggestion-text">
+                        Use Lemonade with your favorite app
+                    </div>
+                    <div class="app-logos-grid">
+                        <a href="https://lemonade-server.ai/docs/server/apps/open-webui/" target="_blank" rel="noopener noreferrer" class="app-logo-item" title="Open WebUI">
+                            <img src="https://raw.githubusercontent.com/lemonade-sdk/assets/refs/heads/main/partner_logos/openwebui.jpg" alt="Open WebUI" class="app-logo-img">
+                            <span class="app-name">Open WebUI</span>
+                        </a>
+                        <a href="https://lemonade-server.ai/docs/server/apps/continue/" target="_blank" rel="noopener noreferrer" class="app-logo-item" title="Continue">
+                            <img src="https://raw.githubusercontent.com/lemonade-sdk/assets/refs/heads/main/partner_logos/continue_dev.png" alt="Continue" class="app-logo-img">
+                            <span class="app-name">Continue</span>
+                        </a>
+                        <a href="https://github.com/amd/gaia" target="_blank" rel="noopener noreferrer" class="app-logo-item" title="Gaia">
+                            <img src="https://raw.githubusercontent.com/lemonade-sdk/assets/refs/heads/main/partner_logos/gaia.ico" alt="Gaia" class="app-logo-img">
+                            <span class="app-name">Gaia</span>
+                        </a>
+                        <a href="https://lemonade-server.ai/docs/server/apps/anythingLLM/" target="_blank" rel="noopener noreferrer" class="app-logo-item" title="AnythingLLM">
+                            <img src="https://raw.githubusercontent.com/lemonade-sdk/assets/refs/heads/main/partner_logos/anything_llm.png" alt="AnythingLLM" class="app-logo-img">
+                            <span class="app-name">AnythingLLM</span>
+                        </a>
+                        <a href="https://lemonade-server.ai/docs/server/apps/ai-dev-gallery/" target="_blank" rel="noopener noreferrer" class="app-logo-item" title="AI Dev Gallery">
+                            <img src="https://raw.githubusercontent.com/lemonade-sdk/assets/refs/heads/main/partner_logos/ai_dev_gallery.webp" alt="AI Dev Gallery" class="app-logo-img">
+                            <span class="app-name">AI Dev Gallery</span>
+                        </a>
+                        <a href="https://lemonade-server.ai/docs/server/apps/lm-eval/" target="_blank" rel="noopener noreferrer" class="app-logo-item" title="LM-Eval">
+                            <img src="https://raw.githubusercontent.com/lemonade-sdk/assets/refs/heads/main/partner_logos/lm_eval.png" alt="LM-Eval" class="app-logo-img">
+                            <span class="app-name">LM-Eval</span>
+                        </a>
+                        <a href="https://lemonade-server.ai/docs/server/apps/codeGPT/" target="_blank" rel="noopener noreferrer" class="app-logo-item" title="CodeGPT">
+                            <img src="https://raw.githubusercontent.com/lemonade-sdk/assets/refs/heads/main/partner_logos/codegpt.jpg" alt="CodeGPT" class="app-logo-img">
+                            <span class="app-name">CodeGPT</span>
+                        </a>
+                        <a href="https://github.com/lemonade-sdk/lemonade/blob/main/docs/server/apps/ai-toolkit.md" target="_blank" rel="noopener noreferrer" class="app-logo-item" title="AI Toolkit">
+                            <img src="https://raw.githubusercontent.com/lemonade-sdk/assets/refs/heads/main/partner_logos/ai_toolkit.png" alt="AI Toolkit" class="app-logo-img">
+                            <span class="app-name">AI Toolkit</span>
+                        </a>
+                    </div>
+                </div>
             </div>
             <div class="tab-content" id="content-models">                <div class="model-mgmt-register-form collapsed">                    <h3 class="model-mgmt-form-title" onclick="toggleAddModelForm()">
                         Add a Model
@@ -109,7 +149,66 @@
         <div class="copyright">Copyright 2025 AMD</div>
     </footer>
     <script src="https://cdn.jsdelivr.net/npm/openai@4.21.0/dist/openai.min.js"></script>
-    <script>    // Tab switching logic
+    <script src="https://cdn.jsdelivr.net/npm/marked@9.1.0/marked.min.js"></script>
+    <!-- The polyfill.io domain changed ownership in 2024 and was observed serving malicious
+         code; load the same polyfill bundle from the Cloudflare-hosted mirror instead. -->
+    <script src="https://cdnjs.cloudflare.com/polyfill/v3/polyfill.min.js?features=es6"></script>
+    <script>
+    // Configure MathJax. This object must exist before the MathJax loader script
+    // below executes, because MathJax reads window.MathJax once at startup.
+    window.MathJax = {
+        tex: {
+            // Accept both \( ... \) and $ ... $ for inline math
+            inlineMath: [['\\(', '\\)'], ['$', '$']],
+            // Accept both \[ ... \] and $$ ... $$ for display math
+            displayMath: [['\\[', '\\]'], ['$$', '$$']],
+            processEscapes: true,
+            processEnvironments: true
+        },
+        options: {
+            // Never typeset inside these elements
+            skipHtmlTags: ['script', 'noscript', 'style', 'textarea', 'pre']
+        }
+    };
+    </script>
+    <script id="MathJax-script" async src="https://cdn.jsdelivr.net/npm/mathjax@3/es5/tex-mml-chtml.js"></script>
+    <script>
+    // Configure marked.js for safe HTML rendering
+    marked.setOptions({
+        breaks: true,
+        gfm: true,
+        sanitize: false,
+        smartLists: true,
+        smartypants: true
+    });
+    // Function to unescape JSON strings
+    function unescapeJsonString(str) {
+        try {
+            return str.replace(/\\n/g, '\n')
+                     .replace(/\\t/g, '\t')
+                     .replace(/\\r/g, '\r')
+                     .replace(/\\"/g, '"')
+                     .replace(/\\\\/g, '\\');
+        } catch (error) {
+            console.error('Error unescaping string:', error);
+            return str;
+        }
+    }
+    // Function to safely render markdown with MathJax support
+    function renderMarkdown(text) {
+        try {
+            const html = marked.parse(text);
+            // Trigger MathJax to process the new content
+            if (window.MathJax && window.MathJax.typesetPromise) {
+                // Use a timeout to ensure DOM is updated before typesetting
+                setTimeout(() => {
+                    window.MathJax.typesetPromise();
+                }, 0);
+            }
+            return html;
+        } catch (error) {
+            console.error('Error rendering markdown:', error);
+            return text; // fallback to plain text
+        }
+    }
+    // Tab switching logic
     function showTab(tab, updateHash = true) {
         document.getElementById('tab-chat').classList.remove('active');
         document.getElementById('tab-models').classList.remove('active');
@@ -163,6 +262,44 @@
         form.classList.toggle('collapsed');
     }
+    // Handle image load failures for app logos
+    function handleImageFailure(img) {
+        const logoItem = img.closest('.app-logo-item');
+        if (logoItem) {
+            logoItem.classList.add('image-failed');
+        }
+    }
+    // Set up image error handlers when DOM is loaded
+    document.addEventListener('DOMContentLoaded', function() {
+        const logoImages = document.querySelectorAll('.app-logo-img');
+        logoImages.forEach(function(img) {
+            let imageLoaded = false;
+            img.addEventListener('load', function() {
+                imageLoaded = true;
+            });
+            img.addEventListener('error', function() {
+                if (!imageLoaded) {
+                    handleImageFailure(this);
+                }
+            });
+            // Also check if image is already broken (cached failure)
+            if (img.complete && img.naturalWidth === 0) {
+                handleImageFailure(img);
+            }
+            // Timeout fallback for slow connections (5 seconds)
+            setTimeout(function() {
+                if (!imageLoaded && !img.complete) {
+                    handleImageFailure(img);
+                }
+            }, 5000);
+        });
+    });
     // Helper to get server base URL
     function getServerBaseUrl() {
         const port = window.SERVER_PORT || 8000;
@@ -184,18 +321,59 @@
                 select.innerHTML = '<option>No models available</option>';
                 return;
             }
+            // Filter out embedding models from chat interface
+            const allModels = window.SERVER_MODELS || {};
+            let filteredModels = [];
             let defaultIndex = 0;
+            // Check if model is specified in URL parameters
+            const urlModel = new URLSearchParams(window.location.search).get('model');
+            let urlModelIndex = -1;
             data.data.forEach(function(model, index) {
                 const modelId = model.id || model.name || model;
+                const modelInfo = allModels[modelId] || {};
+                const labels = modelInfo.labels || [];
+                // Skip models with "embeddings" or "reranking" label
+                if (labels.includes('embeddings') || labels.includes('reranking')) {
+                    return;
+                }
+                filteredModels.push(modelId);
                 const opt = document.createElement('option');
                 opt.value = modelId;
                 opt.textContent = modelId;
+                // Check if this model matches the URL parameter
+                if (urlModel && modelId === urlModel) {
+                    urlModelIndex = filteredModels.length - 1;
+                }
+                // Default fallback for backwards compatibility
                 if (modelId === 'Llama-3.2-1B-Instruct-Hybrid') {
-                    defaultIndex = index;
+                    defaultIndex = filteredModels.length - 1;
                 }
                 select.appendChild(opt);
             });
-            select.selectedIndex = defaultIndex;
+            if (filteredModels.length === 0) {
+                select.innerHTML = '<option>No chat models available</option>';
+                return;
+            }
+            // Select the URL-specified model if found, otherwise use default
+            if (urlModelIndex !== -1) {
+                select.selectedIndex = urlModelIndex;
+                console.log(`Selected model from URL parameter: ${urlModel}`);
+            } else {
+                select.selectedIndex = defaultIndex;
+                if (urlModel) {
+                    console.warn(`Model '${urlModel}' specified in URL not found in available models`);
+                }
+            }
         } catch (e) {
             const select = document.getElementById('model-select');
             select.innerHTML = `<option>Error loading models: ${e.message}</option>`;
@@ -217,26 +395,24 @@
         // Add labels if they exist
         const modelData = allModels[modelId];
-        if (modelData) {
-            // Add reasoning label if reasoning is true
-            if (modelData.reasoning === true) {
-                const reasoningLabel = document.createElement('span');
-                reasoningLabel.className = 'model-label reasoning';
-                reasoningLabel.textContent = 'reasoning';
-                container.appendChild(reasoningLabel);
-            }
-            // Add other labels if they exist
-            if (modelData.labels && Array.isArray(modelData.labels)) {
-                modelData.labels.forEach(label => {
-                    const labelSpan = document.createElement('span');
-                    const labelLower = label.toLowerCase();
-                    const labelClass = (labelLower === 'vision') ? 'vision' : 'other';
-                    labelSpan.className = `model-label ${labelClass}`;
-                    labelSpan.textContent = label;
-                    container.appendChild(labelSpan);
-                });
-            }
+        if (modelData && modelData.labels && Array.isArray(modelData.labels)) {
+            modelData.labels.forEach(label => {
+                const labelSpan = document.createElement('span');
+                const labelLower = label.toLowerCase();
+                let labelClass = 'other';
+                if (labelLower === 'vision') {
+                    labelClass = 'vision';
+                } else if (labelLower === 'embeddings') {
+                    labelClass = 'embeddings';
+                } else if (labelLower === 'reasoning') {
+                    labelClass = 'reasoning';
+                } else if (labelLower === 'reranking') {
+                    labelClass = 'reranking';
+                }
+                labelSpan.className = `model-label ${labelClass}`;
+                labelSpan.textContent = label;
+                container.appendChild(labelSpan);
+            });
         }
         return container;
@@ -358,16 +534,110 @@
     const modelSelect = document.getElementById('model-select');
     let messages = [];
-    function appendMessage(role, text) {
+    function appendMessage(role, text, isMarkdown = false) {
         const div = document.createElement('div');
         div.className = 'chat-message ' + role;
         // Add a bubble for iMessage style
         const bubble = document.createElement('div');
         bubble.className = 'chat-bubble ' + role;
-        bubble.innerHTML = text;
+        if (role === 'llm' && isMarkdown) {
+            bubble.innerHTML = renderMarkdownWithThinkTokens(text);
+        } else {
+            bubble.textContent = text;
+        }
         div.appendChild(bubble);
         chatHistory.appendChild(div);
         chatHistory.scrollTop = chatHistory.scrollHeight;
+        return bubble; // Return the bubble element for streaming updates
+    }
+    function updateMessageContent(bubbleElement, text, isMarkdown = false) {
+        if (isMarkdown) {
+            bubbleElement.innerHTML = renderMarkdownWithThinkTokens(text);
+        } else {
+            bubbleElement.textContent = text;
+        }
+    }
+    function renderMarkdownWithThinkTokens(text) {
+        // Check if text contains opening think tag
+        if (text.includes('<think>')) {
+            if (text.includes('</think>')) {
+                // Complete think block - handle as before
+                const thinkMatch = text.match(/<think>(.*?)<\/think>/s);
+                if (thinkMatch) {
+                    const thinkContent = thinkMatch[1].trim();
+                    const mainResponse = text.replace(/<think>.*?<\/think>/s, '').trim();
+                    // Create collapsible structure
+                    let html = '';
+                    if (thinkContent) {
+                        html += `
+                            <div class="think-tokens-container">
+                                <div class="think-tokens-header" onclick="toggleThinkTokens(this)">
+                                    <span class="think-tokens-chevron">▼</span>
+                                    <span class="think-tokens-label">Thinking...</span>
+                                </div>
+                                <div class="think-tokens-content">
+                                    ${renderMarkdown(thinkContent)}
+                                </div>
+                            </div>
+                        `;
+                    }
+                    if (mainResponse) {
+                        html += `<div class="main-response">${renderMarkdown(mainResponse)}</div>`;
+                    }
+                    return html;
+                }
+            } else {
+                // Partial think block - only opening tag found, still being generated
+                const thinkMatch = text.match(/<think>(.*)/s);
+                if (thinkMatch) {
+                    const thinkContent = thinkMatch[1];
+                    const beforeThink = text.substring(0, text.indexOf('<think>'));
+                    let html = '';
+                    if (beforeThink.trim()) {
+                        html += `<div class="main-response">${renderMarkdown(beforeThink)}</div>`;
+                    }
+                    html += `
+                        <div class="think-tokens-container">
+                            <div class="think-tokens-header" onclick="toggleThinkTokens(this)">
+                                <span class="think-tokens-chevron">▼</span>
+                                <span class="think-tokens-label">Thinking...</span>
+                            </div>
+                            <div class="think-tokens-content">
+                                ${renderMarkdown(thinkContent)}
+                            </div>
+                        </div>
+                    `;
+                    return html;
+                }
+            }
+        }
+        // Fallback to normal markdown rendering
+        return renderMarkdown(text);
+    }
+    function toggleThinkTokens(header) {
+        const container = header.parentElement;
+        const content = container.querySelector('.think-tokens-content');
+        const chevron = header.querySelector('.think-tokens-chevron');
+        if (content.style.display === 'none') {
+            content.style.display = 'block';
+            chevron.textContent = '▼';
+            container.classList.remove('collapsed');
+        } else {
+            content.style.display = 'none';
+            chevron.textContent = '▶';
+            container.classList.add('collapsed');
+        }
     }
     async function sendMessage() {
@@ -379,8 +649,7 @@
         sendBtn.disabled = true;
         // Streaming OpenAI completions (placeholder, adapt as needed)
         let llmText = '';
-        appendMessage('llm', '...');
-        const llmDiv = chatHistory.lastChild.querySelector('.chat-bubble.llm');
+        const llmBubble = appendMessage('llm', '...');
         try {
             // Use the correct endpoint for chat completions
             const resp = await fetch(getServerBaseUrl() + '/api/v1/chat/completions', {
@@ -395,22 +664,40 @@
             if (!resp.body) throw new Error('No stream');
             const reader = resp.body.getReader();
             let decoder = new TextDecoder();
-            llmDiv.textContent = '';
+            llmBubble.textContent = '';
             while (true) {
                 const { done, value } = await reader.read();
                 if (done) break;
                 const chunk = decoder.decode(value);
                 if (chunk.trim() === 'data: [DONE]' || chunk.trim() === '[DONE]') continue;
-                // Try to extract the content from the OpenAI chunk
-                const match = chunk.match(/"content"\s*:\s*"([^"]*)"/);
-                if (match && match[1]) {
-                    llmText += match[1];
-                    llmDiv.textContent = llmText;
+                // Handle Server-Sent Events format
+                const lines = chunk.split('\n');
+                for (const line of lines) {
+                    if (line.startsWith('data: ')) {
+                        const jsonStr = line.substring(6).trim();
+                        if (jsonStr === '[DONE]') continue;
+                        try {
+                            const parsed = JSON.parse(jsonStr);
+                            if (parsed.choices && parsed.choices[0] && parsed.choices[0].delta && parsed.choices[0].delta.content) {
+                                llmText += parsed.choices[0].delta.content;
+                                updateMessageContent(llmBubble, llmText, true);
+                            }
+                        } catch (e) {
+                            // Fallback to regex parsing if JSON parsing fails
+                            const match = jsonStr.match(/"content"\s*:\s*"((?:\\.|[^"\\])*)"/);
+                            if (match && match[1]) {
+                                llmText += unescapeJsonString(match[1]);
+                                updateMessageContent(llmBubble, llmText, true);
+                            }
+                        }
+                    }
                 }
             }
             messages.push({ role: 'assistant', content: llmText });
         } catch (e) {
-            llmDiv.textContent = '[Error: ' + e.message + ']';
+            llmBubble.textContent = '[Error: ' + e.message + ']';
         }
         sendBtn.disabled = false;
     }

lemonade/version.py CHANGED Viewed

	@@ -1 +1 @@
1	- __version__ = "8.0.3"
1	+ __version__ = "8.0.5"

lemonade-sdk 8.0.3__py3-none-any.whl → 8.0.5__py3-none-any.whl

Potentially problematic release.

lemonade-sdk 8.0.3__py3-none-any.whl → 8.0.5__py3-none-any.whl