lemonade-sdk 9.1.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (84) hide show
  1. lemonade/__init__.py +5 -0
  2. lemonade/api.py +180 -0
  3. lemonade/cache.py +92 -0
  4. lemonade/cli.py +173 -0
  5. lemonade/common/__init__.py +0 -0
  6. lemonade/common/build.py +176 -0
  7. lemonade/common/cli_helpers.py +139 -0
  8. lemonade/common/exceptions.py +98 -0
  9. lemonade/common/filesystem.py +368 -0
  10. lemonade/common/inference_engines.py +408 -0
  11. lemonade/common/network.py +93 -0
  12. lemonade/common/printing.py +110 -0
  13. lemonade/common/status.py +471 -0
  14. lemonade/common/system_info.py +1411 -0
  15. lemonade/common/test_helpers.py +28 -0
  16. lemonade/profilers/__init__.py +1 -0
  17. lemonade/profilers/agt_power.py +437 -0
  18. lemonade/profilers/hwinfo_power.py +429 -0
  19. lemonade/profilers/memory_tracker.py +259 -0
  20. lemonade/profilers/profiler.py +58 -0
  21. lemonade/sequence.py +363 -0
  22. lemonade/state.py +159 -0
  23. lemonade/tools/__init__.py +1 -0
  24. lemonade/tools/accuracy.py +432 -0
  25. lemonade/tools/adapter.py +114 -0
  26. lemonade/tools/bench.py +302 -0
  27. lemonade/tools/flm/__init__.py +1 -0
  28. lemonade/tools/flm/utils.py +305 -0
  29. lemonade/tools/huggingface/bench.py +187 -0
  30. lemonade/tools/huggingface/load.py +235 -0
  31. lemonade/tools/huggingface/utils.py +359 -0
  32. lemonade/tools/humaneval.py +264 -0
  33. lemonade/tools/llamacpp/bench.py +255 -0
  34. lemonade/tools/llamacpp/load.py +222 -0
  35. lemonade/tools/llamacpp/utils.py +1260 -0
  36. lemonade/tools/management_tools.py +319 -0
  37. lemonade/tools/mmlu.py +319 -0
  38. lemonade/tools/oga/__init__.py +0 -0
  39. lemonade/tools/oga/bench.py +120 -0
  40. lemonade/tools/oga/load.py +804 -0
  41. lemonade/tools/oga/migration.py +403 -0
  42. lemonade/tools/oga/utils.py +462 -0
  43. lemonade/tools/perplexity.py +147 -0
  44. lemonade/tools/prompt.py +263 -0
  45. lemonade/tools/report/__init__.py +0 -0
  46. lemonade/tools/report/llm_report.py +203 -0
  47. lemonade/tools/report/table.py +899 -0
  48. lemonade/tools/server/__init__.py +0 -0
  49. lemonade/tools/server/flm.py +133 -0
  50. lemonade/tools/server/llamacpp.py +320 -0
  51. lemonade/tools/server/serve.py +2123 -0
  52. lemonade/tools/server/static/favicon.ico +0 -0
  53. lemonade/tools/server/static/index.html +279 -0
  54. lemonade/tools/server/static/js/chat.js +1059 -0
  55. lemonade/tools/server/static/js/model-settings.js +183 -0
  56. lemonade/tools/server/static/js/models.js +1395 -0
  57. lemonade/tools/server/static/js/shared.js +556 -0
  58. lemonade/tools/server/static/logs.html +191 -0
  59. lemonade/tools/server/static/styles.css +2654 -0
  60. lemonade/tools/server/static/webapp.html +321 -0
  61. lemonade/tools/server/tool_calls.py +153 -0
  62. lemonade/tools/server/tray.py +664 -0
  63. lemonade/tools/server/utils/macos_tray.py +226 -0
  64. lemonade/tools/server/utils/port.py +77 -0
  65. lemonade/tools/server/utils/thread.py +85 -0
  66. lemonade/tools/server/utils/windows_tray.py +408 -0
  67. lemonade/tools/server/webapp.py +34 -0
  68. lemonade/tools/server/wrapped_server.py +559 -0
  69. lemonade/tools/tool.py +374 -0
  70. lemonade/version.py +1 -0
  71. lemonade_install/__init__.py +1 -0
  72. lemonade_install/install.py +239 -0
  73. lemonade_sdk-9.1.1.dist-info/METADATA +276 -0
  74. lemonade_sdk-9.1.1.dist-info/RECORD +84 -0
  75. lemonade_sdk-9.1.1.dist-info/WHEEL +5 -0
  76. lemonade_sdk-9.1.1.dist-info/entry_points.txt +5 -0
  77. lemonade_sdk-9.1.1.dist-info/licenses/LICENSE +201 -0
  78. lemonade_sdk-9.1.1.dist-info/licenses/NOTICE.md +47 -0
  79. lemonade_sdk-9.1.1.dist-info/top_level.txt +3 -0
  80. lemonade_server/cli.py +805 -0
  81. lemonade_server/model_manager.py +758 -0
  82. lemonade_server/pydantic_models.py +159 -0
  83. lemonade_server/server_models.json +643 -0
  84. lemonade_server/settings.py +39 -0
@@ -0,0 +1,1059 @@
1
// Chat logic and functionality

// Conversation transcript (user/assistant turns) sent with each request.
let messages = [];
// Image File objects staged for the next outgoing message.
let attachedFiles = [];
// The onboarding/system bubble currently shown, if any (see displaySystemMessage).
let systemMessageElement = null;
// AbortController for the in-flight streaming request; null when idle.
let abortController = null;

// Milliseconds between frames of the "Thinking..." header animation.
const THINKING_ANIM_INTERVAL_MS = 550;
// Toggle this to false if you prefer plain dots only.
const THINKING_USE_LEMON = true;
// Label frames cycled by startThinkingAnimation while reasoning streams.
const THINKING_FRAMES = THINKING_USE_LEMON
    ? ['Thinking.','Thinking..','Thinking...','Thinking 🍋']
    : ['Thinking.','Thinking..','Thinking...'];

// Get DOM elements (assigned once on DOMContentLoaded, below)
let chatHistory, chatInput, attachmentBtn, fileAttachment, attachmentsPreviewContainer, attachmentsPreviewRow, modelSelect, toggleBtn;
// Track if a stream is currently active (separate from abortController existing briefly before validation)
let isStreaming = false;
// When the user scrolls up in the chat history, disable automatic scrolling until they scroll back to the bottom.
let autoscrollEnabled = true;
// Distance (px) from the bottom still considered "at the bottom".
const AUTOSCROLL_TOLERANCE_PX = 10;
21
+
22
// Initialize chat functionality when DOM is loaded
document.addEventListener('DOMContentLoaded', function() {
    // Cache the DOM elements the rest of this module operates on.
    chatHistory = document.getElementById('chat-history');
    chatInput = document.getElementById('chat-input');
    toggleBtn = document.getElementById('toggle-btn');
    attachmentBtn = document.getElementById('attachment-btn');
    fileAttachment = document.getElementById('file-attachment');
    attachmentsPreviewContainer = document.getElementById('attachments-preview-container');
    attachmentsPreviewRow = document.getElementById('attachments-preview-row');
    modelSelect = document.getElementById('model-select');

    // Set up event listeners
    setupChatEventListeners();

    // Pause autoscroll when user scrolls up in the chat history. If they scroll back to bottom, resume.
    if (chatHistory) {
        chatHistory.addEventListener('scroll', function () {
            try {
                // Treat "within AUTOSCROLL_TOLERANCE_PX of the bottom" as at-bottom
                // so sub-pixel rounding doesn't flicker the paused state.
                const atBottom = chatHistory.scrollTop + chatHistory.clientHeight >= chatHistory.scrollHeight - AUTOSCROLL_TOLERANCE_PX;
                if (atBottom) {
                    if (!autoscrollEnabled) {
                        autoscrollEnabled = true;
                        chatHistory.classList.remove('autoscroll-paused');
                    }
                } else {
                    if (autoscrollEnabled) {
                        autoscrollEnabled = false;
                        chatHistory.classList.add('autoscroll-paused');
                    }
                }
            } catch (_) {}
        });
    }

    // Initialize model dropdown (will be populated when models.js calls updateModelStatusIndicator)
    initializeModelDropdown();

    // Update attachment button state periodically
    updateAttachmentButtonState();
    setInterval(updateAttachmentButtonState, 1000);

    // Display initial system message
    displaySystemMessage();
});
66
+
67
// Wire up all chat-related UI event handlers. Called once on DOMContentLoaded.
function setupChatEventListeners() {
    // Toggle button click – send or stop streaming.
    // A live abortController means a request is in flight, so the button
    // currently acts as "Stop"; otherwise it acts as "Send".
    toggleBtn.onclick = function () {
        if (abortController) {
            abortCurrentRequest();
        } else {
            sendMessage();
        }
    };

    // Send on Enter, clear attachments on Escape
    if (chatInput) {
        chatInput.addEventListener('keydown', handleChatInputKeydown);
        chatInput.addEventListener('paste', handleChatInputPaste);
    }

    // Open file picker and handle image selection
    if (attachmentBtn && fileAttachment) {
        attachmentBtn.addEventListener('click', function () {
            // Let the selection handler validate vision capability, etc.
            fileAttachment.click();
        });
        fileAttachment.addEventListener('change', handleFileSelection);
    }

    // React to model selection changes
    if (modelSelect) {
        modelSelect.addEventListener('change', handleModelSelectChange);
    }
}
97
+
98
// Initialize model dropdown with available models.
//
// Reads window.SERVER_MODELS (all known models) and window.installedModels
// (a Set of installed model ids, maintained by models.js) and rebuilds the
// <select> options with installed models only. Keeps the "server-offline"
// placeholder selected when the status indicator reports the server offline.
function initializeModelDropdown() {
    const allModels = window.SERVER_MODELS || {};

    // Clear existing options except the first one.
    // Guarded with ?. so a missing status-indicator element doesn't throw.
    const indicator = document.getElementById('model-status-indicator');
    if (indicator?.classList.contains('offline') || modelSelect.value === 'server-offline') {
        modelSelect.value = 'server-offline';
    } else {
        modelSelect.innerHTML = '<option value="">Click to select a model ▼</option>';
    }
    // Add only installed models to dropdown
    Object.keys(allModels).forEach(modelId => {
        // Only add if the model is installed
        if (window.installedModels && window.installedModels.has(modelId)) {
            const option = document.createElement('option');
            option.value = modelId;
            option.textContent = modelId;
            modelSelect.appendChild(option);
        }
    });

    // Set current selection based on loaded model
    updateModelSelectValue();
}

// Make dropdown initialization accessible globally so models.js can refresh it
window.initializeModelDropdown = initializeModelDropdown;
126
+
127
// Sync the model <select> with the currently loaded model.
//
// While a load is in progress (indicator carries the 'loading' class) the
// hidden 'loading-model' option is selected; otherwise the loaded model id
// itself is. With no model loaded, the 'server-offline' placeholder is kept
// only when it is already active; any other selection is left untouched.
function updateModelSelectValue() {
    const indicator = document.getElementById('model-status-indicator');
    if (currentLoadedModel) {
        const stillLoading = indicator.classList.contains('loading');
        modelSelect.value = stillLoading ? 'loading-model' : currentLoadedModel;
    } else if (indicator.classList.contains('offline') && modelSelect.value === 'server-offline') {
        modelSelect.value = 'server-offline';
    }
}

// Make updateModelSelectValue accessible globally
window.updateModelSelectValue = updateModelSelectValue;
143
+
144
// Handle model selection change.
//
// Loads the newly selected model via loadModelStandardized (models.js),
// swapping the dropdown to a single hidden "Loading <model>..." option while
// the load is in flight and refreshing button/indicator state afterwards.
async function handleModelSelectChange() {
    const selectedModel = modelSelect.value;

    if (!selectedModel) return; // "Click to select a model ▼" selected
    if (selectedModel === currentLoadedModel) return; // Same model already loaded

    // Use the standardized load function
    await loadModelStandardized(selectedModel, {
        onLoadingStart: (modelId) => {
            // Replace all options with one hidden "loading" placeholder so the
            // dropdown shows progress. Uses the cached `modelSelect` instead of
            // re-querying the DOM; the original also dead-checked the freshly
            // created option (always truthy) — removed.
            modelSelect.innerHTML = '';
            const loadingOption = document.createElement('option');
            loadingOption.value = 'loading-model';
            loadingOption.textContent = `Loading ${modelId}...`;
            loadingOption.hidden = true;
            modelSelect.appendChild(loadingOption);
            // Gray out send button during loading
            updateAttachmentButtonState();
        },
        onLoadingEnd: (modelId, success) => {
            // Reset the default option text
            const defaultOption = modelSelect.querySelector('option[value=""]');
            if (defaultOption) defaultOption.textContent = 'Click to select a model ▼';
            // Update button state after loading completes
            updateAttachmentButtonState();
        },
        onSuccess: () => {
            updateAttachmentButtonState();
        },
        onError: () => {
            // Revert the dropdown to whatever is actually loaded.
            updateModelSelectValue();
            updateAttachmentButtonState();
        }
    });
}
184
+
185
// Refresh dropdown selection, Send/Stop button, and attachment button to
// reflect current model / loading / streaming state. Runs on a 1s interval
// and after every state change, so it must stay cheap and idempotent.
function updateAttachmentButtonState() {
    // Update model dropdown selection
    updateModelSelectValue();

    // Update send button state based on model loading
    if (toggleBtn) {
        const loading = !!(modelSelect && modelSelect.disabled);
        if (isStreaming) {
            // While streaming, the button is an always-enabled Stop control.
            toggleBtn.disabled = false;
            toggleBtn.textContent = 'Stop';
        } else {
            // Gray out send button if no model is loaded or if loading
            toggleBtn.disabled = loading || !currentLoadedModel;
            toggleBtn.textContent = 'Send';
        }
    }

    // Guarded like toggleBtn above: the original dereferenced attachmentBtn
    // unconditionally and would throw if the element were absent.
    if (attachmentBtn) {
        if (!currentLoadedModel) {
            attachmentBtn.style.opacity = '0.5';
            attachmentBtn.style.cursor = 'not-allowed';
            attachmentBtn.title = 'Load a model first';
        } else if (isVisionModel(currentLoadedModel)) {
            attachmentBtn.style.opacity = '1';
            attachmentBtn.style.cursor = 'pointer';
            attachmentBtn.title = 'Attach images';
        } else {
            attachmentBtn.style.opacity = '0.5';
            attachmentBtn.style.cursor = 'not-allowed';
            attachmentBtn.title = 'Image attachments not supported by this model';
        }
    }

    // Update system message when model state changes
    displaySystemMessage();
}

// Make updateAttachmentButtonState accessible globally
window.updateAttachmentButtonState = updateAttachmentButtonState;

// Make displaySystemMessage accessible globally
window.displaySystemMessage = displaySystemMessage;
230
+
231
// If images are staged but the current model lacks vision support, offer to
// drop them; then refresh all model-dependent UI state.
function checkCurrentModel() {
    const hasAttachments = attachedFiles.length > 0;
    const modelLacksVision = currentLoadedModel && !isVisionModel(currentLoadedModel);
    if (hasAttachments && modelLacksVision) {
        const shouldClear = confirm(`The current model "${currentLoadedModel}" does not support images. Would you like to remove the attached images?`);
        if (shouldClear) {
            clearAttachments();
        }
    }
    updateAttachmentButtonState();
}
240
+
241
// Validate and stage files chosen through the hidden file input.
// Rejects the whole selection when no model is loaded or the model lacks
// vision support, drops non-image files with a warning, and refreshes the
// preview strip for whatever survives the filter.
function handleFileSelection() {
    if (fileAttachment.files.length === 0) return;

    // A model must be loaded, and it must support vision.
    if (!currentLoadedModel) {
        alert('Please load a model first before attaching images.');
        fileAttachment.value = '';
        return;
    }
    if (!isVisionModel(currentLoadedModel)) {
        alert(`The current model "${currentLoadedModel}" does not support image inputs. Please load a model with "Vision" capabilities.`);
        fileAttachment.value = '';
        return;
    }

    // Keep image/* files only, warning about each skipped file.
    const selected = Array.from(fileAttachment.files);
    const imageFiles = selected.filter((file) => {
        const isImage = file.type.startsWith('image/');
        if (!isImage) {
            console.warn(`Skipping non-image file: ${file.name} (${file.type})`);
        }
        return isImage;
    });

    if (imageFiles.length === 0) {
        alert('Please select only image files (PNG, JPG, GIF, etc.)');
        fileAttachment.value = '';
        return;
    }

    if (imageFiles.length !== selected.length) {
        alert(`${selected.length - imageFiles.length} non-image file(s) were skipped. Only image files are supported.`);
    }

    attachedFiles = imageFiles;
    updateInputPlaceholder();
    updateAttachmentPreviewVisibility();
    updateAttachmentPreviews();
}
281
+
282
// Keyboard shortcuts for the chat input: Escape clears staged attachments,
// Enter (without Shift) sends the message when a model is ready.
function handleChatInputKeydown(e) {
    if (e.key === 'Escape' && attachedFiles.length > 0) {
        e.preventDefault();
        clearAttachments();
        return;
    }
    if (e.key !== 'Enter' || e.shiftKey) {
        return;
    }
    e.preventDefault();
    // Only send if we have a loaded model; otherwise the keypress is ignored,
    // matching the grayed-out Send button.
    const readyToSend = currentLoadedModel && modelSelect.value !== '' && !modelSelect.disabled;
    if (readyToSend) {
        sendMessage();
    }
}
296
+
297
// Handle paste events for images.
// Text-only pastes fall through to the browser default (preserving caret and
// undo history); pastes containing images are intercepted so the images go
// into attachedFiles and any accompanying text is inserted manually.
async function handleChatInputPaste(e) {
    const clipboardData = e.clipboardData || window.clipboardData;
    const items = clipboardData.items;
    let hasImage = false;
    let pastedText = '';

    // Check for text content first
    for (let item of items) {
        if (item.type === 'text/plain') {
            pastedText = clipboardData.getData('text/plain');
        }
    }

    // Check for images
    for (let item of items) {
        if (item.type.indexOf('image') !== -1) {
            hasImage = true;
            const file = item.getAsFile();
            if (file && file.type.startsWith('image/')) {
                // Check if current model supports vision before adding image
                const currentModel = modelSelect.value;
                if (!isVisionModel(currentModel)) {
                    alert(`The selected model "${currentModel}" does not support image inputs. Please select a model with "Vision" capabilities to paste images.`);
                    // Don't prevent default if we're not handling the paste.
                    // NOTE(review): this early return also skips the preview
                    // refresh for any images already pushed earlier in this
                    // loop — confirm mixed clipboards can't hit this path.
                    return;
                }
                // Add to attachedFiles array only if it's an image and model supports vision
                attachedFiles.push(file);
            } else if (file) {
                console.warn(`Skipping non-image pasted file: ${file.name || 'unknown'} (${file.type})`);
            }
        }
    }

    // If we have images, prevent default and handle specially
    if (hasImage && attachedFiles.length > 0) {
        e.preventDefault();

        // If there's also text, insert it at cursor position
        if (pastedText) {
            insertTextAtCursor(chatInput, pastedText);
        }

        // Update placeholder to show attached images
        updateInputPlaceholder();
        updateAttachmentPreviewVisibility();
        updateAttachmentPreviews();
    }
    // If no images, let the browser handle the paste normally (preserves cursor position and undo)
}
348
+
349
// Insert `text` into a textarea/input at the current selection, replacing any
// selected range, then place the caret just after the inserted text.
function insertTextAtCursor(textElement, text) {
    const { selectionStart: start, selectionEnd: end, value } = textElement;

    // Splice the pasted text over the selected range.
    textElement.value = value.slice(0, start) + text + value.slice(end);

    // Collapse the selection to just after the insertion.
    const caret = start + text.length;
    textElement.setSelectionRange(caret, caret);

    // Focus the element to ensure cursor is visible
    textElement.focus();
}
366
+
367
// Drop all staged attachments, reset the hidden file input, and refresh the
// placeholder text and preview strip.
function clearAttachments() {
    attachedFiles = [];
    fileAttachment.value = '';
    updateInputPlaceholder();
    updateAttachmentPreviewVisibility();
    updateAttachmentPreviews();
}
374
+
375
// Show the preview strip only while at least one attachment is staged.
function updateAttachmentPreviewVisibility() {
    const hasFiles = attachedFiles.length > 0;
    // toggle(name, force) adds when true, removes when false.
    attachmentsPreviewContainer.classList.toggle('has-attachments', hasFiles);
}
382
+
383
// Rebuild the attachment preview strip: one thumbnail + filename + remove
// button per staged image. Called after any change to attachedFiles.
function updateAttachmentPreviews() {
    // Clear existing previews
    attachmentsPreviewRow.innerHTML = '';

    if (attachedFiles.length === 0) return;

    attachedFiles.forEach((file, index) => {
        // Skip non-image files (extra safety check)
        if (!file.type.startsWith('image/')) {
            console.warn(`Skipping non-image file in preview: ${file.name} (${file.type})`);
            return;
        }

        const previewDiv = document.createElement('div');
        previewDiv.className = 'attachment-preview';

        // Create thumbnail (src is filled in asynchronously by the FileReader below)
        const thumbnail = document.createElement('img');
        thumbnail.className = 'attachment-thumbnail';
        thumbnail.alt = file.name;

        // Create filename display; pasted images have no name, so synthesize one
        const filename = document.createElement('div');
        filename.className = 'attachment-filename';
        filename.textContent = file.name || `pasted-image-${index + 1}`;
        filename.title = file.name || `pasted-image-${index + 1}`;

        // Create remove button
        const removeBtn = document.createElement('button');
        removeBtn.className = 'attachment-remove-btn';
        removeBtn.innerHTML = '✕';
        removeBtn.title = 'Remove this image';
        removeBtn.onclick = () => removeAttachment(index);

        // Generate thumbnail for image
        const reader = new FileReader();
        reader.onload = (e) => { thumbnail.src = e.target.result; };
        reader.readAsDataURL(file);

        previewDiv.appendChild(thumbnail);
        previewDiv.appendChild(filename);
        previewDiv.appendChild(removeBtn);
        attachmentsPreviewRow.appendChild(previewDiv);
    });
}
428
+
429
// Remove the staged attachment at `index` and refresh dependent UI
// (placeholder text, strip visibility, thumbnails).
function removeAttachment(index) {
    attachedFiles.splice(index, 1);
    updateInputPlaceholder();
    updateAttachmentPreviewVisibility();
    updateAttachmentPreviews();
}
435
+
436
// Reflect the number of staged images in the chat input's placeholder text.
function updateInputPlaceholder() {
    const count = attachedFiles.length;
    chatInput.placeholder = count > 0
        ? `Type your message... (${count} image${count > 1 ? 's' : ''} attached)`
        : 'Type your message...';
}
444
+
445
// Read a File/Blob and resolve with its base64 payload (the data-URL content
// with the "data:<mime>;base64," prefix stripped). Rejects on read errors.
function fileToBase64(file) {
    return new Promise((resolve, reject) => {
        const reader = new FileReader();
        reader.onload = () => {
            // Keep only the payload after the data-URL prefix.
            resolve(reader.result.split(',')[1]);
        };
        reader.onerror = (error) => reject(error);
        reader.readAsDataURL(file);
    });
}
454
+
455
/**
 * Incrementally (re)renders reasoning + answer without blowing away the header so user
 * collapsing/expanding persists while tokens stream.
 *
 * @param {HTMLElement} bubbleElement - The chat bubble to render into. Expand/
 *   collapse preference and animation state are persisted on its dataset
 *   (thinkExpanded, thinkAnimActive, thinkAnimId).
 * @param {string} text - Full raw message text (may contain <think>/Harmony
 *   reasoning markers; see parseReasoningBlocks).
 * @param {boolean} [isMarkdown=false] - When false, text is set verbatim.
 */
function updateMessageContent(bubbleElement, text, isMarkdown = false) {
    if (!isMarkdown) {
        bubbleElement.textContent = text;
        return;
    }

    const { main, thought, isThinking } = parseReasoningBlocks(text);

    // Pure normal markdown (no reasoning)
    if (!thought.trim()) {
        // If structure existed before, replace fully (safe—no toggle needed)
        bubbleElement.innerHTML = renderMarkdown(main);
        delete bubbleElement.dataset.thinkExpanded;
        return;
    }

    // Determine current expanded state (user preference) or default
    let expanded;
    if (bubbleElement.dataset.thinkExpanded === 'true') expanded = true;
    else if (bubbleElement.dataset.thinkExpanded === 'false') expanded = false;
    else expanded = !!isThinking; // default: open while still streaming until user intervenes

    // Create structure once; subsequent streaming updates reuse it so the
    // user's toggle and the running animation are not destroyed.
    let container = bubbleElement.querySelector('.think-tokens-container');
    let thoughtContent, headerChevron, headerLabel, mainDiv;

    if (!container) {
        bubbleElement.innerHTML = ''; // first time constructing reasoning UI

        container = document.createElement('div');
        container.className = 'think-tokens-container' + (expanded ? '' : ' collapsed');

        const header = document.createElement('div');
        header.className = 'think-tokens-header';
        header.onclick = function () { toggleThinkTokens(header); };

        headerChevron = document.createElement('span');
        headerChevron.className = 'think-tokens-chevron';
        headerChevron.textContent = expanded ? '▼' : '▶';

        headerLabel = document.createElement('span');
        headerLabel.className = 'think-tokens-label';
        header.appendChild(headerChevron);
        header.appendChild(headerLabel);

        thoughtContent = document.createElement('div');
        thoughtContent.className = 'think-tokens-content';
        thoughtContent.style.display = expanded ? 'block' : 'none';

        container.appendChild(header);
        container.appendChild(thoughtContent);
        bubbleElement.appendChild(container);

        if (main.trim()) {
            mainDiv = document.createElement('div');
            mainDiv.className = 'main-response';
            bubbleElement.appendChild(mainDiv);
        }
    } else {
        // Reuse the existing structure built on a previous call.
        thoughtContent = container.querySelector('.think-tokens-content');
        headerChevron = container.querySelector('.think-tokens-chevron');
        headerLabel = container.querySelector('.think-tokens-label');
        mainDiv = bubbleElement.querySelector('.main-response');
    }

    // Update label & chevron (don’t override user-expanded state)
    headerChevron.textContent = expanded ? '▼' : '▶';
    // Animation-aware label handling
    if (isThinking) {
        // If not already animating, seed an initial frame then start animation
        if (bubbleElement.dataset.thinkAnimActive !== '1') {
            headerLabel.textContent = THINKING_FRAMES[0];
            startThinkingAnimation(container);
        }
    } else {
        // Stop any animation and set final label
        if (bubbleElement.dataset.thinkAnimActive === '1') {
            stopThinkingAnimation(container);
        } else {
            headerLabel.textContent = 'Thought Process';
        }
    }

    // Update reasoning content (can re-run markdown safely)
    thoughtContent.innerHTML = renderMarkdown(thought);

    // Update main answer section; create it lazily if the answer started
    // arriving after the reasoning UI was built, remove it if it emptied.
    if (main.trim()) {
        if (!mainDiv) {
            mainDiv = document.createElement('div');
            mainDiv.className = 'main-response';
            bubbleElement.appendChild(mainDiv);
        }
        mainDiv.innerHTML = renderMarkdown(main);
    } else if (mainDiv) {
        mainDiv.remove();
    }

    // Persist preference
    bubbleElement.dataset.thinkExpanded = expanded ? 'true' : 'false';
}
560
+
561
// Scroll helper that respects the user's scroll interaction. If autoscroll
// was disabled because the user scrolled up, this does not force the view to
// the bottom unless `force` is true.
function scrollChatToBottom(force = false) {
    if (!chatHistory) return;
    if (!force && !autoscrollEnabled) return;
    // Small timeout to allow DOM insertion/layout to finish in streaming cases
    setTimeout(() => {
        try {
            chatHistory.scrollTop = chatHistory.scrollHeight;
        } catch (_) {}
    }, 0);
}
572
+
573
// Append a chat bubble for `role` containing `text` and return the bubble
// element so callers can keep streaming into it. With isMarkdown, content is
// routed through updateMessageContent so later token updates won't wipe the
// user's reasoning expand/collapse preference.
function appendMessage(role, text, isMarkdown = false) {
    const row = document.createElement('div');
    row.className = 'chat-message ' + role;

    // Inner bubble for iMessage style.
    const bubble = document.createElement('div');
    bubble.className = 'chat-bubble ' + role;

    if (isMarkdown) {
        // Build structure via incremental updater, regardless of role.
        updateMessageContent(bubble, text, true);
    } else {
        bubble.textContent = text;
    }

    row.appendChild(bubble);
    chatHistory.appendChild(row);
    scrollChatToBottom();
    return bubble;
}
593
+
594
// Display system message based on current state.
// Shows onboarding text in the chat area: install instructions when no models
// are installed, a load prompt when models exist but none is loaded, and
// nothing once a conversation has started.
function displaySystemMessage() {
    // Remove existing system message if it exists
    if (systemMessageElement) {
        systemMessageElement.remove();
        systemMessageElement = null;
    }

    // Don't show system message if there are already user/LLM messages
    if (messages.length > 0) return;

    let messageText = '';

    // Check if any models are installed (Set maintained by models.js)
    const hasInstalledModels = window.installedModels && window.installedModels.size > 0;

    if (!hasInstalledModels) {
        // No models installed - show first message
        messageText = `Welcome to Lemonade! To get started:
1. Head over to the Model Management tab.
2. Use the 📥Download button to download a model.
3. Use the 🚀Load button to load the model.
4. Come back to this tab, and you are ready to chat with the model.`;
    } else if (!currentLoadedModel) {
        // Models available but none loaded - show second message
        messageText = 'Welcome to Lemonade! Choose a model from the dropdown menu below to load it and start chatting.';
    }

    if (messageText) {
        const div = document.createElement('div');
        div.className = 'chat-message system';
        div.setAttribute('data-system-message', 'true');

        const bubble = document.createElement('div');
        bubble.className = 'chat-bubble system';
        bubble.textContent = messageText;

        div.appendChild(bubble);
        chatHistory.appendChild(div);
        scrollChatToBottom();

        // Remember the element so the next call can replace it.
        systemMessageElement = div;
    }
}
638
+
639
// Abort the in-flight streaming request on the client and ask the server to
// halt generation. No-op when nothing is streaming.
function abortCurrentRequest() {
    if (abortController) {
        // Abort the in-flight fetch stream immediately
        abortController.abort();

        // Also signal the server to halt generation promptly (helps slow CPU backends)
        try {
            // Fire-and-forget; no await to avoid blocking UI
            fetch(getServerBaseUrl() + '/api/v1/halt', { method: 'GET', keepalive: true }).catch(() => {});
        } catch (_) {}
        // Reset streaming state so the toggle button returns to "Send".
        abortController = null;
        isStreaming = false;
        updateAttachmentButtonState();
        console.log('Streaming request aborted by user.');
    }
}
655
+
656
+
657
// ---------- Reasoning Parsing (Harmony + <think>) ----------

// Split raw model output into the visible answer (`main`) and concatenated
// reasoning text (`thought`). Supports <think>...</think> and the Harmony
// variants <|channel|>analysis<|channel|>/<|message|>/<|assistant|> ...
// <|end|>. `isThinking` is true when the text ends inside an unclosed
// reasoning block (i.e. reasoning is still streaming).
function parseReasoningBlocks(raw) {
    if (raw == null) return { main: '', thought: '', isThinking: false };

    const OPENER = /<think>|<\|channel\|>analysis<\|(channel|message|assistant)\|>/;
    const CLOSER = /<\/think>|<\|end\|>/;

    const mainParts = [];
    const thoughtParts = [];
    let inThought = false;
    let rest = String(raw);

    // Append a chunk to whichever side we are currently on.
    const emit = (chunk) => {
        (inThought ? thoughtParts : mainParts).push(chunk);
    };

    for (;;) {
        const openAt = rest.search(OPENER);
        if (openAt === -1) {
            // No more openers; the tail belongs to the current side.
            emit(rest);
            break;
        }

        // Text before the opener, then strip the opener itself.
        emit(rest.slice(0, openAt));
        rest = rest.slice(openAt).replace(OPENER, '');
        inThought = true;

        const closeAt = rest.search(CLOSER);
        if (closeAt === -1) {
            // Still streaming reasoning (no closer yet).
            thoughtParts.push(rest);
            break;
        }

        // Reasoning segment up to the closer, then strip the closer and
        // continue scanning for further reasoning blocks.
        thoughtParts.push(rest.slice(0, closeAt));
        rest = rest.slice(closeAt).replace(CLOSER, '');
        inThought = false;
    }

    return { main: mainParts.join(''), thought: thoughtParts.join(''), isThinking: inThought };
}
707
+
708
// One-shot renderer: returns the complete HTML for a message that may contain
// reasoning blocks. `preservedExpanded`, when boolean, pins the expand state;
// otherwise the reasoning section defaults to open only while still streaming.
function renderMarkdownWithThinkTokens(text, preservedExpanded) {
    const { main, thought, isThinking } = parseReasoningBlocks(text);

    // No reasoning content: plain markdown only.
    if (!thought.trim()) {
        return renderMarkdown(main);
    }

    // Honor a preserved user preference; otherwise open while streaming.
    const expanded = (typeof preservedExpanded === 'boolean')
        ? preservedExpanded
        : !!isThinking;

    const chevron = expanded ? '▼' : '▶';
    // Expanded-and-streaming shows "Thinking..."; everything else reads
    // "Thought Process" (the original's nested ternary collapsed to this).
    const label = (expanded && isThinking) ? 'Thinking...' : 'Thought Process';

    const reasoningHtml = `
        <div class="think-tokens-container${expanded ? '' : ' collapsed'}">
            <div class="think-tokens-header" onclick="toggleThinkTokens(this)">
                <span class="think-tokens-chevron">${chevron}</span>
                <span class="think-tokens-label">${label}</span>
            </div>
            <div class="think-tokens-content" style="display:${expanded ? 'block' : 'none'};">
                ${renderMarkdown(thought)}
            </div>
        </div>
    `;

    return main.trim()
        ? reasoningHtml + `<div class="main-response">${renderMarkdown(main)}</div>`
        : reasoningHtml;
}
740
+
741
// Split a completed assistant message into API-shaped fields:
// `content` (the trimmed answer), optional `reasoning_content` (trimmed
// reasoning, only when non-empty), plus the untouched raw text.
function extractAssistantReasoning(fullText) {
    const { main, thought } = parseReasoningBlocks(fullText);
    const result = { content: (main || '').trim(), raw: fullText };
    const trimmedThought = thought ? thought.trim() : '';
    if (trimmedThought) {
        result.reasoning_content = trimmedThought;
    }
    return result;
}
747
+
748
+ // -----------------------------------------------------------
749
+
750
// Flip the reasoning section between collapsed and expanded when its header
// is clicked, and persist the user's choice on the bubble's dataset so
// streaming re-renders don't override it.
function toggleThinkTokens(header) {
    const container = header.parentElement;
    const content = container.querySelector('.think-tokens-content');
    const chevron = header.querySelector('.think-tokens-chevron');
    const bubble = header.closest('.chat-bubble');

    // Currently collapsed means this click expands, and vice versa.
    const willExpand = container.classList.contains('collapsed');

    content.style.display = willExpand ? 'block' : 'none';
    chevron.textContent = willExpand ? '▼' : '▶';
    container.classList.toggle('collapsed', !willExpand);
    if (bubble) {
        bubble.dataset.thinkExpanded = willExpand ? 'true' : 'false';
    }
}
771
+
772
// Begin cycling the "Thinking" label frames on a reasoning section while the
// response is streaming. Idempotent: a second call while the animation is
// already active is a no-op. State is kept on the chat bubble's dataset so
// stopThinkingAnimation can halt it and cancel the pending timer.
function startThinkingAnimation(container) {
  const bubble = container.closest('.chat-bubble');
  if (!bubble) return;
  if (bubble.dataset.thinkAnimActive === '1') return; // already animating
  const labelEl = container.querySelector('.think-tokens-label');
  if (!labelEl) return;

  bubble.dataset.thinkAnimActive = '1';
  let frameIndex = 0;
  function tick() {
    // Streaming may have ended mid-cycle; bail out quietly.
    if (bubble.dataset.thinkAnimActive !== '1') return;
    labelEl.textContent = THINKING_FRAMES[frameIndex % THINKING_FRAMES.length];
    frameIndex += 1;
    // Remember the timer id so the stop routine can clearTimeout() it.
    bubble.dataset.thinkAnimId = String(setTimeout(tick, THINKING_ANIM_INTERVAL_MS));
  }
  tick();
}
788
+
789
// Halt the label animation started by startThinkingAnimation: mark the bubble
// inactive, cancel any pending frame timer, and settle the header label on
// `finalLabel` (defaults to the resting 'Thought Process' text).
function stopThinkingAnimation(container, finalLabel = 'Thought Process') {
  const bubble = container.closest('.chat-bubble');
  if (!bubble) return;

  bubble.dataset.thinkAnimActive = '0';

  const pendingId = bubble.dataset.thinkAnimId;
  if (pendingId) {
    clearTimeout(Number(pendingId));
    delete bubble.dataset.thinkAnimId;
  }

  const labelEl = container.querySelector('.think-tokens-label');
  if (labelEl) labelEl.textContent = finalLabel;
}
801
+
802
// Send the current chat input (or `existingTextIfAny`) plus any attached
// images to the loaded model and stream the assistant's reply into a new
// chat bubble. Reasoning deltas — OpenAI-style `delta.reasoning` objects or
// llama.cpp-style `delta.reasoning_content` fragments — are normalized into
// <think>…</think> markers inside the accumulated text so the renderer can
// display them as a collapsible section. Aborting via the Stop button raises
// AbortError, which is treated as a clean cancellation, not an error.
async function sendMessage(existingTextIfAny) {
  const text = (existingTextIfAny !== undefined ? existingTextIfAny : chatInput.value.trim());

  // Prepare abort controller for this request
  abortController = new AbortController();
  // UI state: set button to Stop
  if (toggleBtn) {
    toggleBtn.disabled = false;
    toggleBtn.textContent = 'Stop';
  }
  if (!text && attachedFiles.length === 0) {
    // Nothing to send; revert button state and clear abort handle
    abortController = null;
    updateAttachmentButtonState();
    return;
  }

  isStreaming = true;

  // Remove system message when user starts chatting
  if (systemMessageElement) {
    systemMessageElement.remove();
    systemMessageElement = null;
  }

  // Check if a model is loaded
  if (!currentLoadedModel) {
    alert('Please load a model first before sending messages.');
    abortController = null;
    isStreaming = false;
    updateAttachmentButtonState();
    return;
  }

  // Check if trying to send images to non-vision model
  if (attachedFiles.length > 0 && !isVisionModel(currentLoadedModel)) {
    alert(`Cannot send images to model "${currentLoadedModel}" as it does not support vision. Please load a model with "Vision" capabilities or remove the attached images.`);
    // Fix: this early return previously left the Stop button armed,
    // abortController set, and isStreaming stuck at true. Clean up the UI
    // state exactly like the other early-return paths above.
    abortController = null;
    isStreaming = false;
    updateAttachmentButtonState();
    return;
  }

  // Create message content
  let messageContent = [];

  // Add text if present
  if (text) {
    messageContent.push({ type: "text", text: text });
  }

  // Add images if present
  if (attachedFiles.length > 0) {
    for (const file of attachedFiles) {
      if (file.type.startsWith('image/')) {
        try {
          const base64 = await fileToBase64(file);
          messageContent.push({
            type: "image_url",
            image_url: { url: `data:${file.type};base64,${base64}` }
          });
        } catch (error) {
          console.error('Error converting image to base64:', error);
        }
      }
    }
  }

  // Display user message (show text and file names)
  let displayText = text;
  if (attachedFiles.length > 0) {
    const fileNames = attachedFiles.map(f => f.name || 'pasted-image').join(', ');
    displayText = displayText ? `${displayText}\n[Images: ${fileNames}]` : `[Images: ${fileNames}]`;
  }

  appendMessage('user', displayText, true);

  // Add to messages array; a lone text part is sent as a plain string for
  // compatibility with non-multimodal endpoints.
  const userMessage = {
    role: 'user',
    content: messageContent.length === 1 && messageContent[0].type === "text"
      ? messageContent[0].text
      : messageContent
  };
  messages.push(userMessage);

  // Clear input and attachments
  chatInput.value = '';
  attachedFiles = [];
  fileAttachment.value = '';
  updateInputPlaceholder(); // Reset placeholder
  updateAttachmentPreviewVisibility(); // Hide preview container
  updateAttachmentPreviews(); // Clear previews
  // Keep the Send/Stop button enabled during streaming so user can abort.

  // Stream the OpenAI-compatible chat completion.
  let llmText = '';
  const llmBubble = appendMessage('llm', '...');
  try {
    // Use the correct endpoint for chat completions with model settings
    const modelSettings = getCurrentModelSettings ? getCurrentModelSettings() : {};
    console.log('Applying model settings to API request:', modelSettings);

    const payload = {
      model: currentLoadedModel,
      messages: messages,
      stream: true,
      ...modelSettings // Apply current model settings
    };

    const resp = await httpRequest(getServerBaseUrl() + '/api/v1/chat/completions', {
      method: 'POST',
      headers: { 'Content-Type': 'application/json' },
      body: JSON.stringify(payload),
      signal: abortController ? abortController.signal : undefined
    });
    if (!resp.body) throw new Error('No stream');
    const reader = resp.body.getReader();
    let decoder = new TextDecoder();
    llmBubble.textContent = '';

    // Whether the loaded model is tagged as a reasoning model in the
    // server's model metadata (used to decide when to close <think>).
    const reasoningEnabled = (() => {
      try {
        const meta = window.SERVER_MODELS?.[currentLoadedModel];
        return Array.isArray(meta?.labels) && meta.labels.includes('reasoning');
      } catch (_) { return false; }
    })();

    let thinkOpened = false;
    let thinkClosed = false;
    let receivedAnyReasoning = false; // true once any reasoning (schema or reasoning_content) arrived
    // Fix: buffer partial SSE lines so a "data: {...}" payload split across
    // network chunks is reassembled instead of being dropped by JSON.parse.
    let sseBuffer = '';

    // Process a single SSE line ("data: {json}"); mutates llmText and the
    // think-state flags in closure scope and refreshes the bubble.
    const handleDataLine = (rawLine) => {
      if (!rawLine.startsWith('data: ')) return;
      const jsonStr = rawLine.slice(6).trim();
      if (!jsonStr || jsonStr === '[DONE]') return;

      let deltaObj;
      try { deltaObj = JSON.parse(jsonStr); } catch { return; }
      const choiceDelta = deltaObj?.choices?.[0]?.delta;
      if (!choiceDelta) return;

      // 1. OpenAI reasoning object (preferred schema)
      if (choiceDelta.reasoning && !thinkClosed) {
        const r = choiceDelta.reasoning;
        if (!thinkOpened) {
          llmText += '<think>';
          thinkOpened = true;
        }
        if (Array.isArray(r.content)) {
          for (const seg of r.content) {
            if (seg?.type === 'output_text' && seg.text) {
              llmText += unescapeJsonString(seg.text);
              receivedAnyReasoning = true;
            }
          }
        }
        // The schema marks the end of reasoning explicitly.
        if (r.done && !thinkClosed) {
          llmText += '</think>';
          thinkClosed = true;
        }
      }

      // 2. llama.cpp style: reasoning_content (string fragments)
      if (choiceDelta.reasoning_content && !thinkClosed) {
        if (!thinkOpened) {
          llmText += '<think>';
          thinkOpened = true;
        }
        llmText += unescapeJsonString(choiceDelta.reasoning_content);
        receivedAnyReasoning = true;
        // We DO NOT close yet; we close when the first normal content arrives.
      }

      // 3. Plain content tokens
      if (choiceDelta.content) {
        let c = unescapeJsonString(choiceDelta.content);

        // First visible answer token while reasoning is open: close the
        // reasoning block (unless the model emitted </think> itself).
        if (thinkOpened && !thinkClosed) {
          if (c.startsWith('</think>')) {
            // Model closed it explicitly; strip that tag and mark closed
            c = c.replace(/^<\/think>\s*/, '');
            thinkClosed = true;
          } else if (receivedAnyReasoning || reasoningEnabled) {
            // Close ourselves (covers reasoning_content path & schema early content anomaly)
            llmText += '</think>';
            thinkClosed = true;
          }
        }

        // If content stream itself begins a new reasoning section (rare), handle gracefully
        if (!thinkOpened && /<think>/.test(c)) {
          thinkOpened = true;
          const parts = c.split(/<think>/);
          // parts[0] is anything before the <think>, treated as visible content
          llmText += parts[0];
          // Everything after the opener is reasoning until a close arrives
          llmText += '<think>' + parts.slice(1).join('<think>');
          receivedAnyReasoning = true;
          updateMessageContent(llmBubble, llmText, true);
          scrollChatToBottom();
          return;
        }

        llmText += c;
      }

      updateMessageContent(llmBubble, llmText, true);
      scrollChatToBottom();
    };

    while (true) {
      const { done, value } = await reader.read();
      if (done) break;
      // Fix: { stream: true } keeps multi-byte UTF-8 sequences that straddle
      // chunk boundaries intact instead of emitting replacement characters.
      sseBuffer += decoder.decode(value, { stream: true });
      const lines = sseBuffer.split('\n');
      sseBuffer = lines.pop(); // keep the trailing (possibly partial) line
      for (const rawLine of lines) handleDataLine(rawLine);
    }
    // Flush any bytes the decoder still holds plus a final unterminated line
    // (a well-formed SSE stream ends with a newline, so this is usually empty).
    sseBuffer += decoder.decode();
    if (sseBuffer) handleDataLine(sseBuffer);

    // Final safety close (e.g., model stopped mid-reasoning)
    if (thinkOpened && !thinkClosed) {
      llmText += '</think>';
    }

    const assistantMsg = extractAssistantReasoning(llmText);
    messages.push({ role: 'assistant', ...assistantMsg });

  } catch (e) {
    // If the request was aborted by the user, just clean up UI without error banner
    if (e.name === 'AbortError') {
      console.log('Chat request aborted by user.');
    } else {
      let detail = e.message;
      // Best-effort: re-issue a non-streaming request purely to surface a
      // server-side error detail; failures of this probe are ignored.
      try {
        const errPayload = { model: currentLoadedModel, messages: messages, stream: false };
        const errResp = await httpJson(getServerBaseUrl() + '/api/v1/chat/completions', {
          method: 'POST',
          headers: { 'Content-Type': 'application/json' },
          body: JSON.stringify(errPayload)
        });
        if (errResp && errResp.detail) detail = errResp.detail;
      } catch (_) {}
      llmBubble.textContent = '[Error: ' + detail + ']';
      showErrorBanner(`Chat error: ${detail}`);
    }
  }
  // Reset UI state after streaming finishes
  abortController = null;
  isStreaming = false;
  updateAttachmentButtonState();
  updateMessageContent(llmBubble, llmText, true);
}