PyPI - local-deep-research - Versions diffs - 0.6.0__py3-none-any.whl → 0.6.1__py3-none-any.whl - Mend

local-deep-research 0.6.0__py3-none-any.whl → 0.6.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7)

local_deep_research/__version__.py CHANGED Viewed

@@ -1 +1 @@
-__version__ = "0.6.0"
+__version__ = "0.6.1"

local_deep_research/web/templates/pages/benchmark_results.html CHANGED Viewed

@@ -6,6 +6,7 @@
 {% block extra_head %}
 <meta name="csrf-token" content="{{ csrf_token() }}">
+<meta name="app-version" content="{{ version }}">
 <style>
 .benchmark-results-card {
     width: 100%;
@@ -769,14 +770,21 @@ function createRunCard(run) {
                     <div class="summary-label">Avg Time/Question</div>
                 </div>
                 <div class="summary-item">
-                    ${status === 'in_progress' ?
-                        `<button class="btn btn-outline btn-sm delete-btn" onclick="event.stopPropagation(); cancelAndDeleteBenchmarkRun(${run.id})" style="background: #3a1e1e !important; border-color: #f44336 !important; color: #f44336 !important;">
-                            <i class="fas fa-stop"></i> Cancel & Delete
-                        </button>` :
-                        `<button class="btn btn-outline btn-sm delete-btn" onclick="event.stopPropagation(); deleteBenchmarkRun(${run.id})">
-                            <i class="fas fa-trash"></i> Delete
-                        </button>`
-                    }
+                    <div style="display: flex; gap: 8px;">
+                        ${status === 'completed' ?
+                            `<button class="btn btn-outline btn-sm" onclick="event.stopPropagation(); downloadBenchmarkYAML(${run.id})" style="background: #1e3a1e !important; border-color: #4caf50 !important; color: #4caf50 !important;">
+                                <i class="fas fa-download"></i> YAML
+                            </button>` : ''
+                        }
+                        ${status === 'in_progress' ?
+                            `<button class="btn btn-outline btn-sm delete-btn" onclick="event.stopPropagation(); cancelAndDeleteBenchmarkRun(${run.id})" style="background: #3a1e1e !important; border-color: #f44336 !important; color: #f44336 !important;">
+                                <i class="fas fa-stop"></i> Cancel & Delete
+                            </button>` :
+                            `<button class="btn btn-outline btn-sm delete-btn" onclick="event.stopPropagation(); deleteBenchmarkRun(${run.id})">
+                                <i class="fas fa-trash"></i> Delete
+                            </button>`
+                        }
+                    </div>
                     <div class="summary-label">Actions</div>
                 </div>
             </div>
@@ -1061,6 +1069,136 @@ async function cancelAndDeleteBenchmarkRun(runId) {
     }
 }
+async function downloadBenchmarkYAML(runId) {
+    try {
+        // Find the run in our local data
+        const run = benchmarkRuns.find(r => r.id === runId);
+        if (!run) {
+            showAlert('Benchmark run not found', 'error');
+            return;
+        }
+        // Get current date for filename
+        const date = new Date().toISOString().split('T')[0];
+        // Get app version from meta tag
+        const appVersion = document.querySelector('meta[name="app-version"]')?.content || 'Could not fetch version';
+        // Extract model name and clean it for filename
+        const modelName = run.search_config?.model_name || 'unknown-model';
+        const cleanModelName = modelName.replace(/[^a-zA-Z0-9.-]/g, '-').toLowerCase();
+        // Get all relevant settings from database
+        let localContextWindow = 'Could not fetch';
+        let maxTokens = 'Could not fetch';
+        let contextWindowUnrestricted = 'Could not fetch';
+        let contextWindowSize = 'Could not fetch';
+        let supportsMaxTokens = 'Could not fetch';
+        try {
+            const settingsResponse = await fetch('/settings/api');
+            if (settingsResponse.ok) {
+                const data = await settingsResponse.json();
+                if (data.status === 'success' && data.settings) {
+                    const settings = data.settings;
+                    // LLM settings - extract the 'value' property from each setting object
+                    localContextWindow = settings['llm.local_context_window_size']?.value || 'Could not fetch';
+                    maxTokens = settings['llm.max_tokens']?.value || 'Could not fetch';
+                    contextWindowUnrestricted = settings['llm.context_window_unrestricted']?.value !== undefined ?
+                        (settings['llm.context_window_unrestricted'].value ? 'Yes' : 'No') : 'Could not fetch';
+                    contextWindowSize = settings['llm.context_window_size']?.value || 'Could not fetch';
+                    supportsMaxTokens = settings['llm.supports_max_tokens']?.value !== undefined ?
+                        (settings['llm.supports_max_tokens'].value ? 'Yes' : 'No') : 'Could not fetch';
+                }
+            }
+        } catch (e) {
+            console.error('Could not fetch current settings:', e);
+        }
+        // Calculate average search results if available
+        const avgSearchResults = formatAvgSearchResults(run).replace(' results', '');
+        const searchResultsNum = avgSearchResults !== 'N/A' ? avgSearchResults : '# Please fill in';
+        // Generate YAML content
+        const yamlContent = `# Benchmark Result
+# Generated from Local Deep Research v${appVersion}
+# Date: ${date}
+# Model Information
+model: ${modelName}
+model_provider: ${run.search_config?.provider || 'unknown'}
+quantization: # Please fill in if applicable
+# Search Engine (critical for benchmark reproducibility)
+search_engine: ${run.search_config?.search_tool || 'unknown'}
+search_provider_version: # if known, e.g., "latest", "2024.1.0"
+average_results_per_query: ${searchResultsNum}
+# Hardware
+hardware:
+  gpu: # Please fill in
+  ram: # Please fill in
+  cpu: # Please fill in
+# Benchmark Results
+results:
+  dataset: SimpleQA
+  total_questions: ${run.total_examples}
+  ${run.search_config?.search_strategy === 'focused_iteration' ? 'focused_iteration' : 'source_based'}:
+    accuracy: ${run.overall_accuracy ? run.overall_accuracy.toFixed(1) : 0}% (${Math.round(run.overall_accuracy * run.total_examples / 100)}/${run.total_examples})
+    iterations: ${run.search_config?.iterations || 'N/A'}
+    questions_per_iteration: ${run.search_config?.questions_per_iteration || 'N/A'}
+    avg_time_per_question: ${formatAvgProcessingTime(run)}
+    total_tokens_used: # if available
+# Configuration
+configuration:
+  context_window: ${localContextWindow} # Current setting at download time - may differ from benchmark run
+  temperature: ${run.search_config?.temperature || 'N/A'}
+  max_tokens: ${maxTokens} # Current setting at download time
+  local_provider_context_window_size: ${localContextWindow} # Current setting at download time
+  context_window_unrestricted: ${contextWindowUnrestricted} # Current setting at download time
+# Versions
+versions:
+  ldr_version: ${appVersion}
+  ollama_version: # if applicable
+# Test Details
+test_details:
+  date_tested: ${date}
+  rate_limiting_issues: # yes/no
+  search_failures: # number of failed searches, if any
+# Notes
+notes: |
+  # Add any observations, errors, or insights here
+  # Search strategy: ${run.search_config?.search_strategy || 'unknown'}
+  # Provider: ${run.search_config?.provider || 'unknown'}
+  # Note: Configuration values are from current settings at download time,
+  # not necessarily the values used during the benchmark run
+`;
+        // Create blob and download
+        const blob = new Blob([yamlContent], { type: 'text/yaml' });
+        const url = window.URL.createObjectURL(blob);
+        const a = document.createElement('a');
+        a.style.display = 'none';
+        a.href = url;
+        a.download = `${cleanModelName}_${date}.yaml`;
+        document.body.appendChild(a);
+        a.click();
+        window.URL.revokeObjectURL(url);
+        document.body.removeChild(a);
+        showAlert('Benchmark YAML downloaded! Hardware details are optional but helpful for performance context.', 'success');
+    } catch (error) {
+        console.error('Error downloading YAML:', error);
+        showAlert('Error downloading YAML: ' + error.message, 'error');
+    }
+}
 async function deleteBenchmarkRun(runId) {
     try {
         const response = await fetch(`/benchmark/api/delete/${runId}`, {

{local_deep_research-0.6.0.dist-info → local_deep_research-0.6.1.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: local-deep-research
-Version: 0.6.0
+Version: 0.6.1
 Summary: AI-powered research assistant with deep, iterative analysis using LLMs and web searches
 Author-Email: LearningCircuit <185559241+LearningCircuit@users.noreply.github.com>, HashedViking <6432677+HashedViking@users.noreply.github.com>, djpetti <djpetti@gmail.com>
 License: MIT License
@@ -302,7 +302,7 @@ Early experiments on small SimpleQA dataset samples:
 | Configuration | Accuracy | Notes |
 |--------------|----------|--------|
 | gpt-4.1-mini + SearXNG + focused_iteration | 90-95% | Limited sample size |
-| gpt-4.1-mini + Tavily | Up to 95% | Limited sample size |
+| gpt-4.1-mini + Tavily + focused_iteration | 90-95% | Limited sample size |
 | gemini-2.0-flash-001 + SearXNG | 82% | Single test run |
 Note: These are preliminary results from initial testing. Performance varies significantly based on query types, model versions, and configurations. [Run your own benchmarks →](docs/BENCHMARKING.md)

{local_deep_research-0.6.0.dist-info → local_deep_research-0.6.1.dist-info}/RECORD RENAMED Viewed

@@ -1,9 +1,9 @@
-local_deep_research-0.6.0.dist-info/METADATA,sha256=f1zxuIR6tmbB13f_PPbBBGvIyFiEAicvJDgwO9YOcPU,14505
-local_deep_research-0.6.0.dist-info/WHEEL,sha256=tSfRZzRHthuv7vxpI4aehrdN9scLjk-dCJkPLzkHxGg,90
-local_deep_research-0.6.0.dist-info/entry_points.txt,sha256=GcXS501Rjh-P80S8db7hnrQ23mS_Jg27PwpVQVO77as,113
-local_deep_research-0.6.0.dist-info/licenses/LICENSE,sha256=Qg2CaTdu6SWnSqk1_JtgBPp_Da-LdqJDhT1Vt1MUc5s,1072
+local_deep_research-0.6.1.dist-info/METADATA,sha256=YMrqywP2xGWYA40UZUB51NA5A3k9iYUitu5kHiJlpO4,14522
+local_deep_research-0.6.1.dist-info/WHEEL,sha256=tSfRZzRHthuv7vxpI4aehrdN9scLjk-dCJkPLzkHxGg,90
+local_deep_research-0.6.1.dist-info/entry_points.txt,sha256=GcXS501Rjh-P80S8db7hnrQ23mS_Jg27PwpVQVO77as,113
+local_deep_research-0.6.1.dist-info/licenses/LICENSE,sha256=Qg2CaTdu6SWnSqk1_JtgBPp_Da-LdqJDhT1Vt1MUc5s,1072
 local_deep_research/__init__.py,sha256=j1ktf_e9HeXPe86NHibY5aINtZfTSGRTvLNtz9BJZa4,1071
-local_deep_research/__version__.py,sha256=cID1jLnC_vj48GgMN6Yb1FA3JsQ95zNmCHmRYE8TFhY,22
+local_deep_research/__version__.py,sha256=baAcEjLSYFIeNZF51tOMmA_zAMhN8HvKael-UU-Ruec,22
 local_deep_research/advanced_search_system/__init__.py,sha256=sGusMj4eFIrhXR6QbOM16UDKB6aI-iS4IFivKWpMlh0,234
 local_deep_research/advanced_search_system/answer_decoding/__init__.py,sha256=BmmbIPQnouYyboFD61CDq71fW5On555w7dbt42s9gV4,148
 local_deep_research/advanced_search_system/answer_decoding/browsecomp_answer_decoder.py,sha256=4FDMP4n_z5DOzVIisH3_kexRqNm1AO3MDe-Md3WtgE0,12856
@@ -244,7 +244,7 @@ local_deep_research/web/templates/components/mobile_nav.html,sha256=6wbqweC5DGEy
 local_deep_research/web/templates/components/settings_form.html,sha256=Z1eEQ_SFlioH24zrIDpjMQ-ajEJC2lLN4Tu8Y8uASLY,15987
 local_deep_research/web/templates/components/sidebar.html,sha256=yvdex0rFt9IFEhVu50MEyvpBIlMKg8x9hLZf-cugPaY,1698
 local_deep_research/web/templates/pages/benchmark.html,sha256=jeqe6koHeVmXKt0U8_JKWnSZEZouq5SuW_kEZMMKjRs,103838
-local_deep_research/web/templates/pages/benchmark_results.html,sha256=K9cs2-i_jUsGVrZaDO8NmCsVNo7fmbthpW9zKglnSb0,33639
+local_deep_research/web/templates/pages/benchmark_results.html,sha256=ijQesleJN-pCNoyQGViRH5bCwb15fYY3vliH5hWjTfM,39771
 local_deep_research/web/templates/pages/benchmark_simple.html,sha256=mLvhzJqRj4rFRJPG9Jo-eHYSogeDVnpRgd5TwACZ1t8,14396
 local_deep_research/web/templates/pages/cost_analytics.html,sha256=mXHw-MSXztJMh6xvW2D_9KXW5EuyrpNnMFTpP7Ob2GQ,46194
 local_deep_research/web/templates/pages/details.html,sha256=Led51_cv97e_Z057_7QVWT7imVB4f71FWeL2q83CJrE,12413
@@ -289,4 +289,4 @@ local_deep_research/web_search_engines/retriever_registry.py,sha256=ZErfErn6s1LI
 local_deep_research/web_search_engines/search_engine_base.py,sha256=0ys6nqm4WLTvYqHLZk4x5ZKFTc4BcqhUBjT1m1Jibp0,17114
 local_deep_research/web_search_engines/search_engine_factory.py,sha256=jKvLkv6rHWSKTnqfLvyvA2WF4qu5qaelgd4IoGOcyVs,12588
 local_deep_research/web_search_engines/search_engines_config.py,sha256=aZ1Y5YMPWgZqRC-wCJ4JUQgliBNSbU0dOUlCvR_elws,6086
-local_deep_research-0.6.0.dist-info/RECORD,,
+local_deep_research-0.6.1.dist-info/RECORD,,

{local_deep_research-0.6.0.dist-info → local_deep_research-0.6.1.dist-info}/WHEEL RENAMED Viewed

File without changes

{local_deep_research-0.6.0.dist-info → local_deep_research-0.6.1.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{local_deep_research-0.6.0.dist-info → local_deep_research-0.6.1.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

local-deep-research 0.6.0__py3-none-any.whl → 0.6.1__py3-none-any.whl

local-deep-research 0.6.0__py3-none-any.whl → 0.6.1__py3-none-any.whl