mirage_benchmark-1.0.4-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

This version of mirage-benchmark might be problematic.

@@ -0,0 +1,490 @@
+ Metadata-Version: 2.4
+ Name: mirage-benchmark
+ Version: 1.0.4
+ Summary: A Multiagent Framework for Generating Multimodal Multihop QA Datasets for RAG Evaluation
+ Home-page: https://github.com/ChandanKSahu/MiRAGE
+ Author: MiRAGE Authors
+ Author-email: MiRAGE Authors <contact@example.com>
+ Maintainer-email: MiRAGE Authors <contact@example.com>
+ License: Apache-2.0
+ Project-URL: Homepage, https://github.com/ChandanKSahu/MiRAGE
+ Project-URL: Documentation, https://github.com/ChandanKSahu/MiRAGE#readme
+ Project-URL: Repository, https://github.com/ChandanKSahu/MiRAGE.git
+ Project-URL: Issues, https://github.com/ChandanKSahu/MiRAGE/issues
+ Keywords: rag,multimodal,qa,dataset,generation,llm,vlm,evaluation,benchmark
+ Classifier: Development Status :: 4 - Beta
+ Classifier: Intended Audience :: Developers
+ Classifier: Intended Audience :: Science/Research
+ Classifier: License :: OSI Approved :: Apache Software License
+ Classifier: Programming Language :: Python :: 3
+ Classifier: Programming Language :: Python :: 3.9
+ Classifier: Programming Language :: Python :: 3.10
+ Classifier: Programming Language :: Python :: 3.11
+ Classifier: Programming Language :: Python :: 3.12
+ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
+ Classifier: Topic :: Software Development :: Libraries :: Python Modules
+ Requires-Python: >=3.9
+ Description-Content-Type: text/markdown
+ License-File: LICENSE
+ Requires-Dist: torch>=2.0.0
+ Requires-Dist: faiss-cpu>=1.7.0
+ Requires-Dist: numpy>=1.21.0
+ Requires-Dist: Pillow>=9.0.0
+ Requires-Dist: transformers>=4.44.0
+ Requires-Dist: huggingface_hub>=0.16.0
+ Requires-Dist: tqdm>=4.65.0
+ Requires-Dist: pyyaml>=6.0
+ Requires-Dist: requests>=2.28.0
+ Requires-Dist: aiohttp>=3.8.0
+ Requires-Dist: sentence-transformers>=2.2.0
+ Requires-Dist: bertopic>=0.16.0
+ Requires-Dist: umap-learn>=0.5.0
+ Requires-Dist: pandas>=1.5.0
+ Requires-Dist: scikit-learn>=1.0.0
+ Provides-Extra: gpu
+ Requires-Dist: faiss-gpu>=1.7.0; extra == "gpu"
+ Requires-Dist: bitsandbytes>=0.43.0; extra == "gpu"
+ Requires-Dist: accelerate>=0.20.0; extra == "gpu"
+ Provides-Extra: pdf
+ Requires-Dist: docling>=0.1.0; extra == "pdf"
+ Requires-Dist: pypdfium2>=4.0.0; extra == "pdf"
+ Provides-Extra: eval
+ Requires-Dist: ragas>=0.1.0; extra == "eval"
+ Requires-Dist: datasets>=2.0.0; extra == "eval"
+ Requires-Dist: langchain-google-genai>=1.0.0; extra == "eval"
+ Requires-Dist: langchain-openai>=0.1.0; extra == "eval"
+ Provides-Extra: dev
+ Requires-Dist: pytest>=7.0.0; extra == "dev"
+ Requires-Dist: flake8>=5.0.0; extra == "dev"
+ Requires-Dist: black>=22.0.0; extra == "dev"
+ Requires-Dist: twine>=4.0.0; extra == "dev"
+ Requires-Dist: build>=0.10.0; extra == "dev"
+ Provides-Extra: all
+ Requires-Dist: faiss-gpu>=1.7.0; extra == "all"
+ Requires-Dist: bitsandbytes>=0.43.0; extra == "all"
+ Requires-Dist: accelerate>=0.20.0; extra == "all"
+ Requires-Dist: docling>=0.1.0; extra == "all"
+ Requires-Dist: pypdfium2>=4.0.0; extra == "all"
+ Requires-Dist: ragas>=0.1.0; extra == "all"
+ Requires-Dist: datasets>=2.0.0; extra == "all"
+ Requires-Dist: langchain-google-genai>=1.0.0; extra == "all"
+ Requires-Dist: langchain-openai>=0.1.0; extra == "all"
+ Requires-Dist: pytest>=7.0.0; extra == "all"
+ Requires-Dist: flake8>=5.0.0; extra == "all"
+ Requires-Dist: black>=22.0.0; extra == "all"
+ Dynamic: author
+ Dynamic: home-page
+ Dynamic: license-file
+ Dynamic: requires-python
+
+ # MiRAGE: A Multiagent Framework for Generating Multimodal Multihop Question-Answer Dataset for RAG Evaluation
+
+ <p align="center">
+ <img src="https://img.shields.io/badge/python-3.9+-blue.svg" alt="Python 3.9+">
+ <img src="https://img.shields.io/badge/license-Apache%202.0-green.svg" alt="License">
+ <img src="https://img.shields.io/pypi/v/mirage-benchmark.svg" alt="PyPI">
+ </p>
+
+ **MiRAGE** is a multi-agent framework for generating high-quality, multimodal, multihop question-answer datasets for evaluating Retrieval-Augmented Generation (RAG) systems.
+
+ <p align="center">
+ <img src="assets/mirage_framework.png" alt="MiRAGE Framework Architecture" width="100%">
+ </p>
+
+ ## Key Features
+
+ - **Multi-hop Context Completion**: Iteratively expands incomplete chunks with relevant context
+ - **Domain and Expert Role Detection**: Automatic domain identification using BERTopic + LLM
+ - **Multi-stage QA Pipeline**: Generate, Select, Verify, and Correct stages for quality assurance
+ - **Multimodal Support**: Handles text, tables, figures, and images
+ - **Multiple Backend Support**: Gemini, OpenAI, and local Ollama models
+ - **Fully Parallelized**: Thread and process pools for maximum throughput
+
+ ## Table of Contents
+
+ - [Installation](#installation)
+ - [Quick Start](#quick-start)
+ - [Usage](#usage)
+ - [API Keys Setup](#api-keys-setup)
+ - [Configuration](#configuration)
+ - [Command Line Options](#command-line-options)
+ - [Output Format](#output-format)
+ - [Project Structure](#project-structure)
+ - [Contributing](#contributing)
+ - [License](#license)
+
+ ## Installation
+
+ ### From PyPI
+
+ ```bash
+ pip install mirage-benchmark
+ ```
+
+ ### From Source
+
+ ```bash
+ git clone https://github.com/ChandanKSahu/MiRAGE.git
+ cd MiRAGE
+ pip install -e .
+ ```
+
+ ### With Optional Dependencies
+
+ ```bash
+ pip install mirage-benchmark[gpu]   # GPU support
+ pip install mirage-benchmark[pdf]   # PDF processing
+ pip install mirage-benchmark[all]   # All dependencies
+ ```
+
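+ To see which optional extras are usable in your environment, you can probe for a representative module of each one. This is an illustrative sketch; the mapping of extras to import names (`faiss`, `docling`, `ragas`) is an assumption based on the dependency lists above:
+
+ ```python
+ import importlib.util
+
+ # One representative import name per optional extra (assumed mapping).
+ extras = {"gpu": "faiss", "pdf": "docling", "eval": "ragas"}
+
+ for extra, module in extras.items():
+     available = importlib.util.find_spec(module) is not None
+     print(f"[{extra}] {module}: {'available' if available else 'not installed'}")
+ ```
+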
+ ## Quick Start
+
+ ### Step 1: Set Up API Key
+
+ Choose one of the following backends:
+
+ **Option A: Google Gemini (Recommended)**
+ ```bash
+ export GEMINI_API_KEY="your-gemini-api-key"
+ ```
+
+ **Option B: OpenAI**
+ ```bash
+ export OPENAI_API_KEY="your-openai-api-key"
+ ```
+
+ **Option C: Local Ollama (No API key needed)**
+ ```bash
+ # Start the Ollama server and pull a model (installation is covered below)
+ ollama serve
+ ollama pull llama3
+ ```
+
+ ### Step 2: Prepare Your Data
+
+ Place your documents in a folder:
+ ```bash
+ mkdir -p data/my_documents
+ cp /path/to/your/*.pdf data/my_documents/
+ ```
+
+ ### Step 3: Run MiRAGE
+
+ ```bash
+ # Basic usage
+ python run_mirage.py --input data/my_documents --output output/my_dataset
+
+ # With API key as argument
+ python run_mirage.py -i data/my_documents -o output/my_dataset --api-key YOUR_API_KEY
+
+ # Using OpenAI
+ python run_mirage.py -i data/my_documents -o output/my_dataset --backend openai
+
+ # Using local Ollama
+ python run_mirage.py -i data/my_documents -o output/my_dataset --backend ollama
+ ```
+
+ ### Step 4: Check Results
+
+ ```bash
+ ls output/my_dataset/
+ # qa_deduplicated.json   - Final QA dataset
+ # chunks.json            - Semantic chunks
+ # evaluation_report.json - Quality metrics
+ ```
+
+ ## Usage
+
+ ### Basic Usage
+
+ ```bash
+ python run_mirage.py --input <INPUT_DIR> --output <OUTPUT_DIR>
+ ```
+
+ ### With All Options
+
+ ```bash
+ python run_mirage.py \
+     --input data/documents \
+     --output output/results \
+     --backend gemini \
+     --api-key YOUR_API_KEY \
+     --num-qa-pairs 100 \
+     --max-workers 4 \
+     --verbose
+ ```
+
+ ### Run Preflight Checks
+
+ Before running the full pipeline, verify your setup:
+
+ ```bash
+ python run_mirage.py --preflight
+ ```
+
+ ### Using Sample Dataset
+
+ A sample dataset is included for testing:
+
+ ```bash
+ # Unzip sample data
+ unzip data/FinanceAnnualReports.zip -d data/sample/
+
+ # Run on sample
+ python run_mirage.py -i data/sample -o output/sample_results
+ ```
+
+ ## API Keys Setup
+
+ ### Google Gemini
+
+ 1. Get API key from: https://makersuite.google.com/app/apikey
+ 2. Set environment variable:
+ ```bash
+ export GEMINI_API_KEY="your-key-here"
+ ```
+
+ Or create a file:
+ ```bash
+ mkdir -p ~/.config/gemini
+ echo "your-key-here" > ~/.config/gemini/api_key.txt
+ ```
+
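+ For reference, here is a small illustrative sketch of how a key can be resolved from either the `GEMINI_API_KEY` environment variable or the `api_key_path` file used in `config.yaml`. This is not the package's own lookup logic, which may differ:
+
+ ```python
+ import os
+ from pathlib import Path
+ from typing import Optional
+
+ def resolve_gemini_key(path: str = "~/.config/gemini/api_key.txt") -> Optional[str]:
+     """Return a Gemini API key from the environment or a key file, if either exists."""
+     key = os.environ.get("GEMINI_API_KEY")
+     if key:
+         return key.strip()
+     key_file = Path(path).expanduser()
+     if key_file.is_file():
+         return key_file.read_text().strip()
+     return None  # nothing configured
+
+ print("Gemini key configured:", resolve_gemini_key() is not None)
+ ```
+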
+ ### OpenAI
+
+ 1. Get API key from: https://platform.openai.com/api-keys
+ 2. Set environment variable:
+ ```bash
+ export OPENAI_API_KEY="your-key-here"
+ ```
+
+ ### Ollama (Local - Free)
+
+ No API key needed! Just install Ollama:
+
+ ```bash
+ # Install
+ curl -fsSL https://ollama.com/install.sh | sh
+
+ # Start server
+ ollama serve
+
+ # Pull models
+ ollama pull llama3   # For text
+ ollama pull llava    # For vision
+ ```
+
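+ Before pointing MiRAGE at a local backend, you can confirm the Ollama server is reachable and the models are pulled. A minimal check using the `requests` library (already a declared dependency) against the default `base_url` from `config.yaml`; `/api/tags` is Ollama's endpoint for listing locally pulled models:
+
+ ```python
+ import requests
+
+ BASE_URL = "http://localhost:11434"  # default Ollama base_url used in config.yaml
+
+ # List the models the local Ollama server currently has pulled.
+ resp = requests.get(f"{BASE_URL}/api/tags", timeout=5)
+ resp.raise_for_status()
+ models = [m["name"] for m in resp.json().get("models", [])]
+ print("Ollama is up; local models:", models)  # expect llama3 and llava if pulled above
+ ```
+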
+ ## Configuration
+
+ ### Using config.yaml
+
+ Copy the example config and customize:
+
+ ```bash
+ cp config.yaml.example config.yaml
+ ```
+
+ Edit `config.yaml`:
+
+ ```yaml
+ backend:
+   active: GEMINI  # GEMINI, OPENAI, or OLLAMA
+
+ gemini:
+   api_key_path: ~/.config/gemini/api_key.txt
+   llm_model: gemini-2.0-flash
+   vlm_model: gemini-2.0-flash
+
+ openai:
+   api_key_path: ~/.config/openai/api_key.txt
+   llm_model: gpt-4o
+   vlm_model: gpt-4o
+
+ ollama:
+   base_url: http://localhost:11434
+   llm_model: llama3
+   vlm_model: llava
+
+ paths:
+   input_pdf_dir: data/documents
+   output_dir: output/results
+
+ qa_generation:
+   target_qa_pairs: 100
+   max_workers: 4
+ ```
+
+ Then run:
+ ```bash
+ python run_mirage.py --config config.yaml
+ ```
+
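+ If you want to inspect or adjust the configuration programmatically, it can be loaded with PyYAML, which is already a declared dependency. A minimal sketch, assuming the layout shown above (keys beyond those in the example are not guaranteed):
+
+ ```python
+ import yaml
+
+ with open("config.yaml") as f:
+     cfg = yaml.safe_load(f)
+
+ active = cfg["backend"]["active"]   # e.g. "GEMINI"
+ backend_cfg = cfg[active.lower()]   # the matching backend section (gemini/openai/ollama)
+ print("Backend:", active)
+ print("LLM model:", backend_cfg["llm_model"], "| VLM model:", backend_cfg["vlm_model"])
+ print("Input dir:", cfg["paths"]["input_pdf_dir"])
+ print("Target QA pairs:", cfg["qa_generation"]["target_qa_pairs"])
+ ```
+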
+ ## Command Line Options
+
+ | Option | Short | Description | Default |
+ |--------|-------|-------------|---------|
+ | `--input` | `-i` | Input directory with documents | Required |
+ | `--output` | `-o` | Output directory for results | Required |
+ | `--api-key` | `-k` | API key for LLM backend | From env |
+ | `--backend` | `-b` | Backend: gemini, openai, ollama | gemini |
+ | `--model` | | Model name | Auto |
+ | `--config` | `-c` | Config file path | config.yaml |
+ | `--num-qa-pairs` | | Target QA pairs to generate | 100 |
+ | `--max-workers` | | Parallel workers | 4 |
+ | `--preflight` | | Run preflight checks only | - |
+ | `--skip-preflight` | | Skip preflight checks | - |
+ | `--skip-pdf-processing` | | Skip PDF conversion | - |
+ | `--skip-chunking` | | Skip chunking step | - |
+ | `--verbose` | `-v` | Verbose output | - |
+ | `--version` | | Show version | - |
+ | `--help` | `-h` | Show help | - |
+
+ ## Output Format
+
+ ### Generated Files
+
+ ```
+ output/my_dataset/
+ ├── markdown/                # Converted markdown files
+ ├── chunks.json              # Semantic chunks
+ ├── qa_dataset.json          # Raw QA pairs
+ ├── qa_deduplicated.json     # Final deduplicated QA pairs
+ ├── evaluation_report.json   # Quality metrics
+ └── run_config.json          # Run configuration
+ ```
+
+ ### QA Dataset Structure
+
+ ```json
+ {
+   "chunk_id": 1,
+   "question": "What is the company's revenue growth?",
+   "answer": "The company achieved 15% revenue growth...",
+   "context_chunks": [...],
+   "hop_count": 2,
+   "relevance_score": "9",
+   "difficulty_score": "7",
+   "expert_persona": "Financial Analyst",
+   "domain": "Finance"
+ }
+ ```
+
+ <p align="center">
+ <img src="assets/ample question-answer pair generated.png" alt="Sample QA Pair" width="100%">
+ </p>
+
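+ A quick way to sanity-check the generated dataset is to load it and summarize a few fields. The following is an illustrative sketch (not part of the package), assuming `qa_deduplicated.json` is a JSON array of records shaped like the example above:
+
+ ```python
+ import json
+ from collections import Counter
+
+ # Output path from the Quick Start example; adjust to your --output directory.
+ with open("output/my_dataset/qa_deduplicated.json") as f:
+     qa_pairs = json.load(f)
+
+ print("Total QA pairs:", len(qa_pairs))
+ print("Hop counts:", Counter(item["hop_count"] for item in qa_pairs))
+ print("Domains:", Counter(item.get("domain", "unknown") for item in qa_pairs))
+
+ sample = qa_pairs[0]
+ print("Example question:", sample["question"])
+ print("Expert persona:", sample["expert_persona"])
+ ```
+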
+ ## Project Structure
+
+ ```
+ MiRAGE/
+ ├── src/mirage/              # Main package
+ │   ├── core/                # LLM interfaces, prompts, config
+ │   ├── embeddings/          # Embedding models, rerankers
+ │   ├── pipeline/            # PDF processing, QA generation
+ │   ├── evaluation/          # Metrics
+ │   └── utils/               # Utilities
+ ├── data/                    # Your documents
+ │   └── documents/           # Input folder
+ ├── output/                  # Generated results
+ ├── config.yaml.example      # Example configuration
+ ├── run_mirage.py            # Main entry point
+ └── README.md
+ ```
+
+ ## Examples
+
+ ### Generate QA from PDFs
+
+ ```bash
+ # Using Gemini
+ export GEMINI_API_KEY="your-key"
+ python run_mirage.py -i data/pdfs -o output/qa_dataset
+
+ # Using OpenAI
+ export OPENAI_API_KEY="your-key"
+ python run_mirage.py -i data/pdfs -o output/qa_dataset --backend openai
+
+ # Using Ollama (local, free)
+ python run_mirage.py -i data/pdfs -o output/qa_dataset --backend ollama
+ ```
+
+ ### Generate More QA Pairs
+
+ ```bash
+ python run_mirage.py -i data/documents -o output/large_dataset --num-qa-pairs 500
+ ```
+
+ ### Use More Workers
+
+ ```bash
+ python run_mirage.py -i data/documents -o output/fast_run --max-workers 8
+ ```
+
+ ### Skip Already Processed Steps
+
+ ```bash
+ # If you already have markdown files
+ python run_mirage.py -i data/documents -o output/results --skip-pdf-processing
+
+ # If you already have chunks
+ python run_mirage.py -i data/documents -o output/results --skip-chunking
+ ```
+
+ ## Troubleshooting
+
+ ### API Key Issues
+
+ ```bash
+ # Check if API key is set
+ echo $GEMINI_API_KEY
+
+ # Set it if missing
+ export GEMINI_API_KEY="your-key"
+ ```
+
+ ### Import Errors
+
+ ```bash
+ # Reinstall package
+ pip install -e .
+ ```
+
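+ To confirm the package is importable after reinstalling, a quick check from Python (the `mirage` top-level package name comes from the wheel's `top_level.txt`):
+
+ ```python
+ # Verify the installed package resolves to the environment you expect.
+ import mirage
+ print("mirage imported from:", mirage.__file__)
+ ```
+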
+ ### Preflight Check Failures
+
+ ```bash
+ # Run verbose preflight
+ python run_mirage.py --preflight --verbose
+ ```
+
+ ## Contributing
+
+ 1. Fork the repository
+ 2. Create a feature branch
+ 3. Make your changes
+ 4. Submit a pull request
+
+ See [CONTRIBUTING.md](CONTRIBUTING.md) for details.
+
+ ## Citation
+
+ ```bibtex
+ @software{mirage2024,
+   title = {MiRAGE: A Multiagent Framework for Generating Multimodal Multihop Question-Answer Dataset for RAG Evaluation},
+   author = {MiRAGE Authors},
+   year = {2026},
+   url = {https://github.com/ChandanKSahu/MiRAGE}
+ }
+ ```
+
+ ## License
+
+ Apache License 2.0 - see [LICENSE](LICENSE)
+
+ ## Acknowledgments
+
+ - [RAGAS](https://github.com/explodinggradients/ragas) for evaluation metrics
+ - [BERTopic](https://github.com/MaartenGr/BERTopic) for topic modeling
+ - [FAISS](https://github.com/facebookresearch/faiss) for similarity search
+ - [Docling](https://github.com/DS4SD/docling) for PDF processing
+
+
@@ -0,0 +1,30 @@
+ mirage/__init__.py,sha256=wjg2h7W2McIwR2m3mcpfqZ1VfPlLXSJXGQ6YnnjRF9w,2588
+ mirage/cli.py,sha256=MGzZ9rHCa4q5TesEsgMbigt49wC5qGRMMP7iMlzKi58,4824
+ mirage/core/__init__.py,sha256=YQTAWi5AfsHWnKuI_W2_vQ2tzt7ooevkHEqruayAqo8,1484
+ mirage/core/config.py,sha256=hQjdYt-pohPmYPBFidnKUg7p-1y84ljx29fbNY0f-6Y,7235
+ mirage/core/llm.py,sha256=qpPcrM6WWFNMF6Y0WAuPvGlMbd6k7ILRCj1oa3Pm4zY,77587
+ mirage/core/prompts.py,sha256=J4SJ-sjDjYRDfIr9aJSvuz07ecy_Jt6Amza0SsqpZ7g,22953
+ mirage/embeddings/__init__.py,sha256=RlXUthPGdNNXU-09Ms0Wrm7AQifLUP107_6OHz0AXR8,1291
+ mirage/embeddings/models.py,sha256=0x0q2tXfulXqA_lHwYDvhxfQ3LWWLRcv7khb_H2FiJM,21519
+ mirage/embeddings/rerankers_multimodal.py,sha256=Lf-doykXHmMA-Rzem6-tS5DwbukNy-bTx-5WmNLCJ0E,32780
+ mirage/embeddings/rerankers_text.py,sha256=VviQ7TiGYl8xIAMbZeh5olSAeBLjg-cDcIwd-0oWCAc,6406
+ mirage/evaluation/__init__.py,sha256=yL29oL1HLZuXJgrgCHdfXZpvTF-nV5uQN-LUUjPwp8c,1033
+ mirage/evaluation/metrics.py,sha256=odWhLx0pU-vTniy6Yf3khwgmiR8R_phrdhencgy7GHs,98042
+ mirage/evaluation/metrics_optimized.py,sha256=KP2YP8Y5kqRTAa7g7InAjWmm2h-iipirE3bWeWYUavY,88048
+ mirage/pipeline/__init__.py,sha256=StBcwv_doTd639v7wTg4ZCeV-aNv8QvwuFNLDzW4nrU,1984
+ mirage/pipeline/chunker.py,sha256=0eiqqn4x5nxkj8ovFXMFM99AoF5CE6KeVtfJvNyDh3M,21612
+ mirage/pipeline/context.py,sha256=_sNTeNo2Wsq72mg0uHD52dBHfVNCbZFyIjbDfS5ozfE,42772
+ mirage/pipeline/deduplication.py,sha256=5fko2OkfEBQx5lKHYNOrqJP4roETMnBTK7IOEbQ9Prw,19074
+ mirage/pipeline/domain.py,sha256=AsZDnBfOWdmTcelb6j-SfUlrNoQYDAiycqb4l2AE2bw,20817
+ mirage/pipeline/pdf_processor.py,sha256=6gcxPrJl9gujuMOugUMG8KAoSvxBfhBXXmaC0ixAXMw,25358
+ mirage/pipeline/qa_generator.py,sha256=ZKC2LJiZfiNqs6o4IQQkF5-A6S9aKFlbTayKc1amNDI,34490
+ mirage/utils/__init__.py,sha256=h3UTJyyEZWIectZbklgOaA0s73xSIe8fJKwgcDpiodk,1285
+ mirage/utils/ablation.py,sha256=vfUNAfXHhF4_S2Sxpu4kZ9akWcQzWqPahg7FMzZsJm8,12272
+ mirage/utils/preflight.py,sha256=QRmzL-YJzAy0jp5wdYg7zmoFRJ-uZq1PFsDdIUcc-aI,23998
+ mirage/utils/stats.py,sha256=kqrP2BuLy6eZnZRQZqE7julNrrsKEznOGFvFH03kpjw,23115
+ mirage_benchmark-1.0.4.dist-info/licenses/LICENSE,sha256=S5DUh9Vf2wAP1uRJuvpRPF3fCZJbq_O-mbx-R9gOBIY,10763
+ mirage_benchmark-1.0.4.dist-info/METADATA,sha256=94EtjpY6QD2pWU0JFMIwx4ZLJH43yVLhQ4kzr8BonSc,12926
+ mirage_benchmark-1.0.4.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+ mirage_benchmark-1.0.4.dist-info/entry_points.txt,sha256=OvyHIX_38WFVMsNJMqkpdcQXY9-kQgR2173ZRKeNlcM,90
+ mirage_benchmark-1.0.4.dist-info/top_level.txt,sha256=x6Yl54RzCGuLqqWDF4zZ-tEaP2pUKzUqb57hVrbakVI,7
+ mirage_benchmark-1.0.4.dist-info/RECORD,,
@@ -0,0 +1,5 @@
+ Wheel-Version: 1.0
+ Generator: setuptools (80.9.0)
+ Root-Is-Purelib: true
+ Tag: py3-none-any
+
@@ -0,0 +1,3 @@
+ [console_scripts]
+ mirage = mirage.cli:main
+ mirage-preflight = mirage.utils.preflight:main