npcpy 1.3.13.tar.gz → 1.3.14.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (84)
  1. {npcpy-1.3.13/npcpy.egg-info → npcpy-1.3.14}/PKG-INFO +4 -4
  2. {npcpy-1.3.13 → npcpy-1.3.14}/README.md +3 -3
  3. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/ft/diff.py +45 -30
  4. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/ft/rl.py +134 -51
  5. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/serve.py +42 -15
  6. {npcpy-1.3.13 → npcpy-1.3.14/npcpy.egg-info}/PKG-INFO +4 -4
  7. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy.egg-info/SOURCES.txt +1 -0
  8. {npcpy-1.3.13 → npcpy-1.3.14}/setup.py +1 -1
  9. {npcpy-1.3.13 → npcpy-1.3.14}/tests/test_command_history.py +114 -91
  10. npcpy-1.3.14/tests/test_documentation_examples.py +436 -0
  11. npcpy-1.3.14/tests/test_load.py +291 -0
  12. npcpy-1.3.14/tests/test_serve.py +132 -0
  13. npcpy-1.3.14/tests/test_text.py +215 -0
  14. npcpy-1.3.14/tests/test_tools.py +211 -0
  15. npcpy-1.3.13/tests/test_load.py +0 -284
  16. npcpy-1.3.13/tests/test_serve.py +0 -150
  17. npcpy-1.3.13/tests/test_text.py +0 -256
  18. npcpy-1.3.13/tests/test_tools.py +0 -989
  19. {npcpy-1.3.13 → npcpy-1.3.14}/LICENSE +0 -0
  20. {npcpy-1.3.13 → npcpy-1.3.14}/MANIFEST.in +0 -0
  21. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/__init__.py +0 -0
  22. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/build_funcs.py +0 -0
  23. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/data/__init__.py +0 -0
  24. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/data/audio.py +0 -0
  25. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/data/data_models.py +0 -0
  26. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/data/image.py +0 -0
  27. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/data/load.py +0 -0
  28. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/data/text.py +0 -0
  29. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/data/video.py +0 -0
  30. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/data/web.py +0 -0
  31. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/ft/__init__.py +0 -0
  32. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/ft/ge.py +0 -0
  33. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/ft/memory_trainer.py +0 -0
  34. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/ft/model_ensembler.py +0 -0
  35. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/ft/sft.py +0 -0
  36. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/ft/usft.py +0 -0
  37. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/gen/__init__.py +0 -0
  38. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/gen/audio_gen.py +0 -0
  39. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/gen/embeddings.py +0 -0
  40. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/gen/image_gen.py +0 -0
  41. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/gen/ocr.py +0 -0
  42. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/gen/response.py +0 -0
  43. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/gen/video_gen.py +0 -0
  44. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/gen/world_gen.py +0 -0
  45. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/llm_funcs.py +0 -0
  46. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/main.py +0 -0
  47. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/memory/__init__.py +0 -0
  48. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/memory/command_history.py +0 -0
  49. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/memory/kg_vis.py +0 -0
  50. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/memory/knowledge_graph.py +0 -0
  51. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/memory/memory_processor.py +0 -0
  52. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/memory/search.py +0 -0
  53. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/mix/__init__.py +0 -0
  54. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/mix/debate.py +0 -0
  55. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/ml_funcs.py +0 -0
  56. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/npc_array.py +0 -0
  57. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/npc_compiler.py +0 -0
  58. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/npc_sysenv.py +0 -0
  59. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/npcs.py +0 -0
  60. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/sql/__init__.py +0 -0
  61. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/sql/ai_function_tools.py +0 -0
  62. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/sql/database_ai_adapters.py +0 -0
  63. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/sql/database_ai_functions.py +0 -0
  64. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/sql/model_runner.py +0 -0
  65. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/sql/npcsql.py +0 -0
  66. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/sql/sql_model_compiler.py +0 -0
  67. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/tools.py +0 -0
  68. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/work/__init__.py +0 -0
  69. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/work/browser.py +0 -0
  70. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/work/desktop.py +0 -0
  71. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/work/plan.py +0 -0
  72. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy/work/trigger.py +0 -0
  73. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy.egg-info/dependency_links.txt +0 -0
  74. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy.egg-info/requires.txt +0 -0
  75. {npcpy-1.3.13 → npcpy-1.3.14}/npcpy.egg-info/top_level.txt +0 -0
  76. {npcpy-1.3.13 → npcpy-1.3.14}/setup.cfg +0 -0
  77. {npcpy-1.3.13 → npcpy-1.3.14}/tests/test_audio.py +0 -0
  78. {npcpy-1.3.13 → npcpy-1.3.14}/tests/test_image.py +0 -0
  79. {npcpy-1.3.13 → npcpy-1.3.14}/tests/test_llm_funcs.py +0 -0
  80. {npcpy-1.3.13 → npcpy-1.3.14}/tests/test_npc_array.py +0 -0
  81. {npcpy-1.3.13 → npcpy-1.3.14}/tests/test_npc_compiler.py +0 -0
  82. {npcpy-1.3.13 → npcpy-1.3.14}/tests/test_npcsql.py +0 -0
  83. {npcpy-1.3.13 → npcpy-1.3.14}/tests/test_response.py +0 -0
  84. {npcpy-1.3.13 → npcpy-1.3.14}/tests/test_web.py +0 -0
--- npcpy-1.3.13/npcpy.egg-info/PKG-INFO
+++ npcpy-1.3.14/PKG-INFO
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: npcpy
-Version: 1.3.13
+Version: 1.3.14
 Summary: npcpy is the premier open-source library for integrating LLMs and Agents into python systems.
 Home-page: https://github.com/NPC-Worldwide/npcpy
 Author: Christopher Agostino
@@ -305,7 +305,7 @@ ggm = NPC(
 isabel = NPC(
     name='Isabel Allende',
     primary_directive='You are Isabel Allende, weaving stories with emotion and history. Analyze texts and provide insight.',
-    model='llama3.2:8b',
+    model='llama3.2',
     provider='ollama',
 
 )
@@ -359,7 +359,7 @@ LLM responses can be obtained without NPCs as well.
 
 ```python
 from npcpy.llm_funcs import get_llm_response
-response = get_llm_response("Who was the celtic Messenger god?", model='mistral:7b', provider='ollama')
+response = get_llm_response("Who was the celtic Messenger god?", model='qwen3:4b', provider='ollama')
 print(response['response'])
 ```
 
@@ -400,7 +400,7 @@ Return structured outputs by specifying `format='json'` or passing a Pydantic sc
 
 ```python
 from npcpy.llm_funcs import get_llm_response
-response = get_llm_response("What is the sentiment of the american people towards the repeal of Roe v Wade? Return a json object with `sentiment` as the key and a float value from -1 to 1 as the value", model='claude-4-5-haiku-latest', provider='deepseek', format='json')
+response = get_llm_response("What is the sentiment of the american people towards the repeal of Roe v Wade? Return a json object with `sentiment` as the key and a float value from -1 to 1 as the value", model='deepseek-chat', provider='deepseek', format='json')
 
 print(response['response'])
 ```
--- npcpy-1.3.13/README.md
+++ npcpy-1.3.14/README.md
@@ -209,7 +209,7 @@ ggm = NPC(
 isabel = NPC(
     name='Isabel Allende',
     primary_directive='You are Isabel Allende, weaving stories with emotion and history. Analyze texts and provide insight.',
-    model='llama3.2:8b',
+    model='llama3.2',
     provider='ollama',
 
 )
@@ -263,7 +263,7 @@ LLM responses can be obtained without NPCs as well.
 
 ```python
 from npcpy.llm_funcs import get_llm_response
-response = get_llm_response("Who was the celtic Messenger god?", model='mistral:7b', provider='ollama')
+response = get_llm_response("Who was the celtic Messenger god?", model='qwen3:4b', provider='ollama')
 print(response['response'])
 ```
 
@@ -304,7 +304,7 @@ Return structured outputs by specifying `format='json'` or passing a Pydantic sc
 
 ```python
 from npcpy.llm_funcs import get_llm_response
-response = get_llm_response("What is the sentiment of the american people towards the repeal of Roe v Wade? Return a json object with `sentiment` as the key and a float value from -1 to 1 as the value", model='claude-4-5-haiku-latest', provider='deepseek', format='json')
+response = get_llm_response("What is the sentiment of the american people towards the repeal of Roe v Wade? Return a json object with `sentiment` as the key and a float value from -1 to 1 as the value", model='deepseek-chat', provider='deepseek', format='json')
 
 print(response['response'])
 ```
--- npcpy-1.3.13/npcpy/ft/diff.py
+++ npcpy-1.3.14/npcpy/ft/diff.py
@@ -180,52 +180,66 @@ if TORCH_AVAILABLE:
             noise = torch.randn_like(x)
             return sqrt_alpha * x + sqrt_one_minus * noise, noise
 
-        def train(self, dataloader):
+        def train(self, dataloader, progress_callback=None):
             optimizer = torch.optim.AdamW(
-                self.model.parameters(), 
+                self.model.parameters(),
                 lr=self.config.learning_rate
             )
-            
+
             os.makedirs(self.config.output_model_path, exist_ok=True)
             checkpoint_dir = os.path.join(
-                self.config.output_model_path, 
+                self.config.output_model_path,
                 'checkpoints'
             )
             os.makedirs(checkpoint_dir, exist_ok=True)
-            
+
             global_step = 0
-            
+            total_batches = len(dataloader)
+            loss_history = []
+
             for epoch in range(self.config.num_epochs):
                 self.model.train()
                 epoch_loss = 0.0
-                
+
                 pbar = tqdm(dataloader, desc=f'Epoch {epoch+1}')
                 for batch_idx, (images, captions) in enumerate(pbar):
                     images = images.to(self.device)
                     batch_size = images.shape[0]
-                    
+
                     t = torch.randint(
-                        0, 
-                        self.config.timesteps, 
-                        (batch_size,), 
+                        0,
+                        self.config.timesteps,
+                        (batch_size,),
                         device=self.device
                     ).long()
-                    
+
                     noisy_images, noise = self.add_noise(images, t)
-                    
+
                     predicted_noise = self.model(noisy_images, t)
-                    
+
                     loss = F.mse_loss(predicted_noise, noise)
-                    
+
                     optimizer.zero_grad()
                     loss.backward()
                     optimizer.step()
-                    
+
                     epoch_loss += loss.item()
                     global_step += 1
-                    
+
                     pbar.set_postfix({'loss': loss.item()})
-                    
+
+                    # Report progress via callback
+                    if progress_callback:
+                        progress_callback({
+                            'epoch': epoch + 1,
+                            'total_epochs': self.config.num_epochs,
+                            'batch': batch_idx + 1,
+                            'total_batches': total_batches,
+                            'step': global_step,
+                            'loss': loss.item(),
+                            'loss_history': loss_history[-100:],  # Last 100 losses
+                        })
+
                     if global_step % self.config.checkpoint_frequency == 0:
                         ckpt_path = os.path.join(
                             checkpoint_dir,
@@ -238,8 +252,9 @@ if TORCH_AVAILABLE:
                             'optimizer_state_dict': optimizer.state_dict(),
                             'loss': loss.item(),
                         }, ckpt_path)
-                    
+
                 avg_loss = epoch_loss / len(dataloader)
+                loss_history.append(avg_loss)
                 print(f'Epoch {epoch+1} avg loss: {avg_loss:.6f}')
 
             final_path = os.path.join(
@@ -300,35 +315,35 @@ else:
     DiffusionTrainer = None
 
 
-def train_diffusion(image_paths, captions=None, config=None, 
-                    resume_from=None):
+def train_diffusion(image_paths, captions=None, config=None,
+                    resume_from=None, progress_callback=None):
     if not TORCH_AVAILABLE:
         raise ImportError(
             "PyTorch not available. Install: pip install torch torchvision"
         )
-    
+
     if config is None:
         config = DiffusionConfig()
-    
+
     if captions is None:
         captions = [''] * len(image_paths)
-    
+
     dataset = ImageDataset(image_paths, captions, config.image_size)
     dataloader = DataLoader(
-        dataset, 
-        batch_size=config.batch_size, 
+        dataset,
+        batch_size=config.batch_size,
         shuffle=True,
         num_workers=0
     )
-    
+
     trainer = DiffusionTrainer(config)
-    
+
     if resume_from and os.path.exists(resume_from):
         checkpoint = torch.load(resume_from, map_location=trainer.device)
         trainer.model.load_state_dict(checkpoint['model_state_dict'])
         print(f'Resumed from {resume_from}')
-
-    output_path = trainer.train(dataloader)
+
+    output_path = trainer.train(dataloader, progress_callback=progress_callback)
 
     gc.collect()
     if torch.cuda.is_available():
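These hunks give `DiffusionTrainer.train` and `train_diffusion` an optional `progress_callback` that fires once per batch with the keys shown in the dict literal above. A minimal sketch of wiring one up, assuming `DiffusionConfig` and `train_diffusion` are importable from `npcpy.ft.diff` (inferred from the file path) and using placeholder image paths:

```python
# Sketch only: import path inferred from npcpy/ft/diff.py; paths are placeholders.
from npcpy.ft.diff import DiffusionConfig, train_diffusion

def log_progress(p):
    # p carries the keys emitted by the training loop above
    print(f"epoch {p['epoch']}/{p['total_epochs']} "
          f"batch {p['batch']}/{p['total_batches']} "
          f"step {p['step']} loss {p['loss']:.4f}")

model_path = train_diffusion(
    ["img_0.png", "img_1.png"],      # placeholder image paths
    captions=["a cat", "a dog"],
    config=DiffusionConfig(),
    progress_callback=log_progress,  # called once per batch
)
```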
--- npcpy-1.3.13/npcpy/ft/rl.py
+++ npcpy-1.3.14/npcpy/ft/rl.py
@@ -1,4 +1,5 @@
-from dataclasses import dataclass
+from dataclasses import dataclass, field
+from typing import List
 
 from datetime import datetime
 import glob
@@ -12,7 +13,8 @@ try:
     import torch
     from transformers import (
         AutoModelForCausalLM,
-        AutoTokenizer
+        AutoTokenizer,
+        BitsAndBytesConfig
     )
     from trl import DPOTrainer, DPOConfig
 except:
@@ -23,6 +25,7 @@ except:
     torch = None
     AutoModelForCausalLM = None
     AutoTokenizer = None
+    BitsAndBytesConfig = None
 
 
 import random
@@ -44,6 +47,24 @@ class RLConfig:
     beta: float = 0.5
     max_length: int = 512
     max_prompt_length: int = 256
+    # Quantization options
+    use_4bit: bool = False
+    use_8bit: bool = False
+    # Precision options
+    fp16: bool = False
+    bf16: bool = False
+    # LoRA configuration
+    lora_r: int = 8
+    lora_alpha: int = 16
+    lora_dropout: float = 0.1
+    lora_target_modules: List[str] = field(
+        default_factory=lambda: ["q_proj", "k_proj", "v_proj", "o_proj"]
+    )
+    # Training options
+    max_pairs: int = 200
+    warmup_steps: int = 5
+    logging_steps: int = 5
+    save_steps: int = 20
 
 
 class TaskExecutor:
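With these new fields, quantization, precision, LoRA geometry, and logging cadence are all configurable per run. A sketch of a 4-bit setup, assuming `RLConfig` is importable from `npcpy.ft.rl` (inferred from the file path); defaults for fields not shown in this hunk come from the rest of the dataclass:

```python
from npcpy.ft.rl import RLConfig  # import path inferred from npcpy/ft/rl.py

config = RLConfig(
    use_4bit=True,                 # NF4 quantization via bitsandbytes
    lora_r=16,                     # larger adapter than the default r=8
    lora_alpha=32,
    lora_target_modules=["q_proj", "v_proj"],
    max_pairs=100,                 # cap the preference dataset
    logging_steps=10,
)
```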
@@ -207,8 +228,8 @@ def create_preference_pairs(
            f"Warning: Only {len(pairs)} pairs found. "
            "May overfit."
        )
-
-    return Dataset.from_list(pairs[:100])
+
+    return Dataset.from_list(pairs)
 
 
 def train_with_dpo(
@@ -218,84 +239,121 @@
 
     if config is None:
         config = RLConfig()
-    
+
     preference_dataset = create_preference_pairs(
         traces,
         min_reward_gap=config.min_reward_gap
     )
-    
+
     if preference_dataset is None or len(preference_dataset) == 0:
         print("No valid preference pairs. Cannot train.")
         return None
-    
+
+    # Limit pairs if specified
+    if config.max_pairs and len(preference_dataset) > config.max_pairs:
+        preference_dataset = preference_dataset.select(range(config.max_pairs))
+
+    print(f"Training with {len(preference_dataset)} preference pairs")
+
+    # Build model loading kwargs
+    model_kwargs = {
+        "device_map": "auto",
+        "trust_remote_code": True,
+        "low_cpu_mem_usage": True
+    }
+
+    # Handle quantization
+    if config.use_4bit:
+        if BitsAndBytesConfig is None:
+            raise ImportError("bitsandbytes required for 4-bit. pip install bitsandbytes")
+        model_kwargs["quantization_config"] = BitsAndBytesConfig(
+            load_in_4bit=True,
+            bnb_4bit_quant_type="nf4",
+            bnb_4bit_compute_dtype=torch.float16,
+            bnb_4bit_use_double_quant=True
+        )
+        print("Using 4-bit quantization")
+    elif config.use_8bit:
+        if BitsAndBytesConfig is None:
+            raise ImportError("bitsandbytes required for 8-bit. pip install bitsandbytes")
+        model_kwargs["quantization_config"] = BitsAndBytesConfig(
+            load_in_8bit=True
+        )
+        print("Using 8-bit quantization")
+    else:
+        # Set dtype based on precision config
+        if config.bf16:
+            model_kwargs["torch_dtype"] = torch.bfloat16
+        elif config.fp16:
+            model_kwargs["torch_dtype"] = torch.float16
+        else:
+            model_kwargs["torch_dtype"] = torch.float32
+
     model = AutoModelForCausalLM.from_pretrained(
         config.base_model_name,
-        torch_dtype=torch.float32,
-        device_map="auto",
-        low_cpu_mem_usage=True
+        **model_kwargs
     )
-    
+
     tokenizer = AutoTokenizer.from_pretrained(
         config.base_model_name,
         trust_remote_code=True
     )
-    
+
     if tokenizer.pad_token is None:
         tokenizer.pad_token = tokenizer.eos_token
-    
+
     peft_config = LoraConfig(
-        r=8,
-        lora_alpha=16,
-        lora_dropout=0.1,
+        r=config.lora_r,
+        lora_alpha=config.lora_alpha,
+        lora_dropout=config.lora_dropout,
         bias="none",
         task_type="CAUSAL_LM",
-        target_modules=[
-            "q_proj",
-            "k_proj",
-            "v_proj",
-            "o_proj"
-        ]
+        target_modules=config.lora_target_modules
     )
-    
+
+    # Select optimizer based on quantization
+    if config.use_4bit or config.use_8bit:
+        optim = "paged_adamw_8bit"
+    else:
+        optim = "adamw_torch"
+
     training_args = DPOConfig(
         output_dir="./dpo_results",
-        per_device_train_batch_size=(
-            config.per_device_train_batch_size
-        ),
-        gradient_accumulation_steps=(
-            config.gradient_accumulation_steps
-        ),
+        per_device_train_batch_size=config.per_device_train_batch_size,
+        gradient_accumulation_steps=config.gradient_accumulation_steps,
         learning_rate=config.learning_rate,
         num_train_epochs=config.num_train_epochs,
         weight_decay=0.1,
         beta=config.beta,
-        logging_steps=2,
-        save_steps=10,
+        logging_steps=config.logging_steps,
+        save_steps=config.save_steps,
         remove_unused_columns=False,
         max_length=config.max_length,
         max_prompt_length=config.max_prompt_length,
         dataloader_num_workers=0,
-        fp16=False,
-        bf16=False,
-        optim="adamw_torch",
-        warmup_steps=2,
+        fp16=config.fp16 or config.use_4bit,
+        bf16=config.bf16,
+        optim=optim,
+        warmup_steps=config.warmup_steps,
         save_strategy="steps",
-        save_total_limit=3
+        save_total_limit=2
     )
-    
+
     trainer = DPOTrainer(
         model,
         args=training_args,
         train_dataset=preference_dataset,
-        peft_config=peft_config
+        peft_config=peft_config,
+        tokenizer=tokenizer
    )
-    
+
     print("Starting DPO training...")
     trainer.train()
-    
+
+    os.makedirs(config.adapter_path, exist_ok=True)
     trainer.save_model(config.adapter_path)
     print(f"Adapter saved to {config.adapter_path}")
-    
+
     return config.adapter_path
 
 
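Taken together, the new path in `train_with_dpo` is: cap the pairs at `config.max_pairs`, load the base model with the quantization kwargs, build the LoRA config from the `RLConfig` fields, and switch to `paged_adamw_8bit` when quantized. A usage sketch, assuming the first positional argument is the list of reward-scored traces as the function body suggests:

```python
from npcpy.ft.rl import RLConfig, train_with_dpo

# traces: reward-scored rollouts collected earlier; their schema is defined by
# create_preference_pairs elsewhere in rl.py, not by this sketch.
adapter_path = train_with_dpo(
    traces,
    config=RLConfig(use_4bit=True, max_pairs=200),
)
print(adapter_path)  # directory the LoRA adapter was saved to
```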
@@ -333,28 +391,53 @@ def run_rl_training(
 
 def load_rl_model(
     base_model_id: str,
-    adapter_path: str
+    adapter_path: str,
+    use_4bit: bool = False,
+    use_8bit: bool = False,
+    merge_adapter: bool = True
 ):
-
     print(f"Loading base model: {base_model_id}")
+
+    model_kwargs = {
+        "device_map": "auto",
+        "trust_remote_code": True
+    }
+
+    if use_4bit:
+        if BitsAndBytesConfig is None:
+            raise ImportError("bitsandbytes required for 4-bit")
+        model_kwargs["quantization_config"] = BitsAndBytesConfig(
+            load_in_4bit=True,
+            bnb_4bit_quant_type="nf4",
+            bnb_4bit_compute_dtype=torch.float16,
+            bnb_4bit_use_double_quant=True
+        )
+    elif use_8bit:
+        if BitsAndBytesConfig is None:
+            raise ImportError("bitsandbytes required for 8-bit")
+        model_kwargs["quantization_config"] = BitsAndBytesConfig(
+            load_in_8bit=True
+        )
+    else:
+        model_kwargs["torch_dtype"] = torch.float16
+
     model = AutoModelForCausalLM.from_pretrained(
         base_model_id,
-        torch_dtype=torch.float32,
-        device_map="auto",
-        attn_implementation='eager'
+        **model_kwargs
     )
-    
+
     tokenizer = AutoTokenizer.from_pretrained(
         base_model_id,
         trust_remote_code=True
     )
-    
+
     if tokenizer.pad_token is None:
         tokenizer.pad_token = tokenizer.eos_token
-    
+
     if adapter_path and os.path.exists(adapter_path):
         print(f"Loading adapter: {adapter_path}")
         model = PeftModel.from_pretrained(model, adapter_path)
-        model = model.merge_and_unload()
-
+        if merge_adapter and not (use_4bit or use_8bit):
+            model = model.merge_and_unload()
+
     return model, tokenizer
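`load_rl_model` now mirrors the training-side quantization options and only merges the adapter into the base weights when the model is unquantized; for 4-/8-bit loads the adapter stays separate, per the guard above. A loading sketch with placeholder model and adapter identifiers:

```python
from npcpy.ft.rl import load_rl_model  # import path inferred from npcpy/ft/rl.py

model, tokenizer = load_rl_model(
    "Qwen/Qwen2.5-0.5B-Instruct",  # placeholder base model id
    "./dpo_adapter",               # placeholder adapter directory
    use_4bit=True,
    merge_adapter=True,            # no-op here: merging is skipped when quantized
)
```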
--- npcpy-1.3.13/npcpy/serve.py
+++ npcpy-1.3.14/npcpy/serve.py
@@ -51,6 +51,7 @@ from npcpy.memory.command_history import setup_chroma_db
 from npcpy.memory.search import execute_rag_command, execute_brainblast_command
 from npcpy.data.load import load_file_contents
 from npcpy.data.web import search_web
+from npcpy.data.image import capture_screenshot
 
 
 import base64
@@ -1008,7 +1009,7 @@ def get_attachment(attachment_id):
 @app.route("/api/capture_screenshot", methods=["GET"])
 def capture():
 
-    screenshot = capture_screenshot(None, full=True)
+    screenshot = capture_screenshot(full=True)
 
 
     if not screenshot:
@@ -1895,10 +1896,26 @@ def finetune_diffusers():
         'output_dir': output_dir,
         'epochs': num_epochs,
         'current_epoch': 0,
+        'current_batch': 0,
+        'total_batches': 0,
+        'current_loss': None,
+        'loss_history': [],
+        'step': 0,
         'start_time': datetime.datetime.now().isoformat()
     }
     print(f"🌋 Finetuning job {job_id} initialized. Output directory: {output_dir}")
-    
+
+    def progress_callback(progress_data):
+        """Callback to update job progress from training loop."""
+        finetune_jobs[job_id]['current_epoch'] = progress_data.get('epoch', 0)
+        finetune_jobs[job_id]['epochs'] = progress_data.get('total_epochs', num_epochs)
+        finetune_jobs[job_id]['current_batch'] = progress_data.get('batch', 0)
+        finetune_jobs[job_id]['total_batches'] = progress_data.get('total_batches', 0)
+        finetune_jobs[job_id]['step'] = progress_data.get('step', 0)
+        finetune_jobs[job_id]['current_loss'] = progress_data.get('loss')
+        if progress_data.get('loss_history'):
+            finetune_jobs[job_id]['loss_history'] = progress_data['loss_history']
+
     def run_training_async():
         print(f"🌋 Finetuning job {job_id}: Starting asynchronous training thread...")
         try:
@@ -1908,16 +1925,15 @@
                 learning_rate=learning_rate,
                 output_model_path=output_dir
             )
-            
+
             print(f"🌋 Finetuning job {job_id}: Calling train_diffusion with config: {config}")
-            # Assuming train_diffusion might print its own progress or allow callbacks
-            # For more granular logging, you'd need to modify train_diffusion itself
             model_path = train_diffusion(
                 expanded_images,
                 captions,
-                config=config
+                config=config,
+                progress_callback=progress_callback
             )
-            
+
             finetune_jobs[job_id]['status'] = 'complete'
             finetune_jobs[job_id]['model_path'] = model_path
             finetune_jobs[job_id]['end_time'] = datetime.datetime.now().isoformat()
@@ -1947,21 +1963,32 @@
 def finetune_status(job_id):
     if job_id not in finetune_jobs:
         return jsonify({'error': 'Job not found'}), 404
-    
+
     job = finetune_jobs[job_id]
-    
+
     if job['status'] == 'complete':
         return jsonify({
+            'status': 'complete',
             'complete': True,
-            'outputPath': job.get('model_path', job['output_dir'])
+            'outputPath': job.get('model_path', job['output_dir']),
+            'loss_history': job.get('loss_history', [])
         })
     elif job['status'] == 'error':
-        return jsonify({'error': job.get('error_msg', 'Unknown error')})
-    
+        return jsonify({
+            'status': 'error',
+            'error': job.get('error_msg', 'Unknown error')
+        })
+
     return jsonify({
-        'step': job.get('current_epoch', 0),
-        'total': job['epochs'],
-        'status': 'running'
+        'status': 'running',
+        'epoch': job.get('current_epoch', 0),
+        'total_epochs': job.get('epochs', 0),
+        'batch': job.get('current_batch', 0),
+        'total_batches': job.get('total_batches', 0),
+        'step': job.get('step', 0),
+        'loss': job.get('current_loss'),
+        'loss_history': job.get('loss_history', []),
+        'start_time': job.get('start_time')
     })
 
 @app.route("/api/ml/train", methods=["POST"])
--- npcpy-1.3.13/PKG-INFO
+++ npcpy-1.3.14/npcpy.egg-info/PKG-INFO
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: npcpy
-Version: 1.3.13
+Version: 1.3.14
 Summary: npcpy is the premier open-source library for integrating LLMs and Agents into python systems.
 Home-page: https://github.com/NPC-Worldwide/npcpy
 Author: Christopher Agostino
@@ -305,7 +305,7 @@ ggm = NPC(
 isabel = NPC(
     name='Isabel Allende',
     primary_directive='You are Isabel Allende, weaving stories with emotion and history. Analyze texts and provide insight.',
-    model='llama3.2:8b',
+    model='llama3.2',
     provider='ollama',
 
 )
@@ -359,7 +359,7 @@ LLM responses can be obtained without NPCs as well.
 
 ```python
 from npcpy.llm_funcs import get_llm_response
-response = get_llm_response("Who was the celtic Messenger god?", model='mistral:7b', provider='ollama')
+response = get_llm_response("Who was the celtic Messenger god?", model='qwen3:4b', provider='ollama')
 print(response['response'])
 ```
 
@@ -400,7 +400,7 @@ Return structured outputs by specifying `format='json'` or passing a Pydantic sc
 
 ```python
 from npcpy.llm_funcs import get_llm_response
-response = get_llm_response("What is the sentiment of the american people towards the repeal of Roe v Wade? Return a json object with `sentiment` as the key and a float value from -1 to 1 as the value", model='claude-4-5-haiku-latest', provider='deepseek', format='json')
+response = get_llm_response("What is the sentiment of the american people towards the repeal of Roe v Wade? Return a json object with `sentiment` as the key and a float value from -1 to 1 as the value", model='deepseek-chat', provider='deepseek', format='json')
 
 print(response['response'])
 ```
--- npcpy-1.3.13/npcpy.egg-info/SOURCES.txt
+++ npcpy-1.3.14/npcpy.egg-info/SOURCES.txt
@@ -64,6 +64,7 @@ npcpy/work/plan.py
 npcpy/work/trigger.py
 tests/test_audio.py
 tests/test_command_history.py
+tests/test_documentation_examples.py
 tests/test_image.py
 tests/test_llm_funcs.py
 tests/test_load.py
--- npcpy-1.3.13/setup.py
+++ npcpy-1.3.14/setup.py
@@ -83,7 +83,7 @@ extra_files = package_files("npcpy/npc_team/")
 
 setup(
     name="npcpy",
-    version="1.3.13",
+    version="1.3.14",
     packages=find_packages(exclude=["tests*"]),
     install_requires=base_requirements,
     extras_require={
  extras_require={