computer-use-ootb-internal 0.0.104__py3-none-any.whl → 0.0.106__py3-none-any.whl

This diff compares two publicly available versions of the package as released to a supported registry. It is provided for informational purposes only and reflects the changes between the package versions exactly as they appear in the public registry.
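
For context, a comparison like the one below can be regenerated locally by downloading both wheels and diffing their contents. The sketch below is illustrative only and assumes the package and both releases are hosted on PyPI; it is not the tool that produced this page.

import difflib
import io
import json
import urllib.request
import zipfile

def fetch_wheel(package: str, version: str) -> zipfile.ZipFile:
    """Download the wheel for a given release from PyPI and open it in memory."""
    meta_url = f"https://pypi.org/pypi/{package}/{version}/json"
    with urllib.request.urlopen(meta_url) as resp:
        meta = json.load(resp)
    # Pick the wheel (bdist_wheel) artifact attached to this release.
    wheel_url = next(f["url"] for f in meta["urls"] if f["packagetype"] == "bdist_wheel")
    with urllib.request.urlopen(wheel_url) as resp:
        return zipfile.ZipFile(io.BytesIO(resp.read()))

def wheel_diff(old: zipfile.ZipFile, new: zipfile.ZipFile, member: str) -> str:
    """Unified diff of a single file that exists in both wheels."""
    old_lines = old.read(member).decode("utf-8", "replace").splitlines(keepends=True)
    new_lines = new.read(member).decode("utf-8", "replace").splitlines(keepends=True)
    return "".join(difflib.unified_diff(old_lines, new_lines, f"a/{member}", f"b/{member}"))

if __name__ == "__main__":
    pkg = "computer-use-ootb-internal"
    old_whl = fetch_wheel(pkg, "0.0.104")
    new_whl = fetch_wheel(pkg, "0.0.106")
    # Diff every Python module present in both wheels; print only files that changed.
    for member in sorted(set(old_whl.namelist()) & set(new_whl.namelist())):
        if member.endswith(".py"):
            delta = wheel_diff(old_whl, new_whl, member)
            if delta:
                print(delta)
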
@@ -1,521 +1,491 @@
1
- import argparse
2
- import time
3
- import json
4
- from datetime import datetime
5
- import threading
6
- import requests
7
- import platform # Add platform import
8
- import subprocess # Add subprocess import
9
- import pyautogui # Add pyautogui import
10
- import webbrowser # Add webbrowser import
11
- import os # Import os for path joining
12
- from fastapi import FastAPI, Request
13
- from fastapi.responses import JSONResponse
14
- from fastapi.middleware.cors import CORSMiddleware
15
- from screeninfo import get_monitors
16
- from computer_use_ootb_internal.computer_use_demo.tools.computer import get_screen_details
17
- from computer_use_ootb_internal.run_teachmode_ootb_args import simple_teachmode_sampling_loop
18
-
19
- app = FastAPI()
20
-
21
- # Add CORS middleware to allow requests from the frontend
22
- app.add_middleware(
23
- CORSMiddleware,
24
- allow_origins=["*"],
25
- allow_credentials=True,
26
- allow_methods=["*"],
27
- allow_headers=["*"],
28
- )
29
-
30
- # Rate limiter for API endpoints
31
- class RateLimiter:
32
- def __init__(self, interval_seconds=2):
33
- self.interval = interval_seconds
34
- self.last_request_time = {}
35
- self.lock = threading.Lock()
36
-
37
- def allow_request(self, endpoint):
38
- with self.lock:
39
- current_time = time.time()
40
- # Priority endpoints always allowed
41
- if endpoint in ["/update_params", "/update_message"]:
42
- return True
43
-
44
- # For other endpoints, apply rate limiting
45
- if endpoint not in self.last_request_time:
46
- self.last_request_time[endpoint] = current_time
47
- return True
48
-
49
- elapsed = current_time - self.last_request_time[endpoint]
50
- if elapsed < self.interval:
51
- return False
52
-
53
- self.last_request_time[endpoint] = current_time
54
- return True
55
-
56
-
57
- def log_ootb_request(server_url, ootb_request_type, data):
58
- logging_data = {
59
- "type": ootb_request_type,
60
- "data": data,
61
- "timestamp": datetime.now().strftime("%Y-%m-%d %H:%M:%S")
62
- }
63
- if not server_url.endswith("/update_ootb_logging"):
64
- server_logging_url = server_url + "/update_ootb_logging"
65
- else:
66
- server_logging_url = server_url
67
- requests.post(server_logging_url, json=logging_data)
68
-
69
-
70
- class SharedState:
71
- def __init__(self, args):
72
- self.args = args
73
- self.task_updated = False
74
- self.chatbot_messages = []
75
- # Store all state-related data here
76
- self.model = args.model
77
- self.task = getattr(args, 'task', "")
78
- self.selected_screen = args.selected_screen
79
- self.user_id = args.user_id
80
- self.trace_id = args.trace_id
81
- self.api_keys = args.api_keys
82
- self.server_url = args.server_url
83
- self.message_queue = []
84
- self.is_processing = False
85
- self.should_stop = False
86
- self.is_paused = False
87
- # Add a new event to better control stopping
88
- self.stop_event = threading.Event()
89
- # Add a reference to the processing thread
90
- self.processing_thread = None
91
-
92
- shared_state = None
93
- rate_limiter = RateLimiter(interval_seconds=2)
94
-
95
- # Add the new prepare_environment function here
96
- def prepare_environment(state):
97
- """Prepares the environment before starting the main processing loop, e.g., opening specific apps."""
98
- if platform.system() == "Windows":
99
- # Assuming Star Rail mode is indicated by user_id containing "star_rail"
100
- # You might need to adjust this condition based on the actual logic in run_teachmode_args
101
- is_star_rail = "star_rail" in state.user_id.lower() or \
102
- "star_rail" in state.trace_id.lower() or \
103
- "hero_case" in state.trace_id.lower()
104
-
105
- if is_star_rail:
106
- print("Star Rail mode detected on Windows. Opening Edge browser...")
107
- url = "https://sr.mihoyo.com/cloud/#/"
108
- browser_opened = False
109
- try:
110
- print(f"Attempting to open {url} using specific Edge paths...")
111
- # Common paths for msedge.exe
112
- edge_paths = [
113
- os.path.join(os.environ.get("ProgramFiles(x86)", "C:\Program Files (x86)"), "Microsoft\Edge\Application\msedge.exe"),
114
- os.path.join(os.environ.get("ProgramFiles", "C:\Program Files"), "Microsoft\Edge\Application\msedge.exe")
115
- ]
116
-
117
- opened_with_subprocess = False
118
- for edge_path in edge_paths:
119
- if os.path.exists(edge_path):
120
- try:
121
- print(f"Trying path: {edge_path}")
122
- subprocess.Popen([edge_path, url])
123
- print(f"Successfully launched Edge with Popen using path: {edge_path}")
124
- opened_with_subprocess = True
125
- browser_opened = True
126
- break # Exit loop once successfully opened
127
- except Exception as sub_e:
128
- print(f"Failed to launch Edge with Popen using {edge_path}: {sub_e}")
129
- else:
130
- print(f"Edge path not found: {edge_path}")
131
-
132
- # Fallback to webbrowser.open if subprocess failed
133
- if not opened_with_subprocess:
134
- print("Subprocess launch failed, falling back to webbrowser.open()...")
135
- try:
136
- if webbrowser.open(url):
137
- print("Successfully opened browser using webbrowser.open() as fallback.")
138
- browser_opened = True
139
- else:
140
- print("webbrowser.open() also failed to indicate success.")
141
- except Exception as web_e:
142
- print(f"webbrowser.open() fallback failed: {web_e}")
143
-
144
- if not browser_opened:
145
- print("ERROR: Failed to open browser using both subprocess and webbrowser.")
146
- # Decide if you want to proceed without the browser or raise an error
147
- # For now, we'll proceed to the click attempt but it might fail
148
-
149
- # Add pyautogui click after attempting to open the browser
150
- print("Proceeding with pyautogui actions...")
151
- time.sleep(5) # Wait time for the browser to load
152
-
153
- # Print detected screen size
154
- screen_width, screen_height = pyautogui.size()
155
- print(f"Detected screen size: {screen_width}x{screen_height}")
156
-
157
- click_x = int(screen_width * (1036 / 1280))
158
- click_y = int(screen_height * (500 / 720))
159
- print(f"Calculated click coordinates: ({click_x}, {click_y})")
160
-
161
- # Disable failsafe before clicking
162
- pyautogui.FAILSAFE = False
163
- print("PyAutoGUI failsafe temporarily disabled.")
164
-
165
- print(f"Clicking at coordinates: ({click_x}, {click_y})")
166
- pyautogui.click(click_x, click_y)
167
- time.sleep(2)
168
- pyautogui.click(click_x, click_y)
169
-
170
- # Re-enable failsafe (optional, as script might end anyway)
171
- # pyautogui.FAILSAFE = True
172
- # print("PyAutoGUI failsafe re-enabled.")
173
-
174
- except FileNotFoundError:
175
- # This specific error might occur if edge_path exists but execution fails
176
- print("Error: Could not execute the browser command (FileNotFound). Check permissions or path.")
177
- except Exception as e:
178
- print(f"Error during environment preparation (browser/click): {e}")
179
- finally:
180
- # Ensure failsafe is re-enabled if an error occurs after disabling it
181
- pyautogui.FAILSAFE = True
182
- print("PyAutoGUI failsafe re-enabled.")
183
- else:
184
- # Placeholder for potential preparations on other OS or non-Star Rail modes
185
- print("Environment preparation: No specific actions required for this OS/mode.")
186
-
187
-
188
- @app.post("/update_params")
189
- async def update_parameters(request: Request):
190
- data = await request.json()
191
-
192
- if 'task' not in data:
193
- return JSONResponse(
194
- content={"status": "error", "message": "Missing required field: task"},
195
- status_code=400
196
- )
197
-
198
- shared_state.args = argparse.Namespace(**data)
199
- shared_state.task_updated = True
200
-
201
- # Update shared state when parameters change
202
- shared_state.model = getattr(shared_state.args, 'model', "teach-mode-gpt-4o")
203
- shared_state.task = getattr(shared_state.args, 'task', "Create a claim on the SAP system, using Receipt.pdf as attachment.")
204
- shared_state.selected_screen = getattr(shared_state.args, 'selected_screen', 0)
205
- shared_state.user_id = getattr(shared_state.args, 'user_id', "hero_cases")
206
- shared_state.trace_id = getattr(shared_state.args, 'trace_id', "build_scroll_combat")
207
- shared_state.api_keys = getattr(shared_state.args, 'api_keys', "sk-proj-1234567890")
208
- shared_state.server_url = getattr(shared_state.args, 'server_url', "http://ec2-44-234-43-86.us-west-2.compute.amazonaws.com")
209
-
210
- log_ootb_request(shared_state.server_url, "update_params", data)
211
-
212
- # Call the preparation function here, after parameters are updated
213
- prepare_environment(shared_state)
214
-
215
- return JSONResponse(
216
- content={"status": "success", "message": "Parameters updated", "new_args": vars(shared_state.args)},
217
- status_code=200
218
- )
219
-
220
- @app.post("/update_message")
221
- async def update_message(request: Request):
222
- data = await request.json()
223
-
224
- if 'message' not in data:
225
- return JSONResponse(
226
- content={"status": "error", "message": "Missing required field: message"},
227
- status_code=400
228
- )
229
-
230
- log_ootb_request(shared_state.server_url, "update_message", data)
231
-
232
- message = data['message']
233
- shared_state.chatbot_messages.append({"role": "user", "content": message})
234
- shared_state.task = message
235
- shared_state.args.task = message
236
-
237
- # Reset stop event before starting
238
- shared_state.stop_event.clear()
239
-
240
- # Start processing if not already running
241
- if not shared_state.is_processing:
242
- # Create and store the thread
243
- shared_state.processing_thread = threading.Thread(target=process_input, daemon=True)
244
- shared_state.processing_thread.start()
245
-
246
- return JSONResponse(
247
- content={"status": "success", "message": "Message received", "task": shared_state.task},
248
- status_code=200
249
- )
250
-
251
- @app.get("/get_messages")
252
- async def get_messages(request: Request):
253
- # Apply rate limiting
254
- if not rate_limiter.allow_request(request.url.path):
255
- return JSONResponse(
256
- content={"status": "error", "message": "Rate limit exceeded. Try again after 2 seconds."},
257
- status_code=429
258
- )
259
-
260
- log_ootb_request(shared_state.server_url, "get_messages", {})
261
-
262
- # Return all messages in the queue and clear it
263
- messages = shared_state.message_queue.copy()
264
- shared_state.message_queue = []
265
-
266
- return JSONResponse(
267
- content={"status": "success", "messages": messages},
268
- status_code=200
269
- )
270
-
271
- @app.get("/get_screens")
272
- async def get_screens(request: Request):
273
- # Apply rate limiting
274
- if not rate_limiter.allow_request(request.url.path):
275
- return JSONResponse(
276
- content={"status": "error", "message": "Rate limit exceeded. Try again after 2 seconds."},
277
- status_code=429
278
- )
279
-
280
- log_ootb_request(shared_state.server_url, "get_screens", {})
281
-
282
- screen_options, primary_index = get_screen_details()
283
-
284
- return JSONResponse(
285
- content={"status": "success", "screens": screen_options, "primary_index": primary_index},
286
- status_code=200
287
- )
288
-
289
- @app.post("/stop_processing")
290
- async def stop_processing(request: Request):
291
- # Apply rate limiting
292
- if not rate_limiter.allow_request(request.url.path):
293
- return JSONResponse(
294
- content={"status": "error", "message": "Rate limit exceeded. Try again after 2 seconds."},
295
- status_code=429
296
- )
297
-
298
- log_ootb_request(shared_state.server_url, "stop_processing", {})
299
-
300
- if shared_state.is_processing:
301
- # Set both flags to ensure stopping the current task
302
- shared_state.should_stop = True
303
- shared_state.stop_event.set()
304
-
305
- # Send an immediate message to the queue to inform the user
306
- stop_initiated_msg = {"role": "assistant", "content": f"Stopping task '{shared_state.task}'..."}
307
- shared_state.message_queue.append(stop_initiated_msg)
308
-
309
- return JSONResponse(
310
- content={"status": "success", "message": "Task is being stopped, server will remain available for new tasks"},
311
- status_code=200
312
- )
313
- else:
314
- return JSONResponse(
315
- content={"status": "error", "message": "No active processing to stop"},
316
- status_code=400
317
- )
318
-
319
- @app.post("/toggle_pause")
320
- async def toggle_pause(request: Request):
321
- # Apply rate limiting
322
- if not rate_limiter.allow_request(request.url.path):
323
- return JSONResponse(
324
- content={"status": "error", "message": "Rate limit exceeded. Try again after 2 seconds."},
325
- status_code=429
326
- )
327
-
328
- log_ootb_request(shared_state.server_url, "toggle_pause", {})
329
-
330
- if not shared_state.is_processing:
331
- return JSONResponse(
332
- content={"status": "error", "message": "No active processing to pause/resume"},
333
- status_code=400
334
- )
335
-
336
- # Toggle the pause state
337
- shared_state.is_paused = not shared_state.is_paused
338
- current_state = shared_state.is_paused
339
-
340
- print(f"Toggled pause state to: {current_state}")
341
-
342
- status_message = "paused" if current_state else "resumed"
343
-
344
- # Add a message to the queue to inform the user
345
- if current_state:
346
- message = {"role": "assistant", "content": f"Task '{shared_state.task}' has been paused. Click Continue to resume."}
347
- else:
348
- message = {"role": "assistant", "content": f"Task '{shared_state.task}' has been resumed."}
349
-
350
- shared_state.chatbot_messages.append(message)
351
- shared_state.message_queue.append(message)
352
-
353
- return JSONResponse(
354
- content={
355
- "status": "success",
356
- "message": f"Processing {status_message}",
357
- "is_paused": current_state
358
- },
359
- status_code=200
360
- )
361
-
362
- @app.get("/status")
363
- async def get_status(request: Request):
364
- # Apply rate limiting
365
- if not rate_limiter.allow_request(request.url.path):
366
- return JSONResponse(
367
- content={"status": "error", "message": "Rate limit exceeded. Try again after 2 seconds."},
368
- status_code=429
369
- )
370
-
371
- log_ootb_request(shared_state.server_url, "get_status", {})
372
-
373
- print(f"Status check - Processing: {shared_state.is_processing}, Paused: {shared_state.is_paused}")
374
- return JSONResponse(
375
- content={
376
- "status": "success",
377
- "is_processing": shared_state.is_processing,
378
- "is_paused": shared_state.is_paused
379
- },
380
- status_code=200
381
- )
382
-
383
- def process_input():
384
- shared_state.is_processing = True
385
- shared_state.should_stop = False
386
- shared_state.is_paused = False
387
- shared_state.stop_event.clear() # Ensure stop event is cleared at the start
388
-
389
- print(f"start sampling loop: {shared_state.chatbot_messages}")
390
- print(f"shared_state.args before sampling loop: {shared_state.args}")
391
-
392
-
393
- try:
394
- # Get the generator for the sampling loop
395
- sampling_loop = simple_teachmode_sampling_loop(
396
- model=shared_state.model,
397
- task=shared_state.task,
398
- selected_screen=shared_state.selected_screen,
399
- user_id=shared_state.user_id,
400
- trace_id=shared_state.trace_id,
401
- api_keys=shared_state.api_keys,
402
- server_url=shared_state.server_url,
403
- )
404
-
405
- # Process messages from the sampling loop
406
- for loop_msg in sampling_loop:
407
- # Check stop condition more frequently
408
- if shared_state.should_stop or shared_state.stop_event.is_set():
409
- print("Processing stopped by user")
410
- break
411
-
412
- # Check if paused and wait while paused
413
- while shared_state.is_paused and not shared_state.should_stop and not shared_state.stop_event.is_set():
414
- print(f"Processing paused at: {time.strftime('%H:%M:%S')}")
415
- # Wait a short time and check stop condition regularly
416
- for _ in range(5): # Check 5 times per second
417
- if shared_state.should_stop or shared_state.stop_event.is_set():
418
- break
419
- time.sleep(0.2)
420
-
421
- # Check again after pause loop
422
- if shared_state.should_stop or shared_state.stop_event.is_set():
423
- print("Processing stopped while paused or resuming")
424
- break
425
-
426
- # Process the message
427
- if loop_msg.startswith('<img'):
428
- message = {"role": "user", "content": loop_msg}
429
- else:
430
- message = {"role": "assistant", "content": loop_msg}
431
-
432
- shared_state.chatbot_messages.append(message)
433
- shared_state.message_queue.append(message)
434
-
435
- # Short sleep to allow stop signals to be processed
436
- for _ in range(5): # Check 5 times per second
437
- if shared_state.should_stop or shared_state.stop_event.is_set():
438
- print("Processing stopped during sleep")
439
- break
440
- time.sleep(0.1)
441
-
442
- if shared_state.should_stop or shared_state.stop_event.is_set():
443
- break
444
-
445
- except Exception as e:
446
- # Handle any exceptions in the processing loop
447
- error_msg = f"Error during task processing: {str(e)}"
448
- print(error_msg)
449
- error_message = {"role": "assistant", "content": error_msg}
450
- shared_state.message_queue.append(error_message)
451
-
452
- finally:
453
- # Handle completion or interruption
454
- if shared_state.should_stop or shared_state.stop_event.is_set():
455
- stop_msg = f"Task '{shared_state.task}' was stopped. Ready for new tasks."
456
- final_message = {"role": "assistant", "content": stop_msg}
457
- else:
458
- complete_msg = f"Task '{shared_state.task}' completed. Thanks for using Teachmode-OOTB."
459
- final_message = {"role": "assistant", "content": complete_msg}
460
-
461
- shared_state.chatbot_messages.append(final_message)
462
- shared_state.message_queue.append(final_message)
463
-
464
- # Reset all state flags to allow for new tasks
465
- shared_state.is_processing = False
466
- shared_state.should_stop = False
467
- shared_state.is_paused = False
468
- shared_state.stop_event.clear()
469
- print("Processing completed, ready for new tasks")
470
-
471
- def main():
472
- global app, shared_state, rate_limiter
473
-
474
- parser = argparse.ArgumentParser(
475
- description="Run a synchronous sampling loop for assistant/tool interactions in teach-mode."
476
- )
477
- parser.add_argument("--model", default="teach-mode-gpt-4o")
478
- parser.add_argument("--task", default="Create a claim on the SAP system, using Receipt.pdf as attachment.")
479
- parser.add_argument("--selected_screen", type=int, default=0)
480
- parser.add_argument("--user_id", default="star_rail_dev")
481
- parser.add_argument("--trace_id", default="scroll")
482
- parser.add_argument("--api_key_file", default="api_key.json")
483
- parser.add_argument("--api_keys", default="")
484
- parser.add_argument(
485
- "--server_url",
486
- default="http://ec2-44-234-43-86.us-west-2.compute.amazonaws.com",
487
- help="Server URL for the session"
488
- )
489
-
490
- args = parser.parse_args()
491
- shared_state = SharedState(args)
492
- rate_limiter = RateLimiter(interval_seconds=2)
493
-
494
- import uvicorn
495
- import platform
496
- import os
497
-
498
- # Default port
499
- port = 7888
500
-
501
- # Determine port based on Windows username
502
- if platform.system() == "Windows":
503
- username = os.environ["USERNAME"].lower()
504
- if username == "altair":
505
- port = 14000
506
- elif username.startswith("guest") and username[5:].isdigit():
507
- num = int(username[5:])
508
- if 1 <= num <= 10:
509
- port = 14000 + num
510
- else:
511
- port = 7888
512
- else:
513
- port = 7888
514
-
515
- uvicorn.run(app, host="0.0.0.0", port=port)
516
-
517
- if __name__ == "__main__":
518
- # main()
519
-
520
- # Test log_ootb_request
1
+ import argparse
2
+ import time
3
+ import json
4
+ from datetime import datetime
5
+ import threading
6
+ import requests
7
+ import platform # Add platform import
8
+ import subprocess # Add subprocess import
9
+ import pyautogui # Add pyautogui import
10
+ import webbrowser # Add webbrowser import
11
+ import os # Import os for path joining
12
+ from fastapi import FastAPI, Request
13
+ from fastapi.responses import JSONResponse
14
+ from fastapi.middleware.cors import CORSMiddleware
15
+ from screeninfo import get_monitors
16
+ from computer_use_ootb_internal.computer_use_demo.tools.computer import get_screen_details
17
+ from computer_use_ootb_internal.run_teachmode_ootb_args import simple_teachmode_sampling_loop
18
+
19
+ app = FastAPI()
20
+
21
+ # Add CORS middleware to allow requests from the frontend
22
+ app.add_middleware(
23
+ CORSMiddleware,
24
+ allow_origins=["*"],
25
+ allow_credentials=True,
26
+ allow_methods=["*"],
27
+ allow_headers=["*"],
28
+ )
29
+
30
+ # Rate limiter for API endpoints
31
+ class RateLimiter:
32
+ def __init__(self, interval_seconds=2):
33
+ self.interval = interval_seconds
34
+ self.last_request_time = {}
35
+ self.lock = threading.Lock()
36
+
37
+ def allow_request(self, endpoint):
38
+ with self.lock:
39
+ current_time = time.time()
40
+ # Priority endpoints always allowed
41
+ if endpoint in ["/update_params", "/update_message"]:
42
+ return True
43
+
44
+ # For other endpoints, apply rate limiting
45
+ if endpoint not in self.last_request_time:
46
+ self.last_request_time[endpoint] = current_time
47
+ return True
48
+
49
+ elapsed = current_time - self.last_request_time[endpoint]
50
+ if elapsed < self.interval:
51
+ return False
52
+
53
+ self.last_request_time[endpoint] = current_time
54
+ return True
55
+
56
+
57
+ def log_ootb_request(server_url, ootb_request_type, data):
58
+ logging_data = {
59
+ "type": ootb_request_type,
60
+ "data": data,
61
+ "timestamp": datetime.now().strftime("%Y-%m-%d %H:%M:%S")
62
+ }
63
+ if not server_url.endswith("/update_ootb_logging"):
64
+ server_logging_url = server_url + "/update_ootb_logging"
65
+ else:
66
+ server_logging_url = server_url
67
+ requests.post(server_logging_url, json=logging_data)
68
+
69
+
70
+ class SharedState:
71
+ def __init__(self, args):
72
+ self.args = args
73
+ self.task_updated = False
74
+ self.chatbot_messages = []
75
+ # Store all state-related data here
76
+ self.model = args.model
77
+ self.task = getattr(args, 'task', "")
78
+ self.selected_screen = args.selected_screen
79
+ self.user_id = args.user_id
80
+ self.trace_id = args.trace_id
81
+ self.api_keys = args.api_keys
82
+ self.server_url = args.server_url
83
+ self.message_queue = []
84
+ self.is_processing = False
85
+ self.should_stop = False
86
+ self.is_paused = False
87
+ # Add a new event to better control stopping
88
+ self.stop_event = threading.Event()
89
+ # Add a reference to the processing thread
90
+ self.processing_thread = None
91
+
92
+ shared_state = None
93
+ rate_limiter = RateLimiter(interval_seconds=2)
94
+
95
+ # Add the new prepare_environment function here
96
+ def prepare_environment(state):
97
+ """Prepares the environment before starting the main processing loop, e.g., opening specific apps."""
98
+ if platform.system() == "Windows":
99
+ # Assuming Star Rail mode is indicated by user_id containing "star_rail"
100
+ # You might need to adjust this condition based on the actual logic in run_teachmode_args
101
+ is_star_rail = "star_rail" in state.user_id.lower() or \
102
+ "star_rail" in state.trace_id.lower() or \
103
+ "hero_case" in state.trace_id.lower()
104
+
105
+ if is_star_rail:
106
+ print("Star Rail mode detected on Windows. Opening Edge browser...")
107
+ url = "https://sr.mihoyo.com/cloud/#/"
108
+ browser_opened = False
109
+ try:
110
+ # Use only webbrowser.open
111
+ print(f"Attempting to open {url} using webbrowser.open()...")
112
+ if webbrowser.open(url):
113
+ print(f"Successfully requested browser to open {url} via webbrowser.open().")
114
+ browser_opened = True
115
+ else:
116
+ print("webbrowser.open() returned False, indicating potential failure.")
117
+
118
+ if not browser_opened:
119
+ print("ERROR: Failed to confirm browser opening via webbrowser.open().")
120
+ # Still proceed to click attempt
121
+
122
+ # Add pyautogui click after attempting to open the browser
123
+ print("Proceeding with pyautogui actions...")
124
+ time.sleep(5) # Wait time for the browser to load
125
+
126
+ # Print detected screen size
127
+ screen_width, screen_height = pyautogui.size()
128
+ print(f"Detected screen size: {screen_width}x{screen_height}")
129
+
130
+ click_x = int(screen_width * (1036 / 1280))
131
+ click_y = int(screen_height * (500 / 720))
132
+ print(f"Calculated click coordinates: ({click_x}, {click_y})")
133
+
134
+ # Disable failsafe before clicking
135
+ pyautogui.FAILSAFE = False
136
+ print("PyAutoGUI failsafe temporarily disabled.")
137
+
138
+ print(f"Clicking at coordinates: ({click_x}, {click_y})")
139
+ pyautogui.click(click_x, click_y)
140
+ time.sleep(2)
141
+ pyautogui.click(click_x, click_y)
142
+
143
+ # Re-enable failsafe (optional, as script might end anyway)
144
+ # pyautogui.FAILSAFE = True
145
+ # print("PyAutoGUI failsafe re-enabled.")
146
+
147
+ except Exception as e:
148
+ print(f"Error during environment preparation (browser/click): {e}")
149
+ finally:
150
+ # Ensure failsafe is re-enabled if an error occurs after disabling it
151
+ pyautogui.FAILSAFE = True
152
+ print("PyAutoGUI failsafe re-enabled.")
153
+ else:
154
+ # Placeholder for potential preparations on other OS or non-Star Rail modes
155
+ print("Environment preparation: No specific actions required for this OS/mode.")
156
+
157
+
158
+ @app.post("/update_params")
159
+ async def update_parameters(request: Request):
160
+ data = await request.json()
161
+
162
+ if 'task' not in data:
163
+ return JSONResponse(
164
+ content={"status": "error", "message": "Missing required field: task"},
165
+ status_code=400
166
+ )
167
+
168
+ shared_state.args = argparse.Namespace(**data)
169
+ shared_state.task_updated = True
170
+
171
+ # Update shared state when parameters change
172
+ shared_state.model = getattr(shared_state.args, 'model', "teach-mode-gpt-4o")
173
+ shared_state.task = getattr(shared_state.args, 'task', "Create a claim on the SAP system, using Receipt.pdf as attachment.")
174
+ shared_state.selected_screen = getattr(shared_state.args, 'selected_screen', 0)
175
+ shared_state.user_id = getattr(shared_state.args, 'user_id', "hero_cases")
176
+ shared_state.trace_id = getattr(shared_state.args, 'trace_id', "build_scroll_combat")
177
+ shared_state.api_keys = getattr(shared_state.args, 'api_keys', "sk-proj-1234567890")
178
+ shared_state.server_url = getattr(shared_state.args, 'server_url', "http://ec2-44-234-43-86.us-west-2.compute.amazonaws.com")
179
+
180
+ log_ootb_request(shared_state.server_url, "update_params", data)
181
+
182
+ # Call the preparation function here, after parameters are updated
183
+ prepare_environment(shared_state)
184
+
185
+ return JSONResponse(
186
+ content={"status": "success", "message": "Parameters updated", "new_args": vars(shared_state.args)},
187
+ status_code=200
188
+ )
189
+
190
+ @app.post("/update_message")
191
+ async def update_message(request: Request):
192
+ data = await request.json()
193
+
194
+ if 'message' not in data:
195
+ return JSONResponse(
196
+ content={"status": "error", "message": "Missing required field: message"},
197
+ status_code=400
198
+ )
199
+
200
+ log_ootb_request(shared_state.server_url, "update_message", data)
201
+
202
+ message = data['message']
203
+ shared_state.chatbot_messages.append({"role": "user", "content": message})
204
+ shared_state.task = message
205
+ shared_state.args.task = message
206
+
207
+ # Reset stop event before starting
208
+ shared_state.stop_event.clear()
209
+
210
+ # Start processing if not already running
211
+ if not shared_state.is_processing:
212
+ # Create and store the thread
213
+ shared_state.processing_thread = threading.Thread(target=process_input, daemon=True)
214
+ shared_state.processing_thread.start()
215
+
216
+ return JSONResponse(
217
+ content={"status": "success", "message": "Message received", "task": shared_state.task},
218
+ status_code=200
219
+ )
220
+
221
+ @app.get("/get_messages")
222
+ async def get_messages(request: Request):
223
+ # Apply rate limiting
224
+ if not rate_limiter.allow_request(request.url.path):
225
+ return JSONResponse(
226
+ content={"status": "error", "message": "Rate limit exceeded. Try again after 2 seconds."},
227
+ status_code=429
228
+ )
229
+
230
+ log_ootb_request(shared_state.server_url, "get_messages", {})
231
+
232
+ # Return all messages in the queue and clear it
233
+ messages = shared_state.message_queue.copy()
234
+ shared_state.message_queue = []
235
+
236
+ return JSONResponse(
237
+ content={"status": "success", "messages": messages},
238
+ status_code=200
239
+ )
240
+
241
+ @app.get("/get_screens")
242
+ async def get_screens(request: Request):
243
+ # Apply rate limiting
244
+ if not rate_limiter.allow_request(request.url.path):
245
+ return JSONResponse(
246
+ content={"status": "error", "message": "Rate limit exceeded. Try again after 2 seconds."},
247
+ status_code=429
248
+ )
249
+
250
+ log_ootb_request(shared_state.server_url, "get_screens", {})
251
+
252
+ screen_options, primary_index = get_screen_details()
253
+
254
+ return JSONResponse(
255
+ content={"status": "success", "screens": screen_options, "primary_index": primary_index},
256
+ status_code=200
257
+ )
258
+
259
+ @app.post("/stop_processing")
260
+ async def stop_processing(request: Request):
261
+ # Apply rate limiting
262
+ if not rate_limiter.allow_request(request.url.path):
263
+ return JSONResponse(
264
+ content={"status": "error", "message": "Rate limit exceeded. Try again after 2 seconds."},
265
+ status_code=429
266
+ )
267
+
268
+ log_ootb_request(shared_state.server_url, "stop_processing", {})
269
+
270
+ if shared_state.is_processing:
271
+ # Set both flags to ensure stopping the current task
272
+ shared_state.should_stop = True
273
+ shared_state.stop_event.set()
274
+
275
+ # Send an immediate message to the queue to inform the user
276
+ stop_initiated_msg = {"role": "assistant", "content": f"Stopping task '{shared_state.task}'..."}
277
+ shared_state.message_queue.append(stop_initiated_msg)
278
+
279
+ return JSONResponse(
280
+ content={"status": "success", "message": "Task is being stopped, server will remain available for new tasks"},
281
+ status_code=200
282
+ )
283
+ else:
284
+ return JSONResponse(
285
+ content={"status": "error", "message": "No active processing to stop"},
286
+ status_code=400
287
+ )
288
+
289
+ @app.post("/toggle_pause")
290
+ async def toggle_pause(request: Request):
291
+ # Apply rate limiting
292
+ if not rate_limiter.allow_request(request.url.path):
293
+ return JSONResponse(
294
+ content={"status": "error", "message": "Rate limit exceeded. Try again after 2 seconds."},
295
+ status_code=429
296
+ )
297
+
298
+ log_ootb_request(shared_state.server_url, "toggle_pause", {})
299
+
300
+ if not shared_state.is_processing:
301
+ return JSONResponse(
302
+ content={"status": "error", "message": "No active processing to pause/resume"},
303
+ status_code=400
304
+ )
305
+
306
+ # Toggle the pause state
307
+ shared_state.is_paused = not shared_state.is_paused
308
+ current_state = shared_state.is_paused
309
+
310
+ print(f"Toggled pause state to: {current_state}")
311
+
312
+ status_message = "paused" if current_state else "resumed"
313
+
314
+ # Add a message to the queue to inform the user
315
+ if current_state:
316
+ message = {"role": "assistant", "content": f"Task '{shared_state.task}' has been paused. Click Continue to resume."}
317
+ else:
318
+ message = {"role": "assistant", "content": f"Task '{shared_state.task}' has been resumed."}
319
+
320
+ shared_state.chatbot_messages.append(message)
321
+ shared_state.message_queue.append(message)
322
+
323
+ return JSONResponse(
324
+ content={
325
+ "status": "success",
326
+ "message": f"Processing {status_message}",
327
+ "is_paused": current_state
328
+ },
329
+ status_code=200
330
+ )
331
+
332
+ @app.get("/status")
333
+ async def get_status(request: Request):
334
+ # Apply rate limiting
335
+ if not rate_limiter.allow_request(request.url.path):
336
+ return JSONResponse(
337
+ content={"status": "error", "message": "Rate limit exceeded. Try again after 2 seconds."},
338
+ status_code=429
339
+ )
340
+
341
+ log_ootb_request(shared_state.server_url, "get_status", {})
342
+
343
+ print(f"Status check - Processing: {shared_state.is_processing}, Paused: {shared_state.is_paused}")
344
+ return JSONResponse(
345
+ content={
346
+ "status": "success",
347
+ "is_processing": shared_state.is_processing,
348
+ "is_paused": shared_state.is_paused
349
+ },
350
+ status_code=200
351
+ )
352
+
353
+ def process_input():
354
+ shared_state.is_processing = True
355
+ shared_state.should_stop = False
356
+ shared_state.is_paused = False
357
+ shared_state.stop_event.clear() # Ensure stop event is cleared at the start
358
+
359
+ print(f"start sampling loop: {shared_state.chatbot_messages}")
360
+ print(f"shared_state.args before sampling loop: {shared_state.args}")
361
+
362
+
363
+ try:
364
+ # Get the generator for the sampling loop
365
+ sampling_loop = simple_teachmode_sampling_loop(
366
+ model=shared_state.model,
367
+ task=shared_state.task,
368
+ selected_screen=shared_state.selected_screen,
369
+ user_id=shared_state.user_id,
370
+ trace_id=shared_state.trace_id,
371
+ api_keys=shared_state.api_keys,
372
+ server_url=shared_state.server_url,
373
+ )
374
+
375
+ # Process messages from the sampling loop
376
+ for loop_msg in sampling_loop:
377
+ # Check stop condition more frequently
378
+ if shared_state.should_stop or shared_state.stop_event.is_set():
379
+ print("Processing stopped by user")
380
+ break
381
+
382
+ # Check if paused and wait while paused
383
+ while shared_state.is_paused and not shared_state.should_stop and not shared_state.stop_event.is_set():
384
+ print(f"Processing paused at: {time.strftime('%H:%M:%S')}")
385
+ # Wait a short time and check stop condition regularly
386
+ for _ in range(5): # Check 5 times per second
387
+ if shared_state.should_stop or shared_state.stop_event.is_set():
388
+ break
389
+ time.sleep(0.2)
390
+
391
+ # Check again after pause loop
392
+ if shared_state.should_stop or shared_state.stop_event.is_set():
393
+ print("Processing stopped while paused or resuming")
394
+ break
395
+
396
+ # Process the message
397
+ if loop_msg.startswith('<img'):
398
+ message = {"role": "user", "content": loop_msg}
399
+ else:
400
+ message = {"role": "assistant", "content": loop_msg}
401
+
402
+ shared_state.chatbot_messages.append(message)
403
+ shared_state.message_queue.append(message)
404
+
405
+ # Short sleep to allow stop signals to be processed
406
+ for _ in range(5): # Check 5 times per second
407
+ if shared_state.should_stop or shared_state.stop_event.is_set():
408
+ print("Processing stopped during sleep")
409
+ break
410
+ time.sleep(0.1)
411
+
412
+ if shared_state.should_stop or shared_state.stop_event.is_set():
413
+ break
414
+
415
+ except Exception as e:
416
+ # Handle any exceptions in the processing loop
417
+ error_msg = f"Error during task processing: {str(e)}"
418
+ print(error_msg)
419
+ error_message = {"role": "assistant", "content": error_msg}
420
+ shared_state.message_queue.append(error_message)
421
+
422
+ finally:
423
+ # Handle completion or interruption
424
+ if shared_state.should_stop or shared_state.stop_event.is_set():
425
+ stop_msg = f"Task '{shared_state.task}' was stopped. Ready for new tasks."
426
+ final_message = {"role": "assistant", "content": stop_msg}
427
+ else:
428
+ complete_msg = f"Task '{shared_state.task}' completed. Thanks for using Teachmode-OOTB."
429
+ final_message = {"role": "assistant", "content": complete_msg}
430
+
431
+ shared_state.chatbot_messages.append(final_message)
432
+ shared_state.message_queue.append(final_message)
433
+
434
+ # Reset all state flags to allow for new tasks
435
+ shared_state.is_processing = False
436
+ shared_state.should_stop = False
437
+ shared_state.is_paused = False
438
+ shared_state.stop_event.clear()
439
+ print("Processing completed, ready for new tasks")
440
+
441
+ def main():
442
+ global app, shared_state, rate_limiter
443
+
444
+ parser = argparse.ArgumentParser(
445
+ description="Run a synchronous sampling loop for assistant/tool interactions in teach-mode."
446
+ )
447
+ parser.add_argument("--model", default="teach-mode-gpt-4o")
448
+ parser.add_argument("--task", default="Create a claim on the SAP system, using Receipt.pdf as attachment.")
449
+ parser.add_argument("--selected_screen", type=int, default=0)
450
+ parser.add_argument("--user_id", default="star_rail_dev")
451
+ parser.add_argument("--trace_id", default="scroll")
452
+ parser.add_argument("--api_key_file", default="api_key.json")
453
+ parser.add_argument("--api_keys", default="")
454
+ parser.add_argument(
455
+ "--server_url",
456
+ default="http://ec2-44-234-43-86.us-west-2.compute.amazonaws.com",
457
+ help="Server URL for the session"
458
+ )
459
+
460
+ args = parser.parse_args()
461
+ shared_state = SharedState(args)
462
+ rate_limiter = RateLimiter(interval_seconds=2)
463
+
464
+ import uvicorn
465
+ import platform
466
+ import os
467
+
468
+ # Default port
469
+ port = 7888
470
+
471
+ # Determine port based on Windows username
472
+ if platform.system() == "Windows":
473
+ username = os.environ["USERNAME"].lower()
474
+ if username == "altair":
475
+ port = 14000
476
+ elif username.startswith("guest") and username[5:].isdigit():
477
+ num = int(username[5:])
478
+ if 1 <= num <= 10:
479
+ port = 14000 + num
480
+ else:
481
+ port = 7888
482
+ else:
483
+ port = 7888
484
+
485
+ uvicorn.run(app, host="0.0.0.0", port=port)
486
+
487
+ if __name__ == "__main__":
488
+ # main()
489
+
490
+ # Test log_ootb_request
521
491
  log_ootb_request("http://ec2-44-234-43-86.us-west-2.compute.amazonaws.com", "test_request", {"message": "Test message"})
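
Functionally, both versions expose the same FastAPI control surface. As a rough usage sketch (not part of the package), a client on the same machine could drive it as follows, assuming the server was started via main() on the default port 7888 and that server_url in the parameters points at a reachable logging endpoint; the field values below are placeholders.

import time
import requests

BASE = "http://127.0.0.1:7888"  # default port chosen in main(); username-based ports may differ

# 1. Push task parameters; /update_params requires a 'task' field and also
#    triggers prepare_environment() on the server.
requests.post(f"{BASE}/update_params", json={
    "model": "teach-mode-gpt-4o",
    "task": "Create a claim on the SAP system, using Receipt.pdf as attachment.",
    "selected_screen": 0,
    "user_id": "hero_cases",
    "trace_id": "build_scroll_combat",
    "api_keys": "<api-key>",                # placeholder
    "server_url": "http://<logging-host>",  # placeholder; must accept /update_ootb_logging posts
})

# 2. Send a message; /update_message requires a 'message' field and starts the
#    background processing thread if it is not already running.
requests.post(f"{BASE}/update_message", json={"message": "Start the recorded task."})

# 3. Poll /status and /get_messages (both rate limited to one call per
#    2 seconds per endpoint) until processing finishes.
while True:
    status = requests.get(f"{BASE}/status").json()
    for msg in requests.get(f"{BASE}/get_messages").json().get("messages", []):
        print(f"[{msg['role']}] {msg['content']}")
    if status.get("status") == "success" and not status.get("is_processing"):
        break
    time.sleep(2)
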