RubyGems - rubyx-py - Versions diffs - 0.1.0 - Mend

rubyx-py 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (36) hide show

checksums.yaml +7 -0
data/Cargo.toml +19 -0
data/README.md +469 -0
data/ext/rubyx/Cargo.toml +19 -0
data/ext/rubyx/extconf.rb +22 -0
data/ext/rubyx/src/async_gen.rs +1298 -0
data/ext/rubyx/src/context.rs +812 -0
data/ext/rubyx/src/convert.rs +1498 -0
data/ext/rubyx/src/eval.rs +377 -0
data/ext/rubyx/src/exception.rs +184 -0
data/ext/rubyx/src/future.rs +126 -0
data/ext/rubyx/src/import.rs +34 -0
data/ext/rubyx/src/lib.rs +4212 -0
data/ext/rubyx/src/nonblocking_stream.rs +1422 -0
data/ext/rubyx/src/pipe_notify.rs +232 -0
data/ext/rubyx/src/python/sync_adapter.py +31 -0
data/ext/rubyx/src/python_api.rs +6029 -0
data/ext/rubyx/src/python_ffi.rs +18 -0
data/ext/rubyx/src/python_finder.rs +119 -0
data/ext/rubyx/src/python_guard.rs +25 -0
data/ext/rubyx/src/ruby_helpers.rs +74 -0
data/ext/rubyx/src/rubyx_object.rs +1931 -0
data/ext/rubyx/src/rubyx_stream.rs +950 -0
data/ext/rubyx/src/stream.rs +713 -0
data/ext/rubyx/src/test_helpers.rs +351 -0
data/lib/generators/rubyx/install_generator.rb +24 -0
data/lib/generators/rubyx/templates/rubyx_initializer.rb +17 -0
data/lib/rubyx/context.rb +27 -0
data/lib/rubyx/error.rb +30 -0
data/lib/rubyx/rails.rb +105 -0
data/lib/rubyx/railtie.rb +20 -0
data/lib/rubyx/uv.rb +261 -0
data/lib/rubyx/version.rb +4 -0
data/lib/rubyx-py.rb +1 -0
data/lib/rubyx.rb +136 -0
metadata +123 -0

data/ext/rubyx/src/test_helpers.rs ADDED Viewed

@@ -0,0 +1,351 @@
+//! Shared test infrastructure for Python API initialization and GIL management.
+//!
+//! This module provides a single, centralized point for Python initialization across all test
+//! modules. It prevents the SIGSEGV that occurs when multiple test modules each initialize
+//! Python independently.
+//!
+//! # Pattern
+//!
+//! The key insight is that `PyGILState_Ensure` / `PyGILState_Release` (our `ensure_gil` /
+//! `release_gil`) are **thread-safe**: they create per-thread state automatically. This
+//! makes them safe to call from any OS thread in Cargo's test-runner pool.
+//!
+//! In contrast, `PyEval_SaveThread` / `PyEval_RestoreThread` bind to a specific OS thread
+//! and deadlock when restored on a different thread — which happens with `#[serial]` tests
+//! because Cargo's thread pool may schedule successive tests on different threads.
+//!
+//! We:
+//! 1. Initialize Python once via `OnceLock`.
+//! 2. Immediately call `save_thread()` to release the GIL (discard the returned state).
+//! 3. Each test acquires the GIL with `ensure_gil()` (via `GilGuard`) and releases it on drop.
+//!
+//! # Ruby Threading
+//!
+//! Ruby's GVL (Global VM Lock) binds to the thread that called `embed::init()`, and Ruby
+//! C API functions require proper thread-local state (`ruby_current_ec_ptr`). Rust's test
+//! harness spawns a **new OS thread for every test**, so neither `Ruby::get()` nor direct
+//! C API calls work from test threads.
+//!
+//! The solution uses an executor pattern:
+//! 1. A dedicated long-lived thread calls `embed::init()` and then releases the GVL via
+//!    `rb_thread_call_without_gvl`, running an executor loop that waits for work items.
+//! 2. Test threads send closures to the executor via a channel.
+//! 3. The executor calls `rb_thread_call_with_gvl` for each work item — this works because
+//!    the executor thread is inside `rb_thread_call_without_gvl` and is still registered
+//!    with Ruby. Inside `rb_thread_call_with_gvl`, `Ruby::get()` succeeds normally.
+//! 4. Results are sent back to the test thread via a one-shot channel.
+use crate::python_api::PythonApi;
+use crate::python_ffi::PyGILState;
+use crate::python_finder::find_libpython;
+use magnus::Ruby;
+use std::any::Any;
+use std::ffi::c_void;
+use std::panic::{self, AssertUnwindSafe};
+use std::sync::mpsc::{Receiver, Sender};
+use std::sync::{Mutex, OnceLock};
+// Hand-written declarations of the Ruby C API functions the executor relies on.
+// NOTE(review): the signatures are assumed to match the linked Ruby's
+// `ruby/thread.h` — confirm when upgrading Ruby.
+extern "C" {
+    /// Calls `func(data1)` with the GVL released. `ubf` / `data2` are the
+    /// unblock function and its argument; the only call site in this module
+    /// passes `None` and a null pointer.
+    fn rb_thread_call_without_gvl(
+        func: unsafe extern "C" fn(*mut c_void) -> *mut c_void,
+        data1: *mut c_void,
+        ubf: Option<unsafe extern "C" fn(*mut c_void)>,
+        data2: *mut c_void,
+    ) -> *mut c_void;
+    /// Calls `func(data1)` with the GVL held. In this module it is only
+    /// invoked from within the function given to `rb_thread_call_without_gvl`.
+    fn rb_thread_call_with_gvl(
+        func: unsafe extern "C" fn(*mut c_void) -> *mut c_void,
+        data1: *mut c_void,
+    ) -> *mut c_void;
+}
+/// Tracks whether Python initialization has been attempted.
+static PYTHON_INIT: OnceLock<bool> = OnceLock::new();
+/// Returns the process-wide `PythonApi`, loading and initializing Python on first use.
+///
+/// The instance is placed in `crate::API`, so test helpers and production code
+/// paths that go through `crate::api()` (e.g. `method_missing`) observe the
+/// same object.
+///
+/// Returns `None` when libpython cannot be found or loaded. The outcome of the
+/// first attempt is cached in `PYTHON_INIT`; later calls do not retry.
+///
+/// The GIL is **not** held when this returns. Use `skip_if_no_python()` to
+/// obtain a `GilGuard`.
+pub fn get_api() -> Option<&'static PythonApi> {
+    let initialized = *PYTHON_INIT.get_or_init(|| {
+        let Some(lib_path) = find_libpython() else {
+            return false;
+        };
+        let loaded = unsafe { PythonApi::load(&lib_path) };
+        let Ok(mut api) = loaded else {
+            return false;
+        };
+        api.initialize();
+        let _ = api.install_async_to_sync_class();
+        // Py_Initialize leaves this thread holding the GIL; give it up here.
+        // The returned PyThreadState is dropped on purpose — every later
+        // acquisition goes through the thread-safe ensure_gil/release_gil pair.
+        let _ = api.save_thread();
+        // Publish through the crate-level slot so crate::api() resolves to this
+        // instance when production code paths are exercised from tests.
+        let _ = crate::API.set(api);
+        true
+    });
+    if !initialized {
+        return None;
+    }
+    crate::API.get()
+}
+/// Test-scoped handle on the Python GIL.
+///
+/// Obtained from `skip_if_no_python()`. The state token returned by
+/// `ensure_gil()` is stored next to the API reference and handed back to
+/// `release_gil()` when the guard is dropped, so the GIL is held for exactly
+/// the guard's lifetime.
+pub struct GilGuard<'a> {
+    api: &'a PythonApi,
+    gil_state: PyGILState,
+}
+impl<'a> GilGuard<'a> {
+    /// Borrow the Python API; the GIL stays held while this guard is alive.
+    pub fn api(&self) -> &'a PythonApi {
+        self.api
+    }
+}
+impl Drop for GilGuard<'_> {
+    fn drop(&mut self) {
+        let Self { api, gil_state } = self;
+        api.release_gil(*gil_state);
+    }
+}
+/// Returns a GIL guard, or `None` when Python is unavailable and the test
+/// should be skipped.
+///
+/// Steps performed:
+/// 1. Python is initialized on first use (see `get_api`).
+/// 2. The GIL is acquired through `ensure_gil()`.
+/// 3. The returned guard releases the GIL when dropped.
+///
+/// # Example
+///
+/// ```ignore
+/// #[test]
+/// fn test_something() {
+///     let Some(guard) = skip_if_no_python() else { return; };
+///     let api = guard.api();
+///     api.run_simple_string("x = 42").unwrap();
+/// }
+/// ```
+pub fn skip_if_no_python() -> Option<GilGuard<'static>> {
+    get_api().map(|api| GilGuard {
+        api,
+        gil_state: api.ensure_gil(),
+    })
+}
+// ---------------------------------------------------------------------------
+// Ruby executor pattern
+// ---------------------------------------------------------------------------
+/// Type-erased work item sent from test threads to the Ruby executor.
+type WorkFn = Box<dyn FnOnce() + Send>;
+/// Carries a work item through the C callback interface, with space to
+/// store a panic payload if the work item panics.
+///
+/// A pointer to a `WorkSlot` is what `executor_loop` passes as the opaque
+/// `data` argument to `run_work_with_gvl`.
+struct WorkSlot {
+    /// The pending closure; `run_work_with_gvl` takes it out before running it.
+    work: Option<WorkFn>,
+    /// Set by `run_work_with_gvl` when the closure unwinds; `None` otherwise.
+    panic: Option<Box<dyn Any + Send>>,
+}
+/// Holds the sender half of the executor channel, wrapped in a Mutex because
+/// `std::sync::mpsc::Sender` is `!Sync` (required for statics via `OnceLock`).
+/// The Mutex is effectively uncontended since `#[serial]` ensures only one test
+/// runs at a time.
+static RUBY_EXECUTOR: OnceLock<Mutex<Sender<WorkFn>>> = OnceLock::new();
+/// Executor loop that runs inside `rb_thread_call_without_gvl` on the Ruby
+/// init thread. Receives work items from test threads and dispatches them
+/// via `rb_thread_call_with_gvl`.
+///
+/// This works because the executor thread is still registered with Ruby
+/// (it called `embed::init()`), so `rb_thread_call_with_gvl` is valid here.
+///
+/// Always returns a null pointer; the loop ends only when `recv` fails,
+/// i.e. once every sender has been dropped.
+///
+/// # Safety
+///
+/// `data` must point to a `Receiver<WorkFn>` that stays alive for the whole
+/// call. `ensure_ruby_vm` satisfies this by passing a leaked, boxed receiver.
+unsafe extern "C" fn executor_loop(data: *mut c_void) -> *mut c_void {
+    // Reborrow the receiver that was smuggled through the opaque C argument.
+    let rx = &*(data as *const Receiver<WorkFn>);
+    while let Ok(work) = rx.recv() {
+        // The slot lives on this stack frame for the duration of the callback.
+        let mut slot = WorkSlot {
+            work: Some(work),
+            panic: None,
+        };
+        rb_thread_call_with_gvl(run_work_with_gvl, &mut slot as *mut WorkSlot as *mut c_void);
+        // `slot.panic` is deliberately not inspected: resuming the unwind here
+        // would cross the C frames of `rb_thread_call_without_gvl`.
+        // Work items built by `with_ruby_python` already catch panics from the
+        // user closure and forward the payload over their own result channel.
+        // A panic that escapes that inner handling is captured in `slot.panic`
+        // and dropped with the slot; the waiting test thread then observes its
+        // result channel closing without a message.
+    }
+    std::ptr::null_mut()
+}
+/// Trampoline handed to `rb_thread_call_with_gvl`: executes the pending work
+/// item of a `WorkSlot` while the GVL is held.
+///
+/// The closure runs under `catch_unwind` so that a panic never unwinds across
+/// the FFI boundary (which is UB). A caught payload is written back into the
+/// slot for the caller. A slot whose work item was already taken is a no-op.
+///
+/// Always returns a null pointer.
+unsafe extern "C" fn run_work_with_gvl(data: *mut c_void) -> *mut c_void {
+    let slot = &mut *data.cast::<WorkSlot>();
+    let Some(job) = slot.work.take() else {
+        return std::ptr::null_mut();
+    };
+    match panic::catch_unwind(AssertUnwindSafe(job)) {
+        Ok(()) => {}
+        Err(payload) => slot.panic = Some(payload),
+    }
+    std::ptr::null_mut()
+}
+/// Initialize the Ruby VM once on a dedicated long-lived thread and start
+/// the executor loop.
+///
+/// The dedicated thread:
+/// 1. Calls `embed::init()` — becoming Ruby's "main" thread
+/// 2. Defines the `RubyxObject` class
+/// 3. Releases the GVL via `rb_thread_call_without_gvl` and enters the
+///    executor loop, waiting for work items from test threads
+///
+/// The first caller blocks until step 2 has completed. Later calls do not
+/// re-initialize anything because the sender is cached in `RUBY_EXECUTOR`.
+///
+/// # Panics
+///
+/// Panics if the Ruby thread exits before signalling readiness (for example
+/// because defining `RubyxObject` failed).
+fn ensure_ruby_vm() {
+    RUBY_EXECUTOR.get_or_init(|| {
+        // `tx`/`rx` carry work items; `ready_tx`/`ready_rx` is a one-off
+        // handshake telling the caller that Ruby finished booting.
+        let (tx, rx) = std::sync::mpsc::channel::<WorkFn>();
+        let (ready_tx, ready_rx) = std::sync::mpsc::channel();
+        // Spawn a dedicated thread that will be Ruby's "main" thread for the
+        // entire test process lifetime.
+        std::thread::spawn(move || {
+            // The surrounding `get_or_init` ensures this runs at most once.
+            let cleanup = unsafe { magnus::embed::init() };
+            let ruby: &Ruby = &cleanup;
+            ruby.define_class("RubyxObject", ruby.class_object())
+                .expect("Failed to define RubyxObject class for tests");
+            // Signal that Ruby is ready before releasing the GVL.
+            ready_tx.send(()).expect("ready channel send failed");
+            // Leak the receiver so it lives forever (the executor loop
+            // borrows it via raw pointer through the C callback interface).
+            let rx_ptr = Box::into_raw(Box::new(rx));
+            // Release the GVL and enter the executor loop. The loop receives
+            // work items from test threads and dispatches them via
+            // rb_thread_call_with_gvl.
+            unsafe {
+                rb_thread_call_without_gvl(
+                    executor_loop,
+                    rx_ptr as *mut c_void,
+                    None,
+                    std::ptr::null_mut(),
+                );
+            }
+            // Never reached, but prevent cleanup from running.
+            std::mem::forget(cleanup);
+        });
+        // If the Ruby thread died before sending, `ready_tx` was dropped and
+        // `recv` returns an error, which surfaces as this panic.
+        ready_rx.recv().expect("Ruby init thread failed");
+        Mutex::new(tx)
+    });
+}
+/// Executes `f` on the Ruby executor thread with the Ruby GVL and the Python
+/// GIL both held, and hands its return value back to the caller.
+///
+/// Returns `None` if Python is not available (the test should be skipped).
+///
+/// The closure is boxed, sent over the executor channel and run inside
+/// `rb_thread_call_with_gvl`, where Ruby's thread-local state is valid. The
+/// Python GIL is acquired on the executor thread right before `f` runs and
+/// released right after, even if `f` panics.
+///
+/// # Panics
+///
+/// A panic raised by `f` is caught on the executor thread and resumed on the
+/// calling thread. Also panics if the executor channel or the result channel
+/// is closed, or if the executor mutex is poisoned.
+///
+/// # Example
+///
+/// ```ignore
+/// #[test]
+/// #[serial]
+/// fn test_something() {
+///     with_ruby_python(|ruby, api| {
+///         let py_str = api.string_from_str("hello");
+///         let rb_str = "hello".into_value_with(ruby);
+///         // ...
+///     });
+/// }
+/// ```
+pub fn with_ruby_python<F, R>(f: F) -> Option<R>
+where
+    F: FnOnce(&Ruby, &'static PythonApi) -> R + Send + 'static,
+    R: Send + 'static,
+{
+    // Python goes first: it must be initialized before the Ruby VM to avoid
+    // interference with Python C extension loading.
+    let api = get_api()?;
+    ensure_ruby_vm();
+    let (outcome_tx, outcome_rx) =
+        std::sync::mpsc::channel::<Result<R, Box<dyn Any + Send>>>();
+    let job: WorkFn = Box::new(move || {
+        // Running inside rb_thread_call_with_gvl: the GVL is held and Ruby's
+        // thread-local state is set up, so Ruby::get_unchecked() is safe.
+        let ruby = unsafe { Ruby::get_unchecked() };
+        // Hold the Python GIL on the executor thread around the user closure.
+        let gil_token = api.ensure_gil();
+        let outcome = panic::catch_unwind(AssertUnwindSafe(|| f(&ruby, api)));
+        api.release_gil(gil_token);
+        let _ = outcome_tx.send(outcome);
+    });
+    // Hand the job to the executor thread; the lock is held only for the send.
+    {
+        let executor = RUBY_EXECUTOR.get().expect("executor not initialized");
+        let sender = executor.lock().expect("executor mutex poisoned");
+        sender.send(job).expect("executor channel closed");
+    }
+    // Wait for the executor to finish; re-raise a captured panic on this thread.
+    let outcome = outcome_rx.recv().expect("executor result channel closed");
+    outcome
+        .map(Some)
+        .unwrap_or_else(|payload| panic::resume_unwind(payload))
+}
+// Keep the old API available for backward compatibility during migration.
+// These can be removed once all tests are migrated to with_ruby_python.
+/// Legacy guard bundling a Ruby VM handle with a held Python GIL.
+///
+/// The GIL is released when the contained `GilGuard` is dropped.
+pub struct RubyPythonGuard<'a> {
+    ruby: Ruby,
+    gil_guard: GilGuard<'a>,
+}
+impl<'a> RubyPythonGuard<'a> {
+    /// Borrow the Ruby VM handle captured when the guard was created.
+    pub fn ruby(&self) -> &Ruby {
+        &self.ruby
+    }
+    /// Borrow the Python API through the inner GIL guard.
+    pub fn api(&self) -> &'a PythonApi {
+        self.gil_guard.api()
+    }
+}
+/// Returns a combined Ruby + Python guard, or `None` when either runtime is
+/// unavailable from the calling thread.
+///
+/// **Deprecated**: Use `with_ruby_python` instead. `Ruby::get()` only succeeds
+/// when the test happens to run on the Ruby init thread, which is unreliable
+/// with Cargo's test harness.
+pub fn skip_if_no_ruby_python() -> Option<RubyPythonGuard<'static>> {
+    // Touch Python first so it is initialized before the Ruby VM is started.
+    get_api()?;
+    ensure_ruby_vm();
+    let gil_guard = skip_if_no_python()?;
+    match Ruby::get() {
+        Ok(ruby) => Some(RubyPythonGuard { ruby, gil_guard }),
+        Err(_) => None,
+    }
+}

data/lib/generators/rubyx/install_generator.rb ADDED Viewed

@@ -0,0 +1,24 @@
+module Rubyx
+  module Generators
+    class InstallGenerator < ::Rails::Generators::Base
+      source_root File.expand_path('templates', __dir__)
+      def create_pyproject
+        copy_file 'pyproject.toml', 'pyproject.toml'
+      end
+      def create_initializer
+        copy_file 'rubyx_initializer.rb', 'config/initializers/rubyx.rb'
+      end
+      def create_python_directory
+        empty_directory 'app/python'
+        copy_file 'example.py', 'app/python/example.py'
+      end
+      def add_gitignore
+        append_to_file '.gitignore', "\n# Python (managed by rubyx-py)\n.venv/\n" if File.exist?('.gitignore')
+      end
+    end
+  end
+end

data/lib/generators/rubyx/templates/rubyx_initializer.rb ADDED Viewed

@@ -0,0 +1,17 @@
+# Rubyx (rubyx-py) configuration for this Rails application.
+Rubyx::Rails.configure do |config|
+  # Path to your Python project's pyproject.toml.
+  # Its directory is also used as the uv project directory.
+  config.pyproject_path = Rails.root.join('pyproject.toml')
+  # Auto-initialize Python when Rails boots (after all initializers have run).
+  # Set to false for forking servers (Puma workers) and call
+  # Rubyx::Rails.init! from on_worker_boot instead.
+  config.auto_init = true
+  # Directories to add to Python's sys.path (makes .py files importable).
+  # Directories that do not exist are skipped.
+  config.python_paths = [Rails.root.join('app/python').to_s]
+  # Use system uv instead of auto-downloading (optional)
+  # config.uv_path = `which uv`.strip
+  # Extra arguments for uv sync (optional)
+  # config.uv_args = ['--extra', 'ml']
+end

data/lib/rubyx/context.rb ADDED Viewed

@@ -0,0 +1,27 @@
+module Rubyx
+  class Context
+    def eval(code, **globals)
+      if globals.empty?
+        _eval(code.to_s)
+      else
+        _eval_with_globals(code.to_s, globals)
+      end
+    end
+    def await(code, **globals)
+      if globals.empty?
+        _await(code.to_s)
+      else
+        _await_with_globals(code.to_s, globals)
+      end
+    end
+    def async_await(code, **globals)
+      if globals.empty?
+        _async_await(code.to_s)
+      else
+        _async_await_with_globals(code.to_s, globals)
+      end
+    end
+  end
+end

data/lib/rubyx/error.rb ADDED Viewed

@@ -0,0 +1,30 @@
+module Rubyx
+  # Matches a dotted name such as "pkg.sub.mod": each segment starts with a
+  # letter or underscore and continues with letters, digits or underscores.
+  # Anchored with \A / \z, so the whole string must match.
+  VALID_MODULE_NAME_PATTERN = /\A[a-zA-Z_][a-zA-Z0-9_]*(\.[a-zA-Z_][a-zA-Z0-9_]*)*\z/
+  # Root of the Rubyx exception hierarchy; rescue this to catch them all.
+  class Error < StandardError; end
+  # Error originating from Python — presumably raised when Python code throws;
+  # confirm against the native extension.
+  class PythonError < Error; end
+  class ImportError < PythonError; end
+  class InvalidModuleNameError < Error; end
+  # NOTE: the classes below share their short names with Ruby built-ins
+  # (::KeyError, ::IndexError, ::TypeError). Inside `module Rubyx` the bare
+  # name resolves to the Rubyx class; use the `::` prefix for the built-in.
+  class KeyError < Error; end
+  class IndexError < Error; end
+  class ValueError < Error; end
+  class AttributeError < Error; end
+  class TypeError < Error; end
+  # Errors for the uv integration; all descend from Rubyx::Uv::Error.
+  module Uv
+    class Error < Rubyx::Error; end
+    class SetupError < Error; end
+    class InitError < Error; end
+  end
+end

data/lib/rubyx/rails.rb ADDED Viewed

@@ -0,0 +1,105 @@
+module Rubyx
+  module Rails
+    class Error < Rubyx::Error; end
+    class Configuration
+      attr_accessor :pyproject_path, :pyproject_content, :auto_init,
+                    :force_reinit, :uv_version, :debug, :python_paths,
+                    :uv_path, :uv_args
+      def initialize
+        @pyproject_path = nil
+        @pyproject_content = nil
+        @auto_init = false
+        @force_reinit = false
+        @uv_version = Rubyx::Uv::DEFAULT_UV_VERSION
+        @debug = false
+        @python_paths = []
+        @uv_path = nil
+        @uv_args = []
+      end
+    end
+    class << self
+      def configuration
+        @configuration ||= Configuration.new
+      end
+      def configure
+        yield configuration
+      end
+      def init!
+        return if initialized?
+        config = configuration
+        pyproject_toml = resolve_pyproject(config)
+        project_dir = resolve_project_dir(config)
+        options = {
+          force: config.force_reinit,
+          uv_version: config.uv_version,
+          project_dir: project_dir,
+          uv_args: config.uv_args,
+        }
+        options[:uv_path] = config.uv_path if config.uv_path
+        Rubyx.uv_init(pyproject_toml, **options)
+        inject_python_paths(config.python_paths)
+        @initialized = true
+        if config.debug
+          ::Rails.logger.info "[Rubyx] Python initialized (project_dir: #{project_dir})"
+        end
+      rescue => e
+        @initialized = false
+        ::Rails.logger.error "[Rubyx] Failed to initialize Python: #{e.message}" if defined?(::Rails.logger)
+        raise
+      end
+      def ensure_initialized!
+        return if initialized?
+        init!
+      end
+      def initialized?
+        @initialized == true
+      end
+      private
+      def resolve_pyproject(config)
+        if config.pyproject_path && File.exist?(config.pyproject_path.to_s)
+          File.read(config.pyproject_path.to_s)
+        elsif config.pyproject_content
+          config.pyproject_content
+        else
+          raise Error, "No pyproject.toml configured. Set pyproject_path or pyproject_content in config/initializers/rubyx.rb"
+        end
+      end
+      def resolve_project_dir(config)
+        if config.pyproject_path
+          File.dirname(config.pyproject_path.to_s)
+        elsif defined?(::Rails) && ::Rails.respond_to?(:root)
+          ::Rails.root.to_s
+        else
+          Dir.pwd
+        end
+      end
+      def inject_python_paths(paths)
+        return if paths.nil? || paths.empty?
+        paths.each do |path|
+          expanded = File.expand_path(path)
+          Rubyx.eval("import sys; sys.path.insert(0, '#{expanded}')") if Dir.exist?(expanded)
+        end
+      end
+    end
+  end
+end

data/lib/rubyx/railtie.rb ADDED Viewed

@@ -0,0 +1,20 @@
+require_relative 'rails'
+module Rubyx
+  class Railtie < ::Rails::Railtie
+    config.rubyx = ActiveSupport::OrderedOptions.new
+    # Auto-initialize Python after all config initializers have run
+    config.after_initialize do
+      if Rubyx::Rails.configuration.auto_init
+        Rubyx::Rails.init!
+        ::Rails.logger.info '[Rubyx] Python environment initialized successfully'
+      end
+    end
+    # Register rake tasks
+    rake_tasks do
+      load 'rubyx/tasks/rubyx.rake'
+    end
+  end
+end