mseep-rmcp 0.3.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,239 @@
1
+ """
2
+ Time series analysis tools for RMCP.
3
+
4
+ Comprehensive time series modeling and forecasting capabilities.
5
+ """
6
+
7
+ from typing import Dict, Any
8
+ from ..registries.tools import tool
9
+ from ..core.schemas import table_schema
10
+ from ..r_integration import execute_r_script
11
+
12
+
13
@tool(
    name="arima_model",
    input_schema={
        "type": "object",
        "properties": {
            "data": {
                "type": "object",
                "properties": {
                    "values": {"type": "array", "items": {"type": "number"}},
                    "dates": {"type": "array", "items": {"type": "string"}}
                },
                "required": ["values"]
            },
            "order": {
                "type": "array",
                "items": {"type": "integer"},
                "minItems": 3,
                "maxItems": 3,
                "description": "ARIMA order (p, d, q)"
            },
            "seasonal": {
                "type": "array",
                "items": {"type": "integer"},
                "minItems": 4,
                "maxItems": 4,
                "description": "Seasonal ARIMA order (P, D, Q, s)"
            },
            # Fix: the seasonal frequency used to be hard-coded to 12 inside the
            # R script (even when dates were supplied). It is now an optional
            # input; the default preserves the old monthly behavior, so existing
            # callers are unaffected.
            "frequency": {
                "type": "integer",
                "minimum": 1,
                "default": 12,
                "description": "Observations per seasonal cycle (12 = monthly)"
            },
            "forecast_periods": {"type": "integer", "minimum": 1, "maximum": 100, "default": 12}
        },
        "required": ["data"]
    },
    description="Fit ARIMA time series model with forecasting"
)
async def arima_model(context, params):
    """Fit an ARIMA model in R and generate forecasts.

    Uses forecast::Arima when an explicit ``order`` is given (optionally with
    ``seasonal``); otherwise forecast::auto.arima selects the order.

    Args:
        context: Tool execution context used for structured logging.
        params: Validated tool input (see ``input_schema``). ``data.values``
            is the series. ``data.dates`` is accepted for caller convenience
            but not used for modeling; the seasonal structure comes from
            ``frequency`` (default 12).

    Returns:
        dict: Model metadata (order, coefficients, AIC/BIC, log-likelihood,
        sigma^2), fitted values, residuals, point forecasts with 95% bounds,
        in-sample accuracy measures, and the observation count.

    Raises:
        Exception: Re-raised from ``execute_r_script`` when the R code fails.
    """
    await context.info("Fitting ARIMA time series model")

    r_script = '''
    # Install required packages
    if (!require(forecast)) install.packages("forecast", quietly = TRUE)
    library(forecast)

    # Prepare data
    values <- args$data$values

    # Convert to time series. Fix: frequency was previously hard-coded to 12
    # regardless of input; it is now caller-configurable (default still 12).
    frequency <- args$frequency %||% 12
    ts_data <- ts(values, frequency = frequency)

    # Fit ARIMA model
    if (!is.null(args$order)) {
      if (!is.null(args$seasonal)) {
        model <- Arima(ts_data, order = args$order, seasonal = args$seasonal)
      } else {
        model <- Arima(ts_data, order = args$order)
      }
    } else {
      # No explicit order: let auto.arima search for one.
      model <- auto.arima(ts_data)
    }

    # Generate forecasts
    forecast_periods <- args$forecast_periods %||% 12
    forecasts <- forecast(model, h = forecast_periods)

    # Extract results
    result <- list(
      model_type = "ARIMA",
      order = arimaorder(model),
      coefficients = as.list(coef(model)),
      aic = AIC(model),
      bic = BIC(model),
      loglik = logLik(model)[1],
      sigma2 = model$sigma2,
      fitted_values = as.numeric(fitted(model)),
      residuals = as.numeric(residuals(model)),
      forecasts = as.numeric(forecasts$mean),
      forecast_lower = as.numeric(forecasts$lower[,2]), # 95% CI
      forecast_upper = as.numeric(forecasts$upper[,2]),
      accuracy = accuracy(model),
      n_obs = length(values)
    )
    '''

    try:
        result = execute_r_script(r_script, params)
        await context.info("ARIMA model fitted successfully",
                           aic=result.get("aic"),
                           n_obs=result.get("n_obs"))
        return result

    except Exception as e:
        await context.error("ARIMA model fitting failed", error=str(e))
        raise
112
+
113
+
114
@tool(
    name="decompose_timeseries",
    input_schema={
        "type": "object",
        "properties": {
            "data": {
                "type": "object",
                "properties": {
                    "values": {"type": "array", "items": {"type": "number"}},
                    "dates": {"type": "array", "items": {"type": "string"}}
                },
                "required": ["values"]
            },
            # Fix: stats::decompose() requires a seasonal frequency of at
            # least 2; frequency = 1 always failed inside R with an opaque
            # error, so the schema now rejects it up front.
            "frequency": {"type": "integer", "minimum": 2, "default": 12},
            "type": {"type": "string", "enum": ["additive", "multiplicative"], "default": "additive"}
        },
        "required": ["data"]
    },
    description="Decompose time series into trend, seasonal, and remainder components"
)
async def decompose_timeseries(context, params):
    """Decompose a time series into trend, seasonal, and remainder parts.

    Wraps R's ``stats::decompose()`` (moving-average based classical
    decomposition), which needs at least two full seasonal cycles of data.

    Args:
        context: Tool execution context used for structured logging.
        params: Validated tool input (see ``input_schema``). ``data.values``
            is the series; ``frequency`` is observations per cycle;
            ``type`` selects additive or multiplicative decomposition.

    Returns:
        dict: Original values plus ``trend``, ``seasonal``, and ``remainder``
        components (trend/remainder contain NA at the edges by construction),
        the decomposition type, frequency, and observation count.

    Raises:
        Exception: Re-raised from ``execute_r_script`` when the R code fails,
        e.g. when the series is shorter than two full cycles.
    """
    await context.info("Decomposing time series")

    r_script = '''
    values <- args$data$values
    frequency <- args$frequency %||% 12
    decomp_type <- args$type %||% "additive"

    # decompose() needs at least two full seasonal cycles; fail with a clear
    # message instead of R's cryptic "time series has no or less than 2 periods".
    if (length(values) < 2 * frequency) {
      stop(paste0("Need at least ", 2 * frequency,
                  " observations (2 full cycles) for frequency ", frequency))
    }

    # Create time series
    ts_data <- ts(values, frequency = frequency)

    # decompose() accepts the type string directly; no branching needed.
    decomp <- decompose(ts_data, type = decomp_type)

    result <- list(
      original = as.numeric(decomp$x),
      trend = as.numeric(decomp$trend),
      seasonal = as.numeric(decomp$seasonal),
      remainder = as.numeric(decomp$random),
      type = decomp_type,
      frequency = frequency,
      n_obs = length(values)
    )
    '''

    try:
        result = execute_r_script(r_script, params)
        await context.info("Time series decomposed successfully")
        return result

    except Exception as e:
        await context.error("Time series decomposition failed", error=str(e))
        raise
173
+
174
+
175
@tool(
    name="stationarity_test",
    input_schema={
        "type": "object",
        "properties": {
            "data": {
                "type": "object",
                "properties": {
                    "values": {"type": "array", "items": {"type": "number"}}
                },
                "required": ["values"]
            },
            "test": {"type": "string", "enum": ["adf", "kpss", "pp"], "default": "adf"}
        },
        "required": ["data"]
    },
    description="Test time series for stationarity (ADF, KPSS, Phillips-Perron)"
)
async def stationarity_test(context, params):
    """Run a stationarity test on a univariate series via R's tseries package.

    Args:
        context: Tool execution context used for structured logging.
        params: Validated tool input (see ``input_schema``). ``test`` selects
            Augmented Dickey-Fuller (``adf``), KPSS (``kpss``), or
            Phillips-Perron (``pp``).

    Returns:
        dict: Test name/type, test statistic, p-value, the alternative
        hypothesis (NA for KPSS, which does not report one), an
        ``is_stationary`` decision at the 5% level, and the observation count.

    Raises:
        Exception: Re-raised from ``execute_r_script`` when the R code fails.
    """
    await context.info("Testing time series stationarity")

    r_script = '''
    if (!require(tseries)) install.packages("tseries", quietly = TRUE)
    library(tseries)

    values <- args$data$values
    test_type <- args$test %||% "adf"

    ts_data <- ts(values)

    if (test_type == "adf") {
      test_result <- adf.test(ts_data)
      test_name <- "Augmented Dickey-Fuller"
    } else if (test_type == "kpss") {
      test_result <- kpss.test(ts_data)
      test_name <- "KPSS"
    } else if (test_type == "pp") {
      test_result <- pp.test(ts_data)
      test_name <- "Phillips-Perron"
    } else {
      # Defensive: the schema restricts `test`, but fail loudly rather than
      # hit "object 'test_result' not found" if validation is ever bypassed.
      stop(paste("Unknown test type:", test_type))
    }

    result <- list(
      test_name = test_name,
      test_type = test_type,
      statistic = as.numeric(test_result$statistic),
      p_value = test_result$p.value,
      # NOTE(review): tseries htest objects define no $critical component, so
      # this is an empty list in practice — confirm before relying on it.
      critical_values = as.list(test_result$critical),
      # Fix: kpss.test() returns no $alternative; default to NA so the key is
      # not silently dropped from the serialized result.
      alternative = test_result$alternative %||% NA,
      # KPSS has stationarity as its NULL hypothesis, so the decision rule is
      # inverted relative to ADF / Phillips-Perron.
      is_stationary = if (test_type == "kpss") test_result$p.value > 0.05 else test_result$p.value < 0.05,
      n_obs = length(values)
    )
    '''

    try:
        result = execute_r_script(r_script, params)
        await context.info("Stationarity test completed",
                           test=result.get("test_name"),
                           p_value=result.get("p_value"))
        return result

    except Exception as e:
        await context.error("Stationarity test failed", error=str(e))
        raise
@@ -0,0 +1,293 @@
1
+ """
2
+ Data transformation tools for RMCP.
3
+
4
+ Essential data manipulation and cleaning capabilities.
5
+ """
6
+
7
+ from typing import Dict, Any
8
+ from ..registries.tools import tool
9
+ from ..core.schemas import table_schema
10
+ from ..r_integration import execute_r_script
11
+
12
+
13
@tool(
    name="lag_lead",
    input_schema={
        "type": "object",
        "properties": {
            "data": table_schema(),
            "variables": {"type": "array", "items": {"type": "string"}},
            # Fix: offsets must be strictly positive — zero or negative values
            # produced malformed columns (length mismatch) inside R.
            "lags": {"type": "array", "items": {"type": "integer", "minimum": 1}},
            "leads": {"type": "array", "items": {"type": "integer", "minimum": 1}}
        },
        "required": ["data", "variables"]
    },
    description="Create lagged and lead variables for time series analysis"
)
async def lag_lead(context, params):
    """Create lagged and lead copies of the requested columns.

    Each lag ``k`` adds a ``<var>_lag<k>`` column (first ``k`` rows NA); each
    lead ``k`` adds ``<var>_lead<k>`` (last ``k`` rows NA). Row count is
    preserved.

    Args:
        context: Tool execution context used for structured logging.
        params: Validated tool input (see ``input_schema``). ``lags`` defaults
            to ``[1]``; ``leads`` defaults to none.

    Returns:
        dict: The augmented table, the list of newly created column names,
        the row count, and the operation name.

    Raises:
        Exception: Re-raised from ``execute_r_script``, e.g. when an offset
        is not smaller than the number of rows.
    """
    await context.info("Creating lag/lead variables")

    r_script = '''
    data <- as.data.frame(args$data)
    variables <- args$variables
    lags <- args$lags %||% c(1)
    leads <- args$leads %||% c()

    n <- nrow(data)
    # Fix: an offset >= n made c(rep(NA, k), head(x, -k)) the wrong length
    # and crashed the data.frame assignment with an opaque error.
    if (any(c(lags, leads) >= n)) {
      stop("lag/lead offsets must be smaller than the number of rows")
    }

    result_data <- data

    # Create lagged variables (shift forward: first `lag_val` entries are NA)
    for (var in variables) {
      for (lag_val in lags) {
        new_var <- paste0(var, "_lag", lag_val)
        result_data[[new_var]] <- c(rep(NA, lag_val), head(data[[var]], -lag_val))
      }
    }

    # Create lead variables (shift backward: last `lead_val` entries are NA)
    for (var in variables) {
      for (lead_val in leads) {
        new_var <- paste0(var, "_lead", lead_val)
        result_data[[new_var]] <- c(tail(data[[var]], -lead_val), rep(NA, lead_val))
      }
    }

    result <- list(
      data = result_data,
      variables_created = names(result_data)[!names(result_data) %in% names(data)],
      n_obs = nrow(result_data),
      operation = "lag_lead"
    )
    '''

    try:
        result = execute_r_script(r_script, params)
        await context.info("Lag/lead variables created successfully")
        return result

    except Exception as e:
        await context.error("Lag/lead creation failed", error=str(e))
        raise
72
+
73
+
74
@tool(
    name="winsorize",
    input_schema={
        "type": "object",
        "properties": {
            "data": table_schema(),
            "variables": {"type": "array", "items": {"type": "string"}},
            # Fix: items previously had "maximum": 0.5, which contradicted the
            # documented default [0.01, 0.99] — the upper percentile was
            # unrepresentable. Both bounds now span [0, 1]; ordering is
            # validated in the R script.
            "percentiles": {
                "type": "array",
                "items": {"type": "number", "minimum": 0, "maximum": 1},
                "minItems": 2,
                "maxItems": 2,
                "default": [0.01, 0.99]
            }
        },
        "required": ["data", "variables"]
    },
    description="Winsorize variables to handle outliers"
)
async def winsorize(context, params):
    """Cap extreme values of the requested columns at percentile thresholds.

    Values below the lower percentile are raised to it and values above the
    upper percentile are lowered to it, in place (column names unchanged).

    Args:
        context: Tool execution context used for structured logging.
        params: Validated tool input (see ``input_schema``). ``percentiles``
            is ``[lower, upper]`` with ``lower < upper``; defaults to
            ``[0.01, 0.99]``.

    Returns:
        dict: The winsorized table, a per-variable summary of thresholds and
        capped counts, the percentiles used, the variable list, and row count.

    Raises:
        Exception: Re-raised from ``execute_r_script``, e.g. when the
        percentiles are not strictly increasing.
    """
    await context.info("Winsorizing variables")

    r_script = '''
    data <- as.data.frame(args$data)
    variables <- args$variables
    percentiles <- args$percentiles %||% c(0.01, 0.99)

    # Guard against inverted bounds, which would silently collapse every
    # value to a single threshold.
    if (percentiles[1] >= percentiles[2]) {
      stop("percentiles must be strictly increasing: c(lower, upper)")
    }

    result_data <- data
    outliers_summary <- list()

    for (var in variables) {
      original_values <- data[[var]]

      # Calculate percentile thresholds
      lower_threshold <- quantile(original_values, percentiles[1], na.rm = TRUE)
      upper_threshold <- quantile(original_values, percentiles[2], na.rm = TRUE)

      # Winsorize
      winsorized <- pmax(pmin(original_values, upper_threshold), lower_threshold)
      result_data[[var]] <- winsorized

      # Track changes
      n_lower <- sum(original_values < lower_threshold, na.rm = TRUE)
      n_upper <- sum(original_values > upper_threshold, na.rm = TRUE)

      outliers_summary[[var]] <- list(
        lower_threshold = lower_threshold,
        upper_threshold = upper_threshold,
        n_capped_lower = n_lower,
        n_capped_upper = n_upper,
        total_capped = n_lower + n_upper
      )
    }

    result <- list(
      data = result_data,
      outliers_summary = outliers_summary,
      percentiles = percentiles,
      variables_winsorized = variables,
      n_obs = nrow(result_data)
    )
    '''

    try:
        result = execute_r_script(r_script, params)
        await context.info("Variables winsorized successfully")
        return result

    except Exception as e:
        await context.error("Winsorization failed", error=str(e))
        raise
147
+
148
+
149
@tool(
    name="difference",
    input_schema={
        "type": "object",
        "properties": {
            "data": table_schema(),
            "variables": {"type": "array", "items": {"type": "string"}},
            "order": {"type": "integer", "minimum": 1, "maximum": 3, "default": 1},
            "log_transform": {"type": "boolean", "default": False}
        },
        "required": ["data", "variables"]
    },
    description="Compute differences of variables (for stationarity)"
)
async def difference(context, params):
    """Compute (optionally log-) differenced versions of the requested columns.

    For each variable, optionally takes the natural log first (added as a
    ``log_<var>`` column), then computes differences up to ``order``. Each
    intermediate order ``i`` is stored as ``<base>_diff<i>`` (just
    ``<base>_diff`` when ``order`` is 1), NA-padded to preserve row count.

    Args:
        context: Tool execution context used for structured logging.
        params: Validated tool input (see ``input_schema``).

    Returns:
        dict: The augmented table, the differenced variable names, the
        difference order, the log-transform flag, and the row count.

    Raises:
        Exception: Re-raised from ``execute_r_script``, e.g. for non-positive
        values under ``log_transform`` or a series no longer than ``order``.
    """
    await context.info("Computing variable differences")

    r_script = '''
    data <- as.data.frame(args$data)
    variables <- args$variables
    diff_order <- args$order %||% 1
    log_transform <- args$log_transform %||% FALSE

    # Fix: differencing a series with <= diff_order rows yields columns of
    # the wrong length and crashes the data.frame assignment; fail clearly.
    if (nrow(data) <= diff_order) {
      stop(paste("Need more than", diff_order, "observations for order", diff_order, "differencing"))
    }

    result_data <- data

    for (var in variables) {
      original_values <- data[[var]]

      # Log transform first if requested
      if (log_transform) {
        if (any(original_values <= 0, na.rm = TRUE)) {
          stop(paste("Cannot log-transform", var, "- contains non-positive values"))
        }
        transformed <- log(original_values)
        log_var <- paste0("log_", var)
        result_data[[log_var]] <- transformed
        working_values <- transformed
        base_name <- log_var
      } else {
        working_values <- original_values
        base_name <- var
      }

      # Compute differences; each pass i loses one element, so pad with i NAs
      # at the front to keep every column the same length as the table.
      diff_values <- working_values
      for (i in 1:diff_order) {
        diff_values <- diff(diff_values)
        diff_name <- paste0(base_name, "_diff", if (diff_order > 1) i else "")

        padded_diff <- c(rep(NA, i), diff_values)
        result_data[[diff_name]] <- padded_diff
      }
    }

    result <- list(
      data = result_data,
      variables_differenced = variables,
      difference_order = diff_order,
      log_transformed = log_transform,
      n_obs = nrow(result_data)
    )
    '''

    try:
        result = execute_r_script(r_script, params)
        await context.info("Variable differences computed successfully")
        return result

    except Exception as e:
        await context.error("Differencing failed", error=str(e))
        raise
223
+
224
+
225
@tool(
    name="standardize",
    input_schema={
        "type": "object",
        "properties": {
            "data": table_schema(),
            "variables": {"type": "array", "items": {"type": "string"}},
            "method": {"type": "string", "enum": ["z_score", "min_max", "robust"], "default": "z_score"}
        },
        "required": ["data", "variables"]
    },
    description="Standardize variables using z-score, min-max, or robust scaling"
)
async def standardize(context, params):
    """Add scaled copies of the requested columns (``<var>_<method>``).

    Methods: ``z_score`` ((x - mean) / sd), ``min_max`` ((x - min) /
    (max - min)), ``robust`` ((x - median) / MAD). Original columns are left
    untouched.

    Args:
        context: Tool execution context used for structured logging.
        params: Validated tool input (see ``input_schema``).

    Returns:
        dict: The augmented table, the method used, per-variable scaling
        parameters, the variable list, and the row count.

    Raises:
        Exception: Re-raised from ``execute_r_script``, e.g. when a variable
        has zero spread so the scale denominator would be zero.
    """
    await context.info("Standardizing variables")

    r_script = '''
    data <- as.data.frame(args$data)
    variables <- args$variables
    method <- args$method %||% "z_score"

    result_data <- data
    scaling_info <- list()

    for (var in variables) {
      original_values <- data[[var]]

      if (method == "z_score") {
        mean_val <- mean(original_values, na.rm = TRUE)
        sd_val <- sd(original_values, na.rm = TRUE)
        # Fix: a zero denominator used to yield silent NaN/Inf columns.
        if (is.na(sd_val) || sd_val == 0) {
          stop(paste("Cannot z-score", var, "- standard deviation is zero"))
        }
        scaled <- (original_values - mean_val) / sd_val
        scaling_info[[var]] <- list(mean = mean_val, sd = sd_val)

      } else if (method == "min_max") {
        min_val <- min(original_values, na.rm = TRUE)
        max_val <- max(original_values, na.rm = TRUE)
        if (max_val == min_val) {
          stop(paste("Cannot min-max scale", var, "- all values are identical"))
        }
        scaled <- (original_values - min_val) / (max_val - min_val)
        scaling_info[[var]] <- list(min = min_val, max = max_val)

      } else if (method == "robust") {
        median_val <- median(original_values, na.rm = TRUE)
        mad_val <- mad(original_values, na.rm = TRUE)
        if (is.na(mad_val) || mad_val == 0) {
          stop(paste("Cannot robust-scale", var, "- MAD is zero"))
        }
        scaled <- (original_values - median_val) / mad_val
        scaling_info[[var]] <- list(median = median_val, mad = mad_val)
      }

      new_var <- paste0(var, "_", method)
      result_data[[new_var]] <- scaled
    }

    result <- list(
      data = result_data,
      scaling_method = method,
      scaling_info = scaling_info,
      variables_scaled = variables,
      n_obs = nrow(result_data)
    )
    '''

    try:
        result = execute_r_script(r_script, params)
        await context.info("Variables standardized successfully")
        return result

    except Exception as e:
        await context.error("Standardization failed", error=str(e))
        raise