npm - @shaxpir/duiduidui-models - Versions diffs - 1.9.20 → 1.9.21 - Mend

@shaxpir/duiduidui-models 1.9.20 → 1.9.21

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (3)

package/dist/models/SkillLevel.d.ts +108 -34
package/dist/models/SkillLevel.js +139 -53
package/package.json +1 -2

package/dist/models/SkillLevel.d.ts CHANGED

@@ -1,72 +1,146 @@
 import { ReviewResult } from './Review';
 import { Bounds } from './BayesianScore';
 /**
- * Represents a skill level rating with uncertainty bounds.
- * Uses the Glicko-2 rating system for skill assessment.
+ * Represents a skill level estimate with uncertainty.
+ * Uses Item Response Theory (IRT) for skill assessment.
+ *
+ * The skill level represents the estimated number of characters
+ * a user has mastered. A user with skill level N is expected to
+ * succeed on recognition tasks for characters with difficulty <= N.
  */
 export interface SkillLevel {
+    /** Estimated skill level (maps to ~number of characters mastered) */
+    mu: number;
+    /** Uncertainty in the estimate (standard deviation) */
+    sigma: number;
+}
+/**
+ * Legacy interface for backwards compatibility during migration.
+ * Maps to the new SkillLevel interface.
+ * @deprecated Use SkillLevel with mu/sigma instead
+ */
+export interface LegacySkillLevel {
     rating: number;
     rating_deviation: number;
     volatility: number;
 }
 /**
- * Model for updating and managing skill levels using the Glicko-2 rating system.
+ * Model for updating and managing skill levels using Item Response Theory (IRT).
  *
- * Unlike traditional Glicko-2 which uses a 1500-centered scale for chess,
- * this adapts the algorithm to DuiDuiDui's semantic scale where:
- * - Rating 0 = absolute beginner (knows ~0 characters)
- * - Rating 100 = knows ~100 characters
- * - Rating 3000 = knows ~3000 characters
+ * This model estimates user skill based on a logistic psychometric function:
+ *   P(success | difficulty d, skill μ) = 1 / (1 + exp(k * (d - μ)))
  *
- * The Glicko-2 algorithm is used without the typical scaling transformations,
- * working directly on our 0-10000 absolute scale.
+ * Where:
+ * - μ (mu) is the skill level we're estimating
+ * - k controls the steepness of the transition from "easy" to "hard"
+ * - Cards with difficulty < μ are likely to be answered correctly
+ * - Cards with difficulty > μ are likely to be answered incorrectly
+ *
+ * The model uses Bayesian updating with a Gaussian approximation:
+ * - Each observation updates μ based on prediction error
+ * - Uncertainty (σ) decreases as we accumulate evidence
+ * - No full history is needed - just μ and σ are sufficient statistics
+ *
+ * Scale semantics:
+ * - μ = 0: absolute beginner (knows ~0 characters)
+ * - μ = 100: knows ~100 characters
+ * - μ = 3000: knows ~3000 characters
  */
 export declare class SkillLevelModel {
     /**
-     * Update skill level using the Glicko-2 algorithm after a review.
+     * Steepness parameter for the logistic function.
+     *
+     * Controls how sharply success probability drops as difficulty exceeds skill:
+     * - k = 0.05 means the transition zone spans ~40 difficulty points
+     * - At difficulty = μ, P(success) = 50%
+     * - At difficulty = μ + 20, P(success) ≈ 27%
+     * - At difficulty = μ + 40, P(success) ≈ 12%
+     *
+     * Lower k = more gradual transition, higher k = sharper cutoff.
+     */
+    private static readonly K;
+    /**
+     * Minimum sigma value to prevent over-confidence.
+     * Even with many observations, we maintain some uncertainty.
+     */
+    private static readonly MIN_SIGMA;
+    /**
+     * Maximum sigma value for initial state.
+     */
+    private static readonly MAX_SIGMA;
+    /**
+     * Update skill level using IRT after a review.
      *
-     * @param rating Current skill level rating
-     * @param ratingDeviation Current rating deviation (uncertainty)
-     * @param volatility Current volatility (performance consistency)
-     * @param cardDifficulty Difficulty of the card reviewed (on same scale as rating)
-     * @param cardRatingDeviation Rating deviation for the card (typically fixed, e.g., 100)
+     * Uses Bayesian updating with a Gaussian approximation to the posterior.
+     * The update is incremental - only requires current μ and σ, not full history.
+     *
+     * @param mu Current skill level estimate
+     * @param sigma Current uncertainty (standard deviation)
+     * @param cardDifficulty Difficulty of the card reviewed
      * @param outcome Review result (FAIL/HARD/GOOD/EASY)
-     * @param tau System constant controlling volatility changes (default 0.5)
-     * @returns Updated skill level with new rating, rating_deviation, and volatility
+     * @returns Updated skill level with new mu and sigma
      */
-    static updateWithGlicko2(rating: number, ratingDeviation: number, volatility: number, cardDifficulty: number, cardRatingDeviation: number, outcome: ReviewResult, tau?: number): SkillLevel;
+    static update(mu: number, sigma: number, cardDifficulty: number, outcome: ReviewResult): SkillLevel;
     /**
-     * Map a review outcome to a numeric score for Glicko-2.
+     * Update skill level using IRT (Glicko-2 compatible signature).
+     *
+     * This method provides backwards compatibility with the old Glicko-2 API.
+     * The volatility and cardRatingDeviation parameters are ignored.
+     *
+     * @deprecated Use update() instead for cleaner IRT semantics
+     */
+    static updateWithGlicko2(rating: number, ratingDeviation: number, _volatility: number, cardDifficulty: number, _cardRatingDeviation: number, outcome: ReviewResult, _tau?: number): LegacySkillLevel;
+    /**
+     * Map a review outcome to a success score for IRT.
      *
      * @param outcome Review result
-     * @returns Numeric score from 0.0 (complete failure) to 1.0 (perfect success)
+     * @returns Success score from 0.0 (complete failure) to 1.0 (perfect success)
      */
     static outcomeToScore(outcome: ReviewResult): number;
     /**
-     * Calculate confidence bounds from Glicko-2 parameters.
-     * Returns a proper statistical confidence interval.
+     * Calculate the probability of success on a card given skill level.
+     *
+     * @param mu Skill level estimate
+     * @param cardDifficulty Difficulty of the card
+     * @returns Probability of success (0 to 1)
+     */
+    static predictSuccess(mu: number, cardDifficulty: number): number;
+    /**
+     * Calculate confidence bounds for the skill estimate.
      *
-     * @param rating Current skill level rating
-     * @param ratingDeviation Rating deviation (standard deviation of rating)
+     * @param mu Skill level estimate
+     * @param sigma Uncertainty (standard deviation)
      * @param confidence Confidence level (0.95 for 95%, 0.99 for 99%)
      * @returns Bounds object with lower and upper confidence limits
      */
-    static calculateBounds(rating: number, ratingDeviation: number, confidence?: number): Bounds;
+    static calculateBounds(mu: number, sigma: number, confidence?: number): Bounds;
     /**
      * Create a default skill level for a new user.
-     * Starts at rating 0 (knows no characters) with high uncertainty.
+     * Starts at skill 0 (knows no characters) with high uncertainty.
      *
-     * @param initialRatingDeviation Initial rating deviation (default 50, meaning ±100 char uncertainty at 95% CI)
-     * @param initialVolatility Initial volatility (default 0.06, moderate)
+     * @param initialSigma Initial uncertainty (default 50)
      * @returns New SkillLevel object
      */
-    static createDefault(initialRatingDeviation?: number, initialVolatility?: number): SkillLevel;
+    static createDefault(initialSigma?: number): SkillLevel;
+    /**
+     * Create a default skill level in legacy format.
+     * @deprecated Use createDefault() instead
+     */
+    static createDefaultLegacy(initialRatingDeviation?: number, initialVolatility?: number): LegacySkillLevel;
+    /**
+     * Convert from legacy Glicko-2 format to IRT format.
+     */
+    static fromLegacy(legacy: LegacySkillLevel): SkillLevel;
+    /**
+     * Convert from IRT format to legacy Glicko-2 format.
+     */
+    static toLegacy(skill: SkillLevel): LegacySkillLevel;
     /**
      * Check if the skill level has high confidence (low uncertainty).
      *
-     * @param ratingDeviation Rating deviation
-     * @param threshold Maximum rating deviation to be considered "high confidence" (default 15)
-     * @returns True if uncertainty is low (rating deviation below threshold)
+     * @param sigma Uncertainty (standard deviation)
+     * @param threshold Maximum sigma to be considered "high confidence" (default 15)
+     * @returns True if uncertainty is low
      */
-    static isHighConfidence(ratingDeviation: number, threshold?: number): boolean;
+    static isHighConfidence(sigma: number, threshold?: number): boolean;
 }

package/dist/models/SkillLevel.js CHANGED

@@ -1,106 +1,192 @@
 "use strict";
-var __importDefault = (this && this.__importDefault) || function (mod) {
-    return (mod && mod.__esModule) ? mod : { "default": mod };
-};
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.SkillLevelModel = void 0;
-const glicko2_lite_1 = __importDefault(require("glicko2-lite"));
 /**
- * Model for updating and managing skill levels using the Glicko-2 rating system.
+ * Model for updating and managing skill levels using Item Response Theory (IRT).
  *
- * Unlike traditional Glicko-2 which uses a 1500-centered scale for chess,
- * this adapts the algorithm to DuiDuiDui's semantic scale where:
- * - Rating 0 = absolute beginner (knows ~0 characters)
- * - Rating 100 = knows ~100 characters
- * - Rating 3000 = knows ~3000 characters
+ * This model estimates user skill based on a logistic psychometric function:
+ *   P(success | difficulty d, skill μ) = 1 / (1 + exp(k * (d - μ)))
  *
- * The Glicko-2 algorithm is used without the typical scaling transformations,
- * working directly on our 0-10000 absolute scale.
+ * Where:
+ * - μ (mu) is the skill level we're estimating
+ * - k controls the steepness of the transition from "easy" to "hard"
+ * - Cards with difficulty < μ are likely to be answered correctly
+ * - Cards with difficulty > μ are likely to be answered incorrectly
+ *
+ * The model uses Bayesian updating with a Gaussian approximation:
+ * - Each observation updates μ based on prediction error
+ * - Uncertainty (σ) decreases as we accumulate evidence
+ * - No full history is needed - just μ and σ are sufficient statistics
+ *
+ * Scale semantics:
+ * - μ = 0: absolute beginner (knows ~0 characters)
+ * - μ = 100: knows ~100 characters
+ * - μ = 3000: knows ~3000 characters
  */
 class SkillLevelModel {
     /**
-     * Update skill level using the Glicko-2 algorithm after a review.
+     * Update skill level using IRT after a review.
+     *
+     * Uses Bayesian updating with a Gaussian approximation to the posterior.
+     * The update is incremental - only requires current μ and σ, not full history.
      *
-     * @param rating Current skill level rating
-     * @param ratingDeviation Current rating deviation (uncertainty)
-     * @param volatility Current volatility (performance consistency)
-     * @param cardDifficulty Difficulty of the card reviewed (on same scale as rating)
-     * @param cardRatingDeviation Rating deviation for the card (typically fixed, e.g., 100)
+     * @param mu Current skill level estimate
+     * @param sigma Current uncertainty (standard deviation)
+     * @param cardDifficulty Difficulty of the card reviewed
      * @param outcome Review result (FAIL/HARD/GOOD/EASY)
-     * @param tau System constant controlling volatility changes (default 0.5)
-     * @returns Updated skill level with new rating, rating_deviation, and volatility
+     * @returns Updated skill level with new mu and sigma
+     */
+    static update(mu, sigma, cardDifficulty, outcome) {
+        const k = SkillLevelModel.K;
+        // Map outcome to success value (0 to 1)
+        const y = SkillLevelModel.outcomeToScore(outcome);
+        // Predicted probability of success given current skill estimate
+        const p = 1 / (1 + Math.exp(k * (cardDifficulty - mu)));
+        // Prediction error: positive if did better than expected, negative if worse
+        const error = y - p;
+        // Fisher information for logistic model (highest at p = 0.5)
+        const info = p * (1 - p);
+        // Update variance (precision increases with information)
+        const sigmaSquared = sigma * sigma;
+        const newSigmaSquared = 1 / (1 / sigmaSquared + k * k * info);
+        const newSigma = Math.sqrt(newSigmaSquared);
+        // Update mean (shift toward evidence)
+        const newMu = mu + newSigmaSquared * k * error;
+        return {
+            mu: Math.max(0, newMu), // Skill can't go negative
+            sigma: Math.max(SkillLevelModel.MIN_SIGMA, Math.min(SkillLevelModel.MAX_SIGMA, newSigma))
+        };
+    }
+    /**
+     * Update skill level using IRT (Glicko-2 compatible signature).
+     *
+     * This method provides backwards compatibility with the old Glicko-2 API.
+     * The volatility and cardRatingDeviation parameters are ignored.
+     *
+     * @deprecated Use update() instead for cleaner IRT semantics
      */
-    static updateWithGlicko2(rating, ratingDeviation, volatility, cardDifficulty, cardRatingDeviation, outcome, tau = 0.5) {
-        // Map outcome to numeric score (0.0 to 1.0)
-        const score = SkillLevelModel.outcomeToScore(outcome);
-        // Call glicko2-lite with a single match
-        // Match format: [opponentRating, opponentRD, outcome]
-        const result = (0, glicko2_lite_1.default)(rating, ratingDeviation, volatility, [
-            [cardDifficulty, cardRatingDeviation, score]
-        ], { tau });
+    static updateWithGlicko2(rating, ratingDeviation, _volatility, cardDifficulty, _cardRatingDeviation, outcome, _tau = 0.5) {
+        const result = SkillLevelModel.update(rating, ratingDeviation, cardDifficulty, outcome);
+        // Return in legacy format
         return {
-            rating: result.rating,
-            rating_deviation: result.rd,
-            volatility: result.vol
+            rating: result.mu,
+            rating_deviation: result.sigma,
+            volatility: 0.06 // Fixed value, not used in IRT
         };
     }
     /**
-     * Map a review outcome to a numeric score for Glicko-2.
+     * Map a review outcome to a success score for IRT.
      *
      * @param outcome Review result
-     * @returns Numeric score from 0.0 (complete failure) to 1.0 (perfect success)
+     * @returns Success score from 0.0 (complete failure) to 1.0 (perfect success)
      */
     static outcomeToScore(outcome) {
         switch (outcome) {
             case 'EASY': return 1.0;
-            case 'GOOD': return 0.67;
-            case 'HARD': return 0.33;
+            case 'GOOD': return 0.85;
+            case 'HARD': return 0.3;
             case 'FAIL': return 0.0;
         }
     }
     /**
-     * Calculate confidence bounds from Glicko-2 parameters.
-     * Returns a proper statistical confidence interval.
+     * Calculate the probability of success on a card given skill level.
      *
-     * @param rating Current skill level rating
-     * @param ratingDeviation Rating deviation (standard deviation of rating)
+     * @param mu Skill level estimate
+     * @param cardDifficulty Difficulty of the card
+     * @returns Probability of success (0 to 1)
+     */
+    static predictSuccess(mu, cardDifficulty) {
+        return 1 / (1 + Math.exp(SkillLevelModel.K * (cardDifficulty - mu)));
+    }
+    /**
+     * Calculate confidence bounds for the skill estimate.
+     *
+     * @param mu Skill level estimate
+     * @param sigma Uncertainty (standard deviation)
      * @param confidence Confidence level (0.95 for 95%, 0.99 for 99%)
      * @returns Bounds object with lower and upper confidence limits
      */
-    static calculateBounds(rating, ratingDeviation, confidence = 0.95) {
+    static calculateBounds(mu, sigma, confidence = 0.95) {
         // Z-score for desired confidence level
-        // 95% CI: ±1.96 standard deviations
-        // 99% CI: ±2.58 standard deviations
         const z = confidence === 0.95 ? 1.96 : confidence === 0.99 ? 2.58 : 1.96;
         return {
-            lower: Math.max(0, rating - z * ratingDeviation),
-            upper: Math.max(0, rating + z * ratingDeviation)
+            lower: Math.max(0, mu - z * sigma),
+            upper: mu + z * sigma
         };
     }
     /**
      * Create a default skill level for a new user.
-     * Starts at rating 0 (knows no characters) with high uncertainty.
+     * Starts at skill 0 (knows no characters) with high uncertainty.
      *
-     * @param initialRatingDeviation Initial rating deviation (default 50, meaning ±100 char uncertainty at 95% CI)
-     * @param initialVolatility Initial volatility (default 0.06, moderate)
+     * @param initialSigma Initial uncertainty (default 50)
      * @returns New SkillLevel object
      */
-    static createDefault(initialRatingDeviation = 50, initialVolatility = 0.06) {
+    static createDefault(initialSigma = 50) {
+        return {
+            mu: 0,
+            sigma: initialSigma
+        };
+    }
+    /**
+     * Create a default skill level in legacy format.
+     * @deprecated Use createDefault() instead
+     */
+    static createDefaultLegacy(initialRatingDeviation = 50, initialVolatility = 0.06) {
         return {
             rating: 0,
             rating_deviation: initialRatingDeviation,
             volatility: initialVolatility
         };
     }
+    /**
+     * Convert from legacy Glicko-2 format to IRT format.
+     */
+    static fromLegacy(legacy) {
+        return {
+            mu: legacy.rating,
+            sigma: legacy.rating_deviation
+        };
+    }
+    /**
+     * Convert from IRT format to legacy Glicko-2 format.
+     */
+    static toLegacy(skill) {
+        return {
+            rating: skill.mu,
+            rating_deviation: skill.sigma,
+            volatility: 0.06
+        };
+    }
     /**
      * Check if the skill level has high confidence (low uncertainty).
      *
-     * @param ratingDeviation Rating deviation
-     * @param threshold Maximum rating deviation to be considered "high confidence" (default 15)
-     * @returns True if uncertainty is low (rating deviation below threshold)
+     * @param sigma Uncertainty (standard deviation)
+     * @param threshold Maximum sigma to be considered "high confidence" (default 15)
+     * @returns True if uncertainty is low
      */
-    static isHighConfidence(ratingDeviation, threshold = 15) {
-        return ratingDeviation < threshold;
+    static isHighConfidence(sigma, threshold = 15) {
+        return sigma < threshold;
     }
 }
 exports.SkillLevelModel = SkillLevelModel;
+/**
+ * Steepness parameter for the logistic function.
+ *
+ * Controls how sharply success probability drops as difficulty exceeds skill:
+ * - k = 0.05 means the transition zone spans ~40 difficulty points
+ * - At difficulty = μ, P(success) = 50%
+ * - At difficulty = μ + 20, P(success) ≈ 27%
+ * - At difficulty = μ + 40, P(success) ≈ 12%
+ *
+ * Lower k = more gradual transition, higher k = sharper cutoff.
+ */
+SkillLevelModel.K = 0.05;
+/**
+ * Minimum sigma value to prevent over-confidence.
+ * Even with many observations, we maintain some uncertainty.
+ */
+SkillLevelModel.MIN_SIGMA = 5;
+/**
+ * Maximum sigma value for initial state.
+ */
+SkillLevelModel.MAX_SIGMA = 100;

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "@shaxpir/duiduidui-models",
-  "version": "1.9.20",
+  "version": "1.9.21",
   "repository": {
     "type": "git",
     "url": "https://github.com/shaxpir/duiduidui-models"
@@ -19,7 +19,6 @@
     "@shaxpir/duiduidui-models": "^1.4.14",
     "@shaxpir/sharedb": "^6.0.6",
     "@shaxpir/shaxpir-common": "^1.4.1",
-    "glicko2-lite": "^4.0.0",
     "ot-json1": "1.0.1",
     "ot-text-unicode": "4.0.0",
     "reconnecting-websocket": "4.4.0"