PyPI - iita-python - Versions diffs - 1.0.2__tar.gz → 1.2__tar.gz - Mend

iita-python 1.0.2tar.gz → 1.2tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (24) hide show

{iita_python-1.0.2/iita_python.egg-info → iita_python-1.2}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: iita_python
-Version: 1.0.2
+Version: 1.2
 Summary: IITA algorithm in python
 Author-email: Aliaksei Badnarchuk <alexejbodnarchuk@gmail.com>
 Requires-Python: >=3.9
@@ -111,7 +111,7 @@ Returns: float (MSE, lower is better)
 ## Testing
-See the `test_ipynbs` folder. You can open the Jupyter notebooks in Google Colab and run all cells to see test results.
+See the `testing` branch. You can open the Jupyter notebooks in Google Colab and run all cells to see test results.
 I am comparing my results on the PISA dataset to those of Milan Segedinac ([his implementation](https://github.com/milansegedinac/kst))

{iita_python-1.0.2 → iita_python-1.2}/README.md RENAMED Viewed

@@ -101,7 +101,7 @@ Returns: float (MSE, lower is better)
 ## Testing
-See the `test_ipynbs` folder. You can open the Jupyter notebooks in Google Colab and run all cells to see test results.
+See the `testing` branch. You can open the Jupyter notebooks in Google Colab and run all cells to see test results.
 I am comparing my results on the PISA dataset to those of Milan Segedinac ([his implementation](https://github.com/milansegedinac/kst))

{iita_python-1.0.2 → iita_python-1.2}/iita_python/_version.py RENAMED Viewed

@@ -28,7 +28,7 @@ version_tuple: VERSION_TUPLE
 commit_id: COMMIT_ID
 __commit_id__: COMMIT_ID
-__version__ = version = '1.0.2'
-__version_tuple__ = version_tuple = (1, 0, 2)
+__version__ = version = '1.2'
+__version_tuple__ = version_tuple = (1, 2)
-__commit_id__ = commit_id = 'g481ee8703'
+__commit_id__ = commit_id = 'gb97b590cd'

iita_python-1.2/iita_python/additional_ce.py ADDED Viewed

@@ -0,0 +1,101 @@
+import numpy as np
+import pandas as pd
+import numpy.typing as npt
+from typing import Self, List
+from iita_python.dataset import Dataset
+def pairwise_diff_ce(rp: pd.DataFrame) -> pd.DataFrame:
+    """
+    Compute counterexamples from response patterns using pairwise item differences.
+
+    For every subject (row) and every ordered item pair (a, b), the positive part of
+    rp[b] - rp[a] is added to ce.loc[a, b]. With binary data this counts the subjects
+    with a=0 and b=1; with graded data it accumulates the size of the violation.
+    Rows are read positionally, so the row labels of rp do not have to be 0..n-1.
+    Missing values are not supported: a NaN response propagates into the result.
+
+    Returns an items x items DataFrame labelled 0..items-1 on both axes.
+    """
+    values = rp.to_numpy()
+    items = values.shape[1]
+    # Accumulate in a plain array; at least int64 so binary input keeps integer counts.
+    totals = np.zeros((items, items), dtype=np.result_type(values.dtype, np.int64))
+    for row in values:
+        # entry [a, b] is row[b] - row[a]; only cases with a < b count as counterexamples
+        totals += np.clip(row[None, :] - row[:, None], 0, None)
+    return pd.DataFrame(totals, index=np.arange(items), columns=np.arange(items))
+def missing_value_substitution_ce(rp: pd.DataFrame) -> pd.DataFrame:
+    """
+    Compute pairwise-difference counterexamples after imputing missing responses.
+
+    Every missing value is replaced by the mean of the non-missing responses to the
+    same item (column), so some counterexample amounts become fractional.
+    Works for non-binary data because it does not rely on strict 0/1 values.
+    The input DataFrame is not modified.
+    """
+    # DataFrame.mean skips NaN by default and yields one mean per column; fillna with
+    # that Series fills each column with its own mean, whatever the row/column labels.
+    filled = rp.fillna(rp.mean())
+    # then calculate pairwise difference counterexamples
+    return pairwise_diff_ce(filled)
+def relativify(calculator: callable):
+    """
+    Decorator that turns a counterexample calculator into a relative one.
+
+    The returned function calls calculator(rp) and divides the result, cell by cell,
+    by the number of subjects for which both items of the pair are non-missing.
+    Pairs with no such subject are divided by 1 instead of 0.
+    """
+    def wrapper(rp: pd.DataFrame):
+        ce = calculator(rp)
+        items = rp.shape[1]
+        # observed[s, a] is 1 when subject s has a response for item a, so
+        # observed.T @ observed counts, per pair (a, b), the subjects with both.
+        observed = rp.notna().to_numpy().astype(int)
+        valid_cases = pd.DataFrame(observed.T @ observed, index=np.arange(items), columns=np.arange(items))
+        # avoid division by zero
+        valid_cases = valid_cases.replace(0, 1)
+        return ce / valid_cases
+    # An f-string placed at the top of a function is not stored as its docstring,
+    # so the documentation has to be attached explicitly.
+    base_name = getattr(calculator, '__name__', repr(calculator))
+    wrapper.__doc__ = (
+        f"Computes counterexamples relative to the amount of valid cases using {base_name} as base calculator\n"
+        "The counterexample amounts are divided by the number of cases for each item pair where both items are not missing\n"
+    )
+    return wrapper
+class AdditionalCEDataset(Dataset):
+    def __init__(self, response_patterns: pd.DataFrame | npt.NDArray | List[List[int]]):
+        """
+        Computes the counterexamples and equivalence examples from response patterns\n
+        Supports pandas dataframes, numpy arrays, and python lists\n
+        Rows represent the subjects, columns - the items\n
+        In addition to the base Dataset, this class provides additional counterexample calculators:\n
+        - pairwise_diff_ce: computes counterexamples using pairwise differences of item correspondences, allowing for non-binary data\n
+        - missing_value_substitution_ce: computes counterexamples using pairwise differences with missing values substituted by item means\n
+        """
+        super().__init__(response_patterns)
+    def _run_calculator(self, calculator, args, relative):
+        """Apply calculator (relativified when requested) to the response patterns."""
+        target = self
+        # These calculators used to be lambdas with an explicit `self` parameter stored
+        # as instance attributes, which Python never binds; the only call that worked
+        # was ds.method(ds[, relative]). Keep accepting that explicit dataset argument.
+        if args and isinstance(args[0], Dataset):
+            target, args = args[0], args[1:]
+        if len(args) > 1:
+            raise TypeError('expected at most one positional argument: relative')
+        if args:
+            relative = args[0]
+        chosen = relativify(calculator) if relative else calculator
+        return chosen(target.rp)
+    def pairwise_diff_ce(self, *args, relative: bool = False) -> pd.DataFrame:
+        """
+        Counterexamples from pairwise differences of the response patterns.
+        Pass relative=True to divide by the number of valid cases per item pair.
+        Does not support missing values in the response patterns.
+        """
+        # inside a method body the bare name is the module-level function, not this method
+        return self._run_calculator(pairwise_diff_ce, args, relative)
+    def missing_value_substitution_ce(self, *args, relative: bool = False) -> pd.DataFrame:
+        """
+        Pairwise-difference counterexamples with missing values replaced by item means.
+        Pass relative=True to divide by the number of valid cases per item pair.
+        """
+        # inside a method body the bare name is the module-level function, not this method
+        return self._run_calculator(missing_value_substitution_ce, args, relative)

{iita_python-1.0.2 → iita_python-1.2}/iita_python/dataset.py RENAMED Viewed

@@ -31,7 +31,7 @@ class Dataset():
     @property
     def items(self):
-        return self.ce.shape[0]
+        return self.rp.shape[1]
     @property
     def subjects(self):
@@ -52,31 +52,44 @@ class Dataset():
         self._eqe = None
         #counterexamples computation
-        self.ce = pd.DataFrame(0, index=np.arange(self.rp.shape[1]), columns=np.arange(self.rp.shape[1]))
+        self.ce = pd.DataFrame(0, index=np.arange(self.items), columns=np.arange(self.items))
-        for i in range(len(self.rp)):
-            #for subject i, find all cases where a=0 and b=1 (counterexamples to b->a or a <= b) and increment where they intersect
+        for i in range(self.subjects):
+            #for subject i, increment all cases where a=0 and b=1 (counterexamples to b->a or a <= b)
             not_a = (self.rp.loc[i] == 0)
             b = (self.rp.loc[i] == 1)
             self.ce.loc[not_a, b] += 1
         #equivalence examples computation
-        self.eqe = pd.DataFrame(0, index=np.arange(self.rp.shape[1]), columns=np.arange(self.rp.shape[1]))
-        for i in range(len(self.rp)):
+        self.eqe = pd.DataFrame(0, index=np.arange(self.items), columns=np.arange(self.items))
+        for i in range(self.subjects):
             #for subject i, increment all cases where a=b (examples of equivalence of a and b)
             row = self.rp.loc[i].to_numpy()
             self.eqe += np.equal.outer(row, row).astype(int)
+        self.valid_ce_cases = pd.DataFrame(0, index=np.arange(self.items), columns=np.arange(self.items))
+        for i in range(self.subjects):
+            #for subject i, increment all cases where neither a nor b are NaN (valid case for counterexamples)
+            not_nan = np.logical_not(self.rp.loc[i].isna())
+            self.valid_ce_cases += np.outer(not_nan, not_nan).astype(int)
     def add(self, dataset_to_add: Self):
         """
         Add a second IITA_Dataset: concatenate the response patterns, add counterexamples and equivalence examples\n
         Item amounts must match, else ValueError
         """
-        if (self.rp.shape[1] != dataset_to_add.shape[1]):
+        if (self.items != dataset_to_add.items):
             raise ValueError('Item amounts must match')
         self.rp = pd.concat(self.rp, dataset_to_add.rp)
         self.ce = self.ce + dataset_to_add.ce
         self.eqe = self.eqe + dataset_to_add.eqe
+    @property
+    def relative_ce(self) -> pd.DataFrame:
+        """
+        Returns the counterexamples matrix accounting for missing values:
+        each count is divided by the number of subjects with both items non-missing
+        """
+        # An item pair that no subject answered jointly has 0 valid cases; divide by 1
+        # there so the cell does not become NaN from a 0/0 division.
+        return self.ce / self.valid_ce_cases.replace(0, 1)
     __iadd__ = add

{iita_python-1.0.2 → iita_python-1.2}/iita_python/quasiorder.py RENAMED Viewed

@@ -23,30 +23,20 @@ class QuasiOrder:
         return edge_list
 def unfold_examples(
-        matrix: pd.DataFrame,
-        relativity: npt.NDArray | None = None,
-        dtype=np.float32
+        matrix: pd.DataFrame
     ) -> npt.NDArray:
     """
     Turns an item/item metric DataFrame into
     a list of tuples of the form (x, [i, j]), where matrix[i, j] = x.\n
-    Can input a relativity matrix, then exery x gets divided by relativity[i, j].
-    This can be used to account for missing values
     """
-    dfmatrix = pd.DataFrame(matrix).astype(dtype)
-    rel = relativity
-    if (rel is None):
-        rel = np.ones(dfmatrix.shape, dtype=int)
-    dfmatrix = dfmatrix / rel
+    dfmatrix = pd.DataFrame(matrix)
     n = dfmatrix.shape[0]
     pos = np.arange(n, dtype=np.int_)
     i = np.repeat(pos, n)
     j = np.tile(pos, n)
-    res = np.array(list(zip(dfmatrix.to_numpy()[i, j], i, j)), dtype=np.int_)
+    res = np.array(list(zip(dfmatrix.to_numpy()[i, j], i, j)))
     return res[res[:, 1] != res[:, 2]]
 def ind_gen(counterexamples: npt.NDArray, n: int) -> list[QuasiOrder]:

{iita_python-1.0.2 → iita_python-1.2/iita_python.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: iita_python
-Version: 1.0.2
+Version: 1.2
 Summary: IITA algorithm in python
 Author-email: Aliaksei Badnarchuk <alexejbodnarchuk@gmail.com>
 Requires-Python: >=3.9
@@ -111,7 +111,7 @@ Returns: float (MSE, lower is better)
 ## Testing
-See the `test_ipynbs` folder. You can open the Jupyter notebooks in Google Colab and run all cells to see test results.
+See the `testing` branch. You can open the Jupyter notebooks in Google Colab and run all cells to see test results.
 I am comparing my results on the PISA dataset to those of Milan Segedinac ([his implementation](https://github.com/milansegedinac/kst))

{iita_python-1.0.2 → iita_python-1.2}/iita_python.egg-info/SOURCES.txt RENAMED Viewed

@@ -6,6 +6,7 @@ setup.py
 .github/workflows/release.yaml
 iita_python/__init__.py
 iita_python/_version.py
+iita_python/additional_ce.py
 iita_python/dataset.py
 iita_python/fit_metrics.py
 iita_python/quasiorder.py
@@ -14,8 +15,4 @@ iita_python.egg-info/PKG-INFO
 iita_python.egg-info/SOURCES.txt
 iita_python.egg-info/dependency_links.txt
 iita_python.egg-info/requires.txt
-iita_python.egg-info/top_level.txt
-test_ipynbs/fit_metrics.ipynb
-test_ipynbs/pisa.csv
-test_ipynbs/quasi-order-gen.ipynb
-test_ipynbs/sim_missing_data.ipynb
+iita_python.egg-info/top_level.txt

iita_python-1.0.2/test_ipynbs/fit_metrics.ipynb DELETED Viewed

@@ -1,235 +0,0 @@
-{
-  "cells": [
-    {
-      "cell_type": "markdown",
-      "id": "aefc5a77",
-      "metadata": {
-        "id": "aefc5a77"
-      },
-      "source": [
-        "# Testing the fit metric calculation on the PISA dataset, comparing to the KST library by Milan Segedinac"
-      ]
-    },
-    {
-      "cell_type": "markdown",
-      "source": [
-        "1. Imporitng both libraries and requirements"
-      ],
-      "metadata": {
-        "id": "dzpt8hYXs7kO"
-      },
-      "id": "dzpt8hYXs7kO"
-    },
-    {
-      "cell_type": "code",
-      "source": [
-        "!git clone https://github.com/Alexe1900/iita_python.git\n",
-        "!git clone https://github.com/milansegedinac/kst.git\n",
-        "!pip install numpy\n",
-        "!pip install pandas\n",
-        "import sys\n",
-        "sys.path.append(\"/content/iita_python\")\n",
-        "sys.path.append(\"/content/kst\")\n",
-        "import numpy as np\n",
-        "import pandas as pd\n",
-        "import iita_python as test_iita\n",
-        "import learning_spaces.kst as kst"
-      ],
-      "metadata": {
-        "id": "s4P_gsz7tDlG",
-        "outputId": "03b37282-44e0-43f1-996e-ba3de8248eab",
-        "colab": {
-          "base_uri": "https://localhost:8080/"
-        }
-      },
-      "id": "s4P_gsz7tDlG",
-      "execution_count": 1,
-      "outputs": [
-        {
-          "output_type": "stream",
-          "name": "stdout",
-          "text": [
-            "fatal: destination path 'iita_python' already exists and is not an empty directory.\n",
-            "fatal: destination path 'kst' already exists and is not an empty directory.\n",
-            "Requirement already satisfied: numpy in /usr/local/lib/python3.12/dist-packages (2.0.2)\n",
-            "Requirement already satisfied: pandas in /usr/local/lib/python3.12/dist-packages (2.2.2)\n",
-            "Requirement already satisfied: numpy>=1.26.0 in /usr/local/lib/python3.12/dist-packages (from pandas) (2.0.2)\n",
-            "Requirement already satisfied: python-dateutil>=2.8.2 in /usr/local/lib/python3.12/dist-packages (from pandas) (2.9.0.post0)\n",
-            "Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.12/dist-packages (from pandas) (2025.2)\n",
-            "Requirement already satisfied: tzdata>=2022.7 in /usr/local/lib/python3.12/dist-packages (from pandas) (2025.2)\n",
-            "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.12/dist-packages (from python-dateutil>=2.8.2->pandas) (1.17.0)\n"
-          ]
-        }
-      ]
-    },
-    {
-      "cell_type": "markdown",
-      "source": [
-        "2. Importing the dataset, generating quasi-orders"
-      ],
-      "metadata": {
-        "id": "Wwxr0c_rtSMN"
-      },
-      "id": "Wwxr0c_rtSMN"
-    },
-    {
-      "cell_type": "code",
-      "source": [
-        "from iita_python.utils import read_rp\n",
-        "\n",
-        "data_raw = read_rp(\"iita_python/test_ipynbs/pisa.csv\")\n",
-        "data = test_iita.Dataset(data_raw)\n",
-        "\n",
-        "unfolded_ce = test_iita.unfold_examples(data.counterexamples)\n",
-        "qos = test_iita.ind_gen(unfolded_ce, data.items)"
-      ],
-      "metadata": {
-        "id": "7CZKj4kktWg6"
-      },
-      "id": "7CZKj4kktWg6",
-      "execution_count": 2,
-      "outputs": []
-    },
-    {
-      "cell_type": "markdown",
-      "source": [
-        "3. Testing the fit metrics"
-      ],
-      "metadata": {
-        "id": "t-RqTjTEuBUo"
-      },
-      "id": "t-RqTjTEuBUo"
-    },
-    {
-      "cell_type": "markdown",
-      "source": [
-        "3.1. Original IITA fit metric"
-      ],
-      "metadata": {
-        "id": "oXyUJR12jT22"
-      },
-      "id": "oXyUJR12jT22"
-    },
-    {
-      "cell_type": "code",
-      "source": [
-        "import iita_python.fit_metrics as test_fit\n",
-        "corrects = kst.iita(data.response_patterns, 3)['diff']\n",
-        "\n",
-        "for i, qo in enumerate(qos):\n",
-        "  test_metric = round(test_fit.orig_iita_fit(data, qo), 3)\n",
-        "  corr_metric = round(corrects[i], 3)\n",
-        "\n",
-        "  try:\n",
-        "    assert (test_metric == corr_metric)\n",
-        "    print(f'Fit metric {i}/{len(qos)} correct ✅')\n",
-        "  except AssertionError:\n",
-        "    print(f'Fit metric {i}/{len(qos)} incorrect ❌')\n",
-        "    print(f'Test: {test_metric}')\n",
-        "    print(f'Correct: {corr_metric}')"
-      ],
-      "metadata": {
-        "id": "a5IvxR1I7-BG",
-        "outputId": "abc3c1be-79b3-4721-9c7c-a6e0e6669ba7",
-        "colab": {
-          "base_uri": "https://localhost:8080/"
-        }
-      },
-      "id": "a5IvxR1I7-BG",
-      "execution_count": 8,
-      "outputs": [
-        {
-          "output_type": "stream",
-          "name": "stdout",
-          "text": [
-            "Fit metric 0/13 correct ✅\n",
-            "Fit metric 1/13 correct ✅\n",
-            "Fit metric 2/13 correct ✅\n",
-            "Fit metric 3/13 correct ✅\n",
-            "Fit metric 4/13 correct ✅\n",
-            "Fit metric 5/13 correct ✅\n",
-            "Fit metric 6/13 correct ✅\n",
-            "Fit metric 7/13 correct ✅\n",
-            "Fit metric 8/13 correct ✅\n",
-            "Fit metric 9/13 correct ✅\n",
-            "Fit metric 10/13 correct ✅\n",
-            "Fit metric 11/13 correct ✅\n",
-            "Fit metric 12/13 correct ✅\n"
-          ]
-        }
-      ]
-    },
-    {
-      "cell_type": "markdown",
-      "source": [
-        "3.2. Corrected fit metric"
-      ],
-      "metadata": {
-        "id": "VIPtCas5jXP3"
-      },
-      "id": "VIPtCas5jXP3"
-    },
-    {
-      "cell_type": "code",
-      "source": [
-        "corrects = kst.iita(data.response_patterns, 2)['diff']\n",
-        "\n",
-        "for i, qo in enumerate(qos):\n",
-        "  test_metric = round(test_fit.corr_iita_fit(data, qo), 3)\n",
-        "  corr_metric = round(corrects[i], 3)\n",
-        "\n",
-        "  try:\n",
-        "    assert (test_metric == corr_metric)\n",
-        "    print(f'Fit metric {i}/{len(qos)} correct ✅')\n",
-        "  except AssertionError:\n",
-        "    print(f'Fit metric {i}/{len(qos)} incorrect ❌')\n",
-        "    print(f'Test: {test_metric}')\n",
-        "    print(f'Correct: {corr_metric}')"
-      ],
-      "metadata": {
-        "id": "j1LoyigWjc5t",
-        "outputId": "bd2ca738-1a94-4ce8-b507-325a1acdf9e1",
-        "colab": {
-          "base_uri": "https://localhost:8080/"
-        }
-      },
-      "id": "j1LoyigWjc5t",
-      "execution_count": 9,
-      "outputs": [
-        {
-          "output_type": "stream",
-          "name": "stdout",
-          "text": [
-            "Fit metric 0/13 correct ✅\n",
-            "Fit metric 1/13 correct ✅\n",
-            "Fit metric 2/13 correct ✅\n",
-            "Fit metric 3/13 correct ✅\n",
-            "Fit metric 4/13 correct ✅\n",
-            "Fit metric 5/13 correct ✅\n",
-            "Fit metric 6/13 correct ✅\n",
-            "Fit metric 7/13 correct ✅\n",
-            "Fit metric 8/13 correct ✅\n",
-            "Fit metric 9/13 correct ✅\n",
-            "Fit metric 10/13 correct ✅\n",
-            "Fit metric 11/13 correct ✅\n",
-            "Fit metric 12/13 correct ✅\n"
-          ]
-        }
-      ]
-    }
-  ],
-  "metadata": {
-    "language_info": {
-      "name": "python"
-    },
-    "colab": {
-      "provenance": []
-    },
-    "kernelspec": {
-      "name": "python3",
-      "display_name": "Python 3"
-    }
-  },
-  "nbformat": 4,
-  "nbformat_minor": 5
-}

iita_python-1.0.2/test_ipynbs/pisa.csv DELETED Viewed

@@ -1,340 +0,0 @@
-1,0,0,0,0
-0,0,0,0,0
-1,0,0,0,0
-1,0,0,0,0
-0,1,0,0,0
-1,1,0,0,0
-0,0,0,0,0
-1,1,0,0,1
-1,1,0,0,0
-1,1,0,0,0
-1,0,0,0,0
-1,1,0,0,0
-0,0,0,0,0
-1,0,0,0,0
-1,0,0,0,0
-1,0,0,0,0
-0,0,0,0,0
-1,1,0,0,0
-1,1,0,0,0
-0,0,0,0,0
-1,0,0,0,0
-1,0,0,0,0
-1,1,0,0,0
-1,0,0,0,0
-0,1,0,0,0
-1,1,0,0,0
-1,0,0,0,0
-1,0,0,0,0
-0,0,0,0,0
-1,0,0,0,0
-0,1,0,1,0
-1,0,0,0,0
-1,1,0,0,0
-1,1,0,1,0
-1,1,0,0,0
-1,1,0,0,0
-1,1,0,0,0
-1,1,0,0,1
-1,0,0,0,0
-1,1,0,0,0
-1,1,0,0,0
-1,0,0,0,0
-1,1,0,0,0
-1,0,0,0,0
-1,1,0,0,0
-1,1,0,0,0
-1,1,0,1,0
-1,1,0,0,0
-1,1,0,1,0
-1,1,0,0,1
-1,1,0,0,0
-1,0,0,0,0
-1,1,0,0,0
-1,1,0,0,1
-1,1,0,0,0
-1,1,0,0,0
-1,0,0,0,1
-1,0,0,0,0
-1,1,0,0,0
-1,0,0,0,0
-1,0,0,0,0
-1,1,0,0,0
-1,1,0,0,0
-1,0,0,0,0
-1,1,0,0,0
-1,1,0,0,0
-1,1,0,0,0
-1,1,0,0,1
-1,1,0,0,0
-0,0,0,0,0
-1,1,0,1,0
-1,1,0,1,0
-1,1,0,1,0
-1,1,0,0,0
-1,1,0,0,0
-1,0,0,0,1
-1,0,0,0,0
-1,1,0,0,0
-1,1,0,1,0
-1,0,0,0,0
-0,0,0,0,0
-1,1,0,0,0
-1,1,0,0,0
-1,0,0,0,0
-1,1,0,0,0
-1,1,0,0,0
-1,1,0,0,0
-1,0,0,0,0
-1,0,0,0,1
-1,1,0,0,0
-1,1,0,0,0
-1,1,0,1,0
-1,1,0,0,1
-1,1,0,0,0
-1,0,0,0,0
-1,0,0,0,0
-1,1,0,0,0
-1,1,0,0,0
-1,1,0,1,0
-1,1,0,0,0
-1,1,0,0,1
-1,1,0,0,0
-1,1,0,0,0
-1,1,0,0,0
-1,1,0,1,0
-1,1,0,0,0
-1,1,0,0,0
-1,0,0,0,0
-1,1,0,0,0
-1,1,0,0,1
-1,1,0,1,0
-1,1,0,1,0
-1,1,0,0,1
-1,1,0,1,0
-1,1,0,1,0
-1,0,0,0,0
-1,1,0,1,0
-1,0,0,0,0
-0,1,0,0,0
-1,1,0,0,1
-1,1,0,0,0
-1,1,0,0,0
-1,1,0,0,0
-0,0,0,1,0
-0,0,0,0,0
-1,0,0,0,0
-1,0,0,0,0
-0,0,0,0,0
-0,1,0,0,0
-0,0,0,0,0
-1,0,0,0,0
-0,1,0,0,0
-1,1,0,0,0
-0,0,0,0,0
-1,1,0,0,0
-1,1,0,0,0
-1,0,0,1,0
-0,0,0,0,0
-0,1,0,0,0
-0,1,0,0,0
-1,1,0,0,0
-1,0,0,0,0
-1,1,0,0,0
-1,1,0,0,0
-1,0,0,0,0
-0,1,0,0,1
-1,1,0,0,0
-1,1,0,1,0
-1,0,0,0,0
-0,1,0,0,1
-1,0,0,0,0
-1,1,0,0,0
-0,0,0,0,0
-0,0,0,0,0
-1,1,0,0,0
-0,1,0,0,0
-0,0,0,0,0
-0,0,0,0,0
-0,0,0,0,0
-1,0,0,0,0
-0,1,1,0,0
-1,1,1,0,0
-1,0,1,0,0
-1,1,1,0,0
-0,1,1,1,0
-1,1,1,1,0
-1,1,1,1,1
-1,1,1,0,0
-0,0,1,0,0
-1,1,1,1,1
-1,1,1,0,0
-1,1,1,1,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,1
-1,0,1,0,0
-0,1,1,0,0
-1,0,1,0,0
-1,1,1,1,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,1
-1,0,1,0,0
-0,1,1,0,0
-1,0,1,1,0
-1,1,1,1,0
-1,1,1,0,0
-1,1,1,1,0
-1,0,1,0,0
-1,1,1,0,0
-1,1,1,0,1
-1,0,1,0,0
-1,1,1,0,0
-1,1,1,0,1
-1,1,1,0,1
-1,1,1,0,0
-1,0,1,1,1
-1,1,1,0,0
-1,1,1,1,1
-1,1,1,0,0
-0,1,1,0,0
-0,1,1,0,0
-0,1,1,0,0
-1,1,1,1,0
-1,1,1,0,0
-1,0,1,0,0
-1,0,1,0,1
-1,1,1,0,1
-1,1,1,0,0
-1,1,1,1,0
-1,1,1,0,0
-1,1,1,1,0
-1,0,1,0,0
-1,1,1,0,0
-0,1,1,0,0
-1,1,1,1,1
-1,1,1,0,0
-1,1,1,1,0
-1,1,1,1,0
-1,0,1,1,0
-1,1,1,0,1
-1,1,1,0,0
-1,1,1,1,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,1,0
-1,1,1,0,0
-1,1,1,1,0
-1,1,1,0,0
-1,0,1,1,0
-1,1,1,1,1
-1,1,1,0,0
-1,1,1,1,0
-1,1,1,1,0
-1,1,1,1,0
-1,1,1,1,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,1,0
-1,1,1,1,0
-1,1,1,1,1
-1,1,1,0,0
-1,1,1,1,0
-1,1,1,1,1
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,1
-1,0,1,1,0
-1,1,1,0,0
-1,1,1,1,1
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,1
-1,1,1,1,1
-0,1,1,0,1
-1,1,1,0,1
-1,0,1,0,0
-1,1,1,0,1
-1,1,1,0,1
-1,1,1,0,0
-1,1,1,0,1
-1,1,1,0,1
-1,1,1,1,0
-1,1,1,1,0
-1,1,1,1,0
-1,1,1,1,0
-0,1,1,0,0
-1,1,1,0,0
-0,1,1,1,0
-1,1,1,1,0
-1,1,1,1,0
-1,1,1,0,0
-1,1,1,1,1
-1,1,1,1,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,1
-1,1,1,1,0
-1,1,1,0,0
-1,1,1,0,1
-1,1,1,0,0
-1,1,1,1,0
-1,1,1,0,1
-1,1,1,1,1
-1,1,1,0,0
-1,1,1,1,0
-1,1,1,1,1
-1,1,1,1,0
-1,1,1,1,0
-1,1,1,1,0
-1,1,1,1,0
-1,1,1,1,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,1,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,1,0
-1,1,1,1,0
-1,1,1,1,0
-1,1,1,0,0
-1,0,1,0,0
-1,1,1,0,0
-1,0,1,0,0
-0,0,1,0,0
-1,0,1,0,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,0
-1,0,1,0,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,0,0
-1,1,1,1,0
-0,1,1,0,0
-1,0,1,1,0
-1,1,1,0,0
-1,0,1,0,0
-0,0,1,0,0
-0,0,1,0,0
-0,1,0,0,0
-0,1,0,0,0
-0,1,0,0,0
-1,0,0,0,0
-1,0,0,0,0
-0,0,0,0,0
-0,0,0,0,0

iita_python-1.0.2/test_ipynbs/quasi-order-gen.ipynb DELETED Viewed

@@ -1,219 +0,0 @@
-{
-  "cells": [
-    {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "cw9gSDCONN4s"
-      },
-      "source": [
-        "# Testing the quasi-order generation on the PISA dataset, comparing to the KST library by Milan Segedinac"
-      ]
-    },
-    {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "gH1gF08aNy22"
-      },
-      "source": [
-        "1. Importing both libraries and requirements"
-      ]
-    },
-    {
-      "cell_type": "code",
-      "execution_count": null,
-      "metadata": {
-        "colab": {
-          "base_uri": "https://localhost:8080/"
-        },
-        "id": "bvA-pXFUN36a",
-        "outputId": "fefbb9ca-5eb1-41ec-da36-fc31f7de1093"
-      },
-      "outputs": [
-        {
-          "name": "stdout",
-          "output_type": "stream",
-          "text": [
-            "fatal: destination path 'iita_python' already exists and is not an empty directory.\n",
-            "fatal: destination path 'kst' already exists and is not an empty directory.\n",
-            "Requirement already satisfied: numpy in /usr/local/lib/python3.12/dist-packages (2.0.2)\n",
-            "Requirement already satisfied: pandas in /usr/local/lib/python3.12/dist-packages (2.2.2)\n",
-            "Requirement already satisfied: numpy>=1.26.0 in /usr/local/lib/python3.12/dist-packages (from pandas) (2.0.2)\n",
-            "Requirement already satisfied: python-dateutil>=2.8.2 in /usr/local/lib/python3.12/dist-packages (from pandas) (2.9.0.post0)\n",
-            "Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.12/dist-packages (from pandas) (2025.2)\n",
-            "Requirement already satisfied: tzdata>=2022.7 in /usr/local/lib/python3.12/dist-packages (from pandas) (2025.2)\n",
-            "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.12/dist-packages (from python-dateutil>=2.8.2->pandas) (1.17.0)\n"
-          ]
-        }
-      ],
-      "source": [
-        "!git clone https://github.com/Alexe1900/iita_python.git\n",
-        "!git clone https://github.com/milansegedinac/kst.git\n",
-        "!pip install numpy\n",
-        "!pip install pandas\n",
-        "import sys\n",
-        "sys.path.append(\"/content/iita_python\")\n",
-        "sys.path.append(\"/content/kst\")\n",
-        "import numpy as np\n",
-        "import pandas as pd\n",
-        "import iita_python as iita\n",
-        "import learning_spaces.kst as kst"
-      ]
-    },
-    {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "CwlVMK3MO3QJ"
-      },
-      "source": [
-        "2. Importing the dataset"
-      ]
-    },
-    {
-      "cell_type": "code",
-      "execution_count": 3,
-      "metadata": {
-        "colab": {
-          "base_uri": "https://localhost:8080/"
-        },
-        "id": "FvSAv-4cOWQp",
-        "outputId": "4d1adf29-3d0c-40cf-d79d-9a8df3d9f945"
-      },
-      "outputs": [
-        {
-          "name": "stdout",
-          "output_type": "stream",
-          "text": [
-            "Data imported successfully ✅\n"
-          ]
-        }
-      ],
-      "source": [
-        "from iita_python.utils import read_rp\n",
-        "\n",
-        "data_raw = read_rp(\"iita_python/test_ipynbs/pisa.csv\")\n",
-        "assert not data_raw.empty\n",
-        "print(\"Data imported successfully ✅\")"
-      ]
-    },
-    {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "UVRNzocZTCZC"
-      },
-      "source": [
-        "3. Counting the counterexamples"
-      ]
-    },
-    {
-      "cell_type": "code",
-      "execution_count": 6,
-      "metadata": {
-        "colab": {
-          "base_uri": "https://localhost:8080/"
-        },
-        "id": "lWysv1UsTGPf",
-        "outputId": "d24fc04a-e60d-45c6-ce95-c77f859df45e"
-      },
-      "outputs": [
-        {
-          "name": "stdout",
-          "output_type": "stream",
-          "text": [
-            "Counterexamples computed correctly ✅\n"
-          ]
-        }
-      ],
-      "source": [
-        "data = iita.Dataset(data_raw)\n",
-        "\n",
-        "correct_ce = kst.ob_counter(data_raw)\n",
-        "\n",
-        "try:\n",
-        "  assert (correct_ce == data.counterexamples.to_numpy()).all()\n",
-        "  print(\"Counterexamples computed correctly ✅\")\n",
-        "except AssertionError:\n",
-        "  print(\"Counterexamples computed incorrectly ❌\")\n"
-      ]
-    },
-    {
-      "cell_type": "markdown",
-      "metadata": {
-        "id": "H7X3tEf7bGdt"
-      },
-      "source": [
-        "4. Generating the quasi-orders"
-      ]
-    },
-    {
-      "cell_type": "code",
-      "execution_count": null,
-      "metadata": {
-        "colab": {
-          "base_uri": "https://localhost:8080/"
-        },
-        "id": "Ywvri9o8bGA0",
-        "outputId": "438b2adf-3bb1-4784-cab7-ff32228d5eab"
-      },
-      "outputs": [
-        {
-          "name": "stdout",
-          "output_type": "stream",
-          "text": [
-            "Correct number of quasi-orders ✅\n",
-            "Quasi-order 0/13 correct ✅\n",
-            "Quasi-order 1/13 correct ✅\n",
-            "Quasi-order 2/13 correct ✅\n",
-            "Quasi-order 3/13 correct ✅\n",
-            "Quasi-order 4/13 correct ✅\n",
-            "Quasi-order 5/13 correct ✅\n",
-            "Quasi-order 6/13 correct ✅\n",
-            "Quasi-order 7/13 correct ✅\n",
-            "Quasi-order 8/13 correct ✅\n",
-            "Quasi-order 9/13 correct ✅\n",
-            "Quasi-order 10/13 correct ✅\n",
-            "Quasi-order 11/13 correct ✅\n",
-            "Quasi-order 12/13 correct ✅\n"
-          ]
-        }
-      ],
-      "source": [
-        "correct_qos = kst.ind_gen(correct_ce)\n",
-        "\n",
-        "unfolded_ce = iita.unfold_examples(data.counterexamples)\n",
-        "test_qos = iita.ind_gen(unfolded_ce, data.items)\n",
-        "test_qos = [sorted([(int(a), int(b)) for a, b in qo.get_edge_list()]) for qo in test_qos]\n",
-        "\n",
-        "try:\n",
-        "  assert len(correct_qos) == len(test_qos)\n",
-        "  print(f'Correct number of quasi-orders ✅')\n",
-        "except AssertionError:\n",
-        "  print(f'Wrong number of quasi-orders ❌')\n",
-        "  quit()\n",
-        "\n",
-        "for i, (corr_qo, test_qo) in enumerate(zip(correct_qos, test_qos)):\n",
-        "  corr_qo = sorted(corr_qo)\n",
-        "  try:\n",
-        "    assert corr_qo == test_qo\n",
-        "    print(f'Quasi-order {i}/{len(correct_qos)} correct ✅')\n",
-        "  except AssertionError:\n",
-        "    print(f'Quasi-order {i}/{len(correct_qos)} incorrect ❌')\n",
-        "    print(f'Test: {test_qo}')\n",
-        "    print(f'Correct: {corr_qo}')"
-      ]
-    }
-  ],
-  "metadata": {
-    "colab": {
-      "provenance": []
-    },
-    "kernelspec": {
-      "display_name": "Python 3",
-      "name": "python3"
-    },
-    "language_info": {
-      "name": "python"
-    }
-  },
-  "nbformat": 4,
-  "nbformat_minor": 0
-}

iita_python-1.0.2/test_ipynbs/sim_missing_data.ipynb DELETED Viewed

@@ -1,176 +0,0 @@
-{
-  "cells": [
-    {
-      "cell_type": "markdown",
-      "id": "c534cd3f",
-      "metadata": {
-        "id": "c534cd3f"
-      },
-      "source": [
-        "# Testing on PISA dataset with randomized missing data"
-      ]
-    },
-    {
-      "cell_type": "markdown",
-      "source": [
-        "1. Importing package and dataset"
-      ],
-      "metadata": {
-        "id": "1nLTjppYSRTe"
-      },
-      "id": "1nLTjppYSRTe"
-    },
-    {
-      "cell_type": "code",
-      "source": [
-        "!pip install iita_python\n",
-        "!git clone https://gist.github.com/717f0147675b0c8ed25e50d583c943bf.git\n",
-        "\n",
-        "import numpy as np\n",
-        "import iita_python as iita\n",
-        "import iita_python.fit_metrics as iita_fm\n",
-        "from iita_python.utils import read_rp\n",
-        "from random import randint\n",
-        "\n",
-        "data = read_rp('./717f0147675b0c8ed25e50d583c943bf/pisa.csv')"
-      ],
-      "metadata": {
-        "id": "SlEiX6B1SSsU",
-        "outputId": "55bf001f-aba5-493c-a3a6-77da399684c0",
-        "colab": {
-          "base_uri": "https://localhost:8080/"
-        }
-      },
-      "id": "SlEiX6B1SSsU",
-      "execution_count": 8,
-      "outputs": [
-        {
-          "output_type": "stream",
-          "name": "stdout",
-          "text": [
-            "Requirement already satisfied: iita_python in /usr/local/lib/python3.12/dist-packages (0.0.post42)\n",
-            "Requirement already satisfied: numpy in /usr/local/lib/python3.12/dist-packages (from iita_python) (2.0.2)\n",
-            "Requirement already satisfied: pandas in /usr/local/lib/python3.12/dist-packages (from iita_python) (2.2.2)\n",
-            "Requirement already satisfied: python-dateutil>=2.8.2 in /usr/local/lib/python3.12/dist-packages (from pandas->iita_python) (2.9.0.post0)\n",
-            "Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.12/dist-packages (from pandas->iita_python) (2025.2)\n",
-            "Requirement already satisfied: tzdata>=2022.7 in /usr/local/lib/python3.12/dist-packages (from pandas->iita_python) (2025.2)\n",
-            "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.12/dist-packages (from python-dateutil>=2.8.2->pandas->iita_python) (1.17.0)\n",
-            "fatal: destination path '717f0147675b0c8ed25e50d583c943bf' already exists and is not an empty directory.\n"
-          ]
-        }
-      ]
-    },
-    {
-      "cell_type": "markdown",
-      "source": [
-        "2. Testing function"
-      ],
-      "metadata": {
-        "id": "jlvoh1yOata0"
-      },
-      "id": "jlvoh1yOata0"
-    },
-    {
-      "cell_type": "code",
-      "source": [
-        "def test(metric):\n",
-        "  correct = True\n",
-        "  correct_qo = None\n",
-        "  correct_count = 0\n",
-        "\n",
-        "  while (correct and correct_count < data.shape[0]*data.shape[1]):\n",
-        "    print(f'doing {correct_count}')\n",
-        "    test_dataset = iita.Dataset(data)\n",
-        "    unfolded_ce = iita.unfold_examples(test_dataset.ce)\n",
-        "    qos = iita.ind_gen(unfolded_ce, test_dataset.items)\n",
-        "\n",
-        "    best_qo_id = -1\n",
-        "    best_qo_diff = float('inf')\n",
-        "    for i, qo in enumerate(qos):\n",
-        "      qo_diff = metric(test_dataset, qo)\n",
-        "      if (qo_diff < best_qo_diff):\n",
-        "        best_qo_diff = qo_diff\n",
-        "        best_qo_id = i\n",
-        "\n",
-        "    best_qo = sorted([(int(a), int(b)) for a, b in qos[best_qo_id].get_edge_list()])\n",
-        "    if (correct_qo is None):\n",
-        "      correct_count += 1\n",
-        "      correct_qo = best_qo\n",
-        "    elif (best_qo != correct_qo):\n",
-        "      correct = False\n",
-        "    else:\n",
-        "      correct_count += 1\n",
-        "\n",
-        "      while (True):\n",
-        "        a = randint(0, test_dataset.items - 1)\n",
-        "        b = randint(0, test_dataset.subjects - 1)\n",
-        "        if (not np.isnan(data[a][b])):\n",
-        "          break;\n",
-        "      data.loc[b, a] = np.nan\n",
-        "\n",
-        "  return correct_count"
-      ],
-      "metadata": {
-        "id": "ok9yLOnsTOU7"
-      },
-      "id": "ok9yLOnsTOU7",
-      "execution_count": 21,
-      "outputs": []
-    },
-    {
-      "cell_type": "code",
-      "source": [
-        "res = test(iita_fm.orig_iita_fit)"
-      ],
-      "metadata": {
-        "id": "giLvbXdtX4uc"
-      },
-      "id": "giLvbXdtX4uc",
-      "execution_count": null,
-      "outputs": []
-    },
-    {
-      "cell_type": "code",
-      "source": [
-        "res"
-      ],
-      "metadata": {
-        "id": "N2K347pebF9u",
-        "outputId": "b603f637-7b16-4161-eb18-4cf5ea12d989",
-        "colab": {
-          "base_uri": "https://localhost:8080/"
-        }
-      },
-      "id": "N2K347pebF9u",
-      "execution_count": 23,
-      "outputs": [
-        {
-          "output_type": "execute_result",
-          "data": {
-            "text/plain": [
-              "525"
-            ]
-          },
-          "metadata": {},
-          "execution_count": 23
-        }
-      ]
-    }
-  ],
-  "metadata": {
-    "kernelspec": {
-      "display_name": "iita",
-      "language": "python",
-      "name": "python3"
-    },
-    "language_info": {
-      "name": "python",
-      "version": "3.12.11"
-    },
-    "colab": {
-      "provenance": []
-    }
-  },
-  "nbformat": 4,
-  "nbformat_minor": 5
-}