gr-libs 0.1.8__py3-none-any.whl → 0.2.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (68)
  1. gr_libs/__init__.py +3 -1
  2. gr_libs/_evaluation/__init__.py +1 -0
  3. evaluation/analyze_results_cross_alg_cross_domain.py → gr_libs/_evaluation/_analyze_results_cross_alg_cross_domain.py +81 -88
  4. evaluation/generate_experiments_results.py → gr_libs/_evaluation/_generate_experiments_results.py +6 -6
  5. evaluation/generate_task_specific_statistics_plots.py → gr_libs/_evaluation/_generate_task_specific_statistics_plots.py +11 -14
  6. evaluation/get_plans_images.py → gr_libs/_evaluation/_get_plans_images.py +3 -4
  7. evaluation/increasing_and_decreasing_.py → gr_libs/_evaluation/_increasing_and_decreasing_.py +3 -1
  8. gr_libs/_version.py +2 -2
  9. gr_libs/all_experiments.py +294 -0
  10. gr_libs/environment/__init__.py +14 -1
  11. gr_libs/environment/{utils → _utils}/utils.py +1 -1
  12. gr_libs/environment/environment.py +257 -22
  13. gr_libs/metrics/__init__.py +2 -0
  14. gr_libs/metrics/metrics.py +166 -31
  15. gr_libs/ml/__init__.py +1 -6
  16. gr_libs/ml/base/__init__.py +3 -1
  17. gr_libs/ml/base/rl_agent.py +68 -3
  18. gr_libs/ml/neural/__init__.py +1 -3
  19. gr_libs/ml/neural/deep_rl_learner.py +227 -67
  20. gr_libs/ml/neural/utils/__init__.py +1 -2
  21. gr_libs/ml/planner/mcts/{utils → _utils}/tree.py +1 -1
  22. gr_libs/ml/planner/mcts/mcts_model.py +71 -34
  23. gr_libs/ml/sequential/__init__.py +0 -1
  24. gr_libs/ml/sequential/{lstm_model.py → _lstm_model.py} +11 -14
  25. gr_libs/ml/tabular/__init__.py +1 -3
  26. gr_libs/ml/tabular/tabular_q_learner.py +27 -9
  27. gr_libs/ml/tabular/tabular_rl_agent.py +22 -9
  28. gr_libs/ml/utils/__init__.py +2 -9
  29. gr_libs/ml/utils/format.py +13 -90
  30. gr_libs/ml/utils/math.py +3 -2
  31. gr_libs/ml/utils/other.py +2 -2
  32. gr_libs/ml/utils/storage.py +41 -94
  33. gr_libs/odgr_executor.py +268 -0
  34. gr_libs/problems/consts.py +2 -2
  35. gr_libs/recognizer/_utils/__init__.py +0 -0
  36. gr_libs/recognizer/{utils → _utils}/format.py +2 -2
  37. gr_libs/recognizer/gr_as_rl/gr_as_rl_recognizer.py +116 -36
  38. gr_libs/recognizer/graml/{gr_dataset.py → _gr_dataset.py} +11 -11
  39. gr_libs/recognizer/graml/graml_recognizer.py +172 -29
  40. gr_libs/recognizer/recognizer.py +59 -10
  41. gr_libs/tutorials/draco_panda_tutorial.py +58 -0
  42. gr_libs/tutorials/draco_parking_tutorial.py +56 -0
  43. {tutorials → gr_libs/tutorials}/gcdraco_panda_tutorial.py +5 -9
  44. {tutorials → gr_libs/tutorials}/gcdraco_parking_tutorial.py +3 -7
  45. {tutorials → gr_libs/tutorials}/graml_minigrid_tutorial.py +2 -2
  46. {tutorials → gr_libs/tutorials}/graml_panda_tutorial.py +5 -10
  47. {tutorials → gr_libs/tutorials}/graml_parking_tutorial.py +5 -9
  48. {tutorials → gr_libs/tutorials}/graml_point_maze_tutorial.py +2 -1
  49. {tutorials → gr_libs/tutorials}/graql_minigrid_tutorial.py +2 -2
  50. {gr_libs-0.1.8.dist-info → gr_libs-0.2.2.dist-info}/METADATA +84 -29
  51. gr_libs-0.2.2.dist-info/RECORD +71 -0
  52. {gr_libs-0.1.8.dist-info → gr_libs-0.2.2.dist-info}/WHEEL +1 -1
  53. gr_libs-0.2.2.dist-info/top_level.txt +2 -0
  54. tests/test_draco.py +14 -0
  55. tests/test_gcdraco.py +2 -2
  56. tests/test_graml.py +4 -4
  57. tests/test_graql.py +1 -1
  58. evaluation/create_minigrid_map_image.py +0 -38
  59. evaluation/file_system.py +0 -53
  60. evaluation/generate_experiments_results_new_ver1.py +0 -238
  61. evaluation/generate_experiments_results_new_ver2.py +0 -331
  62. gr_libs/ml/neural/utils/penv.py +0 -60
  63. gr_libs/recognizer/utils/__init__.py +0 -1
  64. gr_libs-0.1.8.dist-info/RECORD +0 -70
  65. gr_libs-0.1.8.dist-info/top_level.txt +0 -4
  66. /gr_libs/environment/{utils → _utils}/__init__.py +0 -0
  67. /gr_libs/ml/planner/mcts/{utils → _utils}/__init__.py +0 -0
  68. /gr_libs/ml/planner/mcts/{utils → _utils}/node.py +0 -0
@@ -0,0 +1,294 @@
1
+ """ executes odgr_executor parallely on a set of problems defined in consts.py """
2
+
3
+ import concurrent.futures
4
+ import os
5
+ import subprocess
6
+ import sys
7
+ import threading
8
+
9
+ import dill
10
+ import numpy as np
11
+
12
+ from gr_libs.ml.utils.storage import get_experiment_results_path
13
+
14
+ # Define the lists
15
+ # domains = ['minigrid', 'point_maze', 'parking', 'panda']
16
+ # envs = {
17
+ # 'minigrid': ['obstacles', 'lava_crossing'],
18
+ # 'point_maze': ['four_rooms', 'lava_crossing'],
19
+ # 'parking': ['gc_agent', 'gd_agent'],
20
+ # 'panda': ['gc_agent', 'gd_agent']
21
+ # }
22
+ # tasks = {
23
+ # 'minigrid': ['L111', 'L222', 'L333', 'L444', 'L555'],
24
+ # 'point_maze': ['L111', 'L222', 'L333', 'L444', 'L555'],
25
+ # 'parking': ['L111', 'L222', 'L333', 'L444', 'L555'],
26
+ # 'panda': ['L111', 'L222', 'L333', 'L444', 'L555']
27
+ # }
28
+ configs = {
29
+ "minigrid": {
30
+ "MiniGrid-SimpleCrossingS13N4": ["L1", "L2", "L3", "L4", "L5"],
31
+ "MiniGrid-LavaCrossingS9N2": ["L1", "L2", "L3", "L4", "L5"],
32
+ }
33
+ # 'point_maze': {
34
+ # 'PointMaze-FourRoomsEnvDense-11x11': ['L1', 'L2', 'L3', 'L4', 'L5'],
35
+ # 'PointMaze-ObstaclesEnvDense-11x11': ['L1', 'L2', 'L3', 'L4', 'L5']
36
+ # }
37
+ # 'parking': {
38
+ # 'Parking-S-14-PC-': ['L1', 'L2', 'L3', 'L4', 'L5'],
39
+ # 'Parking-S-14-PC-': ['L1', 'L2', 'L3', 'L4', 'L5']
40
+ # }
41
+ # 'panda': {
42
+ # 'PandaMyReachDense': ['L1', 'L2', 'L3', 'L4', 'L5'],
43
+ # 'PandaMyReachDense': ['L1', 'L2', 'L3', 'L4', 'L5']
44
+ # }
45
+ }
46
+ # for minigrid:
47
+ # TODO assert these instead i the beggingning of the code before beginning
48
+ # with the actual threading
49
+ recognizers = ["ExpertBasedGraml", "Graql"]
50
+ # recognizers = ['Graql']
51
+
52
+ # for point_maze:
53
+ # recognizers = ['ExpertBasedGraml']
54
+ # recognizers = ['Draco']
55
+
56
+ # for parking:
57
+ # recognizers = ['GCGraml']
58
+ # recognizers = ['GCDraco']
59
+
60
+ # for panda:
61
+ # recognizers = ['GCGraml']
62
+ # recognizers = ['GCDraco']
63
+
64
+ n = 5 # Number of times to execute each task
65
+
66
+
67
# Helper used by the worker threads to load a finished run's pickled results.
def read_results(res_file_path):
    """
    Deserialize and return the results stored in a result file.

    Args:
        res_file_path (str): The path to the result file.

    Returns:
        The results read from the file.
    """
    with open(res_file_path, "rb") as result_file:
        return dill.load(result_file)
81
+
82
+
83
# Every thread worker executes this function.
def run_experiment(domain, env, task, recognizer, i, generate_new=False):
    """
    Run a single odgr_executor experiment in a subprocess and collect its results.

    Args:
        domain (str): The domain of the experiment.
        env (str): The environment of the experiment.
        task (str): The task of the experiment.
        recognizer (str): The recognizer used in the experiment.
        i (int): The index (repetition number) of the experiment.
        generate_new (bool, optional): Whether to re-run even when result
            files for repetition ``i`` already exist. Defaults to False.

    Returns:
        tuple | None: ``((domain, env, task, recognizer), results)`` on
        success, or ``None`` when the subprocess failed or an exception
        occurred (the caller skips ``None`` results).
    """
    # Build the command as an argument list (shell=False): safer than a shell
    # string and avoids the stray whitespace the old line-continuation
    # f-string embedded into the command.
    cmd = [
        sys.executable,
        "gr_libs/odgr_executor.py",
        "--domain", domain,
        "--recognizer", recognizer,
        "--env_name", env,
        "--task", task,
        "--collect_stats",
    ]
    cmd_str = " ".join(cmd)
    print(f"Starting execution: {cmd_str}")
    try:
        res_file_path = get_experiment_results_path(domain, env, task, recognizer)
        res_file_path_txt = os.path.join(res_file_path, "res.txt")
        i_res_file_path_txt = os.path.join(res_file_path, f"res_{i}.txt")
        res_file_path_pkl = os.path.join(res_file_path, "res.pkl")
        i_res_file_path_pkl = os.path.join(res_file_path, f"res_{i}.pkl")
        if generate_new or (
            not os.path.exists(i_res_file_path_txt)
            or not os.path.exists(i_res_file_path_pkl)
        ):
            # Don't clobber results left over from a previous run of this
            # repetition: divert the new files to a "_new" suffix instead.
            if os.path.exists(i_res_file_path_txt) or os.path.exists(
                i_res_file_path_pkl
            ):
                i_res_file_path_txt = i_res_file_path_txt.replace(f"_{i}", f"_{i}_new")
                i_res_file_path_pkl = i_res_file_path_pkl.replace(f"_{i}", f"_{i}_new")
            process = subprocess.run(cmd)
            if process.returncode != 0:
                # BUGFIX: the original printed `result.stderr` where `result`
                # was never defined, raising NameError on every failed run;
                # report the exit code instead.
                print(f"Execution failed: {cmd_str}")
                print(f"Error: subprocess exited with code {process.returncode}")
                return None
            print(f"Finished execution successfully: {cmd_str}")
            # NOTE(review): the original created a fresh threading.Lock() per
            # call, which cannot synchronize anything across threads, so it was
            # dropped. The renames below are still racy when several
            # repetitions of the *same* (domain, env, task, recognizer) run
            # concurrently, because they all share res.txt/res.pkl — confirm
            # the pool never overlaps such repetitions, or serialize them.
            os.rename(res_file_path_pkl, i_res_file_path_pkl)
            os.rename(res_file_path_txt, i_res_file_path_txt)
        else:
            print(
                f"File {i_res_file_path_txt} already exists. Skipping execution \
                    of {cmd_str}"
            )
        return ((domain, env, task, recognizer), read_results(i_res_file_path_pkl))
    except Exception as e:
        # Best-effort: one failed experiment must not kill the worker pool.
        print(f"Exception occurred while running experiment: {e}")
        return None
139
+
140
+
141
# Collect results: maps (domain, env, task, recognizer) -> list of per-run
# result dicts, one entry per completed repetition.
results = {}

# create an executor that manages a pool of threads.
# Note that any failure in the threads will not stop the main thread
# from continuing and vice versa, nor will the debugger view the
# failure if in debug mode.
# Use prints and if any thread's printing stops suspect failure.
# If failure happened, use breakpoints before failure and use the
# watch to see the failure by pasting the problematic piece of code.
with concurrent.futures.ThreadPoolExecutor() as executor:
    futures = []
    # Fan out: one future per (domain, env, task, recognizer, repetition).
    for domain, envs in configs.items():
        for env, tasks in envs.items():
            for task in tasks:
                for recognizer in recognizers:
                    for i in range(n):
                        futures.append(
                            executor.submit(
                                run_experiment,
                                domain,
                                env,
                                task,
                                recognizer,
                                i,
                                # Re-run everything when '--generate_new' is
                                # passed as the first CLI argument.
                                generate_new=(
                                    True
                                    if len(sys.argv) > 1
                                    and sys.argv[1] == "--generate_new"
                                    else False
                                ),
                            )
                        )

    # Gather as workers finish; failed runs return None and are skipped.
    for future in concurrent.futures.as_completed(futures):
        if future.result() is None:
            print(
                f"for future {future}, future.result() is None. \
                    Continuing to next future."
            )
            continue
        key, result = future.result()
        print(f"main thread reading results from future {key}")
        if key not in results:
            results[key] = []
        results[key].append(result)
187
+
188
# Calculate average accuracy and standard deviation for each percentage.
# detailed_summary: (domain, env, task, recognizer) -> percentage ->
#     {"consecutive"/"non_consecutive": (mean, std)} over this task's runs.
# compiled_accuracies: (domain, recognizer) -> percentage ->
#     {"consecutive"/"non_consecutive": raw accuracy list pooled across
#     all envs/tasks of that domain+recognizer}.
detailed_summary = {}
compiled_accuracies = {}
for key, result_list in results.items():
    domain, env, task, recognizer = key
    # All runs of a task share the same percentage keys; use the first run's.
    percentages = result_list[0].keys()
    detailed_summary[key] = {}
    if (domain, recognizer) not in compiled_accuracies:
        compiled_accuracies[(domain, recognizer)] = {}
    for percentage in percentages:
        # "total" is an aggregate entry in the result dict, not a percentage.
        if percentage == "total":
            continue
        if percentage not in compiled_accuracies[(domain, recognizer)].keys():
            compiled_accuracies[(domain, recognizer)][percentage] = {}
        if percentage not in detailed_summary[key].keys():
            detailed_summary[key][percentage] = {}
        # One accuracy value per repetition of this task.
        consecutive_accuracies = [
            result[percentage]["consecutive"]["accuracy"] for result in result_list
        ]
        non_consecutive_accuracies = [
            result[percentage]["non_consecutive"]["accuracy"] for result in result_list
        ]
        # Pool the raw accuracies into the per-(domain, recognizer) bucket,
        # extending if a previous task already contributed values.
        if (
            "consecutive"
            in compiled_accuracies[(domain, recognizer)][percentage].keys()
        ):
            compiled_accuracies[(domain, recognizer)][percentage]["consecutive"].extend(
                consecutive_accuracies
            )
        else:
            compiled_accuracies[(domain, recognizer)][percentage][
                "consecutive"
            ] = consecutive_accuracies
        if (
            "non_consecutive"
            in compiled_accuracies[(domain, recognizer)][percentage].keys()
        ):
            compiled_accuracies[(domain, recognizer)][percentage][
                "non_consecutive"
            ].extend(non_consecutive_accuracies)
        else:
            compiled_accuracies[(domain, recognizer)][percentage][
                "non_consecutive"
            ] = non_consecutive_accuracies
        # Per-task statistics over the n repetitions.
        avg_consecutive_accuracy = np.mean(consecutive_accuracies)
        consecutive_std_dev = np.std(consecutive_accuracies)
        detailed_summary[key][percentage]["consecutive"] = (
            avg_consecutive_accuracy,
            consecutive_std_dev,
        )
        avg_non_consecutive_accuracy = np.mean(non_consecutive_accuracies)
        non_consecutive_std_dev = np.std(non_consecutive_accuracies)
        detailed_summary[key][percentage]["non_consecutive"] = (
            avg_non_consecutive_accuracy,
            non_consecutive_std_dev,
        )

# compiled_summary: (domain, recognizer) -> percentage ->
#     {"consecutive"/"non_consecutive": (mean, std)} over the pooled lists.
compiled_summary = {}
for key, percentage_dict in compiled_accuracies.items():
    compiled_summary[key] = {}
    for percentage, cons_accuracies in percentage_dict.items():
        compiled_summary[key][percentage] = {}
        for is_cons, accuracies in cons_accuracies.items():
            avg_accuracy = np.mean(accuracies)
            std_dev = np.std(accuracies)
            compiled_summary[key][percentage][is_cons] = (avg_accuracy, std_dev)
254
+
255
# Write different summary results to different files.
if not os.path.exists(os.path.join("outputs", "summaries")):
    os.makedirs(os.path.join("outputs", "summaries"))
# NOTE(review): the file names embed only recognizers[0]; when several
# recognizers ran, the other recognizers' results are still written into
# this same file — confirm that is intended.
detailed_summary_file_path = os.path.join(
    "outputs",
    "summaries",
    f"detailed_summary_{''.join(configs.keys())}_{recognizers[0]}.txt",
)
compiled_summary_file_path = os.path.join(
    "outputs",
    "summaries",
    f"compiled_summary_{''.join(configs.keys())}_{recognizers[0]}.txt",
)
# Detailed summary: one header line per (domain, env, task, recognizer),
# then tab-indented (percentage, variant, mean, std) rows.
with open(detailed_summary_file_path, "w") as f:
    for key, percentage_dict in detailed_summary.items():
        domain, env, task, recognizer = key
        f.write(f"{domain}\t{env}\t{task}\t{recognizer}\n")
        for percentage, cons_info in percentage_dict.items():
            for is_cons, (avg_accuracy, std_dev) in cons_info.items():
                f.write(
                    f"\t\t{percentage}\t{is_cons}\t{avg_accuracy:.4f}\t{std_dev:.4f}\n"
                )

# NOTE(review): each compiled entry is written twice — first as flat
# tab-separated rows, then again under a (domain, recognizer) header.
# This looks like a leftover from merging two output formats; confirm
# whether both renderings are actually consumed downstream.
with open(compiled_summary_file_path, "w") as f:
    for key, percentage_dict in compiled_summary.items():
        for percentage, cons_info in percentage_dict.items():
            for is_cons, (avg_accuracy, std_dev) in cons_info.items():
                f.write(
                    f"{key[0]}\t{key[1]}\t{percentage}\t{is_cons}\t{avg_accuracy:.4f}\t{std_dev:.4f}\n"
                )
        domain, recognizer = key
        f.write(f"{domain}\t{recognizer}\n")
        for percentage, cons_info in percentage_dict.items():
            for is_cons, (avg_accuracy, std_dev) in cons_info.items():
                f.write(
                    f"\t\t{percentage}\t{is_cons}\t{avg_accuracy:.4f}\t{std_dev:.4f}\n"
                )

print(f"Detailed summary results written to {detailed_summary_file_path}")
print(f"Compiled summary results written to {compiled_summary_file_path}")
@@ -1,9 +1,22 @@
1
+ """
2
+ A module GR algorithms can store hard-coded parameters anf functionalities
3
+ that are environment-related.
4
+ """
5
+
1
6
  import importlib.metadata
2
7
  import warnings
3
8
 
4
9
 
5
10
  def is_extra_installed(package: str, extra: str) -> bool:
6
- """Check if an extra was installed for a given package."""
11
+ """Check if an extra was installed for a given package.
12
+
13
+ Args:
14
+ package (str): The name of the package.
15
+ extra (str): The name of the extra to check.
16
+
17
+ Returns:
18
+ bool: True if the extra is installed, False otherwise.
19
+ """
7
20
  try:
8
21
  # Get metadata for the installed package
9
22
  dist = importlib.metadata.metadata(package)
@@ -1,11 +1,11 @@
1
1
  import logging
2
2
  import sys
3
+
3
4
  from gr_libs.environment.environment import (
4
5
  MINIGRID,
5
6
  PANDA,
6
7
  PARKING,
7
8
  POINT_MAZE,
8
- EnvProperty,
9
9
  MinigridProperty,
10
10
  PandaProperty,
11
11
  ParkingProperty,