PyPI - sierra-research - Versions diffs - 1.3.11__py3-none-any.whl → 1.5.0__py3-none-any.whl - Mend

sierra-research 1.3.11__py3-none-any.whl → 1.5.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (254) hide show

sierra/__init__.py +3 -3
sierra/core/__init__.py +3 -3
sierra/core/batchroot.py +223 -0
sierra/core/cmdline.py +681 -1057
sierra/core/compare.py +11 -0
sierra/core/config.py +96 -88
sierra/core/engine.py +306 -0
sierra/core/execenv.py +380 -0
sierra/core/expdef.py +11 -0
sierra/core/experiment/__init__.py +1 -0
sierra/core/experiment/bindings.py +150 -101
sierra/core/experiment/definition.py +414 -245
sierra/core/experiment/spec.py +83 -85
sierra/core/exproot.py +44 -0
sierra/core/generators/__init__.py +10 -0
sierra/core/generators/experiment.py +528 -0
sierra/core/generators/generator_factory.py +138 -137
sierra/core/graphs/__init__.py +23 -0
sierra/core/graphs/bcbridge.py +94 -0
sierra/core/graphs/heatmap.py +245 -324
sierra/core/graphs/pathset.py +27 -0
sierra/core/graphs/schema.py +77 -0
sierra/core/graphs/stacked_line.py +341 -0
sierra/core/graphs/summary_line.py +506 -0
sierra/core/logging.py +3 -2
sierra/core/models/__init__.py +3 -1
sierra/core/models/info.py +19 -0
sierra/core/models/interface.py +52 -122
sierra/core/pipeline/__init__.py +2 -5
sierra/core/pipeline/pipeline.py +228 -126
sierra/core/pipeline/stage1/__init__.py +10 -0
sierra/core/pipeline/stage1/pipeline_stage1.py +45 -31
sierra/core/pipeline/stage2/__init__.py +10 -0
sierra/core/pipeline/stage2/pipeline_stage2.py +8 -11
sierra/core/pipeline/stage2/runner.py +401 -0
sierra/core/pipeline/stage3/__init__.py +12 -0
sierra/core/pipeline/stage3/gather.py +321 -0
sierra/core/pipeline/stage3/pipeline_stage3.py +37 -84
sierra/core/pipeline/stage4/__init__.py +12 -2
sierra/core/pipeline/stage4/pipeline_stage4.py +36 -354
sierra/core/pipeline/stage5/__init__.py +12 -0
sierra/core/pipeline/stage5/pipeline_stage5.py +33 -208
sierra/core/pipeline/yaml.py +48 -0
sierra/core/plugin.py +529 -62
sierra/core/proc.py +11 -0
sierra/core/prod.py +11 -0
sierra/core/ros1/__init__.py +5 -1
sierra/core/ros1/callbacks.py +22 -21
sierra/core/ros1/cmdline.py +59 -88
sierra/core/ros1/generators.py +159 -175
sierra/core/ros1/variables/__init__.py +3 -0
sierra/core/ros1/variables/exp_setup.py +122 -116
sierra/core/startup.py +106 -76
sierra/core/stat_kernels.py +4 -5
sierra/core/storage.py +13 -32
sierra/core/trampoline.py +30 -0
sierra/core/types.py +116 -71
sierra/core/utils.py +103 -106
sierra/core/variables/__init__.py +1 -1
sierra/core/variables/base_variable.py +12 -17
sierra/core/variables/batch_criteria.py +387 -481
sierra/core/variables/builtin.py +135 -0
sierra/core/variables/exp_setup.py +19 -39
sierra/core/variables/population_size.py +72 -76
sierra/core/variables/variable_density.py +44 -68
sierra/core/vector.py +1 -1
sierra/main.py +256 -88
sierra/plugins/__init__.py +119 -0
sierra/plugins/compare/__init__.py +14 -0
sierra/plugins/compare/graphs/__init__.py +19 -0
sierra/plugins/compare/graphs/cmdline.py +120 -0
sierra/plugins/compare/graphs/comparator.py +291 -0
sierra/plugins/compare/graphs/inter_controller.py +531 -0
sierra/plugins/compare/graphs/inter_scenario.py +297 -0
sierra/plugins/compare/graphs/namecalc.py +53 -0
sierra/plugins/compare/graphs/outputroot.py +73 -0
sierra/plugins/compare/graphs/plugin.py +147 -0
sierra/plugins/compare/graphs/preprocess.py +172 -0
sierra/plugins/compare/graphs/schema.py +37 -0
sierra/plugins/engine/__init__.py +14 -0
sierra/plugins/engine/argos/__init__.py +18 -0
sierra/plugins/{platform → engine}/argos/cmdline.py +144 -151
sierra/plugins/{platform/argos/variables → engine/argos/generators}/__init__.py +5 -0
sierra/plugins/engine/argos/generators/engine.py +394 -0
sierra/plugins/engine/argos/plugin.py +393 -0
sierra/plugins/{platform/argos/generators → engine/argos/variables}/__init__.py +5 -0
sierra/plugins/engine/argos/variables/arena_shape.py +183 -0
sierra/plugins/engine/argos/variables/cameras.py +240 -0
sierra/plugins/engine/argos/variables/constant_density.py +112 -0
sierra/plugins/engine/argos/variables/exp_setup.py +82 -0
sierra/plugins/{platform → engine}/argos/variables/physics_engines.py +83 -87
sierra/plugins/engine/argos/variables/population_constant_density.py +178 -0
sierra/plugins/engine/argos/variables/population_size.py +115 -0
sierra/plugins/engine/argos/variables/population_variable_density.py +123 -0
sierra/plugins/engine/argos/variables/rendering.py +108 -0
sierra/plugins/engine/ros1gazebo/__init__.py +18 -0
sierra/plugins/engine/ros1gazebo/cmdline.py +175 -0
sierra/plugins/{platform/ros1robot → engine/ros1gazebo}/generators/__init__.py +5 -0
sierra/plugins/engine/ros1gazebo/generators/engine.py +125 -0
sierra/plugins/engine/ros1gazebo/plugin.py +404 -0
sierra/plugins/engine/ros1gazebo/variables/__init__.py +15 -0
sierra/plugins/engine/ros1gazebo/variables/population_size.py +214 -0
sierra/plugins/engine/ros1robot/__init__.py +18 -0
sierra/plugins/engine/ros1robot/cmdline.py +159 -0
sierra/plugins/{platform/ros1gazebo → engine/ros1robot}/generators/__init__.py +4 -0
sierra/plugins/engine/ros1robot/generators/engine.py +95 -0
sierra/plugins/engine/ros1robot/plugin.py +410 -0
sierra/plugins/{hpc/local → engine/ros1robot/variables}/__init__.py +5 -0
sierra/plugins/engine/ros1robot/variables/population_size.py +146 -0
sierra/plugins/execenv/__init__.py +11 -0
sierra/plugins/execenv/hpc/__init__.py +18 -0
sierra/plugins/execenv/hpc/adhoc/__init__.py +18 -0
sierra/plugins/execenv/hpc/adhoc/cmdline.py +30 -0
sierra/plugins/execenv/hpc/adhoc/plugin.py +131 -0
sierra/plugins/execenv/hpc/cmdline.py +137 -0
sierra/plugins/execenv/hpc/local/__init__.py +18 -0
sierra/plugins/execenv/hpc/local/cmdline.py +31 -0
sierra/plugins/execenv/hpc/local/plugin.py +145 -0
sierra/plugins/execenv/hpc/pbs/__init__.py +18 -0
sierra/plugins/execenv/hpc/pbs/cmdline.py +30 -0
sierra/plugins/execenv/hpc/pbs/plugin.py +121 -0
sierra/plugins/execenv/hpc/slurm/__init__.py +18 -0
sierra/plugins/execenv/hpc/slurm/cmdline.py +30 -0
sierra/plugins/execenv/hpc/slurm/plugin.py +133 -0
sierra/plugins/execenv/prefectserver/__init__.py +18 -0
sierra/plugins/execenv/prefectserver/cmdline.py +66 -0
sierra/plugins/execenv/prefectserver/dockerremote/__init__.py +18 -0
sierra/plugins/execenv/prefectserver/dockerremote/cmdline.py +66 -0
sierra/plugins/execenv/prefectserver/dockerremote/plugin.py +132 -0
sierra/plugins/execenv/prefectserver/flow.py +66 -0
sierra/plugins/execenv/prefectserver/local/__init__.py +18 -0
sierra/plugins/execenv/prefectserver/local/cmdline.py +29 -0
sierra/plugins/execenv/prefectserver/local/plugin.py +133 -0
sierra/plugins/{hpc/adhoc → execenv/robot}/__init__.py +1 -0
sierra/plugins/execenv/robot/turtlebot3/__init__.py +18 -0
sierra/plugins/execenv/robot/turtlebot3/plugin.py +204 -0
sierra/plugins/expdef/__init__.py +14 -0
sierra/plugins/expdef/json/__init__.py +14 -0
sierra/plugins/expdef/json/plugin.py +504 -0
sierra/plugins/expdef/xml/__init__.py +14 -0
sierra/plugins/expdef/xml/plugin.py +386 -0
sierra/{core/hpc → plugins/proc}/__init__.py +1 -1
sierra/plugins/proc/collate/__init__.py +15 -0
sierra/plugins/proc/collate/cmdline.py +47 -0
sierra/plugins/proc/collate/plugin.py +271 -0
sierra/plugins/proc/compress/__init__.py +18 -0
sierra/plugins/proc/compress/cmdline.py +47 -0
sierra/plugins/proc/compress/plugin.py +123 -0
sierra/plugins/proc/decompress/__init__.py +18 -0
sierra/plugins/proc/decompress/plugin.py +96 -0
sierra/plugins/proc/imagize/__init__.py +15 -0
sierra/plugins/proc/imagize/cmdline.py +49 -0
sierra/plugins/proc/imagize/plugin.py +270 -0
sierra/plugins/proc/modelrunner/__init__.py +16 -0
sierra/plugins/proc/modelrunner/plugin.py +250 -0
sierra/plugins/proc/statistics/__init__.py +15 -0
sierra/plugins/proc/statistics/cmdline.py +64 -0
sierra/plugins/proc/statistics/plugin.py +390 -0
sierra/plugins/{hpc → prod}/__init__.py +1 -0
sierra/plugins/prod/graphs/__init__.py +18 -0
sierra/plugins/prod/graphs/cmdline.py +269 -0
sierra/plugins/prod/graphs/collate.py +279 -0
sierra/plugins/prod/graphs/inter/__init__.py +13 -0
sierra/plugins/prod/graphs/inter/generate.py +83 -0
sierra/plugins/prod/graphs/inter/heatmap.py +86 -0
sierra/plugins/prod/graphs/inter/line.py +134 -0
sierra/plugins/prod/graphs/intra/__init__.py +15 -0
sierra/plugins/prod/graphs/intra/generate.py +202 -0
sierra/plugins/prod/graphs/intra/heatmap.py +74 -0
sierra/plugins/prod/graphs/intra/line.py +114 -0
sierra/plugins/prod/graphs/plugin.py +103 -0
sierra/plugins/prod/graphs/targets.py +63 -0
sierra/plugins/prod/render/__init__.py +18 -0
sierra/plugins/prod/render/cmdline.py +72 -0
sierra/plugins/prod/render/plugin.py +282 -0
sierra/plugins/storage/__init__.py +5 -0
sierra/plugins/storage/arrow/__init__.py +18 -0
sierra/plugins/storage/arrow/plugin.py +38 -0
sierra/plugins/storage/csv/__init__.py +9 -0
sierra/plugins/storage/csv/plugin.py +12 -5
sierra/version.py +3 -2
sierra_research-1.5.0.dist-info/METADATA +238 -0
sierra_research-1.5.0.dist-info/RECORD +186 -0
{sierra_research-1.3.11.dist-info → sierra_research-1.5.0.dist-info}/WHEEL +1 -2
sierra/core/experiment/xml.py +0 -454
sierra/core/generators/controller_generator_parser.py +0 -34
sierra/core/generators/exp_creator.py +0 -351
sierra/core/generators/exp_generators.py +0 -142
sierra/core/graphs/scatterplot2D.py +0 -109
sierra/core/graphs/stacked_line_graph.py +0 -251
sierra/core/graphs/stacked_surface_graph.py +0 -220
sierra/core/graphs/summary_line_graph.py +0 -371
sierra/core/hpc/cmdline.py +0 -142
sierra/core/models/graphs.py +0 -87
sierra/core/pipeline/stage2/exp_runner.py +0 -286
sierra/core/pipeline/stage3/imagizer.py +0 -149
sierra/core/pipeline/stage3/run_collator.py +0 -317
sierra/core/pipeline/stage3/statistics_calculator.py +0 -478
sierra/core/pipeline/stage4/graph_collator.py +0 -320
sierra/core/pipeline/stage4/inter_exp_graph_generator.py +0 -240
sierra/core/pipeline/stage4/intra_exp_graph_generator.py +0 -317
sierra/core/pipeline/stage4/model_runner.py +0 -168
sierra/core/pipeline/stage4/rendering.py +0 -283
sierra/core/pipeline/stage4/yaml_config_loader.py +0 -103
sierra/core/pipeline/stage5/inter_scenario_comparator.py +0 -328
sierra/core/pipeline/stage5/intra_scenario_comparator.py +0 -989
sierra/core/platform.py +0 -493
sierra/core/plugin_manager.py +0 -369
sierra/core/root_dirpath_generator.py +0 -241
sierra/plugins/hpc/adhoc/plugin.py +0 -125
sierra/plugins/hpc/local/plugin.py +0 -81
sierra/plugins/hpc/pbs/__init__.py +0 -9
sierra/plugins/hpc/pbs/plugin.py +0 -126
sierra/plugins/hpc/slurm/__init__.py +0 -9
sierra/plugins/hpc/slurm/plugin.py +0 -130
sierra/plugins/platform/__init__.py +0 -9
sierra/plugins/platform/argos/__init__.py +0 -9
sierra/plugins/platform/argos/generators/platform_generators.py +0 -383
sierra/plugins/platform/argos/plugin.py +0 -337
sierra/plugins/platform/argos/variables/arena_shape.py +0 -145
sierra/plugins/platform/argos/variables/cameras.py +0 -243
sierra/plugins/platform/argos/variables/constant_density.py +0 -136
sierra/plugins/platform/argos/variables/exp_setup.py +0 -113
sierra/plugins/platform/argos/variables/population_constant_density.py +0 -175
sierra/plugins/platform/argos/variables/population_size.py +0 -102
sierra/plugins/platform/argos/variables/population_variable_density.py +0 -132
sierra/plugins/platform/argos/variables/rendering.py +0 -104
sierra/plugins/platform/ros1gazebo/__init__.py +0 -9
sierra/plugins/platform/ros1gazebo/cmdline.py +0 -213
sierra/plugins/platform/ros1gazebo/generators/platform_generators.py +0 -137
sierra/plugins/platform/ros1gazebo/plugin.py +0 -335
sierra/plugins/platform/ros1gazebo/variables/__init__.py +0 -10
sierra/plugins/platform/ros1gazebo/variables/population_size.py +0 -204
sierra/plugins/platform/ros1robot/__init__.py +0 -9
sierra/plugins/platform/ros1robot/cmdline.py +0 -175
sierra/plugins/platform/ros1robot/generators/platform_generators.py +0 -112
sierra/plugins/platform/ros1robot/plugin.py +0 -373
sierra/plugins/platform/ros1robot/variables/__init__.py +0 -10
sierra/plugins/platform/ros1robot/variables/population_size.py +0 -146
sierra/plugins/robot/__init__.py +0 -9
sierra/plugins/robot/turtlebot3/__init__.py +0 -9
sierra/plugins/robot/turtlebot3/plugin.py +0 -194
sierra_research-1.3.11.data/data/share/man/man1/sierra-cli.1 +0 -2349
sierra_research-1.3.11.data/data/share/man/man7/sierra-examples.7 +0 -508
sierra_research-1.3.11.data/data/share/man/man7/sierra-exec-envs.7 +0 -331
sierra_research-1.3.11.data/data/share/man/man7/sierra-glossary.7 +0 -285
sierra_research-1.3.11.data/data/share/man/man7/sierra-platforms.7 +0 -358
sierra_research-1.3.11.data/data/share/man/man7/sierra-usage.7 +0 -729
sierra_research-1.3.11.data/data/share/man/man7/sierra.7 +0 -78
sierra_research-1.3.11.dist-info/METADATA +0 -492
sierra_research-1.3.11.dist-info/RECORD +0 -133
sierra_research-1.3.11.dist-info/top_level.txt +0 -1
{sierra_research-1.3.11.dist-info → sierra_research-1.5.0.dist-info}/entry_points.txt +0 -0
{sierra_research-1.3.11.dist-info → sierra_research-1.5.0.dist-info/licenses}/LICENSE +0 -0

sierra/core/pipeline/stage3/statistics_calculator.py DELETED Viewed

@@ -1,478 +0,0 @@
-# Copyright 2019 John Harwell, All rights reserved.
-#
-#  SPDX-License-Identifier: MIT
-"""
-Classes for generating statistics within and across experiments in a batch.
-"""
-# Core packages
-import re
-import multiprocessing as mp
-import typing as tp
-import queue
-import time
-import datetime
-import logging
-import pathlib
-# 3rd party packages
-import pandas as pd
-import psutil
-# Project packages
-import sierra.core.variables.batch_criteria as bc
-from sierra.core import types, utils, stat_kernels, storage, config
-class GatherSpec:
-    """
-    Data class for specifying .csv files to gather from an :term:`Experiment`.
-    """
-    def __init__(self,
-                 exp_name: str,
-                 item_stem: str,
-                 imagize_csv_stem: tp.Optional[str]):
-        self.exp_name = exp_name
-        self.item_stem = item_stem
-        self.imagize_csv_stem = imagize_csv_stem
-    def for_imagizing(self):
-        return self.imagize_csv_stem is not None
-class BatchExpParallelCalculator:
-    """Process :term:`Output .csv` files for each experiment in the batch.
-    In parallel for speed.
-    """
-    def __init__(self, main_config: dict, cmdopts: types.Cmdopts):
-        self.main_config = main_config
-        self.cmdopts = cmdopts
-        self.logger = logging.getLogger(__name__)
-    def __call__(self, criteria: bc.IConcreteBatchCriteria) -> None:
-        exp_to_avg = utils.exp_range_calc(self.cmdopts,
-                                          self.cmdopts['batch_output_root'],
-                                          criteria)
-        template_input_leaf = pathlib.Path(self.cmdopts['template_input_file']).stem
-        avg_opts = {
-            'template_input_leaf': template_input_leaf,
-            'df_skip_verify': self.cmdopts['df_skip_verify'],
-            'dist_stats': self.cmdopts['dist_stats'],
-            'project_imagizing': self.cmdopts['project_imagizing'],
-            'processing_mem_limit': self.cmdopts['processing_mem_limit'],
-            'storage_medium': self.cmdopts['storage_medium'],
-            'df_homogenize': self.cmdopts['df_homogenize']
-        }
-        if self.cmdopts['processing_serial']:
-            n_gatherers = 1
-            n_processors = 1
-        else:
-            # Aways need to have at least one of each! If SIERRA is invoked on a
-            # machine with 2 or less logical cores, the calculation with
-            # psutil.cpu_count() will return 0 for # gatherers.
-            n_gatherers = max(1, int(psutil.cpu_count() * 0.25))
-            n_processors = max(1, int(psutil.cpu_count() * 0.75))
-        with mp.Pool(processes=n_gatherers + n_processors) as pool:
-            self._execute(exp_to_avg, avg_opts, n_gatherers, n_processors, pool)
-    def _execute(self,
-                 exp_to_avg: tp.List[pathlib.Path],
-                 avg_opts: types.SimpleDict,
-                 n_gatherers: int,
-                 n_processors: int,
-                 pool) -> None:
-        m = mp.Manager()
-        gatherq = m.Queue()
-        processq = m.Queue()
-        for exp in exp_to_avg:
-            gatherq.put(exp)
-        # Start some threads gathering .csvs first to get things rolling.
-        self.logger.debug("Starting %d gatherers, method=%s",
-                          n_gatherers,
-                          mp.get_start_method())
-        gathered = [pool.apply_async(BatchExpParallelCalculator._gather_worker,
-                                     (gatherq,
-                                      processq,
-                                      self.main_config,
-                                      avg_opts)) for i in range(0, n_gatherers)]
-        self.logger.debug("Starting %d processors, method=%s",
-                          n_processors,
-                          mp.get_start_method())
-        processed = [pool.apply_async(BatchExpParallelCalculator._process_worker,
-                                      (processq,
-                                       self.main_config,
-                                       self.cmdopts['batch_stat_root'],
-                                       avg_opts)) for i in range(0, n_processors)]
-        # To capture the otherwise silent crashes when something goes wrong in
-        # worker threads. Any assertions will show and any exceptions will be
-        # re-raised.
-        self.logger.debug("Waiting for workers to finish")
-        for g in gathered:
-            g.get()
-        for p in processed:
-            p.get()
-        pool.close()
-        pool.join()
-        self.logger.debug("All threads finished")
-    @staticmethod
-    def _gather_worker(gatherq: mp.Queue,
-                       processq: mp.Queue,
-                       main_config: types.YAMLDict,
-                       avg_opts: tp.Dict[str, str]) -> None:
-        gatherer = ExpCSVGatherer(main_config, avg_opts, processq)
-        # Wait for 3 seconds after the queue is empty before bailing, at the
-        # start. If that is not long enough then exponentially increase from
-        # there until you find how long it takes to get the first item in the
-        # queue, and use that as the appropriate timeout (plus a little
-        # margin).
-        timeout = 3
-        got_item = False
-        n_tries = 0
-        while n_tries < 2:
-            try:
-                exp_output_root = gatherq.get(True, timeout)
-                gatherer(exp_output_root)
-                gatherq.task_done()
-                got_item = True
-            except queue.Empty:
-                if got_item:
-                    break
-                timeout *= 2
-                n_tries += 1
-    @staticmethod
-    def _process_worker(processq: mp.Queue,
-                        main_config: types.YAMLDict,
-                        batch_stat_root: pathlib.Path,
-                        avg_opts: tp.Dict[str, str]) -> None:
-        calculator = ExpStatisticsCalculator(main_config,
-                                             avg_opts,
-                                             batch_stat_root)
-        # Wait for 3 seconds after the queue is empty before bailing, at the
-        # start. If that is not long enough then exponentially increase from
-        # there until you find how long it takes to get the first item in the
-        # queue, and use that as the appropriate timeout (plus a little
-        # margin).
-        timeout = 3
-        got_item = False
-        n_tries = 0
-        while n_tries < 2:
-            try:
-                item = processq.get(True, timeout)
-                key = list(item.keys())[0]
-                calculator(key, item[key])
-                processq.task_done()
-                got_item = True
-            except queue.Empty:
-                if got_item:
-                    break
-                timeout *= 2
-                n_tries += 1
-class ExpCSVGatherer:
-    """Gather all :term:`Output .csv` files from all runs within an experiment.
-    "Gathering" in this context means creating a dictionary mapping which .csv
-    came from where, so that statistics can be generated both across and with
-    experiments in the batch.
-    """
-    def __init__(self,
-                 main_config: types.YAMLDict,
-                 gather_opts: dict,
-                 processq: mp.Queue) -> None:
-        self.processq = processq
-        self.gather_opts = gather_opts
-        # Will get the main name and extension of the config file (without the
-        # full absolute path).
-        self.template_input_fname = self.gather_opts['template_input_leaf']
-        self.main_config = main_config
-        self.run_metrics_leaf = main_config['sierra']['run']['run_metrics_leaf']
-        self.videos_leaf = 'videos'
-        self.project_imagize = gather_opts['project_imagizing']
-        self.logger = logging.getLogger(__name__)
-    def __call__(self, exp_output_root: pathlib.Path) -> None:
-        """Process the CSV files found in the output save path."""
-        if not self.gather_opts['df_skip_verify']:
-            self._verify_exp_outputs(exp_output_root)
-        self.logger.info('Processing .csvs: %s...', exp_output_root.name)
-        pattern = "{}_run{}_output".format(re.escape(self.gather_opts['template_input_leaf']),
-                                           r'\d+')
-        runs = list(exp_output_root.iterdir())
-        assert (all(re.match(pattern, r.name) for r in runs)), \
-            f"Extra files/not all dirs in '{exp_output_root}' are exp runs"
-        # Maps (unique .csv stem, optional parent dir) to the averaged dataframe
-        to_gather = self._calc_gather_items(runs[0], exp_output_root.name)
-        for item in to_gather:
-            self._wait_for_memory()
-            gathered = self._gather_item_from_sims(exp_output_root, item, runs)
-            # Put gathered .csv list  in the process queue
-            self.processq.put(gathered)
-        self.logger.debug("Enqueued %s items from %s for processing",
-                          len(to_gather),
-                          exp_output_root.name)
-    def _calc_gather_items(self,
-                           run_output_root: pathlib.Path,
-                           exp_name: str) -> tp.List[GatherSpec]:
-        to_gather = []
-        sim_output_root = run_output_root / self.run_metrics_leaf
-        # The metrics folder should contain nothing but .csv files and
-        # directories. For all directories it contains, they each should contain
-        # nothing but .csv files (these are for video rendering later).
-        for item in sim_output_root.iterdir():
-            csv_stem = item.stem
-            if item.is_file():
-                to_gather.append(GatherSpec(exp_name=exp_name,
-                                            item_stem=csv_stem,
-                                            imagize_csv_stem=None))
-            else:
-                # This takes FOREVER, so only do it if we absolutely need to
-                if not self.project_imagize:
-                    continue
-                for csv_fname in item.iterdir():
-                    to_gather.append(GatherSpec(exp_name=exp_name,
-                                                item_stem=csv_stem,
-                                                imagize_csv_stem=csv_fname.stem))
-        return to_gather
-    def _gather_item_from_sims(self,
-                               exp_output_root: pathlib.Path,
-                               item: GatherSpec,
-                               runs: tp.List[pathlib.Path]) -> tp.Dict[GatherSpec,
-                                                                       tp.List[pd.DataFrame]]:
-        gathered = {}  # type: tp.Dict[GatherSpec, pd.DataFrame]
-        for run in runs:
-            sim_output_root = run / self.run_metrics_leaf
-            if item.for_imagizing():
-                item_path = sim_output_root / item.item_stem / \
-                    (item.imagize_csv_stem + config.kStorageExt['csv'])
-            else:
-                item_path = sim_output_root / \
-                    (item.item_stem + config.kStorageExt['csv'])
-            reader = storage.DataFrameReader(self.gather_opts['storage_medium'])
-            df = reader(item_path, index_col=False)
-            if df.dtypes.iloc[0] == 'object':
-                df[df.columns[0]] = df[df.columns[0]].apply(lambda x: float(x))
-            if item not in gathered:
-                gathered[item] = []
-            gathered[item].append(df)
-        return gathered
-    def _wait_for_memory(self) -> None:
-        while True:
-            mem = psutil.virtual_memory()
-            avail = mem.available / mem.total
-            free_percent = avail * 100
-            free_limit = 100 - self.gather_opts['processing_mem_limit']
-            if free_percent >= free_limit:
-                return
-            self.logger.info("Waiting for memory: avail=%s,min=%s",
-                             free_percent,
-                             free_limit)
-            time.sleep(1)
-    def _verify_exp_outputs(self, exp_output_root: pathlib.Path) -> None:
-        """
-        Verify the integrity of all runs in an experiment.
-        Specifically:
-        - All runs produced all CSV files.
-        - All runs CSV files with the same name have the same # rows and
-          columns.
-        - No CSV files contain NaNs.
-        """
-        experiments = exp_output_root.iterdir()
-        self.logger.info('Verifying results in %s...', str(exp_output_root))
-        start = time.time()
-        for exp1 in experiments:
-            csv_root1 = exp1 / self.run_metrics_leaf
-            for exp2 in experiments:
-                csv_root2 = exp2 / self.run_metrics_leaf
-                if not csv_root2.is_dir():
-                    continue
-                self._verify_exp_outputs_pairwise(csv_root1, csv_root2)
-        elapsed = int(time.time() - start)
-        sec = datetime.timedelta(seconds=elapsed)
-        self.logger.info("Done verifying results in %s: %s",
-                         exp_output_root,
-                         sec)
-    def _verify_exp_outputs_pairwise(self,
-                                     csv_root1: pathlib.Path,
-                                     csv_root2: pathlib.Path) -> None:
-        for csv in csv_root2.iterdir():
-            path1 = csv
-            path2 = csv_root2 / csv.name
-            # .csvs for rendering that we don't verify (for now...)
-            if path1.is_dir() or path2.is_dir():
-                self.logger.debug("Not verifying '%s': contains rendering data",
-                                  str(path1))
-                continue
-            assert (utils.path_exists(path1) and utils.path_exists(path2)), \
-                f"Either {path1} or {path2} does not exist"
-            # Verify both dataframes have same # columns, and that
-            # column sets are identical
-            reader = storage.DataFrameReader(self.gather_opts['storage_medium'])
-            df1 = reader(path1)
-            df2 = reader(path2)
-            assert (len(df1.columns) == len(df2.columns)), \
-                (f"Dataframes from {path1} and {path2} do not have "
-                 "the same # columns")
-            assert (sorted(df1.columns) == sorted(df2.columns)), \
-                f"Columns from {path1} and {path2} not identical"
-            # Verify the length of all columns in both dataframes is the same
-            for c1 in df1.columns:
-                assert (all(len(df1[c1]) == len(df1[c2]) for c2 in df1.columns)), \
-                    f"Not all columns from {path1} have same length"
-                assert (all(len(df1[c1]) == len(df2[c2]) for c2 in df1.columns)), \
-                    (f"Not all columns from {path1} and {path2} have "
-                     "the same length")
-class ExpStatisticsCalculator:
-    """Generate statistics from output files for all runs within an experiment.
-    .. IMPORTANT:: You *CANNOT* use logging ANYWHERE during processing .csv
-       files. Why ? I *think* because of a bug in the logging module itself. If
-       you get unlucky enough to spawn the process which enters the __call__()
-       method in this class while another logging statement is in progress (and
-       is therefore holding an internal logging module lock), then the
-       underlying fork() call will copy the lock in the acquired state. Then,
-       when this class goes to try to log something, it deadlocks with itself.
-       You also can't just create loggers with unique names, as this seems to be
-       something like the GIL, but for the logging module. Sometimes python
-       sucks.
-    """
-    def __init__(self,
-                 main_config: types.YAMLDict,
-                 avg_opts: dict,
-                 batch_stat_root: pathlib.Path) -> None:
-        self.avg_opts = avg_opts
-        # will get the main name and extension of the config file (without the
-        # full absolute path)
-        self.template_input_fname = self.avg_opts['template_input_leaf']
-        self.main_config = main_config
-        self.batch_stat_root = batch_stat_root
-        self.intra_perf_csv = main_config['sierra']['perf']['intra_perf_csv']
-        self.intra_perf_col = main_config['sierra']['perf']['intra_perf_col']
-    def __call__(self,
-                 gather_spec: GatherSpec,
-                 gathered_dfs: tp.List[pd.DataFrame]) -> None:
-        csv_concat = pd.concat(gathered_dfs)
-        exp_stat_root = self.batch_stat_root / gather_spec.exp_name
-        utils.dir_create_checked(exp_stat_root, exist_ok=True)
-        # Create directory for averaged .csv files for imagizing later.
-        if gather_spec.for_imagizing():
-            utils.dir_create_checked(exp_stat_root / gather_spec.item_stem,
-                                     exist_ok=True)
-        by_row_index = csv_concat.groupby(csv_concat.index)
-        dfs = {}
-        if self.avg_opts['dist_stats'] in ['none', 'all']:
-            dfs.update(stat_kernels.mean.from_groupby(by_row_index))
-        if self.avg_opts['dist_stats'] in ['conf95', 'all']:
-            dfs.update(stat_kernels.conf95.from_groupby(by_row_index))
-        if self.avg_opts['dist_stats'] in ['bw', 'all']:
-            dfs.update(stat_kernels.bw.from_groupby(by_row_index))
-        for ext in dfs:
-            opath = exp_stat_root / gather_spec.item_stem
-            if gather_spec.for_imagizing():
-                opath /= (gather_spec.imagize_csv_stem + ext)
-            else:
-                opath = opath.with_suffix(ext)
-            df = utils.df_fill(dfs[ext], self.avg_opts['df_homogenize'])
-            writer = storage.DataFrameWriter(self.avg_opts['storage_medium'])
-            writer(df, opath, index=False)
-__api__ = [
-    'GatherSpec',
-    'BatchExpParallelCalculator',
-    'ExpCSVGatherer',
-    'ExpStatisticsCalculator'
-]

sierra-research 1.3.11__py3-none-any.whl → 1.5.0__py3-none-any.whl

sierra-research 1.3.11__py3-none-any.whl → 1.5.0__py3-none-any.whl