PyPI - potassco-benchmark-tool - Versions diffs - 2.1.1__py3-none-any.whl - Mend

potassco-benchmark-tool 2.1.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (29)

benchmarktool/__init__.py +0 -0
benchmarktool/entry_points.py +417 -0
benchmarktool/init/programs/gcat.sh +24 -0
benchmarktool/init/runscripts/runscript-all.xml +49 -0
benchmarktool/init/runscripts/runscript-dist.xml +20 -0
benchmarktool/init/runscripts/runscript-example.xml +31 -0
benchmarktool/init/runscripts/runscript-seq.xml +27 -0
benchmarktool/init/templates/seq-generic-single.sh +27 -0
benchmarktool/init/templates/seq-generic-zip.sh +14 -0
benchmarktool/init/templates/seq-generic.sh +12 -0
benchmarktool/init/templates/single.dist +25 -0
benchmarktool/result/__init__.py +0 -0
benchmarktool/result/ipynb_gen.py +477 -0
benchmarktool/result/ods_config.py +42 -0
benchmarktool/result/ods_gen.py +714 -0
benchmarktool/result/parser.py +167 -0
benchmarktool/result/result.py +453 -0
benchmarktool/resultparser/__init__.py +0 -0
benchmarktool/resultparser/clasp.py +88 -0
benchmarktool/runscript/__init__.py +0 -0
benchmarktool/runscript/parser.py +477 -0
benchmarktool/runscript/runscript.py +1481 -0
benchmarktool/tools.py +82 -0
potassco_benchmark_tool-2.1.1.dist-info/METADATA +112 -0
potassco_benchmark_tool-2.1.1.dist-info/RECORD +29 -0
potassco_benchmark_tool-2.1.1.dist-info/WHEEL +5 -0
potassco_benchmark_tool-2.1.1.dist-info/entry_points.txt +2 -0
potassco_benchmark_tool-2.1.1.dist-info/licenses/LICENSE +21 -0
potassco_benchmark_tool-2.1.1.dist-info/top_level.txt +1 -0

benchmarktool/result/parser.py ADDED Viewed

@@ -0,0 +1,167 @@
+"""
+Created on Jan 19, 2010
+@author: Roland Kaminski
+"""
+from typing import Any, Optional
+from lxml import etree  # type: ignore[import-untyped]
+from benchmarktool import tools
+from benchmarktool.result.result import (
+    Benchmark,
+    Class,
+    ClassResult,
+    Config,
+    DistJob,
+    Instance,
+    InstanceResult,
+    Machine,
+    Project,
+    Result,
+    Run,
+    Runspec,
+    SeqJob,
+    Setting,
+    System,
+)
+# pylint: disable=too-many-instance-attributes
+class Parser:
+    """
+    A parser to parse XML result files.
+    """
+    def __init__(self) -> None:
+        """
+        Initializes the parser.
+        """
+        self.system_order = 0
+        self.result = Result()
+        self.setting_order = 0
+        self.benchscope = False
+        self.system: Optional[System] = None
+        self.benchmark: Optional[Benchmark] = None
+        self.benchclass: Optional[Class] = None
+        self.classresult: Optional[ClassResult] = None
+        self.instresult: Optional[InstanceResult] = None
+        self.runspec: Optional[Runspec] = None
+        self.project: Optional[Project] = None
+        self.run: Optional[Run] = None
+    def parse(self, infile: Any) -> Result:
+        """
+        Parse a given result file and return its representation
+        in form of an instance of class Result.
+        Attributes:
+            infile (Any): The file to parse.
+        """
+        # to reduce memory consumption especially for large result files
+        # do not use the full blown etree representation
+        parser = etree.XMLParser(target=self)
+        etree.parse(infile, parser)
+        assert isinstance(self.result, Result)
+        return self.result
+    # pylint: disable=too-many-statements,too-many-branches
+    def start(self, tag: str, attrib: dict[str, Any]) -> None:
+        """
+        This method is called for every opening XML tag.
+        Attributes:
+            tag (str):               The name of the tag.
+            attrib (dict[str, Any]): The attributes of the tag.
+        """
+        match tag:
+            case "machine":
+                machine = Machine(attrib["name"], attrib["cpu"], attrib["memory"])
+                self.result.machines[machine.name] = machine
+            case "config":
+                config = Config(attrib["name"], attrib["template"])
+                self.result.configs[config.name] = config
+            case "system":
+                self.system = System(
+                    attrib["name"], attrib["version"], attrib["config"], attrib["measures"], self.system_order
+                )
+                self.result.systems[(self.system.name, self.system.version)] = self.system
+                self.system_order += 1
+                self.setting_order = 0
+            case "setting":
+                tag = attrib.pop("tag", None)
+                name = attrib.pop("name")
+                cmdline = attrib.pop("cmdline")
+                assert self.system is not None
+                setting = Setting(self.system, name, cmdline, tag, self.setting_order, attrib)
+                self.system.settings[name] = setting
+                self.setting_order += 1
+            case "seqjob":
+                name = attrib.pop("name")
+                timeout = tools.xml_to_seconds_time(attrib.pop("timeout"))
+                runs = int(attrib.pop("runs"))
+                parallel = int(attrib.pop("parallel"))
+                seq_job = SeqJob(name, timeout, runs, attrib, parallel)
+                self.result.jobs[seq_job.name] = seq_job
+            case "distjob":
+                name = attrib.pop("name")
+                timeout = tools.xml_to_seconds_time(attrib.pop("timeout"))
+                runs = int(attrib.pop("runs"))
+                script_mode = attrib.pop("script_mode")
+                walltime = attrib.pop("walltime")
+                partition = attrib.pop("partition")
+                dist_job = DistJob(name, timeout, runs, attrib, script_mode, walltime, partition)
+                self.result.jobs[dist_job.name] = dist_job
+            case "benchmark":
+                self.benchscope = True
+                self.benchmark = Benchmark(attrib["name"])
+                self.result.benchmarks[self.benchmark.name] = self.benchmark
+            case "project":
+                self.project = Project(attrib["name"], attrib["job"])
+                self.result.projects[self.project.name] = self.project
+            case "runspec":
+                self.benchscope = False
+                self.runspec = Runspec(
+                    self.result.systems[(attrib["system"], attrib["version"])],
+                    self.result.machines[attrib["machine"]],
+                    self.result.benchmarks[attrib["benchmark"]],
+                    self.result.systems[(attrib["system"], attrib["version"])].settings[attrib["setting"]],
+                )
+                assert self.project is not None
+                self.project.runspecs.append(self.runspec)
+            case "class":
+                if self.benchscope:
+                    assert self.benchmark is not None
+                    self.benchclass = Class(self.benchmark, attrib["name"], int(attrib["id"]))
+                    self.benchmark.classes[self.benchclass.id] = self.benchclass
+                else:
+                    assert self.runspec is not None
+                    benchclass = self.runspec.benchmark.classes[int(attrib["id"])]
+                    self.classresult = ClassResult(benchclass)
+                    self.runspec.classresults.append(self.classresult)
+            case "instance":
+                if self.benchscope:
+                    assert self.benchclass is not None
+                    instance = Instance(self.benchclass, attrib["name"], int(attrib["id"]))
+                    self.benchclass.instances[instance.id] = instance
+                else:
+                    assert self.classresult is not None
+                    benchinst = self.classresult.benchclass.instances[int(attrib["id"])]
+                    self.instresult = InstanceResult(benchinst)
+                    self.classresult.instresults.append(self.instresult)
+            case "run":
+                if not self.benchscope:
+                    assert self.instresult is not None
+                    self.run = Run(self.instresult, int(attrib["number"]))
+                    self.instresult.runs.append(self.run)
+            case "measure":
+                assert self.run is not None
+                self.run.measures[attrib["name"]] = (attrib["type"], attrib["val"])
+    def close(self) -> None:
+        """
+        This method is called for every closing XML tag.
+        """

benchmarktool/result/result.py ADDED Viewed

@@ -0,0 +1,453 @@
+"""
+Created on Jan 19, 2010
+@author: Roland Kaminski
+"""
+from dataclasses import dataclass, field
+from pathlib import Path
+from typing import Any, Iterator, Optional
+from benchmarktool.result.ods_gen import ODSDoc
+class Result:
+    """
+    Stores the benchmark description and its results.
+    """
+    def __init__(self) -> None:
+        """
+        Initializes an empty result.
+        """
+        self.machines: dict[str, Machine] = {}
+        self.configs: dict[str, Config] = {}
+        self.systems: dict[tuple[str, str], System] = {}
+        self.jobs: dict[str, SeqJob | DistJob] = {}
+        self.benchmarks: dict[str, Benchmark] = {}
+        self.projects: dict[str, Project] = {}
+    def merge(self, projects: list["Project"]) -> "BenchmarkMerge":
+        """
+        Concatenates the benchmarks in the given projects into one benchmark set.
+        Attributes:
+            projects (list[Project]): The projects to merge with.
+        """
+        benchmarks: set[Benchmark] = set()
+        for project in projects:
+            for runspec in project:
+                for classresult in runspec:
+                    for instresult in classresult.instresults:
+                        instresult.instance.values["max_runs"] = max(
+                            instresult.instance.values["max_runs"], len(instresult.runs)
+                        )
+                benchmarks.add(runspec.benchmark)
+        return BenchmarkMerge(benchmarks)
+    def gen_office(
+        self, out: str, sel_projects: set[str], measures: list[tuple[str, Any]], export: bool = False
+    ) -> Optional[str]:
+        """
+        Prints the current result in open office spreadsheet format.
+        Returns the name of the export file if values are exported.
+        Attributes:
+            out (str):                        The output file to write to.
+            sel_projects (set[str]):          The selected projects ("" for all).
+            measures (list[tuple[str, Any]]): The measures to extract.
+        """
+        projects: list[Project] = []
+        for project in self.projects.values():
+            if len(sel_projects) == 0 or project.name in sel_projects:
+                projects.append(project)
+        benchmark_merge = self.merge(projects)
+        sheet = ODSDoc(benchmark_merge, measures)
+        for project in projects:
+            for runspec in project:
+                sheet.add_runspec(runspec)
+        sheet.finish()
+        sheet.make_ods(out)
+        if export:
+            # as_posix() for windows compatibility
+            ex_file = Path(out).absolute().as_posix().replace(".ods", ".parquet")
+            timeout_meta = {}
+            for project in projects:
+                for runspec in project.runspecs:
+                    timeout_meta[
+                        "_to_"
+                        + runspec.setting.system.name
+                        + "-"
+                        + runspec.setting.system.version
+                        + "/"
+                        + runspec.setting.name
+                    ] = [self.jobs[project.job].timeout]
+            sheet.inst_sheet.export_values(ex_file, timeout_meta)
+            return ex_file
+        return None
+class BenchmarkMerge:
+    """
+    Represents an (ordered) set of benchmark sets.
+    """
+    def __init__(self, benchmarks: set["Benchmark"]):
+        """
+        Initializes using the given set of benchmarks.
+        Attributes:
+            benchmarks (set[Benchmark]): Benchmarks to merge.
+        """
+        self.benchmarks = benchmarks
+        inst_num = 0
+        class_num = 0
+        for benchclass in self:
+            benchclass.values["row"] = class_num
+            benchclass.values["inst_start"] = inst_num
+            for instance in benchclass:
+                instance.values["row"] = inst_num
+                inst_num += max(instance.values["max_runs"], 1)
+            benchclass.values["inst_end"] = inst_num - 1
+            class_num += 1
+    def __iter__(self) -> Iterator["Class"]:
+        """
+        Creates an interator over all benchmark classes in all benchmarks.
+        """
+        for benchmark in sorted(self.benchmarks):
+            yield from benchmark
+@dataclass(order=True, frozen=True)
+class Machine:
+    """
+    Represents a machine.
+    Instances are immutable; only the name takes part in comparisons
+    and ordering.
+    Attributes:
+        name (str):   The name of the machine.
+        cpu (str):    String describing the CPU.
+        memory (str): String describing the Memory.
+    """
+    name: str
+    cpu: str = field(compare=False)
+    memory: str = field(compare=False)
+@dataclass(order=True, frozen=True)
+class Config:
+    """
+    Represents a config.
+    Instances are immutable; only the name takes part in comparisons
+    and ordering.
+    Attributes:
+        name (str):     The name of the config.
+        template (str): A path to the template file.
+    """
+    name: str
+    template: str = field(compare=False)
+@dataclass(order=True, frozen=True)
+class System:
+    """
+    Represents a system.
+    Instances are immutable; comparisons and ordering use the name,
+    the version and the order, in that sequence.
+    Attributes:
+        name (str):                    The name of the system.
+        version (str):                 The version.
+        config (str):                  The config (a string).
+        measures (str):                The measurement function (a string).
+        order (int):                   An integer denoting the occurrence in the XML file.
+        settings (dict[str, Setting]): Dictionary of all system settings, keyed by setting name.
+    """
+    name: str
+    version: str
+    config: str = field(compare=False)
+    measures: str = field(compare=False)
+    order: int
+    # the dict itself stays mutable although the dataclass is frozen
+    settings: dict[str, "Setting"] = field(default_factory=dict, compare=False)
+@dataclass(order=True, frozen=True)
+class Setting:
+    """
+    Represents a setting.
+    Instances are immutable; comparisons and ordering use the system,
+    the name and the order, in that sequence.
+    Attributes:
+        system (System):       The system associated with the setting.
+        name (str):            The name of the setting.
+        cmdline (str):         Command line parameters.
+        tag (Optional[str]):   Tags of the setting (None if the XML element has no tag attribute).
+        order (int):           An integer denoting the occurrence in the XML file.
+        attr (dict[str, Any]): Arbitrary extra arguments.
+    """
+    system: "System"
+    name: str
+    cmdline: str = field(compare=False)
+    tag: Optional[str] = field(compare=False)
+    order: int
+    attr: dict[str, Any] = field(compare=False)
+@dataclass(order=True, frozen=True)
+class Job:
+    """
+    Represents a job.
+    Base class of SeqJob and DistJob. Instances are immutable; only the
+    name takes part in comparisons and ordering.
+    Attributes:
+        name (str):            The name of the job.
+        timeout (int):         Timeout of the job.
+        runs (int):            Number of repetitions per instance.
+        attr (dict[str, Any]): Arbitrary extra arguments.
+    """
+    name: str
+    timeout: int = field(compare=False)
+    runs: int = field(compare=False)
+    attr: dict[str, Any] = field(compare=False)
+@dataclass(order=True, frozen=True)
+class SeqJob(Job):
+    """
+    Represents a sequential job.
+    Attributes:
+        name (str):            The name of the job.
+        timeout (int):         Timeout of the job.
+        runs (int):            Number of repetitions per instance.
+        attr (dict[str, Any]): Arbitrary extra arguments.
+        parallel (int):        Number of processes to start in parallel.
+    """
+    parallel: int = field(compare=False)
+@dataclass(order=True, frozen=True)
+class DistJob(Job):
+    """
+    Represents a dist job.
+    Attributes:
+        name (str):            The name of the job.
+        timeout (int):         Timeout of the job.
+        runs (int):            Number of repetitions per instance.
+        attr (dict[str, Any]): Arbitrary extra arguments.
+        script_mode (str):     Specifies the script generation mode.
+        walltime (str):        The walltime for a distributed job.
+        partition (str):       The partition attribute of the job (presumably the
+                               cluster partition to submit to; confirm against the runscript).
+    """
+    script_mode: str = field(compare=False)
+    walltime: str = field(compare=False)
+    partition: str = field(compare=False)
+@dataclass(order=True, frozen=True)
+class Benchmark:
+    """
+    Represents a benchmark, i.e., a set of instances.
+    Attributes:
+        name (str):                 The name of the benchmark.
+        classes (dict[int, Class]): Benchmark classes in this benchmark.
+    """
+    name: str
+    classes: dict[int, "Class"] = field(default_factory=dict, compare=False)
+    def __iter__(self) -> Iterator["Class"]:
+        """
+        Creates an iterator over all benchmark classes.
+        """
+        yield from sorted(self.classes.values())
+@dataclass(order=True, frozen=True)
+class Class:
+    """
+    Represents a benchmark class.
+    Attributes:
+        benchmark (Benchmark):           The benchmark associaed with this class.
+        name (str):                      The name of the benchmark.
+        id (int):                        A unique id (in the scope of the benchmark).
+        instances (dict[int, Instance]): Instances belonging to this benchmark class.
+        values (dict[str, Any]):         Mutable dict with helper values.
+    """
+    benchmark: Benchmark
+    name: str
+    id: int = field(compare=False)
+    instances: dict[int, "Instance"] = field(default_factory=dict, compare=False)
+    values: dict[str, int] = field(default_factory=dict, compare=False)
+    def __post_init__(self) -> None:
+        """
+        Initialize mutable helper variables.
+        """
+        self.values["row"] = 0
+        self.values["inst_start"] = 0
+        self.values["inst_end"] = 0
+    def __iter__(self) -> Iterator["Instance"]:
+        """
+        Creates an iterator over all instances in the benchmark class.
+        """
+        yield from sorted(self.instances.values())
+@dataclass(order=True, frozen=True)
+class Instance:
+    """
+    Represents a benchmark instance.
+    Attributes:
+        benchclass (Class):      The class of the instance.
+        name (str):              The name of the benchmark.
+        id (int):                A unique id (in the scope of the benchmark).
+        max_runs (int):          Max number of runs.
+        values (dict[str, Any]): Mutable dict with helper values.
+    """
+    benchclass: Class
+    name: str
+    id: int = field(compare=False)
+    values: dict[str, int] = field(default_factory=dict, compare=False)
+    def __post_init__(self) -> None:
+        """
+        Initialize mutable helper variables.
+        """
+        self.values["max_runs"] = 0
+        self.values["row"] = 0
+@dataclass(order=True, frozen=True)
+class Project:
+    """
+    Describes a project, i.e, a collection of run specifications.
+    Attributes:
+        name (str):                 The name of the project.
+        job (str):                  The name of the associated job.
+        runspecs (list['Runspec']): Run specifications of the project.
+    """
+    name: str
+    job: str = field(compare=False)
+    runspecs: list["Runspec"] = field(default_factory=list, compare=False)
+    def __iter__(self) -> Iterator["Runspec"]:
+        """
+        Creates an iterator over all run specification in the project.
+        """
+        yield from self.runspecs
+@dataclass(order=True, frozen=True)
+class Runspec:
+    """
+    Describes a run specification, i.e, how to run individual systems
+    on a set of instances.
+    Attributes:
+        system (System):                  The system to evaluate.
+        machine (Machine):                The machine to run on.
+        benchmark (Benchmark):            The benchmark set to evaluate.
+        setting (Setting):                The setting to run with.
+        classresults (list[ClassResult]): The benchmark results.
+    """
+    system: "System"
+    machine: "Machine"
+    benchmark: "Benchmark"
+    setting: "Setting"
+    classresults: list["ClassResult"] = field(default_factory=list, compare=False)
+    def __iter__(self) -> Iterator["ClassResult"]:
+        """
+        Creates an iterator over all results (grouped by benchmark class.)
+        """
+        yield from self.classresults
+@dataclass(order=True, frozen=True)
+class ClassResult:
+    """
+    Represents the results of all instances of a benchmark class.
+    Attributes:
+        benchclass (Class):                 The benchmark class for the results.
+        instresults (list[InstanceResult]): Results of instances belonging to the benchmark class.
+    """
+    benchclass: "Class"
+    instresults: list["InstanceResult"] = field(default_factory=list, compare=False)
+    def __iter__(self) -> Iterator["InstanceResult"]:
+        """
+        Creates an iterator over all the individual results per instance.
+        """
+        yield from self.instresults
+@dataclass(order=True, frozen=True)
+class InstanceResult:
+    """
+    Represents the result of an individual instance (with possibly multiple runs).
+    Attributes:
+        instance (Instance): The instance for the results.
+        runs (list[Run]):    Results of runs belonging to the instance.
+    """
+    instance: "Instance"
+    runs: list["Run"] = field(default_factory=list, compare=False)
+    def __iter__(self) -> Iterator["Run"]:
+        """
+        Creates an iterator over the result of all runs.
+        """
+        yield from self.runs
+@dataclass(order=True, frozen=True)
+class Run:
+    """
+    Represents the result of an individual run of a benchmark instance.
+    Attributes:
+        instresult (InstanceResult):           The associated instance result.
+        number (int):                          The number of the run.
+        measures (dict[str, tuple[str, str]]): Concrete measurements.
+    """
+    instresult: "InstanceResult"
+    number: int
+    measures: dict[str, tuple[str, str]] = field(default_factory=dict, compare=False)
+    def iter(self, measures: list[tuple[str, Any]]) -> Iterator[tuple[str, str, str]]:
+        """
+        Creates an iterator over all measures captured during the run.
+        Measures can be filter by giving a string set of measure names.
+        If this string set is empty, instead all measures sorted by their keys
+        will be returned.
+        Attributes:
+            measures (list[tuple[str, Any]]): Selected measures.
+        """
+        if len(measures) == 0:
+            for name in sorted(self.measures.keys()):
+                yield name, self.measures[name][0], self.measures[name][1]
+        else:
+            for name, _ in measures:
+                if name in self.measures:
+                    yield name, self.measures[name][0], self.measures[name][1]
+                else:
+                    yield name, "None", "NaN"

benchmarktool/resultparser/__init__.py ADDED Viewed

File without changes