PyPI - idmtools-platform-comps - Versions diffs - 0.0.0.dev0__py3-none-any.whl → 0.0.2__py3-none-any.whl - Mend

idmtools-platform-comps 0.0.0.dev0__py3-none-any.whl → 0.0.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (64) hide show

idmtools_platform_comps/__init__.py +25 -8
idmtools_platform_comps/cli/__init__.py +4 -0
idmtools_platform_comps/cli/cli_functions.py +50 -0
idmtools_platform_comps/cli/comps.py +492 -0
idmtools_platform_comps/comps_cli.py +48 -0
idmtools_platform_comps/comps_operations/__init__.py +6 -0
idmtools_platform_comps/comps_operations/asset_collection_operations.py +263 -0
idmtools_platform_comps/comps_operations/experiment_operations.py +569 -0
idmtools_platform_comps/comps_operations/simulation_operations.py +678 -0
idmtools_platform_comps/comps_operations/suite_operations.py +228 -0
idmtools_platform_comps/comps_operations/workflow_item_operations.py +269 -0
idmtools_platform_comps/comps_platform.py +309 -0
idmtools_platform_comps/plugin_info.py +168 -0
idmtools_platform_comps/ssmt_operations/__init__.py +6 -0
idmtools_platform_comps/ssmt_operations/simulation_operations.py +77 -0
idmtools_platform_comps/ssmt_operations/workflow_item_operations.py +73 -0
idmtools_platform_comps/ssmt_platform.py +44 -0
idmtools_platform_comps/ssmt_work_items/__init__.py +4 -0
idmtools_platform_comps/ssmt_work_items/comps_work_order_task.py +29 -0
idmtools_platform_comps/ssmt_work_items/comps_workitems.py +113 -0
idmtools_platform_comps/ssmt_work_items/icomps_workflowitem.py +71 -0
idmtools_platform_comps/ssmt_work_items/work_order.py +54 -0
idmtools_platform_comps/utils/__init__.py +4 -0
idmtools_platform_comps/utils/assetize_output/__init__.py +4 -0
idmtools_platform_comps/utils/assetize_output/assetize_output.py +125 -0
idmtools_platform_comps/utils/assetize_output/assetize_ssmt_script.py +144 -0
idmtools_platform_comps/utils/base_singularity_work_order.json +6 -0
idmtools_platform_comps/utils/download/__init__.py +4 -0
idmtools_platform_comps/utils/download/download.py +178 -0
idmtools_platform_comps/utils/download/download_ssmt.py +81 -0
idmtools_platform_comps/utils/download_experiment.py +116 -0
idmtools_platform_comps/utils/file_filter_workitem.py +519 -0
idmtools_platform_comps/utils/general.py +358 -0
idmtools_platform_comps/utils/linux_mounts.py +73 -0
idmtools_platform_comps/utils/lookups.py +123 -0
idmtools_platform_comps/utils/package_version.py +489 -0
idmtools_platform_comps/utils/python_requirements_ac/__init__.py +4 -0
idmtools_platform_comps/utils/python_requirements_ac/create_asset_collection.py +155 -0
idmtools_platform_comps/utils/python_requirements_ac/install_requirements.py +109 -0
idmtools_platform_comps/utils/python_requirements_ac/requirements_to_asset_collection.py +374 -0
idmtools_platform_comps/utils/python_version.py +40 -0
idmtools_platform_comps/utils/scheduling.py +154 -0
idmtools_platform_comps/utils/singularity_build.py +491 -0
idmtools_platform_comps/utils/spatial_output.py +76 -0
idmtools_platform_comps/utils/ssmt_utils/__init__.py +6 -0
idmtools_platform_comps/utils/ssmt_utils/common.py +70 -0
idmtools_platform_comps/utils/ssmt_utils/file_filter.py +568 -0
idmtools_platform_comps/utils/sweeping.py +162 -0
idmtools_platform_comps-0.0.2.dist-info/METADATA +100 -0
idmtools_platform_comps-0.0.2.dist-info/RECORD +62 -0
idmtools_platform_comps-0.0.2.dist-info/entry_points.txt +9 -0
idmtools_platform_comps-0.0.2.dist-info/licenses/LICENSE.TXT +3 -0
{idmtools_platform_comps-0.0.0.dev0.dist-info → idmtools_platform_comps-0.0.2.dist-info}/top_level.txt +1 -0
ssmt_image/Dockerfile +52 -0
ssmt_image/Makefile +21 -0
ssmt_image/__init__.py +6 -0
ssmt_image/bootstrap.sh +30 -0
ssmt_image/build_docker_image.py +161 -0
ssmt_image/pip.conf +3 -0
ssmt_image/push_docker_image.py +49 -0
ssmt_image/requirements.txt +9 -0
idmtools_platform_comps-0.0.0.dev0.dist-info/METADATA +0 -41
idmtools_platform_comps-0.0.0.dev0.dist-info/RECORD +0 -5
{idmtools_platform_comps-0.0.0.dev0.dist-info → idmtools_platform_comps-0.0.2.dist-info}/WHEEL +0 -0

idmtools_platform_comps/utils/general.py ADDED Viewed

@@ -0,0 +1,358 @@
+"""idmtools general status.
+Copyright 2021, Bill & Melinda Gates Foundation. All rights reserved.
+"""
+import os
+import re
+import uuid
+import ntpath
+from logging import getLogger, DEBUG
+from typing import List, Dict, Union, Generator, Optional
+from uuid import UUID
+from COMPS import Client
+from COMPS.Data import Simulation, SimulationFile, AssetCollectionFile, WorkItemFile, OutputFileMetadata, Experiment
+from COMPS.Data import AssetCollection as COMPSAssetCollection
+from COMPS.Data.AssetFile import AssetFile
+from COMPS.Data.Simulation import SimulationState
+from COMPS.Data.WorkItem import WorkItemState, WorkItem
+from requests import RequestException
+from idmtools.assets import AssetCollection, Asset
+from idmtools.core import EntityStatus, ItemType
+from idmtools.core.context import get_current_platform
+from idmtools.core.interfaces.ientity import IEntity
+from idmtools.entities.iplatform import IPlatform
+from idmtools.utils.local_os import LocalOS
+# Prefix (Windows-style separator) that marks a path as living inside the "Assets" folder.
+ASSETS_PATH = "Assets\\"
+if LocalOS.is_window():
+    # Lower-cased on Windows; get_file_from_collection lower-cases the paths it compares there.
+    ASSETS_PATH = ASSETS_PATH.lower()
+logger = getLogger(__name__)
+# Characters that clean_experiment_name replaces with "_".
+chars_to_replace = ['/', '\\', ':', "'", '"', '?', '<', '>', '*', '|', "\0", "(", ")", '`']
+# Character class matching any single character listed in chars_to_replace.
+clean_names_expr = re.compile(f'[{re.escape("".join(chars_to_replace))}]')
+def fatal_code(e: Exception) -> bool:
+    """
+    Uses to determine if we should stop retrying based on request status code.
+    Args:
+        e: Exception to check
+    Returns:
+        True is exception is a request and status code matches 404
+    """
+    if isinstance(e, RequestException):
+        return e.response.status_code == 404
+    return False
+def convert_comps_status(comps_status: SimulationState) -> EntityStatus:
+    """
+    Convert status from COMPS to IDMTools.
+    Args:
+        comps_status: Status in Comps
+    Returns:
+        EntityStatus
+    """
+    if comps_status == SimulationState.Succeeded:
+        return EntityStatus.SUCCEEDED
+    elif comps_status in (SimulationState.Canceled, SimulationState.CancelRequested, SimulationState.Failed):
+        return EntityStatus.FAILED
+    elif comps_status == SimulationState.Created:
+        return EntityStatus.CREATED
+    else:
+        return EntityStatus.RUNNING
+def convert_comps_workitem_status(comps_status: WorkItemState) -> EntityStatus:
+    """
+    Convert status from COMPS to IDMTools.
+    Created = 0                # WorkItem has been saved to the database
+    CommissionRequested = 5    # WorkItem is ready to be processed by the next available worker of the correct type
+    Commissioned = 10          # WorkItem has been commissioned to a worker of the correct type and is beginning execution
+    Validating = 30            # WorkItem is being validated
+    Running = 40               # WorkItem is currently running
+    Waiting = 50               # WorkItem is waiting for dependent items to complete
+    ResumeRequested = 60       # Dependent items have completed and WorkItem is ready to be processed by the next available worker of the correct type
+    CancelRequested = 80       # WorkItem cancellation was requested
+    Canceled = 90              # WorkItem was successfully canceled
+    Resumed = 100              # WorkItem has been claimed by a worker of the correct type and is resuming
+    Canceling = 120            # WorkItem is in the process of being canceled by the worker
+    Succeeded = 130            # WorkItem completed successfully
+    Failed = 140               # WorkItem failed
+    Args:
+        comps_status: Status in Comps
+    Returns:
+        EntityStatus
+    """
+    work_item_canceled = (WorkItemState.Canceled, WorkItemState.CancelRequested, WorkItemState.Failed)
+    work_item_created = [
+        WorkItemState.Created, WorkItemState.Resumed, WorkItemState.CommissionRequested, WorkItemState.Commissioned
+    ]
+    if comps_status == WorkItemState.Succeeded:
+        return EntityStatus.SUCCEEDED
+    elif comps_status in work_item_canceled:
+        return EntityStatus.FAILED
+    elif comps_status == work_item_created:
+        return EntityStatus.CREATED
+    else:
+        return EntityStatus.RUNNING
+def clean_experiment_name(experiment_name: str) -> str:
+    """
+    Enforce any COMPS-specific demands on experiment names.
+    Args:
+        experiment_name: name of the experiment
+    Returns:the experiment name allowed for use
+    """
+    experiment_name = clean_names_expr.sub("_", experiment_name)
+    return experiment_name.encode("ascii", "ignore").decode('utf8').strip()
+def get_file_from_collection(platform: IPlatform, collection_id: UUID, file_path: str) -> bytearray:
+    """
+    Retrieve a file from an asset collection.
+    Args:
+        platform: Platform object to use
+        collection_id: Asset Collection ID
+        file_path: Path within collection
+    Examples::
+    >>> import uuid
+    >>> get_file_from_collection(platform, uuid.UUID("fc461146-3b2a-441f-bc51-0bff3a9c1ba0"), "StdOut.txt")
+    Returns:
+        Object Byte Array
+    """
+    logger.debug(f"Cache miss for {collection_id} {file_path}")
+    # retrieve the collection
+    ac = platform.get_item(collection_id, ItemType.ASSETCOLLECTION, raw=True)
+    # Look for the asset file in the collection
+    file_name = ntpath.basename(file_path)
+    path = ntpath.dirname(file_path)
+    if LocalOS.is_window():
+        file_name = file_name.lower()
+        path = path.lower()
+    path = os.path.normpath(path.lstrip(ASSETS_PATH).strip('/'))
+    for asset_file in ac.assets:
+        if LocalOS.is_window():
+            if asset_file.file_name.lower() == file_name and os.path.normpath(asset_file.relative_path or '').lower() == path:
+                return asset_file.retrieve()
+        else:
+            if asset_file.file_name == file_name and os.path.normpath(asset_file.relative_path or '') == path:
+                return asset_file.retrieve()
+def get_file_as_generator(file: Union[SimulationFile, AssetCollectionFile, AssetFile, WorkItemFile, OutputFileMetadata],
+                          chunk_size: int = 128, resume_byte_pos: Optional[int] = None) -> \
+        Generator[bytearray, None, None]:
+    """
+    Get file as a generator.
+    Args:
+        file: File to stream contents through a generator
+        chunk_size: Size of chunks to load
+        resume_byte_pos: Optional start of download
+    Returns:
+        Generator for file content
+    """
+    if isinstance(file, OutputFileMetadata):
+        url = file.url
+    else:
+        url = file.uri
+    i = url.find('/asset/')
+    if i == -1:
+        raise RuntimeError('Unable to parse asset url: ' + url)
+    if resume_byte_pos:
+        header = {'Range': 'bytes=%d-' % resume_byte_pos}
+    else:
+        header = {}
+    response = Client.get(url[i:], headers=header, stream=True)
+    yield from response.iter_content(chunk_size=chunk_size)
+class Workitem(object):
+    """SimpleItem to define workitem for proxy purposes.
+    Notes:
+        - TODO deprecate this if possible
+    """
+    pass
+def get_asset_for_comps_item(platform: IPlatform, item: IEntity, files: List[str], cache=None,
+                             comps_item: Union[Experiment, Workitem, Simulation] = None) -> Dict[str, bytearray]:
+    """
+    Retrieve assets from an Entity(Simulation, Experiment, WorkItem).
+    Args:
+        platform: Platform Object to use
+        item: Item to fetch assets from
+        files: List of file names to retrieve
+        cache: Cache object to use
+        comps_item: Optional comps item
+    Returns:
+        Dictionary in structure of filename -> bytearray
+    """
+    if logger.isEnabledFor(DEBUG):
+        logger.debug(f"Loading the files {files} from {item}")
+    if len(files) == 0:
+        transients = []
+        assets = None
+    else:
+        all_paths = set(files)
+        assets = set(path for path in all_paths if path.lower().startswith("assets"))
+        transients = all_paths.difference(assets)
+    # Create the return dict
+    ret = {}
+    # Retrieve the transient if any
+    if isinstance(comps_item, (Simulation, WorkItem)):
+        if transients or len(files) == 0:
+            transient_files = comps_item.retrieve_output_files(paths=transients)
+            ret = dict(zip(transients, transient_files))
+    else:
+        ret = dict()
+    # Take care of the assets
+    if assets and comps_item.configuration:
+        # Get the collection_id for the simulation
+        collection_id = comps_item.configuration.asset_collection_id
+        if collection_id:
+            # Retrieve the files
+            for file_path in assets:
+                # Normalize the separators
+                normalized_path = ntpath.normpath(file_path)
+                if cache is not None:
+                    ret[file_path] = cache.memoize()(get_file_from_collection)(platform, collection_id, normalized_path)
+                else:
+                    ret[file_path] = get_file_from_collection(platform, collection_id, normalized_path)
+    return ret
+def update_item(platform: IPlatform, item_id: str, item_type: ItemType, tags: dict = None, name: str = None):
+    """Utility function to update existing COMPS experiment/simulation/workitem's tags.
+    For example, you can add/update simulation's tag once its post-process is done to mark the simulation with
+    more meaningful text with tag/name
+    Args:
+        platform: Platform
+        item_id: experiment/simulation/workitem id
+        item_type: The type of the object to be retrieved
+        tags: tags dict for update
+        name: name of experiment/simulation/workitem
+    Returns:
+        None
+    """
+    comps_item = platform.get_item(item_id, item_type, raw=True)
+    current_tags = comps_item.tags
+    if tags is not None:
+        current_tags.update(tags)
+        comps_item.set_tags(current_tags)
+    if name is not None:
+        comps_item.name = name
+    comps_item.save()
+def generate_ac_from_asset_md5(file_name: str, asset_md5: [str, uuid.UUID], platform: 'IPlatform' = None,
+                               tags: dict = None):
+    """
+    Get an asset collection by asset id(md5).
+    Args:
+        file_name: file name string
+        asset_md5: asset md5 string
+        platform : Platform object
+        tags: tags dict for asset collection
+    Returns:
+        COMPS AssetCollection
+    """
+    if tags is None:
+        tags = {'Name': file_name, 'md5': asset_md5}
+    else:
+        tags['Name'] = file_name
+        tags['md5'] = asset_md5
+    if platform is None:
+        platform = get_current_platform()
+    ac = COMPSAssetCollection()
+    ac.set_tags(tags)
+    acf = AssetCollectionFile(file_name=file_name, md5_checksum=asset_md5)
+    ac.add_asset(acf)
+    ac.save()
+    print('done - created AC ' + str(ac.id))
+    asset_collection: AssetCollection = platform._assets.to_entity(ac)
+    return asset_collection
+def generate_ac_from_asset_md5_file(file_path: str):
+    """
+    Get an asset collection by file path.
+    Args:
+        file_path : file path
+    Returns:
+        COMPS AssetCollection
+    """
+    # Check if the file exists and is accessible
+    try:
+        with open(file_path, "r") as asset_fd:
+            content = asset_fd.read()
+    except FileNotFoundError:
+        logger.debug(f"Error: The file {file_path} was not found.")
+        return None
+    except IOError:
+        logger.debug(f"Error: Could not read the file {file_path}.")
+        return None
+    # Split the content and check format
+    items = content.split(':')
+    if len(items) < 3:
+        logger.debug("Error: The file's content is not in the expected format.")
+        return None
+    file_name = items[0]
+    asset_md5 = items[2]
+    # Handle errors from generate_ac_from_asset_md5
+    try:
+        asset_collection: AssetCollection = generate_ac_from_asset_md5(file_name, asset_md5)
+    except Exception as e:
+        logger.debug(f"An error occurred while generating AC from asset ID: {e}")
+        return None
+    return asset_collection
+def save_sif_asset_md5_from_ac_id(ac_id: str):
+    """
+    Get the md5 of the asset in the asset collection of singularity.
+    Args:
+        ac_id: asset collection id
+    """
+    from COMPS.Data import QueryCriteria
+    ac = COMPSAssetCollection.get(ac_id, QueryCriteria().select_children(['assets']))
+    asset = Asset(filename=ac.assets[0].file_name, checksum=ac.assets[0].md5_checksum)
+    # Save the asset filename and md5 checksum to local file
+    asset.save_md5_checksum()

idmtools_platform_comps/utils/linux_mounts.py ADDED Viewed

@@ -0,0 +1,73 @@
+"""idmtools set linux mounts.
+Copyright 2021, Bill & Melinda Gates Foundation. All rights reserved.
+"""
+import os
+from COMPS import AuthManager
+from COMPS.Data import Simulation
+from typing import TYPE_CHECKING, List, Dict
+if TYPE_CHECKING:  # pragma: no cover
+    from idmtools.entities.iplatform import IPlatform
+# Upper-case environment names for which set_linux_mounts / clear_linux_mounts act by default.
+DEFAULT_ENVIRONMENTS = ["SLURMSTAGE", "CALCULON", "NIBBLER"]
+def set_linux_mounts(platform: 'IPlatform', linux_environment: str = None) -> None:
+    """
+    For COMPS Platform, check and set linux mounts.
+    Args:
+        platform: idmtools COMPS Platform
+        linux_environment: platform environment
+    Returns:
+        None
+    """
+    linux_envs = DEFAULT_ENVIRONMENTS
+    if linux_environment is not None:
+        linux_envs.append(linux_environment.upper())
+    if platform.environment.upper() in linux_envs:
+        mounts = AuthManager.get_environment_macros(platform.environment)['DOCKER_MOUNTS']
+        mounts = {v[0]: v[1:4] for v in [m.split(';') for m in mounts.split('|')]}
+        # pretend I'm on Linux and set the Linux mapping environment variables
+        for k, v in mounts.items():
+            os.environ[k] = ';'.join([v[0], v[2]])
+def clear_linux_mounts(platform: 'IPlatform', linux_environment: str = None) -> None:
+    """
+    For COMPS Platform, check and clear linux mounts.
+    Args:
+        platform: idmtools COMPS Platform
+        linux_environment: platform environment
+    Returns:
+        None
+    """
+    linux_envs = DEFAULT_ENVIRONMENTS
+    if linux_environment is not None:
+        linux_envs.append(linux_environment.upper())
+    if platform.environment.upper() in linux_envs:
+        mounts = AuthManager.get_environment_macros(platform.environment)['DOCKER_MOUNTS']
+        mounts = {v[0]: v[1:4] for v in [m.split(';') for m in mounts.split('|')]}
+        # pretend I'm on Linux and clear the Linux mapping environment variables
+        for k, v in mounts.items():
+            os.environ.pop(k)
+def get_workdir_from_simulations(platform: 'IPlatform', comps_simulations: List[Simulation]) -> Dict[str, str]:
+    """
+    Get COMPS simulations working directory.
+    Args:
+        platform: idmtools COMPS Platform
+        comps_simulations: COMPS Simulations
+    Returns:
+        dictionary with simulation id as key and working directory as value
+    """
+    set_linux_mounts(platform)
+    sim_work_dir = {str(sim.id): sim.hpc_jobs[-1].working_directory for sim in comps_simulations if sim.hpc_jobs}
+    clear_linux_mounts(platform)
+    return sim_work_dir

idmtools_platform_comps/utils/lookups.py ADDED Viewed

@@ -0,0 +1,123 @@
+"""idmtools comps lookups.
+Copyright 2021, Bill & Melinda Gates Foundation. All rights reserved.
+"""
+from datetime import datetime, timedelta
+from logging import getLogger
+from typing import List
+import backoff
+from COMPS.Data import Experiment, Simulation, QueryCriteria
+from requests import Timeout, HTTPError
+from idmtools_platform_comps.utils.general import fatal_code
+# Module-level logger named after this module.
+logger = getLogger(__name__)
+@backoff.on_exception(backoff.constant(1.5), (Timeout, ConnectionError, HTTPError), max_tries=5, giveup=fatal_code)
+def get_experiment_by_id(exp_id, query_criteria: QueryCriteria = None) -> Experiment:
+    """Get an experiment by id."""
+    return Experiment.get(exp_id, query_criteria=query_criteria)
+@backoff.on_exception(backoff.constant(1.5), (Timeout, ConnectionError, HTTPError), max_tries=5, giveup=fatal_code)
+def get_simulation_by_id(sim_id, query_criteria: QueryCriteria = None) -> Simulation:
+    """
+    Fetches simulation by id and optional query criteria.
+    Wrapped in additional Retry Logic. Used by other lookup methods
+    Args:
+        sim_id:
+        query_criteria: Optional QueryCriteria to search with
+    Returns:
+        Simulation with ID
+    """
+    return Simulation.get(id=sim_id, query_criteria=query_criteria)
+def get_all_experiments_for_user(user: str) -> List[Experiment]:
+    """
+    Returns all the experiments for a specific user.
+    Args:
+        user: username to locate
+    Returns:
+        Experiments for a user
+    """
+    # COMPS limits the retrieval to 1000 so to make sure we get all experiments for a given user, we need to be clever
+    # Also COMPS does not have an order_by so we have to go through all date ranges
+    interval = 365
+    results = {}
+    end_date = start_date = datetime.today()
+    limit_date = datetime.strptime("2014-03-31", '%Y-%m-%d')  # Oldest simulation in COMPS
+    while start_date > limit_date:
+        start_date = end_date - timedelta(days=interval)
+        batch = Experiment.get(query_criteria=QueryCriteria().where(["owner={}".format(user),
+                                                                     "date_created<={}".format(
+                                                                         end_date.strftime('%Y-%m-%d')),
+                                                                     "date_created>={}".format(
+                                                                         start_date.strftime('%Y-%m-%d'))]))
+        if len(batch) == 1000:
+            # We hit a limit, reduce the interval and run again
+            interval = interval / 2
+            continue
+        if len(batch) == 0:
+            interval *= 2
+        else:
+            # Add the experiments to the dict
+            for e in batch:
+                results[e.id] = e
+        # Go from there
+        end_date = start_date
+    return list(results.values())
+def get_simulations_from_big_experiments(experiment_id):
+    """
+    Get simulation for large experiment. This allows us to pull simulations in chunks.
+    Args:
+        experiment_id: Experiment id to load
+    Returns:
+        List of simulations
+    """
+    e = get_experiment_by_id(experiment_id)
+    start_date = end_date = e.date_created
+    import pytz
+    limit_date = datetime.today().replace(tzinfo=pytz.utc)
+    interval = 60
+    stop_flag = False
+    results = {}
+    while start_date < limit_date:
+        start_date = end_date + timedelta(minutes=interval)
+        try:
+            batch = Simulation.get(query_criteria=QueryCriteria()
+                                   .select(['id', 'state', 'date_created']).select_children('tags')
+                                   .where(["experiment_id={}".format(experiment_id),
+                                           "date_created>={}".format(end_date.strftime('%Y-%m-%d %T')),
+                                           "date_created<={}".format(start_date.strftime('%Y-%m-%d %T'))])
+                                   )
+        except Exception as e:
+            logger.exception(e)
+            interval /= 2
+            continue
+        if not batch:
+            if stop_flag:
+                break
+            else:
+                interval = 120
+                stop_flag = True
+        else:
+            stop_flag = False
+            for s in batch:
+                results[s.id] = s
+        end_date = start_date
+    return results.values()

idmtools-platform-comps 0.0.0.dev0__py3-none-any.whl → 0.0.2__py3-none-any.whl

idmtools-platform-comps 0.0.0.dev0__py3-none-any.whl → 0.0.2__py3-none-any.whl