cloudos-cli 2.17.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (41) hide show
  1. cloudos_cli/__init__.py +11 -0
  2. cloudos_cli/__main__.py +1297 -0
  3. cloudos_cli/_version.py +1 -0
  4. cloudos_cli/clos.py +726 -0
  5. cloudos_cli/jobs/__init__.py +8 -0
  6. cloudos_cli/jobs/job.py +555 -0
  7. cloudos_cli/queue/__init__.py +8 -0
  8. cloudos_cli/queue/queue.py +139 -0
  9. cloudos_cli/utils/__init__.py +9 -0
  10. cloudos_cli/utils/errors.py +32 -0
  11. cloudos_cli/utils/requests.py +75 -0
  12. cloudos_cli-2.17.0.dist-info/LICENSE +674 -0
  13. cloudos_cli-2.17.0.dist-info/METADATA +1060 -0
  14. cloudos_cli-2.17.0.dist-info/RECORD +41 -0
  15. cloudos_cli-2.17.0.dist-info/WHEEL +5 -0
  16. cloudos_cli-2.17.0.dist-info/entry_points.txt +2 -0
  17. cloudos_cli-2.17.0.dist-info/top_level.txt +2 -0
  18. tests/__init__.py +0 -0
  19. tests/functions_for_pytest.py +7 -0
  20. tests/test_clos/__init__.py +0 -0
  21. tests/test_clos/test_create_cromwell_header.py +35 -0
  22. tests/test_clos/test_cromwell_switch.py +77 -0
  23. tests/test_clos/test_detect_workflow.py +47 -0
  24. tests/test_clos/test_get_cromwell_status.py +77 -0
  25. tests/test_clos/test_get_curated_workflow_list.py +72 -0
  26. tests/test_clos/test_get_job_list.py +79 -0
  27. tests/test_clos/test_get_job_status.py +75 -0
  28. tests/test_clos/test_get_project_list.py +74 -0
  29. tests/test_clos/test_get_user_info.py +68 -0
  30. tests/test_clos/test_get_workflow_list.py +87 -0
  31. tests/test_clos/test_is_module.py +48 -0
  32. tests/test_clos/test_process_job_list.py +74 -0
  33. tests/test_clos/test_process_project_list.py +36 -0
  34. tests/test_clos/test_process_workflow_list.py +36 -0
  35. tests/test_clos/test_wait_job_completion.py +40 -0
  36. tests/test_clos/test_workflow_import.py +77 -0
  37. tests/test_jobs/__init__.py +0 -0
  38. tests/test_jobs/test_convert_nextflow_to_json.py +104 -0
  39. tests/test_jobs/test_project_id.py +67 -0
  40. tests/test_jobs/test_send_job.py +84 -0
  41. tests/test_jobs/test_workflow_id.py +67 -0
"""
Functions and classes related to jobs.
"""

from .job import Job

# Export the class this package actually re-exports. The previous value
# ('job') named the submodule, not the imported class, so
# `from cloudos_cli.jobs import *` did not expose `Job`.
__all__ = ['Job']
@@ -0,0 +1,555 @@
1
+ """
2
+ This is the main class to create jobs.
3
+ """
4
+
5
+ from dataclasses import dataclass
6
+ from typing import Union
7
+ import json
8
+ from cloudos_cli.clos import Cloudos
9
+ from cloudos_cli.utils.errors import BadRequestException
10
+ from cloudos_cli.utils.requests import retry_requests_post
11
+
12
+
13
@dataclass
class Job(Cloudos):
    """Class to store and operate jobs.

    Parameters
    ----------
    cloudos_url : string
        The CloudOS service url.
    apikey : string
        Your CloudOS API key.
    cromwell_token : string
        Cromwell server token.
    workspace_id : string
        The specific Cloudos workspace id.
    project_name : string
        The name of a CloudOS project.
    workflow_name : string
        The name of a CloudOS workflow or pipeline.
    verify: [bool|string]
        Whether to use SSL verification or not. Alternatively, if
        a string is passed, it will be interpreted as the path to
        the SSL certificate file.
    mainfile : string
        The name of the mainFile used by the workflow. Required for WDL pipelines as different
        mainFiles could be loaded for a single pipeline.
    importsfile : string
        The name of the importsFile used by the workflow. Optional and only used for WDL pipelines
        as different importsFiles could be loaded for a single pipeline.
    repository_platform : string
        The name of the repository platform of the workflow.
    project_id : string
        The CloudOS project id for a given project name.
    workflow_id : string
        The CloudOS workflow id for a given workflow_name.
    """
    # NOTE(review): cloudos_url, apikey and cromwell_token are documented above
    # but not declared here — presumably they are dataclass fields inherited
    # from Cloudos; confirm against clos.py.
    workspace_id: str
    project_name: str
    workflow_name: str
    verify: Union[bool, str] = True
    mainfile: str = None
    importsfile: str = None
    repository_platform: str = 'github'
    # project_id and workflow_id are re-declared as properties below. After
    # the class body executes, the class attribute is the *property object*
    # itself, so the dataclass-generated __init__ passes that property object
    # to the setter whenever the caller omits the argument. The setters use
    # isinstance(v, property) as the "not supplied by user" sentinel and then
    # resolve the id via the CloudOS API.
    project_id: str = None
    workflow_id: str = None

    @property
    def project_id(self) -> str:
        # Backing attribute set by the setter (first assignment happens
        # inside the dataclass-generated __init__).
        return self._project_id

    @project_id.setter
    def project_id(self, v) -> None:
        if isinstance(v, property):
            # Fetch the value as not defined by user.
            self._project_id = self.fetch_cloudos_id(
                self.apikey,
                self.cloudos_url,
                'projects',
                self.workspace_id,
                self.project_name,
                verify=self.verify)
        else:
            # Let the user define the value.
            self._project_id = v

    @property
    def workflow_id(self) -> str:
        return self._workflow_id

    @workflow_id.setter
    def workflow_id(self, v) -> None:
        if isinstance(v, property):
            # Fetch the value as not defined by user. mainfile/importsfile
            # disambiguate WDL workflows sharing the same name.
            self._workflow_id = self.fetch_cloudos_id(
                self.apikey,
                self.cloudos_url,
                'workflows',
                self.workspace_id,
                self.workflow_name,
                self.mainfile,
                self.importsfile,
                self.repository_platform,
                self.verify)
        else:
            # Let the user define the value.
            self._workflow_id = v
+
99
+ def fetch_cloudos_id(self,
100
+ apikey,
101
+ cloudos_url,
102
+ resource,
103
+ workspace_id,
104
+ name,
105
+ mainfile=None,
106
+ importsfile=None,
107
+ repository_platform='github',
108
+ verify=True):
109
+ """Fetch the cloudos id for a given name.
110
+
111
+ Paramters
112
+ ---------
113
+ apikey : string
114
+ Your CloudOS API key
115
+ cloudos_url : string
116
+ The CloudOS service url.
117
+ resource : string
118
+ The resource you want to fetch from. E.g.: projects.
119
+ workspace_id : string
120
+ The specific Cloudos workspace id.
121
+ name : string
122
+ The name of a CloudOS resource element.
123
+ mainfile : string
124
+ The name of the mainFile used by the workflow. Only used when resource == 'workflows'.
125
+ Required for WDL pipelines as different mainFiles could be loaded for a single
126
+ pipeline.
127
+ importsfile : string
128
+ The name of the importsFile used by the workflow. Optional and only used for WDL pipelines
129
+ as different importsFiles could be loaded for a single pipeline.
130
+ repository_platform : string
131
+ The name of the repository platform of the workflow resides.
132
+ verify: [bool|string]
133
+ Whether to use SSL verification or not. Alternatively, if
134
+ a string is passed, it will be interpreted as the path to
135
+ the SSL certificate file.
136
+
137
+ Returns
138
+ -------
139
+ project_id : string
140
+ The CloudOS project id for a given project name.
141
+ """
142
+ allowed_resources = ['projects', 'workflows']
143
+ if resource not in allowed_resources:
144
+ raise ValueError('Your specified resource is not supported. ' +
145
+ f'Use one of the following: {allowed_resources}')
146
+ if resource == 'workflows':
147
+ content = self.get_workflow_list(workspace_id, verify=verify)
148
+ for element in content:
149
+ if (element["name"] == name and
150
+ element["repository"]["platform"] == repository_platform and
151
+ not element["archived"]["status"]):
152
+ if mainfile is None:
153
+ return element["_id"]
154
+ elif element["mainFile"] == mainfile:
155
+ if importsfile is None and "importsFile" not in element.keys():
156
+ return element["_id"]
157
+ elif "importsFile" in element.keys() and element["importsFile"] == importsfile:
158
+ return element["_id"]
159
+ elif resource == 'projects':
160
+ r = self.get_project_list(workspace_id, verify=verify)
161
+ content = json.loads(r.content)
162
+ # New API projects endpoint spec
163
+ if type(content) is dict:
164
+ for element in content["projects"]:
165
+ if element["name"] == name:
166
+ return element["_id"]
167
+ # Old API projects endpoint spec added for backwards compatibility
168
+ elif type(content) is list:
169
+ for element in content:
170
+ if element["name"] == name:
171
+ return element["_id"]
172
+ if mainfile is not None:
173
+ raise ValueError(f'[ERROR] A workflow named \'{name}\' with a mainFile \'{mainfile}\'' +
174
+ f' and an importsFile \'{importsfile}\' was not found')
175
+ else:
176
+ raise ValueError(f'[ERROR] No {name} element in {resource} was found')
177
+
178
    def convert_nextflow_to_json(self,
                                 job_config,
                                 parameter,
                                 example_parameters,
                                 git_commit,
                                 git_tag,
                                 project_id,
                                 workflow_id,
                                 job_name,
                                 resumable,
                                 save_logs,
                                 batch,
                                 job_queue_id,
                                 nextflow_profile,
                                 nextflow_version,
                                 instance_type,
                                 instance_disk,
                                 storage_mode,
                                 lustre_size,
                                 execution_platform,
                                 hpc_id,
                                 workflow_type,
                                 cromwell_id,
                                 cost_limit,
                                 use_mountpoints,
                                 docker_login):
        """Converts a nextflow.config file into a json formatted dict.

        Parameters
        ----------
        job_config : string
            Path to a nextflow.config file with parameters scope.
        parameter : tuple
            Tuple of strings indicating the parameters to pass to the pipeline call.
            They are in the following form: ('param1=param1val', 'param2=param2val', ...)
        example_parameters : list
            A list of dicts, with the parameters required for the API request in JSON format.
            It is typically used to run curated pipelines using the already available
            example parameters.
        git_commit : string
            The exact commit of the pipeline to use. Equivalent to -r
            option in Nextflow. If not specified, the last commit of the
            default branch will be used.
        git_tag : string
            The tag of the pipeline to use. If not specified, the last
            commit of the default branch will be used.
        project_id : string
            The CloudOS project id for a given project name.
        workflow_id : string
            The CloudOS workflow id for a given workflow_name.
        job_name : string.
            The name to assign to the job.
        resumable: bool
            Whether to create a resumable job or not.
        save_logs : bool
            Whether to save job logs or not.
        batch: bool
            Whether to create a batch job or an ignite one.
        job_queue_id : string
            Job queue Id to use in the batch job.
        nextflow_profile: string
            A comma separated string with the profiles to be used.
        nextflow_version: string
            Nextflow version to use when executing the workflow in CloudOS.
        instance_type : string
            Name of the instance type to be used for the job master node, for example for AWS EC2 c5.xlarge
        instance_disk : int
            The disk space of the instance, in GB.
        storage_mode : string
            Either 'lustre' or 'regular'. Indicates if the user wants to select regular
            or lustre storage.
        lustre_size : int
            The lustre storage to be used when --storage-mode=lustre, in GB. It should be 1200 or
            a multiple of it.
        execution_platform : string ['aws'|'azure'|'hpc']
            The execution platform implemented in your CloudOS.
        hpc_id : string
            The ID of your HPC in CloudOS.
        workflow_type : str
            The type of workflow to run. Either 'nextflow' or 'wdl'.
        cromwell_id : str
            Cromwell server ID.
        cost_limit : float
            Job cost limit. -1 means no cost limit.
        use_mountpoints : bool
            Whether to use or not AWS S3 mountpoint for quicker file staging.
        docker_login : bool
            Whether to use private docker images, provided the users have linked their docker.io accounts.

        Returns
        -------
        params : dict
            A JSON formatted dict.

        Raises
        ------
        ValueError
            If no parameter source at all is given, the config file has
            malformed entries, --git-tag and --git-commit are both set, or
            the storage options are invalid.
        """
        workflow_params = []
        if workflow_type == 'wdl':
            # This is required as non-resumable jobs fails always using WDL workflows.
            resumable = True
        # At least one source of pipeline parameters must be provided.
        if (
            nextflow_profile is None and
            job_config is None and
            len(parameter) == 0 and
            len(example_parameters) == 0
        ):
            raise ValueError('No --job-config, --nextflow_profile, --parameter or ' +
                             '--example_parameters were specified,' +
                             ' please use at least one of these options.')
        # WDL has no profiles, so a profile alone is not enough for WDL runs.
        if workflow_type == 'wdl' and job_config is None and len(parameter) == 0:
            raise ValueError('No --job-config or --parameter were provided. At least one of ' +
                             'these are required for WDL workflows.')
        if job_config is not None:
            # Line-oriented scan of the config: `reading` is True while we are
            # inside a block whose opening line mentions 'params'; a bare '}'
            # line closes it.
            with open(job_config, 'r') as p:
                reading = False
                for p_l in p:
                    if 'params' in p_l.lower():
                        reading = True
                    else:
                        if reading:
                            if workflow_type == 'wdl':
                                # Keep quotes for WDL: values are raw JSON-ish text.
                                p_l_strip = p_l.strip().replace(
                                    ' ', '')
                            else:
                                # For Nextflow, also drop surrounding quotes.
                                p_l_strip = p_l.strip().replace(
                                    ' ', '').replace('\"', '').replace('\'', '')
                            if len(p_l_strip) == 0:
                                continue
                            elif p_l_strip[0] == '/' or p_l_strip[0] == '#':
                                # Skip comment lines ('//' or '#').
                                continue
                            elif p_l_strip == '}':
                                reading = False
                            else:
                                # 'name=value'; values may themselves contain '='.
                                p_list = p_l_strip.split('=')
                                p_name = p_list[0]
                                p_value = '='.join(p_list[1:])
                                if len(p_list) < 2:
                                    raise ValueError('Please, specify your ' +
                                                     'parameters in ' +
                                                     f'{job_config} using ' +
                                                     'the \'=\' as spacer. ' +
                                                     'E.g: name = my_name')
                                elif workflow_type == 'wdl':
                                    # WDL parameters carry no CLI prefix.
                                    param = {"prefix": "",
                                             "name": p_name,
                                             "parameterKind": "textValue",
                                             "textValue": p_value}
                                    workflow_params.append(param)
                                else:
                                    # Nextflow parameters are passed as '--name value'.
                                    param = {"prefix": "--",
                                             "name": p_name,
                                             "parameterKind": "textValue",
                                             "textValue": p_value}
                                    workflow_params.append(param)
            if len(workflow_params) == 0:
                raise ValueError(f'The {job_config} file did not contain any ' +
                                 'valid parameter')
        if len(parameter) > 0:
            for p in parameter:
                p_split = p.split('=')
                if len(p_split) < 2:
                    raise ValueError('Please, specify -p / --parameter using a single \'=\' ' +
                                     'as spacer. E.g: input=value')
                p_name = p_split[0]
                p_value = '='.join(p_split[1:])
                if workflow_type == 'wdl':
                    param = {"prefix": "",
                             "name": p_name,
                             "parameterKind": "textValue",
                             "textValue": p_value}
                    workflow_params.append(param)
                else:
                    param = {"prefix": "--",
                             "name": p_name,
                             "parameterKind": "textValue",
                             "textValue": p_value}
                    workflow_params.append(param)
            if len(workflow_params) == 0:
                raise ValueError(f'The provided parameters are not valid: {parameter}')
        if len(example_parameters) > 0:
            # Curated-pipeline example parameters are already API-shaped dicts.
            for example_param in example_parameters:
                workflow_params.append(example_param)
        if git_tag is not None and git_commit is not None:
            raise ValueError('Please, specify none or only one of --git-tag' +
                             ' or --git-commit options but not both.')
        if git_commit is not None:
            revision_block = {
                "commit": git_commit,
                "isLatest": False
            }
        elif git_tag is not None:
            revision_block = {
                "tag": git_tag,
                "isLatest": False
            }
        else:
            # Empty string presumably signals "use latest default-branch
            # revision" to the API — TODO confirm against the CloudOS API spec.
            revision_block = ""
        if storage_mode == "lustre":
            print('\n[WARNING] Lustre storage has been selected. Please, be sure that this kind of ' +
                  'storage is available in your CloudOS workspace.\n')
            # Lustre filesystems are provisioned in 1200 GB increments.
            if lustre_size % 1200:
                raise ValueError('Please, specify a lustre storage size of 1200 or a multiple of it. ' +
                                 f'{lustre_size} is not a valid number.')
        if storage_mode not in ['lustre', 'regular']:
            raise ValueError('Please, use either \'lustre\' or \'regular\' for --storage-mode ' +
                             f'{storage_mode} is not allowed')
        # Assemble the JSON payload expected by POST /api/v1/jobs.
        params = {
            "parameters": workflow_params,
            "project": project_id,
            "workflow": workflow_id,
            "name": job_name,
            "nextflowVersion": nextflow_version,
            "resumable": resumable,
            "saveProcessLogs": save_logs,
            "batch": {
                "dockerLogin": docker_login,
                "enabled": batch,
                "jobQueue": job_queue_id
            },
            "cromwellCloudResources": cromwell_id,
            "executionPlatform": execution_platform,
            "hpc": hpc_id,
            "storageSizeInGb": instance_disk,
            "execution": {
                "computeCostLimit": cost_limit,
                "optim": "test"
            },
            "lusterFsxStorageSizeInGb": lustre_size,
            "storageMode": storage_mode,
            "revision": revision_block,
            "profile": nextflow_profile,
            "instanceType": instance_type,
            "usesFusionFileSystem": use_mountpoints
        }
        if execution_platform != 'hpc':
            # HPC jobs have no cloud master instance; all others request an
            # on-demand (non-spot) master node.
            params['masterInstance'] = {
                "requestedInstance": {
                    "type": instance_type,
                    "asSpot": False
                }
            }
        return params
418
+
419
+ def send_job(self,
420
+ job_config=None,
421
+ parameter=(),
422
+ example_parameters=[],
423
+ git_commit=None,
424
+ git_tag=None,
425
+ job_name='new_job',
426
+ resumable=False,
427
+ save_logs=True,
428
+ batch=True,
429
+ job_queue_id=None,
430
+ nextflow_profile=None,
431
+ nextflow_version='22.10.8',
432
+ instance_type='c5.xlarge',
433
+ instance_disk=500,
434
+ storage_mode='regular',
435
+ lustre_size=1200,
436
+ execution_platform='aws',
437
+ hpc_id=None,
438
+ workflow_type='nextflow',
439
+ cromwell_id=None,
440
+ cost_limit=30.0,
441
+ use_mountpoints=False,
442
+ docker_login=False,
443
+ verify=True):
444
+ """Send a job to CloudOS.
445
+
446
+ Parameters
447
+ ----------
448
+ job_config : string
449
+ Path to a nextflow.config file with parameters scope.
450
+ parameter : tuple
451
+ Tuple of strings indicating the parameters to pass to the pipeline call.
452
+ They are in the following form: ('param1=param1val', 'param2=param2val', ...)
453
+ example_parameters : list
454
+ A list of dicts, with the parameters required for the API request in JSON format.
455
+ It is typically used to run curated pipelines using the already available
456
+ example parameters.
457
+ git_commit : string
458
+ The exact commit of the pipeline to use. Equivalent to -r
459
+ option in Nextflow. If not specified, the last commit of the
460
+ default branch will be used.
461
+ git_tag : string
462
+ The tag of the pipeline to use. If not specified, the last
463
+ commit of the default branch will be used.
464
+ job_name : string
465
+ The name to assign to the job.
466
+ resumable : bool
467
+ Whether to create a resumable job or not.
468
+ save_logs : bool
469
+ Whether to save job logs or not.
470
+ batch: bool
471
+ Whether to create a batch job or an ignite one.
472
+ job_queue_id : string
473
+ Job queue Id to use in the batch job.
474
+ nextflow_profile: string
475
+ A comma separated string with the profiles to be used.
476
+ nextflow_version: string
477
+ Nextflow version to use when executing the workflow in CloudOS.
478
+ instance_type : string
479
+ Name of the instance type to be used for the job master node, for example for AWS EC2 c5.xlarge
480
+ instance_disk : int
481
+ The disk space of the instance, in GB.
482
+ storage_mode : string
483
+ Either 'lustre' or 'regular'. Indicates if the user wants to select regular
484
+ or lustre storage.
485
+ lustre_size : int
486
+ The lustre storage to be used when --storage-mode=lustre, in GB. It should be 1200 or
487
+ a multiple of it.
488
+ execution_platform : string ['aws'|'azure'|'hpc']
489
+ The execution platform implemented in your CloudOS.
490
+ hpc_id : string
491
+ The ID of your HPC in CloudOS.
492
+ workflow_type : str
493
+ The type of workflow to run. Either 'nextflow' or 'wdl'.
494
+ cromwell_id : str
495
+ Cromwell server ID.
496
+ cost_limit : float
497
+ Job cost limit. -1 means no cost limit.
498
+ use_mountpoints : bool
499
+ Whether to use or not AWS S3 mountpoint for quicker file staging.
500
+ docker_login : bool
501
+ Whether to use private docker images, provided the users have linked their docker.io accounts.
502
+ verify: [bool|string]
503
+ Whether to use SSL verification or not. Alternatively, if
504
+ a string is passed, it will be interpreted as the path to
505
+ the SSL certificate file.
506
+
507
+ Returns
508
+ -------
509
+ j_id : string
510
+ The CloudOS job id of the job just launched.
511
+ """
512
+ apikey = self.apikey
513
+ cloudos_url = self.cloudos_url
514
+ workspace_id = self.workspace_id
515
+ workflow_id = self.workflow_id
516
+ project_id = self.project_id
517
+ # Prepare api request for CloudOS to run a job
518
+ headers = {
519
+ "Content-type": "application/json",
520
+ "apikey": apikey
521
+ }
522
+ params = self.convert_nextflow_to_json(job_config,
523
+ parameter,
524
+ example_parameters,
525
+ git_commit,
526
+ git_tag,
527
+ project_id,
528
+ workflow_id,
529
+ job_name,
530
+ resumable,
531
+ save_logs,
532
+ batch,
533
+ job_queue_id,
534
+ nextflow_profile,
535
+ nextflow_version,
536
+ instance_type,
537
+ instance_disk,
538
+ storage_mode,
539
+ lustre_size,
540
+ execution_platform,
541
+ hpc_id,
542
+ workflow_type,
543
+ cromwell_id,
544
+ cost_limit,
545
+ use_mountpoints,
546
+ docker_login)
547
+ r = retry_requests_post("{}/api/v1/jobs?teamId={}".format(cloudos_url,
548
+ workspace_id),
549
+ data=json.dumps(params), headers=headers, verify=verify)
550
+ if r.status_code >= 400:
551
+ raise BadRequestException(r)
552
+ j_id = json.loads(r.content)["_id"]
553
+ print('\tJob successfully launched to CloudOS, please check the ' +
554
+ f'following link: {cloudos_url}/app/jobs/{j_id}')
555
+ return j_id
@@ -0,0 +1,8 @@
"""
Functions and classes related to job queues.
"""

from .queue import Queue

# Export the class this package actually re-exports. The previous value
# ('queue') named the submodule, not the imported class, so
# `from cloudos_cli.queue import *` did not expose `Queue`.
__all__ = ['Queue']