PyPI - pybiolib - Versions diffs - 0.2.951__py3-none-any.whl → 1.2.1890__py3-none-any.whl - Mend

pybiolib 0.2.951__py3-none-any.whl → 1.2.1890__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (262) hide show

biolib/__init__.py +357 -11
biolib/_data_record/data_record.py +380 -0
biolib/_index/__init__.py +0 -0
biolib/_index/index.py +55 -0
biolib/_index/query_result.py +103 -0
biolib/_internal/__init__.py +0 -0
biolib/_internal/add_copilot_prompts.py +58 -0
biolib/_internal/add_gui_files.py +81 -0
biolib/_internal/data_record/__init__.py +1 -0
biolib/_internal/data_record/data_record.py +85 -0
biolib/_internal/data_record/push_data.py +116 -0
biolib/_internal/data_record/remote_storage_endpoint.py +43 -0
biolib/_internal/errors.py +5 -0
biolib/_internal/file_utils.py +125 -0
biolib/_internal/fuse_mount/__init__.py +1 -0
biolib/_internal/fuse_mount/experiment_fuse_mount.py +209 -0
biolib/_internal/http_client.py +159 -0
biolib/_internal/lfs/__init__.py +1 -0
biolib/_internal/lfs/cache.py +51 -0
biolib/_internal/libs/__init__.py +1 -0
biolib/_internal/libs/fusepy/__init__.py +1257 -0
biolib/_internal/push_application.py +488 -0
biolib/_internal/runtime.py +22 -0
biolib/_internal/string_utils.py +13 -0
biolib/_internal/templates/__init__.py +1 -0
biolib/_internal/templates/copilot_template/.github/instructions/general-app-knowledge.instructions.md +10 -0
biolib/_internal/templates/copilot_template/.github/instructions/style-general.instructions.md +20 -0
biolib/_internal/templates/copilot_template/.github/instructions/style-python.instructions.md +16 -0
biolib/_internal/templates/copilot_template/.github/instructions/style-react-ts.instructions.md +47 -0
biolib/_internal/templates/copilot_template/.github/prompts/biolib_app_inputs.prompt.md +11 -0
biolib/_internal/templates/copilot_template/.github/prompts/biolib_onboard_repo.prompt.md +19 -0
biolib/_internal/templates/copilot_template/.github/prompts/biolib_run_apps.prompt.md +12 -0
biolib/_internal/templates/dashboard_template/.biolib/config.yml +5 -0
biolib/_internal/templates/github_workflow_template/.github/workflows/biolib.yml +21 -0
biolib/_internal/templates/gitignore_template/.gitignore +10 -0
biolib/_internal/templates/gui_template/.yarnrc.yml +1 -0
biolib/_internal/templates/gui_template/App.tsx +53 -0
biolib/_internal/templates/gui_template/Dockerfile +27 -0
biolib/_internal/templates/gui_template/biolib-sdk.ts +82 -0
biolib/_internal/templates/gui_template/dev-data/output.json +7 -0
biolib/_internal/templates/gui_template/index.css +5 -0
biolib/_internal/templates/gui_template/index.html +13 -0
biolib/_internal/templates/gui_template/index.tsx +10 -0
biolib/_internal/templates/gui_template/package.json +27 -0
biolib/_internal/templates/gui_template/tsconfig.json +24 -0
biolib/_internal/templates/gui_template/vite-plugin-dev-data.ts +50 -0
biolib/_internal/templates/gui_template/vite.config.mts +10 -0
biolib/_internal/templates/init_template/.biolib/config.yml +19 -0
biolib/_internal/templates/init_template/Dockerfile +14 -0
biolib/_internal/templates/init_template/requirements.txt +1 -0
biolib/_internal/templates/init_template/run.py +12 -0
biolib/_internal/templates/init_template/run.sh +4 -0
biolib/_internal/templates/templates.py +25 -0
biolib/_internal/tree_utils.py +106 -0
biolib/_internal/utils/__init__.py +65 -0
biolib/_internal/utils/auth.py +46 -0
biolib/_internal/utils/job_url.py +33 -0
biolib/_internal/utils/multinode.py +263 -0
biolib/_runtime/runtime.py +157 -0
biolib/_session/session.py +44 -0
biolib/_shared/__init__.py +0 -0
biolib/_shared/types/__init__.py +74 -0
biolib/_shared/types/account.py +12 -0
biolib/_shared/types/account_member.py +8 -0
biolib/_shared/types/app.py +9 -0
biolib/_shared/types/data_record.py +40 -0
biolib/_shared/types/experiment.py +32 -0
biolib/_shared/types/file_node.py +17 -0
biolib/_shared/types/push.py +6 -0
biolib/_shared/types/resource.py +37 -0
biolib/_shared/types/resource_deploy_key.py +11 -0
biolib/_shared/types/resource_permission.py +14 -0
biolib/_shared/types/resource_version.py +19 -0
biolib/_shared/types/result.py +14 -0
biolib/_shared/types/typing.py +10 -0
biolib/_shared/types/user.py +19 -0
biolib/_shared/utils/__init__.py +7 -0
biolib/_shared/utils/resource_uri.py +75 -0
biolib/api/__init__.py +6 -0
biolib/api/client.py +168 -0
biolib/app/app.py +252 -49
biolib/app/search_apps.py +45 -0
biolib/biolib_api_client/api_client.py +126 -31
biolib/biolib_api_client/app_types.py +24 -4
biolib/biolib_api_client/auth.py +31 -8
biolib/biolib_api_client/biolib_app_api.py +147 -52
biolib/biolib_api_client/biolib_job_api.py +161 -141
biolib/biolib_api_client/job_types.py +21 -5
biolib/biolib_api_client/lfs_types.py +7 -23
biolib/biolib_api_client/user_state.py +56 -0
biolib/biolib_binary_format/__init__.py +1 -4
biolib/biolib_binary_format/file_in_container.py +105 -0
biolib/biolib_binary_format/module_input.py +24 -7
biolib/biolib_binary_format/module_output_v2.py +149 -0
biolib/biolib_binary_format/remote_endpoints.py +34 -0
biolib/biolib_binary_format/remote_stream_seeker.py +59 -0
biolib/biolib_binary_format/saved_job.py +3 -2
biolib/biolib_binary_format/{attestation_document.py → stdout_and_stderr.py} +8 -8
biolib/biolib_binary_format/system_status_update.py +3 -2
biolib/biolib_binary_format/utils.py +175 -0
biolib/biolib_docker_client/__init__.py +11 -2
biolib/biolib_errors.py +36 -0
biolib/biolib_logging.py +27 -10
biolib/cli/__init__.py +38 -0
biolib/cli/auth.py +46 -0
biolib/cli/data_record.py +164 -0
biolib/cli/index.py +32 -0
biolib/cli/init.py +421 -0
biolib/cli/lfs.py +101 -0
biolib/cli/push.py +50 -0
biolib/cli/run.py +63 -0
biolib/cli/runtime.py +14 -0
biolib/cli/sdk.py +16 -0
biolib/cli/start.py +56 -0
biolib/compute_node/cloud_utils/cloud_utils.py +110 -161
biolib/compute_node/job_worker/cache_state.py +66 -88
biolib/compute_node/job_worker/cache_types.py +1 -6
biolib/compute_node/job_worker/docker_image_cache.py +112 -37
biolib/compute_node/job_worker/executors/__init__.py +0 -3
biolib/compute_node/job_worker/executors/docker_executor.py +532 -199
biolib/compute_node/job_worker/executors/docker_types.py +9 -1
biolib/compute_node/job_worker/executors/types.py +19 -9
biolib/compute_node/job_worker/job_legacy_input_wait_timeout_thread.py +30 -0
biolib/compute_node/job_worker/job_max_runtime_timer_thread.py +3 -5
biolib/compute_node/job_worker/job_storage.py +108 -0
biolib/compute_node/job_worker/job_worker.py +397 -212
biolib/compute_node/job_worker/large_file_system.py +87 -38
biolib/compute_node/job_worker/network_alloc.py +99 -0
biolib/compute_node/job_worker/network_buffer.py +240 -0
biolib/compute_node/job_worker/utilization_reporter_thread.py +197 -0
biolib/compute_node/job_worker/utils.py +9 -24
biolib/compute_node/remote_host_proxy.py +400 -98
biolib/compute_node/utils.py +31 -9
biolib/compute_node/webserver/compute_node_results_proxy.py +189 -0
biolib/compute_node/webserver/proxy_utils.py +28 -0
biolib/compute_node/webserver/webserver.py +130 -44
biolib/compute_node/webserver/webserver_types.py +2 -6
biolib/compute_node/webserver/webserver_utils.py +77 -12
biolib/compute_node/webserver/worker_thread.py +183 -42
biolib/experiments/__init__.py +0 -0
biolib/experiments/experiment.py +356 -0
biolib/jobs/__init__.py +1 -0
biolib/jobs/job.py +741 -0
biolib/jobs/job_result.py +185 -0
biolib/jobs/types.py +50 -0
biolib/py.typed +0 -0
biolib/runtime/__init__.py +14 -0
biolib/sdk/__init__.py +91 -0
biolib/tables.py +34 -0
biolib/typing_utils.py +2 -7
biolib/user/__init__.py +1 -0
biolib/user/sign_in.py +54 -0
biolib/utils/__init__.py +162 -0
biolib/utils/cache_state.py +94 -0
biolib/utils/multipart_uploader.py +194 -0
biolib/utils/seq_util.py +150 -0
biolib/utils/zip/remote_zip.py +640 -0
pybiolib-1.2.1890.dist-info/METADATA +41 -0
pybiolib-1.2.1890.dist-info/RECORD +177 -0
{pybiolib-0.2.951.dist-info → pybiolib-1.2.1890.dist-info}/WHEEL +1 -1
pybiolib-1.2.1890.dist-info/entry_points.txt +2 -0
README.md +0 -17
biolib/app/app_result.py +0 -68
biolib/app/utils.py +0 -62
biolib/biolib-js/0-biolib.worker.js +0 -1
biolib/biolib-js/1-biolib.worker.js +0 -1
biolib/biolib-js/2-biolib.worker.js +0 -1
biolib/biolib-js/3-biolib.worker.js +0 -1
biolib/biolib-js/4-biolib.worker.js +0 -1
biolib/biolib-js/5-biolib.worker.js +0 -1
biolib/biolib-js/6-biolib.worker.js +0 -1
biolib/biolib-js/index.html +0 -10
biolib/biolib-js/main-biolib.js +0 -1
biolib/biolib_api_client/biolib_account_api.py +0 -21
biolib/biolib_api_client/biolib_large_file_system_api.py +0 -108
biolib/biolib_binary_format/aes_encrypted_package.py +0 -42
biolib/biolib_binary_format/module_output.py +0 -58
biolib/biolib_binary_format/rsa_encrypted_aes_package.py +0 -57
biolib/biolib_push.py +0 -114
biolib/cli.py +0 -203
biolib/cli_utils.py +0 -273
biolib/compute_node/cloud_utils/enclave_parent_types.py +0 -7
biolib/compute_node/enclave/__init__.py +0 -2
biolib/compute_node/enclave/enclave_remote_hosts.py +0 -53
biolib/compute_node/enclave/nitro_secure_module_utils.py +0 -64
biolib/compute_node/job_worker/executors/base_executor.py +0 -18
biolib/compute_node/job_worker/executors/pyppeteer_executor.py +0 -173
biolib/compute_node/job_worker/executors/remote/__init__.py +0 -1
biolib/compute_node/job_worker/executors/remote/nitro_enclave_utils.py +0 -81
biolib/compute_node/job_worker/executors/remote/remote_executor.py +0 -51
biolib/lfs.py +0 -196
biolib/pyppeteer/.circleci/config.yml +0 -100
biolib/pyppeteer/.coveragerc +0 -3
biolib/pyppeteer/.gitignore +0 -89
biolib/pyppeteer/.pre-commit-config.yaml +0 -28
biolib/pyppeteer/CHANGES.md +0 -253
biolib/pyppeteer/CONTRIBUTING.md +0 -26
biolib/pyppeteer/LICENSE +0 -12
biolib/pyppeteer/README.md +0 -137
biolib/pyppeteer/docs/Makefile +0 -177
biolib/pyppeteer/docs/_static/custom.css +0 -28
biolib/pyppeteer/docs/_templates/layout.html +0 -10
biolib/pyppeteer/docs/changes.md +0 -1
biolib/pyppeteer/docs/conf.py +0 -299
biolib/pyppeteer/docs/index.md +0 -21
biolib/pyppeteer/docs/make.bat +0 -242
biolib/pyppeteer/docs/reference.md +0 -211
biolib/pyppeteer/docs/server.py +0 -60
biolib/pyppeteer/poetry.lock +0 -1699
biolib/pyppeteer/pyppeteer/__init__.py +0 -135
biolib/pyppeteer/pyppeteer/accessibility.py +0 -286
biolib/pyppeteer/pyppeteer/browser.py +0 -401
biolib/pyppeteer/pyppeteer/browser_fetcher.py +0 -194
biolib/pyppeteer/pyppeteer/command.py +0 -22
biolib/pyppeteer/pyppeteer/connection/__init__.py +0 -242
biolib/pyppeteer/pyppeteer/connection/cdpsession.py +0 -101
biolib/pyppeteer/pyppeteer/coverage.py +0 -346
biolib/pyppeteer/pyppeteer/device_descriptors.py +0 -787
biolib/pyppeteer/pyppeteer/dialog.py +0 -79
biolib/pyppeteer/pyppeteer/domworld.py +0 -597
biolib/pyppeteer/pyppeteer/emulation_manager.py +0 -53
biolib/pyppeteer/pyppeteer/errors.py +0 -48
biolib/pyppeteer/pyppeteer/events.py +0 -63
biolib/pyppeteer/pyppeteer/execution_context.py +0 -156
biolib/pyppeteer/pyppeteer/frame/__init__.py +0 -299
biolib/pyppeteer/pyppeteer/frame/frame_manager.py +0 -306
biolib/pyppeteer/pyppeteer/helpers.py +0 -245
biolib/pyppeteer/pyppeteer/input.py +0 -371
biolib/pyppeteer/pyppeteer/jshandle.py +0 -598
biolib/pyppeteer/pyppeteer/launcher.py +0 -683
biolib/pyppeteer/pyppeteer/lifecycle_watcher.py +0 -169
biolib/pyppeteer/pyppeteer/models/__init__.py +0 -103
biolib/pyppeteer/pyppeteer/models/_protocol.py +0 -12460
biolib/pyppeteer/pyppeteer/multimap.py +0 -82
biolib/pyppeteer/pyppeteer/network_manager.py +0 -678
biolib/pyppeteer/pyppeteer/options.py +0 -8
biolib/pyppeteer/pyppeteer/page.py +0 -1728
biolib/pyppeteer/pyppeteer/pipe_transport.py +0 -59
biolib/pyppeteer/pyppeteer/target.py +0 -147
biolib/pyppeteer/pyppeteer/task_queue.py +0 -24
biolib/pyppeteer/pyppeteer/timeout_settings.py +0 -36
biolib/pyppeteer/pyppeteer/tracing.py +0 -93
biolib/pyppeteer/pyppeteer/us_keyboard_layout.py +0 -305
biolib/pyppeteer/pyppeteer/util.py +0 -18
biolib/pyppeteer/pyppeteer/websocket_transport.py +0 -47
biolib/pyppeteer/pyppeteer/worker.py +0 -101
biolib/pyppeteer/pyproject.toml +0 -97
biolib/pyppeteer/spell.txt +0 -137
biolib/pyppeteer/tox.ini +0 -72
biolib/pyppeteer/utils/generate_protocol_types.py +0 -603
biolib/start_cli.py +0 -7
biolib/utils.py +0 -47
biolib/validators/validate_app_version.py +0 -183
biolib/validators/validate_argument.py +0 -134
biolib/validators/validate_module.py +0 -323
biolib/validators/validate_zip_file.py +0 -40
biolib/validators/validator_utils.py +0 -103
pybiolib-0.2.951.dist-info/LICENSE +0 -21
pybiolib-0.2.951.dist-info/METADATA +0 -61
pybiolib-0.2.951.dist-info/RECORD +0 -153
pybiolib-0.2.951.dist-info/entry_points.txt +0 -3
/LICENSE → /pybiolib-1.2.1890.dist-info/licenses/LICENSE +0 -0

biolib/_internal/utils/job_url.py ADDED Viewed

@@ -0,0 +1,33 @@
+import re
+from urllib.parse import urlparse
+import biolib.utils
+from biolib.typing_utils import Optional, Tuple
+def parse_result_id_or_url(result_id_or_url: str, default_token: Optional[str] = None) -> Tuple[str, Optional[str]]:
+    """Resolve a result reference to a ``(uuid, token)`` pair.
+
+    A value without any ``/`` is treated as a bare result ID and is returned (stripped)
+    together with ``default_token``. Anything else is treated as a result URL;
+    ``https://`` is prepended when no ``http://`` or ``https://`` scheme is given.
+
+    Args:
+        result_id_or_url: Result ID, or a URL of the form ``<base_url>/results/<UUID>/?token=<token>``.
+        default_token: Token returned when the input carries no non-empty ``token`` query parameter.
+
+    Returns:
+        Tuple of the result UUID and the token to use (the token may be ``None``).
+
+    Raises:
+        ValueError: If scheme or host differ from ``biolib.utils.BIOLIB_BASE_URL`` (when it is set),
+            or if the URL path contains no ``/result/<UUID>`` or ``/results/<UUID>`` segment.
+    """
+    result_id_or_url = result_id_or_url.strip()
+    if '/' not in result_id_or_url:
+        return (result_id_or_url, default_token)
+    if not result_id_or_url.startswith(('http://', 'https://')):
+        result_id_or_url = 'https://' + result_id_or_url
+    parsed_url = urlparse(result_id_or_url)
+    if biolib.utils.BIOLIB_BASE_URL:
+        expected_base = urlparse(biolib.utils.BIOLIB_BASE_URL)
+        if parsed_url.scheme != expected_base.scheme or parsed_url.netloc != expected_base.netloc:
+            raise ValueError(f'URL must start with {biolib.utils.BIOLIB_BASE_URL}, got: {result_id_or_url}')
+    # Search the path only, so text in the query string or fragment cannot be mistaken for the UUID
+    match = re.search(r'/results?/(?P<uuid>[a-f0-9-]+)', parsed_url.path, re.IGNORECASE)
+    if not match:
+        raise ValueError(f'URL must be in format <base_url>/results/<UUID>/?token=<token>, got: {result_id_or_url}')
+    # Take the token from the parsed query so it is found even when it is not the first parameter.
+    # The raw value is returned without percent-decoding, as before.
+    token = default_token
+    for query_part in parsed_url.query.split('&'):
+        key, _, value = query_part.partition('=')
+        if key.lower() == 'token' and value:
+            token = value
+            break
+    return (match.group('uuid'), token)

biolib/_internal/utils/multinode.py ADDED Viewed

@@ -0,0 +1,263 @@
+import glob
+import os
+import re
+import shutil
+import subprocess
+import tempfile
+import biolib
+from biolib.utils import SeqUtil
+def natsorted(lst):
+    """Return a new list sorted so that embedded digit runs compare by numeric value."""
+    def _chunk_key(chunk):
+        # Digit runs are compared as integers, all other text case-insensitively
+        if chunk.isdigit():
+            return int(chunk)
+        return chunk.lower()
+    def _natural_key(item):
+        # The capturing group keeps the digit runs in the split result
+        return [_chunk_key(chunk) for chunk in re.split('([0-9]+)', item)]
+    ordered = list(lst)
+    ordered.sort(key=_natural_key)
+    return ordered
+def fasta_above_threshold(fasta_file, work_threshold, work_per_residue=1, verbose=False):
+    """Return True if the total residue work of a FASTA file reaches ``work_threshold``.
+
+    Work is accumulated record by record as ``len(record.sequence) * work_per_residue``.
+    The scan stops at the first record where the running total is >= ``work_threshold``.
+
+    Args:
+        fasta_file: FASTA input handed to ``SeqUtil.parse_fasta``.
+        work_threshold: Work total at which the file counts as above threshold.
+        work_per_residue: Work units charged per residue.
+        verbose: If truthy, print a short summary of the outcome.
+
+    Returns:
+        True if the threshold was reached, otherwise False.
+    """
+    # Materialise the records: the verbose summary calls len(), which an iterator or
+    # generator returned by the parser would not support
+    records = list(SeqUtil.parse_fasta(fasta_file))
+    total_work_units = 0
+    for i, record in enumerate(records):
+        total_work_units += len(record.sequence) * work_per_residue
+        if total_work_units >= work_threshold:
+            if verbose:
+                print(f'FASTA above threshold (stopped at {total_work_units}) >= {work_threshold}')
+                print(f'From {i+1}/{len(records)} sequences in {fasta_file}')
+            return True
+    if verbose:
+        print(f'FASTA below threshold ({total_work_units}) < {work_threshold}')
+        print(f'From {len(records)} sequences in {fasta_file}')
+    return False
+def run_locally(command_list, args):
+    """Run the script as a local subprocess (no multi-node processing).
+
+    Every attribute of ``args`` whose name does not start with ``multinode`` is
+    turned into a ``--name value`` pair and appended to ``command_list``.
+
+    Args:
+        command_list: Leading command tokens, e.g. ``["python3", "predict.py"]``.
+        args: Parsed argument namespace; must have a numeric ``verbose`` attribute.
+
+    The subprocess output is captured. Its stdout is printed on exit code 0,
+    otherwise its stderr is printed prefixed with ``Error:``. Nothing is returned
+    and a failing subprocess does not raise.
+    """
+    # Build a filtered copy: vars(args) is the namespace's own __dict__, so deleting
+    # keys from it directly would strip the multinode attributes from the caller's args
+    new_args = {key: value for key, value in vars(args).items() if not str(key).startswith('multinode')}
+    # Convert to list format
+    new_args_list = _args_dict_to_args_list(new_args)
+    # Prepare command, e.g. ["python3", "predict.py"] + new_args_list
+    command = command_list + new_args_list
+    if args.verbose >= 1:
+        print(f'Running {command}')
+    # check=False: a non-zero exit code is reported below instead of raising
+    result = subprocess.run(command, capture_output=True, text=True, check=False)
+    if result.returncode == 0:
+        print(f'{result.stdout}')
+    else:
+        print(f'Error: {result.stderr}')
+def fasta_batch_records(records, work_per_batch_min, work_per_residue=1, verbose=False):
+    """Group FASTA records into consecutive batches using a padded-work estimate.
+
+    The work of a batch is estimated as ``longest sequence * work_per_residue * batch size``.
+    When adding a record would bring that estimate to ``work_per_batch_min`` or above
+    and the current batch is not empty, the current batch is closed and the record
+    starts a new one. Returns the list of batches (each a list of records).
+    """
+    grouped = []
+    pending = []
+    longest_in_pending = 0
+    for rec in records:
+        rec_len = len(rec.sequence)
+        longest_if_added = max(longest_in_pending, rec_len)
+        # Estimated work of the pending batch with this record included
+        work_if_added = longest_if_added * work_per_residue * (len(pending) + 1)
+        if work_if_added >= work_per_batch_min and len(pending) > 0:
+            # Close the pending batch; this record becomes the first of the next one
+            grouped.append(pending)
+            pending = []
+            longest_if_added = rec_len
+        pending.append(rec)
+        longest_in_pending = longest_if_added
+    # Keep the trailing, not yet closed batch
+    if pending:
+        grouped.append(pending)
+    if verbose:
+        for number, members in enumerate(grouped, start=1):
+            residue_total = sum(len(member.sequence) for member in members)
+            print(f'Batch {number}: {residue_total} residues from {len(members)} sequences')
+    return grouped
+def fasta_send_batches_biolib(
+    app_url, batches, args, args_fasta='fasta', machine='cpu.large', stream_all_jobs=True, verbose=1
+):
+    """Send each batch as a separate non-blocking job through the pybiolib interface.
+
+    For every batch a FASTA file is written to a temporary directory and the app
+    loaded from ``app_url`` is started with the attributes of ``args`` as CLI
+    arguments, where ``args_fasta`` is replaced by the batch file and
+    ``multinode_only_local`` is set to True. Afterwards the jobs are processed in
+    submission order and their files are saved to ``job_output/job_<n>``.
+
+    Args:
+        app_url: App reference passed to ``biolib.load``.
+        batches: Iterable of record batches (each batch a list of records).
+        args: Parsed argument namespace; must have a ``verbose`` attribute.
+        args_fasta: Name of the argument that receives the batch FASTA path.
+        machine: Machine passed to ``cli`` for each job.
+        stream_all_jobs: With ``verbose`` set, stream logs of every job rather than only the first.
+        verbose: Controls log streaming and the save messages (the submission
+            messages are controlled by ``args.verbose``).
+
+    Raises:
+        AssertionError: If a job finishes with a non-zero exit code.
+    """
+    if args.verbose >= 1:
+        print(f'Sending {len(batches)} batches to Biolib')
+    current_app = biolib.load(app_url)  # Nb: uses "_" not "-"
+    job_list = []
+    for i, batch_records in enumerate(batches):
+        # Write FASTA, send to server
+        with tempfile.TemporaryDirectory() as tempdir:
+            # Work on a copy: vars(args) is the namespace's own __dict__, so assigning into it
+            # would leave the caller's args pointing at a FASTA file in a deleted temp directory
+            new_args = dict(vars(args))
+            fasta_path = f'{tempdir}/input.fasta'
+            SeqUtil.write_records_to_fasta(fasta_path, batch_records)
+            new_args[args_fasta] = fasta_path
+            new_args['multinode_only_local'] = True
+            new_args_list = _args_dict_to_args_list(new_args)
+            # Started inside the with-block, i.e. while the temporary FASTA file still exists
+            job = current_app.cli(args=new_args_list, blocking=False, machine=machine)
+            job_list.append(job)
+            if args.verbose:
+                batch_dict = _get_batch_stats(batch_records)
+                n_seqs, n_res = batch_dict['records'], batch_dict['residues']
+                print(f'Sending job {i+1}: {n_res} residues from {n_seqs} sequences -> arg_list = {new_args_list}')
+    # Handle the jobs one at a time, in submission order
+    print('Streaming job outputs ...')
+    for i, job in enumerate(job_list):
+        # Stream only if verbose: always for the first job, for the others only if stream_all_jobs is set
+        if verbose and (i == 0 or stream_all_jobs):
+            job.stream_logs()
+        # Explicit raise instead of an assert statement, so the check also runs under "python -O";
+        # AssertionError is kept as the exception type
+        exit_code = job.get_exit_code()
+        if exit_code != 0:
+            raise AssertionError(f'Job failed with exit code {exit_code}')
+        # Write to disk
+        output_dir = f'job_output/job_{i+1}'
+        job.save_files(output_dir=output_dir)
+        if verbose:
+            print(f'Saving to {output_dir}')
+def merge_folder(folder_name, job_out_dir='job_output', out_dir='output', verbose=1):
+    """Collect the ``folder_name`` directory of every job output into one folder under ``out_dir``.
+
+    Job directories matching ``<job_out_dir>/job_*`` are visited in natural sort
+    order. The folder of the first job is moved to ``<out_dir>/<folder_name>``;
+    the entries of the same folder in each later job are then moved to that path.
+    """
+    os.makedirs(out_dir, exist_ok=True)
+    ordered_job_dirs = natsorted(glob.glob(f'{job_out_dir}/job_*'))
+    destination = f'{out_dir}/{folder_name}'
+    # The first job's folder is moved as a whole and becomes the merge target
+    shutil.move(f'{ordered_job_dirs[0]}/{folder_name}', destination)
+    if verbose:
+        print(f'Merging {folder_name} from {len(ordered_job_dirs)} directories to {destination}')
+    # For every remaining job, move the folder entries one by one
+    for later_job_dir in ordered_job_dirs[1:]:
+        source_folder = f'{later_job_dir}/{folder_name}'
+        for entry in os.listdir(source_folder):
+            shutil.move(f'{source_folder}/{entry}', destination)
+def merge_file(
+    file_name,
+    header_lines_int=1,
+    job_out_dir='job_output',
+    out_dir='output',
+    verbose=1,
+):
+    """Concatenate the ``file_name`` file of every job output into one file under ``out_dir``.
+
+    Job directories matching ``<job_out_dir>/job_*`` are visited in natural sort
+    order. The file of the first job is moved to ``<out_dir>/<file_name>`` with its
+    header intact. From each later job's file the first ``header_lines_int`` lines
+    are skipped and the rest is appended.
+
+    Args:
+        file_name: File name relative to each job directory.
+        header_lines_int: Number of leading lines to drop from every file after the first.
+        job_out_dir: Directory containing the ``job_*`` directories.
+        out_dir: Directory receiving the merged file (created if missing).
+        verbose: If truthy, print a one-line summary.
+    """
+    os.makedirs(out_dir, exist_ok=True)
+    job_dirs = glob.glob(f'{job_out_dir}/job_*')
+    job_dirs = natsorted(job_dirs)
+    # Move first file, prepare to merge
+    first_file = f'{job_dirs[0]}/{file_name}'
+    merged_file = f'{out_dir}/{file_name}'
+    shutil.move(first_file, merged_file)
+    if verbose:
+        print(f'Merging {file_name} from {len(job_dirs)} directories to {merged_file}')
+    # If more than one file, append to first
+    if len(job_dirs) >= 2:
+        with open(merged_file, 'a') as merged_file_handle:
+            for job_dir in job_dirs[1:]:
+                extra_file = f'{job_dir}/{file_name}'
+                with open(extra_file) as extra_file_handle:
+                    # Skip the header lines. next() gets a default so that a file with fewer
+                    # lines than header_lines_int (e.g. an empty one) is skipped instead of
+                    # raising StopIteration
+                    for _ in range(header_lines_int):
+                        if next(extra_file_handle, None) is None:
+                            break
+                    # Append the remaining content to the merged file
+                    contents = extra_file_handle.read()
+                    merged_file_handle.write(contents)
+def _get_batch_stats(batch):
+    """Return the number of records in ``batch`` and their summed sequence length."""
+    record_total = len(batch)
+    residue_total = 0
+    for entry in batch:
+        residue_total += len(entry.sequence)
+    return {'records': record_total, 'residues': residue_total}
+def _args_dict_to_args_list(new_args):
+    """Flatten an args dict into ``['--key', 'value', ...]`` with every value formatted as a string."""
+    flat_args = []
+    for name, val in new_args.items():
+        # Each entry contributes the flag followed by its stringified value
+        flat_args.extend((f'--{name}', f'{val}'))
+    return flat_args

biolib/_runtime/runtime.py ADDED Viewed

@@ -0,0 +1,157 @@
+import json
+import re
+from pathlib import Path
+from typing import Optional
+from biolib import api
+from biolib._internal.runtime import BioLibRuntimeError, BioLibRuntimeNotRecognizedError, RuntimeJobDataDict
+from biolib.biolib_logging import logger
+from biolib.typing_utils import cast
+from biolib.utils.seq_util import SeqUtil
+class Runtime:
+    """Static accessors for the job data and secrets available to a running BioLib job.
+
+    The job data is read from ``/biolib/secrets/biolib_system_secret`` on first
+    use and cached on the class. Accessors that need it raise
+    ``BioLibRuntimeNotRecognizedError`` when it cannot be loaded.
+    """
+    # Cached job data; None until it has been loaded successfully
+    _job_data: Optional[RuntimeJobDataDict] = None
+    @staticmethod
+    def check_is_environment_biolib_app() -> bool:
+        """Return True if the job data could be loaded."""
+        return bool(Runtime._try_to_get_job_data())
+    @staticmethod
+    def check_is_environment_biolib_cloud() -> bool:
+        """Return the ``is_environment_biolib_cloud`` entry of the job data (False if absent)."""
+        return Runtime._get_job_data().get('is_environment_biolib_cloud', False)
+    @staticmethod
+    def get_job_id() -> str:
+        """Return the ``job_uuid`` entry of the job data."""
+        return Runtime._get_job_data()['job_uuid']
+    @staticmethod
+    def get_job_auth_token() -> str:
+        """Return the ``job_auth_token`` entry of the job data."""
+        return Runtime._get_job_data()['job_auth_token']
+    @staticmethod
+    def get_job_requested_machine() -> Optional[str]:
+        """Return the ``job_requested_machine`` entry of the job data, or None if missing or empty."""
+        return Runtime._get_job_data().get('job_requested_machine') or None
+    @staticmethod
+    def is_spot_machine_requested() -> bool:
+        """Return the ``job_requested_machine_spot`` entry of the job data (False if absent)."""
+        job_data = Runtime._get_job_data()
+        return job_data.get('job_requested_machine_spot', False)
+    @staticmethod
+    def get_app_uri() -> str:
+        """Return the ``app_uri`` entry of the job data."""
+        return Runtime._get_job_data()['app_uri']
+    @staticmethod
+    def get_max_workers() -> int:
+        """Return the ``job_reserved_machines`` entry of the job data."""
+        return Runtime._get_job_data()['job_reserved_machines']
+    @staticmethod
+    def _assert_valid_secret_name(secret_name: str) -> None:
+        """Raise AssertionError unless ``secret_name`` consists only of ``[a-zA-Z0-9_-]``."""
+        # An explicit raise is used instead of an assert statement: asserts are removed under
+        # "python -O", which would let names such as "../x" reach open(). fullmatch also
+        # rejects a trailing newline, which "$" with re.match would accept.
+        # AssertionError is kept so the exception type seen by callers does not change.
+        if not re.fullmatch('[a-zA-Z0-9_-]*', secret_name):
+            raise AssertionError('Secret name can only contain alphanumeric characters and dashes or underscores ')
+    @staticmethod
+    def get_secret(secret_name: str) -> bytes:
+        """Return the content of ``/biolib/secrets/<secret_name>`` as bytes.
+
+        Raises:
+            AssertionError: If ``secret_name`` contains characters outside ``[a-zA-Z0-9_-]``.
+            BioLibRuntimeError: If the file cannot be read.
+        """
+        Runtime._assert_valid_secret_name(secret_name)
+        try:
+            with open(f'/biolib/secrets/{secret_name}', 'rb') as file:
+                return file.read()
+        except Exception as error:
+            # Exception rather than BaseException, so KeyboardInterrupt/SystemExit pass through
+            raise BioLibRuntimeError(f'Unable to get system secret: {secret_name}') from error
+    @staticmethod
+    def get_temporary_client_secret(secret_name: str) -> bytes:
+        """Return the content of ``/biolib/temporary-client-secrets/<secret_name>`` as bytes.
+
+        Raises:
+            AssertionError: If ``secret_name`` contains characters outside ``[a-zA-Z0-9_-]``.
+            BioLibRuntimeError: If the file cannot be read.
+        """
+        Runtime._assert_valid_secret_name(secret_name)
+        try:
+            with open(f'/biolib/temporary-client-secrets/{secret_name}', 'rb') as file:
+                return file.read()
+        except Exception as error:
+            # Exception rather than BaseException, so KeyboardInterrupt/SystemExit pass through
+            raise BioLibRuntimeError(f'Unable to get secret: {secret_name}') from error
+    @staticmethod
+    def set_main_result_prefix(result_prefix: str) -> None:
+        """PATCH ``result_name_prefix`` on the main result of the current job, using the job auth token."""
+        job_data = Runtime._get_job_data()
+        api.client.patch(
+            data={'result_name_prefix': result_prefix},
+            headers={'Job-Auth-Token': job_data['job_auth_token']},
+            path=f"/jobs/{job_data['job_uuid']}/main_result/",
+        )
+    @staticmethod
+    def set_result_name_prefix(result_prefix: str) -> None:
+        """Alias of ``set_main_result_prefix``."""
+        Runtime.set_main_result_prefix(result_prefix)
+    @staticmethod
+    def set_result_name_prefix_from_fasta(path_to_fasta: str) -> None:
+        """
+        Set the BioLib result name from a FASTA file path.
+
+        If the path starts with ``input_`` followed by alphanumerics (a BioLib generated
+        name), the ID of the first sequence in the file is used, with spaces replaced by
+        underscores and truncated to 60 characters. Otherwise the final path component
+        (``Path.name``, which keeps the file extension) is used.
+
+        Any failure is logged as a warning and not raised.
+        """
+        try:
+            # Set job name to first header if FASTA text input (random BioLib file) detected
+            if re.match('^input_[A-Za-z0-9]+.*', path_to_fasta):
+                first_id = next(SeqUtil.parse_fasta(path_to_fasta)).id
+                result_name = first_id.replace(' ', '_')[:60]
+            else:
+                result_name = Path(path_to_fasta).name
+            logger.debug(f'Setting result name to "{result_name}" from {path_to_fasta}')
+            Runtime.set_result_name_prefix(result_name)
+        except Exception as e:
+            logger.warning(f'Failed to set result name from fasta file {path_to_fasta}: {str(e)}')
+    @staticmethod
+    def set_result_name_from_file(path_to_file: str) -> None:
+        """Set the BioLib result name from a file path.
+
+        Paths ending in ``.fasta`` (case-insensitive) are delegated to
+        ``set_result_name_prefix_from_fasta``. For other paths the final path component,
+        truncated to 60 characters, is used, unless the path starts with ``input_``
+        followed by alphanumerics, in which case nothing is set.
+
+        Any failure is logged as a warning and not raised.
+        """
+        try:
+            if path_to_file.lower().endswith('.fasta'):
+                return Runtime.set_result_name_prefix_from_fasta(path_to_file)
+            # Set job name only if not a BioLib default name
+            if not re.match('^input_[A-Za-z0-9]+.*', path_to_file):
+                result_name = Path(path_to_file).name[:60]
+                logger.debug(f'Setting result name to "{result_name}" from {path_to_file}')
+                Runtime.set_result_name_prefix(result_name)
+        except Exception as e:
+            logger.warning(f'Failed to set result name from file {path_to_file}: {str(e)}')
+    @staticmethod
+    def set_result_name_from_string(result_name: str) -> None:
+        """Set the BioLib result name to ``result_name`` truncated to 60 characters.
+
+        Any failure is logged as a warning and not raised.
+        """
+        try:
+            truncated_name = result_name[:60]
+            logger.debug(f'Setting result name to "{truncated_name}" from string')
+            Runtime.set_result_name_prefix(truncated_name)
+        except Exception as e:
+            logger.warning(f'Failed to set result name from string: {str(e)}')
+    @staticmethod
+    def create_result_note(note: str) -> None:
+        """POST ``note`` to the notes endpoint of the current job."""
+        job_id = Runtime.get_job_id()
+        # Note: Authentication is added by app caller proxy in compute node
+        api.client.post(data={'note': note}, path=f'/jobs/{job_id}/notes/')
+    @staticmethod
+    def _try_to_get_job_data() -> Optional[RuntimeJobDataDict]:
+        """Return the cached job data, loading it on first use; None if it cannot be read.
+
+        Raises:
+            BioLibRuntimeError: If the loaded data has a ``version`` not starting with ``1.``.
+        """
+        if not Runtime._job_data:
+            try:
+                with open('/biolib/secrets/biolib_system_secret') as file:
+                    job_data: RuntimeJobDataDict = json.load(file)
+            except Exception:
+                # Best effort: a missing or unreadable file means "not a BioLib job".
+                # Exception rather than BaseException, so KeyboardInterrupt/SystemExit pass through.
+                return None
+            if not job_data['version'].startswith('1.'):
+                raise BioLibRuntimeError(f"Unexpected system secret version {job_data['version']} expected 1.x.x")
+            Runtime._job_data = job_data
+        return cast(RuntimeJobDataDict, Runtime._job_data)
+    @staticmethod
+    def _get_job_data() -> RuntimeJobDataDict:
+        """Return the job data, raising ``BioLibRuntimeNotRecognizedError`` if it is unavailable."""
+        job_data = Runtime._try_to_get_job_data()
+        if not job_data:
+            raise BioLibRuntimeNotRecognizedError() from None
+        return job_data

biolib/_session/session.py ADDED Viewed

@@ -0,0 +1,44 @@
+from biolib import utils
+from biolib.typing_utils import Optional
+from biolib.api.client import ApiClient, ApiClientInitDict
+from biolib.app import BioLibApp
+class Session:
+    """Pairs an ``ApiClient`` with an optional experiment value used when loading apps."""
+    def __init__(self, _init_dict: ApiClientInitDict, _experiment: Optional[str] = None) -> None:
+        self._api = ApiClient(_init_dict=_init_dict)
+        self._experiment = _experiment
+    @staticmethod
+    def get_session(
+        refresh_token: str,
+        base_url: Optional[str] = None,
+        client_type: Optional[str] = None,
+        experiment: Optional[str] = None,
+    ) -> 'Session':
+        """Create a session from a refresh token.
+
+        When ``base_url`` is not given (or falsy) it is taken from
+        ``utils.load_base_url_from_env()``.
+        """
+        init_dict = ApiClientInitDict(
+            refresh_token=refresh_token,
+            base_url=base_url or utils.load_base_url_from_env(),
+            client_type=client_type,
+        )
+        return Session(_init_dict=init_dict, _experiment=experiment)
+    def load(self, uri: str, suppress_version_warning: bool = False) -> BioLibApp:
+        """Load a BioLib application through this session's API client.
+
+        Args:
+            uri (str): The URI or website URL of the application to load, e.g.
+                'biolib/myapp:1.0.0' or 'https://biolib.com/biolib/myapp/'.
+            suppress_version_warning (bool): Forwarded to ``BioLibApp``; if True, no
+                warning is printed when no version is specified. Defaults to False.
+
+        Returns:
+            BioLibApp: The loaded application object, created with this session's
+            API client and experiment value.
+        """
+        app = BioLibApp(
+            uri=uri,
+            _api_client=self._api,
+            suppress_version_warning=suppress_version_warning,
+            _experiment=self._experiment,
+        )
+        return app

biolib/_shared/__init__.py ADDED Viewed

File without changes

biolib/_shared/types/__init__.py ADDED Viewed

@@ -0,0 +1,74 @@
+from .account import AccountDict, AccountDetailedDict
+from .account_member import AccountMemberDict
+from .app import AppDetailedDict, AppSlimDict
+from .data_record import (
+    DataRecordDetailedDict,
+    DataRecordSlimDict,
+    DataRecordTypeDict,
+    DataRecordValidationRuleDict,
+    SqliteV1Column,
+    SqliteV1DatabaseSchema,
+    SqliteV1ForeignKey,
+    SqliteV1Table,
+)
+from .experiment import (
+    DeprecatedExperimentDict,
+    ExperimentDetailedDict,
+    ExperimentDict,
+    ResultCounts,
+)
+from .file_node import FileNodeDict, FileZipMetadataDict, ZipFileNodeDict
+from .push import PushResponseDict
+from .resource import ResourceDetailedDict, ResourceDict, ResourceTypeLiteral, ResourceUriDict, SemanticVersionDict
+from .resource_deploy_key import ResourceDeployKeyDict, ResourceDeployKeyWithSecretDict
+from .resource_permission import ResourcePermissionDetailedDict, ResourcePermissionDict
+from .resource_version import (
+    ResourceVersionAssetsDict,
+    ResourceVersionDetailedDict,
+    ResourceVersionDict,
+)
+from .result import ResultDetailedDict, ResultDict
+from .typing import Optional
+from .user import EnterpriseSettingsDict, UserDetailedDict, UserDict
+# Public names of this package. Each entry corresponds to a name imported above,
+# so `from <this package> import *` re-exports all of them.
+__all__ = [
+    'AccountDetailedDict',
+    'AccountDict',
+    'AccountMemberDict',
+    'AppDetailedDict',
+    'AppSlimDict',
+    'DataRecordDetailedDict',
+    'DataRecordSlimDict',
+    'DataRecordTypeDict',
+    'DataRecordValidationRuleDict',
+    'DeprecatedExperimentDict',
+    'EnterpriseSettingsDict',
+    'ExperimentDetailedDict',
+    'ExperimentDict',
+    'FileNodeDict',
+    'FileZipMetadataDict',
+    'Optional',
+    'PushResponseDict',
+    'ResourceDeployKeyDict',
+    'ResourceDeployKeyWithSecretDict',
+    'ResourceDetailedDict',
+    'ResourceDict',
+    'ResourceTypeLiteral',
+    'ResourcePermissionDetailedDict',
+    'ResourcePermissionDict',
+    'ResourceUriDict',
+    'ResourceVersionAssetsDict',
+    'ResourceVersionDetailedDict',
+    'ResourceVersionDict',
+    'ResultCounts',
+    'ResultDetailedDict',
+    'ResultDict',
+    'SemanticVersionDict',
+    'SqliteV1Column',
+    'SqliteV1DatabaseSchema',
+    'SqliteV1ForeignKey',
+    'SqliteV1Table',
+    'UserDetailedDict',
+    'UserDict',
+    'ZipFileNodeDict',
+]

biolib/_shared/types/account.py ADDED Viewed

@@ -0,0 +1,12 @@
+from .typing import TypedDict
+class AccountDict(TypedDict):
+    """Typed dictionary with the basic string fields of an account."""
+    uuid: str
+    handle: str
+    display_name: str
+    description: str
+class AccountDetailedDict(AccountDict):
+    """``AccountDict`` extended with a ``bio`` field."""
+    bio: str

biolib/_shared/types/account_member.py ADDED Viewed

@@ -0,0 +1,8 @@
+from .typing import Literal, TypedDict
+from .user import UserDict
+class AccountMemberDict(TypedDict):
+    """Typed dictionary describing one member entry of an account."""
+    user: UserDict
+    # Restricted to these two literal values
+    role: Literal['member', 'admin']
+    # presumably a timestamp serialized as a string; TODO confirm the format
+    added_at: str

biolib/_shared/types/app.py ADDED Viewed

@@ -0,0 +1,9 @@
+from .typing import TypedDict
+class AppSlimDict(TypedDict):
+    """Typed dictionary for an app; no fields are declared here yet."""
+    pass
+class AppDetailedDict(AppSlimDict):
+    """Detailed variant of ``AppSlimDict``; declares no additional fields yet."""
+    pass

biolib/_shared/types/data_record.py ADDED Viewed

@@ -0,0 +1,40 @@
+from .typing import Dict, List, Literal, Optional, TypedDict, Union
+class SqliteV1ForeignKey(TypedDict):
+    """Foreign key reference, given as a table name and a column name."""
+    table: str
+    column: str
+class SqliteV1Column(TypedDict):
+    """Description of one column in a ``SqliteV1Table``."""
+    # Column type, restricted to these four literal values
+    type: Literal['INTEGER', 'REAL', 'TEXT', 'JSON']
+    nullable: Optional[bool]
+    foreign_key: Optional[SqliteV1ForeignKey]
+    # presumably only meaningful for columns of type 'JSON'; TODO confirm
+    json_schema: Optional[Dict]
+class SqliteV1Table(TypedDict):
+    """Table description: maps column names to ``SqliteV1Column`` entries."""
+    columns: Dict[str, SqliteV1Column]
+class SqliteV1DatabaseSchema(TypedDict):
+    """Database schema: maps table names to ``SqliteV1Table`` entries."""
+    tables: Dict[str, SqliteV1Table]
+class DataRecordValidationRuleDict(TypedDict):
+    """One validation rule of a data record type."""
+    path: str
+    type: str
+    # A Union with a single member is equivalent to that member (SqliteV1DatabaseSchema)
+    rule: Union[SqliteV1DatabaseSchema]
+class DataRecordTypeDict(TypedDict):
+    """A named data record type with its list of validation rules."""
+    name: str
+    validation_rules: List[DataRecordValidationRuleDict]
+class DataRecordSlimDict(TypedDict):
+    """Typed dictionary for a data record; no fields are declared here yet."""
+    pass
+class DataRecordDetailedDict(DataRecordSlimDict):
+    """``DataRecordSlimDict`` extended with an optional ``type`` field."""
+    type: Optional[DataRecordTypeDict]

biolib/_shared/types/experiment.py ADDED Viewed

@@ -0,0 +1,32 @@
+from .result import ResultDict
+from .typing import Optional, TypedDict
+class ResultCounts(TypedDict):
+    """Integer counters of results, one per status plus a ``total``."""
+    cancelled: int
+    completed: int
+    failed: int
+    in_progress: int
+    queued: int
+    total: int
+class DeprecatedExperimentDict(TypedDict):
+    """Base of ``ExperimentDict`` holding the deprecated job counters."""
+    # Note: fields on this TypedDict are deprecated
+    job_count: int
+    job_running_count: int
+class ExperimentDict(DeprecatedExperimentDict):
+    """Experiment fields; also carries the deprecated counters of ``DeprecatedExperimentDict``."""
+    uuid: Optional[str]
+    name: Optional[str]
+    account_uuid: Optional[str]
+    # presumably timestamps serialized as strings; TODO confirm the format
+    created_at: Optional[str]
+    finished_at: Optional[str]
+    last_created_at: Optional[str]
+    last_created_result: Optional[ResultDict]
+    result_counts: ResultCounts
+class ExperimentDetailedDict(ExperimentDict):
+    """Detailed variant of ``ExperimentDict``; declares no additional fields yet."""
+    pass

pybiolib 0.2.951__py3-none-any.whl → 1.2.1890__py3-none-any.whl

pybiolib 0.2.951__py3-none-any.whl → 1.2.1890__py3-none-any.whl