compose-runner 0.6.3rc1.tar.gz → 0.6.4rc1.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (37)
  1. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/Dockerfile +7 -0
  2. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/PKG-INFO +2 -2
  3. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/README.md +1 -1
  4. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/_version.py +2 -2
  5. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/aws_lambda/run_handler.py +71 -1
  6. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/ecs_task.py +3 -0
  7. compose_runner-0.6.4rc1/compose_runner/tests/cassettes/test_lambda_handlers/test_select_task_size_uses_large_for_montecarlo.yaml +60 -0
  8. compose_runner-0.6.4rc1/compose_runner/tests/cassettes/test_lambda_handlers/test_select_task_size_uses_standard_for_fdr.yaml +55 -0
  9. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/tests/test_lambda_handlers.py +51 -0
  10. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/infra/cdk/stacks/compose_runner_stack.py +96 -38
  11. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/.gitignore +0 -0
  12. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/LICENSE +0 -0
  13. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/aws_lambda/.dockerignore +0 -0
  14. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/aws_lambda/Dockerfile +0 -0
  15. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/__init__.py +0 -0
  16. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/aws_lambda/__init__.py +0 -0
  17. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/aws_lambda/common.py +0 -0
  18. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/aws_lambda/log_poll_handler.py +0 -0
  19. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/aws_lambda/results_handler.py +0 -0
  20. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/aws_lambda/status_handler.py +0 -0
  21. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/cli.py +0 -0
  22. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/run.py +0 -0
  23. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/sentry.py +0 -0
  24. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/tests/cassettes/test_run/test_download_bundle.yaml +0 -0
  25. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/tests/cassettes/test_run/test_run_database_workflow.yaml +0 -0
  26. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/tests/cassettes/test_run/test_run_group_comparison_workflow.yaml +0 -0
  27. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/tests/cassettes/test_run/test_run_string_group_comparison_workflow.yaml +0 -0
  28. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/tests/cassettes/test_run/test_run_workflow.yaml +0 -0
  29. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/tests/conftest.py +0 -0
  30. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/tests/test_cli.py +0 -0
  31. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/tests/test_ecs_task.py +0 -0
  32. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/tests/test_run.py +0 -0
  33. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/infra/cdk/app.py +0 -0
  34. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/infra/cdk/cdk.json +0 -0
  35. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/infra/cdk/requirements.txt +0 -0
  36. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/infra/cdk/stacks/__init__.py +0 -0
  37. {compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/pyproject.toml +0 -0
{compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/Dockerfile

@@ -1,5 +1,12 @@
  FROM python:3.13-slim
 
+ ARG COMPOSE_RUNNER_VERSION
+ ENV COMPOSE_RUNNER_VERSION=${COMPOSE_RUNNER_VERSION}
+ LABEL org.opencontainers.image.title="compose-runner ecs task"
+ LABEL org.opencontainers.image.version=${COMPOSE_RUNNER_VERSION}
+
+ RUN test -n "$COMPOSE_RUNNER_VERSION" || (echo "COMPOSE_RUNNER_VERSION build arg is required" && exit 1)
+
  RUN apt-get update && apt-get install -y \
      git \
      && rm -rf /var/lib/apt/lists/*
{compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/PKG-INFO

@@ -1,6 +1,6 @@
  Metadata-Version: 2.4
  Name: compose-runner
- Version: 0.6.3rc1
+ Version: 0.6.4rc1
  Summary: A package for running neurosynth-compose analyses
  Project-URL: Repository, https://github.com/neurostuff/compose-runner
  Author-email: James Kent <jamesdkent21@gmail.com>
@@ -67,7 +67,7 @@ The deployed architecture works like this:
  Pass `-c resultsBucketName=<bucket>` to use an existing S3 bucket, or omit it
  to let the stack create and retain a dedicated bucket. Additional knobs:
 
- - `-c stateMachineTimeoutSeconds=7200` to control the max wall clock per run
+ - `-c stateMachineTimeoutSeconds=32400` to control the max wall clock per run
  - `-c submitTimeoutSeconds` / `-c statusTimeoutSeconds` / `-c pollTimeoutSeconds`
    to tune Lambda timeouts
  - `-c taskEphemeralStorageGiB` if the default 21 GiB scratch volume is insufficient
{compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/README.md

@@ -44,7 +44,7 @@ The deployed architecture works like this:
  Pass `-c resultsBucketName=<bucket>` to use an existing S3 bucket, or omit it
  to let the stack create and retain a dedicated bucket. Additional knobs:
 
- - `-c stateMachineTimeoutSeconds=7200` to control the max wall clock per run
+ - `-c stateMachineTimeoutSeconds=32400` to control the max wall clock per run
  - `-c submitTimeoutSeconds` / `-c statusTimeoutSeconds` / `-c pollTimeoutSeconds`
    to tune Lambda timeouts
  - `-c taskEphemeralStorageGiB` if the default 21 GiB scratch volume is insufficient
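
Note: the PKG-INFO and README hunks document the same change, raising the default state-machine timeout from 7200 to 32400 seconds (2 h → 9 h), matching the new default in compose_runner_stack.py below. A minimal sketch of how such a `-c` context knob is resolved (string in, integer out; the helper name is hypothetical, the knob name comes from the hunks above):

    from typing import Optional

    def resolve_timeout_seconds(context_value: Optional[str]) -> int:
        # `cdk deploy -c stateMachineTimeoutSeconds=...` passes context values as
        # strings; the stack falls back to 32400 seconds when the knob is omitted.
        return int(context_value or 32400)

    assert resolve_timeout_seconds(None) == 32400   # new default: 9 hours
    assert resolve_timeout_seconds("7200") == 7200  # old default, still settable
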
{compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/_version.py

@@ -28,7 +28,7 @@ version_tuple: VERSION_TUPLE
  commit_id: COMMIT_ID
  __commit_id__: COMMIT_ID
 
- __version__ = version = '0.6.3rc1'
- __version_tuple__ = version_tuple = (0, 6, 3, 'rc1')
+ __version__ = version = '0.6.4rc1'
+ __version_tuple__ = version_tuple = (0, 6, 4, 'rc1')
 
  __commit_id__ = commit_id = None
{compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/aws_lambda/run_handler.py

@@ -4,6 +4,8 @@ import json
  import logging
  import os
  import uuid
+ import urllib.error
+ import urllib.request
  from typing import Any, Dict, Optional
 
  import boto3
@@ -22,6 +24,8 @@ RESULTS_PREFIX_ENV = "RESULTS_PREFIX"
  NSC_KEY_ENV = "NSC_KEY"
  NV_KEY_ENV = "NV_KEY"
 
+ DEFAULT_TASK_SIZE = "standard"
+
 
  def _log(job_id: str, message: str, **details: Any) -> None:
      payload = {"job_id": job_id, "message": message, **details}
@@ -29,6 +33,67 @@ def _log(job_id: str, message: str, **details: Any) -> None:
      logger.info(json.dumps(payload))
 
 
+ def _compose_api_base_url(environment: str) -> str:
+     env = (environment or "production").lower()
+     if env == "staging":
+         return "https://synth.neurostore.xyz/api"
+     if env == "local":
+         return "http://localhost:81/api"
+     return "https://compose.neurosynth.org/api"
+
+
+ def _fetch_meta_analysis(meta_analysis_id: str, environment: str) -> Optional[Dict[str, Any]]:
+     base_url = _compose_api_base_url(environment).rstrip("/")
+     url = f"{base_url}/meta-analyses/{meta_analysis_id}?nested=true"
+     request = urllib.request.Request(url, headers={"User-Agent": "compose-runner/submit"})
+     try:
+         with urllib.request.urlopen(request, timeout=10) as response:
+             return json.load(response)
+     except (urllib.error.URLError, urllib.error.HTTPError, json.JSONDecodeError) as exc:
+         logger.warning("Failed to fetch meta-analysis %s: %s", meta_analysis_id, exc)
+         return None
+
+
+ def _requires_large_task(specification: Dict[str, Any]) -> bool:
+     if not isinstance(specification, dict):
+         return False
+     corrector = specification.get("corrector")
+     if not isinstance(corrector, dict):
+         return False
+     if corrector.get("type") != "FWECorrector":
+         return False
+     args = corrector.get("args")
+     if not isinstance(args, dict):
+         return False
+     method = args.get("method")
+     if method is None:
+         kwargs = args.get("**kwargs")
+         if isinstance(kwargs, dict):
+             method = kwargs.get("method")
+     if isinstance(method, str) and method.lower() == "montecarlo":
+         return True
+     return False
+
+
+ def _select_task_size(meta_analysis_id: str, environment: str, artifact_prefix: str) -> str:
+     doc = _fetch_meta_analysis(meta_analysis_id, environment)
+     if not doc:
+         return DEFAULT_TASK_SIZE
+     specification = doc.get("specification")
+     try:
+         if _requires_large_task(specification):
+             _log(
+                 artifact_prefix,
+                 "workflow.task_size_selected",
+                 task_size="large",
+                 reason="montecarlo_fwe",
+             )
+             return "large"
+     except Exception as exc:  # noqa: broad-except
+         logger.warning("Failed to evaluate specification for %s: %s", meta_analysis_id, exc)
+     return DEFAULT_TASK_SIZE
+
+
  def _job_input(
      payload: Dict[str, Any],
      artifact_prefix: str,
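
Note: the detection above escalates only FWECorrector specifications whose method resolves to "montecarlo", whether the method sits directly in `args` or under the nested `"**kwargs"` key; everything else falls back to the "standard" size. Illustrative payloads exercising the helper (shapes taken from the cassettes below; requires the package installed):

    from compose_runner.aws_lambda import run_handler

    fwe_montecarlo = {"corrector": {"type": "FWECorrector", "args": {"method": "montecarlo"}}}
    fwe_nested = {"corrector": {"type": "FWECorrector", "args": {"**kwargs": {"method": "montecarlo"}}}}
    fdr = {"corrector": {"type": "FDRCorrector", "args": {"method": "indep", "alpha": 0.05}}}

    assert run_handler._requires_large_task(fwe_montecarlo)  # direct "method" key
    assert run_handler._requires_large_task(fwe_nested)      # "method" under "**kwargs"
    assert not run_handler._requires_large_task(fdr)         # anything else stays standard
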
@@ -36,6 +101,7 @@ def _job_input(
      prefix: Optional[str],
      nsc_key: Optional[str],
      nv_key: Optional[str],
+     task_size: str,
  ) -> Dict[str, Any]:
      no_upload_flag = bool(payload.get("no_upload", False))
      doc: Dict[str, Any] = {
@@ -44,6 +110,7 @@
          "environment": payload.get("environment", "production"),
          "no_upload": "true" if no_upload_flag else "false",
          "results": {"bucket": bucket or "", "prefix": prefix or ""},
+         "task_size": task_size,
      }
      n_cores = payload.get("n_cores")
      doc["n_cores"] = str(n_cores) if n_cores is not None else ""
@@ -76,7 +143,10 @@ def handler(event: Dict[str, Any], context: Any) -> Dict[str, Any]:
      nsc_key = payload.get("nsc_key") or os.environ.get(NSC_KEY_ENV)
      nv_key = payload.get("nv_key") or os.environ.get(NV_KEY_ENV)
 
-     job_input = _job_input(payload, artifact_prefix, bucket, prefix, nsc_key, nv_key)
+     environment = payload.get("environment", "production")
+     task_size = _select_task_size(payload["meta_analysis_id"], environment, artifact_prefix)
+
+     job_input = _job_input(payload, artifact_prefix, bucket, prefix, nsc_key, nv_key, task_size)
      params = {
          "stateMachineArn": os.environ[STATE_MACHINE_ARN_ENV],
          "name": artifact_prefix,
{compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/ecs_task.py

@@ -93,6 +93,7 @@ def main() -> None:
      nv_key = os.environ.get(NV_KEY_ENV) or None
      no_upload = _bool_from_env(os.environ.get(NO_UPLOAD_ENV))
      n_cores = _resolve_n_cores(os.environ.get(N_CORES_ENV))
+     compose_runner_version = os.environ.get("COMPOSE_RUNNER_VERSION", "unknown")
 
      bucket = os.environ.get(RESULTS_BUCKET_ENV)
      prefix = os.environ.get(RESULTS_PREFIX_ENV)
@@ -106,6 +107,7 @@
          meta_analysis_id=meta_analysis_id,
          environment=environment,
          no_upload=no_upload,
+         compose_runner_version=compose_runner_version,
      )
      try:
          url, _ = run_compose(
111
113
  url, _ = run_compose(
@@ -125,6 +127,7 @@ def main() -> None:
125
127
  "result_url": url,
126
128
  "artifacts_bucket": bucket,
127
129
  "artifacts_prefix": prefix,
130
+ "compose_runner_version": compose_runner_version,
128
131
  }
129
132
 
130
133
  if bucket:
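
Note: together with the Dockerfile change above (`ARG COMPOSE_RUNNER_VERSION` → `ENV COMPOSE_RUNNER_VERSION`), the version stamped at build time is visible inside the ECS task and flows through to the result document. A minimal sketch of the propagation (bucket, prefix, and URL values are illustrative):

    import os

    # The image's ENV makes the build-time version readable at runtime;
    # "unknown" only appears if the variable is absent from the environment.
    compose_runner_version = os.environ.get("COMPOSE_RUNNER_VERSION", "unknown")

    result = {
        "result_url": "https://neurostore.org/...",  # illustrative
        "artifacts_bucket": "my-results-bucket",     # illustrative
        "artifacts_prefix": "runs/abc123",           # illustrative
        "compose_runner_version": compose_runner_version,
    }
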
compose_runner-0.6.4rc1/compose_runner/tests/cassettes/test_lambda_handlers/test_select_task_size_uses_large_for_montecarlo.yaml

@@ -0,0 +1,60 @@
+ interactions:
+ - request:
+     method: GET
+     uri: https://synth.neurostore.xyz/api/meta-analyses/ZPSvyvhZAopz?nested=true
+     body: null
+     headers:
+       Accept:
+       - '*/*'
+       Accept-Encoding:
+       - gzip, deflate
+       Connection:
+       - keep-alive
+       User-Agent:
+       - python-requests/2.32.4
+   response:
+     status:
+       code: 200
+       message: OK
+     headers:
+       Server:
+       - nginx/1.21.6
+       Date:
+       - Tue, 21 Oct 2025 14:08:45 GMT
+       Content-Type:
+       - application/json
+       Transfer-Encoding:
+       - chunked
+       Connection:
+       - keep-alive
+       Vary:
+       - Accept-Encoding
+       Content-Encoding:
+       - gzip
+       Strict-Transport-Security:
+       - max-age=31536000
+     body:
+       string: '{"id": "ZPSvyvhZAopz", "created_at": "2025-10-21T04:57:40.236536+00:00",
+         "updated_at": null, "user": "github|12564882", "username": "James Kent", "name":
+         "Untitled MKDADensity Meta Analysis: included", "description": "MKDADensity
+         meta analysis with FWECorrector", "provenance": null, "specification": {"id":
+         "zQdMa4uAaYYU", "created_at": "2025-10-21T04:57:39.888528+00:00", "updated_at":
+         null, "user": "github|12564882", "username": "James Kent", "type": "CBMA",
+         "estimator": {"type": "MKDADensity", "args": {"null_method": "approximate",
+         "n_iters": 5000, "**kwargs": {}, "kernel__r": 10, "kernel__value": 1}}, "database_studyset":
+         null, "filter": "included", "corrector": {"type": "FWECorrector", "args":
+         {"voxel_thresh": 0.001, "n_iters": 5000, "vfwe_only": false, "method": "montecarlo"}},
+         "conditions": [true], "weights": [1.0]}, "neurostore_analysis": {"id": "8S5xRedCGRkz",
+         "created_at": "2025-10-21T04:57:40.255480+00:00", "updated_at": null, "neurostore_id":
+         null, "exception": null, "traceback": null, "status": "PENDING"}, "studyset":
+         {"id": "9jPvdkuRufUP", "created_at": "2025-10-21T04:57:40.008456+00:00", "updated_at":
+         null, "user": "github|12564882", "username": "James Kent", "snapshot": null,
+         "neurostore_id": "3EmvH2LELwR2", "version": null, "url": "https://neurostore.org/api/studysets/3EmvH2LELwR2"},
+         "annotation": {"id": "YVLt6DRFKdd5", "created_at": "2025-10-21T04:57:40.121637+00:00",
+         "updated_at": null, "user": "github|12564882", "username": "James Kent", "snapshot":
+         null, "neurostore_id": "TebrRstj8ofh", "studyset": "3EmvH2LELwR2", "url":
+         "https://neurostore.org/api/annotations/TebrRstj8ofh"}, "project": "D2cTfoxNfpLy",
+         "cached_studyset": "9jPvdkuRufUP", "cached_annotation": "YVLt6DRFKdd5", "run_key":
+         "PDeDnh_8MXc88xoVJySz3w", "results": [], "neurostore_url": null}'
+     http_version: HTTP/1.1
+ version: 1
compose_runner-0.6.4rc1/compose_runner/tests/cassettes/test_lambda_handlers/test_select_task_size_uses_standard_for_fdr.yaml

@@ -0,0 +1,55 @@
+ interactions:
+ - request:
+     body: null
+     headers:
+       Connection:
+       - close
+       Host:
+       - synth.neurostore.xyz
+       User-Agent:
+       - compose-runner/submit
+     method: GET
+     uri: https://synth.neurostore.xyz/api/meta-analyses/VtFZJFniCKvG?nested=true
+   response:
+     body:
+       string: '{"id": "VtFZJFniCKvG", "created_at": "2025-10-21T14:10:35.309383+00:00",
+         "updated_at": null, "user": "github|12564882", "username": "James Kent", "name":
+         "Untitled MKDADensity Meta Analysis: included (1)", "description": "MKDADensity
+         meta analysis with FDRCorrector", "provenance": null, "specification": {"id":
+         "DtVzKEKGaXLu", "created_at": "2025-10-21T14:10:34.564365+00:00", "updated_at":
+         null, "user": "github|12564882", "username": "James Kent", "type": "CBMA",
+         "estimator": {"type": "MKDADensity", "args": {"null_method": "approximate",
+         "n_iters": 5000, "**kwargs": {}, "kernel__r": 10, "kernel__value": 1}}, "database_studyset":
+         null, "filter": "included", "corrector": {"type": "FDRCorrector", "args":
+         {"method": "indep", "alpha": 0.05}}, "conditions": [true], "weights": [1.0]},
+         "neurostore_analysis": {"id": "564c8kRnJVT4", "created_at": "2025-10-21T14:10:35.325173+00:00",
+         "updated_at": null, "neurostore_id": null, "exception": null, "traceback":
+         null, "status": "PENDING"}, "studyset": {"id": "FA3BDBdGRZ5d", "created_at":
+         "2025-10-21T14:10:34.821625+00:00", "updated_at": null, "user": "github|12564882",
+         "username": "James Kent", "snapshot": null, "neurostore_id": "3EmvH2LELwR2",
+         "version": null, "url": "https://neurostore.org/api/studysets/3EmvH2LELwR2"},
+         "annotation": {"id": "XELVYV7ftp7e", "created_at": "2025-10-21T14:10:35.183354+00:00",
+         "updated_at": null, "user": "github|12564882", "username": "James Kent", "snapshot":
+         null, "neurostore_id": "TebrRstj8ofh", "studyset": "3EmvH2LELwR2", "url":
+         "https://neurostore.org/api/annotations/TebrRstj8ofh"}, "project": "D2cTfoxNfpLy",
+         "cached_studyset": "FA3BDBdGRZ5d", "cached_annotation": "XELVYV7ftp7e", "run_key":
+         "V_jTcP2zfNlWD4KhwKKcJw", "results": [], "neurostore_url": null}'
+     headers:
+       Connection:
+       - close
+       Content-Length:
+       - '1750'
+       Content-Type:
+       - application/json
+       Date:
+       - Tue, 21 Oct 2025 14:14:50 GMT
+       Server:
+       - nginx/1.21.6
+       Strict-Transport-Security:
+       - max-age=31536000
+       Vary:
+       - Accept-Encoding
+     status:
+       code: 200
+       message: OK
+ version: 1
{compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/compose_runner/tests/test_lambda_handlers.py

@@ -4,6 +4,8 @@ import json
  from datetime import datetime, timezone
  from typing import Any, Dict
 
+ import pytest
+
  from compose_runner.aws_lambda import log_poll_handler, results_handler, run_handler, status_handler
 
 
@@ -23,6 +25,28 @@ def _make_http_event(payload: Dict[str, Any]) -> Dict[str, Any]:
      }
 
 
+ def test_requires_large_task_detection():
+     spec = {"corrector": {"type": "FWECorrector", "args": {"method": "montecarlo"}}}
+     assert run_handler._requires_large_task(spec)
+
+
+ def test_requires_large_task_false_when_method_differs():
+     spec = {"corrector": {"type": "FWECorrector", "args": {"method": "bonferroni"}}}
+     assert run_handler._requires_large_task(spec) is False
+
+
+ @pytest.mark.vcr(record_mode="once")
+ def test_select_task_size_uses_large_for_montecarlo():
+     task_size = run_handler._select_task_size("ZPSvyvhZAopz", "staging", "artifact-test")
+     assert task_size == "large"
+
+
+ @pytest.mark.vcr(record_mode="once")
+ def test_select_task_size_uses_standard_for_fdr():
+     task_size = run_handler._select_task_size("VtFZJFniCKvG", "staging", "artifact-test")
+     assert task_size == "standard"
+
+
  def test_run_handler_http_success(monkeypatch, tmp_path):
      captured = {}
 
@@ -36,6 +60,7 @@ def test_run_handler_http_success(monkeypatch, tmp_path):
                  ...
 
      monkeypatch.setattr(run_handler, "_SFN_CLIENT", FakeSFN())
+     monkeypatch.setattr(run_handler, "_select_task_size", lambda *args: "standard")
      monkeypatch.setenv("STATE_MACHINE_ARN", "arn:aws:states:state-machine")
      monkeypatch.setenv("RESULTS_BUCKET", "bucket")
      monkeypatch.setenv("RESULTS_PREFIX", "prefix")
@@ -63,6 +88,32 @@ def test_run_handler_http_success(monkeypatch, tmp_path):
      assert input_doc["results"]["prefix"] == "prefix"
      assert input_doc["nsc_key"] == "nsc"
      assert input_doc["nv_key"] == "nv"
+     assert input_doc["task_size"] == "standard"
+
+
+ def test_run_handler_http_uses_large_task(monkeypatch):
+     captured = {}
+
+     class FakeSFN:
+         def start_execution(self, **kwargs):
+             captured.update(kwargs)
+             return {"executionArn": "arn:aws:states:us-east-1:123:execution:state-machine:run-456"}
+
+         class exceptions:
+             class ExecutionAlreadyExists(Exception):
+                 ...
+
+     monkeypatch.setattr(run_handler, "_SFN_CLIENT", FakeSFN())
+     monkeypatch.setattr(run_handler, "_select_task_size", lambda *args: "large")
+     monkeypatch.setenv("STATE_MACHINE_ARN", "arn:aws:states:state-machine")
+     monkeypatch.setenv("RESULTS_BUCKET", "bucket")
+     monkeypatch.setenv("RESULTS_PREFIX", "prefix")
+
+     event = _make_http_event({"meta_analysis_id": "abc123"})
+     response = run_handler.handler(event, DummyContext())
+     assert response["statusCode"] == 202
+     input_doc = json.loads(captured["input"])
+     assert input_doc["task_size"] == "large"
 
 
  def test_run_handler_missing_meta_analysis(monkeypatch):
{compose_runner-0.6.3rc1 → compose_runner-0.6.4rc1}/infra/cdk/stacks/compose_runner_stack.py

@@ -40,7 +40,12 @@ class ComposeRunnerStack(Stack):
          task_cpu = int(self.node.try_get_context("taskCpu") or 4096)
          task_memory_mib = int(self.node.try_get_context("taskMemoryMiB") or 30720)
          task_ephemeral_storage_gib = int(self.node.try_get_context("taskEphemeralStorageGiB") or 21)
-         state_machine_timeout_seconds = int(self.node.try_get_context("stateMachineTimeoutSeconds") or 7200)
+         task_cpu_large = int(self.node.try_get_context("taskCpuLarge") or 16384)
+         task_memory_large_mib = int(self.node.try_get_context("taskMemoryLargeMiB") or 65536)
+         state_machine_timeout_seconds = int(self.node.try_get_context("stateMachineTimeoutSeconds") or 32400)
+
+         if task_cpu_large >= 16384 and task_memory_large_mib < 32768:
+             raise ValueError("taskMemoryLargeMiB must be at least 32768 MiB for 16 vCPU tasks.")
 
          project_root = Path(__file__).resolve().parents[3]
          project_version = self.node.try_get_context("composeRunnerVersion")
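
Note: the new guard reflects a Fargate sizing constraint: 16 vCPU task definitions must request at least 32 GiB (32768 MiB) of memory. A standalone sketch of the check with the context defaults above (the function name is hypothetical):

    def validate_large_task_size(task_cpu_large: int = 16384, task_memory_large_mib: int = 65536) -> None:
        # Fargate's 16 vCPU tier starts at 32768 MiB, hence the floor enforced above.
        if task_cpu_large >= 16384 and task_memory_large_mib < 32768:
            raise ValueError("taskMemoryLargeMiB must be at least 32768 MiB for 16 vCPU tasks.")

    validate_large_task_size()                # defaults (16 vCPU / 64 GiB) pass
    # validate_large_task_size(16384, 16384)  # would raise ValueError
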
@@ -121,6 +126,20 @@
              ephemeral_storage_gib=task_ephemeral_storage_gib,
          )
 
+         task_definition_large = ecs.FargateTaskDefinition(
+             self,
+             "ComposeRunnerLargeTaskDefinition",
+             cpu=task_cpu_large,
+             memory_limit_mib=task_memory_large_mib,
+             ephemeral_storage_gib=task_ephemeral_storage_gib,
+         )
+
+         container_environment = {
+             "RESULTS_BUCKET": results_bucket.bucket_name,
+             "RESULTS_PREFIX": results_prefix,
+             "DELETE_TMP": "true",
+         }
+
          container = task_definition.add_container(
              "ComposeRunnerContainer",
              image=ecs.ContainerImage.from_docker_image_asset(fargate_asset),
@@ -129,16 +148,46 @@
                  log_group=task_log_group,
                  stream_prefix="compose-runner",
              ),
-             environment={
-                 "RESULTS_BUCKET": results_bucket.bucket_name,
-                 "RESULTS_PREFIX": results_prefix,
-                 "DELETE_TMP": "true",
-             },
+             environment=container_environment,
+         )
+
+         container_large = task_definition_large.add_container(
+             "ComposeRunnerLargeContainer",
+             image=ecs.ContainerImage.from_docker_image_asset(fargate_asset),
+             entry_point=["python", "-m", "compose_runner.ecs_task"],
+             logging=ecs.LogDriver.aws_logs(
+                 log_group=task_log_group,
+                 stream_prefix="compose-runner",
+             ),
+             environment=container_environment,
          )
 
          results_bucket.grant_read_write(task_definition.task_role)
+         results_bucket.grant_read_write(task_definition_large.task_role)
+
+         container_env_overrides = [
+             tasks.TaskEnvironmentVariable(
+                 name="ARTIFACT_PREFIX", value=sfn.JsonPath.string_at("$.artifact_prefix")
+             ),
+             tasks.TaskEnvironmentVariable(
+                 name="META_ANALYSIS_ID", value=sfn.JsonPath.string_at("$.meta_analysis_id")
+             ),
+             tasks.TaskEnvironmentVariable(
+                 name="ENVIRONMENT", value=sfn.JsonPath.string_at("$.environment")
+             ),
+             tasks.TaskEnvironmentVariable(name="NSC_KEY", value=sfn.JsonPath.string_at("$.nsc_key")),
+             tasks.TaskEnvironmentVariable(name="NV_KEY", value=sfn.JsonPath.string_at("$.nv_key")),
+             tasks.TaskEnvironmentVariable(name="NO_UPLOAD", value=sfn.JsonPath.string_at("$.no_upload")),
+             tasks.TaskEnvironmentVariable(name="N_CORES", value=sfn.JsonPath.string_at("$.n_cores")),
+             tasks.TaskEnvironmentVariable(
+                 name="RESULTS_BUCKET", value=sfn.JsonPath.string_at("$.results.bucket")
+             ),
+             tasks.TaskEnvironmentVariable(
+                 name="RESULTS_PREFIX", value=sfn.JsonPath.string_at("$.results.prefix")
+             ),
+         ]
 
-         run_task = tasks.EcsRunTask(
+         run_task_standard = tasks.EcsRunTask(
              self,
              "RunFargateJob",
              integration_pattern=sfn.IntegrationPattern.RUN_JOB,
@@ -153,41 +202,41 @@
              container_overrides=[
                  tasks.ContainerOverride(
                      container_definition=container,
-                     environment=[
-                         tasks.TaskEnvironmentVariable(
-                             name="ARTIFACT_PREFIX", value=sfn.JsonPath.string_at("$.artifact_prefix")
-                         ),
-                         tasks.TaskEnvironmentVariable(
-                             name="META_ANALYSIS_ID", value=sfn.JsonPath.string_at("$.meta_analysis_id")
-                         ),
-                         tasks.TaskEnvironmentVariable(
-                             name="ENVIRONMENT", value=sfn.JsonPath.string_at("$.environment")
-                         ),
-                         tasks.TaskEnvironmentVariable(
-                             name="NSC_KEY", value=sfn.JsonPath.string_at("$.nsc_key")
-                         ),
-                         tasks.TaskEnvironmentVariable(
-                             name="NV_KEY", value=sfn.JsonPath.string_at("$.nv_key")
-                         ),
-                         tasks.TaskEnvironmentVariable(
-                             name="NO_UPLOAD", value=sfn.JsonPath.string_at("$.no_upload")
-                         ),
-                         tasks.TaskEnvironmentVariable(
-                             name="N_CORES", value=sfn.JsonPath.string_at("$.n_cores")
-                         ),
-                         tasks.TaskEnvironmentVariable(
-                             name="RESULTS_BUCKET", value=sfn.JsonPath.string_at("$.results.bucket")
-                         ),
-                         tasks.TaskEnvironmentVariable(
-                             name="RESULTS_PREFIX", value=sfn.JsonPath.string_at("$.results.prefix")
-                         ),
-                     ],
+                     environment=container_env_overrides,
                  )
              ],
              result_path="$.ecs",
          )
 
-         run_task.add_retry(
+         run_task_large = tasks.EcsRunTask(
+             self,
+             "RunFargateJobLarge",
+             integration_pattern=sfn.IntegrationPattern.RUN_JOB,
+             cluster=cluster,
+             task_definition=task_definition_large,
+             launch_target=tasks.EcsFargateLaunchTarget(
+                 platform_version=ecs.FargatePlatformVersion.LATEST
+             ),
+             assign_public_ip=True,
+             security_groups=[task_security_group],
+             subnets=ec2.SubnetSelection(subnet_type=ec2.SubnetType.PUBLIC),
+             container_overrides=[
+                 tasks.ContainerOverride(
+                     container_definition=container_large,
+                     environment=container_env_overrides,
+                 )
+             ],
+             result_path="$.ecs",
+         )
+
+         run_task_standard.add_retry(
+             errors=["States.ALL"],
+             interval=Duration.seconds(30),
+             backoff_rate=2.0,
+             max_attempts=2,
+         )
+
+         run_task_large.add_retry(
              errors=["States.ALL"],
              interval=Duration.seconds(30),
              backoff_rate=2.0,
@@ -202,11 +251,20 @@
                  "meta_analysis_id.$": "$.meta_analysis_id",
                  "environment.$": "$.environment",
                  "results.$": "$.results",
+                 "task_size.$": "$.task_size",
                  "ecs.$": "$.ecs",
              },
          )
 
-         definition_chain = run_task.next(run_output)
+         definition_chain = sfn.Choice(
+             self,
+             "SelectFargateTask",
+         ).when(
+             sfn.Condition.string_equals("$.task_size", "large"),
+             run_task_large.next(run_output),
+         ).otherwise(
+             run_task_standard.next(run_output)
+         )
 
          state_machine = sfn.StateMachine(
              self,
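
Note: the Choice state keys off the `task_size` field the submit Lambda injected into the execution input. In plain terms, the routing amounts to this (a sketch of the decision, not the generated state-machine definition):

    def route(execution_input: dict) -> str:
        # Mirrors sfn.Condition.string_equals("$.task_size", "large"):
        # montecarlo FWE runs land on the 16 vCPU task, everything else on the default.
        if execution_input.get("task_size") == "large":
            return "RunFargateJobLarge"
        return "RunFargateJob"

    assert route({"task_size": "large"}) == "RunFargateJobLarge"
    assert route({"task_size": "standard"}) == "RunFargateJob"
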