PyPI - cg - Versions diffs - 76.0.0__py3-none-any.whl → 83.14.0__py3-none-any.whl - Mend

cg 76.0.0__py3-none-any.whl → 83.14.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (152)

cg/__init__.py +1 -1
cg/apps/housekeeper/hk.py +18 -1
cg/apps/tb/api.py +42 -5
cg/cli/transfer.py +13 -2
cg/cli/upload/mutacc.py +16 -3
cg/cli/upload/scout.py +2 -2
cg/cli/upload/utils.py +10 -1
cg/cli/workflow/balsamic/base.py +86 -172
cg/cli/workflow/balsamic/options.py +3 -48
cg/cli/workflow/balsamic/umi.py +210 -15
cg/cli/workflow/microsalt/base.py +4 -2
cg/cli/workflow/mip_dna/base.py +1 -1
cg/cli/workflow/nallo/base.py +73 -23
cg/cli/workflow/nf_analysis.py +5 -207
cg/cli/workflow/raredisease/base.py +41 -54
cg/cli/workflow/rnafusion/base.py +38 -8
cg/cli/workflow/taxprofiler/base.py +31 -18
cg/cli/workflow/tomte/base.py +83 -10
cg/constants/constants.py +25 -30
cg/constants/devices.py +6 -1
cg/constants/gene_panel.py +3 -1
cg/constants/housekeeper_tags.py +28 -28
cg/constants/lims.py +4 -0
cg/constants/nf_analysis.py +0 -1
cg/constants/observations.py +21 -5
cg/constants/orderforms.py +3 -3
cg/constants/pacbio.py +1 -0
cg/constants/priority.py +1 -1
cg/constants/report.py +1 -0
cg/constants/scout.py +12 -9
cg/constants/sequencing.py +2 -2
cg/constants/tb.py +5 -5
cg/exc.py +27 -5
cg/meta/compress/compress.py +7 -2
cg/meta/delivery_report/balsamic.py +3 -1
cg/meta/delivery_report/delivery_report_api.py +4 -3
cg/meta/delivery_report/nallo.py +11 -11
cg/meta/delivery_report/raredisease.py +7 -3
cg/meta/delivery_report/templates/macros/data_analysis/qc_metrics/balsamic_qc_metrics.html +1 -0
cg/meta/delivery_report/templates/macros/ticket_system.html +1 -1
cg/meta/observations/balsamic_observations_api.py +110 -14
cg/meta/observations/mip_dna_observations_api.py +1 -1
cg/meta/observations/nallo_observations_api.py +1 -1
cg/meta/observations/observations_api.py +23 -32
cg/meta/observations/raredisease_observations_api.py +1 -1
cg/meta/tar/tar.py +5 -2
cg/meta/transfer/lims.py +32 -3
cg/meta/upload/balsamic/balsamic.py +1 -8
cg/meta/upload/coverage.py +5 -5
cg/meta/upload/raredisease/raredisease.py +3 -0
cg/meta/upload/scout/hk_tags.py +1 -0
cg/meta/upload/scout/nallo_config_builder.py +31 -7
cg/meta/workflow/balsamic.py +70 -36
cg/meta/workflow/fastq.py +8 -0
cg/meta/workflow/microsalt/quality_controller/models.py +0 -2
cg/meta/workflow/microsalt/quality_controller/quality_controller.py +8 -16
cg/meta/workflow/microsalt/quality_controller/result_logger.py +3 -6
cg/meta/workflow/microsalt/quality_controller/utils.py +2 -45
cg/meta/workflow/nallo.py +21 -99
cg/meta/workflow/nf_analysis.py +12 -263
cg/meta/workflow/raredisease.py +3 -112
cg/meta/workflow/rnafusion.py +2 -34
cg/meta/workflow/taxprofiler.py +2 -38
cg/meta/workflow/tomte.py +2 -42
cg/models/balsamic/config.py +0 -24
cg/models/balsamic/metrics.py +5 -3
cg/models/cg_config.py +39 -16
cg/models/deliverables/metric_deliverables.py +1 -1
cg/models/delivery_report/metadata.py +2 -1
cg/models/nallo/nallo.py +14 -64
cg/models/nf_analysis.py +1 -41
cg/models/raredisease/raredisease.py +1 -63
cg/models/rnafusion/rnafusion.py +0 -26
cg/models/scout/scout_load_config.py +5 -2
cg/models/taxprofiler/taxprofiler.py +0 -42
cg/models/tomte/tomte.py +0 -69
cg/resources/nallo_bundle_filenames.yaml +292 -22
cg/resources/raredisease_bundle_filenames.yaml +11 -1
cg/resources/taxprofiler_bundle_filenames.yaml +20 -0
cg/server/admin.py +106 -25
cg/server/app.py +15 -4
cg/server/endpoints/sequencing_run/dtos.py +21 -3
cg/server/endpoints/sequencing_run/pacbio_sequencing_run.py +29 -10
cg/server/endpoints/sequencing_run/pacbio_smrt_cell_metrics.py +20 -0
cg/services/analysis_starter/{service.py → analysis_starter.py} +11 -9
cg/services/analysis_starter/configurator/abstract_model.py +8 -0
cg/services/analysis_starter/configurator/configurator.py +1 -1
cg/services/analysis_starter/configurator/extensions/nallo.py +27 -0
cg/services/analysis_starter/configurator/extensions/{abstract.py → pipeline_extension.py} +1 -1
cg/services/analysis_starter/configurator/extensions/raredisease.py +3 -1
cg/services/analysis_starter/configurator/extensions/tomte_extension.py +28 -0
cg/services/analysis_starter/configurator/file_creators/balsamic_config.py +240 -0
cg/services/analysis_starter/configurator/file_creators/gene_panel.py +10 -5
cg/services/analysis_starter/configurator/file_creators/nextflow/params_file/abstract.py +2 -1
cg/services/analysis_starter/configurator/file_creators/nextflow/params_file/models.py +40 -1
cg/services/analysis_starter/configurator/file_creators/nextflow/params_file/nallo.py +37 -0
cg/services/analysis_starter/configurator/file_creators/nextflow/params_file/raredisease.py +8 -5
cg/services/analysis_starter/configurator/file_creators/nextflow/params_file/tomte_params_file_creator.py +64 -0
cg/services/analysis_starter/configurator/file_creators/nextflow/sample_sheet/creator.py +1 -1
cg/services/analysis_starter/configurator/file_creators/nextflow/sample_sheet/nallo_sample_sheet_creator.py +65 -0
cg/services/analysis_starter/configurator/file_creators/nextflow/sample_sheet/protocol.py +12 -0
cg/services/analysis_starter/configurator/file_creators/nextflow/sample_sheet/{raredisease.py → raredisease_sample_sheet_creator.py} +2 -2
cg/services/analysis_starter/configurator/file_creators/nextflow/sample_sheet/{rnafusion.py → rnafusion_sample_sheet_creator.py} +2 -2
cg/services/analysis_starter/configurator/file_creators/nextflow/sample_sheet/{taxprofiler.py → taxprofiler_sample_sheet_creator.py} +2 -2
cg/services/analysis_starter/configurator/file_creators/nextflow/sample_sheet/tomte_sample_sheet_creator.py +36 -0
cg/services/analysis_starter/configurator/implementations/balsamic.py +68 -0
cg/services/analysis_starter/configurator/implementations/nextflow.py +22 -5
cg/services/analysis_starter/configurator/models/balsamic.py +152 -0
cg/services/analysis_starter/configurator/models/mip_dna.py +6 -8
cg/services/analysis_starter/configurator/models/nextflow.py +9 -0
cg/services/analysis_starter/constants.py +2 -0
cg/services/analysis_starter/factories/configurator_factory.py +131 -51
cg/services/analysis_starter/factories/starter_factory.py +36 -7
cg/services/analysis_starter/input_fetcher/implementations/bam_fetcher.py +57 -0
cg/services/analysis_starter/input_fetcher/implementations/fastq_fetcher.py +3 -3
cg/services/analysis_starter/submitters/seqera_platform/{client.py → seqera_platform_client.py} +19 -3
cg/services/analysis_starter/submitters/seqera_platform/seqera_platform_submitter.py +73 -0
cg/services/analysis_starter/submitters/submitter.py +1 -1
cg/services/analysis_starter/submitters/subprocess/submitter.py +2 -1
cg/services/analysis_starter/tracker/implementations/balsamic.py +22 -0
cg/services/analysis_starter/tracker/implementations/microsalt.py +4 -4
cg/services/analysis_starter/tracker/implementations/mip_dna.py +4 -1
cg/services/analysis_starter/tracker/implementations/{nextflow.py → nextflow_tracker.py} +6 -4
cg/services/analysis_starter/tracker/tracker.py +19 -15
cg/services/deliver_files/factory.py +1 -1
cg/services/delivery_message/messages/__init__.py +24 -14
cg/services/delivery_message/messages/{microsalt_mwr_message.py → microsalt_message.py} +1 -1
cg/services/delivery_message/utils.py +4 -40
cg/services/illumina/backup/backup_service.py +29 -7
cg/services/orders/validation/constants.py +3 -0
cg/services/orders/validation/index_sequences.py +558 -0
cg/services/orders/validation/order_types/microsalt/models/sample.py +2 -3
cg/services/run_devices/pacbio/data_storage_service/pacbio_store_service.py +39 -18
cg/services/run_devices/pacbio/data_transfer_service/data_transfer_service.py +8 -2
cg/services/run_devices/pacbio/data_transfer_service/dto.py +9 -3
cg/services/run_devices/pacbio/data_transfer_service/utils.py +14 -7
cg/services/run_devices/pacbio/metrics_parser/models.py +1 -0
cg/services/run_devices/pacbio/sequencing_runs_service.py +35 -7
cg/services/sequencing_qc_service/quality_checks/checks.py +18 -16
cg/services/sequencing_qc_service/quality_checks/utils.py +82 -18
cg/services/sequencing_qc_service/sequencing_qc_service.py +12 -10
cg/store/crud/create.py +73 -42
cg/store/crud/read.py +73 -7
cg/store/crud/update.py +14 -3
cg/store/models.py +98 -35
cg/store/store.py +8 -1
{cg-76.0.0.dist-info → cg-83.14.0.dist-info}/METADATA +1 -1
{cg-76.0.0.dist-info → cg-83.14.0.dist-info}/RECORD +150 -138
cg/services/analysis_starter/submitters/seqera_platform/submitter.py +0 -39
cg/services/delivery_message/messages/microsalt_mwx_message.py +0 -18
{cg-76.0.0.dist-info → cg-83.14.0.dist-info}/WHEEL +0 -0
{cg-76.0.0.dist-info → cg-83.14.0.dist-info}/entry_points.txt +0 -0

cg/meta/workflow/tomte.py CHANGED Viewed

@@ -4,20 +4,14 @@ import logging
 from pathlib import Path
 from cg.constants import Workflow
-from cg.constants.constants import GenomeVersion, Strandedness
+from cg.constants.constants import GenomeVersion
 from cg.constants.nf_analysis import TOMTE_METRIC_CONDITIONS
 from cg.meta.workflow.nf_analysis import NfAnalysisAPI
 from cg.models.analysis import NextflowAnalysis
 from cg.models.cg_config import CGConfig
 from cg.models.deliverables.metric_deliverables import MetricsBase
-from cg.models.tomte.tomte import (
-    TomteParameters,
-    TomteQCMetrics,
-    TomteSampleSheetEntry,
-    TomteSampleSheetHeaders,
-)
+from cg.models.tomte.tomte import TomteQCMetrics
 from cg.resources import TOMTE_BUNDLE_FILENAMES_PATH
-from cg.store.models import CaseSample
 LOG = logging.getLogger(__name__)
@@ -48,45 +42,11 @@ class TomteAnalysisAPI(NfAnalysisAPI):
         self.revision: str = config.tomte.revision
         self.nextflow_binary_path: str = config.tomte.binary_path
-    @property
-    def sample_sheet_headers(self) -> list[str]:
-        """Headers for sample sheet."""
-        return TomteSampleSheetHeaders.list()
-    @property
-    def is_gene_panel_required(self) -> bool:
-        """Return True if a gene panel is needs to be created using the information in StatusDB and exporting it from Scout."""
-        return True
     @staticmethod
     def get_bundle_filenames_path() -> Path:
         """Return path to bundle template."""
         return TOMTE_BUNDLE_FILENAMES_PATH
-    def get_sample_sheet_content_per_sample(self, case_sample: CaseSample) -> list[list[str]]:
-        """Collect and format information required to build a sample sheet for a single sample."""
-        fastq_forward_read_paths, fastq_reverse_read_paths = self.get_paired_read_paths(
-            sample=case_sample.sample
-        )
-        sample_sheet_entry = TomteSampleSheetEntry(
-            case_id=case_sample.case.internal_id,
-            name=case_sample.sample.internal_id,
-            fastq_forward_read_paths=fastq_forward_read_paths,
-            fastq_reverse_read_paths=fastq_reverse_read_paths,
-            strandedness=Strandedness.REVERSE,
-        )
-        return sample_sheet_entry.reformat_sample_content
-    def get_built_workflow_parameters(self, case_id: str, dry_run: bool = False) -> TomteParameters:
-        """Return parameters."""
-        return TomteParameters(
-            input=self.get_sample_sheet_path(case_id=case_id),
-            outdir=self.get_case_path(case_id=case_id),
-            gene_panel_clinical_filter=self.get_gene_panels_path(case_id=case_id),
-            tissue=self.get_case_source_type(case_id=case_id),
-            genome=self.get_genome_build(case_id=case_id),
-        )
     def get_genome_build(self, case_id: str) -> str:
         return GenomeVersion.HG38

cg/models/balsamic/config.py CHANGED Viewed

@@ -38,28 +38,6 @@ class BalsamicConfigSample(BaseModel):
     fastq_info: dict[str, dict[str, Path]]
-class BalsamicConfigReference(BaseModel):
-    """Metadata of reference files.
-    Attributes:
-        reference_genome: reference genome fasta file
-        reference_genome_version: reference genome build version
-    """
-    reference_genome: Path
-    reference_genome_version: str | None = Field(default=None, validate_default=True)
-    @field_validator("reference_genome_version")
-    @classmethod
-    def extract_genome_version_from_path(cls, _, info: ValidationInfo) -> str:
-        """
-        Return the genome version from the reference path:
-        /home/proj/stage/cancer/balsamic_cache/X.X.X/hg19/genome/human_g1k_v37.fasta
-        """
-        return str(info.data.get("reference_genome")).split("/")[-3]
 class BalsamicConfigPanel(BaseModel):
     """Balsamic attributes of a panel BED file.
@@ -134,13 +112,11 @@ class BalsamicConfigJSON(BaseModel):
     Attributes:
         analysis: config analysis attributes
         samples: sample attributes associated to a specific case
-        reference: BALSAMIC build reference
         panel: panel attributes (targeted analysis exclusively)
     """
     analysis: BalsamicConfigAnalysis
     samples: list[BalsamicConfigSample]
-    reference: BalsamicConfigReference
     panel: BalsamicConfigPanel | None = None
     QC: BalsamicConfigQC
     vcf: dict[str, BalsamicVarCaller]

cg/models/balsamic/metrics.py CHANGED Viewed

@@ -1,6 +1,8 @@
-from pydantic import field_validator
+from pydantic import AfterValidator, field_validator
+from typing_extensions import Annotated
 from cg.models.deliverables.metric_deliverables import MetricCondition, MetricsBase
+from cg.models.delivery_report.validators import get_sex_as_string
 from cg.models.qc_metrics import QCMetrics
@@ -25,7 +27,9 @@ class BalsamicQCMetrics(QCMetrics):
     fold_80_base_penalty: float | None = None
     mean_insert_size: float | None = None
+    median_target_coverage: float | None = None
     percent_duplication: float | None = None
+    compare_predicted_to_given_sex: Annotated[str | None, AfterValidator(get_sex_as_string)] = None
     _percent_duplication: float = field_validator("percent_duplication")(percent_value_validation)
@@ -34,7 +38,6 @@ class BalsamicTargetedQCMetrics(BalsamicQCMetrics):
     """BALSAMIC targeted QC metrics"""
     mean_target_coverage: float | None = None
-    median_target_coverage: float | None = None
     pct_target_bases_50x: float | None = None
     pct_target_bases_100x: float | None = None
     pct_target_bases_250x: float | None = None
@@ -56,7 +59,6 @@ class BalsamicTargetedQCMetrics(BalsamicQCMetrics):
 class BalsamicWGSQCMetrics(BalsamicQCMetrics):
     """BALSAMIC WHOLE_GENOME_SEQUENCING QC metrics"""
-    median_coverage: float | None = None
     pct_15x: float | None = None
     pct_30x: float | None = None
     pct_60x: float | None = None

cg/models/cg_config.py CHANGED Viewed

@@ -22,7 +22,7 @@ from cg.apps.tb import TrailblazerAPI
 from cg.clients.arnold.api import ArnoldAPIClient
 from cg.clients.chanjo2.client import Chanjo2APIClient
 from cg.clients.janus.api import JanusAPIClient
-from cg.constants.observations import LoqusdbInstance
+from cg.constants.observations import BalsamicObservationPanel, LoqusdbInstance
 from cg.constants.priority import SlurmQos
 from cg.meta.delivery.delivery import DeliveryAPI
 from cg.services.analysis_service.analysis_service import AnalysisService
@@ -178,23 +178,40 @@ class MutaccAutoConfig(CommonAppConfig):
     padding: int = 300
+class LoqusDBDumpFiles(BaseModel):
+    artefact_sv: Path  # WGS
+    artefact_snv: Path
+    cancer_germline_snv: Path
+    cancer_somatic_snv: Path
+    cancer_somatic_sv: Path
+    clinical_snv: Path
+    clinical_sv: Path
+    cancer_somatic_snv_panels: dict[BalsamicObservationPanel, Path]  # Panel
 class BalsamicConfig(CommonAppConfig):
-    balsamic_cache: str
-    bed_path: str
-    binary_path: str
-    cadd_path: str
-    conda_binary: str
+    balsamic_cache: Path
+    bed_path: Path
+    binary_path: Path
+    cadd_path: Path
+    conda_binary: Path
     conda_env: str
-    genome_interval_path: str
-    gens_coverage_female_path: str
-    gens_coverage_male_path: str
-    gnomad_af5_path: str
-    loqusdb_path: str
-    pon_path: str
-    root: str
-    sentieon_licence_path: str
+    genome_interval_path: Path
+    gens_coverage_female_path: Path
+    gens_coverage_male_path: Path
+    gnomad_af5_path: Path
+    head_job_partition: str
+    loqusdb_path: Path
+    loqusdb_dump_files: LoqusDBDumpFiles
+    panel_of_normals: dict[str, Path]  # For TGS and Exome
+    pon_path: Path
+    root: Path
+    sentieon_licence_path: Path
+    sentieon_licence_server: str
     slurm: SlurmConfig
-    swegen_path: str
+    swegen_path: Path
+    swegen_snv: Path
+    swegen_sv: Path
 class MutantConfig(BaseModel):
@@ -415,7 +432,6 @@ class CGConfig(BaseModel):
     max_flowcells: int | None = None
     nanopore_data_directory: str
     run_instruments: RunInstruments
-    sentieon_licence_server: str
     tower_binary_path: str
     # Base APIs that always should exist
@@ -458,6 +474,13 @@ class CGConfig(BaseModel):
     loqusdb_somatic: CommonAppConfig = Field(None, alias=LoqusdbInstance.SOMATIC.value)
     loqusdb_tumor: CommonAppConfig = Field(None, alias=LoqusdbInstance.TUMOR.value)
     loqusdb_wes: CommonAppConfig = Field(None, alias=LoqusdbInstance.WES.value)
+    loqusdb_somatic_lymphoid: CommonAppConfig = Field(
+        None, alias=LoqusdbInstance.SOMATIC_LYMPHOID.value
+    )
+    loqusdb_somatic_myeloid: CommonAppConfig = Field(
+        None, alias=LoqusdbInstance.SOMATIC_MYELOID.value
+    )
+    loqusdb_somatic_exome: CommonAppConfig = Field(None, alias=LoqusdbInstance.SOMATIC_EXOME.value)
     madeline_api_: MadelineAPI = None
     mutacc_auto: MutaccAutoConfig = Field(None, alias="mutacc-auto")
     mutacc_auto_api_: MutaccAutoAPI = None

cg/models/deliverables/metric_deliverables.py CHANGED Viewed

@@ -164,6 +164,6 @@ class MetricsDeliverablesCondition(BaseModel):
 class MultiqcDataJson(BaseModel):
     """Multiqc data json model."""
-    report_general_stats_data: list[dict] | None = None
+    report_general_stats_data: list[dict[str, Any]] | None = None
     report_data_sources: dict | None = None
     report_saved_raw_data: dict[str, dict] | None = None

cg/models/delivery_report/metadata.py CHANGED Viewed

@@ -92,6 +92,7 @@ class BalsamicSampleMetadataModel(SampleMetadataModel):
     mean_insert_size: Annotated[str, BeforeValidator(get_number_as_string)] = NA_FIELD
     fold_80: Annotated[str, BeforeValidator(get_number_as_string)] = NA_FIELD
+    predicted_sex: str = NA_FIELD
 class BalsamicTargetedSampleMetadataModel(BalsamicSampleMetadataModel):
@@ -166,7 +167,7 @@ class WTSSampleMetadataModel(SequencingSampleMetadataModel):
     pct_surviving: Annotated[str, BeforeValidator(get_number_as_string)] = NA_FIELD
     q20_rate: Annotated[str, BeforeValidator(get_float_as_percentage)] = NA_FIELD
     q30_rate: Annotated[str, BeforeValidator(get_float_as_percentage)] = NA_FIELD
-    ribosomal_bases: Annotated[str, BeforeValidator(get_float_as_percentage)] = NA_FIELD
+    ribosomal_bases: Annotated[str, BeforeValidator(get_number_as_string)] = NA_FIELD
     rin: Annotated[str, BeforeValidator(get_number_as_string)] = NA_FIELD
     uniquely_mapped_reads: Annotated[str, BeforeValidator(get_number_as_string)] = NA_FIELD

cg/models/nallo/nallo.py CHANGED Viewed

@@ -1,14 +1,22 @@
-from enum import StrEnum
-from pathlib import Path
+from typing import Annotated
-from pydantic import BaseModel, field_validator
+from pydantic import BeforeValidator, Field
 from cg.constants import SexOptions
-from cg.exc import NfSampleSheetError
-from cg.models.nf_analysis import WorkflowParameters
 from cg.models.qc_metrics import QCMetrics
+def convert_sex(plink_sex: float) -> SexOptions:
+    if plink_sex == 2:
+        return SexOptions.FEMALE
+    elif plink_sex == 1:
+        return SexOptions.MALE
+    elif plink_sex == 0:
+        return SexOptions.UNKNOWN
+    else:
+        raise NotImplementedError
 class NalloQCMetrics(QCMetrics):
     """Nallo QC metrics."""
@@ -16,62 +24,4 @@ class NalloQCMetrics(QCMetrics):
     coverage_bases: float | None
     median_coverage: float | None
     percent_duplicates: float | None
-    predicted_sex_sex_check: SexOptions
-class NalloSampleSheetEntry(BaseModel):
-    """Nallo sample model is used when building the sample sheet."""
-    project: str
-    sample: str
-    read_file: Path
-    family_id: str
-    paternal_id: str
-    maternal_id: str
-    sex: int
-    phenotype: int
-    @property
-    def reformat_sample_content(self) -> list[list[str]]:
-        """Reformat sample sheet content as a list of lists, where each list represents a line in the final file."""
-        return [
-            [
-                self.project,
-                self.sample,
-                self.read_file,
-                self.family_id,
-                self.paternal_id,
-                self.maternal_id,
-                self.sex,
-                self.phenotype,
-            ]
-        ]
-    @field_validator("read_file")
-    @classmethod
-    def read_file_exists(cls, bam_path: Path) -> Path:
-        """Verify that bam files exist."""
-        if not bam_path.is_file():
-            raise NfSampleSheetError(f"Bam file does not exist: {str(bam_path)}")
-        return bam_path
-class NalloSampleSheetHeaders(StrEnum):
-    project: str = "project"
-    sample: str = "sample"
-    file: str = "file"
-    family_id: str = "family_id"
-    paternal_id: str = "paternal_id"
-    maternal_id: str = "maternal_id"
-    sex: str = "sex"
-    phenotype: str = "phenotype"
-    @classmethod
-    def list(cls) -> list[str]:
-        return list(map(lambda header: header.value, cls))
-class NalloParameters(WorkflowParameters):
-    """Model for Nallo parameters."""
-    filter_variants_hgnc_ids: str
+    predicted_sex: Annotated[SexOptions, BeforeValidator(convert_sex)] = Field(alias="somalier_sex")

cg/models/nf_analysis.py CHANGED Viewed

@@ -1,13 +1,6 @@
 from pathlib import Path
-from pydantic import BaseModel, ValidationInfo, conlist, field_validator
-from cg.exc import NfSampleSheetError
-class WorkflowParameters(BaseModel):
-    input: Path
-    outdir: Path
+from pydantic import BaseModel, field_validator
 class NfCommandArgs(BaseModel):
@@ -29,39 +22,6 @@ class NfCommandArgs(BaseModel):
     params_file: str | Path | None = None
-class NextflowSampleSheetEntry(BaseModel):
-    """Nextflow sample sheet model.
-    Attributes:
-        name: sample name, or case id
-        fastq_forward_read_paths: list of all fastq read1 file paths corresponding to sample
-        fastq_reverse_read_paths: list of all fastq read2 file paths corresponding to sample
-    """
-    name: str
-    fastq_forward_read_paths: conlist(Path, min_length=1)
-    fastq_reverse_read_paths: conlist(Path, min_length=1)
-    @field_validator("fastq_reverse_read_paths")
-    @classmethod
-    def validate_complete_fastq_file_pairs(
-        cls, fastq_reverse: list[str], info: ValidationInfo
-    ) -> list[str]:
-        """Verify that the number of fastq forward files is the same as for the reverse."""
-        if len(fastq_reverse) != len(info.data.get("fastq_forward_read_paths")):
-            raise NfSampleSheetError("Fastq file length for forward and reverse do not match")
-        return fastq_reverse
-    @field_validator("fastq_forward_read_paths", "fastq_reverse_read_paths")
-    @classmethod
-    def fastq_files_exist(cls, fastq_paths: list[str]) -> list[str]:
-        """Verify that fastq files exist."""
-        for fastq_path in fastq_paths:
-            if not fastq_path.is_file():
-                raise NfSampleSheetError(f"Fastq file does not exist: {str(fastq_path)}")
-        return fastq_paths
 class FileDeliverable(BaseModel):
     """Specification for a general deliverables file."""

cg/models/raredisease/raredisease.py CHANGED Viewed

@@ -1,8 +1,4 @@
-from enum import StrEnum
-from pathlib import Path
 from cg.constants.constants import SexOptions
-from cg.models.nf_analysis import NextflowSampleSheetEntry, WorkflowParameters
 from cg.models.qc_metrics import QCMetrics
@@ -10,64 +6,6 @@ class RarediseaseQCMetrics(QCMetrics):
     """Raredisease QC metrics."""
     mapped_reads: int
-    percent_duplicates: float
+    percent_duplication: float
     predicted_sex_sex_check: SexOptions
     total_reads: int
-class RarediseaseSampleSheetEntry(NextflowSampleSheetEntry):
-    """Raredisease sample model is used when building the sample sheet."""
-    sex: str
-    phenotype: int
-    sex: int
-    paternal_id: str
-    maternal_id: str
-    case_id: str
-    @property
-    def reformat_sample_content(self) -> list[list[str]]:
-        """Reformat sample sheet content as a list of lists, where each list represents a line in the final file."""
-        return [
-            [
-                self.name,
-                lane + 1,
-                self.fastq_forward_read_paths,
-                self.fastq_reverse_read_paths,
-                self.sex,
-                self.phenotype,
-                self.paternal_id,
-                self.maternal_id,
-                self.case_id,
-            ]
-            for lane, (self.fastq_forward_read_paths, self.fastq_reverse_read_paths) in enumerate(
-                zip(self.fastq_forward_read_paths, self.fastq_reverse_read_paths)
-            )
-        ]
-class RarediseaseSampleSheetHeaders(StrEnum):
-    sample: str = "sample"
-    lane: str = "lane"
-    fastq_1: str = "fastq_1"
-    fastq_2: str = "fastq_2"
-    sex: str = "sex"
-    phenotype: str = "phenotype"
-    paternal_id: str = "paternal_id"
-    maternal_id: str = "maternal_id"
-    case_id: str = "case_id"
-    @classmethod
-    def list(cls) -> list[str]:
-        return list(map(lambda header: header.value, cls))
-class RarediseaseParameters(WorkflowParameters):
-    """Model for Raredisease parameters."""
-    target_bed_file: str
-    analysis_type: str
-    save_mapped_as_cram: bool
-    vcfanno_extra_resources: str
-    vep_filters_scout_fmt: str
-    sample_id_map: Path

cg/models/rnafusion/rnafusion.py CHANGED Viewed

@@ -1,5 +1,3 @@
-from cg.constants.constants import Strandedness
-from cg.models.nf_analysis import NextflowSampleSheetEntry, WorkflowParameters
 from cg.models.qc_metrics import QCMetrics
@@ -19,27 +17,3 @@ class RnafusionQCMetrics(QCMetrics):
     pct_duplication: float
     read_pairs_examined: float
     uniquely_mapped_percent: float
-class RnafusionParameters(WorkflowParameters):
-    """Rnafusion parameters."""
-class RnafusionSampleSheetEntry(NextflowSampleSheetEntry):
-    """Rnafusion sample sheet model."""
-    strandedness: Strandedness
-    @staticmethod
-    def headers() -> list[str]:
-        """Return sample sheet headers."""
-        return ["sample", "fastq_1", "fastq_2", "strandedness"]
-    def reformat_sample_content(self) -> list[list[str]]:
-        """Reformat sample sheet content as a list of list, where each list represents a line in the final file."""
-        return [
-            [self.name, fastq_forward_read_path, fastq_reverse_read_path, str(self.strandedness)]
-            for fastq_forward_read_path, fastq_reverse_read_path in zip(
-                self.fastq_forward_read_paths, self.fastq_reverse_read_paths
-            )
-        ]

cg/models/scout/scout_load_config.py CHANGED Viewed

@@ -84,12 +84,15 @@ class ScoutMipIndividual(ScoutIndividual):
 class ScoutNalloIndividual(ScoutIndividual):
+    assembly_alignment_path: str | None = None
+    chromograph_images: ChromographImages = ChromographImages()
     d4_file: str | None = None
+    minor_allele_frequency_wig: str | None = None
+    mt_bam: str | None = None
     paraphase_alignment_path: str | None = None
+    phase_blocks: str | None = None
     reviewer: Reviewer = Reviewer()
     tiddit_coverage_wig: str | None = None
-    minor_allele_frequency_wig: str | None = None
-    assembly_alignment_path: str | None = None
 class ScoutRarediseaseIndividual(ScoutIndividual):

cg/models/taxprofiler/taxprofiler.py CHANGED Viewed

@@ -1,5 +1,3 @@
-from cg.constants.sequencing import SequencingPlatform
-from cg.models.nf_analysis import NextflowSampleSheetEntry, WorkflowParameters
 from cg.models.qc_metrics import QCMetrics
@@ -14,43 +12,3 @@ class TaxprofilerQCMetrics(QCMetrics):
     pct_duplication: float
     raw_total_sequences: float
     reads_mapped: float
-class TaxprofilerParameters(WorkflowParameters):
-    """Taxprofiler parameters."""
-class TaxprofilerSampleSheetEntry(NextflowSampleSheetEntry):
-    """Taxprofiler sample model is used when building the sample sheet."""
-    instrument_platform: SequencingPlatform
-    fasta: str
-    @staticmethod
-    def headers() -> list[str]:
-        """Return sample sheet headers."""
-        return [
-            "sample",
-            "run_accession",
-            "instrument_platform",
-            "fastq_1",
-            "fastq_2",
-            "fasta",
-        ]
-    def reformat_sample_content(self) -> list[list[str]]:
-        """Reformat sample sheet content as a list of list, where each list represents a line in the final file."""
-        reformatted_content = []
-        for run_accession, (forward_path, reverse_path) in enumerate(
-            zip(self.fastq_forward_read_paths, self.fastq_reverse_read_paths), 1
-        ):
-            line = [
-                self.name,
-                run_accession,
-                self.instrument_platform,
-                forward_path,
-                reverse_path,
-                self.fasta,
-            ]
-            reformatted_content.append(line)
-        return reformatted_content

cg/models/tomte/tomte.py CHANGED Viewed

@@ -1,73 +1,4 @@
-from enum import StrEnum
-from pathlib import Path
-from pydantic import field_validator
-from cg.constants.constants import GenomeVersion, Strandedness
-from cg.constants.sample_sources import SourceType
-from cg.models.nf_analysis import NextflowSampleSheetEntry, WorkflowParameters
 from cg.models.qc_metrics import QCMetrics
-from cg.utils.utils import replace_non_alphanumeric
-class TomteSampleSheetEntry(NextflowSampleSheetEntry):
-    """Tomte sample model is used when building the sample sheet."""
-    case_id: str
-    strandedness: Strandedness
-    @property
-    def reformat_sample_content(self) -> list[list[str]]:
-        """Reformat sample sheet content as a list of lists, where
-        each list represents a line in the final file."""
-        return [
-            [
-                self.case_id,
-                self.name,
-                fastq_forward_read_path,
-                fastq_reverse_read_path,
-                str(self.strandedness),
-            ]
-            for fastq_forward_read_path, fastq_reverse_read_path in zip(
-                self.fastq_forward_read_paths, self.fastq_reverse_read_paths
-            )
-        ]
-class TomteSampleSheetHeaders(StrEnum):
-    case_id: str = "case"
-    name: str = "sample"
-    fastq_1: str = "fastq_1"
-    fastq_2: str = "fastq_2"
-    strandedness: str = "strandedness"
-    @classmethod
-    def list(cls) -> list[str]:
-        return list(map(lambda header: header.value, cls))
-class TomteParameters(WorkflowParameters):
-    """Model for Tomte parameters."""
-    gene_panel_clinical_filter: Path
-    tissue: str
-    genome: str = GenomeVersion.HG38
-    @field_validator("tissue", mode="before")
-    @classmethod
-    def restrict_tissue_values(cls, tissue: str | None) -> str:
-        if tissue:
-            return replace_non_alphanumeric(string=tissue)
-        else:
-            return SourceType.UNKNOWN
-    @field_validator("genome", mode="before")
-    @classmethod
-    def restrict_genome_values(cls, genome: str) -> str:
-        if genome == GenomeVersion.HG38:
-            return GenomeVersion.GRCh38.value
-        elif genome == GenomeVersion.HG19:
-            return GenomeVersion.GRCh37.value
 class TomteQCMetrics(QCMetrics):

cg 76.0.0__py3-none-any.whl → 83.14.0__py3-none-any.whl

cg 76.0.0__py3-none-any.whl → 83.14.0__py3-none-any.whl