Clinical-Genomics
diff --git a/‎.bumpversion.cfg
+1-1 b/‎.bumpversion.cfg
+1-1
diff --git a/‎.github/workflows/bumpversion.yml
+1-1 b/‎.github/workflows/bumpversion.yml
+1-1
diff --git a/‎alembic/versions/2025_04_28_039dbdf8af01_add_raredisease_ordertype.py
+83 b/‎alembic/versions/2025_04_28_039dbdf8af01_add_raredisease_ordertype.py
+83
diff --git a/‎cg/__init__.py
+1-1 b/‎cg/__init__.py
+1-1
diff --git a/‎cg/constants/constants.py
+16-16 b/‎cg/constants/constants.py
+16-16
diff --git a/‎cg/constants/priority.py
+5-5 b/‎cg/constants/priority.py
+5-5
diff --git a/‎cg/constants/scout.py
+1-1 b/‎cg/constants/scout.py
+1-1
diff --git a/‎cg/meta/orders/utils.py
+61-2 b/‎cg/meta/orders/utils.py
+61-2
diff --git a/‎cg/meta/workflow/nf_analysis.py
+7-1 b/‎cg/meta/workflow/nf_analysis.py
+7-1
diff --git a/‎cg/meta/workflow/raredisease.py
+6-24 b/‎cg/meta/workflow/raredisease.py
+6-24
diff --git a/‎cg/models/orders/constants.py
+15-14 b/‎cg/models/orders/constants.py
+15-14
diff --git a/‎cg/models/raredisease/raredisease.py
-1 b/‎cg/models/raredisease/raredisease.py
-1
@@ -1,5 +1,5 @@
 [bumpversion]
-current_version = 69.5.3
+current_version = 69.8.1
 commit = True
 tag = True
 tag_name = v{new_version}
 
@@ -10,7 +10,7 @@ jobs:
     name: Bump version and push tags to master
     steps:
       - name: Bump version
-        uses: Clinical-Genomics/bump2version-ci@v3
+        uses: Clinical-Genomics/bump2version-ci@2.0.3
         env:
           BUMPVERSION_TOKEN: ${{ secrets.BUMPVERSION_TOKEN }}
           BUMPVERSION_AUTHOR: ${{ secrets.BUMPVERSION_AUTHOR }}
 
@@ -0,0 +1,83 @@
+"""add Raredisease ordertype
+
+Revision ID: 039dbdf8af01
+Revises: 6362cfd4c61f
+Create Date: 2025-04-25 13:57:47.960893
+
+"""
+
+import sqlalchemy as sa
+from sqlalchemy.orm import declarative_base
+
+from alembic import op
+
+# revision identifiers, used by Alembic.
+# `revision` and `down_revision` repeat the "Revision ID" and "Revises" values
+# from the module docstring above.
+revision = "039dbdf8af01"
+down_revision = "6362cfd4c61f"
+branch_labels = None
+depends_on = None
+
+# Declarative base local to this migration file; the only model registered on
+# it here is the minimal OrderTypeApplication mapping that downgrade() queries.
+Base = declarative_base()
+
+
+# Enum values of order_type before this migration; passed as `existing_type`
+# in upgrade() and as the target type in downgrade(). The list is kept in its
+# declared order (PACBIO_LONG_READ precedes NALLO), it is not alphabetical.
+old_order_types = [
+    "BALSAMIC",
+    "BALSAMIC_UMI",
+    "FASTQ",
+    "FLUFFY",
+    "METAGENOME",
+    "MICROBIAL_FASTQ",
+    "MICROSALT",
+    "MIP_DNA",
+    "MIP_RNA",
+    "PACBIO_LONG_READ",
+    "NALLO",
+    "RML",
+    "RNAFUSION",
+    "SARS_COV_2",
+    "TAXPROFILER",
+    "TOMTE",
+]
+
+# The same values plus RAREDISEASE, as a new alphabetically sorted list.
+new_order_types = sorted([*old_order_types, "RAREDISEASE"])
+
+
+class OrderTypeApplication(Base):
+    """Maps an order type to its allowed applications.
+
+    Minimal mapping for this migration: only the order_type column is declared,
+    typed with the post-upgrade enum so that RAREDISEASE rows can be selected
+    in downgrade().
+    """
+
+    __tablename__ = "order_type_application"
+    # NOTE(review): order_type is the only key column declared here. If the real
+    # table has further key columns, the ORM would treat every row sharing an
+    # order type as the same identity - confirm against the application model.
+    order_type = sa.Column(sa.Enum(*new_order_types), primary_key=True)
+
+
+def upgrade():
+    """Change order_type_application.order_type to the enum that includes RAREDISEASE."""
+    enum_before = sa.Enum(*old_order_types)
+    enum_after = sa.Enum(*new_order_types)
+
+    op.alter_column(
+        table_name="order_type_application",
+        column_name="order_type",
+        existing_type=enum_before,
+        type_=enum_after,
+        nullable=False,
+    )
+
+
+def downgrade():
+    """Delete RAREDISEASE rows, then change order_type back to the old enum.
+
+    The rows are removed first because the old enum has no RAREDISEASE value.
+    """
+    bind = op.get_bind()
+
+    # Remove incompatible entries with a single bulk DELETE instead of loading
+    # every row and deleting it through the ORM. The context manager closes the
+    # session even if the statement fails.
+    with sa.orm.Session(bind=bind) as session:
+        session.query(OrderTypeApplication).filter(
+            OrderTypeApplication.order_type == "RAREDISEASE"
+        ).delete(synchronize_session=False)
+        session.commit()
+
+    # Modify the column type back to the old enum
+    op.alter_column(
+        table_name="order_type_application",
+        column_name="order_type",
+        existing_type=sa.Enum(*new_order_types),
+        type_=sa.Enum(*old_order_types),
+        nullable=False,
+    )
@@ -1,2 +1,2 @@
 __title__ = "cg"
-__version__ = "69.5.3"
+__version__ = "69.8.1"
@@ -165,22 +165,22 @@ class SampleType(StrEnum):
 
 
 class DataDelivery(StrEnum):
-    ANALYSIS_FILES: str = "analysis"
-    ANALYSIS_SCOUT: str = "analysis-scout"
-    BAM: str = "bam"
-    FASTQ: str = "fastq"
-    FASTQ_SCOUT: str = "fastq-scout"
-    FASTQ_QC: str = "fastq_qc"
-    FASTQ_ANALYSIS: str = "fastq-analysis"
-    FASTQ_QC_ANALYSIS: str = "fastq_qc-analysis"
-    FASTQ_ANALYSIS_SCOUT: str = "fastq-analysis-scout"
-    NIPT_VIEWER: str = "nipt-viewer"
-    NO_DELIVERY: str = "no-delivery"
-    RAW_DATA_ANALYSIS: str = "raw_data-analysis"
-    RAW_DATA_ANALYSIS_SCOUT: str = "raw_data-analysis-scout"
-    RAW_DATA_SCOUT: str = "raw_data-scout"
-    SCOUT: str = "scout"
-    STATINA: str = "statina"
+    ANALYSIS_FILES = "analysis"
+    ANALYSIS_SCOUT = "analysis-scout"
+    BAM = "bam"
+    FASTQ = "fastq"
+    FASTQ_SCOUT = "fastq-scout"
+    FASTQ_QC = "fastq_qc"
+    FASTQ_ANALYSIS = "fastq-analysis"
+    FASTQ_QC_ANALYSIS = "fastq_qc-analysis"
+    FASTQ_ANALYSIS_SCOUT = "fastq-analysis-scout"
+    NIPT_VIEWER = "nipt-viewer"
+    NO_DELIVERY = "no-delivery"
+    RAW_DATA_ANALYSIS = "raw_data-analysis"
+    RAW_DATA_ANALYSIS_SCOUT = "raw_data-analysis-scout"
+    RAW_DATA_SCOUT = "raw_data-scout"
+    SCOUT = "scout"
+    STATINA = "statina"
 
 
 class HastaSlurmPartitions(StrEnum):
 
@@ -27,11 +27,11 @@ class PriorityTerms(StrEnum):
 
 
 class Priority(IntEnum):
-    research: int = 0
-    standard: int = 1
-    clinical_trials: int = 2
-    priority: int = 3
-    express: int = 4
+    research = 0
+    standard = 1
+    clinical_trials = 2
+    priority = 3
+    express = 4
 
     @classmethod
     def priority_to_slurm_qos(cls) -> dict[int, str]:
 
@@ -139,7 +139,7 @@ class ScoutUploadKey(StrEnum):
 NALLO_SAMPLE_TAGS: dict[str, set[str]] = dict(
     alignment_path={AlignmentFileTag.BAM, "haplotags"},
     assembly_alignment_path={AlignmentFileTag.BAM, "assembly"},
-    d4_file={"mosdepth_d4"},
+    d4_file={"coverage", "d4"},
     hificnv_coverage={"hificnv", "bigwig"},
     paraphase_alignment_path={AlignmentFileTag.BAM, NalloAnalysisTag.PARAPHASE},
     minor_allele_frequency_wig={"hificnv", "bigwig", "maf"},
 
@@ -4,10 +4,15 @@
 from cg.constants.priority import Priority
 from cg.models.orders.constants import OrderType
 from cg.services.orders.constants import ORDER_TYPE_WORKFLOW_MAP
+from cg.services.orders.validation.models.existing_sample import ExistingSample
 from cg.services.orders.validation.models.order import Order
 from cg.services.orders.validation.models.order_with_cases import OrderWithCases
+from cg.services.orders.validation.models.order_with_samples import OrderWithSamples
+from cg.services.orders.validation.models.sample import Sample as ValidationSample
+from cg.store.models import Application, Sample
+from cg.store.store import Store
 
-DUE_TIME_BY_PRIORITY: dict[Priority, timedelta.days] = {
+DUE_TIME_BY_PRIORITY: dict[Priority, timedelta] = {
     Priority.express: timedelta(days=7),
     Priority.priority: timedelta(days=14),
     Priority.standard: timedelta(days=21),
@@ -21,7 +26,23 @@ def contains_existing_data(order: OrderWithCases) -> bool:
     return any(not case.is_new or case.enumerated_existing_samples for case in order.cases)
 
 
-def get_ticket_tags(order: Order, order_type: OrderType) -> list[str]:
+def contains_external_data(order: Order, status_db: Store) -> bool:
+    """Check if any existing or new sample from the given order is external.
+
+    Existing samples are judged by their own `is_external` attribute. New
+    samples are judged by the `is_external` attribute of the application that
+    `status_db` returns for the sample's application tag; a new sample whose
+    application is not found does not count as external.
+    """
+    existing_samples: list[Sample] = get_existing_samples(order=order, status_db=status_db)
+    new_samples: list[ValidationSample] = get_new_samples(order=order)
+
+    # Generator rather than a list, so any() stops at the first external sample.
+    if any(sample.is_external for sample in existing_samples):
+        return True
+
+    for sample in new_samples:
+        application: Application | None = status_db.get_application_by_tag(sample.application)
+        if application and application.is_external:
+            return True
+
+    return False
+
+
+def get_ticket_tags(order: Order, order_type: OrderType, status_db: Store) -> list[str]:
     """Generate ticket tags based on the order and order type"""
 
     tags: list[str] = [ORDER_TYPE_WORKFLOW_MAP[order_type]]
@@ -30,6 +51,9 @@ def get_ticket_tags(order: Order, order_type: OrderType) -> list[str]:
         if contains_existing_data(order):
             tags.append("existing-data")
 
+    if contains_external_data(order=order, status_db=status_db):
+        tags.append("external-data")
+
     return tags
 
 
@@ -54,3 +78,38 @@ def get_due_by_date(priority: Priority) -> date:
     """Get the ticket due by date based on the order priority."""
     due_by: datetime = datetime.now() + DUE_TIME_BY_PRIORITY[priority]
     return due_by.date()
+
+
+def get_existing_samples(order: Order, status_db: Store) -> list[Sample]:
+    """Return the already-stored samples referenced by the given order.
+
+    For an OrderWithCases this is every sample of each existing case, followed
+    by each existing sample listed in a new case that `status_db` can find by
+    internal id. Any other order yields an empty list.
+    """
+    if not isinstance(order, OrderWithCases):
+        return []
+
+    found_samples: list[Sample] = []
+
+    for _, existing_case in order.enumerated_existing_cases:
+        found_samples.extend(status_db.get_samples_by_case_id(existing_case.internal_id))
+
+    for _, new_case in order.enumerated_new_cases:
+        for _, sample_reference in new_case.enumerated_existing_samples:
+            stored_sample = status_db.get_sample_by_internal_id(sample_reference.internal_id)
+            # Skip references that do not resolve to a stored sample.
+            if stored_sample:
+                found_samples.append(stored_sample)
+
+    return found_samples
+
+
+def get_new_samples(order: Order) -> list[ValidationSample]:
+    """Return the new samples of the given order as a fresh list.
+
+    An OrderWithCases contributes the samples from `enumerated_new_samples`,
+    an OrderWithSamples contributes `order.samples`, and any other order
+    yields an empty list.
+    """
+    if isinstance(order, OrderWithCases):
+        return [new_sample for (_, _, new_sample) in order.enumerated_new_samples]
+
+    if isinstance(order, OrderWithSamples):
+        return list(order.samples)
+
+    return []
@@ -352,9 +352,15 @@ def create_params_file(self, case_id: str, dry_run: bool) -> None:
         ).model_dump()
         LOG.debug("Adding parameters from the pipeline config file if it exist")
 
-        workflow_parameters: dict = built_workflow_parameters | (
+        yaml_params: dict = (
             read_yaml(self.params) if hasattr(self, "params") and self.params else {}
         )
+
+        # Check for duplicate keys
+        duplicate_keys = set(built_workflow_parameters.keys()) & set(yaml_params.keys())
+        if duplicate_keys:
+            raise ValueError(f"Duplicate parameter keys found: {duplicate_keys}")
+        workflow_parameters: dict = built_workflow_parameters | (yaml_params)
         replaced_workflow_parameters: dict = self.replace_values_in_params_file(
             workflow_parameters=workflow_parameters
         )
 
@@ -13,15 +13,15 @@
     CoveragePostResponse,
     CoverageSample,
 )
-from cg.constants import DEFAULT_CAPTURE_KIT, Workflow
+from cg.constants import Workflow
 from cg.constants.constants import GenomeVersion
 from cg.constants.nf_analysis import (
     RAREDISEASE_COVERAGE_FILE_TAGS,
     RAREDISEASE_COVERAGE_INTERVAL_TYPE,
     RAREDISEASE_COVERAGE_THRESHOLD,
-    RAREDISEASE_PARENT_PEDDY_METRIC_CONDITION,
-    RAREDISEASE_METRIC_CONDITIONS_WGS,
     RAREDISEASE_METRIC_CONDITIONS_WES,
+    RAREDISEASE_METRIC_CONDITIONS_WGS,
+    RAREDISEASE_PARENT_PEDDY_METRIC_CONDITION,
 )
 from cg.constants.scout import RAREDISEASE_CASE_TAGS, ScoutExportFileName
 from cg.constants.sequencing import SeqLibraryPrepCategory
@@ -33,9 +33,9 @@
 from cg.models.deliverables.metric_deliverables import MetricsBase, MultiqcDataJson
 from cg.models.raredisease.raredisease import (
     RarediseaseParameters,
+    RarediseaseQCMetrics,
     RarediseaseSampleSheetEntry,
     RarediseaseSampleSheetHeaders,
-    RarediseaseQCMetrics,
 )
 from cg.resources import RAREDISEASE_BUNDLE_FILENAMES_PATH
 from cg.store.models import CaseSample, Sample
@@ -94,30 +94,13 @@ def get_sample_sheet_content_per_sample(self, case_sample: CaseSample) -> list[l
 
     @property
     def is_gene_panel_required(self) -> bool:
-        """Return True if a gene panel is needs to be created using the information in StatusDB and exporting it from Scout."""
+        """Return True if a gene panel needs to be created using the information in StatusDB and exporting it from Scout."""
         return True
 
-    def get_target_bed(self, case_id: str, analysis_type: str) -> str:
-        """
-        Return the target bed file from LIMS and use default capture kit for WHOLE_GENOME_SEQUENCING.
-        """
-        target_bed_file: str = self.get_target_bed_from_lims(case_id=case_id)
-        if not target_bed_file:
-            if analysis_type == AnalysisType.WGS:
-                return DEFAULT_CAPTURE_KIT
-            raise ValueError("No capture kit was found in LIMS")
-        return target_bed_file
-
-    def get_germlinecnvcaller_flag(self, analysis_type: str) -> bool:
-        if analysis_type == AnalysisType.WGS:
-            return True
-        return False
-
     def get_built_workflow_parameters(self, case_id: str) -> RarediseaseParameters:
         """Return parameters."""
         analysis_type: AnalysisType = self.get_data_analysis_type(case_id=case_id)
-        target_bed_file: str = self.get_target_bed(case_id=case_id, analysis_type=analysis_type)
-        skip_germlinecnvcaller = self.get_germlinecnvcaller_flag(analysis_type=analysis_type)
+        target_bed_file: str = self.get_target_bed_from_lims(case_id=case_id) or ""
         outdir = self.get_case_path(case_id=case_id)
 
         return RarediseaseParameters(
@@ -126,7 +109,6 @@ def get_built_workflow_parameters(self, case_id: str) -> RarediseaseParameters:
             analysis_type=analysis_type,
             target_bed_file=target_bed_file,
             save_mapped_as_cram=True,
-            skip_germlinecnvcaller=skip_germlinecnvcaller,
             vcfanno_extra_resources=f"{outdir}/{ScoutExportFileName.MANAGED_VARIANTS}",
             vep_filters_scout_fmt=f"{outdir}/{ScoutExportFileName.PANELS}",
         )
 
@@ -4,22 +4,23 @@
 
 
 class OrderType(StrEnum):
-    BALSAMIC: str = Workflow.BALSAMIC
-    BALSAMIC_UMI: str = Workflow.BALSAMIC_UMI
-    FASTQ: str = "fastq"
-    FLUFFY: str = Workflow.FLUFFY
-    METAGENOME: str = "metagenome"
-    MICROBIAL_FASTQ: str = "microbial-fastq"
-    MICROSALT: str = Workflow.MICROSALT
-    MIP_DNA: str = Workflow.MIP_DNA
-    MIP_RNA: str = Workflow.MIP_RNA
+    BALSAMIC = Workflow.BALSAMIC
+    BALSAMIC_UMI = Workflow.BALSAMIC_UMI
+    FASTQ = "fastq"
+    FLUFFY = Workflow.FLUFFY
+    METAGENOME = "metagenome"
+    MICROBIAL_FASTQ = "microbial-fastq"
+    MICROSALT = Workflow.MICROSALT
+    MIP_DNA = Workflow.MIP_DNA
+    MIP_RNA = Workflow.MIP_RNA
     NALLO = Workflow.NALLO
     PACBIO_LONG_READ = "pacbio-long-read"
-    RML: str = "rml"
-    RNAFUSION: str = Workflow.RNAFUSION
-    SARS_COV_2: str = "sars-cov-2"
-    TAXPROFILER: str = Workflow.TAXPROFILER
-    TOMTE: str = Workflow.TOMTE
+    RML = "rml"
+    RAREDISEASE = Workflow.RAREDISEASE
+    RNAFUSION = Workflow.RNAFUSION
+    SARS_COV_2 = "sars-cov-2"
+    TAXPROFILER = Workflow.TAXPROFILER
+    TOMTE = Workflow.TOMTE
 
 
 class ExcelSampleAliases(StrEnum):
 
@@ -67,6 +67,5 @@ class RarediseaseParameters(WorkflowParameters):
     target_bed_file: str
     analysis_type: str
     save_mapped_as_cram: bool
-    skip_germlinecnvcaller: bool
     vcfanno_extra_resources: str
     vep_filters_scout_fmt: str
Original file line number	Diff line number	Diff line change
`@@ -1,2 +1,2 @@`
`1`	`1`	`__title__ = "cg"`
`2`		`-__version__ = "69.5.3"`
	`2`	`+__version__ = "69.8.1"`