Skip to content

Commit

Permalink
Merge pull request #1388 from mskcc/release/1.89.0
Browse files Browse the repository at this point in the history
Release 1.89.0
  • Loading branch information
sivkovic authored Dec 13, 2024
2 parents ab4ebba + 5bc7157 commit 9777f4a
Show file tree
Hide file tree
Showing 6 changed files with 79 additions and 24 deletions.
56 changes: 56 additions & 0 deletions .github/workflows/github-actions.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,56 @@
# CI workflow: run Django migrations + tests against a Postgres service,
# then enforce Black formatting. Triggered on every push.
on: push

jobs:
  build:

    runs-on: ubuntu-latest

    services:
      postgres:
        image: postgres:latest
        env:
          POSTGRES_USER: postgres
          POSTGRES_PASSWORD: postgres
          POSTGRES_DB: github_actions
        ports:
          - 5432:5432
        # needed because the postgres container does not provide a healthcheck
        options: --health-cmd pg_isready --health-interval 10s --health-timeout 5s --health-retries 5

    steps:
      - uses: actions/checkout@v4
      - name: Set up Python 3.8
        uses: actions/setup-python@v5
        with:
          # quoted so YAML keeps it a string (unquoted 3.10 would parse as 3.1)
          python-version: "3.8"
      - name: python ldap
        # system packages required to build the python-ldap wheel
        run: sudo apt-get install libsasl2-dev python3-dev libldap2-dev libssl-dev
      - name: Install dependencies
        run: |
          pip install --upgrade pip
          python -m pip install python-ldap
          pip install -r requirements-dev.txt
      - name: Run migrations
        run: python manage.py migrate
        env:
          BEAGLE_DB_NAME: github_actions
          BEAGLE_DB_PASSWORD: postgres
          BEAGLE_DB_USERNAME: postgres
      - name: Run test
        run: |
          python manage.py test
        env:
          BEAGLE_DB_NAME: github_actions
          BEAGLE_DB_PASSWORD: postgres
          BEAGLE_DB_USERNAME: postgres
          BEAGLE_DB_PORT: 5432
          BEAGLE_NOTIFIER_ACTIVE: False
          TMPDIR: /tmp
          # NOTE(review): GitHub Actions does not expand $TMPDIR inside `env:` values;
          # this is passed through literally — confirm the app/shell resolves it,
          # or hardcode /tmp here as well.
          BEAGLE_SHARED_TMPDIR: $TMPDIR
          ENVIRONMENT: 'dev'
          BEAGLE_PRIMARY_ID_REGEX: "^(0\\d{4}|[1-9]\\d{4,})(|_[B-Z]|_[A-Z]{2,})_\\d+$"
      - name: Black check
        uses: psf/black@stable
        with:
          options: "--check"
          version: "22.3.0"
2 changes: 1 addition & 1 deletion beagle/__init__.py
Original file line number Diff line number Diff line change
@@ -1 +1 @@
__version__ = "1.88.0"
__version__ = "1.89.0"
10 changes: 8 additions & 2 deletions file_system/helper/access_helper.py
Original file line number Diff line number Diff line change
Expand Up @@ -81,8 +81,14 @@ def construct_csv(self):
"""

# get fastq metadata for a given request
fastqs = File.objects.filter(file_group__slug="lims", request_id__in=self.request_ids)
fastq_metadata = [fastq.filemetadata_set.values()[0]["metadata"] for fastq in fastqs]
files = FileRepository.filter(
file_group=settings.IMPORT_FILE_GROUP,
metadata={settings.IGO_COMPLETE_METADATA_KEY: True},
filter_redact=True,
).all()
fastqs = files.filter(metadata__igoRequestId__in=self.request_ids)
fastq_metadata = [fastq.metadata for fastq in fastqs]
fastq_metadata = sorted(fastq_metadata, key=lambda d: d["cmoSampleName"])
cmoPatientId = set([fastq["cmoPatientId"] for fastq in fastq_metadata])
# get DMP BAM file group
dmp_bams = FileRepository.filter(file_group=settings.DMP_BAM_FILE_GROUP)
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -53,15 +53,15 @@
},
"input_47kchpd_tsv_file": {
"class": "File",
"path": "juno:///work/cch/production/resources/ch_47k_impact/versions/v1/chpd47k_prevalence.tsv"
"location": "juno:///work/cch/production/resources/ch_47k_impact/versions/v1/chpd47k_prevalence.tsv"
},
"input_panmeloid_tsv_file": {
"class": "File",
"path": "juno:///work/cch/production/resources/pan_myeloid/versions/v1/pan_myeloid_variant_count.tsv"
"location": "juno:///work/cch/production/resources/pan_myeloid/versions/v1/pan_myeloid_variant_count.tsv"
},
"input_hotspot_tsv_file": {
"class": "File",
"path": "juno:///work/cch/production/resources/ch_47k_impact/versions/v1/hotspots_47kchpd.tsv"
"location": "juno:///work/cch/production/resources/ch_47k_impact/versions/v1/hotspots_47kchpd.tsv"
},
"retain_info": "CNT,TUMOR_TYPE",
"vardict_allele_frequency_threshold": 0,
Expand Down
11 changes: 3 additions & 8 deletions runner/operator/manifest/access_manifest_operator.py
Original file line number Diff line number Diff line change
Expand Up @@ -98,18 +98,13 @@ def write_to_file(self, fname, s):
Writes manifest csv to temporary location, registers it as tmp file
:return: manifest csv path
"""
# Split the string into rows using "\r\n" as the delimiter
rows = s.split("\r\n")
# Split each row into columns using "," as the delimiter
data = [row.split(",") for row in rows]
# tmp file creation
# output path
tmpdir = os.path.join(settings.BEAGLE_SHARED_TMPDIR, str(uuid.uuid4()))
Path(tmpdir).mkdir(parents=True, exist_ok=True)
output = os.path.join(tmpdir, fname)
# write csv to tmp file group
with open(output, "w+", newline="") as csvfile:
writer = csv.writer(csvfile)
writer.writerows(data)
with open(output, mode="w", encoding="utf-8", newline="") as file:
file.write(s)
# register output as tmp file
self.register_temp_file(output)
# return with juno formatting
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -7,9 +7,6 @@
from beagle_etl.models import Operator
from file_system.models import File, FileMetadata
from runner.operator.operator_factory import OperatorFactory
import datetime
import glob
import shutil

# general fixtures
COMMON_FIXTURES = [
Expand All @@ -32,10 +29,8 @@
class TestAcessManifestOperator(TestCase):
# test db
fixtures = [os.path.join(ROOT_DIR, f) for f in COMMON_FIXTURES]
# variables to help check operator output
expected_csv_content = [
'igoRequestId,primaryId,cmoPatientId,cmoSampleName,dmpPatientId,dmpImpactSamples,dmpAccessSamples,baitSet,libraryVolume,investigatorSampleId,preservation,species,libraryConcentrationNgul,tissueLocation,sampleClass,sex,cfDNA2dBarcode,sampleOrigin,tubeId,tumorOrNormal,captureConcentrationNm,oncotreeCode,dnaInputNg,collectionYear,captureInputNg\n13893_B,13893_B_1,ALLANT2,C-ALLANT2-N001-d01,P-0000002,P-0000005-T01-IM6;P-0000004-T01-IM6,,MSK-ACCESS-v1_0-probesAllwFP,25.0,P-1234567-N00-XS1,EDTA-Streck,,69.0,,Blood,M,8042889270,Whole Blood,,Normal,14.49275362,,200.0,,999.99999978\n13893_B,13893_B_3,ALLANT,C-ALLANT-N001-d01,P-0000001,P-0000002-T01-IM6;P-0000001-T01-IM6,,MSK-ACCESS-v1_0-probesAllwFP,25.0,P-1234567-N00-XS1,EDTA-Streck,,102.5,,Blood,M,8042889270,Whole Blood,,Normal,9.756097561,,200.0,,1000.0000000025001\n13893_B,13893_B_2,ALLANT3,C-ALLANT3-N003-d02,,,,MSK-ACCESS-v1_0-probesAllwFP,25.0,P-1234567-N00-XS1,EDTA-Streck,,74.5,,Blood,M,8042889270,Whole Blood,,Normal,13.42281879,,200.0,,999.999999855\n""\n'
]
header_control = "igoRequestId,primaryId,cmoPatientId,cmoSampleName,dmpPatientId,dmpImpactSamples,dmpAccessSamples,baitSet,libraryVolume,investigatorSampleId,preservation,species,libraryConcentrationNgul,tissueLocation,sampleClass,sex,cfDNA2dBarcode,sampleOrigin,tubeId,tumorOrNormal,captureConcentrationNm,oncotreeCode,dnaInputNg,collectionYear,captureInputNg"
id_control = "C-ALLANT-N001-d01"

def test_access_manifest_operator(self):
"""
Expand All @@ -60,6 +55,9 @@ def test_access_manifest_operator(self):
self.assertEqual(len(input_json["manifest_data"]), 2)
# Check contents
manifest_path = input_json["manifest_data"]["location"].replace("juno:", "")
with open(manifest_path, "r") as file:
csv_string = file.read()
self.assertEqual(csv_string, self.expected_csv_content[i])
with open(manifest_path, mode="r", newline="", encoding="utf-8") as file:
content = file.read()
header = content.split("\r\n")[0]
id = content.split("\r\n")[1].split(",")[3]
self.assertEqual(header, self.header_control)
self.assertEqual(id, self.id_control)

0 comments on commit 9777f4a

Please sign in to comment.