Skip to content

Commit b8a7e5a

Browse files
committed
Merging staging branch into prod branch
2 parents bb6390c + 15edeaa commit b8a7e5a

File tree

8 files changed

+21
-7
lines changed

8 files changed

+21
-7
lines changed

.happy/terraform/envs/rdev/main.tf

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -14,8 +14,8 @@ module stack {
1414
batch_container_memory_limit = 28000
1515
wmg_batch_container_memory_limit = 248000
1616
wmg_desired_vcpus = 128
17-
cg_desired_vcpus = 48
18-
cg_batch_container_memory_limit = 92000
17+
cg_desired_vcpus = 128
18+
cg_batch_container_memory_limit = 248000
1919
backend_instance_count = 1
2020
frontend_instance_count = 1
2121
backend_memory = 8192

.happy/terraform/modules/ecs-stack/variables.tf

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -103,13 +103,13 @@ variable wmg_desired_vcpus {
103103
variable cg_batch_container_memory_limit {
104104
type = number
105105
description = "Memory hard limit for the cellguide pipeline batch container"
106-
default = 92000
106+
default = 248000
107107
}
108108

109109
variable cg_desired_vcpus {
110110
type = number
111111
description = "Number of desired vCPUs for cellguide pipeline"
112-
default = 48
112+
default = 128
113113
}
114114

115115
variable frontend_instance_count {

backend/cellguide/pipeline/computational_marker_genes/computational_markers.py

Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,7 @@
11
import concurrent.futures
22
import itertools
33
import logging
4+
import os
45
import warnings
56
from typing import Tuple
67

@@ -42,6 +43,12 @@
4243

4344
MARKER_SCORE_THRESHOLD = 0.5
4445

46+
# This file contains blacklisted marker genes that match the following criteria:
47+
# Ensembl 104 gene IDs that are annotated with the GO terms: ['GO:0005840', 'GO:0005739']
48+
# These GO terms correspond to the cellular components "ribosome" and "mitochondrion".
49+
file_dir = os.path.dirname(os.path.realpath(__file__))
50+
MARKER_GENE_BLACKLIST_FILENAME = os.path.join(file_dir, "marker_gene_blacklist.txt")
51+
4552

4653
class MarkerGenesCalculator:
4754
def __init__(self, *, snapshot: WmgSnapshot, all_cell_type_ids_in_corpus: list[str], groupby_terms: list[str]):
@@ -477,6 +484,12 @@ def get_computational_marker_genes(
477484

478485
# reset the index to convert MultiIndex back into columns
479486
markers_df = markers_df.reset_index()
487+
with open(MARKER_GENE_BLACKLIST_FILENAME, "r") as f:
488+
marker_gene_blacklist = f.read().split(",")
489+
blacklisted_genes = markers_df["gene_ontology_term_id"].isin(marker_gene_blacklist)
490+
491+
logger.info(f"Removing {blacklisted_genes.sum()} blacklisted marker genes")
492+
markers_df = markers_df[~blacklisted_genes]
480493

481494
# get the top `num_marker_genes` genes per metadata group
482495
top_per_group = (

backend/cellguide/pipeline/computational_marker_genes/marker_gene_blacklist.txt

Lines changed: 1 addition & 0 deletions
Large diffs are not rendered by default.

python_dependencies/cellguide_pipeline/requirements.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -30,7 +30,7 @@ requests==2.31.0
3030
s3transfer==0.6.1
3131
scipy==1.11.1
3232
six==1.16.0
33-
tiledb==0.22.3
33+
tiledb==0.24.0
3434
typing_extensions==4.7.1
3535
tzdata==2023.3
3636
urllib3==1.26.16
Binary file not shown.

tests/unit/cellguide_pipeline/fixtures/computational_marker_genes.json

Lines changed: 1 addition & 1 deletion
Large diffs are not rendered by default.

tests/unit/cellguide_pipeline/fixtures/reformatted_computational_marker_genes.json

Lines changed: 1 addition & 1 deletion
Large diffs are not rendered by default.

0 commit comments

Comments
 (0)