Skip to content

Commit d106dca

Browse files
committed
Replace shell commands with subprocess.run
Signed-off-by: Bruno Alvisio <[email protected]>
1 parent a6f5a7f commit d106dca

File tree

6 files changed

+185
-56
lines changed

6 files changed

+185
-56
lines changed

ci/scripts/pytest_runner.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -57,7 +57,7 @@ SKIP_SLOW=false
5757
ONLY_SLOW=false
5858
ALLOW_NO_TESTS=false
5959
# TODO(@cspades): Ignore this Evo2 notebook test, which has a tendency to leave a 32GB orphaned process in GPU.
60-
declare -a IGNORE_FILES=("sub-packages/bionemo-evo2/examples/fine-tuning-tutorial.ipynb")
60+
declare -a IGNORE_FILES=()
6161
error=false
6262

6363
# Parse command line arguments

ci/scripts/run_pytest_notebooks.sh

100644100755
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -19,4 +19,4 @@
1919
# Enable strict mode with better error handling
2020
set -euox pipefail
2121

22-
pytest -v --nbval-lax -p no:python docs/ sub-packages/
22+
pytest -v --nbval-lax -x -p no:python docs/ sub-packages/

pyproject.toml

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -119,7 +119,6 @@ addopts = [
119119
"--durations-min=30.0",
120120
"--durations=0",
121121
"--ignore=3rdparty",
122-
"--ignore-glob=sub-packages/bionemo-evo2/examples/fine-tuning-tutorial.ipynb",
123122
"--ignore-glob=sub-packages/bionemo-moco/examples/discrete_data_interpolant_tutorial.ipynb"
124123
]
125124
markers = ["slow: marks tests as slow (deselect with '-m \"not slow\"')"]
Lines changed: 54 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,54 @@
1+
# SPDX-FileCopyrightText: Copyright (c) 2024 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2+
# SPDX-License-Identifier: LicenseRef-Apache2
3+
#
4+
# Licensed under the Apache License, Version 2.0 (the "License");
5+
# you may not use this file except in compliance with the License.
6+
# You may obtain a copy of the License at
7+
#
8+
# http://www.apache.org/licenses/LICENSE-2.0
9+
#
10+
# Unless required by applicable law or agreed to in writing, software
11+
# distributed under the License is distributed on an "AS IS" BASIS,
12+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13+
# See the License for the specific language governing permissions and
14+
# limitations under the License.
15+
16+
17+
import logging
import subprocess
from typing import Any, Dict, List


logger = logging.getLogger(__name__)


def run_subprocess_safely(command: List[str], timeout: int = 2000) -> Dict[str, Any]:
    """Run a subprocess and report the outcome as a dict instead of raising.

    The command is executed without a shell (``shell=False``), so ``command``
    must be a list where every argv token — flag and value alike — is its own
    element. All failure modes (timeout, non-zero exit, missing executable,
    unexpected errors) are caught, logged, and reported through the returned
    dict rather than propagated to the caller.

    Args:
        command: The command and its arguments, one argv token per element.
        timeout: Seconds to wait before the process is killed.

    Returns:
        On success, a dict with ``stdout``, ``stderr`` and ``returncode`` keys.
        On failure, the dict additionally carries an ``error`` key naming the
        failure kind (``"timeout"``, ``"non-zero exit"``, ``"not found"``, or
        ``"other"``); ``returncode`` is ``None`` unless the process exited.
    """
    try:
        result = subprocess.run(command, capture_output=True, timeout=timeout, check=True, text=True)
        return {"stdout": result.stdout, "stderr": result.stderr, "returncode": result.returncode}
    except subprocess.TimeoutExpired as e:
        # NOTE: e.stdout / e.stderr can be None (or bytes) if the child was
        # killed before its streams were fully captured.
        logger.error("Command timed out. Command: %s\nstdout:\n%s\nstderr:\n%s", command, e.stdout, e.stderr)
        return {"error": "timeout", "stdout": e.stdout, "stderr": e.stderr, "returncode": None}
    except subprocess.CalledProcessError as e:
        logger.error(
            "Command failed. Command: %s\nreturncode: %s\nstdout:\n%s\nstderr:\n%s",
            command,
            e.returncode,
            e.stdout,
            e.stderr,
        )
        return {"error": "non-zero exit", "stdout": e.stdout, "stderr": e.stderr, "returncode": e.returncode}
    except FileNotFoundError as e:
        logger.error("Command not found. Command: %s\nstderr:\n%s", command, e)
        return {"error": "not found", "stdout": "", "stderr": str(e), "returncode": None}
    except Exception as e:
        # Catch-all so callers always get a dict back; log with traceback so
        # the unexpected failure is never silent.
        logger.exception("Unexpected error running command: %s", command)
        return {"error": "other", "message": str(e), "stdout": "", "stderr": "", "returncode": None}

sub-packages/bionemo-evo2/examples/fine-tuning-tutorial.ipynb

Lines changed: 64 additions & 34 deletions
Original file line numberDiff line numberDiff line change
@@ -93,9 +93,10 @@
9393
"metadata": {},
9494
"outputs": [],
9595
"source": [
96-
"%%capture\n",
9796
"import os\n",
9897
"\n",
98+
"from bionemo.core.utils.subprocess_utils import run_subprocess_safely\n",
99+
"\n",
99100
"\n",
100101
"concat_path = \"chr20_21_22.fa\"\n",
101102
"if not os.path.exists(concat_path):\n",
@@ -158,7 +159,6 @@
158159
"metadata": {},
159160
"outputs": [],
160161
"source": [
161-
"%%capture\n",
162162
"!preprocess_evo2 --config preprocess_config.yaml"
163163
]
164164
},
@@ -207,7 +207,6 @@
207207
"metadata": {},
208208
"outputs": [],
209209
"source": [
210-
"%%capture\n",
211210
"if not os.path.exists(\"nemo2_evo2_1b_8k\"):\n",
212211
" !evo2_convert_to_nemo2 \\\n",
213212
" --model-path hf://arcinstitute/savanna_evo2_1b_base \\\n",
@@ -262,46 +261,77 @@
262261
"metadata": {},
263262
"outputs": [],
264263
"source": [
265-
"%%capture\n",
266264
"MAX_STEPS: int = 10 if FAST_CI_MODE else 100\n",
267265
"val_check_interval = min(int(MAX_STEPS // 2), 50)\n",
268266
"warmup_steps = min(MAX_STEPS, 100)\n",
269267
"# For evo2 training and fine-tuning follow the same set of steps, so we use the same train_evo2 command.\n",
270268
"# the big difference is the --ckpt-dir argument which points to a pre-existing checkpoint from some other training run.\n",
271269
"\n",
272270
"if FAST_CI_MODE:\n",
273-
" model_subset_option = (\n",
274-
" \"--num-layers 4 --hybrid-override-pattern SDH* --activation-checkpoint-recompute-num-layers 2\"\n",
275-
" )\n",
271+
" model_subset_option = [\n",
272+
" \"--num-layers\",\n",
273+
" \"4\",\n",
274+
" \"--hybrid-override-pattern\",\n",
275+
" \"SDH*\",\n",
276+
" \"--activation-checkpoint-recompute-num-layers\",\n",
277+
" \"2\",\n",
278+
" ]\n",
276279
"else:\n",
277280
" # By default do 5 layers of activation checkpointing\n",
278-
" model_subset_option = \"--activation-checkpoint-recompute-num-layers 5\"\n",
279-
"train_cmd = f\"\"\"train_evo2 \\\n",
280-
" -d training_data_config.yaml \\\n",
281-
" --dataset-dir ./preprocessed_data \\\n",
282-
" --result-dir pretraining_demo \\\n",
283-
" --experiment-name evo2 \\\n",
284-
" --model-size 1b \\\n",
285-
" --devices 1 \\\n",
286-
" --num-nodes 1 \\\n",
287-
" --seq-length 8192 \\\n",
288-
" --micro-batch-size 2 \\\n",
289-
" --lr 0.000015 \\\n",
290-
" --min-lr 0.0000149 \\\n",
291-
" --warmup-steps {warmup_steps} \\\n",
292-
" --grad-acc-batches 4 \\\n",
293-
" --max-steps {MAX_STEPS} \\\n",
294-
" --ckpt-dir nemo2_evo2_1b_8k \\\n",
295-
" --clip-grad 250 \\\n",
296-
" --wd 0.001 \\\n",
297-
" --attention-dropout 0.01 \\\n",
298-
" --hidden-dropout 0.01 \\\n",
299-
" --val-check-interval {val_check_interval} \\\n",
300-
" {model_subset_option} \\\n",
301-
" --create-tensorboard-logger \\\n",
302-
" --ckpt-async-save\"\"\"\n",
303-
"\n",
304-
"!{train_cmd}"
281+
" model_subset_option = [\"--activation-checkpoint-recompute-num-layers\", \"5\"]\n",
282+
"\n",
283+
"train_cmd = [\n",
284+
" \"train_evo2\",\n",
285+
" \"-d\",\n",
286+
" \"training_data_config.yaml\",\n",
287+
" \"--dataset-dir\",\n",
288+
" \"./preprocessed_data\",\n",
289+
" \"--result-dir\",\n",
290+
" \"pretraining_demo\",\n",
291+
" \"--experiment-name\",\n",
292+
" \"evo2\",\n",
293+
" \"--model-size\",\n",
294+
" \"1b\",\n",
295+
" \"--devices\",\n",
296+
" \"1\",\n",
297+
" \"--num-nodes\",\n",
298+
" \"1\",\n",
299+
" \"--seq-length\",\n",
300+
" \"8192\",\n",
301+
" \"--micro-batch-size\",\n",
302+
" \"2\",\n",
303+
" \"--lr\",\n",
304+
" \"0.000015\",\n",
305+
" \"--min-lr\",\n",
306+
" \"0.0000149\",\n",
307+
" \"--warmup-steps\",\n",
308+
" str(warmup_steps),\n",
309+
" \"--grad-acc-batches\",\n",
310+
" \"4\",\n",
311+
" \"--max-steps\",\n",
312+
" str(MAX_STEPS),\n",
313+
" \"--ckpt-dir\",\n",
314+
" \"nemo2_evo2_1b_8k\",\n",
315+
" \"--clip-grad\",\n",
316+
" \"250\",\n",
317+
" \"--wd\",\n",
318+
" \"0.001\",\n",
319+
" \"--attention-dropout\",\n",
320+
" \"0.01\",\n",
321+
" \"--hidden-dropout\",\n",
322+
" \"0.01\",\n",
323+
" \"--val-check-interval\",\n",
324+
" str(val_check_interval),\n",
325+
" \"--create-tensorboard-logger\",\n",
326+
" \"--ckpt-async-save\",\n",
327+
"]\n",
328+
"\n",
329+
"train_cmd.extend(model_subset_option)\n",
330+
"\n",
331+
"print(f\"Running command: {train_cmd}\")\n",
332+
"\n",
333+
"result = run_subprocess_safely(train_cmd)\n",
334+
"assert result[\"returncode\"] == 0, result"
305335
]
306336
},
307337
{

sub-packages/bionemo-evo2/examples/zeroshot_brca1.ipynb

Lines changed: 65 additions & 19 deletions
Original file line numberDiff line numberDiff line change
@@ -50,7 +50,9 @@
5050
"import seaborn as sns\n",
5151
"import torch\n",
5252
"from Bio import SeqIO\n",
53-
"from sklearn.metrics import auc, roc_auc_score, roc_curve"
53+
"from sklearn.metrics import auc, roc_auc_score, roc_curve\n",
54+
"\n",
55+
"from bionemo.core.utils.subprocess_utils import run_subprocess_safely"
5456
]
5557
},
5658
{
@@ -662,24 +664,11 @@
662664
"# The Evo2 config has 'use_fp8_input_projections: True' by default\n",
663665
"\n",
664666
"if FAST_CI_MODE:\n",
665-
" model_subset_option = \"--num-layers 4 --hybrid-override-pattern SDH*\"\n",
667+
"    model_subset_options = [\"--num-layers\", \"4\", \"--hybrid-override-pattern\", \"SDH*\"]\n",
666668
"else:\n",
667-
" model_subset_option = \"\"\n",
668-
"\n",
669-
"fp8_option = \"--fp8\" if fp8_supported else \"\"\n",
670-
"\n",
671-
"# Update predict commands to run on the full dataset\n",
672-
"predict_ref_command = (\n",
673-
" f\"predict_evo2 --fasta {ref_fasta_path} --ckpt-dir {checkpoint_path} \"\n",
674-
" f\"--output-dir {predict_ref_dir} --model-size {MODEL_SIZE} --tensor-parallel-size 1 {model_subset_option} \"\n",
675-
" f\"--pipeline-model-parallel-size 1 --context-parallel-size 1 --output-log-prob-seqs {fp8_option}\"\n",
676-
")\n",
669+
" model_subset_options = []\n",
677670
"\n",
678-
"predict_var_command = (\n",
679-
" f\"predict_evo2 --fasta {var_fasta_path} --ckpt-dir {checkpoint_path} \"\n",
680-
" f\"--output-dir {predict_var_dir} --model-size {MODEL_SIZE} --tensor-parallel-size 1 {model_subset_option} \"\n",
681-
" f\"--pipeline-model-parallel-size 1 --context-parallel-size 1 --output-log-prob-seqs {fp8_option}\"\n",
682-
")"
671+
"fp8_option = \"--fp8\" if fp8_supported else \"\""
683672
]
684673
},
685674
{
@@ -696,8 +685,38 @@
696685
"outputs": [],
697686
"source": [
698687
"%%capture\n",
688+
"# Update predict commands to run on the full dataset\n",
690+
"predict_ref_command = [\n",
691+
" \"predict_evo2\",\n",
692+
" \"--fasta\",\n",
693+
" ref_fasta_path,\n",
694+
" \"--ckpt-dir\",\n",
695+
" checkpoint_path,\n",
696+
" \"--output-dir\",\n",
697+
" predict_ref_dir,\n",
698+
" \"--model-size\",\n",
699+
" MODEL_SIZE,\n",
700+
" \"--tensor-parallel-size\",\n",
701+
" \"1\",\n",
702+
" \"--pipeline-model-parallel-size\",\n",
703+
" \"1\",\n",
704+
" \"--context-parallel-size\",\n",
705+
" \"1\",\n",
706+
" \"--output-log-prob-seqs\",\n",
707+
"]\n",
708+
"\n",
709+
"# Optional flags\n",
710+
"if model_subset_options:\n",
711+
" predict_ref_command.extend(model_subset_options)\n",
712+
"\n",
713+
"if fp8_option:\n",
714+
" predict_ref_command.append(fp8_option)\n",
715+
"\n",
699716
"print(f\"Running command: {predict_ref_command}\")\n",
700-
"!{predict_ref_command}"
717+
"\n",
718+
"result = run_subprocess_safely(predict_ref_command)\n",
719+
"assert result[\"returncode\"] == 0, result"
701720
]
702721
},
703722
{
@@ -714,8 +733,35 @@
714733
"outputs": [],
715734
"source": [
716735
"%%capture\n",
736+
"predict_var_command = [\n",
737+
" \"predict_evo2\",\n",
738+
" \"--fasta\",\n",
739+
" var_fasta_path,\n",
740+
" \"--ckpt-dir\",\n",
741+
" checkpoint_path,\n",
742+
" \"--output-dir\",\n",
743+
" predict_var_dir,\n",
744+
" \"--model-size\",\n",
745+
" MODEL_SIZE,\n",
746+
" \"--tensor-parallel-size\",\n",
747+
" \"1\",\n",
748+
" \"--pipeline-model-parallel-size\",\n",
749+
" \"1\",\n",
750+
" \"--context-parallel-size\",\n",
751+
" \"1\",\n",
752+
" \"--output-log-prob-seqs\",\n",
753+
"]\n",
754+
"\n",
755+
"if model_subset_options:\n",
756+
"    predict_var_command.extend(model_subset_options)  # each element must be a single argv token (no embedded spaces)\n",
757+
"\n",
758+
"if fp8_option:\n",
759+
" predict_var_command.append(fp8_option)\n",
760+
"\n",
717761
"print(f\"Running command: {predict_var_command}\")\n",
718-
"!{predict_var_command}"
762+
"\n",
763+
"result = run_subprocess_safely(predict_var_command)\n",
764+
"assert result[\"returncode\"] == 0, result"
719765
]
720766
},
721767
{

0 commit comments

Comments
 (0)