Skip to content

Commit acf519c

Browse files
committed
The cluster has no internet access, so write the prolog script locally instead of downloading it
1 parent 471c937 commit acf519c

File tree

4 files changed

+15
-2
lines changed

4 files changed

+15
-2
lines changed

.github/workflows/release.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -67,6 +67,7 @@ jobs:
6767
run: |
6868
aws s3 cp provisioner_scripts/create_users.py s3://${{ secrets.S3_BUCKET }}/scripts/create_users.py
6969
aws s3 cp provisioner_scripts/environment.sh s3://${{ secrets.S3_BUCKET }}/scripts/environment.sh
70+
aws s3 cp provisioner_scripts/80_cloudwatch_agent_config_prolog.sh s3://${{ secrets.S3_BUCKET }}/scripts/80_cloudwatch_agent_config_prolog.sh
7071
- name: Release
7172
uses: softprops/action-gh-release@v2
7273
if: github.ref == 'refs/heads/main'

hpc_provisioner/src/hpc_provisioner/config-dev/_head_node.tpl.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -21,6 +21,7 @@ CustomActions:
2121
Args: !config create_users_args
2222
- Script: s3://sboinfrastructureassets-sandbox/scripts/environment.sh
2323
Args: !config environment_args
24+
- Script: s3://sboinfrastructureassets-sandbox/scripts/80_cloudwatch_agent_config_prolog.sh
2425
# - Script: s3://sboinfrastructureassets/scripts/all_or_nothing_allocation.sh
2526
# - Script: s3://sboinfrastructureassets/scripts/setup_lustre_directories.py
2627
# Args:
Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,13 @@
1+
#!/bin/bash
#
# Installs the Slurm prolog that configures the CloudWatch agent.
#
# The cluster has no internet access, so the prolog is embedded here and
# written to disk instead of being downloaded.
#
# Writes: ${PROLOG_DIR}/80_cloudwatch_agent_config_prolog.sh (mode 0755)

set -euo pipefail

readonly PROLOG_DIR=/opt/slurm/etc/scripts/prolog.d
readonly PROLOG_FILE="${PROLOG_DIR}/80_cloudwatch_agent_config_prolog.sh"

# The previous curl-based install used --create-dirs; keep that guarantee.
mkdir -p -- "${PROLOG_DIR}"

# The quoted delimiter ('_EOF_') disables all expansion inside the here-doc,
# so the prolog below is written out exactly as shown and every variable is
# resolved when the prolog runs, not when this installer runs.
# '>' (not '>>') keeps the install idempotent: a re-run replaces the file
# instead of appending a second copy of the script to it.
cat << '_EOF_' > "${PROLOG_FILE}"
#!/bin/bash

CWAGENT_CONFIG="/sbo/data/scratch/CWAgent_config_${SLURM_CLUSTER_NAME}.json"

if [ ! -f "$CWAGENT_CONFIG" ]; then
  echo "Create CWAGENT_CONFIG " "$CWAGENT_CONFIG"
  # Replace the literal placeholder text $CLUSTER_NAME with the Slurm cluster
  # name. NOTE(review): presumably the template contains that literal
  # placeholder -- confirm against CWAgent_config_tpl.json.
  sed -e 's/\$CLUSTER_NAME/'"${SLURM_CLUSTER_NAME}"'/g' /sbo/data/scratch/CWAgent_config_tpl.json > "$CWAGENT_CONFIG"
fi

#sudo /opt/slurm/bin/srun --ntasks=$NODES --ntasks-per-node=1 /opt/aws/amazon-cloudwatch-agent/bin/amazon-cloudwatch-agent-ctl -a stop
sudo /opt/aws/amazon-cloudwatch-agent/bin/amazon-cloudwatch-agent-ctl -a fetch-config -m ec2 -c "file:/$CWAGENT_CONFIG" -s
_EOF_

# The previous curl-based install requested mode 0755; a here-doc redirect
# creates the file without the execute bit, so set it explicitly.
chmod 0755 -- "${PROLOG_FILE}"

provisioner_scripts/environment.sh

Lines changed: 0 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -3,5 +3,3 @@
33
export CLUSTER_NAME=$1
44

55
echo "CLUSTER_NAME=${CLUSTER_NAME}" >> /etc/environment
6-
7-
curl --create-dirs --output /opt/slurm/etc/scripts/prolog.d/80_cloudwatch_agent_config_prolog.sh --create-file-mode 0755 https://raw.githubusercontent.com/openbraininstitute/hpc-resource-provisioner/refs/heads/slurm_prolog/provisioner_scripts/headnode/80_cloudwatch_agent_config_prolog.sh

0 commit comments

Comments
 (0)