train_ahmedml.job
recipes/aero_cfd/jobs/train_ahmedml.job
#!/bin/bash -l
#
# Slurm array job that trains one AhmedML experiment per array task.
#
# Array task N runs `noether-train` with the base config
# recipes/aero_cfd/configs/train_ahmedml.yaml plus the whitespace-separated
# arguments found on line N of experiments/ahmedml_experiments.txt.
#
# The config path is relative, so the job is expected to start in the
# repository root (e.g. `sbatch recipes/aero_cfd/jobs/train_ahmedml.job`).
# NOTE(review): the --output directory below presumably has to exist before
# submission — confirm against the cluster's Slurm setup.
#
#SBATCH --nodes=1
#SBATCH --cpus-per-task=28
#SBATCH --partition=compute
#SBATCH --gpus-per-node=1
#SBATCH --ntasks-per-node=1
#SBATCH --mem=64GB
#SBATCH --output=/home/%u/logs/ahmedml/%x_%j.out
#SBATCH --nice=0
#SBATCH --array=1-20%10

set -euo pipefail

# Slurm executes a spooled copy of the batch script, so "$0" usually does not
# point into the repository. Try the script-relative location first (works
# when the file is run directly), then fall back to the repo-relative path,
# resolved against the working directory just like the config path below.
EXPERIMENT_FILE="$(dirname -- "$0")/experiments/ahmedml_experiments.txt"
if [[ ! -r "$EXPERIMENT_FILE" ]]; then
  EXPERIMENT_FILE="recipes/aero_cfd/jobs/experiments/ahmedml_experiments.txt"
fi
if [[ ! -r "$EXPERIMENT_FILE" ]]; then
  printf 'error: cannot read experiment list: %s\n' "$EXPERIMENT_FILE" >&2
  exit 1
fi

# The array index selects the experiment; abort early outside an array job.
task_id=${SLURM_ARRAY_TASK_ID:?must be submitted as a Slurm array job}

# Fetch exactly line $task_id. awk exits non-zero when the file has fewer
# lines, so an out-of-range index is an error instead of silently re-running
# the last experiment. A blank line is still valid: it means "no overrides".
if ! experiment_line=$(awk -v n="$task_id" \
  'NR == n { print; found = 1; exit } END { exit !found }' \
  "$EXPERIMENT_FILE"); then
  printf 'error: no line %s in %s\n' "$task_id" "$EXPERIMENT_FILE" >&2
  exit 1
fi

# Split the line into separate arguments on whitespace. Using an array keeps
# the intended word-splitting but avoids glob expansion of tokens such as
# "a=[1,2]" or "*".
read -r -a experiment_args <<<"$experiment_line"

printf 'array task %s: %s\n' "$task_id" "$experiment_line" >&2

# run
# --cpus-per-task is repeated for srun and follows the allocation; 28 is the
# fallback matching the #SBATCH directive above. The "+" expansion keeps an
# empty argument list safe under `set -u` on older bash versions.
srun --kill-on-bad-exit=1 --cpus-per-task="${SLURM_CPUS_PER_TASK:-28}" \
  uv run noether-train --hp recipes/aero_cfd/configs/train_ahmedml.yaml \
  ${experiment_args[@]+"${experiment_args[@]}"}