train_ahmedml.job

recipes/aero_cfd/jobs/train_ahmedml.job

 1#!/bin/bash -l
 2#SBATCH --nodes=1
 3#SBATCH --cpus-per-task=28
 4#SBATCH --partition=compute
 5#SBATCH --gpus-per-node=1
 6#SBATCH --ntasks-per-node=1
 7#SBATCH --mem=64GB
 8#SBATCH --output=/home/%u/logs/ahmedml/%x_%j.out
 9#SBATCH --nice=0
10#SBATCH --array=1-20%10
11
12EXPERIMENT_FILE=$(dirname "$0")/experiments/ahmedml_experiments.txt
13# run
14srun --kill-on-bad-exit=1 --cpus-per-task=28 uv run noether-train --hp recipes/aero_cfd/configs/train_ahmedml.yaml $(head -$SLURM_ARRAY_TASK_ID $EXPERIMENT_FILE | tail -1)