-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathsbatch_tdda_3d_baseline.sh
22 lines (17 loc) · 1.08 KB
/
sbatch_tdda_3d_baseline.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
#!/bin/bash
# Slurm batch job: activates the `manten` micromamba environment and runs
# manten's train.py for the `tdda_3d_baseline` experiment via
# `accelerate launch`.
#
# Usage:
#   sbatch sbatch_tdda_3d_baseline.sh
#
# Optional environment:
#   MANTEN_MAIN_PROCESS_PORT  port handed to `accelerate launch
#                             --main_process_port` (default: 29872). Override
#                             it when another job on the same node may already
#                             be using the default port.
#
# NOTE: every #SBATCH directive must stay above the first executable command;
# sbatch stops reading directives once the script body starts. The directives
# are parsed by sbatch, not by the shell, so they cannot use shell variables.
#SBATCH -p accelerated
#SBATCH -A hk-project-sustainebot
#SBATCH -J manten-training
# Cluster Settings
#SBATCH -n 1 # Number of tasks
#SBATCH -c 16 # Number of cores per task
#SBATCH -t 06:00:00 # 1-04:00:00 ## # 06:00:00 # 1-00:30:00 # 2-00:00:00
#SBATCH --gres=gpu:4
#SBATCH --ntasks-per-node=1
# Define the paths for storing output and error files
# (%x expands to the job name, %j to the job id).
#SBATCH --output=/hkfs/work/workspace/scratch/uqtlv-code_n_mamba/code/manten/outputs/%x_%j.out
#SBATCH --error=/hkfs/work/workspace/scratch/uqtlv-code_n_mamba/code/manten/outputs/%x_%j.err

# Print a message to stderr (which ends up in the job's .err file) and abort.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

# --- Locations ---------------------------------------------------------------
workspace_dir=/hkfs/work/workspace/scratch/uqtlv-code_n_mamba
home_dir=/home/hk-project-sustainebot/uqtlv

mamba_init="${home_dir}/.mambainit"
env_prefix="${workspace_dir}/micromamba/envs/manten"
accelerate_config="${home_dir}/.cache/huggingface/accelerate/default_config.yaml"
train_script="${workspace_dir}/code/manten/manten/scripts/train.py"

# Same default as before; only differs when the caller exports an override.
main_process_port="${MANTEN_MAIN_PROCESS_PORT:-29872}"

# --- Pre-flight checks -------------------------------------------------------
# Fail before touching the GPUs if any required file is missing, instead of
# letting the launcher die later with a less obvious message.
for required_file in "${mamba_init}" "${accelerate_config}" "${train_script}"; do
  [[ -r "${required_file}" ]] || die "required file not readable: ${required_file}"
done

# --- Environment -------------------------------------------------------------
# The init script is expected to define the `micromamba` shell function.
# Its exit status is intentionally not checked (its last command is outside
# our control); the activation below is the real gate.
# shellcheck disable=SC1090,SC1091
source "${mamba_init}"
micromamba activate "${env_prefix}" \
  || die "could not activate micromamba environment: ${env_prefix}"

# --- Launch ------------------------------------------------------------------
# Options consumed by `accelerate launch` itself.
# NOTE(review): the process count presumably comes from the accelerate config
# file - confirm it matches the 4 GPUs requested via --gres above.
launch_args=(
  --main_process_port "${main_process_port}"
  --config_file "${accelerate_config}"
)

# key=value overrides forwarded verbatim to train.py.
train_overrides=(
  experiment=tdda_3d_baseline
  training.num_epochs=1000
  _detailed_metrics_every_n_epochs=25
  _save_every_n_epochs=50
  training.log_every_n_steps=150
)

# Last command of the script, so its exit status becomes the job's exit status.
accelerate launch "${launch_args[@]}" "${train_script}" "${train_overrides[@]}"