#!/bin/bash
#SBATCH --partition=gpu # Specify the partition
#SBATCH --account=gpu_gres # Specify the account
#SBATCH --mem=25000               # Request 25GB of memory
#SBATCH --time=05:00:00           # Set the time limit to 5 hours
#SBATCH --job-name=SVJ_training_01 # Name the job
#SBATCH --output=jobs/training_0_output_3.log # Redirect stdout to a log file
#SBATCH --error=jobs/training_0_error_3.log # Redirect stderr to a log file
#SBATCH --gres=gpu:1              # Request one GPU
source env.sh  # Load the project environment
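# Keep Apptainer/Singularity temporary and cache files on /work (assumed to have enough space for the container image)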
export APPTAINER_TMPDIR=/work/gkrzmanc/singularity_tmp
export APPTAINER_CACHEDIR=/work/gkrzmanc/singularity_cache
nvidia-smi  # Log the allocated GPU for debugging
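# Run the training inside the GATr container: bind the home and work areas and enable GPU access (--nv)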
singularity exec -B /t3home/gkrzmanc/ -B /work/gkrzmanc/ --nv docker://dologarcia/gatr:v0 \
    python -m src.train \
    -train scouting_PFNano_signals2/SVJ_hadronic_std3/s-channel_mMed-900_mDark-20_rinv-0.3_alpha-peak_13TeV-pythia8_n-2000 \
    -val scouting_PFNano_signals2/SVJ_hadronic_std2/s-channel_mMed-900_mDark-20_rinv-0.3 \
    -net src/models/GATr/Gatr.py \
    -bs 16 --gpus 0 \
    --run-name Eval_Overfit_OC_betaPt_BC \
    --train-dataset-size 16 --val-dataset-size 16 --num-epochs 1 \
    --attr-loss-weight 0.1 --coord-loss-weight 0.1 \
    --beta-type pt+bc \
    --load-model-weights train/Overfit_OC_betaPt_BC_2024_12_27_15_21_33/step_1500_epoch_1500.ckpt
# Run the job:
# sbatch jobs/training_0.slurm
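# Monitor progress (standard Slurm commands; the job ID is printed by sbatch):
# squeue -u $USER
# tail -f jobs/training_0_output_3.log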