From e80471a2cdc0ab255eb8cb76aeb8b548053aa851 Mon Sep 17 00:00:00 2001
From: Patrick Esser
Date: Sat, 23 Jul 2022 07:54:48 +0000
Subject: [PATCH] resume v1, disable requeue

---
 scripts/slurm/v1_iahr_torch111/launcher.sh | 3 ++-
 scripts/slurm/v1_iahr_torch111/sbatch.sh | 1 +
 2 files changed, 3 insertions(+), 1 deletion(-)

diff --git a/scripts/slurm/v1_iahr_torch111/launcher.sh b/scripts/slurm/v1_iahr_torch111/launcher.sh
index 06a1dca..8448b6f 100755
--- a/scripts/slurm/v1_iahr_torch111/launcher.sh
+++ b/scripts/slurm/v1_iahr_torch111/launcher.sh
@@ -24,7 +24,8 @@ CONFIG="/fsx/stable-diffusion/stable-diffusion/configs/stable-diffusion/v1_impro
 
 # resume and set new seed to reshuffle data
 #EXTRA="--seed 718 model.params.ckpt_path=/fsx/stable-diffusion/stable-diffusion/checkpoints2/v1pp/v1pp-flatline.ckpt"
-EXTRA="--seed 718 --resume_from_checkpoint /fsx/stable-diffusion/stable-diffusion/logs/2022-07-22T07-45-07_v1_improvedaesthetics/checkpoints/last.ckpt"
+#EXTRA="--seed 718 --resume_from_checkpoint /fsx/stable-diffusion/stable-diffusion/logs/2022-07-22T07-45-07_v1_improvedaesthetics/checkpoints/last.ckpt"
+EXTRA="--seed 719 --resume_from_checkpoint /fsx/stable-diffusion/stable-diffusion/logs/2022-07-22T12-32-32_v1_improvedaestheticsv1_iahr_torch111/checkpoints/last.ckpt"
 
 # only images >= 512 and pwatermark <= 0.4999
 EXTRA="${EXTRA} data.params.min_size=512 data.params.max_pwatermark=0.4999"
diff --git a/scripts/slurm/v1_iahr_torch111/sbatch.sh b/scripts/slurm/v1_iahr_torch111/sbatch.sh
index c317b7f..c79d6ac 100755
--- a/scripts/slurm/v1_iahr_torch111/sbatch.sh
+++ b/scripts/slurm/v1_iahr_torch111/sbatch.sh
@@ -8,6 +8,7 @@
 #SBATCH --exclusive
 #SBATCH --output=%x_%j.out
 #SBATCH --comment "Key=Monitoring,Value=ON"
+#SBATCH --no-requeue
 
 module load intelmpi
 source /opt/intel/mpi/latest/env/vars.sh