Match the number of CPUs to the number of workers; log each node separately
This commit is contained in:
		
							parent
							
								
									9300c0ccfc
								
							
						
					
					
						commit
						89ac468ce8
					
				
					 1 changed files with 2 additions and 1 deletions
				
			
		| 
						 | 
				
			
			@@ -3,6 +3,7 @@
 | 
			
		|||
#SBATCH --job-name=stable-diffusion-512cont
 | 
			
		||||
#SBATCH --nodes=24
 | 
			
		||||
#SBATCH --gpus-per-node=8
 | 
			
		||||
#SBATCH --cpus-per-gpu=4
 | 
			
		||||
#SBATCH --ntasks-per-node=1
 | 
			
		||||
#SBATCH --output=%x_%j.%n.out
 | 
			
		||||
 | 
			
		||||
| 
						 | 
				
			
			@@ -35,4 +36,4 @@ echo MASTER_ADDR=${MASTER_ADDR}
 | 
			
		|||
echo MASTER_PORT=${MASTER_PORT}
 | 
			
		||||
echo WORLD_SIZE=${WORLD_SIZE}
 | 
			
		||||
 | 
			
		||||
-srun bash /fsx/stable-diffusion/stable-diffusion/scripts/slurm/resume_512/launcher.sh
 | 
			
		||||
+srun --output=%x_%j.%n.out bash /fsx/stable-diffusion/stable-diffusion/scripts/slurm/resume_512/launcher.sh
 | 
			
		||||
| 
						 | 
				
			
			
 | 
			
		|||
		Loading…
	
		Reference in a new issue