File size: 491 Bytes
d7a991a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
# @package _global_

# Hydra defaults list: replace the currently selected `hydra/launcher` option
# with `submitit_slurm`, so jobs are submitted to SLURM instead of being run
# by whatever launcher was selected before this file was composed.
# NOTE(review): `submitit_slurm` is provided by the hydra-submitit-launcher
# plugin -- confirm it is installed in the environment that uses this config.
defaults:
  - override /hydra/launcher: submitit_slurm

# Settings for the SLURM launcher selected in the defaults list above.
# The partition, QoS and comment values are site-specific -- adjust them when
# running on a different cluster.
hydra:
  launcher:
    # Time limit per job, in minutes.
    # NOTE(review): `10_080` relies on YAML 1.1 underscore integers (accepted
    # by PyYAML); a strict YAML 1.2 parser would read it as a string.
    timeout_min: 10_080   # 7 days (7 * 24 * 60 minutes)
    # Upper bound on how many times a timed-out job is resubmitted.
    # NOTE(review): resubmission is only useful if training resumes from a
    # checkpoint -- confirm the training entry point does so.
    max_num_timeout: 3
    # SLURM partition and quality-of-service to submit to.
    partition: g40
    qos: idle
    # Single-node job.
    nodes: 1
    # Both the task count and the GPU count per node are interpolated from
    # `trainer.devices`, which is defined elsewhere in the composed config
    # (presumably giving one task per GPU -- verify against the trainer config).
    tasks_per_node: ${trainer.devices}
    # Explicitly null: no per-task GPU request is set here.
    gpus_per_task: null
    cpus_per_task: 12
    gpus_per_node: ${trainer.devices}
    # Explicitly null: no per-GPU CPU request is set here.
    cpus_per_gpu: null
    # Job comment string.
    # NOTE(review): looks like a cluster accounting/project tag -- confirm.
    comment: laion
    # Job name.
    name: hamer
    # Shell commands listed in order; the launcher runs them as job setup
    # before the tasks start.
    setup:
      # Load the CUDA, Open MPI and libfabric-aws environment modules.
      - module load cuda openmpi libfabric-aws
      # NOTE(review): the device list is hard-coded to eight indices (0-7)
      # while the GPU request above follows `trainer.devices`; confirm this is
      # intended when fewer than eight devices are requested.
      - export CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7