Hannes Kuchelmeister
committed on
Commit
•
8d9de2d
1
Parent(s):
1486604
make docker-files runnable on GPUs
Browse files
- models/DockerfileCUDA +12 -0
- models/docker-compose.cuda.yml +26 -0
- models/docker-compose.yml +5 -2
models/DockerfileCUDA
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
FROM pytorch/pytorch:1.9.1-cuda11.1-cudnn8-runtime
|
2 |
+
|
3 |
+
WORKDIR /usr/src/app
|
4 |
+
|
5 |
+
RUN apt-get update
|
6 |
+
RUN apt-get install libgl1 -y
|
7 |
+
|
8 |
+
COPY requirements.txt ./
|
9 |
+
RUN pip install --no-cache-dir -r requirements.txt
|
10 |
+
|
11 |
+
COPY . .
|
12 |
+
|
models/docker-compose.cuda.yml
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
version: "3"
|
2 |
+
services:
|
3 |
+
model-cuda:
|
4 |
+
build:
|
5 |
+
context: .
|
6 |
+
dockerfile: DockerfileCUDA
|
7 |
+
tty: true
|
8 |
+
deploy:
|
9 |
+
resources:
|
10 |
+
reservations:
|
11 |
+
devices:
|
12 |
+
- driver: nvidia
|
13 |
+
count: 1
|
14 |
+
capabilities: [gpu]
|
15 |
+
volumes:
|
16 |
+
- ./logs/:/usr/src/app/logs:z
|
17 |
+
- ./data/:/usr/src/app/data:z
|
18 |
+
- ./configs:/usr/src/app/configs:z
|
19 |
+
command: sh -c "python train.py logger=tensorboard trainer.gpus=1"
|
20 |
+
tensorboard:
|
21 |
+
image: tensorflow/tensorflow
|
22 |
+
volumes:
|
23 |
+
- ./logs:/logs:z
|
24 |
+
command: sh -c "tensorboard --logdir /logs --bind_all"
|
25 |
+
ports:
|
26 |
+
- 8008:6006
|
models/docker-compose.yml
CHANGED
@@ -1,7 +1,10 @@
|
|
1 |
version: "3"
|
2 |
services:
|
3 |
model:
|
4 |
-
build:
|
|
|
|
|
|
|
5 |
volumes:
|
6 |
- ./logs/:/usr/src/app/logs:z
|
7 |
- ./data/:/usr/src/app/data:z
|
@@ -13,4 +16,4 @@ services:
|
|
13 |
- ./logs:/logs:z
|
14 |
command: sh -c "tensorboard --logdir /logs --bind_all"
|
15 |
ports:
|
16 |
-
-
|
|
|
1 |
version: "3"
|
2 |
services:
|
3 |
model:
|
4 |
+
build:
|
5 |
+
context: .
|
6 |
+
dockerfile: Dockerfile
|
7 |
+
tty: true
|
8 |
volumes:
|
9 |
- ./logs/:/usr/src/app/logs:z
|
10 |
- ./data/:/usr/src/app/data:z
|
|
|
16 |
- ./logs:/logs:z
|
17 |
command: sh -c "tensorboard --logdir /logs --bind_all"
|
18 |
ports:
|
19 |
+
- 8008:6006
|