-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathvoyager.yaml
50 lines (50 loc) · 1.84 KB
/
voyager.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
---
# Pod that runs the dtyoung/eeg-ssl:voyager image, installs JupyterLab at
# start-up and launches it. The container requests 8 habana.ai/gaudi devices.
apiVersion: v1
kind: Pod
metadata:
  # Alternative name kept for reference:
  # name: eeg-ssl-interactive
  name: eeg-ssl-jupyter
spec:
  # Do not restart the container after its command exits.
  restartPolicy: Never
  volumes:
    # Ephemeral scratch space; contents are removed together with the pod.
    - name: scratch
      emptyDir: {}
    # Despite the volume name, this is a hostPath to a directory on the node.
    # `type: Directory` requires the path to already exist on the node.
    - name: ceph
      hostPath:
        path: /home/dtyoung
        type: Directory
    # Memory-backed emptyDir; mounted over /dev/shm in the container below.
    - name: ramdisk1
      emptyDir:
        medium: Memory
  containers:
    - name: eeg-ssl-container
      image: dtyoung/eeg-ssl:voyager
      # Re-pull on every start so an updated `voyager` tag is picked up.
      imagePullPolicy: Always
      volumeMounts:
        - mountPath: /scratch
          name: scratch
        - mountPath: /ceph
          name: ceph
        - mountPath: /dev/shm
          name: ramdisk1
      # Requests and limits are intentionally identical for every resource.
      resources:
        limits:
          memory: 409G
          cpu: 86
          habana.ai/gaudi: 8
          hugepages-2Mi: 95000Mi
        requests:
          memory: 409G
          cpu: 86
          habana.ai/gaudi: 8
          hugepages-2Mi: 95000Mi
      # Paths under the /ceph mount exposed as environment variables.
      # NOTE(review): nothing in this manifest reads them - confirm they are
      # still needed by code inside the image.
      env:
        - name: checkpt
          value: "/ceph/datasets/stable_diff/checkpoint_trained_habana"
        - name: output
          value: "/ceph/results/stable_diffusion/inference_from_trained_habana"
      command: ["/bin/sh", "-c"]
      # Alternative kept for reference: idle loop instead of starting JupyterLab.
      # args: ["while true; do sleep 30; done;"]
      # The folded scalar below becomes a single shell line. Because the two
      # commands are joined with `;`, `jupyter lab` is attempted even if the
      # `pip install` step fails.
      args:
        - >-
          pip install jupyterlab ;
          jupyter lab --allow-root