# valohai.yaml - Valohai step definitions.
---
# Step "Data extraction": runs data-extraction.py inside the
# tensorflow/tensorflow:1.5.0-devel-gpu image.
# It declares a single input, `dataset`, whose default source is the
# OCT2017.tar.gz archive hosted on Mendeley Data.
- step:
    name: Data extraction
    image: tensorflow/tensorflow:1.5.0-devel-gpu
    command: python data-extraction.py
    inputs:
      - name: dataset
        default: https://data.mendeley.com/datasets/rscbjbr9sj/2/files/9e8f7acf-7d3a-487f-8eb5-0bd3255b9685/OCT2017.tar.gz
# Step "Train model": runs train.py inside the
# tensorflow/tensorflow:1.5.0-devel-gpu image.
# The `{parameters}` placeholder in `command` stands for the parameters
# declared below; each one carries a `pass-as` template in which `{v}` marks
# where the parameter's value goes (e.g. --max_steps=300 with the default).
- step:
    name: Train model
    image: tensorflow/tensorflow:1.5.0-devel-gpu
    command: python train.py {parameters}
    parameters:
      - name: max_steps
        pass-as: --max_steps={v}
        description: Number of steps to run the trainer
        type: integer
        default: 300
      - name: learning_rate
        pass-as: --learning_rate={v}
        description: Initial learning rate
        type: float
        default: 0.001
      # Per its description this is a KEEP probability, not a drop rate.
      - name: dropout
        pass-as: --dropout={v}
        description: Keep probability for training dropout
        type: float
        default: 0.9
    inputs:
      # Same default archive URL as the "Data extraction" step's input.
      - name: dataset
        default: https://data.mendeley.com/datasets/rscbjbr9sj/2/files/9e8f7acf-7d3a-487f-8eb5-0bd3255b9685/OCT2017.tar.gz
# Step "Worker environment check": runs a list of diagnostic shell commands
# inside the tensorflow/tensorflow:1.5.0-devel-gpu image. It takes no
# parameters and no inputs.
- step:
    name: Worker environment check
    image: tensorflow/tensorflow:1.5.0-devel-gpu
    command:
      # Working directory and its contents.
      - pwd
      - ls -la
      # GPU / driver status.
      - nvidia-smi
      - python --version
      # Only the "release" line of the CUDA compiler version banner.
      - nvcc --version | grep release
      # CUDNN_MAJOR lines plus the two lines after each match
      # (presumably the minor and patch-level defines - confirm).
      - cat /usr/include/x86_64-linux-gnu/cudnn_v*.h | grep CUDNN_MAJOR -A 2