# dvc.yaml
# DVC pipeline definition (44 lines, 1.65 KB in the original listing).
# Template variables available to the stages below.
vars:
  # External variables file. The stages also reference ${git.*}, ${source.*}
  # and ${destination.*}, which are not defined inline here -- presumably they
  # come from this file (TODO confirm).
  - params.yaml

  # Datasets to train on; one matrix entry per item.
  - datasets:
      - name: ranganathan
        # Host-side path, tracked as a stage dependency.
        local_path: ../datasets/ranganathan/dataset.zip
        # Path passed to `train --dataset-zip-file` inside the container.
        container_path: /datasets/ranganathan/dataset.zip

  # Models to train; one matrix entry per item.
  - models:
      - name: esm
        # Host-side manifest, tracked as a stage dependency.
        local_path: ../models/esm/manifest.toml
        # Path passed to `train --model-toml-file` inside the container.
        container_path: /models/esm/manifest.toml
        # Despite the key name, this is used as the `docker build` context
        # directory (and tracked as a dependency), not as a single file.
        dockerfile: ../models/esm
stages:
  # Builds the model image, runs its `train` command against one dataset, then
  # removes the image. Expanded once per (dataset, model) pair via `matrix`.
  create_training_job:
    matrix:
      dataset: ${datasets}
      model: ${models}
    cmd:
      # Build the image from the model directory, tagged <model name>:latest.
      # git-auth.txt is handed to the build as the `git_auth` secret.
      - >-
        docker build
        --build-arg GIT_CACHE_BUST=${git.git_cache_bust}
        --secret id=git_auth,src=git-auth.txt
        -t ${item.model.name}:latest
        ${item.model.dockerfile}
      # Run training with datasets, models and the output directory
      # bind-mounted. The resolved host paths are quoted so that directories
      # containing whitespace are not word-split by the shell.
      - >-
        docker run --rm
        -v "$(realpath "${source.datasets_dir}")":/datasets
        -v "$(realpath "${source.models_dir}")":/models
        -v "$(realpath "${destination.local.output_dir}")":/opt/ml/model
        ${item.model.name}:latest
        train
        --dataset-zip-file ${item.dataset.container_path}
        --model-toml-file ${item.model.container_path}
      # Remove only the image built above. `docker image prune -a -f` would
      # also delete every other unused image on the host.
      - docker image rm ${item.model.name}:latest
    deps:
      - ${item.dataset.local_path}
      - ${item.model.local_path}
      - ${item.model.dockerfile}
    outs:
      # Declared training output: <dataset>_<model>.csv in the output
      # directory that is mounted at /opt/ml/model in the container.
      - ${destination.local.output_dir}/${item.dataset.name}_${item.model.name}.csv:
          cache: true

  # Computes a metric file from each training output CSV; uses the same
  # (dataset, model) matrix so every training output gets a metric file.
  calculate_metric:
    matrix:
      dataset: ${datasets}
      model: ${models}
    cmd: >-
      uv run pg2-benchmark metric calc
      --output-path ${destination.local.output_dir}/${item.dataset.name}_${item.model.name}.csv
      --metric-path ${destination.local.metric_dir}/${item.dataset.name}_${item.model.name}.csv
    deps:
      # Output of the matching create_training_job stage.
      - ${destination.local.output_dir}/${item.dataset.name}_${item.model.name}.csv
    outs:
      - ${destination.local.metric_dir}/${item.dataset.name}_${item.model.name}.csv:
          cache: true