# dvc.yaml
# Pipeline stages. Each stage runs one script from code/ (`cmd`), lists the
# files and directories it reads (`deps`), and the ones it produces (`outs`).
# Stages are linked through these paths: a stage whose `deps` include another
# stage's `outs` (or a path inside them) sits downstream of that stage.
stages:
  # Runs the preprocessing script and produces the data/processed/ directory.
  preprocess:
    cmd: python code/1_preprocess.py
    deps:
      - code/1_preprocess.py
    outs:
      - data/processed/

  # Consumes data/processed/ (output of `preprocess`) and produces the tensor
  # dataset directory plus the tokenizer directory under brick/.
  build_tensordataset:
    cmd: python code/2_build_tensordataset.py
    deps:
      - code/2_build_tensordataset.py
      - data/processed/
    outs:
      - data/tensordataset/
      - brick/selfies_property_val_tokenizer/

  # Consumes the outputs of `preprocess` and `build_tensordataset` and
  # produces brick/moe.
  train:
    cmd: python code/3_train_multitask_transformer.py
    deps:
      - code/3_train_multitask_transformer.py
      - data/processed/
      - data/tensordataset/
      - brick/selfies_property_val_tokenizer/
    outs:
      - brick/moe

  # Disabled stage, kept for reference.
  # NOTE(review): it declares the same `outs` as `evaluate_benchmarks` below;
  # DVC is expected to reject two active stages that share an output path, so
  # only one of the two should be enabled at a time. Confirm before
  # re-enabling.
  # evaluate:
  #   cmd: python code/5_1_eval_multi_properties.py
  #   deps:
  #     - code/5_1_eval_multi_properties.py
  #     - brick/moe
  #     - data/tensordataset/multitask_tensors/hld
  #   outs:
  #     - data/metrics/temp
  #     - data/metrics/multitask_predictions.parquet
  #     - data/metrics/multitask_metrics.parquet

  # Consumes the tokenizer directory and data/processed/activities.parquet
  # (a file inside the `preprocess` output directory) and produces
  # brick/cvae.sqlite.
  sqlite:
    cmd: python code/6_build_sqlite.py
    deps:
      - code/6_build_sqlite.py
      # NOTE(review): written without the trailing slash used for this path in
      # `build_tensordataset` and `train`; presumably the same directory.
      # Left unchanged here; confirm and unify the spelling.
      - brick/selfies_property_val_tokenizer
      - data/processed/activities.parquet
    outs:
      - brick/cvae.sqlite

  # Consumes brick/moe (output of `train`) and
  # data/tensordataset/multitask_tensors/hld (a path inside the
  # `build_tensordataset` output directory) and writes results under
  # data/metrics/.
  evaluate_benchmarks:
    cmd: python code/7.1_2_property_benchmarks_parallel.py
    deps:
      - code/7.1_2_property_benchmarks_parallel.py
      - brick/moe
      - data/tensordataset/multitask_tensors/hld
    outs:
      - data/metrics/temp
      - data/metrics/multitask_predictions.parquet
      - data/metrics/multitask_metrics.parquet