-
Notifications
You must be signed in to change notification settings - Fork 0
/
dvc.yaml
72 lines (66 loc) · 2.25 KB
/
dvc.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
# DVC pipeline definition. Each entry under `stages` declares the command DVC
# runs (`cmd`), the files/directories whose changes invalidate the stage
# (`deps`), the parameter keys it tracks (`params`, looked up in DVC's params
# file, `params.yaml` by default), and the paths it produces (`outs`).
#
# All paths are written with forward slashes so the pipeline resolves on both
# POSIX and Windows hosts.
stages:
  # Runs extract_dataset.py against data/raw/zipped and produces
  # data/raw/extracted.
  extract_dataset:
    cmd: python src/data/extract_dataset.py
    deps:
      - src/data/extract_dataset.py
      - data/raw/zipped
    outs:
      - data/raw/extracted

  # Runs make_dataset.py on the extracted train.csv and produces data/interim.
  # Re-runs when make_dataset.test_size or make_dataset.random_state change.
  make_dataset:
    cmd: python src/data/make_dataset.py train.csv
    deps:
      - data/raw/extracted/train.csv
      - src/data/make_dataset.py
    params:
      - make_dataset.test_size
      - make_dataset.random_state
    outs:
      - data/interim

  # Runs modify_features.py on the interim train/val files and the extracted
  # test file; produces data/processed/transformations.
  modify_features:
    # Folded scalar (`>-`): the lines below are joined with single spaces into
    # one command string.
    cmd: >-
      python src/features/modify_features.py
      data/interim/train.csv
      data/interim/val.csv
      data/raw/extracted/test.csv
    deps:
      - src/features/modify_features.py
      - data/interim/train.csv
      - data/interim/val.csv
      - data/raw/extracted/test.csv
    outs:
      - data/processed/transformations

  # Runs build_features.py on the three files written by modify_features;
  # produces data/processed/build-features.
  build_features:
    # Folded scalar (`>-`): the lines below are joined with single spaces into
    # one command string.
    cmd: >-
      python src/features/build_features.py
      data/processed/transformations/train.csv
      data/processed/transformations/val.csv
      data/processed/transformations/test.csv
    deps:
      - src/features/build_features.py
      - data/processed/transformations/train.csv
      - data/processed/transformations/val.csv
      - data/processed/transformations/test.csv
    outs:
      - data/processed/build-features

  # Runs data_preprocessing.py with bare file names; the declared deps are the
  # build-features copies of those files. Produces data/processed/final and
  # models/transformers. Re-runs when data_preprocessing.percentiles changes.
  data_preprocessing:
    cmd: python src/features/data_preprocessing.py train.csv val.csv test.csv
    deps:
      - src/features/data_preprocessing.py
      - data/processed/build-features/train.csv
      - data/processed/build-features/val.csv
      - data/processed/build-features/test.csv
    params:
      - data_preprocessing.percentiles
    outs:
      - data/processed/final
      - models/transformers

  # Runs train_model.py on the final train.csv and produces models/models.
  # Tracks the four train_model.random_forest_regressor.* parameters below.
  train_model:
    cmd: python src/models/train_model.py data/processed/final/train.csv
    deps:
      - src/models/train_model.py
      - data/processed/final/train.csv
    params:
      - train_model.random_forest_regressor.n_estimators
      - train_model.random_forest_regressor.n_jobs
      - train_model.random_forest_regressor.max_depth
      - train_model.random_forest_regressor.verbose
    outs:
      - models/models

  # Runs predict_model.py with train.csv and val.csv, using the artifacts in
  # models/models. Declares no outputs.
  predict_model:
    cmd: python src/models/predict_model.py train.csv val.csv
    deps:
      - src/models/predict_model.py
      # NOTE(review): train.csv is passed on the command line, so it is
      # declared here alongside val.csv. Assumes the script resolves it to
      # data/processed/final/ like val.csv - confirm against predict_model.py.
      - data/processed/final/train.csv
      - data/processed/final/val.csv
      - models/models