-
Notifications
You must be signed in to change notification settings - Fork 0
/
dvc.lock
167 lines (167 loc) · 4.84 KB
/
dvc.lock
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
schema: '2.0'
stages:
extract_dataset:
cmd: python .\src\data\extract_dataset.py
deps:
- path: .\data\raw\zipped
hash: md5
md5: 2ac9e57fc0bc2d2a1a610a695529d479.dir
size: 87295035
nfiles: 2
- path: .\src\data\extract_dataset.py
hash: md5
md5: e13ce767752277added5382c0f74dfe9
size: 1711
outs:
- path: .\data\raw\extracted
hash: md5
md5: 07dcb976ec534725901d50758a399273.dir
size: 271383386
nfiles: 2
make_dataset:
cmd: python .\src\data\make_dataset.py train.csv
deps:
- path: .\data\raw\extracted\train.csv
hash: md5
md5: e59c291a4b1c640f1dab33b89daa22e1
size: 200589097
- path: .\src\data\make_dataset.py
hash: md5
md5: 63f7cb7eb76659d9face16c29dc0e15b
size: 4052
params:
params.yaml:
make_dataset.random_state: 30
make_dataset.test_size: 0.1
outs:
- path: .\data\interim
hash: md5
md5: 5441a97a8e44bdeb11d92d9f11b71186.dir
size: 197004804
nfiles: 2
modify_features:
cmd: python .\src\features\modify_features.py data/interim/train.csv data/interim/val.csv
data/raw/extracted/test.csv
deps:
- path: .\data\interim\train.csv
hash: md5
md5: 9282cea0cb6ddf4bdcca66b54678d900
size: 177304798
- path: .\data\interim\val.csv
hash: md5
md5: a41f9bd08b4d05d4701038b4a609104f
size: 19700006
- path: .\data\raw\extracted\test.csv
hash: md5
md5: 0686e4fc98617485dba9fdbabbf1c48d
size: 70794289
- path: .\src\features\modify_features.py
hash: md5
md5: 101954674b493f450de41d3ade407aed
size: 9064
outs:
- path: .\data\processed\transformations
hash: md5
md5: eb8e4295d496ba625c38a500d63ba12d.dir
size: 208192931
nfiles: 3
build_features:
cmd: python .\src\features\build_features.py data/processed/transformations/train.csv
data/processed/transformations/val.csv data/processed/transformations/test.csv
deps:
- path: .\data\processed\transformations\test.csv
hash: md5
md5: 2b77a8e04bfa86ff4e9e7f475c34f001
size: 56394464
- path: .\data\processed\transformations\train.csv
hash: md5
md5: 8b13bb1fae56714208a779f2d2c9a7c8
size: 136614671
- path: .\data\processed\transformations\val.csv
hash: md5
md5: 1e2b47d7113ff47296ad9fb36cdc8472
size: 15183796
- path: .\src\features\build_features.py
hash: md5
md5: 72d6e05893eece88723b591b9ebbf870
size: 2250
outs:
- path: .\data\processed\build-features
hash: md5
md5: 32a5a2e6cd272e22860adbd7bac1348c.dir
size: 331246740
nfiles: 3
data_preprocessing:
cmd: python .\src\features\data_preprocessing.py train.csv val.csv test.csv
deps:
- path: .\data\processed\build-features\test.csv
hash: md5
md5: 7f579e643d6352b7b311a5ba7062d2a8
size: 93345469
- path: .\data\processed\build-features\train.csv
hash: md5
md5: fd3df5bb8d535640a6b5f07fff333311
size: 214106185
- path: .\data\processed\build-features\val.csv
hash: md5
md5: 7c5f78bd281035f2d4c220858b4888ac
size: 23795086
- path: .\src\features\data_preprocessing.py
hash: md5
md5: eed63e4299e98a2989478d6f0678278f
size: 7539
params:
params.yaml:
data_preprocessing.percentiles:
- 0.002
- 0.998
outs:
- path: .\data\processed\final
hash: md5
md5: b22b82a594bf7227d55905b602b20e91.dir
size: 351588991
nfiles: 3
- path: .\models\transformers
hash: md5
md5: d8165f9efb0cac74a6bce75407ee523d.dir
size: 7529
nfiles: 3
train_model:
cmd: python .\src\models\train_model.py data/processed/final/train.csv
deps:
- path: .\data\processed\final\train.csv
hash: md5
md5: 5f9906c51a1abce4bd8530a0bb780528
size: 229128192
- path: .\src\models\train_model.py
hash: md5
md5: 612aadd8d39f25061fe735f747a24c5b
size: 1817
params:
params.yaml:
train_model.random_forest_regressor.max_depth: 5
train_model.random_forest_regressor.n_estimators: 20
train_model.random_forest_regressor.n_jobs: -1
train_model.random_forest_regressor.verbose: 2
outs:
- path: .\models\models
hash: md5
md5: 0d348acd440525c27f292bbb98d4ddd4.dir
size: 98849
nfiles: 1
predict_model:
cmd: python .\src\models\predict_model.py train.csv val.csv
deps:
- path: .\data\processed\final\val.csv
hash: md5
md5: 28da71eff09a2ce8c92c0aa06d48816c
size: 25463541
- path: .\models\models
hash: md5
md5: 0d348acd440525c27f292bbb98d4ddd4.dir
size: 98849
nfiles: 1
- path: .\src\models\predict_model.py
hash: md5
md5: 0665467fc68846f046db803dc4900d48
size: 1641