# dvc.lock — 139 lines (139 loc) · 4.71 KB
# DVC lock file (schema 2.0). For each pipeline stage it pins the command that
# was run, the md5/size of every dependency and output, and the parameter
# values read from params.yaml. This file is normally written by DVC itself;
# regenerate it with DVC rather than editing hashes by hand.
schema: '2.0'
stages:
  # Runs pipeline/preprocess/run.py on census.csv and writes
  # preprocessing_data.csv.
  preprocess:
    cmd: python pipeline/preprocess/run.py --input_artifact_name pipeline/data/census.csv
      --output_artifact_name pipeline/data/preprocessing_data.csv
    deps:
    - path: pipeline/data/census.csv
      md5: 145de00f6e6053d3f7044628f9a5b5ff
      size: 3974474
    - path: pipeline/preprocess/run.py
      md5: e3b6a0b55e21a6647c04b1a51a259701
      size: 2428
    outs:
    - path: pipeline/data/preprocessing_data.csv
      md5: 4309856f7edb21206b5193724ff484b0
      size: 3515984
  # Runs the pytest suite in pipeline/check_data against
  # preprocessing_data.csv; this stage tracks no outputs.
  datacheck:
    cmd: pytest pipeline/check_data -s -vv --sample_artifact pipeline/data/preprocessing_data.csv
      --param params.yaml
    deps:
    - path: pipeline/check_data/conftest.py
      md5: cf5c36dedec8f18fddc9294d1b29a240
      size: 1269
    - path: pipeline/check_data/test_data.py
      md5: 274655585642e55ba840d0d59e830d7b
      size: 4049
    - path: pipeline/data/preprocessing_data.csv
      md5: 4309856f7edb21206b5193724ff484b0
      size: 3515984
    params:
      params.yaml:
        data.ks_alpha: 0.05
        data.reference_dataset: pipeline/data/preprocessing_data.csv
  # Runs pipeline/segregate/run.py on preprocessing_data.csv and writes
  # test_data.csv and train_data.csv.
  segregate:
    cmd: python pipeline/segregate/run.py --input_artifact pipeline/data/preprocessing_data.csv
      --param params.yaml
    deps:
    - path: pipeline/data/preprocessing_data.csv
      md5: 4309856f7edb21206b5193724ff484b0
      size: 3515984
    - path: pipeline/segregate/run.py
      md5: 9e3a0ba0757148d65dda03fa6587d7a2
      size: 2489
    params:
      params.yaml:
        data.stratify: salary
        data.test_size: 0.3
        main.random_seed: 42
    outs:
    - path: pipeline/data/test_data.csv
      md5: 63879402361c93a2ef2589ffb0f3f0bc
      size: 1054435
    - path: pipeline/data/train_data.csv
      md5: 41bf494a1a72935d10542c743ce8b06a
      size: 2461705
  # Runs pipeline/train/run.py on train_data.csv and writes encoder_export,
  # model_export and train_scores.json.
  train:
    cmd: python pipeline/train/run.py --train_data pipeline/data/train_data.csv --param
      params.yaml --score_file pipeline/data/train_scores.json
    deps:
    - path: pipeline/data/train_data.csv
      md5: 41bf494a1a72935d10542c743ce8b06a
      size: 2461705
    - path: pipeline/train/helper.py
      md5: 18670b995dd6861e998f045885d2ba93
      size: 4400
    - path: pipeline/train/run.py
      md5: 11a247c22e8a40fe882b875c8c2953b1
      size: 5136
    - path: pipeline/train/transformer_feature.py
      md5: 62a2f8c4623bbfc1c45108f2a7367e01
      size: 4893
    params:
      params.yaml:
        data.stratify: salary
        data.val_size: 0.3
        main.random_seed: 42
        train.export_artifact: pipeline/data/model_export
    outs:
    - path: pipeline/data/encoder_export
      md5: c84ed6bd7e06ea14739c62ef12d16aa8
      size: 503
    - path: pipeline/data/model_export
      md5: b8f59c9da3b7266271b89ab7e3f678f4
      size: 7057678
    - path: pipeline/data/train_scores.json
      md5: 5f13d837ed8398d8b917d3008a26f0f0
      size: 139
  # Runs pipeline/evaluate/run.py with test_data.csv and the exported
  # model/encoder, and writes test_scores.json and slice_output.json.
  evaluate:
    cmd: python pipeline/evaluate/run.py --test_data pipeline/data/test_data.csv --model
      pipeline/data/model_export --encoder pipeline/data/encoder_export --score_file
      pipeline/data/test_scores.json --slice_file pipeline/data/slice_output.json
    deps:
    - path: pipeline/data/encoder_export
      md5: c84ed6bd7e06ea14739c62ef12d16aa8
      size: 503
    - path: pipeline/data/model_export
      md5: b8f59c9da3b7266271b89ab7e3f678f4
      size: 7057678
    - path: pipeline/data/test_data.csv
      md5: 63879402361c93a2ef2589ffb0f3f0bc
      size: 1054435
    - path: pipeline/evaluate/run.py
      md5: c5a5cfd3be79d3913d91ac7a937936a0
      size: 4234
    - path: pipeline/train/helper.py
      md5: 18670b995dd6861e998f045885d2ba93
      size: 4400
    - path: pipeline/train/transformer_feature.py
      md5: 62a2f8c4623bbfc1c45108f2a7367e01
      size: 4893
    outs:
    - path: pipeline/data/slice_output.json
      md5: 60821caee5c169094bdf2130455789cd
      size: 20428
    - path: pipeline/data/test_scores.json
      md5: 65dc5ce17b819ba6aad65f00802e4da1
      size: 139
  # Runs the pytest suite in pipeline/check_model against test_data.csv and
  # the exported model/encoder; this stage tracks no outputs.
  check_model:
    cmd: pytest pipeline/check_model -s -vv --test_data pipeline/data/test_data.csv
      --model pipeline/data/model_export --encoder pipeline/data/encoder_export
    deps:
    - path: pipeline/check_model/conftest.py
      md5: 5b0828906c0c5dd462da38375121922c
      size: 1456
    - path: pipeline/check_model/test_model.py
      md5: cbe1be2b91aa98c0e526da589f0f4857
      size: 961
    - path: pipeline/data/encoder_export
      md5: c84ed6bd7e06ea14739c62ef12d16aa8
      size: 503
    - path: pipeline/data/model_export
      md5: b8f59c9da3b7266271b89ab7e3f678f4
      size: 7057678
    - path: pipeline/data/test_data.csv
      md5: 63879402361c93a2ef2589ffb0f3f0bc
      size: 1054435
    - path: pipeline/train/transformer_feature.py
      md5: 62a2f8c4623bbfc1c45108f2a7367e01
      size: 4893