generated from c17hawke/dvc-project-template
-
Notifications
You must be signed in to change notification settings - Fork 9
/
Copy pathdvc.lock
147 lines (147 loc) · 4.34 KB
/
dvc.lock
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
schema: '2.0'
stages:
stage_name:
cmd: python src/stage_01_get_data.py --config=configs/config.yaml
deps:
- path: configs/config.yaml
md5: 231ed57d027344adbbbea246e5c44a57
size: 549
- path: src/stage_01_get_data.py
md5: 22e6655fde373d36cdfd3ec422e201d9
size: 1539
- path: src/utils/common.py
md5: d162961d817182441383bdb0e674e685
size: 675
outs:
- path: data/data.xml
md5: a304afb96060aad90176268345e10355
size: 37891850
get_data:
cmd: python src/stage_01_get_data.py --config=configs/config.yaml
deps:
- path: configs/config.yaml
md5: e4f15537f7c52f9120025cd06d4250b3
size: 565
- path: src/stage_01_get_data.py
md5: 22e6655fde373d36cdfd3ec422e201d9
size: 1539
- path: src/utils/common.py
md5: da75efcaa8787eb12aa16e9c351947cd
size: 1000
outs:
- path: data/data.xml
md5: a304afb96060aad90176268345e10355
size: 37891850
prepare_data:
cmd: python src/stage_02_prepare.py --config=configs/config.yaml --params=params.yaml
deps:
- path: configs/config.yaml
md5: e4f15537f7c52f9120025cd06d4250b3
size: 565
- path: data/data.xml
md5: a304afb96060aad90176268345e10355
size: 37891850
- path: src/stage_02_prepare.py
md5: 125808af32f7db5a2343c600b573787e
size: 2152
- path: src/utils/common.py
md5: da75efcaa8787eb12aa16e9c351947cd
size: 1000
- path: src/utils/data_mgmt.py
md5: 85d36c52eee5649090bc77738f442049
size: 864
params:
params.yaml:
prepare.seed: 2021
prepare.split: 0.2
outs:
- path: artifacts/prepared/test.tsv
md5: 60c757f3b30604473de7fa775dfc00d9
size: 4899778
- path: artifacts/prepared/train.tsv
md5: 553034c4cf40efc63c99c19fe98610d0
size: 18986541
featurize:
cmd: python src/stage_03_featurization.py --config=configs/config.yaml --params=params.yaml
deps:
- path: artifacts/prepared/test.tsv
md5: 60c757f3b30604473de7fa775dfc00d9
size: 4899778
- path: artifacts/prepared/train.tsv
md5: 553034c4cf40efc63c99c19fe98610d0
size: 18986541
- path: configs/config.yaml
md5: e4f15537f7c52f9120025cd06d4250b3
size: 565
- path: src/stage_03_featurization.py
md5: bb584c361c6ce8ffb0093568001f10e4
size: 2954
- path: src/utils/common.py
md5: da75efcaa8787eb12aa16e9c351947cd
size: 1000
- path: src/utils/featurize.py
md5: 282f60529535a7fb8dcde7a4e6a601e8
size: 504
params:
params.yaml:
featurize.max_features: 2500
featurize.ngrams: 3
outs:
- path: artifacts/features/test.pkl
md5: 9d2d234d20214def027d6281a57fd5da
size: 2630489
- path: artifacts/features/train.pkl
md5: 1f43679178ead568fa21eaf209639c65
size: 10246425
train:
cmd: python src/stage_04_train.py --config=configs/config.yaml --params=params.yaml
deps:
- path: artifacts/features/train.pkl
md5: 1f43679178ead568fa21eaf209639c65
size: 10246425
- path: configs/config.yaml
md5: e4f15537f7c52f9120025cd06d4250b3
size: 565
- path: src/stage_04_train.py
md5: a020ea0bd5eff3ff90d27a8e15c961f9
size: 2308
- path: src/utils/common.py
md5: da75efcaa8787eb12aa16e9c351947cd
size: 1000
params:
params.yaml:
train.min_split: 32
train.n_est: 110
train.seed: 2021
outs:
- path: artifacts/model/model.pkl
md5: 0434b51c875ee93ccc6b29ed4938223d
size: 3188471
evaluate:
cmd: python src/stage_05_evaluate.py --config=configs/config.yaml
deps:
- path: artifacts/features/test.pkl
md5: 9d2d234d20214def027d6281a57fd5da
size: 2630489
- path: artifacts/model/model.pkl
md5: 0434b51c875ee93ccc6b29ed4938223d
size: 3188471
- path: configs/config.yaml
md5: e4f15537f7c52f9120025cd06d4250b3
size: 565
- path: src/stage_05_evaluate.py
md5: dd3ff7294a16066870cc401c259a55a7
size: 2785
- path: src/utils/common.py
md5: da75efcaa8787eb12aa16e9c351947cd
size: 1000
outs:
- path: prc.json
md5: e72f5472dfb992d5d3c5a9171d010097
size: 124910
- path: roc.json
md5: 714e129de6314a25562ed6cd3f6c5229
size: 67536
- path: scores.json
md5: 67a5ab5142e285735e4769d6ba117c4a
size: 76