5
5
deps:
6
6
- path: data/data.xml
7
7
hash: md5
8
- md5: 22a1a2931c8370d3aeedd7183606fd7f
9
- size: 14445097
8
+ md5: 4bd325a30d5f1d5ea1a451d98767ddde
9
+ size: 59918667
10
10
- path: src/prepare.py
11
11
hash: md5
12
12
md5: f54d670ac8a4f63206781fc31d1f2651
@@ -18,38 +18,38 @@ stages:
18
18
outs:
19
19
- path: data/prepared
20
20
hash: md5
21
- md5: 153aad06d376b6595932470e459ef42a .dir
22
- size: 8437363
21
+ md5: f8934609be51496ee500f80eea539c6f .dir
22
+ size: 35339221
23
23
nfiles: 2
24
24
featurize:
25
25
cmd: python src/featurization.py data/prepared data/features
26
26
deps:
27
27
- path: data/prepared
28
28
hash: md5
29
- md5: 153aad06d376b6595932470e459ef42a .dir
30
- size: 8437363
29
+ md5: f8934609be51496ee500f80eea539c6f .dir
30
+ size: 35339221
31
31
nfiles: 2
32
32
- path: src/featurization.py
33
33
hash: md5
34
34
md5: e22789fc9581cad11ef7a6fa3aa3f17b
35
35
size: 4158
36
36
params:
37
37
params.yaml:
38
- featurize.max_features: 200
38
+ featurize.max_features: 500
39
39
featurize.ngrams: 2
40
40
outs:
41
41
- path: data/features
42
42
hash: md5
43
- md5: f35d4cc2c552ac959ae602162b8543f3 .dir
44
- size: 2232588
43
+ md5: 121056a1b192b22d31e15f61c8376928 .dir
44
+ size: 12597137
45
45
nfiles: 2
46
46
train:
47
47
cmd: python src/train.py data/features model.pkl
48
48
deps:
49
49
- path: data/features
50
50
hash: md5
51
- md5: f35d4cc2c552ac959ae602162b8543f3 .dir
52
- size: 2232588
51
+ md5: 121056a1b192b22d31e15f61c8376928 .dir
52
+ size: 12597137
53
53
nfiles: 2
54
54
- path: src/train.py
55
55
hash: md5
@@ -63,27 +63,27 @@ stages:
63
63
outs:
64
64
- path: model.pkl
65
65
hash: md5
66
- md5: d1f6e055f7f5e2827fcfae68d9b64d4c
67
- size: 1958115
66
+ md5: 0af1d96a26c6bdaca6094842c4bc45f3
67
+ size: 3365729
68
68
evaluate:
69
69
cmd: python src/evaluate.py model.pkl data/features
70
70
deps:
71
71
- path: data/features
72
72
hash: md5
73
- md5: f35d4cc2c552ac959ae602162b8543f3 .dir
74
- size: 2232588
73
+ md5: 121056a1b192b22d31e15f61c8376928 .dir
74
+ size: 12597137
75
75
nfiles: 2
76
76
- path: model.pkl
77
77
hash: md5
78
- md5: d1f6e055f7f5e2827fcfae68d9b64d4c
79
- size: 1958115
78
+ md5: 0af1d96a26c6bdaca6094842c4bc45f3
79
+ size: 3365729
80
80
- path: src/evaluate.py
81
81
hash: md5
82
82
md5: a1a59f55636170fb56e0c6afd3e28fa4
83
83
size: 3315
84
84
outs:
85
85
- path: eval
86
86
hash: md5
87
- md5: 80a081570c800c60b9b98ca4b3c91dd7 .dir
88
- size: 1292342
87
+ md5: 53c957a76e8202d50581613c16c5ee93 .dir
88
+ size: 4964257
89
89
nfiles: 8
0 commit comments