-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathdvc.lock
More file actions
107 lines (107 loc) · 2.77 KB
/
dvc.lock
File metadata and controls
107 lines (107 loc) · 2.77 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
schema: '2.0'
stages:
data_ingestion:
cmd: python src/data/data_ingestion.py
deps:
- path: src/data/data_ingestion.py
hash: md5
md5: 6d5e6d7b4b4b387ac2f00b21339714b7
size: 4364
params:
params.yaml:
data_ingestion.test_size: 0.2
outs:
- path: data/raw
hash: md5
md5: e13bcce40396cd334c8a7a334868166a.dir
size: 6919701
nfiles: 2
data_preprocessing:
cmd: python src/data/data_preprocessing.py
deps:
- path: data/raw/test.csv
hash: md5
md5: ea97ba82a4a25627bf4ffb52572484ea
size: 1348612
- path: data/raw/train.csv
hash: md5
md5: 1bd422dd6d135bced1d6c64a3e84a45d
size: 5571089
- path: src/data/data_preprocessing.py
hash: md5
md5: d53f52f87e43f8270599bcf75746cdcc
size: 3983
outs:
- path: data/interim
hash: md5
md5: ba42408e7bd1e85685474d6a349ae57e.dir
size: 5134850
nfiles: 2
model_building:
cmd: python src/model/model_building.py
deps:
- path: data/interim/train_processed.csv
hash: md5
md5: 35027dfda8274bd9356544f2ff358aa4
size: 4134324
- path: src/model/model_building.py
hash: md5
md5: d2b9d6bafc76e98c46bb1633eac85b3d
size: 5740
params:
params.yaml:
model_building.learning_rate: 0.09
model_building.max_depth: 20
model_building.max_features: 1000
model_building.n_estimators: 367
model_building.ngram_range:
- 1
- 3
outs:
- path: lgbm_model.pkl
hash: md5
md5: 1645f072eb06f11285658e0181d76e6c
size: 3886710
- path: tfidf_vectorizer.pkl
hash: md5
md5: 54ae4ccbfc21a3927f9334a22d4c3c35
size: 36874
model_evaluation:
cmd: python src/model/model_evaluation.py
deps:
- path: data/interim/test_processed.csv
hash: md5
md5: 4f30375397ec89fead1745ee6d70f201
size: 1000526
- path: data/interim/train_processed.csv
hash: md5
md5: 35027dfda8274bd9356544f2ff358aa4
size: 4134324
- path: lgbm_model.pkl
hash: md5
md5: 1645f072eb06f11285658e0181d76e6c
size: 3886710
- path: src/model/model_evaluation.py
hash: md5
md5: 144add1348069aab9f01232678429851
size: 7626
- path: tfidf_vectorizer.pkl
hash: md5
md5: 54ae4ccbfc21a3927f9334a22d4c3c35
size: 36874
outs:
- path: experiment_info.json
hash: md5
md5: 335fdc9e7952a6cf9f057ca68dedb31c
size: 87
model_registration:
cmd: python src/model/register_model.py
deps:
- path: experiment_info.json
hash: md5
md5: 335fdc9e7952a6cf9f057ca68dedb31c
size: 87
- path: src/model/register_model.py
hash: md5
md5: b68514c1060f1e2232eefc5bc9c235e8
size: 2537