-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathdvc.lock
More file actions
107 lines (107 loc) · 2.77 KB
/
dvc.lock
File metadata and controls
107 lines (107 loc) · 2.77 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
schema: '2.0'
stages:
data_ingestion:
cmd: python src/data/data_ingestion.py
deps:
- path: src/data/data_ingestion.py
hash: md5
md5: 80e0647270a694ede66c099babe031b0
size: 3812
params:
params.yaml:
data_ingestion.test_size: 0.2
outs:
- path: data/raw
hash: md5
md5: e13bcce40396cd334c8a7a334868166a.dir
size: 6919701
nfiles: 2
data_preprocessing:
cmd: python src/data/data_preprocessing.py
deps:
- path: data/raw/test.csv
hash: md5
md5: ea97ba82a4a25627bf4ffb52572484ea
size: 1348612
- path: data/raw/train.csv
hash: md5
md5: 1bd422dd6d135bced1d6c64a3e84a45d
size: 5571089
- path: src/data/data_preprocessing.py
hash: md5
md5: ee5bfac5bda889140222edeb9d21f782
size: 3466
outs:
- path: data/interim
hash: md5
md5: ba42408e7bd1e85685474d6a349ae57e.dir
size: 5134850
nfiles: 2
model_building:
cmd: python src/model/model_building.py
deps:
- path: data/interim/train_processed.csv
hash: md5
md5: 35027dfda8274bd9356544f2ff358aa4
size: 4134324
- path: src/model/model_building.py
hash: md5
md5: 9efb818fcf973a839944c5cc3def37a5
size: 5067
params:
params.yaml:
model_building.learning_rate: 0.09
model_building.max_depth: 20
model_building.max_features: 1000
model_building.n_estimators: 367
model_building.ngram_range:
- 1
- 3
outs:
- path: lgbm_model.pkl
hash: md5
md5: 9bf3b63ef863c9870dd8bb345d738e69
size: 3886723
- path: tfidf_vectorizer.pkl
hash: md5
md5: 5d23166feb3e16832de189534c4579ad
size: 36874
model_evaluation:
cmd: python src/model/model_evaluation.py
deps:
- path: data/interim/test_processed.csv
hash: md5
md5: 4f30375397ec89fead1745ee6d70f201
size: 1000526
- path: data/interim/train_processed.csv
hash: md5
md5: 35027dfda8274bd9356544f2ff358aa4
size: 4134324
- path: lgbm_model.pkl
hash: md5
md5: 9bf3b63ef863c9870dd8bb345d738e69
size: 3886723
- path: src/model/model_evaluation.py
hash: md5
md5: 4e5696548e0d12285358d1985be6de8f
size: 6340
- path: tfidf_vectorizer.pkl
hash: md5
md5: 5d23166feb3e16832de189534c4579ad
size: 36874
outs:
- path: experiment_info.json
hash: md5
md5: 5bcc968bd8e1ec6a69d752e4349f0dda
size: 87
model_registration:
cmd: python src/model/register_model.py
deps:
- path: experiment_info.json
hash: md5
md5: 5bcc968bd8e1ec6a69d752e4349f0dda
size: 87
- path: src/model/register_model.py
hash: md5
md5: 76d9a8ce9477f6c22783654fe3769b1f
size: 2504