# dvc.lock
# DVC lock file: records, for every pipeline stage, the command that was run
# together with the md5 hash and byte size of each dependency and output, and
# the parameter values read from params.yaml.
# NOTE(review): dvc.lock is normally written by DVC itself; prefer refreshing
# it with `dvc repro` / `dvc commit` over hand-editing hashes — confirm.
schema: '2.0'
stages:
  # Splits data/updated_train.csv into train/test feature and label arrays.
  data-split:
    cmd: python3 src/data_split.py
    deps:
    - path: data/updated_train.csv
      md5: 886b586f88a80c2a48e7b9a9bbfab03e
      size: 68899220
    - path: src/data_split.py
      md5: 054a1dddaf91131d5c890907513b6fd7
      size: 1102
    outs:
    - path: data/processed_data/x_test.npy
      md5: 297d701ee718de8f6d937797c70a78e5
      size: 12987088
    - path: data/processed_data/x_train.npy
      md5: 24a1f979d75947c5109cb4317ad96337
      size: 34624275
    - path: data/processed_data/y_test.npy
      md5: fb3f6fa921623491317d186fc25ba885
      size: 3582896
    - path: data/processed_data/y_train.npy
      md5: a1cdc0b02798bade093964500fe6f019
      size: 9486528
  # Runs src/data_preprocess.py on the split feature arrays.
  # NOTE(review): the x_train.npy hash/size recorded below (7eec7ac...,
  # 33512228) differ from the value produced by data-split and consumed by
  # model-training (24a1f97..., 34624275), and this stage records no outs.
  # The entry looks stale — presumably the stage needs to be re-run with
  # `dvc repro data-preprocess`; verify before relying on it.
  data-preprocess:
    cmd: python3 src/data_preprocess.py
    deps:
    - path: data/processed_data/x_test.npy
      md5: 297d701ee718de8f6d937797c70a78e5
      size: 12987088
    - path: data/processed_data/x_train.npy
      md5: 7eec7ac8791fba43cc41c5c477f7b92e
      size: 33512228
    - path: src/data_preprocess.py
      md5: 2a7f3f0365b1ee9fd5285be250e5d3d1
      size: 1166
    params:
      params.yaml:
        data-preprocess.embedding_dim: 300
        data-preprocess.sequence_len: 200
        data-preprocess.vocab_size: 100000
  # Trains the classifier from the training arrays; emits the model, the
  # tokenizer and two training plots.
  model-training:
    cmd: python3 src/model_training.py
    deps:
    - path: data/processed_data/x_train.npy
      md5: 24a1f979d75947c5109cb4317ad96337
      size: 34624275
    - path: data/processed_data/y_train.npy
      md5: a1cdc0b02798bade093964500fe6f019
      size: 9486528
    - path: src/model_training.py
      md5: c1520bcdd58618d5c56daeb6caebf90a
      size: 4265
    params:
      params.yaml:
        model-training.batch_size: 32
        model-training.epochs: 2
        model-training.val_split: 0.2
    outs:
    - path: auc.jpg
      md5: 276136ed37a26c3d5ed9d6f134cfefdf
      size: 21352
    - path: log_loss.jpg
      md5: fda0a8ca93f3061b7c33b1d38187bf58
      size: 17708
    - path: models/tokenizer.pkl
      md5: 42aff95b4b7b6f20df59f687ec931676
      size: 6833489
    - path: models/toxicity_classifier.h5
      md5: dd9be985c4fcc76be109e864b50dd63c
      size: 185288576
  # Evaluates the trained model on the test arrays; emits plots and
  # scores.json.
  model-evaluation:
    cmd: python3 src/model_evaluation.py
    deps:
    - path: data/processed_data/x_test.npy
      md5: 297d701ee718de8f6d937797c70a78e5
      size: 12987088
    - path: data/processed_data/y_test.npy
      md5: fb3f6fa921623491317d186fc25ba885
      size: 3582896
    - path: models/toxicity_classifier.h5
      md5: dd9be985c4fcc76be109e864b50dd63c
      size: 185288576
    - path: src/model_evaluation.py
      md5: b50ab2515d69432b4cff4c5bcf5c6cd7
      size: 3141
    outs:
    - path: auc_roc.jpg
      md5: 2ed10d9e2f9b668d056a1d8d4f08dd1b
      size: 57233
    - path: confusion_matrix.jpg
      md5: 14dbbddde200fe61cc2987cb455d01ac
      size: 123546
    - path: scores.json
      md5: 91464694715c18fd63ad1aecf00c5487
      size: 32