-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathdvc.lock
More file actions
134 lines (134 loc) · 3.56 KB
/
dvc.lock
File metadata and controls
134 lines (134 loc) · 3.56 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
schema: '2.0'
stages:
download:
cmd: python3 -m src.data.download_raw_dataset
deps:
- path: src/config.py
hash: md5
md5: a883d0dec1704d3fcd889893bd8d4c48
size: 1290
- path: src/data/download_raw_dataset.py
hash: md5
md5: 810f4f307477b783266e99604b847e57
size: 649
outs:
- path: data/raw/imdb.parquet
hash: md5
md5: 8ba8a331da61fbf65a154c374da782d1
size: 25169132
preprocess:
cmd: python3 -m src.data.preprocess
deps:
- path: data/raw/imdb.parquet
hash: md5
md5: 8ba8a331da61fbf65a154c374da782d1
size: 25169132
- path: src/config.py
hash: md5
md5: a883d0dec1704d3fcd889893bd8d4c48
size: 1290
- path: src/data/preprocess.py
hash: md5
md5: f6a9a45818fb4648feeab6eec739880f
size: 1603
outs:
- path: data/interim/imdb_cleaned.parquet
hash: md5
md5: 294e39e32874afecd71ca8b19b133b5f
size: 25778404
split:
cmd: python3 -m src.data.split_data
deps:
- path: data/interim/imdb_cleaned.parquet
hash: md5
md5: 294e39e32874afecd71ca8b19b133b5f
size: 25778404
- path: src/config.py
hash: md5
md5: a883d0dec1704d3fcd889893bd8d4c48
size: 1290
- path: src/data/split_data.py
hash: md5
md5: 4382ad1339e71501b336b2320ded9aec
size: 1148
outs:
- path: data/processed/test.parquet
hash: md5
md5: ef6cb503ef27b981bb9bd0a976fb2fb3
size: 2613951
- path: data/processed/train.parquet
hash: md5
md5: cc999769d5051de562fa0583b425be7c
size: 18026684
- path: data/processed/validation.parquet
hash: md5
md5: 9e533ef8e2c19823c3988506cf4c0e2b
size: 5171217
train:
cmd: python3 -m src.modeling.train
deps:
- path: data/processed/train.parquet
hash: md5
md5: cc999769d5051de562fa0583b425be7c
size: 18026684
- path: data/processed/validation.parquet
hash: md5
md5: 9e533ef8e2c19823c3988506cf4c0e2b
size: 5171217
- path: src/config.py
hash: md5
md5: a883d0dec1704d3fcd889893bd8d4c48
size: 1290
- path: src/modeling/train.py
hash: md5
md5: 9e6057a08e5a83b965049ca21dffd189
size: 3590
outs:
- path: models/distilbert-imdb
hash: md5
md5: fb0d8cac7e49876c0f0bf6af02ccc0f3.dir
size: 268783444
nfiles: 7
- path: models/distilbert-imdb-checkpoint
hash: md5
md5: ce6d47edf053239131c230d2f849b968.dir
size: 804528074
nfiles: 11
evaluate:
cmd: python3 -m src.modeling.evaluate
deps:
- path: data/processed/test.parquet
hash: md5
md5: fe80344fbb6c1cb5257c8e91da71f07c
size: 2613371
- path: models/distilbert-imdb
hash: md5
md5: 267dbc22d66ac42d6ba5fa687e8c4e43.dir
size: 268783346
nfiles: 7
- path: src/modeling/evaluate.py
hash: md5
md5: 7e6451f0642f20a55ba46abf29973138
size: 1121
configure_gx:
cmd: python3 -m src.data.gx_context_configuration
deps:
- path: src/data/gx_context_configuration.py
hash: md5
md5: 3a61ff2758fdfc14e6c6003f5162a6be
size: 3718
validate-data:
cmd: python3 -m src.data.validate_data
deps:
- path: data/interim/imdb_cleaned.parquet
hash: md5
md5: 294e39e32874afecd71ca8b19b133b5f
size: 25778404
- path: src/data/gx_context_configuration.py
hash: md5
md5: 3a61ff2758fdfc14e6c6003f5162a6be
size: 3718
- path: src/data/validate_data.py
hash: md5
md5: f211bd7615c06e3a36d2c139f0953a69
size: 776