Register
Login
Resources
Docs Blog Datasets Glossary Case Studies Tutorials & Webinars
Product
Data Engine LLMs Platform Enterprise
Pricing Explore
Connect to our Discord channel

dvc.yaml 8.5 KB

You have to be logged in to leave a comment. Sign In
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
  1. stages:
  2. prepare: # Single stage: runs scripts.prepare
  3. cmd: python -m scripts.prepare
  4. deps:
  5. - scripts/prepare.py
  6. - data/all.csv
  7. params: # tracks the "basic" parameter key
  8. - basic
  9. outs: # both files are listed as deps by the validate and train stages
  10. - outputs/vocab.plk
  11. - outputs/config.json
  12. validate: # Runs scripts.validate once per model name in the foreach list
  13. foreach: # List of simple values; ${item} is the model name itself
  14. - mlp
  15. - lstm
  16. - cnn
  17. - selected
  18. do:
  19. cmd: python -m scripts.validate ${item}
  20. deps: # vocab.plk and config.json are the outs of the prepare stage
  21. - data/all.csv
  22. - outputs/vocab.plk
  23. - outputs/config.json
  24. - scripts/validate.py
  25. params: # tracks the per-model key (${item}) plus the shared "validate" key
  26. - ${item}
  27. - validate
  28. metrics:
  29. - outputs/${item}_validate_results.json:
  30. cache: false # DVC option: do not store this file in the DVC cache
  31. plots:
  32. - outputs/${item}_validate_plots.csv:
  33. cache: false # DVC option: do not store this file in the DVC cache
  34. validate_bert: # Runs scripts.validate_bert once per BERT model/method combination
  35. foreach: # Mapping of named items; each item provides pretrained_model and method
  36. bert-base-uncased_basic:
  37. pretrained_model: bert-base-uncased
  38. method: basic
  39. bert-base-uncased_lstm:
  40. pretrained_model: bert-base-uncased
  41. method: lstm
  42. bert-large-uncased_basic:
  43. pretrained_model: bert-large-uncased
  44. method: basic
  45. bert-large-uncased_lstm:
  46. pretrained_model: bert-large-uncased
  47. method: lstm
  48. do:
  49. cmd: python -m scripts.validate_bert bert ${item.pretrained_model} ${item.method}
  50. deps: # the model source file is selected by method (basic.py or lstm.py)
  51. - data/all.csv
  52. - model/bert/${item.method}.py
  53. - scripts/validate_bert.py
  54. params: # shared bert.* keys, the per-method bert.<method> key, and "validate"
  55. - bert.max_len
  56. - bert.do_lower_case
  57. - bert.${item.method}
  58. - validate
  59. metrics:
  60. - outputs/bert-${item.pretrained_model}-${item.method}_validate_results.json:
  61. cache: false # DVC option: do not store this file in the DVC cache
  62. plots:
  63. - outputs/bert-${item.pretrained_model}-${item.method}_validate_plots.csv:
  64. cache: false # DVC option: do not store this file in the DVC cache
  65. validate_xlnet: # Runs scripts.validate_bert in xlnet mode once per method name
  66. foreach: # List of simple values; ${item} is the method name
  67. - basic
  68. - sequence_classification
  69. do: # NOTE(review): cmd passes one item argument here, while validate_bert/validate_roberta pass pretrained_model and method - confirm the script accepts both forms
  70. cmd: python -m scripts.validate_bert xlnet ${item}
  71. deps: # the model source file is selected by method name
  72. - data/all.csv
  73. - model/xlnet/${item}.py
  74. - scripts/validate_bert.py
  75. params: # the pretrained model is tracked as a parameter (xlnet.pretrained_model) rather than passed on the command line
  76. - xlnet.max_len
  77. - xlnet.${item}
  78. - xlnet.pretrained_model
  79. - validate
  80. metrics:
  81. - outputs/xlnet-${item}_validate_results.json:
  82. cache: false # DVC option: do not store this file in the DVC cache
  83. plots:
  84. - outputs/xlnet-${item}_validate_plots.csv:
  85. cache: false # DVC option: do not store this file in the DVC cache
  86. validate_roberta: # Runs scripts.validate_bert in roberta mode for the listed pretrained model
  87. foreach: # Mapping of named items; each item provides pretrained_model and method
  88. siebert/sentiment-roberta-large-english_sentiment:
  89. pretrained_model: siebert/sentiment-roberta-large-english # contains "/", so the interpolated outputs/roberta-... paths below fall under outputs/roberta-siebert/
  90. method: sentiment
  91. do:
  92. cmd: python -m scripts.validate_bert roberta ${item.pretrained_model} ${item.method}
  93. deps:
  94. - data/train.csv # NOTE(review): the other validate_* and train* stages depend on data/all.csv - confirm train.csv is intended
  95. - model/roberta/${item.method}.py
  96. - scripts/validate_bert.py
  97. params: # shared roberta.* keys, the per-method roberta.<method> key, and "validate"
  98. - roberta.max_len
  99. - roberta.do_lower_case
  100. - roberta.${item.method}
  101. - validate
  102. metrics:
  103. - outputs/roberta-${item.pretrained_model}-${item.method}_validate_results.json:
  104. cache: false # DVC option: do not store this file in the DVC cache
  105. plots:
  106. - outputs/roberta-${item.pretrained_model}-${item.method}_validate_plots.csv:
  107. cache: false # DVC option: do not store this file in the DVC cache
  108. train: # Runs scripts.train once per model name in the foreach list
  109. foreach: # List of simple values; ${item} is the model name itself
  110. - mlp
  111. - lstm
  112. - cnn
  113. - selected
  114. do:
  115. cmd: python -m scripts.train ${item}
  116. deps: # vocab.plk and config.json are the outs of the prepare stage
  117. - data/all.csv
  118. - outputs/vocab.plk
  119. - outputs/config.json
  120. - scripts/train.py
  121. params: # tracks the per-model key (${item}) plus the shared "train" key
  122. - ${item}
  123. - train
  124. metrics:
  125. - outputs/${item}_results.json:
  126. cache: false # DVC option: do not store this file in the DVC cache
  127. plots:
  128. - outputs/${item}_plots.csv:
  129. cache: false # DVC option: do not store this file in the DVC cache
  130. outs: # the checkpoint is listed as a dep by the inference stage
  131. - outputs/${item}_checkpoint.pth
  132. train_bert: # Runs scripts.train_bert in bert mode once per model/method combination
  133. foreach: # Mapping of named items; each item provides pretrained_model and method
  134. bert-base-uncased_basic:
  135. pretrained_model: bert-base-uncased
  136. method: basic
  137. bert-base-uncased_lstm:
  138. pretrained_model: bert-base-uncased
  139. method: lstm
  140. bert-large-uncased_basic:
  141. pretrained_model: bert-large-uncased
  142. method: basic
  143. bert-large-uncased_lstm:
  144. pretrained_model: bert-large-uncased
  145. method: lstm
  146. do:
  147. cmd: python -m scripts.train_bert bert ${item.pretrained_model} ${item.method}
  148. deps: # the model source file is selected by method (basic.py or lstm.py)
  149. - data/all.csv
  150. - model/bert/${item.method}.py
  151. - scripts/train_bert.py
  152. params: # shared bert.* keys, the per-method bert.<method> key, and "train"
  153. - bert.max_len
  154. - bert.do_lower_case
  155. - bert.${item.method}
  156. - train
  157. metrics:
  158. - outputs/bert-${item.pretrained_model}-${item.method}_results.json:
  159. cache: false # DVC option: do not store this file in the DVC cache
  160. plots:
  161. - outputs/bert-${item.pretrained_model}-${item.method}_plots.csv:
  162. cache: false # DVC option: do not store this file in the DVC cache
  163. outs: # the checkpoint is listed as a dep by the inference_bert stage
  164. - outputs/bert-${item.pretrained_model}-${item.method}_checkpoint.pth
  165. train_xlnet: # Runs scripts.train_bert in xlnet mode once per model/method combination
  166. foreach: # Mapping of named items; each item provides pretrained_model and method
  167. xlnet-base-cased_basic:
  168. pretrained_model: xlnet-base-cased
  169. method: basic
  170. xlnet-large-cased_basic:
  171. pretrained_model: xlnet-large-cased
  172. method: basic
  173. do:
  174. cmd: python -m scripts.train_bert xlnet ${item.pretrained_model} ${item.method}
  175. deps: # the model source file is selected by method
  176. - data/all.csv
  177. - model/xlnet/${item.method}.py
  178. - scripts/train_bert.py
  179. params: # shared xlnet.* keys, the per-method xlnet.<method> key, and "train"
  180. - xlnet.max_len
  181. - xlnet.do_lower_case
  182. - xlnet.${item.method}
  183. - train
  184. metrics:
  185. - outputs/xlnet-${item.pretrained_model}-${item.method}_results.json:
  186. cache: false # DVC option: do not store this file in the DVC cache
  187. plots:
  188. - outputs/xlnet-${item.pretrained_model}-${item.method}_plots.csv:
  189. cache: false # DVC option: do not store this file in the DVC cache
  190. outs: # the checkpoint is listed as a dep by the inference_xlnet stage
  191. - outputs/xlnet-${item.pretrained_model}-${item.method}_checkpoint.pth
  192. train_roberta: # Runs scripts.train_bert in roberta mode once per model/method combination
  193. foreach: # Mapping of named items; each item provides pretrained_model and method
  194. roberta-base_basic:
  195. pretrained_model: roberta-base
  196. method: basic
  197. roberta-large_basic:
  198. pretrained_model: roberta-large
  199. method: basic
  200. do:
  201. cmd: python -m scripts.train_bert roberta ${item.pretrained_model} ${item.method}
  202. deps: # the model source file is selected by method
  203. - data/all.csv
  204. - model/roberta/${item.method}.py
  205. - scripts/train_bert.py
  206. params: # shared roberta.* keys, the per-method roberta.<method> key, and "train"
  207. - roberta.max_len
  208. - roberta.do_lower_case
  209. - roberta.${item.method}
  210. - train
  211. metrics:
  212. - outputs/roberta-${item.pretrained_model}-${item.method}_results.json:
  213. cache: false # DVC option: do not store this file in the DVC cache
  214. plots:
  215. - outputs/roberta-${item.pretrained_model}-${item.method}_plots.csv:
  216. cache: false # DVC option: do not store this file in the DVC cache
  217. outs: # the checkpoint is listed as a dep by the inference_roberta stage
  218. - outputs/roberta-${item.pretrained_model}-${item.method}_checkpoint.pth
  219. inference: # Runs scripts.inference once per model name in the foreach list
  220. foreach: # List of simple values; ${item} is the model name itself
  221. - mlp
  222. - lstm
  223. - cnn
  224. - selected
  225. do:
  226. cmd: python -m scripts.inference ${item}
  227. deps: # the checkpoint path matches the outs of the train stage; config.json is an out of prepare
  228. - data/test.csv
  229. - scripts/inference.py
  230. - outputs/${item}_checkpoint.pth
  231. - outputs/config.json
  232. outs: # one submission file per model name
  233. - outputs/${item}_submission.csv
  234. inference_bert: # Runs scripts.inference_bert in bert mode once per model/method combination
  235. foreach: # Mapping of named items; each item provides pretrained_model and method
  236. bert-base-uncased_basic:
  237. pretrained_model: bert-base-uncased
  238. method: basic
  239. bert-base-uncased_lstm:
  240. pretrained_model: bert-base-uncased
  241. method: lstm
  242. bert-large-uncased_basic:
  243. pretrained_model: bert-large-uncased
  244. method: basic
  245. bert-large-uncased_lstm:
  246. pretrained_model: bert-large-uncased
  247. method: lstm
  248. do:
  249. cmd: python -m scripts.inference_bert bert ${item.pretrained_model} ${item.method}
  250. deps: # the checkpoint path matches the outs of the train_bert stage
  251. - data/test.csv
  252. - scripts/inference_bert.py
  253. - outputs/bert-${item.pretrained_model}-${item.method}_checkpoint.pth
  254. outs: # one submission file per model/method combination
  255. - outputs/bert-${item.pretrained_model}-${item.method}_submission.csv
  256. inference_xlnet: # Runs scripts.inference_bert in xlnet mode once per model/method combination
  257. foreach: # Mapping of named items; each item provides pretrained_model and method
  258. xlnet-base-cased_basic:
  259. pretrained_model: xlnet-base-cased
  260. method: basic
  261. xlnet-large-cased_basic:
  262. pretrained_model: xlnet-large-cased
  263. method: basic
  264. do:
  265. cmd: python -m scripts.inference_bert xlnet ${item.pretrained_model} ${item.method}
  266. deps: # the checkpoint path matches the outs of the train_xlnet stage
  267. - data/test.csv
  268. - scripts/inference_bert.py
  269. - outputs/xlnet-${item.pretrained_model}-${item.method}_checkpoint.pth
  270. outs: # one submission file per model/method combination
  271. - outputs/xlnet-${item.pretrained_model}-${item.method}_submission.csv
  272. inference_roberta: # Runs scripts.inference_bert in roberta mode once per model/method combination
  273. foreach: # Mapping of named items; each item provides pretrained_model and method
  274. roberta-base_basic:
  275. pretrained_model: roberta-base
  276. method: basic
  277. roberta-large_basic:
  278. pretrained_model: roberta-large
  279. method: basic
  280. do:
  281. cmd: python -m scripts.inference_bert roberta ${item.pretrained_model} ${item.method}
  282. deps: # the checkpoint path matches the outs of the train_roberta stage
  283. - data/test.csv
  284. - scripts/inference_bert.py
  285. - outputs/roberta-${item.pretrained_model}-${item.method}_checkpoint.pth
  286. outs: # one submission file per model/method combination
  287. - outputs/roberta-${item.pretrained_model}-${item.method}_submission.csv
Tip!

Press p or ← to see the previous file, or n or → to see the next file

Comments

Loading...