Register
Login
Resources
Docs Blog Datasets Glossary Case Studies Tutorials & Webinars
Product
Data Engine LLMs Platform Enterprise
Pricing Explore
Connect to our Discord channel

dvc.lock 11 KB

You have to be logged in to leave a comment. Sign In
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
  1. schema: '2.0'
  2. stages:
  3. az-ratings:
  4. cmd: python run.py --rust pcat -t az.raw_ratings -s az-ratings -T import/az-ratings.transcript
  5. -D az-schema -f CSV data/ratings_Books.csv
  6. deps:
  7. - path: data/ratings_Books.csv
  8. md5: 77b4a5b887e14e16b13e7788bdf70156
  9. size: 916259348
  10. - path: schemas/az-schema.status
  11. md5: 01a7ee13889d967ed8ac69bfdf592d80
  12. size: 199
  13. outs:
  14. - path: import/az-ratings.transcript
  15. md5: 4266a96f87e134dac6b60df0514a36d2
  16. bx-ratings:
  17. cmd: python run.py bx-import -T import/bx-ratings.transcript data/BX-Book-Ratings.csv
  18. deps:
  19. - path: data/BX-Book-Ratings.csv
  20. md5: b34fe0534c9b846b8a45f316c60eb92b
  21. size: 30682276
  22. - path: schemas/bx-schema.status
  23. md5: 48cd11df72cf2bb28d5a2ff58f02d972
  24. size: 199
  25. outs:
  26. - path: import/bx-ratings.transcript
  27. md5: 511096523052e1563c4bdcc66b6ed143
  28. gr-authors:
  29. cmd: python run.py --rust import-json -T import/gr-authors.transcript --stage
  30. gr-authors -D gr-schema --truncate import/gr-authors.toml data/goodreads_book_authors.json.gz
  31. deps:
  32. - path: data/goodreads_book_authors.json.gz
  33. md5: b193c3febd961fb69443b65ba05b83a7
  34. size: 17877585
  35. - path: import/gr-authors.toml
  36. md5: 05080719337f65735dfeffacec9764c4
  37. size: 64
  38. - path: schemas/gr-schema.status
  39. md5: bda41944c7f3ff2a207edb2c8a83c9fc
  40. size: 404
  41. outs:
  42. - path: import/gr-authors.transcript
  43. md5: 40acfcc81a4be3363d61febed1716f00
  44. gr-book-genres:
  45. cmd: python run.py --rust import-json -T import/gr-book-genres.transcript --stage
  46. gr-book-genres -D gr-schema --truncate import/gr-book-genres.toml data/goodreads_book_genres_initial.json.gz
  47. deps:
  48. - path: data/goodreads_book_genres_initial.json.gz
  49. md5: 99ee3d1cadd68818c3dd0ef0d2f10602
  50. size: 24253992
  51. - path: import/gr-book-genres.toml
  52. md5: 5098a690f9f9e1320da3a12f0654192a
  53. size: 74
  54. - path: schemas/gr-schema.status
  55. md5: bda41944c7f3ff2a207edb2c8a83c9fc
  56. size: 404
  57. outs:
  58. - path: import/gr-book-genres.transcript
  59. md5: 5cd443ca86c79bef13040a97aa135eb3
  60. gr-books:
  61. cmd: python run.py --rust import-json -T import/gr-books.transcript --stage gr-books
  62. -D gr-schema --truncate import/gr-books.toml data/goodreads_books.json.gz
  63. deps:
  64. - path: data/goodreads_books.json.gz
  65. md5: 01b40c70a00fb6aa321ee478f0fd0d6b
  66. size: 2043729443
  67. - path: import/gr-books.toml
  68. md5: e30abcef8e2d1c32243dcae1a526dfcc
  69. size: 60
  70. - path: schemas/gr-schema.status
  71. md5: bda41944c7f3ff2a207edb2c8a83c9fc
  72. size: 404
  73. outs:
  74. - path: import/gr-books.transcript
  75. md5: f493bf8e51b22ccdf258b07141c0a79d
  76. gr-interactions:
  77. cmd: python run.py --rust import-json -T import/gr-interactions.transcript --stage
  78. gr-interactions -D gr-schema --truncate import/gr-interactions.toml data/goodreads_interactions.json.gz
  79. deps:
  80. - path: data/goodreads_interactions.json.gz
  81. md5: f2d054a85f33d405a9bff6933005ba89
  82. size: 9388113365
  83. - path: import/gr-interactions.toml
  84. md5: c6133a33f6dd80d2e378c0b976112802
  85. size: 74
  86. - path: schemas/gr-schema.status
  87. md5: bda41944c7f3ff2a207edb2c8a83c9fc
  88. size: 404
  89. outs:
  90. - path: import/gr-interactions.transcript
  91. md5: 83ef4771b7c84a5730ba94fe8580a261
  92. gr-works:
  93. cmd: python run.py --rust import-json -T import/gr-works.transcript --stage gr-works
  94. -D gr-schema --truncate import/gr-works.toml data/goodreads_book_works.json.gz
  95. deps:
  96. - path: data/goodreads_book_works.json.gz
  97. md5: e80738a88d02d2b0081cd249d9b4f081
  98. size: 81412944
  99. - path: import/gr-works.toml
  100. md5: 670f9192bd7f532e5787b829722ebe0a
  101. size: 60
  102. - path: schemas/gr-schema.status
  103. md5: bda41944c7f3ff2a207edb2c8a83c9fc
  104. size: 404
  105. outs:
  106. - path: import/gr-works.transcript
  107. md5: 2ff4ab63f7c9043b7526f85f9bb36028
  108. loc-mds-books:
  109. cmd: python run.py --rust parse-marc --db-schema locmds -t book_marc_field --truncate
  110. --stage loc-mds-books -D loc-mds-schema --transcript import/loc-mds-books.transcript
  111. --src-dir data/loc-books --src-prefix BooksAll.2016
  112. deps:
  113. - path: data/loc-books
  114. md5: 1b1e7ab1d98cc81e373dfc53345d4bb7.dir
  115. size: 3129774145
  116. nfiles: 43
  117. - path: schemas/loc-mds-schema.status
  118. md5: e63399b7692987ecd6b579066e5bd35e
  119. size: 266
  120. outs:
  121. - path: import/loc-mds-books.transcript
  122. md5: 19b0a011c9053361278a3d812518b229
  123. loc-mds-names:
  124. cmd: python run.py --rust parse-marc --db-schema locmds -t name_marc_field --truncate
  125. --stage loc-mds-names -D loc-mds-schema --transcript import/loc-mds-names.transcript
  126. --src-dir data/loc-names --src-prefix Names.2016
  127. deps:
  128. - path: data/loc-names
  129. md5: fc488a8775561070cced774803fe0d72.dir
  130. size: 1410755359
  131. nfiles: 40
  132. - path: schemas/loc-mds-schema.status
  133. md5: e63399b7692987ecd6b579066e5bd35e
  134. size: 266
  135. outs:
  136. - path: import/loc-mds-names.transcript
  137. md5: 14ce7449e200f45a93058a6fdac918ec
  138. ol-authors:
  139. cmd: python run.py --rust import-json -T import/ol-authors.transcript --stage
  140. ol-authors -D ol-schema --truncate import/ol-authors.toml data/ol_dump_authors.txt.gz
  141. deps:
  142. - path: data/ol_dump_authors.txt.gz
  143. md5: 364e02a44e9e9a572e88692fc78fef27
  144. size: 306408477
  145. - path: import/ol-authors.toml
  146. md5: d39f4bee21e807362a55474f7c6093d0
  147. size: 111
  148. - path: schemas/ol-schema.status
  149. md5: ea3a792c4941083707b2835f737ada05
  150. size: 265
  151. outs:
  152. - path: import/ol-authors.transcript
  153. md5: 50e5bedc17cba4c5ceb8eef3d86fc307
  154. ol-editions:
  155. cmd: python run.py --rust import-json -T import/ol-editions.transcript --stage
  156. ol-editions -D ol-schema --truncate import/ol-editions.toml data/ol_dump_editions.txt.gz
  157. deps:
  158. - path: data/ol_dump_editions.txt.gz
  159. md5: e105295bf5f8025ecd7e43838ed0739c
  160. size: 6081278291
  161. - path: import/ol-editions.toml
  162. md5: e528cfea761765865a7097be7abbc510
  163. size: 114
  164. - path: schemas/ol-schema.status
  165. md5: ea3a792c4941083707b2835f737ada05
  166. size: 265
  167. outs:
  168. - path: import/ol-editions.transcript
  169. md5: c2c6951a052ebebe5f51ceb79f324162
  170. ol-works:
  171. cmd: python run.py --rust import-json -T import/ol-works.transcript --stage ol-works
  172. -D ol-schema --truncate import/ol-works.toml data/ol_dump_works.txt.gz
  173. deps:
  174. - path: data/ol_dump_works.txt.gz
  175. md5: 84e236955e5f683adde6a677d80475a0
  176. size: 1666325144
  177. - path: import/ol-works.toml
  178. md5: 5ad04190c9392dd7cae3fdead9291f09
  179. size: 105
  180. - path: schemas/ol-schema.status
  181. md5: ea3a792c4941083707b2835f737ada05
  182. size: 265
  183. outs:
  184. - path: import/ol-works.transcript
  185. md5: 6345885738815d2a51d331f7aba9e792
  186. viaf:
  187. cmd: python run.py --rust parse-marc --db-schema viaf -t marc_field --truncate
  188. --stage viaf -D viaf-schema --transcript import/viaf.transcript --line-mode
  189. data/viaf-clusters-marc21.xml.gz
  190. deps:
  191. - path: data/viaf-clusters-marc21.xml.gz
  192. md5: 2f1af5262584d38f7331d333dec81cc3
  193. size: 10662471024
  194. - path: schemas/viaf-schema.status
  195. md5: 4ee5de53afb5dfc1e1740a8667887cc0
  196. size: 204
  197. outs:
  198. - path: import/viaf.transcript
  199. md5: 326fe03b3007b0dbe02ff43c3da7e6cb
  200. status@az-ratings:
  201. cmd: python ../run.py stage-status -o az-ratings.status az-ratings
  202. deps:
  203. - path: az-ratings.transcript
  204. md5: 4266a96f87e134dac6b60df0514a36d2
  205. size: 94
  206. outs:
  207. - path: az-ratings.status
  208. md5: 08a44188987803be46be4286a2e5a5f3
  209. size: 180
  210. status@loc-mds-books:
  211. cmd: python ../run.py stage-status -o loc-mds-books.status loc-mds-books
  212. deps:
  213. - path: loc-mds-books.transcript
  214. md5: 19b0a011c9053361278a3d812518b229
  215. size: 4259
  216. outs:
  217. - path: loc-mds-books.status
  218. md5: f6e0026b4d4fe4bac7056c7fe0491259
  219. size: 4030
  220. status@ol-authors:
  221. cmd: python ../run.py stage-status -o ol-authors.status ol-authors
  222. deps:
  223. - path: ol-authors.transcript
  224. md5: 50e5bedc17cba4c5ceb8eef3d86fc307
  225. size: 130
  226. outs:
  227. - path: ol-authors.status
  228. md5: 456954970c9a56193680bb9399ac9164
  229. size: 185
  230. status@gr-works:
  231. cmd: python ../run.py stage-status -o gr-works.status gr-works
  232. deps:
  233. - path: gr-works.transcript
  234. md5: 2ff4ab63f7c9043b7526f85f9bb36028
  235. size: 136
  236. outs:
  237. - path: gr-works.status
  238. md5: a223984989927e62d8aea9230810d6bb
  239. size: 189
  240. status@loc-mds-names:
  241. cmd: python ../run.py stage-status -o loc-mds-names.status loc-mds-names
  242. deps:
  243. - path: loc-mds-names.transcript
  244. md5: 14ce7449e200f45a93058a6fdac918ec
  245. size: 3845
  246. outs:
  247. - path: loc-mds-names.status
  248. md5: 5d6d486b5b3acde6b3a9ce64d0fe794b
  249. size: 3637
  250. status@ol-works:
  251. cmd: python ../run.py stage-status -o ol-works.status ol-works
  252. deps:
  253. - path: ol-works.transcript
  254. md5: 6345885738815d2a51d331f7aba9e792
  255. size: 128
  256. outs:
  257. - path: ol-works.status
  258. md5: c84b6ccf5f89e6d8faf00cc21b4d5566
  259. size: 181
  260. status@gr-books:
  261. cmd: python ../run.py stage-status -o gr-books.status gr-books
  262. deps:
  263. - path: gr-books.transcript
  264. md5: f493bf8e51b22ccdf258b07141c0a79d
  265. size: 131
  266. outs:
  267. - path: gr-books.status
  268. md5: a0dcde1044f2c61895def1a9523be067
  269. size: 184
  270. status@gr-interactions:
  271. cmd: python ../run.py stage-status -o gr-interactions.status gr-interactions
  272. deps:
  273. - path: gr-interactions.transcript
  274. md5: 83ef4771b7c84a5730ba94fe8580a261
  275. size: 138
  276. outs:
  277. - path: gr-interactions.status
  278. md5: acf7d8bdbf506c81f6c3ea4eded3d702
  279. size: 198
  280. status@gr-book-genres:
  281. cmd: python ../run.py stage-status -o gr-book-genres.status gr-book-genres
  282. deps:
  283. - path: gr-book-genres.transcript
  284. md5: 5cd443ca86c79bef13040a97aa135eb3
  285. size: 145
  286. outs:
  287. - path: gr-book-genres.status
  288. md5: 0c77c736582157805e8248a97b5f7037
  289. size: 204
  290. status@viaf:
  291. cmd: python ../run.py stage-status -o viaf.status viaf
  292. deps:
  293. - path: viaf.transcript
  294. md5: 326fe03b3007b0dbe02ff43c3da7e6cb
  295. size: 136
  296. outs:
  297. - path: viaf.status
  298. md5: 55fb31f4aaa86a2fd921c59c797c09a8
  299. size: 186
  300. status@bx-ratings:
  301. cmd: python ../run.py stage-status -o bx-ratings.status bx-ratings
  302. deps:
  303. - path: bx-ratings.transcript
  304. md5: 511096523052e1563c4bdcc66b6ed143
  305. size: 146
  306. outs:
  307. - path: bx-ratings.status
  308. md5: 9f1009bfdb68267b39ac94ff3d754756
  309. size: 174
  310. status@ol-editions:
  311. cmd: python ../run.py stage-status -o ol-editions.status ol-editions
  312. deps:
  313. - path: ol-editions.transcript
  314. md5: c2c6951a052ebebe5f51ceb79f324162
  315. size: 131
  316. outs:
  317. - path: ol-editions.status
  318. md5: 4c0b955dcf06c319b8dd9c1057c3c056
  319. size: 187
  320. status@gr-authors:
  321. cmd: python ../run.py stage-status -o gr-authors.status gr-authors
  322. deps:
  323. - path: gr-authors.transcript
  324. md5: 40acfcc81a4be3363d61febed1716f00
  325. size: 138
  326. outs:
  327. - path: gr-authors.status
  328. md5: b7701864036091016af9123c02b5d7ed
  329. size: 193
Tip!

Press p or to see the previous file or, n or to see the next file

Comments

Loading...