Register
Login
Resources
Docs Blog Datasets Glossary Case Studies Tutorials & Webinars
Product
Data Engine LLMs Platform Enterprise
Pricing Explore
Connect to our Discord channel

#9 build(deps): bump setuptools from 70.0.0 to 78.1.1

Merged
Ghost merged 2 commits into ncusi:main from ncusi:dependabot/pip/setuptools-78.1.1
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
  1. schema: '2.0'
  2. stages:
  3. download_DevGPT:
  4. cmd:
  5. - dvc get-url --force https://zenodo.org/records/10086809/files/DevGPT.zip?download=1
  6. - mkdir -p data/external
  7. - unzip DevGPT.zip -d data/external/DevGPT
  8. - rm DevGPT.zip
  9. outs:
  10. - path: data/external/DevGPT/
  11. hash: md5
  12. md5: 223e6501a84a339b341bfb843595d1b2.dir
  13. size: 4182300528
  14. nfiles: 65
  15. clone_repos:
  16. cmd: python scripts/data/download_repositories.py data/external/DevGPT/ /mnt/data/MSR_Challenge_2024/repositories/
  17. data/repositories_download_status.json
  18. deps:
  19. - path: data/external/DevGPT/
  20. hash: md5
  21. md5: 223e6501a84a339b341bfb843595d1b2.dir
  22. size: 4182300528
  23. nfiles: 65
  24. - path: scripts/data/download_repositories.py
  25. hash: md5
  26. md5: ecf6bc29c934494835f8117b203198c2
  27. size: 7849
  28. outs:
  29. - path: data/repositories_download_status.json
  30. hash: md5
  31. md5: 985cc0f559f68de003cea224e8a7bc4d
  32. size: 177064
  33. commit_agg:
  34. cmd: python scripts/data/commit_sharings_to_agg.py data/external/DevGPT/ data/repositories_download_status.json
  35. data/interim/
  36. deps:
  37. - path: data/external/DevGPT/
  38. hash: md5
  39. md5: 223e6501a84a339b341bfb843595d1b2.dir
  40. size: 4182300528
  41. nfiles: 65
  42. - path: data/repositories_download_status.json
  43. hash: md5
  44. md5: 985cc0f559f68de003cea224e8a7bc4d
  45. size: 177064
  46. - path: scripts/data/commit_sharings_to_agg.py
  47. hash: md5
  48. md5: 8528815d3f6dea73c0250f9109522b82
  49. size: 5624
  50. outs:
  51. - path: data/interim/commit_sharings_df.csv
  52. hash: md5
  53. md5: dee35aeb0d0b7fa354b0022f9bd998a1
  54. size: 484886
  55. - path: data/interim/commit_sharings_groupby_repo_df.csv
  56. hash: md5
  57. md5: fb48677300a61d2877503ec897f0c4e5
  58. size: 4994
  59. commit_survival:
  60. cmd: python scripts/data/compute_changes_survival.py data/interim/commit_sharings_df.csv
  61. data/repositories_download_status.json data/interim/commit_sharings_changes_survival_df.csv
  62. data/interim/commit_sharings_lines_survival_df.csv
  63. deps:
  64. - path: data/interim/commit_sharings_df.csv
  65. hash: md5
  66. md5: dee35aeb0d0b7fa354b0022f9bd998a1
  67. size: 484886
  68. - path: data/repositories_download_status.json
  69. hash: md5
  70. md5: 985cc0f559f68de003cea224e8a7bc4d
  71. size: 177064
  72. - path: scripts/data/compute_changes_survival.py
  73. hash: md5
  74. md5: 8ad8a68a376a824ab1fb6ba1eea85863
  75. size: 23948
  76. outs:
  77. - path: data/interim/commit_sharings_changes_survival_df.csv
  78. hash: md5
  79. md5: 194afee4cff70543824bd2a73e3a1f1b
  80. size: 532182
  81. - path: data/interim/commit_sharings_lines_survival_df.csv
  82. hash: md5
  83. md5: 021b08469d02ccf69e409720bb12f75e
  84. size: 63102513
  85. repo_stats_git:
  86. cmd: python scripts/data/compute_repository_statistics_git.py data/external/DevGPT/
  87. data/repositories_download_status.json data/interim/repository_statistics_git.json
  88. deps:
  89. - path: data/external/DevGPT/
  90. hash: md5
  91. md5: 223e6501a84a339b341bfb843595d1b2.dir
  92. size: 4182300528
  93. nfiles: 65
  94. - path: data/repositories_download_status.json
  95. hash: md5
  96. md5: 985cc0f559f68de003cea224e8a7bc4d
  97. size: 177064
  98. - path: scripts/data/compute_repository_statistics_git.py
  99. hash: md5
  100. md5: 3a1ab9002d42ab9f1809764e8c4c1be1
  101. size: 6566
  102. outs:
  103. - path: data/interim/repository_statistics_git.json
  104. hash: md5
  105. md5: a2d2d11ae1f4b6b10fcf3adec80cf08a
  106. size: 303476
  107. repo_stats_github:
  108. cmd: python scripts/data/compute_repository_statistics_github.py data/external/DevGPT/
  109. data/repositories_download_status.json data/interim/repository_statistics_github.json
  110. deps:
  111. - path: data/external/DevGPT/
  112. hash: md5
  113. md5: 223e6501a84a339b341bfb843595d1b2.dir
  114. size: 4182300528
  115. nfiles: 65
  116. - path: data/repositories_download_status.json
  117. hash: md5
  118. md5: 985cc0f559f68de003cea224e8a7bc4d
  119. size: 177064
  120. - path: scripts/data/compute_repository_statistics_github.py
  121. hash: md5
  122. md5: a68674ba5fa9a454f2d14c048f11bb49
  123. size: 5164
  124. outs:
  125. - path: data/interim/repository_statistics_github.json
  126. hash: md5
  127. md5: 822db4d12c06eea2e76578f7a4f3fb91
  128. size: 614770
  129. pr_agg:
  130. cmd: python scripts/data/pr_sharings_to_agg.py data/external/DevGPT/ data/repositories_download_status.json
  131. data/interim/
  132. deps:
  133. - path: data/external/DevGPT/
  134. hash: md5
  135. md5: 223e6501a84a339b341bfb843595d1b2.dir
  136. size: 4182300528
  137. nfiles: 65
  138. - path: data/repositories_download_status.json
  139. hash: md5
  140. md5: 985cc0f559f68de003cea224e8a7bc4d
  141. size: 177064
  142. - path: scripts/data/pr_sharings_to_agg.py
  143. hash: md5
  144. md5: a0f9d5fae3236d03c1ccc124cc4c511a
  145. size: 11648
  146. outs:
  147. - path: data/interim/pr_sharings_df.csv
  148. hash: md5
  149. md5: 343abf1b666b59e70e9f9ddd10762642
  150. size: 771169
  151. - path: data/interim/pr_sharings_groupby_repo_df.csv
  152. hash: md5
  153. md5: 5a9a8199defd70f663a4f534dfdfcc79
  154. size: 16720
  155. - path: data/interim/pr_sharings_split_commit_df.csv
  156. hash: md5
  157. md5: b61516427911535aa4df16aa63ae4480
  158. size: 1208561
  159. pr_survival:
  160. cmd: python scripts/data/compute_changes_survival.py data/interim/pr_sharings_df.csv
  161. data/repositories_download_status.json data/interim/pr_sharings_changes_survival_df.csv
  162. data/interim/pr_sharings_lines_survival_df.csv
  163. deps:
  164. - path: data/interim/pr_sharings_df.csv
  165. hash: md5
  166. md5: 343abf1b666b59e70e9f9ddd10762642
  167. size: 771169
  168. - path: data/repositories_download_status.json
  169. hash: md5
  170. md5: 985cc0f559f68de003cea224e8a7bc4d
  171. size: 177064
  172. - path: scripts/data/compute_changes_survival.py
  173. hash: md5
  174. md5: 8ad8a68a376a824ab1fb6ba1eea85863
  175. size: 23948
  176. outs:
  177. - path: data/interim/pr_sharings_changes_survival_df.csv
  178. hash: md5
  179. md5: 387450564b3b846886a5c046661c5d82
  180. size: 595511
  181. - path: data/interim/pr_sharings_lines_survival_df.csv
  182. hash: md5
  183. md5: fec947352a0452c506bd4b74eb6ffc28
  184. size: 55564668
  185. pr_split_survival:
  186. cmd: python scripts/data/compute_changes_survival.py data/interim/pr_sharings_split_commit_df.csv
  187. data/repositories_download_status.json data/interim/pr_sharings_split_commit_changes_survival_df.csv
  188. data/interim/pr_sharings_split_commit_lines_survival_df.csv
  189. deps:
  190. - path: data/interim/pr_sharings_split_commit_df.csv
  191. hash: md5
  192. md5: b61516427911535aa4df16aa63ae4480
  193. size: 1208561
  194. - path: data/repositories_download_status.json
  195. hash: md5
  196. md5: 985cc0f559f68de003cea224e8a7bc4d
  197. size: 177064
  198. - path: scripts/data/compute_changes_survival.py
  199. hash: md5
  200. md5: 8ad8a68a376a824ab1fb6ba1eea85863
  201. size: 23948
  202. outs:
  203. - path: data/interim/pr_sharings_split_commit_changes_survival_df.csv
  204. hash: md5
  205. md5: 5f6f413d380b722563537eebaa0ba4fa
  206. size: 1320298
  207. - path: data/interim/pr_sharings_split_commit_lines_survival_df.csv
  208. hash: md5
  209. md5: e6e8317b34dedf0839fc26def0424eb6
  210. size: 161049373
  211. issue_agg:
  212. cmd: python scripts/data/issue_sharings_to_agg.py data/external/DevGPT/ data/repositories_download_status.json
  213. data/interim/
  214. deps:
  215. - path: data/external/DevGPT/
  216. hash: md5
  217. md5: 223e6501a84a339b341bfb843595d1b2.dir
  218. size: 4182300528
  219. nfiles: 65
  220. - path: data/repositories_download_status.json
  221. hash: md5
  222. md5: 985cc0f559f68de003cea224e8a7bc4d
  223. size: 177064
  224. - path: scripts/data/issue_sharings_to_agg.py
  225. hash: md5
  226. md5: 762ebc067ad1d8c7c4d5abc608321947
  227. size: 17028
  228. outs:
  229. - path: data/interim/issue_sharings_df.csv
  230. hash: md5
  231. md5: 3efdd8aa822b83dd02978dd323313e52
  232. size: 718852
  233. - path: data/interim/issue_sharings_groupby_repo_df.csv
  234. hash: md5
  235. md5: 4e08f0712c3675e8fd26d7ae1e141e45
  236. size: 28098
  237. issue_survival:
  238. cmd: python scripts/data/compute_changes_survival.py data/interim/issue_sharings_df.csv
  239. data/repositories_download_status.json data/interim/issue_sharings_changes_survival_df.csv
  240. data/interim/issue_sharings_lines_survival_df.csv
  241. deps:
  242. - path: data/interim/issue_sharings_df.csv
  243. hash: md5
  244. md5: 3efdd8aa822b83dd02978dd323313e52
  245. size: 718852
  246. - path: data/repositories_download_status.json
  247. hash: md5
  248. md5: 985cc0f559f68de003cea224e8a7bc4d
  249. size: 177064
  250. - path: scripts/data/compute_changes_survival.py
  251. hash: md5
  252. md5: 8ad8a68a376a824ab1fb6ba1eea85863
  253. size: 23948
  254. outs:
  255. - path: data/interim/issue_sharings_changes_survival_df.csv
  256. hash: md5
  257. md5: 71da5434e85ed2e9505486b3c939b9d1
  258. size: 104116
  259. - path: data/interim/issue_sharings_lines_survival_df.csv
  260. hash: md5
  261. md5: b2461f13359cfeb23ecc0170957af687
  262. size: 25476881
  263. commit_similarities:
  264. cmd: python scripts/data/find_chatgpt_changes_similarities.py data/external/DevGPT/
  265. data/interim/commit_sharings_df.csv data/repositories_download_status.json data/interim/commit_sharings_similarities_df.csv
  266. deps:
  267. - path: data/external/DevGPT/
  268. hash: md5
  269. md5: 223e6501a84a339b341bfb843595d1b2.dir
  270. size: 4182300528
  271. nfiles: 65
  272. - path: data/interim/commit_sharings_df.csv
  273. hash: md5
  274. md5: dee35aeb0d0b7fa354b0022f9bd998a1
  275. size: 484886
  276. - path: data/repositories_download_status.json
  277. hash: md5
  278. md5: 985cc0f559f68de003cea224e8a7bc4d
  279. size: 177064
  280. - path: scripts/data/find_chatgpt_changes_similarities.py
  281. hash: md5
  282. md5: f03016677efbf785050bf58ef967389e
  283. size: 18579
  284. outs:
  285. - path: data/interim/commit_sharings_similarities_df.checkpoint_data.json
  286. hash: md5
  287. md5: d0681a952d0715de7a5ad05c9fad7d1e
  288. size: 6990471
  289. - path: data/interim/commit_sharings_similarities_df.csv
  290. hash: md5
  291. md5: f8ed4db14670b3f53d12424b750155d7
  292. size: 17490798
  293. pr_similarities:
  294. cmd: python scripts/data/find_chatgpt_changes_similarities.py data/external/DevGPT/
  295. data/interim/pr_sharings_df.csv data/repositories_download_status.json data/interim/pr_mergesha_sharings_similarities_df.csv
  296. deps:
  297. - path: data/external/DevGPT/
  298. hash: md5
  299. md5: 223e6501a84a339b341bfb843595d1b2.dir
  300. size: 4182300528
  301. nfiles: 65
  302. - path: data/interim/pr_sharings_df.csv
  303. hash: md5
  304. md5: 343abf1b666b59e70e9f9ddd10762642
  305. size: 771169
  306. - path: data/repositories_download_status.json
  307. hash: md5
  308. md5: 985cc0f559f68de003cea224e8a7bc4d
  309. size: 177064
  310. - path: scripts/data/find_chatgpt_changes_similarities.py
  311. hash: md5
  312. md5: f03016677efbf785050bf58ef967389e
  313. size: 18579
  314. outs:
  315. - path: data/interim/pr_mergesha_sharings_similarities_df.checkpoint_data.json
  316. hash: md5
  317. md5: 38fa01197e48f529a3dbed4aa46dc653
  318. size: 5704439
  319. - path: data/interim/pr_mergesha_sharings_similarities_df.csv
  320. hash: md5
  321. md5: 035a37ddef5afd506f95fc3ee0de6acb
  322. size: 7955642
  323. issue_similarities:
  324. cmd: python scripts/data/find_chatgpt_changes_similarities.py data/external/DevGPT/
  325. data/interim/issue_sharings_df.csv data/repositories_download_status.json data/interim/issue_sharings_similarities_df.csv
  326. deps:
  327. - path: data/external/DevGPT/
  328. hash: md5
  329. md5: 223e6501a84a339b341bfb843595d1b2.dir
  330. size: 4182300528
  331. nfiles: 65
  332. - path: data/interim/issue_sharings_df.csv
  333. hash: md5
  334. md5: 3efdd8aa822b83dd02978dd323313e52
  335. size: 718852
  336. - path: data/repositories_download_status.json
  337. hash: md5
  338. md5: 985cc0f559f68de003cea224e8a7bc4d
  339. size: 177064
  340. - path: scripts/data/find_chatgpt_changes_similarities.py
  341. hash: md5
  342. md5: f03016677efbf785050bf58ef967389e
  343. size: 18579
  344. outs:
  345. - path: data/interim/issue_sharings_similarities_df.checkpoint_data.json
  346. hash: md5
  347. md5: 02eb0ad8237c23192f7db1eab5c1c150
  348. size: 1014307
  349. - path: data/interim/issue_sharings_similarities_df.csv
  350. hash: md5
  351. md5: e5de736e9621fef7af71e8d20ca57ea3
  352. size: 1012465
Discard
Tip!

Press p or to see the previous file or, n or to see the next file