Register
Login
Resources
Docs Blog Datasets Glossary Case Studies Tutorials & Webinars
Product
Data Engine LLMs Platform Enterprise
Pricing Explore
Connect to our Discord channel

dvc.yaml 5.7 KB

You have to be logged in to leave a comment. Sign In
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
  1. stages:
  2. retrieve_cve_dates:
  3. cmd: python3 dependency_search/retrieve_cve_dates.py data/cve_df_filename data/published_cve_df_filename
  4. deps:
  5. - data/cve_df_filename
  6. - dependency_search/retrieve_cve_dates.py
  7. outs:
  8. - data/published_cve_df_filename
  9. retrieve_cve_info:
  10. cmd: python3 cve_information/retrieve_cve_info.py data/published_cve_df_filename
  11. data/unique_cve_info-cvss_cwe_etc.parquet
  12. deps:
  13. - data/published_cve_df_filename
  14. - cve_information/retrieve_cve_info.py
  15. outs:
  16. - data/unique_cve_info-cvss_cwe_etc.parquet
  17. retrieve_project_info:
  18. cmd: python3 projects_stats/retrieve_metadata_from_WoC_mongodb.py data/cve_df_filename
  19. data/unique_project_info.parquet
  20. deps:
  21. - data/cve_df_filename
  22. - projects_stats/retrieve_metadata_from_WoC_mongodb.py
  23. outs:
  24. - data/unique_project_info.parquet
  25. merge_cve_dates:
  26. cmd: python3 dependency_search/merge_cve_df_with_published_cve_df.py data/cve_df_filename
  27. data/published_cve_df_filename data/commits_with_published_cve_df
  28. deps:
  29. - data/cve_df_filename
  30. - data/published_cve_df_filename
  31. - dependency_search/merge_cve_df_with_published_cve_df.py
  32. outs:
  33. - data/commits_with_published_cve_df
  34. add_cvss_rankings:
  35. cmd: python3 cve_information/add_cvss_ranking.py data/unique_cve_info-cvss_cwe_etc.parquet
  36. data/unique_cve_info-cvss_cwe_ranking_etc.parquet
  37. deps:
  38. - cve_information/add_cvss_ranking.py
  39. - data/unique_cve_info-cvss_cwe_etc.parquet
  40. outs:
  41. - data/unique_cve_info-cvss_cwe_ranking_etc.parquet
  42. extension_to_language:
  43. cmd: python3 dependency_search/prepare_extension_to_language_dict.py data/extension_to_language.json
  44. deps:
  45. - dependency_search/prepare_extension_to_language_dict.py
  46. - https://raw.githubusercontent.com/github/linguist/master/lib/linguist/languages.yml
  47. outs:
  48. - data/extension_to_language.json:
  49. cache: false
  50. languages_for_cve:
  51. cmd: python3 dependency_search/find_programming_language_for_cve.py data/commits_with_published_cve_df
  52. data/extension_to_language.json data/combined_df
  53. deps:
  54. - data/commits_with_published_cve_df
  55. - data/extension_to_language.json
  56. - dependency_search/find_programming_language_for_cve.py
  57. outs:
  58. - data/combined_df
  59. language_to_class:
  60. cmd: python3 dependency_search/prepare_language_to_class_dict.py data/language_to_class.json
  61. deps:
  62. - dependency_search/prepare_language_to_class_dict.py
  63. outs:
  64. - data/language_to_class.json:
  65. cache: false
  66. dependency_df:
  67. cmd: python3 dependency_search/prepare_dep_df.py data/cve_df_filename data/dep_df
  68. deps:
  69. - data/cve_df_filename
  70. - dependency_search/prepare_dep_df.py
  71. outs:
  72. - data/dep_df
  73. clean_combined_df:
  74. cmd: python3 dependency_search/clean_data_before_cve_lifespan_calculation.py data/combined_df
  75. data/dep_df data/language_to_class.json data/cleaned_cve_df
  76. deps:
  77. - data/combined_df
  78. - data/dep_df
  79. - data/language_to_class.json
  80. - dependency_search/clean_data_before_cve_lifespan_calculation.py
  81. outs:
  82. - data/cleaned_cve_df
  83. compute_cve_lifespan:
  84. cmd: python3 dependency_search/calculate_cve_lifespan_per_project.py data/cleaned_cve_df
  85. data/language_to_class.json data/cve_lifespan_language_df data/cve_lifespan_df
  86. deps:
  87. - data/cleaned_cve_df
  88. - data/language_to_class.json
  89. - dependency_search/calculate_cve_lifespan_per_project.py
  90. outs:
  91. - data/cve_lifespan_language_df
  92. - data/cve_lifespan_df
  93. merge_cve_info_into_lifespan:
  94. cmd: python3 dependency_search/merge_cve_info_and_cve_lifespan.py data/unique_cve_info-cvss_cwe_ranking_etc.parquet
  95. data/cve_lifespan_language_df data/cve_lifespan_df data/cve_lifespan_and_cve_info_df data/cve_lifespan_language_and_cve_info_df
  96. deps:
  97. - data/cve_lifespan_language_df
  98. - data/cve_lifespan_df
  99. - data/unique_cve_info-cvss_cwe_ranking_etc.parquet
  100. - dependency_search/merge_cve_info_and_cve_lifespan.py
  101. outs:
  102. - data/cve_lifespan_and_cve_info_df
  103. - data/cve_lifespan_language_and_cve_info_df
  104. # NOTE: the following two "merge_project_info_*" stages may be moved before the "merge_cve_info_into_lifespan" stage
  105. merge_project_info_into_lifespan:
  106. cmd: >-
  107. python3 projects_stats/merge_with_project_metadata.py
  108. data/cve_lifespan_and_cve_info_df data/unique_project_info.parquet
  109. data/cve_survival_input_df
  110. deps:
  111. - projects_stats/merge_with_project_metadata.py
  112. - data/unique_project_info.parquet
  113. - data/cve_lifespan_and_cve_info_df
  114. outs:
  115. - data/cve_survival_input_df
  116. merge_project_info_into_lifespan_language:
  117. cmd: >-
  118. python3 projects_stats/merge_with_project_metadata.py
  119. data/cve_lifespan_language_and_cve_info_df data/unique_project_info.parquet
  120. data/cve_survival_input_most_used_language_df
  121. deps:
  122. - projects_stats/merge_with_project_metadata.py
  123. - data/unique_project_info.parquet
  124. - data/cve_lifespan_language_and_cve_info_df
  125. outs:
  126. - data/cve_survival_input_most_used_language_df
  127. evaluate-cve_surv:
  128. cmd: >-
  129. python3 analysis/cve_surv_analysis.py
  130. --eval-path=eval/ --path-prefix=''
  131. data/cve_survival_input_df
  132. params:
  133. - eval.confidence
  134. - eval.bootstrap_samples
  135. - eval.description
  136. - eval.cve_survival_analysis
  137. deps:
  138. - analysis/cve_surv_analysis.py
  139. - data/cve_survival_input_df
  140. metrics:
  141. - eval/cve_surv_metrics.json:
  142. cache: false
  143. - eval/cve_surv_group_metrics.csv:
  144. cache: false
  145. - eval/cve_surv_statistics.csv:
  146. cache: false
  147. plots:
  148. - eval/cve_survival_function.png:
  149. cache: false
  150. outs:
  151. - eval/cve_surv_params.yaml:
  152. cache: false
Tip!

Press p or ← to see the previous file, or n or → to see the next file

Comments

Loading...