Register
Login
Resources
Docs Blog Datasets Glossary Case Studies Tutorials & Webinars
Product
Data Engine LLMs Platform Enterprise
Pricing Explore
Connect to our Discord channel

bohr.lock 5.1 KB

You have to be logged in to leave a comment. Sign In
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
  1. {
  2. "config": {
  3. "bohr_framework_version": "0.4.5",
  4. "tasks": {
  5. "bugginess": {
  6. "top_artifact": "bohr.artifacts.commit.Commit",
  7. "label_categories": [
  8. "CommitLabel.NonBugFix",
  9. "CommitLabel.BugFix"
  10. ],
  11. "test_datasets": [
  12. "1151-commits",
  13. "berger",
  14. "herzig"
  15. ],
  16. "train_datasets": [
  17. "200k-commits"
  18. ],
  19. "label_column_name": "bug"
  20. },
  21. "smells": {
  22. "top_artifact": "bohr.artifacts.method.Method",
  23. "label_categories": [
  24. "SnippetLabel.NonSmelly",
  25. "SnippetLabel.Smelly"
  26. ],
  27. "test_datasets": [
  28. "smells-test"
  29. ],
  30. "train_datasets": [
  31. "smells-train"
  32. ],
  33. "label_column_name": "smelly"
  34. }
  35. },
  36. "datasets": {
  37. "berger": {
  38. "path": "berger.csv",
  39. "mapper": "bohr.templates.datamappers.commit.CommitMapper",
  40. "test_set": "true",
  41. "preprocessor": "copy",
  42. "loader": "csv"
  43. },
  44. "herzig": {
  45. "path": "herzig.csv",
  46. "mapper": "bohr.templates.datamappers.commit.CommitMapper",
  47. "test_set": "true",
  48. "preprocessor": "copy",
  49. "loader": "csv"
  50. },
  51. "1151-commits": {
  52. "path": "1151-commits.csv",
  53. "mapper": "bohr.templates.datamappers.commit.CommitMapper",
  54. "test_set": "true",
  55. "preprocessor": "copy",
  56. "loader": "csv"
  57. },
  58. "200k-commits": {
  59. "description": "desc",
  60. "path": "200k-commits.csv",
  61. "mapper": "bohr.templates.datamappers.commit.CommitMapper",
  62. "test_set": "false",
  63. "loader": "csv",
  64. "preprocessor": "copy"
  65. },
  66. "200k-commits-issues": {
  67. "description": "desc",
  68. "path": "200k-commits-issues.csv",
  69. "mapper": "bohr.templates.datamappers.issue.IssueMapper",
  70. "test_set": "false",
  71. "loader": "csv",
  72. "preprocessor": "copy",
  73. "keep_default_na": false,
  74. "dtype": {
  75. "labels": "str"
  76. }
  77. },
  78. "200k-commits-files": {
  79. "description": "desc",
  80. "path": "200k-commits-files.csv.7z",
  81. "mapper": "bohr.templates.datamappers.commitfile.CommitFileMapper",
  82. "test_set": "false",
  83. "loader": "csv",
  84. "preprocessor": "7z"
  85. },
  86. "200k-commits-link-issues": {
  87. "description": "desc",
  88. "path": "200k-commits-link-issues.csv",
  89. "test_set": "false",
  90. "loader": "csv",
  91. "preprocessor": "copy"
  92. },
  93. "200k-commits-manual-labels": {
  94. "description": "desc",
  95. "path": "200k-commits-manual-labels.csv",
  96. "mapper": "bohr.templates.datamappers.manuallabels.ManualLabelMapper",
  97. "test_set": "false",
  98. "loader": "csv",
  99. "preprocessor": "copy"
  100. },
  101. "smells-train": {
  102. "path": "smells-madeyski.csv",
  103. "path_preprocessed": "smells/train.csv",
  104. "mapper": "bohr.templates.datamappers.method.MethodMapper",
  105. "test_set": "false",
  106. "loader": "csv",
  107. "preprocessor": "data-preprocessing/smells.sh",
  108. "sep": ";"
  109. },
  110. "smells-test": {
  111. "path": "smells-madeyski.csv",
  112. "path_preprocessed": "smells/test.csv",
  113. "mapper": "bohr.templates.datamappers.method.MethodMapper",
  114. "test_set": "false",
  115. "loader": "csv",
  116. "preprocessor": "data-preprocessing/smells.sh",
  117. "sep": ";"
  118. }
  119. },
  120. "dataset-linkers": [
  121. {
  122. "from": "200k-commits",
  123. "to": "200k-commits-issues",
  124. "link": "200k-commits-link-issues"
  125. },
  126. {
  127. "from": "200k-commits",
  128. "to": "200k-commits-files"
  129. },
  130. {
  131. "from": "200k-commits",
  132. "to": "200k-commits-manual-labels"
  133. }
  134. ]
  135. },
  136. "heuristics": {
  137. "heuristics/bugginess.py": "9fa2be4c3ad70b831bf06a1c229ff1b6",
  138. "heuristics/idans_models.py": "b93f1f3e3b331252226f98010b1a77e3",
  139. "heuristics/manuallabels.py": "5120f1e19e5bfdaf6f61cfa064782e05",
  140. "heuristics/smells.py": "a2254c51be33d4ede33baab98ba18b09",
  141. "heuristics/tools/idansmodel.py": "e4204dabaa97bd04c3b1796b4dc951b9"
  142. },
  143. "manual_stages": {}
  144. }
Tip!

Press p to see the previous file, or n to see the next file

Comments

Loading...