Register
Login
Resources
Docs Blog Datasets Glossary Case Studies Tutorials & Webinars
Product
Data Engine LLMs Platform Enterprise
Pricing Explore
Connect to our Discord channel

bohr.json 3.5 KB

You have to be logged in to leave a comment. Sign In
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
  1. {"bohr_framework_version": "0.4.5",
  2. "tasks": {
  3. "bugginess": {
  4. "top_artifact": "bohr.artifacts.commit.Commit",
  5. "label_categories": [
  6. "CommitLabel.NonBugFix",
  7. "CommitLabel.BugFix"
  8. ],
  9. "test_datasets": [
  10. "1151-commits",
  11. "berger",
  12. "herzig"
  13. ],
  14. "train_datasets": [
  15. "200k-commits"
  16. ],
  17. "label_column_name": "bug"
  18. },
  19. "smells": {
  20. "top_artifact": "bohr.artifacts.method.Method",
  21. "label_categories": [
  22. "SnippetLabel.NonSmelly",
  23. "SnippetLabel.Smelly"
  24. ],
  25. "test_datasets": [
  26. "smells-test"
  27. ],
  28. "train_datasets": [
  29. "smells-train"
  30. ],
  31. "label_column_name": "smelly"
  32. }
  33. },
  34. "datasets": {
  35. "berger": {
  36. "path": "berger.csv",
  37. "mapper": "bohr.templates.datamappers.commit.CommitMapper",
  38. "test_set": "true",
  39. "preprocessor": "copy",
  40. "loader": "csv"
  41. },
  42. "herzig": {
  43. "path": "herzig.csv",
  44. "mapper": "bohr.templates.datamappers.commit.CommitMapper",
  45. "test_set": "true",
  46. "preprocessor": "copy",
  47. "loader": "csv"
  48. },
  49. "1151-commits": {
  50. "path": "1151-commits.csv",
  51. "mapper": "bohr.templates.datamappers.commit.CommitMapper",
  52. "test_set": "true",
  53. "preprocessor": "copy",
  54. "loader": "csv"
  55. },
  56. "200k-commits": {
  57. "description": "desc",
  58. "path": "200k-commits.csv",
  59. "mapper": "bohr.templates.datamappers.commit.CommitMapper",
  60. "test_set": "false",
  61. "loader": "csv",
  62. "preprocessor": "copy"
  63. },
  64. "200k-commits-issues": {
  65. "description": "desc",
  66. "path": "200k-commits-issues.csv",
  67. "mapper": "bohr.templates.datamappers.issue.IssueMapper",
  68. "test_set": "false",
  69. "loader": "csv",
  70. "preprocessor": "copy",
  71. "keep_default_na": false,
  72. "dtype": {"labels": "str"}
  73. },
  74. "200k-commits-files": {
  75. "description": "desc",
  76. "path": "200k-commits-files.csv.7z",
  77. "mapper": "bohr.templates.datamappers.commitfile.CommitFileMapper",
  78. "test_set": "false",
  79. "loader": "csv",
  80. "preprocessor": "7z"
  81. },
  82. "200k-commits-link-issues": {
  83. "description": "desc",
  84. "path": "200k-commits-link-issues.csv",
  85. "test_set": "false",
  86. "loader": "csv",
  87. "preprocessor": "copy"
  88. },
  89. "200k-commits-manual-labels": {
  90. "description": "desc",
  91. "path": "200k-commits-manual-labels.csv",
  92. "mapper": "bohr.templates.datamappers.manuallabels.ManualLabelMapper",
  93. "test_set": "false",
  94. "loader": "csv",
  95. "preprocessor": "copy"
  96. },
  97. "smells-train": {
  98. "path": "smells-madeyski.csv",
  99. "path_preprocessed": "smells/train.csv",
  100. "mapper": "bohr.templates.datamappers.method.MethodMapper",
  101. "test_set": "false",
  102. "loader": "csv",
  103. "preprocessor": "data-preprocessing/smells.sh",
  104. "sep": ";"
  105. },
  106. "smells-test": {
  107. "path": "smells-madeyski.csv",
  108. "path_preprocessed": "smells/test.csv",
  109. "mapper": "bohr.templates.datamappers.method.MethodMapper",
  110. "test_set": "false",
  111. "loader": "csv",
  112. "preprocessor": "data-preprocessing/smells.sh",
  113. "sep": ";"
  114. }
  115. },
  116. "dataset-linkers": [
  117. {
  118. "from": "200k-commits",
  119. "to": "200k-commits-issues",
  120. "link": "200k-commits-link-issues"
  121. }, {
  122. "from": "200k-commits",
  123. "to": "200k-commits-files"
  124. }, {
  125. "from": "200k-commits",
  126. "to": "200k-commits-manual-labels"
  127. }
  128. ]
  129. }
Tip!

Press p or ← to see the previous file, or n or → to see the next file

Comments

Loading...