1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
|
- {
- "config": {
- "bohr_framework_version": "0.4.5",
- "tasks": {
- "bugginess": {
- "top_artifact": "bohr.artifacts.commit.Commit",
- "label_categories": [
- "CommitLabel.NonBugFix",
- "CommitLabel.BugFix"
- ],
- "test_datasets": [
- "1151-commits",
- "berger",
- "herzig"
- ],
- "train_datasets": [
- "200k-commits"
- ],
- "label_column_name": "bug"
- },
- "smells": {
- "top_artifact": "bohr.artifacts.method.Method",
- "label_categories": [
- "SnippetLabel.NonSmelly",
- "SnippetLabel.Smelly"
- ],
- "test_datasets": [
- "smells-test"
- ],
- "train_datasets": [
- "smells-train"
- ],
- "label_column_name": "smelly"
- }
- },
- "datasets": {
- "berger": {
- "path": "berger.csv",
- "mapper": "bohr.templates.datamappers.commit.CommitMapper",
- "test_set": "true",
- "preprocessor": "copy",
- "loader": "csv"
- },
- "herzig": {
- "path": "herzig.csv",
- "mapper": "bohr.templates.datamappers.commit.CommitMapper",
- "test_set": "true",
- "preprocessor": "copy",
- "loader": "csv"
- },
- "1151-commits": {
- "path": "1151-commits.csv",
- "mapper": "bohr.templates.datamappers.commit.CommitMapper",
- "test_set": "true",
- "preprocessor": "copy",
- "loader": "csv"
- },
- "200k-commits": {
- "description": "desc",
- "path": "200k-commits.csv",
- "mapper": "bohr.templates.datamappers.commit.CommitMapper",
- "test_set": "false",
- "loader": "csv",
- "preprocessor": "copy"
- },
- "200k-commits-issues": {
- "description": "desc",
- "path": "200k-commits-issues.csv",
- "mapper": "bohr.templates.datamappers.issue.IssueMapper",
- "test_set": "false",
- "loader": "csv",
- "preprocessor": "copy",
- "keep_default_na": false,
- "dtype": {
- "labels": "str"
- }
- },
- "200k-commits-files": {
- "description": "desc",
- "path": "200k-commits-files.csv.7z",
- "mapper": "bohr.templates.datamappers.commitfile.CommitFileMapper",
- "test_set": "false",
- "loader": "csv",
- "preprocessor": "7z"
- },
- "200k-commits-link-issues": {
- "description": "desc",
- "path": "200k-commits-link-issues.csv",
- "test_set": "false",
- "loader": "csv",
- "preprocessor": "copy"
- },
- "200k-commits-manual-labels": {
- "description": "desc",
- "path": "200k-commits-manual-labels.csv",
- "mapper": "bohr.templates.datamappers.manuallabels.ManualLabelMapper",
- "test_set": "false",
- "loader": "csv",
- "preprocessor": "copy"
- },
- "smells-train": {
- "path": "smells-madeyski.csv",
- "path_preprocessed": "smells/train.csv",
- "mapper": "bohr.templates.datamappers.method.MethodMapper",
- "test_set": "false",
- "loader": "csv",
- "preprocessor": "data-preprocessing/smells.sh",
- "sep": ";"
- },
- "smells-test": {
- "path": "smells-madeyski.csv",
- "path_preprocessed": "smells/test.csv",
- "mapper": "bohr.templates.datamappers.method.MethodMapper",
- "test_set": "true",
- "loader": "csv",
- "preprocessor": "data-preprocessing/smells.sh",
- "sep": ";"
- }
- },
- "dataset-linkers": [
- {
- "from": "200k-commits",
- "to": "200k-commits-issues",
- "link": "200k-commits-link-issues"
- },
- {
- "from": "200k-commits",
- "to": "200k-commits-files"
- },
- {
- "from": "200k-commits",
- "to": "200k-commits-manual-labels"
- }
- ]
- },
- "heuristics": {
- "heuristics/bugginess.py": "9fa2be4c3ad70b831bf06a1c229ff1b6",
- "heuristics/manuallabels.py": "5120f1e19e5bfdaf6f61cfa064782e05",
- "heuristics/smells.py": "a2254c51be33d4ede33baab98ba18b09"
- },
- "manual_stages": {}
- }
|