Skip to content

Commit 5033328

Browse files
author
Igor Rukhovich
authored
Second iteration of benchmark optimization (#72)
* A huge modelbuilders benchmark renovation + fixing of a bug in a report generator + reporting metrics as well
* preparing for merge
* Applying mypy & pep8 suggestions
* Added metric type as a separate field
* Newlines at the end :)
1 parent 38677fe commit 5033328

File tree

9 files changed

+614
-566
lines changed

9 files changed

+614
-566
lines changed

.gitignore

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,5 +14,5 @@ data
1414
*.npy
1515

1616
# Results
17-
results.json
17+
results*.json
1818
*.xlsx
Lines changed: 66 additions & 72 deletions
Original file line numberDiff line numberDiff line change
@@ -1,115 +1,109 @@
11
{
22
"common": {
3-
"lib": "modelbuilders",
4-
"data-format": "pandas",
5-
"data-order": "F",
6-
"dtype": "float32",
7-
"algorithm": "lgbm_mb"
3+
"lib": "modelbuilders",
4+
"data-format": "pandas",
5+
"data-order": "F",
6+
"dtype": "float32",
7+
"algorithm": "lgbm_mb"
88
},
99
"cases": [
1010
{
1111
"dataset": [
1212
{
13-
"source": "npy",
14-
"name": "airline-ohe",
15-
"training":
16-
{
17-
"x": "data/airline-ohe_x_train.npy",
18-
"y": "data/airline-ohe_y_train.npy"
13+
"source": "npy",
14+
"name": "airline-ohe",
15+
"training": {
16+
"x": "data/airline-ohe_x_train.npy",
17+
"y": "data/airline-ohe_y_train.npy"
1918
},
20-
"testing":
21-
{
22-
"x": "data/airline-ohe_x_test.npy",
23-
"y": "data/airline-ohe_y_test.npy"
19+
"testing": {
20+
"x": "data/airline-ohe_x_test.npy",
21+
"y": "data/airline-ohe_y_test.npy"
2422
}
2523
}
2624
],
27-
"reg-alpha": 0.9,
28-
"max-bin": 256,
25+
"reg-alpha": 0.9,
26+
"max-bin": 256,
2927
"scale-pos-weight": 2,
30-
"learning-rate": 0.1,
31-
"subsample": 1,
32-
"reg-lambda": 1,
28+
"learning-rate": 0.1,
29+
"subsample": 1,
30+
"reg-lambda": 1,
3331
"min-child-weight": 0,
34-
"max-depth": 8,
35-
"max-leaves": 256,
36-
"n-estimators": 1000,
37-
"objective": "binary"
32+
"max-depth": 8,
33+
"max-leaves": 256,
34+
"n-estimators": 1000,
35+
"objective": "binary"
3836
},
3937
{
4038
"dataset": [
4139
{
42-
"source": "npy",
43-
"name": "higgs1m",
44-
"training":
45-
{
46-
"x": "data/higgs1m_x_train.npy",
47-
"y": "data/higgs1m_y_train.npy"
40+
"source": "npy",
41+
"name": "higgs1m",
42+
"training": {
43+
"x": "data/higgs1m_x_train.npy",
44+
"y": "data/higgs1m_y_train.npy"
4845
},
49-
"testing":
50-
{
51-
"x": "data/higgs1m_x_test.npy",
52-
"y": "data/higgs1m_y_test.npy"
46+
"testing": {
47+
"x": "data/higgs1m_x_test.npy",
48+
"y": "data/higgs1m_y_test.npy"
5349
}
5450
}
5551
],
56-
"reg-alpha": 0.9,
57-
"max-bin": 256,
52+
"reg-alpha": 0.9,
53+
"max-bin": 256,
5854
"scale-pos-weight": 2,
59-
"learning-rate": 0.1,
60-
"subsample": 1,
61-
"reg-lambda": 1,
55+
"learning-rate": 0.1,
56+
"subsample": 1,
57+
"reg-lambda": 1,
6258
"min-child-weight": 0,
63-
"max-depth": 8,
64-
"max-leaves": 256,
65-
"n-estimators": 1000,
66-
"objective": "binary"
59+
"max-depth": 8,
60+
"max-leaves": 256,
61+
"n-estimators": 1000,
62+
"objective": "binary"
6763
},
6864
{
6965
"dataset": [
7066
{
71-
"source": "npy",
72-
"name": "mortgage1Q",
73-
"training":
74-
{
75-
"x": "data/mortgage1Q_x_train.npy",
76-
"y": "data/mortgage1Q_y_train.npy"
67+
"source": "npy",
68+
"name": "mortgage1Q",
69+
"training": {
70+
"x": "data/mortgage1Q_x_train.npy",
71+
"y": "data/mortgage1Q_y_train.npy"
7772
}
7873
}
7974
],
80-
"n-estimators": 100,
81-
"objective": "regression",
82-
"max-depth": 8,
75+
"n-estimators": 100,
76+
"objective": "regression",
77+
"max-depth": 8,
8378
"scale-pos-weight": 2,
84-
"learning-rate": 0.1,
85-
"subsample": 1,
86-
"reg-alpha": 0.9,
87-
"reg-lambda": 1,
79+
"learning-rate": 0.1,
80+
"subsample": 1,
81+
"reg-alpha": 0.9,
82+
"reg-lambda": 1,
8883
"min-child-weight": 0,
89-
"max-leaves": 256
84+
"max-leaves": 256
9085
},
9186
{
9287
"dataset": [
9388
{
94-
"source": "npy",
95-
"name": "mlsr",
96-
"training":
97-
{
98-
"x": "data/mlsr_x_train.npy",
99-
"y": "data/mlsr_y_train.npy"
89+
"source": "npy",
90+
"name": "mlsr",
91+
"training": {
92+
"x": "data/mlsr_x_train.npy",
93+
"y": "data/mlsr_y_train.npy"
10094
}
10195
}
10296
],
103-
"max-bin": 256,
104-
"learning-rate": 0.3,
105-
"subsample": 1,
106-
"reg-lambda": 2,
97+
"max-bin": 256,
98+
"learning-rate": 0.3,
99+
"subsample": 1,
100+
"reg-lambda": 2,
107101
"min-child-weight": 1,
108-
"min-split-loss": 0.1,
109-
"max-depth": 8,
110-
"max-leaves": 256,
111-
"n-estimators": 200,
112-
"objective": "multiclass"
102+
"min-split-loss": 0.1,
103+
"max-depth": 8,
104+
"max-leaves": 256,
105+
"n-estimators": 200,
106+
"objective": "multiclass"
113107
}
114108
]
115109
}

0 commit comments

Comments
 (0)