Skip to content

Commit 1d93057

Browse files
committed
Update fit_class_random_forest.json to official spec
fixes openEOPlatform/architecture-docs#220
1 parent f925ae5 commit 1d93057

File tree

1 file changed

+19
-24
lines changed

1 file changed

+19
-24
lines changed

openeo_driver/specs/openeo-processes/experimental/fit_class_random_forest.json

+19-24
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
11
{
22
"id": "fit_class_random_forest",
33
"summary": "Train a random forest classification model",
4-
"description": "Executes the fit of a random forest classification based on the user input of target and predictors. The Random Forest classification model is based on the approach by Breiman (2001).",
4+
"description": "Executes the fit of a random forest classification based on training data. The process does not include a separate split of the data in test, validation and training data. The Random Forest classification model is based on the approach by Breiman (2001).",
55
"categories": [
66
"machine learning"
77
],
@@ -24,13 +24,23 @@
2424
}
2525
},
2626
{
27-
"name": "training",
28-
"description": "The amount of training data to be used in the classification, given as a fraction. The sampling will be chosen randomly through the data object. The remaining data will be used as test data for the validation.",
29-
"schema": {
30-
"type": "number",
31-
"exclusiveMinimum": 0,
32-
"maximum": 1
33-
}
27+
"name": "max_variables",
28+
"description": "Specifies how many split variables will be used at a node.\n\nThe following options are available:\n\n- *integer*: The given number of variables are considered for each split.\n- `all`: All variables are considered for each split.\n- `log2`: The logarithm with base 2 of the number of variables are considered for each split.\n- `onethird`: A third of the number of variables are considered for each split.\n- `sqrt`: The square root of the number of variables are considered for each split. This is often the default for classification.",
29+
"schema": [
30+
{
31+
"type": "integer",
32+
"minimum": 1
33+
},
34+
{
35+
"type": "string",
36+
"enum": [
37+
"all",
38+
"log2",
39+
"onethird",
40+
"sqrt"
41+
]
42+
}
43+
]
3444
},
3545
{
3646
"name": "num_trees",
@@ -42,21 +52,6 @@
4252
"minimum": 1
4353
}
4454
},
45-
{
46-
"name": "mtry",
47-
"description": "Specifies how many split variables will be used at a node. Default value is `null`, which corresponds to the number of predictors divided by 3.",
48-
"optional": true,
49-
"default": null,
50-
"schema": [
51-
{
52-
"type": "integer",
53-
"minimum": 1
54-
},
55-
{
56-
"type": "null"
57-
}
58-
]
59-
},
6055
{
6156
"name": "seed",
6257
"description": "A randomization seed to use for the random sampling in training. If not given or `null`, no seed is used and results may differ on subsequent use.",
@@ -85,4 +80,4 @@
8580
"rel": "about"
8681
}
8782
]
88-
}
83+
}

0 commit comments

Comments
 (0)