-
Notifications
You must be signed in to change notification settings - Fork 5
Expand file tree
/
Copy pathparams.yaml
More file actions
28 lines (28 loc) · 754 Bytes
/
params.yaml
File metadata and controls
28 lines (28 loc) · 754 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
main:
  # Seed for the random number generator, so that the data splits
  # and other pseudo-random operations are repeatable.
  random_seed: 42
data:
  reference_dataset: "pipeline/data/preprocessing_data.csv"
  # Threshold for the Kolmogorov-Smirnov test
  ks_alpha: 0.05
  # NOTE(review): presumably the fractions held out for the test and
  # validation splits - confirm against the code that reads them.
  test_size: 0.3
  val_size: 0.3
  # Stratify according to the target when splitting the data
  # in train/test or in train/val
  stratify: "salary"
# NOTE(review): the nesting below was reconstructed from a copy whose
# indentation had been lost. Left flat, `max_depth` appears twice at the
# same level (a duplicate key) and every section header is null. Confirm
# that `xgboost`, `numerical_pipe` and the export paths belong directly
# under `train`.
train:
  # Settings for the decision-tree model.
  decision_tree:
    criterion: "entropy"
    splitter: "best"
    max_depth: 13
  # Settings for the XGBoost model.
  xgboost:
    n_estimators: 400
    max_depth: 15
    learning_rate: 0.1
    subsample: 0.3
  numerical_pipe:
    # NOTE(review): meaning of this integer selector is not visible
    # here - check the consuming pipeline code.
    model: 0
  export_artifact: "pipeline/data/model_export"
  export_encoder: "pipeline/data/encoder_export"