-
Notifications
You must be signed in to change notification settings - Fork 1
/
params.yaml
157 lines (126 loc) · 2.91 KB
/
params.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
base:
random_state : 36
target_col : class
test_size : 0.33
app:
host : 0.0.0.0
port : 8080
data:
raw_data:
train_batch: training_data
pred_batch: prediction_data
train:
good_data_dir : good/train
bad_data_dir: bad/train
pred:
good_data_dir: good/pred
bad_data_dir: bad/pred
mongodb:
scania_data_db_name: scania-data
scania_train_data_collection: scania-train-data
scania_pred_data_collection: scania-pred-data
knn_imputer:
n_neighbors : 3
weights : uniform
kmeans_cluster:
init : k-means++
max_clusters : 11
knee:
curve : convex
direction : decreasing
pca_model:
n_components: 100
s3_bucket:
input_files_bucket: input-files-for-train-and-pred
scania_model_bucket: scania-model
scania-mlflow_bucket: scania-mlflow
scania_pred_data_bucket: scania-pred-data
scania_train_data_bucket: scania-train-data
scania_raw_data_bucket: scania-raw-data
models_dir:
trained : trained
stag: staging
prod : production
model_utils:
verbose : 3
cv : 5
n_jobs : -1
save_format : .sav
model_params:
rf_model:
n_estimators:
- 10
- 50
- 100
- 130
criterion:
- gini
- entropy
max_features:
- auto
- log2
max_depth:
- 2
- 3
- 4
- 5
adaboost_model:
n_estimators:
- 10
- 50
- 100
- 130
learning_rate:
- 0.5
- 0.1
- 0.01
- 0.001
random_state:
- 0
- 100
- 200
- 300
mlflow_config:
experiment_name : scania-exp-2
run_name : mlops
serialization_format : cloudpickle
db_log:
train : scania_training_logs
pred : scania_prediction_logs
train_db_log:
model_training : model_training_log
col_validation : train_col_validation_log
data_transform : train_data_transform_log
export_csv : train_export_csv_log
general : train_general_log
db_insert: train_db_insert_log
load_prod_model : load_prod_model_log
missing_values_in_col : train_missing_values_log
name_validation : train_name_validation_log
train_main : train_main_log
values_from_schema : train_values_from_schema_log
pred_db_log:
col_validation : columnValidationLog
db_conn: databaseConnectionLog
data_transform : dataTransform
db_insert : dbInsertLog
db_create : dbTableCreateLog
export_csv : ExportToCsvLog
general : GeneralLog
missing_values_in_col : missingValuesInColumn
name_validation : nameValidationLog
pred_main : prediction_main_log
values_from_schema : valuesfromSchemaValidationLog
schema_file:
train_schema_file : schema_training.json
pred_schema_file : schema_prediction.json
elbow_plot_fig : K-Means_Elbow.PNG
null_values_csv_file : null_values.csv
pred_output_file : predictions.csv
regex_file: scania_regex.txt
export_csv_file:
train: train_input_file.csv
pred : pred_input_file.csv
templates:
dir : templates
index_html_file : index.html