Try new data from EPC with adjusted feature processing

This commit is contained in:
Michael Duong 2024-06-09 11:28:34 +01:00
parent 8cfe43b22d
commit a5574cd1e7
2 changed files with 25 additions and 24 deletions

View file

@ -21,7 +21,8 @@ default:
# data_filepath: s3://retrofit-data-dev/sap_change_model/2024-03-22-18-56-53/dataset_rooms.parquet
# data_filepath: s3://retrofit-data-dev/sap_change_model/2024-05-25-08-36-36/dataset_rooms.parquet
# data_filepath: s3://retrofit-data-dev/sap_change_model/2024-05-26-10-31-39/dataset_rooms.parquet
data_filepath: s3://retrofit-data-dev/sap_change_model/2024-05-28-19-08-25/dataset_rooms.parquet
# data_filepath: s3://retrofit-data-dev/sap_change_model/2024-05-28-19-08-25/dataset_rooms.parquet
data_filepath: s3://retrofit-data-dev/sap_change_model/2024-06-09-10-36-53/dataset_rooms.parquet
train_proportion: 0.9
output_train_filepath: ./data/prepared_data/train.parquet
output_test_filepath: ./data/prepared_data/test.parquet

View file

@ -40,7 +40,7 @@ stages:
default.feature_processor.feature_processor_config.target: heat_demand_ending
default.feature_processor.feature_processor_type: dataframe
default.prepare_data.data_filepath:
s3://retrofit-data-dev/sap_change_model/2024-05-28-19-08-25/dataset_rooms.parquet
s3://retrofit-data-dev/sap_change_model/2024-06-09-10-36-53/dataset_rooms.parquet
default.prepare_data.input_dataclient_type: aws-s3
default.prepare_data.output_dataclient_type: local
default.prepare_data.output_test_filepath: ./data/prepared_data/test.parquet
@ -49,8 +49,8 @@ stages:
outs:
- path: data/prepared_data/
hash: md5
md5: 63af74a6d808f37d7ab0010300e3f6bf.dir
size: 37110480
md5: 836c0dde274564fe214246c62b318aa6.dir
size: 38248585
nfiles: 2
build_model:
cmd: python 2_build_model.py
@ -61,8 +61,8 @@ stages:
size: 4820
- path: data/prepared_data
hash: md5
md5: 63af74a6d808f37d7ab0010300e3f6bf.dir
size: 37110480
md5: 836c0dde274564fe214246c62b318aa6.dir
size: 38248585
nfiles: 2
params:
configs/build_model.yaml:
@ -94,18 +94,18 @@ stages:
outs:
- path: data/fit_predictions/
hash: md5
md5: adc6e6cd0b396d9327123cabc0f3409e.dir
size: 2901081
md5: 894bbcfbb3ec256d7ec263625c0b6476.dir
size: 2967600
nfiles: 1
- path: data/model/
hash: md5
md5: 191092d9ed4218368408af7907aff787.dir
size: 719293313
md5: 6eb74e559b8264c7e3f4ebbd2e2dcdf5.dir
size: 723269665
nfiles: 36
- path: metrics/fit_metrics.json
hash: md5
md5: feb839b11d75217c02ee8b3d13362324
size: 223
md5: 84f3dd138e912a64d8ed2d648e6828d3
size: 222
generate_predictions:
cmd: python 3_generate_predictions.py
deps:
@ -115,13 +115,13 @@ stages:
size: 2464
- path: data/model
hash: md5
md5: 191092d9ed4218368408af7907aff787.dir
size: 719293313
md5: 6eb74e559b8264c7e3f4ebbd2e2dcdf5.dir
size: 723269665
nfiles: 36
- path: data/prepared_data
hash: md5
md5: 63af74a6d808f37d7ab0010300e3f6bf.dir
size: 37110480
md5: 836c0dde274564fe214246c62b318aa6.dir
size: 38248585
nfiles: 2
params:
configs/settings.yaml:
@ -133,8 +133,8 @@ stages:
outs:
- path: data/predictions/
hash: md5
md5: 794b1fb87d0693694782bef4d7443dfb.dir
size: 380445
md5: ef2bc137de75c36b7496e99048d16618.dir
size: 391474
nfiles: 1
generate_metrics:
cmd: python 4_generate_metrics.py
@ -145,13 +145,13 @@ stages:
size: 3447
- path: data/predictions
hash: md5
md5: 794b1fb87d0693694782bef4d7443dfb.dir
size: 380445
md5: ef2bc137de75c36b7496e99048d16618.dir
size: 391474
nfiles: 1
- path: data/prepared_data
hash: md5
md5: 63af74a6d808f37d7ab0010300e3f6bf.dir
size: 37110480
md5: 836c0dde274564fe214246c62b318aa6.dir
size: 38248585
nfiles: 2
params:
configs/settings.yaml:
@ -161,8 +161,8 @@ stages:
outs:
- path: metrics/metrics.json
hash: md5
md5: c0db9fdd237e4cae5692884d70bb4d4c
size: 221
md5: 0edb8ad9060a115617d41c72684b177c
size: 219
generate_scenerio_metrics:
cmd: python 5_generate_scenarios.py
deps: