run sap model with new data

This commit is contained in:
Michael Duong 2024-01-17 23:07:22 +00:00
parent 77888bb839
commit 0e31d67970
3 changed files with 24 additions and 24 deletions

View file

@@ -13,7 +13,7 @@ default:
 output_filepath: ./data/model/allmodels/
 problem_type: regression
 eval_metric: mean_squared_error #mean_absolute_error
-time_limit: 400
+time_limit: 600
 presets: medium_quality
 excluded_model_types: ['KNN', 'RF']
 infer_limit: 0.05

View file

@@ -22,7 +22,7 @@ default:
 # data_filepath: s3://retrofit-data-dev/sap_change_model/floor_area_clean_test.parquet
 # data_filepath: s3://retrofit-data-dev/sap_change_model/dataset_without_differencing.parquet
 # data_filepath: s3://retrofit-data-dev/sap_change_model/dataset_test.parquet
-data_filepath: s3://retrofit-data-dev/sap_change_model/dataset_refactor.parquet
+data_filepath: s3://retrofit-data-dev/sap_change_model/dataset.parquet
 train_proportion: 0.9
 output_train_filepath: ./data/prepared_data/train.parquet
 output_test_filepath: ./data/prepared_data/test.parquet

View file

@@ -20,7 +20,7 @@ stages:
 default.feature_processor.feature_processor_config.subsample_seed: 0
 default.feature_processor.feature_processor_config.target: sap_ending
 default.feature_processor.feature_processor_type: dataframe
-default.prepare_data.data_filepath: s3://retrofit-data-dev/sap_change_model/dataset_refactor.parquet
+default.prepare_data.data_filepath: s3://retrofit-data-dev/sap_change_model/dataset.parquet
 default.prepare_data.input_dataclient_type: aws-s3
 default.prepare_data.output_dataclient_type: local
 default.prepare_data.output_test_filepath: ./data/prepared_data/test.parquet
@@ -29,8 +29,8 @@ stages:
 outs:
 - path: data/prepared_data/
 hash: md5
-md5: 5d29397fcafe6b3dc4d51ffaf1e55239.dir
-size: 39303409
+md5: d047420c632d91203199b9a93b6b0134.dir
+size: 39476967
 nfiles: 2
 build_model:
 cmd: python 2_build_model.py
@@ -41,8 +41,8 @@ stages:
 size: 4149
 - path: data/prepared_data
 hash: md5
-md5: 5d29397fcafe6b3dc4d51ffaf1e55239.dir
-size: 39303409
+md5: d047420c632d91203199b9a93b6b0134.dir
+size: 39476967
 nfiles: 2
 params:
 configs/build_model.yaml:
@@ -58,7 +58,7 @@ stages:
 output_filepath: ./data/model/allmodels/
 problem_type: regression
 eval_metric: mean_squared_error
-time_limit: 400
+time_limit: 600
 presets: medium_quality
 excluded_model_types:
 - KNN
@@ -68,13 +68,13 @@ stages:
 outs:
 - path: data/model/
 hash: md5
-md5: 6265dafedf579905c31c676e81c2a9c7.dir
-size: 344212462
+md5: 0ad794c5498acfcc79893a371b29be62.dir
+size: 372199625
 nfiles: 24
 - path: metrics/fit_metrics.json
 hash: md5
-md5: 5cd6b92af1b1df753e20e9ea33629c4d
-size: 224
+md5: 534fa836074bdd9795b5879f0c479681
+size: 225
 generate_predictions:
 cmd: python 3_generate_predictions.py
 deps:
@@ -84,13 +84,13 @@ stages:
 size: 2464
 - path: data/model
 hash: md5
-md5: 6265dafedf579905c31c676e81c2a9c7.dir
-size: 344212462
+md5: 0ad794c5498acfcc79893a371b29be62.dir
+size: 372199625
 nfiles: 24
 - path: data/prepared_data
 hash: md5
-md5: 5d29397fcafe6b3dc4d51ffaf1e55239.dir
-size: 39303409
+md5: d047420c632d91203199b9a93b6b0134.dir
+size: 39476967
 nfiles: 2
 params:
 configs/settings.yaml:
@@ -102,8 +102,8 @@ stages:
 outs:
 - path: data/predictions/
 hash: md5
-md5: b130faf5117b06897b2deed97f5868ee.dir
-size: 367038
+md5: 25ac7334855d5eacc5fd9e2879900f33.dir
+size: 367393
 nfiles: 1
 generate_metrics:
 cmd: python 4_generate_metrics.py
@@ -114,13 +114,13 @@ stages:
 size: 3484
 - path: data/predictions
 hash: md5
-md5: b130faf5117b06897b2deed97f5868ee.dir
-size: 367038
+md5: 25ac7334855d5eacc5fd9e2879900f33.dir
+size: 367393
 nfiles: 1
 - path: data/prepared_data
 hash: md5
-md5: 5d29397fcafe6b3dc4d51ffaf1e55239.dir
-size: 39303409
+md5: d047420c632d91203199b9a93b6b0134.dir
+size: 39476967
 nfiles: 2
 params:
 configs/settings.yaml:
@@ -130,8 +130,8 @@ stages:
 outs:
 - path: metrics/metrics.json
 hash: md5
-md5: 3900cc1697d6d7308728b3d5b3025f85
-size: 224
+md5: a6fa095b4cc44e6dd7828708f8cca18b
+size: 222
 startup_cleanup:
 cmd: python 0_startup_cleanup.py
 deps: