From 63b928c828c4e8ae9ccc01f621f8d49494a0aa25 Mon Sep 17 00:00:00 2001 From: Michael Duong Date: Sun, 10 Sep 2023 10:49:19 +0000 Subject: [PATCH] test another experiment --- .../pipeline/src/configs/prepare_data.yaml | 2 +- modules/ml-pipeline/src/pipeline/src/dvc.lock | 34 +++++++++---------- 2 files changed, 18 insertions(+), 18 deletions(-) diff --git a/modules/ml-pipeline/src/pipeline/src/configs/prepare_data.yaml b/modules/ml-pipeline/src/pipeline/src/configs/prepare_data.yaml index 6a777af..4336185 100644 --- a/modules/ml-pipeline/src/pipeline/src/configs/prepare_data.yaml +++ b/modules/ml-pipeline/src/pipeline/src/configs/prepare_data.yaml @@ -1,6 +1,6 @@ dataclient_type: minio data_location: s3://dev_bucket -train_proportion: 0.9 +train_proportion: 0.1 output_train_filepath: ./data/prepared_data/train.parquet output_test_filepath: ./data/prepared_data/test.parquet diff --git a/modules/ml-pipeline/src/pipeline/src/dvc.lock b/modules/ml-pipeline/src/pipeline/src/dvc.lock index 0092858..956ef86 100644 --- a/modules/ml-pipeline/src/pipeline/src/dvc.lock +++ b/modules/ml-pipeline/src/pipeline/src/dvc.lock @@ -11,12 +11,12 @@ stages: configs/prepare_data.yaml: output_test_filepath: ./data/prepared_data/test.parquet output_train_filepath: ./data/prepared_data/train.parquet - train_proportion: 0.9 + train_proportion: 0.1 outs: - path: data/prepared_data/ hash: md5 - md5: b33066afcf18879beb7738317b840957.dir - size: 34895 + md5: 91a6bd7128a094ad083557b08e2b97e6.dir + size: 34952 nfiles: 2 build_model: cmd: python build_model.py @@ -27,8 +27,8 @@ stages: size: 3576 - path: data/prepared_data hash: md5 - md5: b33066afcf18879beb7738317b840957.dir - size: 34895 + md5: 91a6bd7128a094ad083557b08e2b97e6.dir + size: 34952 nfiles: 2 params: configs/build_model.yaml: @@ -41,7 +41,7 @@ stages: outs: - path: data/model/ hash: md5 - md5: 9e7589253302a779852158756c2a7bb9.dir + md5: fb041f589f43031bc176c2ca73599950.dir size: 1096 nfiles: 1 generate_predictions: @@ -49,13 +49,13 @@ stages: deps: - path: data/model hash: md5 - md5: 9e7589253302a779852158756c2a7bb9.dir + md5: fb041f589f43031bc176c2ca73599950.dir size: 1096 nfiles: 1 - path: data/prepared_data hash: md5 - md5: b33066afcf18879beb7738317b840957.dir - size: 34895 + md5: 91a6bd7128a094ad083557b08e2b97e6.dir + size: 34952 nfiles: 2 - path: generate_predictions.py hash: md5 @@ -68,21 +68,21 @@ stages: outs: - path: data/predictions/ hash: md5 - md5: b9c93c8c5fc441bdc0fb96cee19b1871.dir - size: 2121 + md5: e03eac67fceabe6c3d504446ae32f344.dir + size: 5384 nfiles: 1 generate_metrics: cmd: python generate_metrics.py deps: - path: data/predictions hash: md5 - md5: b9c93c8c5fc441bdc0fb96cee19b1871.dir - size: 2121 + md5: e03eac67fceabe6c3d504446ae32f344.dir + size: 5384 nfiles: 1 - path: data/prepared_data hash: md5 - md5: b33066afcf18879beb7738317b840957.dir - size: 34895 + md5: 91a6bd7128a094ad083557b08e2b97e6.dir + size: 34952 nfiles: 2 - path: generate_metrics.py hash: md5 @@ -95,5 +95,5 @@ stages: outs: - path: metrics/metrics.json hash: md5 - md5: 310e17ea14d1669035ab3c44c0204f57 - size: 183 + md5: 4adf69df1e693cf9ceb7ce68f6311bf6 + size: 181