💡 Recommended Environment:
Run this notebook in the model_eval_suite Conda environment for best results.
See setup instructions in the Usage Guide.

⚠️ If you're running this outside Conda, you can install dependencies manually: Uncomment the line below to install from the root requirements file.

# !pip install -r ../../requirements.txt

🧪 Model Evaluation Suite Demo Notebook¶

This notebook demonstrates how to use the Model Evaluation Suite to:

  • Prepare and validate input data.
  • Run a full modeling pipeline using YAML configuration files.
  • Log models and artifacts with MLflow.
  • Evaluate a production candidate against a holdout dataset.
  • Optionally compare against a baseline model for performance drift or uplift.
📦 Project Structure

This notebook expects the following directories and files to exist:

  • config/: contains user-defined YAML configuration files.
  • data/holdout_data/: contains the holdout CSV used in validation.
  • mlruns/: MLflow tracking output.
⚙️ Workflow Overview
  1. Prep Data (Optional) – If you're starting from raw CSVs, run data prep to split them into train/test/holdout sets and cache the results.
  2. Run Experiment – Train model(s) as defined in the YAML config using run_experiment.
  3. Validate Champion – Evaluate the registered MLflow model against the holdout set using validate_champion.

YAML-driven configuration allows for full modularity, reproducibility, and MLflow registry integration.
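
For orientation, the three stages map onto the three package entrypoints demonstrated later in this notebook. A minimal end-to-end sketch (using the demo's own config paths; substitute your own) looks like this:

from model_eval_suite import prep_data, run_experiment, validate_champion

# 1. Optional: split raw data into train/test/holdout sets
prep_data(config_path="config/data_prep.yaml")

# 2. Train, evaluate, and register a model as defined in its YAML config
run_experiment(user_config_path="config/classifier/xgboost.yaml")

# 3. Validate the registered champion against the holdout set
validate_champion(config_path="config/xgb_validation.yaml")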

📜 Configuration Setup¶

This notebook is driven by modular YAML configuration files, which serve as the central control system for the evaluation suite.


These YAMLs are edited upfront to define the behavior of each stage in the pipeline. See config_resources/ in the repository for further guidance.

The YAML configuration governs:

  • Filepaths for all inputs and outputs (train/test/holdout, plots, reports, logs)
  • Model architecture, hyperparameters, and estimator type
  • Preprocessing and feature engineering behavior
  • Optional diagnostics modules (e.g., VIF, SHAP, permutation importance)
  • MLflow tracking settings (URI, run tags, experiment names)
  • Model type and parameters
  • Plotting controls and dashboard rendering options
  • Evaluation behavior: segmentation columns, scoring metrics, baseline model comparison

Prebuilt templates are provided. You can download them from config_resources/config.zip and use them as-is or customize them to match your workflow.
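
If you prefer to inspect or tweak a template programmatically rather than by hand, a minimal sketch (assuming PyYAML is installed and a template such as config/classifier/logreg.yaml has been unpacked; the output filename below is illustrative) is:

import yaml

# Load a prebuilt template, inspect its top-level blocks, and save a customized copy
with open("config/classifier/logreg.yaml") as f:
    cfg = yaml.safe_load(f)

print(list(cfg.keys()))  # top-level blocks; exact keys depend on the template

with open("config/classifier/logreg_custom.yaml", "w") as f:
    yaml.safe_dump(cfg, f, sort_keys=False)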

🔧 Custom Feature Engineering¶

This suite supports plug-and-play custom transformers via the feature_engineering block in your YAML.


Your transformer should follow scikit-learn's fit/transform API and be referenced like this:

feature_engineering:
  run: true
  module: "my_project.custom_features"
  class_name: "MyFeatureTransformer"

See docs/feature_engineering.md for a full example.
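
For a rough idea of the contract, a minimal transformer might look like the sketch below (the class name matches the YAML snippet above; the columns and derived feature are purely illustrative):

from sklearn.base import BaseEstimator, TransformerMixin

class MyFeatureTransformer(BaseEstimator, TransformerMixin):
    """Illustrative transformer that adds one engineered ratio feature."""

    def fit(self, X, y=None):
        # Nothing to learn in this example; return self per the sklearn contract
        return self

    def transform(self, X):
        X = X.copy()
        # Placeholder columns -- replace with features from your own dataset
        X["feature_ratio"] = X["feature_a"] / (X["feature_b"] + 1)
        return X

Because it respects the fit/transform interface, a transformer like this can be slotted into the suite's pipeline without changes to the runner code.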

📚 Dashboard Guidance¶

📉 Pre-Model Diagnostics Dashboard¶

This optional module runs before any model training or validation occurs. It provides key insights into the integrity and statistical structure of your input data. It is driven by the pre_model_diagnostics block in your YAML and is best used in notebook workflows.

  • Overview
    Summary of the input dataset, schema, and basic shape metadata.

  • Missingness
    Tabulates and visualizes missing values by column, with percent missing and optional flag encoding hints.

  • Collinearity
    Includes:

    • Pearson correlation heatmap
    • Variance Inflation Factor (VIF) plot to detect multicollinearity risks
  • Distribution Quality
    Visualizes skewness and potential distribution anomalies:

    • Target column distribution
    • Numerical feature histograms
    • Outlier detection using IQR boxplots
  • Evaluation Plots (via PlotViewer)
    This tab includes all advanced diagnostics plots:

    • VIF plot
    • Pearson heatmap
    • Outlier boxplots
    • Feature-wise skew distributions

These diagnostics are critical for spotting leakage, encoding flaws, and redundancy before any modeling occurs.
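
As a point of reference, a standalone sketch of the kind of VIF check the Collinearity tab performs (assuming pandas and statsmodels are installed; this is not the suite's own code) is:

import pandas as pd
import statsmodels.api as sm
from statsmodels.stats.outliers_influence import variance_inflation_factor

# Numeric columns from the demo's train split; drop the target column before interpreting
X = pd.read_csv("data/dev_data/train_data.csv").select_dtypes("number").dropna()
X = sm.add_constant(X)  # add an intercept so VIFs are computed against centered features

vif = pd.DataFrame({
    "feature": X.columns,
    "VIF": [variance_inflation_factor(X.values, i) for i in range(X.shape[1])],
})
print(vif.sort_values("VIF", ascending=False))  # values above ~5-10 flag multicollinearity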

📊 Model Evaluation Dashboard¶

This dashboard provides an interactive summary of the model trained in the experimental run. It visualizes performance on the test set and includes explainability tools to support model diagnostics and stakeholder communication.

Summary
  • High-level performance metrics (e.g., R², MAE for regression or Accuracy, F1 for classification)
  • If cross-validation is enabled, a boxplot of fold-level scores is included
  • If a baseline model is configured:
    • Delta scores are annotated beside the champion’s metrics
    • The same metrics are displayed for the baseline model
    • Any drop or improvement relative to the current champion is highlighted
Importance
  • Feature importance scores from:
    • SHAP bar charts (if SHAP enabled)
    • Coefficients (for linear models)
    • Permutation importance (if enabled)
  • Useful for debugging and stakeholder reporting
Explainability
  • SHAP Impact Summary Plot for understanding global feature effects
  • Omitted if SHAP is disabled in your config
Plotviewers

Model Performance Plots

  • Interactive evaluation visuals via the plot viewer widget:
    • ROC & PR curves (classification)
    • Residuals, prediction vs. truth (regression)
    • Confusion matrix, threshold plots, calibration, etc.

Distribution Plots

  • Always included
  • Shows feature distributions in the holdout set
  • Supports quick detection of skew, class imbalance, or feature leakage
Metadata
  • Full configuration summary:
    • YAML config snapshot
    • Model and version from MLflow
    • Holdout dataset used
    • Run ID and export paths
Alerts
  • Automated audit system that surfaces:
    • Warning thresholds (e.g., F1 below expected)
    • Cross-validation variance anomalies
    • Drift against baseline scores

📌 Core Imports¶

You can access the main runners directly from the package thanks to a clean interface exposed via __init__.py. These entrypoints allow you to run each stage of the pipeline from a single import.

In [1]:
from model_eval_suite import run_experiment, validate_champion, prep_data
In [2]:
import os
# Change the working directory to the project root
os.chdir('..')

📤 Data Preparation¶

If you're starting from raw CSVs, you can use the suite's built-in preprocessing tool, data_prep.py, to split the data into training, testing, and holdout sets.

Skip this step if you've already created your train, test, and holdout CSVs.

In [3]:
prep_data(config_path="config/data_prep.yaml")
Loading raw data from: data/input_data/salifort_50k.csv
Performing initial holdout split...
Performing train/test split on development data...
✅ Train data saved to: data/dev_data/train_data.csv (30000 rows)
✅ Test data saved to: data/dev_data/test_data.csv (10000 rows)
✅ Holdout data saved to: data/holdout_data/holdout_data.csv (10000 rows)

⚙️ Model Experiment Runs (Demo)¶

This demo walks through multiple model runs using the salifort_50k dataset. Although the dataset is best suited to classification, it is used for both classification and regression pipelines to demonstrate flexibility and YAML-driven control.

We run the following models using the evaluation suite:

🔍 Classifier Models¶

  • Gaussian Naive Bayes
    Config: config/classifier/guas_nb.yaml

  • Logistic Regression
    Config: config/classifier/logreg.yaml

  • XGBoost Classifier
    Config: config/classifier/xgboost.yaml

📈 Regressor Models¶

  • Linear Regression
    Config: config/regressor/linreg.yaml

  • XGBoost Regressor
    Config: config/regressor/xgboost_reg.yaml

Each model triggers:

  • An optional Pre-Model Diagnostics Dashboard (if enabled in YAML)
  • A complete Evaluation Dashboard with explainability, distributions, and exportable artifacts

At the end of the demo, we use the champion validation system to validate and crown the two XGBoost models — one for classification, one for regression.

All behavior is controlled by the YAML configs. See the config/ directory or config_resources/config.zip for template downloads.

In [4]:
# ========== Naive Bayes ==========
run_experiment(user_config_path="config/classifier/guas_nb.yaml")
Registered model 'gnb_demo_01' already exists. Creating a new version of this model...
Created version '4' of model 'gnb_demo_01'.
⚠️ SHAP explainer creation failed: The passed model is not callable and cannot be analyzed directly with the given masker! Model: GaussianNB()
✅ Run complete: `gnb_demo_01`
📁 Artifacts saved to:
   - Plots:   exports/plots/gnb_demo_01
   - Reports: exports/reports/gnb_demo_01
📦 MLflow model: `gnb_demo_01`

--- Rendering Dashboards ---

⚠️ SHAP Error Handling¶


Some models — such as SVC, SVR, or GaussianNB — do not expose traditional feature importance attributes or are incompatible with SHAP explainability tools.

This suite handles such situations gracefully:

  • The SHAP tab will be skipped silently if no compatible features are found.
  • A warning will be logged (but not treated as a failure).
  • All other evaluation plots and metrics will still render normally.

This ensures that the workflow remains robust even for models with limited explainability tooling.
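
Conceptually, the guard looks like the sketch below (not the suite's actual code): explainer creation is attempted, and any failure is downgraded to a warning so the rest of the dashboard still renders.

import shap

def try_build_explainer(model, X_background):
    """Return a SHAP explainer when the model is supported, else None."""
    try:
        return shap.Explainer(model, X_background)
    except Exception as exc:
        # Downgrade to a warning; the SHAP tab is simply skipped downstream
        print(f"⚠️ SHAP explainer creation failed: {exc}")
        return None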

In [5]:
# ========== Logistic Regression ==========
run_experiment(user_config_path="config/classifier/logreg.yaml")
Registered model 'logreg_baseline_01' already exists. Creating a new version of this model...
Created version '4' of model 'logreg_baseline_01'.
✅ Run complete: `logreg_baseline_01`
📁 Artifacts saved to:
   - Plots:   exports/plots/logreg_baseline_01
   - Reports: exports/reports/logreg_baseline_01
📦 MLflow model: `logreg_baseline_01`

--- Rendering Dashboards ---
In [6]:
# ========== XGBoost Classifier ==========

run_experiment(user_config_path="config/classifier/xgboost.yaml")
Fitting 5 folds for each of 108 candidates, totalling 540 fits
Registered model 'xgb_demo_01' already exists. Creating a new version of this model...
Created version '4' of model 'xgb_demo_01'.
✅ Run complete: `xgb_demo_01`
📁 Artifacts saved to:
   - Plots:   exports/plots/xgb_demo_01
   - Reports: exports/reports/xgb_demo_01
📦 MLflow model: `xgb_demo_01`

--- Rendering Dashboards ---

🔁 Cross-Validation Insight¶


If hyperparameter tuning via cross-validation is enabled in the config (hyperparameter_tuning.run: true), the dashboard will include an additional boxplot in the Summary tab.

This plot visualizes the distribution of CV scores across folds for the best-performing parameter set, offering a quick diagnostic of stability and performance variance.
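
The same view can be reproduced outside the dashboard from any fitted scikit-learn search object; the self-contained sketch below (toy data, not the demo's pipeline) pulls the per-fold scores for the best candidate out of cv_results_:

import matplotlib.pyplot as plt
from sklearn.datasets import make_classification
from sklearn.linear_model import LogisticRegression
from sklearn.model_selection import GridSearchCV

# Toy search standing in for the tuned pipeline configured in the YAML
X, y = make_classification(n_samples=300, random_state=0)
search = GridSearchCV(LogisticRegression(max_iter=500), {"C": [0.1, 1.0, 10.0]}, cv=5)
search.fit(X, y)

# Per-fold test scores for the best-performing parameter set
best = search.best_index_
fold_scores = [search.cv_results_[f"split{i}_test_score"][best] for i in range(search.n_splits_)]

plt.boxplot(fold_scores)
plt.ylabel("CV fold score")
plt.title("Fold scores for best parameter set")
plt.show()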

In [7]:
# ========== Linear Regression ==========
run_experiment(user_config_path="config/regressor/linreg.yaml")
Registered model 'linreg_demo_01' already exists. Creating a new version of this model...
Created version '4' of model 'linreg_demo_01'.
✅ Run complete: `linreg_demo_01`
📁 Artifacts saved to:
   - Plots:   exports/plots/linreg_demo_01
   - Reports: exports/reports/linreg_demo_01
📦 MLflow model: `linreg_demo_01`

--- Rendering Dashboards ---

🚨 Automated Alert Auditing¶


The validation dashboard includes an Alerts tab that surfaces automated audit checks on your model's performance.

These alerts are designed to flag potential concerns such as:

  • Very low precision or recall
  • High class imbalance
  • Overfitting indicators (e.g., large delta between train/test scores)
  • Underwhelming performance against a baseline (if provided)

This system provides a lightweight, interpretable review of model quality without requiring custom code or manual thresholding.
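
A stripped-down illustration of this kind of audit is sketched below; the metric names and thresholds are arbitrary examples, not the suite's defaults.

def audit_metrics(metrics, baseline=None):
    """Return human-readable alerts for a dict of scores (illustrative thresholds only)."""
    alerts = []
    if metrics.get("f1", 1.0) < 0.6:
        alerts.append(f"Low F1 score: {metrics['f1']:.3f}")
    if metrics.get("train_score", 0.0) - metrics.get("test_score", 0.0) > 0.10:
        alerts.append("Possible overfitting: train/test gap exceeds 0.10")
    if baseline:
        for name, base_value in baseline.items():
            if name in metrics and metrics[name] < base_value:
                alerts.append(f"{name} underperforms the baseline ({metrics[name]:.3f} < {base_value:.3f})")
    return alerts

print(audit_metrics({"f1": 0.55, "train_score": 0.95, "test_score": 0.80}, baseline={"f1": 0.60}))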

In [8]:
# ========== XGBoost Regressor ==========
run_experiment(user_config_path="config/regressor/xgboost_reg.yaml")
Fitting 5 folds for each of 108 candidates, totalling 540 fits
Registered model 'xgbreg_demo_01' already exists. Creating a new version of this model...
Created version '4' of model 'xgbreg_demo_01'.
✅ Run complete: `xgbreg_demo_01`
📁 Artifacts saved to:
   - Plots:   exports/plots/xgbreg_demo_01
   - Reports: exports/reports/xgbreg_demo_01
📦 MLflow model: `xgbreg_demo_01`

--- Rendering Dashboards ---

🏆 Champion Model Validation¶

This section evaluates a registered MLflow model (your champion) against a holdout dataset using a dedicated validation YAML configuration.

Key Features¶

  • Uses its own standalone YAML file (separate from training experiments)
  • Accepts an optional baseline model for drift detection or performance benchmarking
  • Automatically generates:
    • Confidence interval plots (if applicable)
    • Baseline comparison deltas (if a baseline model is provided)
    • Alert audits for performance degradation or instability
  • Produces a complete interactive dashboard with:
    • Summary metrics and cross-validation visualizations
    • Explainability and feature importance plots
    • Distribution visualizations for target and predictions
    • Full configuration and environment metadata
  • Tags the evaluated model in the MLflow Registry using your specified production_tag

📍 This workflow is ideal for pre-deployment validation, regression testing, and model promotion decisions.

Validation Configurations Used in This Demo¶

  • config/xgb_validation.yaml – XGBoost classifier
  • config/xgb_reg_validation.yaml – XGBoost regressor
In [9]:
# ========== Validate Classifier Champion Model ==========
validate_champion(config_path="config/xgb_validation.yaml")
--- 🚀 Starting Champion Model Validation: xgb_demo_01_production_validation ---
Loading model from: models:/xgb_demo_01/1
Loading holdout data from: data/holdout_data/holdout_data.csv
Loading baseline model from: models:/logreg_baseline_01/1
Evaluating baseline model...
Detected task type: classification
Generating final assessment plots...
Exporting validation artifacts...
Tagging model version with status: 'Production-Candidate'
--- ✅ Validation Complete for xgb_demo_01 v1 ---
--- 📊 Rendering Validation Dashboard ---
In [10]:
# ========== Validate Regressor Champion Model ==========
validate_champion(config_path="config/xgb_reg_validation.yaml")
--- 🚀 Starting Champion Model Validation: xgbreg_demo_01_production_validation ---
Loading model from: models:/xgbreg_demo_01/1
Loading holdout data from: data/holdout_data/holdout_data.csv
Loading baseline model from: models:/linreg_demo_01/1
Evaluating baseline model...
Detected task type: regression
Generating final assessment plots...
⚠️ Prediction interval plot is only available for ensemble models like RandomForestRegressor.
Exporting validation artifacts...
Tagging model version with status: 'Production-Candidate'
--- ✅ Validation Complete for xgbreg_demo_01 v1 ---
--- 📊 Rendering Validation Dashboard ---

✅ Wrap-Up and Next Steps¶

You’ve now run multiple models through the full suite — from preprocessing and diagnostics to evaluation and champion validation.

This notebook demonstrates the flexibility of the system, including:

  • YAML-driven configuration at every stage
  • Reusable pipelines for both classification and regression tasks
  • Support for custom feature engineering and hyperparameter tuning
  • Interactive dashboards for diagnostics and final reporting
  • MLflow integration for model tracking and registry updates

Next Steps¶

  • Test additional models by duplicating a config YAML.
  • Customize features using your own transformers or fe_config modules.
  • Enable advanced diagnostics, SHAP, and permutation importance as needed.
  • Package and deploy validated models via the MLflow registry.

For more examples and config templates, explore the config_resources/ folder or the full README.md.

Questions or suggestions? Feel free to submit an issue or feature request in the repository.