Note
Go to the end to download the full example code or to run this example in your browser via Binder
Model Comparison: Classification¶
Experiment initialization and data preparation
from piml import Experiment
from piml.models import TreeClassifier
from piml.models import FIGSClassifier
from piml.models import XGB2Classifier
exp = Experiment()
exp.data_loader(data="TaiwanCredit", silent=True)
exp.data_summary(feature_exclude=["LIMIT_BAL", "SEX", "EDUCATION", "MARRIAGE", "AGE"], silent=True)
exp.data_prepare(target="FlagDefault", task_type="classification", silent=True)
Train Model
exp.model_train(TreeClassifier(), name="Tree")
exp.model_train(FIGSClassifier(), name="FIGS")
exp.model_train(XGB2Classifier(), name="XGB2")
Accuracy comparison with ACC
exp.model_compare(models=["Tree", "FIGS", "XGB2"], show="accuracy_plot", metric="ACC", figsize=(5, 4))
data:image/s3,"s3://crabby-images/8cfb2/8cfb2b82e7288a5b7e16779682a51523b56eb2cc" alt="Predictive Performance"
Accuracy comparison with AUC
exp.model_compare(models=["Tree", "FIGS", "XGB2"], show="accuracy_plot", metric="AUC", figsize=(5, 4))
data:image/s3,"s3://crabby-images/3e238/3e23861039fa232c661ee1e3f56ec5925814b96c" alt="Predictive Performance"
Accuracy comparison with F1
exp.model_compare(models=["Tree", "FIGS", "XGB2"], show="accuracy_plot", metric="F1", figsize=(5, 4))
data:image/s3,"s3://crabby-images/43503/43503f2f1798ceb889f3b4045e25f6e6833e3574" alt="Predictive Performance"
Overfit comparison with ACC metric
exp.model_compare(models=["Tree", "FIGS", "XGB2"], show="overfit",
slice_method="histogram", slice_feature="PAY_1",
bins=10, metric="ACC", original_scale=True, figsize=(5, 4))
data:image/s3,"s3://crabby-images/87380/87380197d853f41d05817509238c8e9cef71f708" alt="Overfit Comparison"
Overfit comparison with AUC metric
exp.model_compare(models=["Tree", "FIGS", "XGB2"], show="overfit",
slice_method="histogram", slice_feature="PAY_1",
metric="AUC", original_scale=True, figsize=(5, 4))
data:image/s3,"s3://crabby-images/ccfbb/ccfbb2a38eaf0425af8224ab0273eae37b1cf24a" alt="Overfit Comparison"
Reliability bandwidth comparison
exp.model_compare(models=["Tree", "FIGS", "XGB2"], show="reliability_bandwidth", figsize=(5, 4))
data:image/s3,"s3://crabby-images/ba827/ba8276498173a4a92bb36dafa139ed42374201ee" alt="Uncertainty Comparison"
Reliability diagram comparison
exp.model_compare(models=["Tree", "FIGS", "XGB2"], show="reliability_perf", bins=10, figsize=(5, 4))
data:image/s3,"s3://crabby-images/5e985/5e985374a28b79ea810d9a357e2118fac5e5f535" alt="Reliability Diagram: Testing Data"
Robustness comparison with default settings
exp.model_compare(models=["Tree", "FIGS", "XGB2"], show="robustness_perf", figsize=(5, 4))
data:image/s3,"s3://crabby-images/64d8f/64d8f4f0738fa00fd06c25766fd01aa868cc9090" alt="Model Performance: Perturb on All Features"
Robustness comparison on worst alpha-percent samples
exp.model_compare(models=["Tree", "FIGS", "XGB2"], show="robustness_perf_worst", alpha=0.3, figsize=(5, 4))
data:image/s3,"s3://crabby-images/5934a/5934a2c21c7040a30f64e3fe6a1d95f3e68b19dd" alt="30%-Worst Sample Performance"
Resilience comparison with worst-sample scenario
exp.model_compare(models=["Tree", "FIGS", "XGB2"], show="resilience_perf",
resilience_method="worst-sample", immu_feature=None, metric="AUC", figsize=(5, 4))
data:image/s3,"s3://crabby-images/69aea/69aea16f42717f3a309fe097079894e43ebb0ed4" alt="Resilience Test"
Resilience distance comparison with worst-sample scenario
exp.model_compare(models=["Tree", "FIGS", "XGB2"], show="resilience_distance",
resilience_method="worst-sample", metric="AUC", alpha=0.3, figsize=(5, 4))
data:image/s3,"s3://crabby-images/31a51/31a51a45248a51841a9dd6829e839043e7d6b9e7" alt="Distribution Shift: 30%-Worst vs Remaining"
Total running time of the script: ( 1 minutes 21.717 seconds)
Estimated memory usage: 120 MB