Ettore Mariotti
CNAM

Repository

conda create --name cnamenv
conda activate cnamenv
pip3 install matplotlib numpy pytorch_lightning torch torchmetrics interpret scikit-learn xgboost
from sklearn.datasets import fetch_california_housing
from sklearn.model_selection import train_test_split

# Fetch the California housing dataset and pull out features and target.
cali = fetch_california_housing()
x_full, y_full = cali['data'], cali['target']

# Split into train and test parts using train_test_split's default settings.
x_tr, x_te, y_tr, y_te = train_test_split(x_full, y_full)
from CNAM import CNAMSystem

# Build a CNAM model configured for the regression task.
cnam = CNAMSystem(
    num_steps=50,
    init_as_ebm=True,
    task='regression',
    batch_size=1000,
)

# Fit on the training split.
cnam.fit(x_tr, y_tr, max_epochs=100, lr=1e-2)
from sklearn.metrics import r2_score

# Predict on the held-out split and report the R^2 score.
y_preds = cnam.predict(x_te)
score = r2_score(y_true=y_te, y_pred=y_preds)
print(score)
0.7395
# Plot the model's shape functions on the test inputs, labelled with the
# dataset's feature names.
cnam.plot_shape_functions(
    x_te,
    feature_names=cali['feature_names'],
)
from sklearn.datasets import fetch_openml
from sklearn.preprocessing import LabelEncoder

# Fetch the MagicTelescope dataset from OpenML.
magic_dataset = fetch_openml('MagicTelescope')

x_full = magic_dataset['data']

# Encode the target labels with a LabelEncoder before training.
encoder = LabelEncoder()
y_full = encoder.fit_transform(magic_dataset['target'])

# Split into train and test parts using train_test_split's default settings.
x_tr, x_te, y_tr, y_te = train_test_split(x_full, y_full)
# Build a CNAM model configured for the classification task.
cnam = CNAMSystem(
    num_steps=50,
    init_as_ebm=True,
    task='classification',
    batch_size=1000,
)

# Fit on the training split.
cnam.fit(x_tr, y_tr, max_epochs=100, lr=1e-2)
from sklearn.metrics import roc_auc_score

# Get the classifier's predicted probabilities on the held-out split.
y_probas_preds = cnam.predict_proba(x_te)

# Score column 1 of the probabilities. Use `y_probas_preds` here, not
# `y_preds`: the latter holds the regression predictions from the
# California housing example and does not belong to this dataset.
score = roc_auc_score(y_te, y_probas_preds[:, 1])
print(score)
0.8991
# Plot the model's shape functions on the test inputs (passed via `.values`),
# labelled with the dataset's feature names.
cnam.plot_shape_functions(
    x_te.values,
    feature_names=magic_dataset['feature_names'],
)