import sys
sys.path.append("../../")

import numpy as np
import matplotlib.pyplot as plt
from maxwent import classification_2d, plot_classification_2d

# Load the 2D toy classification data: training inputs and labels, plus the
# x_ood points on which predictions and uncertainties are evaluated below
# (presumably out-of-distribution samples -- confirm against maxwent).
x_train, y_train, x_ood = classification_2d()

# Draw the dataset, attach the legend, then render the figure.
ax = plot_classification_2d(x_train, y_train, x_ood)
ax.legend(loc="upper right")
plt.show()

import tensorflow as tf

# Baseline binary classifier: 2 input features -> two Dense(100) + ReLU
# stages -> a single sigmoid output unit.
base_net = tf.keras.Sequential()
for layer in (
    tf.keras.layers.Input(shape=(2,)),
    tf.keras.layers.Dense(100),
    tf.keras.layers.ReLU(),
    tf.keras.layers.Dense(100),
    tf.keras.layers.ReLU(),
    tf.keras.layers.Dense(1, activation="sigmoid"),
):
    # Layers are created and added in the listed order.
    base_net.add(layer)

# Print the layer table and parameter counts.
base_net.summary()

Model: "sequential"

┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
│ dense (Dense)                   │ (None, 100)            │           300 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ re_lu (ReLU)                    │ (None, 100)            │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_1 (Dense)                 │ (None, 100)            │        10,100 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ re_lu_1 (ReLU)                  │ (None, 100)            │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_2 (Dense)                 │ (None, 1)              │           101 │
└─────────────────────────────────┴────────────────────────┴───────────────┘

 Total params: 10,501 (41.02 KB)

 Trainable params: 10,501 (41.02 KB)

 Non-trainable params: 0 (0.00 B)

# Train the baseline network with Adam (learning rate 1e-3) on the binary
# cross-entropy loss for 250 silent epochs.
adam = tf.keras.optimizers.Adam(learning_rate=0.001)
base_net.compile(optimizer=adam, loss="bce")
# The trailing ";" is kept from the notebook cell (presumably to hide the
# echoed return value of fit).
base_net.fit(x=x_train, y=y_train, epochs=250, verbose=0);

# Sigmoid outputs of the baseline network on the evaluation points.
y_pred = base_net.predict(x_ood, verbose=0)

# Overlay the evaluation points on the dataset plot, coloured by the
# predicted value.
ax = plot_classification_2d(x_train, y_train, x_ood)
ood_first, ood_second = x_ood[:, 0], x_ood[:, 1]
unc = ax.scatter(ood_first, ood_second, c=y_pred, cmap="seismic")
plt.colorbar(unc, ax=ax, label='Predicted class')
ax.legend(loc="upper left")
plt.show()

# Flatten the (n, 1) sigmoid outputs into a 1-D vector of probabilities.
y_pred = base_net.predict(x_ood, verbose=0).ravel()

# Binary entropy of each prediction, used as the uncertainty score.
# eps keeps both logarithms finite when a prediction saturates at 0 or 1.
eps = 1e-8
p_pos = y_pred
p_neg = 1 - y_pred
uncertainties = -p_pos * np.log(p_pos + eps) - p_neg * np.log(p_neg + eps)

# Colour the evaluation points by their entropy.
ax = plot_classification_2d(x_train, y_train, x_ood)
ood_first, ood_second = x_ood[:, 0], x_ood[:, 1]
unc = ax.scatter(ood_first, ood_second, c=uncertainties, cmap="Blues")
plt.colorbar(unc, ax=ax, label='Uncertainty')
ax.legend(loc="upper left")
plt.show()

# Deep ensemble: five networks with the baseline architecture, each compiled
# and trained separately with the same settings as the baseline.
n_members = 5
deep_ens = []

for _ in range(n_members):
    # clone_model copies the architecture of base_net into a new model
    # (per the Keras docs it creates new layers and weights rather than
    # sharing the trained ones -- confirm for the installed version).
    net = tf.keras.models.clone_model(base_net)
    adam = tf.keras.optimizers.Adam(learning_rate=0.001)
    net.compile(optimizer=adam, loss="bce")
    net.fit(x=x_train, y=y_train, epochs=250, verbose=0);
    deep_ens.append(net)

# One prediction array per ensemble member.
y_preds = [net.predict(x_ood, batch_size=1000, verbose=0) for net in deep_ens]

# Disagreement between members: standard deviation taken across the
# ensemble axis (axis 0 of the stacked predictions).
uncertainties = np.stack(y_preds, axis=0).std(axis=0)

# Colour the evaluation points by the ensemble standard deviation.
ax = plot_classification_2d(x_train, y_train, x_ood)
ood_first, ood_second = x_ood[:, 0], x_ood[:, 1]
unc = ax.scatter(ood_first, ood_second, c=uncertainties, cmap="Blues")
plt.colorbar(unc, ax=ax, label='Uncertainty')
ax.legend(loc="upper left")
plt.show()

from maxwent import set_maxwent_model

# Build the MaxWEnt counterpart of the trained baseline network and print its
# layer table. In the captured summary the Dense layers appear as
# DenseMaxWEnt layers with additional non-trainable parameters.
# NOTE(review): whether base_net's trained weights are copied or shared by
# set_maxwent_model is not visible here -- confirm against the maxwent docs.
stoch_net = set_maxwent_model(base_net)
stoch_net.summary()

Model: "sequential_1"

┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
│ dense_3_mwe (DenseMaxWEnt)      │ (None, 100)            │           604 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ re_lu_2_mwe (ReLU)              │ (None, 100)            │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_4_mwe (DenseMaxWEnt)      │ (None, 100)            │        30,200 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ re_lu_3_mwe (ReLU)              │ (None, 100)            │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_5_mwe (DenseMaxWEnt)      │ (None, 1)              │        10,202 │
└─────────────────────────────────┴────────────────────────┴───────────────┘

 Total params: 41,006 (160.18 KB)

 Trainable params: 10,501 (41.02 KB)

 Non-trainable params: 30,505 (119.16 KB)

from maxwent import MaxWEnt

# Wrap the stochastic network in the MaxWEnt trainer with lambda_ = 1.
# NOTE(review): lambda_ presumably weights the weight-entropy term of the
# objective -- confirm against the maxwent documentation.
mwe = MaxWEnt(stoch_net, lambda_=1.0)

# Same optimizer and loss as the baseline, trained for 2500 silent epochs.
adam = tf.keras.optimizers.Adam(learning_rate=0.001)
mwe.compile(optimizer=adam, loss="bce")
mwe.fit(x_train, y_train, epochs=2500, verbose=0);

# Estimate the predictive probability by averaging n_sample calls to
# mwe.predict, each with its own seed (presumably one stochastic weight draw
# per call -- confirm against the maxwent docs).
n_sample = 50

y_preds = [
    mwe.predict(x_ood, batch_size=1000, seed=123 + i)
    for i in range(n_sample)
]
y_pred = np.mean(y_preds, axis=0)

# Binary entropy of the averaged prediction, used as the uncertainty score.
# The epsilon inside each log matches the baseline entropy computation
# earlier in this file. Without it, a prediction saturated at exactly 0 or 1
# gives log(0) = -inf and 0 * -inf = NaN, which raises "divide by zero" /
# "invalid value" RuntimeWarnings and leaves NaN colours in the scatter plot.
eps = 1e-8
uncertainties = (
    -y_pred * np.log(y_pred + eps)
    - (1 - y_pred) * np.log(1 - y_pred + eps)
)

# Colour the evaluation points by their entropy.
ax = plot_classification_2d(x_train, y_train, x_ood)
unc = ax.scatter(x_ood[:, 0], x_ood[:, 1], c=uncertainties, cmap="Blues")
plt.colorbar(unc, ax=ax, label='Uncertainty')
ax.legend(loc="upper right")
plt.show()

RuntimeWarning: divide by zero encountered in log
RuntimeWarning: invalid value encountered in multiply

# Averaged prediction over 50 samples, computed by the library helper
# instead of the manual sampling loop.
y_pred = mwe.predict_mean(x_ood, batch_size=1000, clip=None, n_sample=50)

# Binary entropy of the averaged prediction, used as the uncertainty score.
# The epsilon inside each log matches the baseline entropy computation
# earlier in this file. Without it, a prediction saturated at exactly 0 or 1
# gives log(0) = -inf and 0 * -inf = NaN, which raises "divide by zero" /
# "invalid value" RuntimeWarnings and leaves NaN colours in the scatter plot.
eps = 1e-8
uncertainties = (
    -y_pred * np.log(y_pred + eps)
    - (1 - y_pred) * np.log(1 - y_pred + eps)
)

# Colour the evaluation points by their entropy.
ax = plot_classification_2d(x_train, y_train, x_ood)
unc = ax.scatter(x_ood[:, 0], x_ood[:, 1], c=uncertainties, cmap="Blues")
plt.colorbar(unc, ax=ax, label='Uncertainty')
ax.legend(loc="upper right")
plt.show()

RuntimeWarning: divide by zero encountered in log
RuntimeWarning: invalid value encountered in multiply

# Uncertainty as the standard deviation of the MaxWEnt predictions over
# 50 samples, flattened to one value per evaluation point.
std_pred = mwe.predict_std(x_ood, batch_size=1000, clip=None, n_sample=50)
uncertainties = std_pred.ravel()

# Colour the evaluation points by that standard deviation.
ax = plot_classification_2d(x_train, y_train, x_ood)
ood_first, ood_second = x_ood[:, 0], x_ood[:, 1]
unc = ax.scatter(ood_first, ood_second, c=uncertainties, cmap="Blues")
plt.colorbar(unc, ax=ax, label='Uncertainty')
ax.legend(loc="upper right")
plt.show()

# Rebuild the stochastic network and the MaxWEnt wrapper from the baseline,
# this time fitting the SVD parametrization before training.
stoch_net = set_maxwent_model(base_net)
mwe = MaxWEnt(stoch_net, lambda_=1.)

# NOTE(review): fit_svd only receives the training inputs; presumably it
# estimates an SVD-based parametrization from them -- confirm against the
# maxwent docs.
mwe.fit_svd(x_train)

# Use binary cross-entropy, like every other model in this file: the network
# ends in a sigmoid unit and is trained on binary labels. The previous "mse"
# looked like a leftover from a regression example and made this variant's
# training objective differ from the plain MaxWEnt run it is compared with.
mwe.compile(optimizer=tf.keras.optimizers.Adam(0.001), loss="bce")
mwe.fit(x_train, y_train, epochs=2500, verbose=0);

# Standard deviation of the SVD-variant MaxWEnt predictions over 50 samples,
# flattened to one value per evaluation point.
std_pred = mwe.predict_std(x_ood, batch_size=1000, clip=None, n_sample=50)
uncertainties = std_pred.ravel()

# Colour the evaluation points by that standard deviation.
ax = plot_classification_2d(x_train, y_train, x_ood)
ood_first, ood_second = x_ood[:, 0], x_ood[:, 1]
unc = ax.scatter(ood_first, ood_second, c=uncertainties, cmap="Blues")
plt.colorbar(unc, ax=ax, label='Uncertainty')
ax.legend(loc="upper right")
plt.show()

Table of Contents

2D Classification Example

Setup

Base Network

Deep Ensemble

Maximum Weight Entropy

Stochasticity

Objective Function

Training

Inference