# Loading the necessary packages
%load_ext autoreload
%autoreload 2
%matplotlib inline

import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import logging
from sklearn.utils import Bunch

# Draw a dotted grid on every axes by default.
plt.rcParams.update({'axes.grid': True, 'grid.linestyle': "dotted"})

# Disable the matplotlib loggers listed below and only report errors elsewhere.
for _logger_name in ('matplotlib.font_manager', 'matplotlib.ticker', 'matplotlib.colorbar'):
    logging.getLogger(_logger_name).disabled = True
logging.basicConfig(level=logging.ERROR)

from rto.models.williams_otto import WilliamsOttoReactor, WilliamsOttoReactorSimplified
from rto.optimization.optimizer import ModifierAdaptationOptimizer, ModelBasedOptimizer
from rto.optimization.bayesian import ModelBasedBayesianOptimizer
from rto.rto import RTOBayesian, RTO
from rto.adaptation.ma_gaussian_processes import MAGaussianProcesses
from rto.utils import generate_samples_uniform
from rto.experiment.analysis import ExperimentAnalyzer

# Path of the database handed to ExperimentAnalyzer further down.
DATABASE = "/mnt/d/rto_data/thesis-analysis-02.db"


# The complete reactor model plays the role of the "plant" ...
plant = WilliamsOttoReactor()
# ... and the simplified reactor is the uncertain "model".
model = WilliamsOttoReactorSimplified()
# Constraint limits (g0, g1) and the lower/upper input bounds.
g0, g1 = 0.12, 0.08
lbx, ubx = [3, 70], [6, 100]
g = np.array([g0, g1])


# Input domain used for every surface plot: a grid_size x grid_size mesh.
grid_size = 50

u1 = np.linspace(2.5, 5.5, num=grid_size)
u2 = np.linspace(70, 90, num=grid_size)
xx, yy = np.meshgrid(u1, u2)

def get_grid_values(model, xx, yy, noise=None):
    """Evaluate the objective and the first two constraints of *model* on a mesh.

    Args:
        model: object exposing ``get_objective(x, noise)`` and
            ``get_constraints(x, noise)``; ``x`` is one ``[u1, u2]`` grid point.
        xx, yy: coordinate arrays of identical shape (e.g. from ``np.meshgrid``).
        noise: forwarded unchanged to both model calls.

    Returns:
        Tuple ``(zz_cost, zz_g0, zz_g1)``, each reshaped to ``xx.shape``.
    """
    # One row per grid point: column 0 comes from xx, column 1 from yy.
    points = np.column_stack((xx.ravel(), yy.ravel()))

    # All objectives are evaluated first, then all constraints.
    objective_values = np.array([model.get_objective(point, noise) for point in points])
    constraint_values = np.array([model.get_constraints(point, noise) for point in points])

    # Fold the flat results back into the shape of the mesh.
    mesh_shape = xx.shape
    return (
        objective_values.reshape(mesh_shape),
        constraint_values[:, 0].reshape(mesh_shape),
        constraint_values[:, 1].reshape(mesh_shape),
    )

# Objective and constraint surfaces of the plant and of the model on the mesh.
z_plant, g0_plant, g1_plant = get_grid_values(plant, xx, yy)
z_model, g0_model, g1_model = get_grid_values(model, xx, yy)
# Boolean masks: True where both constraint values are below their limits.
g_plant = np.logical_and(g1_plant < g1, g0_plant < g0)
g_model = np.logical_and(g1_model < g1, g0_model < g0)


# Plot the decision surface
fig, ax = plt.subplots(nrows=1, ncols=3, figsize=(16, 6))
def plot_decision_surface(fig, ax, xx, yy, z_f, z_c, title, contour_type='contourf'):
    """Draw a surface on *ax* with an optional red contour overlay.

    Args:
        fig: figure on which the colorbar is created.
        ax: axes receiving the contours, axis labels and title.
        xx, yy: mesh coordinates.
        z_f: values for the red contour overlay; skipped when ``None``.
        z_c: values of the main surface (viridis colormap).
        title: axes title.
        contour_type: ``'contourf'`` draws filled contours; any other value
            draws contour lines.
    """
    # The overlay is drawn first, so the main surface is added after it.
    if z_f is not None:
        ax.contour(xx, yy, z_f, colors='red')

    draw_surface = ax.contourf if contour_type == 'contourf' else ax.contour
    surface = draw_surface(xx, yy, z_c, cmap='viridis')
    fig.colorbar(surface, ax=ax)

    for apply_text, text in ((ax.set_xlabel, 'Fa'), (ax.set_ylabel, 'Tr'), (ax.set_title, title)):
        apply_text(text)

# One panel each for the plant, the model and their cost difference; the
# mismatch panel has no feasibility overlay.
_panels = (
    (g_plant, z_plant, 'Plant'),
    (g_model, z_model, 'Model'),
    (None, z_plant - z_model, 'Mismatch'),
)
for _axis, (_mask, _surface, _label) in zip(ax, _panels):
    plot_decision_surface(fig, _axis, xx, yy, _mask, _surface, _label)

fig.show()


# Optimize the plant and the model with the same optimizer settings and no back-off.
_solver = {'name': 'de', 'params': {'strategy': 'best1bin'}}
optimizer = ModelBasedOptimizer(ub=ubx, lb=lbx, g=g, solver=_solver, backoff=0.0)

# run() returns three values; only the optimal cost and input are kept.
f_plant, u_plant, _ = optimizer.run(plant, [])
f_model, u_model, _ = optimizer.run(model, [])

print(f'Plant: u*={u_plant}, f*={f_plant}')
print(f'Model: u*={u_model}, f*={f_model}')

Plant: u*=[ 4.38993154 80.6407439 ], f*=-75.78782943843999
Model: u*=[ 4.79163832 83.18083659], f*=-26.13215920589414


fig, ax = plt.subplots(figsize=(8, 6))
# Plant objective evaluated at the input that is optimal for the model.
model_cost = plant.get_objective(u_model)

_title = f'Model: {model_cost:.2f}\nPlant: {f_plant:.2f}'
plot_decision_surface(fig, ax, xx, yy, g_plant, z_plant, _title)

# White star: plant optimum. White cross: model optimum.
for _point, _marker in ((u_plant, '*'), (u_model, 'x')):
    ax.scatter(_point[0], _point[1], c='w', marker=_marker, s=150, zorder=5)
fig.show()


# Load the MA-GP experiments (DE and SQP) from the database.
analyzer = ExperimentAnalyzer(DATABASE)
results_ma_de = analyzer.load('MA-GP-DE')
results_ma_sqp = analyzer.load('MA-GP-SQP')

# Pre-process each result set against the plant optimum (f_plant, u_plant).
results_processed_ma_de = analyzer.pre_process(results_ma_de, f_plant, u_plant)
results_processed_ma_sqp = analyzer.pre_process(results_ma_sqp, f_plant, u_plant)

results_ma_all = pd.concat([results_processed_ma_de, results_processed_ma_sqp], ignore_index=True)


# Raw strings keep the LaTeX backslashes literal; '\D', '\p' and '\%' are
# invalid escape sequences in a normal string and trigger a warning.
_ = analyzer.plot_by_iteration(results_ma_all, 'dPhi', r'$\Delta \phi$ (\%)', 'Cost optimality gap', style='run.status', hue='rto.type')
_ = analyzer.plot_by_iteration(results_ma_all, 'du', r'$\Delta u$ (\%)', 'Input optimality gap', style='run.status', hue='rto.type')


def plot_convergence_comparison_surface(results_1, results_2, title, legend, initial_data_size=5):
    """Overlay the input trajectories of two result sets on the plant surface.

    Args:
        results_1, results_2: result tables whose ``'u'`` column holds one
            input vector per row.
        title: title of the plot.
        legend: labels for the two trajectories, in the order (results_1, results_2).
        initial_data_size: number of leading rows treated separately; for
            ``results_1`` they are drawn as magenta diamonds, for
            ``results_2`` they are dropped (presumably the shared
            initialization data -- confirm against the experiment setup).
    """
    fig, ax = plt.subplots(figsize=(8, 6))
    plot_decision_surface(fig, ax, xx, yy, g_plant, z_plant, title)

    # Stack the per-row input vectors into (n_rows, n_inputs) arrays.
    inputs_1 = np.stack(results_1['u'], axis=0)
    inputs_2 = np.stack(results_2['u'], axis=0)

    leading_points = inputs_1[:initial_data_size, :]
    path_1 = inputs_1[initial_data_size:, :]
    path_2 = inputs_2[initial_data_size:, :]

    # White star marks the plant optimum.
    ax.scatter(u_plant[0], u_plant[1], c='w', marker='*', s=150, zorder=6)
    ax.plot(leading_points[:, 0], leading_points[:, 1], 'md', zorder=4)
    (first_line,) = ax.plot(path_1[:, 0], path_1[:, 1], 'ko-', zorder=4)
    (second_line,) = ax.plot(path_2[:, 0], path_2[:, 1], 'b.-', zorder=5)
    ax.legend((first_line, second_line), legend)

    fig.show()

# Input trajectories of MA-GP with the DE and SQP solvers.
plot_convergence_comparison_surface(results_processed_ma_de, results_processed_ma_sqp, 'RTO MA-GP', ('DE','SQP'))


# Load the '+noise' MA-GP experiments.
results_ma_de_noise = analyzer.load('MA-GP-DE+noise')
results_ma_sqp_noise = analyzer.load('MA-GP-SQP+noise')

results_processed_ma_de_noise = analyzer.pre_process(results_ma_de_noise, f_plant, u_plant)
results_processed_ma_sqp_noise = analyzer.pre_process(results_ma_sqp_noise, f_plant, u_plant)

results_ma_noise_all = pd.concat([results_processed_ma_de_noise, results_processed_ma_sqp_noise], ignore_index=True)


# Raw strings keep the LaTeX backslashes literal; '\D', '\p' and '\%' are
# invalid escape sequences in a normal string and trigger a warning.
_ = analyzer.plot_by_iteration(results_ma_noise_all, 'dPhi', r'$\Delta \phi$ (\%)', 'Cost optimality gap', style='run.status', hue='rto.type')
_ = analyzer.plot_by_iteration(results_ma_noise_all, 'du', r'$\Delta u$ (\%)', 'Input optimality gap', style='run.status', hue='rto.type')


# Load the '+noise-datasets' MA-GP experiments.
results_ma_de_noise_ds = analyzer.load('MA-GP-DE+noise-datasets')
results_ma_sqp_noise_ds = analyzer.load('MA-GP-SQP+noise-datasets')

results_processed_ma_de_noise_df = analyzer.pre_process(results_ma_de_noise_ds, f_plant, u_plant)
results_processed_ma_sqp_noise_df = analyzer.pre_process(results_ma_sqp_noise_ds, f_plant, u_plant)

results_ma_noise_datasets_all = pd.concat([results_processed_ma_de_noise_df, results_processed_ma_sqp_noise_df], ignore_index=True)


# Raw strings keep the LaTeX backslashes literal; '\D', '\p', '\%', '\P' and
# '\$' are invalid escape sequences in a normal string and trigger a warning.
_ = analyzer.plot_by_iteration(results_ma_noise_datasets_all, 'dPhi', r'$\Delta \phi$ (\%)', 'Cost optimality gap', style='run.status', hue='rto.type')
_ = analyzer.plot_by_iteration(results_ma_noise_datasets_all, 'du', r'$\Delta u$ (\%)', 'Input optimality gap', style='run.status', hue='rto.type')
_ = analyzer.plot_by_iteration(results_ma_noise_datasets_all, 'best_plant_objective', r'$\Phi (\$)$', 'Best objective', style='run.status', hue='rto.type')


# Load the Bayesian (EIC) experiments; the analyzer is re-created on the same
# database, exactly as in the original cell.
analyzer = ExperimentAnalyzer(DATABASE)
results_bay_de = analyzer.load('MA-GP-Bayesian-DE')
results_bay_sqp = analyzer.load('MA-GP-Bayesian-SQP')

results_processed_bay_de = analyzer.pre_process(results_bay_de, f_plant, u_plant)
results_processed_bay_sqp = analyzer.pre_process(results_bay_sqp, f_plant, u_plant)

results_bayes_all = pd.concat([results_processed_bay_de, results_processed_bay_sqp], ignore_index=True)


# Raw strings keep the LaTeX backslashes literal; '\D', '\p' and '\%' are
# invalid escape sequences in a normal string and trigger a warning.
_ = analyzer.plot_by_iteration(results_bayes_all, 'dPhi', r'$\Delta \phi$ (\%)', 'Cost optimality gap', style='run.status', hue='rto.type')
_ = analyzer.plot_by_iteration(results_bayes_all, 'du', r'$\Delta u$ (\%)', 'Input optimality gap', style='run.status', hue='rto.type')


# Constraint values per iteration.
_ = analyzer.plot_by_iteration(results_bayes_all, 'g_0', '$g_0$', 'Constraint 0', style='run.status', hue='rto.type')
_ = analyzer.plot_by_iteration(results_bayes_all, 'g_1', '$g_1$', 'Constraint 1', style='run.status', hue='rto.type')


# Compare the Bayesian-DE runs with the MA-GP-DE runs.
results_bayes_magp = pd.concat([results_processed_bay_de, results_processed_ma_de], ignore_index=True)

# Raw strings keep the LaTeX backslashes literal; '\D', '\p', '\%', '\P' and
# '\$' are invalid escape sequences in a normal string and trigger a warning.
_ = analyzer.plot_by_iteration(results_bayes_magp, 'dPhi', r'$\Delta \phi$ (\%)', 'Cost optimality gap', style='run.status', hue='rto.type')
_ = analyzer.plot_by_iteration(results_bayes_magp, 'du', r'$\Delta u$ (\%)', 'Input optimality gap', style='run.status', hue='rto.type')


# Constraint values per iteration.
_ = analyzer.plot_by_iteration(results_bayes_magp, 'g_0', '$g_0$', 'Constraint 0', style='run.status', hue='rto.type')
_ = analyzer.plot_by_iteration(results_bayes_magp, 'g_1', '$g_1$', 'Constraint 1', style='run.status', hue='rto.type')


# Input trajectories of both approaches on the plant surface.
plot_convergence_comparison_surface(results_processed_bay_de, results_processed_ma_de, 'RTO', ('Bayesian','MA-GP'))


_ = analyzer.plot_by_iteration(results_bayes_magp, 'best_plant_objective', r'$\Phi (\$)$', 'Best objective', style='run.status', hue='rto.type')


def get_grid_predictions(models, xx, yy, base_model=None):
    """Evaluate the GP-corrected objective and constraints on a mesh.

    For every grid point the value is the base model's output plus the
    prediction of the matching regressor in *models* at the scaled point.

    Each grid point is scaled once and the base model's constraints are
    evaluated once, instead of three transforms and two constraint
    evaluations per point. This assumes ``get_constraints`` and
    ``scaler.transform`` are deterministic -- confirm for the models in use.

    Args:
        models: mapping with the regressors ``'f'``, ``'g_0'``, ``'g_1'``
            (each exposing ``predict``) and the input scaler ``'gp_scaler'``
            (exposing ``transform``).
        xx, yy: coordinate arrays of identical shape (e.g. from ``np.meshgrid``).
        base_model: object exposing ``get_objective(x)`` and
            ``get_constraints(x)``. Defaults to the notebook-level ``model``.

    Returns:
        Tuple ``(zz_cost, zz_g0, zz_g1)``, each reshaped to ``xx.shape``.
    """
    if base_model is None:
        # Backward-compatible default: the notebook's global simplified model.
        base_model = model

    # unpack stuff
    fobj = models['f']
    scaler = models['gp_scaler']
    constraint0 = models['g_0']
    constraint1 = models['g_1']

    # One row per grid point: column 0 comes from xx, column 1 from yy.
    grid = np.column_stack((xx.ravel(), yy.ravel()))

    cost, g_0, g_1 = [], [], []
    for x in grid:
        # Scale the point once and share it between the three regressors.
        xs = scaler.transform(x.reshape(1, -1))
        # Evaluate the base model's constraints once and reuse both components.
        g_base = base_model.get_constraints(x)
        cost.append(base_model.get_objective(x) + fobj.predict(xs))
        g_0.append(g_base[0] + constraint0.predict(xs))
        g_1.append(g_base[1] + constraint1.predict(xs))

    # reshape the predictions back into a grid
    shape = xx.shape
    zz_cost = np.array(cost).reshape(shape)
    zz_g0 = np.array(g_0).reshape(shape)
    zz_g1 = np.array(g_1).reshape(shape)

    return zz_cost, zz_g0, zz_g1

def plot_gp_surface(fig, ax, xx, yy, z_f, title):
    """Draw contour lines of *z_f* on *ax*, with a colorbar, labels and title.

    Args:
        fig: figure on which the colorbar is created.
        ax: axes receiving the contour lines.
        xx, yy: mesh coordinates.
        z_f: values to contour.
        title: axes title.
    """
    contour_lines = ax.contour(xx, yy, z_f)
    fig.colorbar(contour_lines, ax=ax)

    for apply_text, text in ((ax.set_xlabel, 'Fa'), (ax.set_ylabel, 'Tr'), (ax.set_title, title)):
        apply_text(text)

def plot_gp_predictions(ax, i, gp_iterations, xx, yy, title, initial_data_size=5):
    """Plot the GP-corrected cost surface and feasibility overlay of one iteration.

    Args:
        ax: matplotlib axes to draw on.
        i: iteration index; ``initial_data_size`` is added to it before
            indexing ``gp_iterations``.
        gp_iterations: sequence of model dictionaries accepted by
            ``get_grid_predictions``.
        xx, yy: mesh coordinates.
        title: axes title.
        initial_data_size: offset added to ``i`` when indexing ``gp_iterations``.
    """
    f_gp, g0_gp, g1_gp = get_grid_predictions(gp_iterations[initial_data_size + i], xx, yy)
    # True where both corrected constraints are below the limits g0 and g1.
    g_gp = (g1_gp < g1) & (g0_gp < g0)
    # Use the figure that owns ``ax``; the previous code used whatever global
    # ``fig`` was defined last, which need not be the figure containing ``ax``.
    plot_decision_surface(ax.figure, ax, xx, yy, g_gp, f_gp, title)


def get_eic_grid(models, xx, yy, f_best):
    """Evaluate EI, the constraint probabilities and their product (EIC) on a mesh.

    Args:
        models: mapping with the regressors ``'f'``, ``'g_0'``, ``'g_1'``
            (``predict`` is called with ``return_std=True``) and the input
            scaler ``'gp_scaler'``.
        xx, yy: coordinate arrays of identical shape (e.g. from ``np.meshgrid``).
        f_best: value passed to ``ei_acquisition`` as the incumbent.

    Returns:
        Tuple ``(zz_ei, zz_g0, zz_g1, zz_eic)``, each reshaped to ``xx.shape``;
        ``zz_eic`` is EI times the product of the constraint probabilities.
    """
    # unpack the regressors and the input scaler
    objective_gp = models['f']
    input_scaler = models['gp_scaler']
    constraint0_gp = models['g_0']
    constraint1_gp = models['g_1']

    # One row per grid point: column 0 comes from xx, column 1 from yy.
    points = np.column_stack((xx.ravel(), yy.ravel()))

    # Per point: (EI, probability of g0, probability of g1, EIC)
    rows = []
    for point in points:
        scaled = input_scaler.transform(point.reshape(1, -1))
        model_obj = model.get_objective(point)
        model_g = model.get_constraints(point)

        # Modifiers are ordered objective, constraint 0, constraint 1.
        modifiers = [
            gp.predict(scaled, return_std=True)
            for gp in (objective_gp, constraint0_gp, constraint1_gp)
        ]
        adaptation = Bunch(modifiers=modifiers)

        ei_value = ModelBasedBayesianOptimizer.ei_acquisition(model_obj, adaptation, f_best)
        feasibility = ModelBasedBayesianOptimizer.constraint_probability(g, model_g, adaptation)
        rows.append((ei_value, feasibility[0], feasibility[1], ei_value * np.prod(feasibility)))

    # reshape each column of results back into a grid
    mesh_shape = xx.shape
    zz_ei = np.array([row[0] for row in rows]).reshape(mesh_shape)
    zz_g0 = np.array([row[1] for row in rows]).reshape(mesh_shape)
    zz_g1 = np.array([row[2] for row in rows]).reshape(mesh_shape)
    zz_eic = np.array([row[3] for row in rows]).reshape(mesh_shape)

    return zz_ei, zz_g0, zz_g1, zz_eic

def plot_eic_grid(ax, i, best_solutions, gp_iterations, xx, yy, initial_data_size=5):
    """Plot EI, the joint constraint probability and EIC on three axes.

    Args:
        ax: indexable collection holding at least three matplotlib axes.
        i: iteration index; ``initial_data_size`` is added to it before
            indexing ``best_solutions`` and ``gp_iterations``.
        best_solutions: pandas object indexed with ``.iloc`` that provides
            the incumbent objective value.
        gp_iterations: sequence of model dictionaries accepted by ``get_eic_grid``.
        xx, yy: mesh coordinates.
        initial_data_size: offset added to ``i``.
    """
    row = initial_data_size + i
    fbest = best_solutions.iloc[row]
    ei, g0_prob, g1_prob, eic = get_eic_grid(gp_iterations[row], xx, yy, fbest)

    panels = (
        (ei, 'EI'),
        (g1_prob * g0_prob, '$Pr(G(x) <= g)$'),
        (eic, 'EIC'),
    )
    for k, (surface, title) in enumerate(panels):
        axis = ax[k]
        # Use the figure that owns the axes; the previous code used whatever
        # global ``fig`` was defined last, so the colorbar was requested on a
        # figure other than the one created by the caller.
        plot_decision_surface(axis.figure, axis, xx, yy, None, surface, title)

def plot_eic(i, results, gp_iterations, xx, yy, initial_data_size=5):
    """Plot the EIC surface of one iteration on a new figure.

    Args:
        i: iteration index; ``initial_data_size`` is added to it before
            indexing ``results`` and ``gp_iterations``.
        results: table with the columns ``'best_plant_objective'`` and ``'u_opt'``.
        gp_iterations: sequence of model dictionaries accepted by ``get_eic_grid``.
        xx, yy: mesh coordinates.
        initial_data_size: offset added to ``i``.

    Returns:
        The created ``(fig, ax)`` pair.
    """
    row = initial_data_size + i
    fig, ax = plt.subplots(figsize=(10, 8))

    incumbent = results['best_plant_objective'].iloc[row]
    _ei, _g0_prob, _g1_prob, eic_surface = get_eic_grid(gp_iterations[row], xx, yy, incumbent)
    plot_decision_surface(fig, ax, xx, yy, None, eic_surface, 'EIC')

    # Red star: plant optimum. Red cross: the 'u_opt' entry of this row.
    ax.scatter(u_plant[0], u_plant[1], c='r', marker='*', s=150, zorder=6)
    u_eic = results['u_opt'].iloc[row]
    ax.scatter(u_eic[0], u_eic[1], c='r', marker='x', s=150, zorder=6)
    return fig, ax

def plot_eic_iterations(iterations, results, gp_models, initial_data_size=5):
    """Create one three-panel EI / probability / EIC figure per iteration.

    Args:
        iterations: iterable of iteration indices to plot.
        results: table with the columns ``'best_plant_objective'`` and ``'u_opt'``.
        gp_models: sequence of model dictionaries, forwarded to ``plot_eic_grid``.
        initial_data_size: offset added to every iteration index. It is now
            forwarded to ``plot_eic_grid`` as well, so the surfaces and the
            ``u_opt`` marker always refer to the same row.
    """
    for itertrain in iterations:
        fig, ax = plt.subplots(1, 3, figsize=(20, 6))
        plot_eic_grid(
            ax, itertrain, results['best_plant_objective'], gp_models, xx, yy,
            initial_data_size=initial_data_size,
        )

        u_eic = results['u_opt'].iloc[initial_data_size + itertrain]

        # Red star: plant optimum, drawn on all three panels.
        for axis in (ax[0], ax[1], ax[2]):
            axis.scatter(u_plant[0], u_plant[1], c='r', marker='*', s=150, zorder=6)

        # Red cross: the 'u_opt' entry, drawn on the probability and EIC panels only.
        for axis in (ax[1], ax[2]):
            axis.scatter(u_eic[0], u_eic[1], c='r', marker='x', s=150, zorder=6)

        fig.suptitle(f'Iteration: {itertrain}')
        fig.show()


# Load the stored models for every row of the processed Bayesian results.
gp_results_bay_de = list(map(analyzer.load_run_models, results_processed_bay_de['run.id']))
gp_results_bay_sqp = list(map(analyzer.load_run_models, results_processed_bay_sqp['run.id']))


# EI / probability / EIC panels for the first iteration.
plot_eic_iterations([0], results_processed_bay_de, gp_results_bay_de)


# zoom into the EIC function
u1_eic = np.linspace(4.2, 5.2, num=grid_size)
u2_eic = np.linspace(79, 84, num=grid_size)
xx_eic, yy_eic = np.meshgrid(u1_eic, u2_eic)

fig_eic, ax_eic = plot_eic(0, results_processed_bay_de, gp_results_bay_de, xx_eic, yy_eic)


# Same plots for a selection of later iterations.
iterations = [8, 10, 12, 14, 16]
plot_eic_iterations(iterations, results_processed_bay_de, gp_results_bay_de)


# Zoomed EIC surface for each selected iteration.
for it in iterations:
    plot_eic(it, results_processed_bay_de, gp_results_bay_de, xx_eic, yy_eic)


# Load the Bayesian '+noise-datasets' experiment and compare it with the
# matching MA-GP-DE results.
results_bay_datasets = analyzer.load('MA-GP-Bayesian-DE+noise-datasets')
results_bay_processed_datasets = analyzer.pre_process(results_bay_datasets, f_plant, u_plant)

results_bayes_magp_datasets = pd.concat([results_processed_ma_de_noise_df, results_bay_processed_datasets], ignore_index=True)

# Raw strings keep the LaTeX backslashes literal; '\D', '\p', '\%', '\P' and
# '\$' are invalid escape sequences in a normal string and trigger a warning.
_ = analyzer.plot_by_iteration(results_bayes_magp_datasets, 'dPhi', r'$\Delta \phi$ (\%)', 'Cost optimality gap', style='run.status', hue='rto.type')
_ = analyzer.plot_by_iteration(results_bayes_magp_datasets, 'du', r'$\Delta u$ (\%)', 'Input optimality gap', style='run.status', hue='rto.type')
_ = analyzer.plot_by_iteration(results_bayes_magp_datasets, 'best_plant_objective', r'$\Phi (\$)$', 'Best objective', style='run.status', hue='rto.type')

Real-Time Optimization

Modifier Adaptation with Bayesian Optimization using EIC acquisition

Preliminary thesis results

Problem Description

Analysis

Real-Time Optimization

Modifier Adaptation with Gaussian Processes

Effect of Noise

Using different initial data points

EIC acquisition function

Optimizer Choice

Comparison with MA-GP

Investigating the EIC decision surface

First iteration

Effect of initialization point EIC

Conclusion