control_simulation.py


import torch
import configparser
import control
from dataSettings import get_denormalized_dic, get_normalized_dic
from customModels import IanRNN, HiroLRAN, HiroLRANReLU, HiroLRANDiag
from train_helpers import get_state_mask, get_sample_time_state_mask, masked_loss
import numpy as np
from scipy.sparse import csr_matrix
import customDatasetMakers
import matplotlib.pyplot as plt
import prediction_helpers
import osqp
import scipy as sp
from scipy import sparse
from prediction_helpers import get_ml_truth, get_ml_profile_warmup, get_ml_actuator_trajectory, get_ml_predictions, get_considered_models, get_fast_profile_prediction


lstm_model_name = 'HiroLRAN_ne_noGas_all'
#lstm_model_name = 'HiroLRAN_alldiiid'
linear_model_name = lstm_model_name

config_filename = f'/projects/EKOLEMEN/profile_predictor/joe_hiro_models/{lstm_model_name}config'
config=configparser.ConfigParser()
config.read(config_filename)
output_filename_base=config['model']['output_filename_base']
profiles=config['inputs']['profiles'].split()
actuators=config['inputs']['actuators'].split()
parameters=config['inputs'].get('parameters','').split()
calculations=config['inputs'].get('calculations','').split()
linear_config_filename = f'/projects/EKOLEMEN/profile_predictor/joe_hiro_models/{linear_model_name}config'
config_linear=configparser.ConfigParser()
config_linear.read(linear_config_filename)
controller_actuators = config_linear['inputs']['actuators'].split()
controller_profiles = config_linear['inputs']['profiles'].split()
controller_parameters = config_linear['inputs']['parameters'].split()
latent_dim = int(config_linear['HiroLRAN']['latent_dim'])
data_filename = config['preprocess']['preprocessed_data_filenamebase'] + 'val.pkl'

lstm_model = prediction_helpers.get_considered_models(config_filename, ensemble=False)[0]

linear_model = prediction_helpers.get_considered_models(linear_config_filename, ensemble=False)[0]

x_test, y_test, shots, times =customDatasetMakers.ian_dataset(data_filename,profiles,parameters,calculations,actuators,sort_by_size=True)
shot_index = 55
wanted_sample = x_test[shot_index]
nwarmup = 3
starting_index = 0
end_index = len(wanted_sample) - nwarmup

N = 10 # prediction horizon
nsim = 100 # number of simulated timesteps

# get the simulator indices of the states and actuators that I want to control
future_controller_indices = [len(profiles)*33 + len(parameters) + len(actuators) + actuators.index(controller_actuators[i]) for i in range(len(controller_actuators))]
current_controller_indices = [len(profiles)*33 + len(parameters) + actuators.index(controller_actuators[i]) for i in range(len(controller_actuators))]
initial_state_index_list = [profiles.index(profiles[i]) for i in range(len(controller_profiles))]
state_indices = [num * 33 + i for num in initial_state_index_list for i in range(33)]
parameter_indices = [len(profiles)*33 + parameters.index(controller_parameters[i]) for i in range(len(controller_parameters))]
state_indices = state_indices + parameter_indices
# the state that I alter throughout the simulation
simulated_state = wanted_sample[starting_index:end_index, :].clone()
simulated_state = torch.unsqueeze(simulated_state, 0).float()
simulated_z_t = linear_model.encoder(simulated_state[:,nwarmup,state_indices].clone()).detach().numpy()

# set target state as experimental state
target_params = wanted_sample[starting_index:end_index, state_indices].clone() 
target_params = torch.unsqueeze(target_params, 0).float()
#target_params = target_params * 0 + 3
target_z_t = linear_model.encoder(target_params).detach().numpy()

# normalize Q!!!
Q_weights = np.ones(latent_dim)
Q = np.eye(latent_dim)
for i in range(latent_dim):
    Q[i,i] = Q_weights[i]
Q = csr_matrix(Q)

QN = Q
R_array = np.eye(len(controller_actuators))*0.1

# normalize R to max values of actuators
#R_array[3][3] = 0.00001
#R_array[4][4] = 0.00001

#R_array[controller_actuators.index('D_tot'), con#troller_actuators.index('D_tot')] = 1
R = csr_matrix(R_array)

# - linear constraints (# bmspinj, bmstinj, ip, pcbcoil, dstdenp, ech_pwr_tot)
#umin = np.array([4/2, 2/2, 0, 0, 4/2, 0])
#umax = np.array([10/2, 4/2, 1, 1, 8/2, 3])
#umin = np.array([-2/2])
#umax = np.array([10/2])


umin = np.array([-np.inf]*len(controller_actuators))
umax = np.array([np.inf]*len(controller_actuators))
#umin[2] = -1
#umin[4] = 0
xmin = np.array([-np.inf]*latent_dim)
xmax = np.array([np.inf]*latent_dim)

# set actuators that I don't want to control
blocked_actuators = ['ip','PCBCOIL']

for actuator in blocked_actuators:
    true_value = wanted_sample[starting_index+nwarmup, current_controller_indices[controller_actuators.index(actuator)]].clone().item()
    umin[controller_actuators.index(actuator)] = true_value
    umax[controller_actuators.index(actuator)] = true_value

#Ad = sparse.csc_matrix(linear_model.A.weight.data)
Ad = sparse.csc_matrix(torch.diag(linear_model.A.diagonal.data))
Bd = sparse.csc_matrix(linear_model.B.weight.data)
[nx, nu] = Bd.shape

q = np.hstack([np.kron(np.ones(N), -Q@(target_z_t[0,nwarmup,:])), -QN@(target_z_t[0,nwarmup,:]), np.zeros(N*nu)])
P = sparse.block_diag([sparse.kron(sparse.eye(N), Q), QN,
                       sparse.kron(sparse.eye(N), R)], format='csc')
Ax = sparse.kron(sparse.eye(N+1),-sparse.eye(nx)) + sparse.kron(sparse.eye(N+1, k=-1), Ad)
Bu = sparse.kron(sparse.vstack([sparse.csc_matrix((1, N)), sparse.eye(N)]), Bd)
Aeq = sparse.hstack([Ax, Bu])
leq = np.hstack([-simulated_z_t[0], np.zeros(N*nx)])
ueq = leq
Aineq = sparse.eye((N+1)*nx + N*nu)
lineq = np.hstack([np.kron(np.ones(N+1), xmin), np.kron(np.ones(N), umin)])
uineq = np.hstack([np.kron(np.ones(N+1), xmax), np.kron(np.ones(N), umax)])
A = sparse.vstack([Aeq, Aineq], format='csc')
l = np.hstack([leq, lineq])
u = np.hstack([ueq, uineq])

prob = osqp.OSQP()
prob.setup(P, q, A, l, u, warm_start=True, max_iter=10000)

latent_trajectory = []

for i in range(nsim):
    # Solve
    res = prob.solve()

    # Check solver status
    if res.info.status != 'solved':
        raise ValueError('OSQP did not solve the problem!')
    
    ctrl = torch.tensor(res.x[-N*nu:-(N-1)*nu]).float()
    print(ctrl)
    #x=res.x
    #obj_val = 0.5 * np.dot(x, P.dot(x)) + np.dot(q, x)
    #print(f'obj')
    #print(obj_val)
    #print(res.x)

    # change future actuator, and the current actuator of future timestep
    simulated_state[0,nwarmup+i-1,future_controller_indices] = ctrl
    simulated_state[0, nwarmup+i, current_controller_indices] = ctrl
    predicted_state = prediction_helpers.get_fast_profile_prediction(simulated_state[:,:nwarmup + i, :], lstm_model)
    if nwarmup + i < len(wanted_sample): # if I'm not at the end of the simulation
        simulated_state[:, nwarmup + i, 0:len(profiles)*33 + len(parameters)] = predicted_state

    predicted_z_t = linear_model.encoder(predicted_state[:, :, state_indices]).detach().numpy()
    latent_trajectory.append(predicted_z_t)

    # Update limits for blocked actuators
    for actuator in blocked_actuators:
        true_value = wanted_sample[starting_index+i+nwarmup, future_controller_indices[controller_actuators.index(actuator)]].clone().item()
        umin[controller_actuators.index(actuator)] = true_value
        umax[controller_actuators.index(actuator)] = true_value

    lineq = np.hstack([np.kron(np.ones(N+1), xmin), np.kron(np.ones(N), umin)])
    uineq = np.hstack([np.kron(np.ones(N+1), xmax), np.kron(np.ones(N), umax)])
    l = np.hstack([leq, lineq])
    u = np.hstack([ueq, uineq])

    l[:nx] = -predicted_z_t
    u[:nx] = -predicted_z_t

    # Update targets

    q = np.hstack([np.kron(np.ones(N), -Q@(target_z_t[0,nwarmup + i,:])), -QN@(target_z_t[0,nwarmup + i,:]), np.zeros(N*nu)])
    
    prob.update(l=l, u=u, q=q)
    print(f'timestep {i} done')

output_dict = {
    'real': {},
    'controlled': {}
}

prediction_length = end_index - starting_index - nwarmup
# got to input the correct times here
true_actuator_trajectory = get_ml_actuator_trajectory(x_test[shot_index:shot_index+1][starting_index:end_index], profiles, parameters, calculations, actuators, nwarmup=nwarmup, prediction_length=prediction_length) # nwarmup and full prediction actuators
true_warmup_profiles, true_warmup_parameters = get_ml_profile_warmup(x_test[shot_index:shot_index+1][starting_index:end_index], profiles, parameters, calculations, actuators, recorded_profiles=profiles, recorded_parameters=parameters, nwarmup=nwarmup) 
true_profiles, true_parameters = get_ml_truth(target_params, profiles, parameters, calculations, nwarmup=nwarmup, prediction_length=prediction_length) # get true state at t+1

controlled_actuator_trajectory = get_ml_actuator_trajectory(simulated_state, profiles, parameters, calculations, actuators, nwarmup=nwarmup, prediction_length=prediction_length)
controlled_warmup_profiles, controlled_warmup_parameters = get_ml_profile_warmup(simulated_state, profiles, parameters, calculations, actuators, recorded_profiles=profiles, recorded_parameters=parameters, nwarmup=nwarmup)
controlled_profiles, controlled_parameters = get_ml_truth(simulated_state, profiles, parameters, calculations, nwarmup=nwarmup, prediction_length=prediction_length)

combined_true_profiles = np.concatenate((true_warmup_profiles, true_profiles), axis=2)
combined_controlled_profiles = np.concatenate((controlled_warmup_profiles, controlled_profiles), axis=2)
combined_true_params = np.concatenate((true_warmup_parameters, true_parameters), axis=2)
combined_predicted_params = np.concatenate((controlled_warmup_parameters, controlled_parameters), axis=2)

output_dict['real']['profiles'] = combined_true_profiles
output_dict['real']['parameters'] = combined_true_params
output_dict['real']['actuators'] = true_actuator_trajectory
output_dict['controlled']['profiles'] = combined_controlled_profiles
output_dict['controlled']['parameters'] = combined_predicted_params
output_dict['controlled']['actuators'] = controlled_actuator_trajectory
output_dict['time'] = np.arange(len(true_actuator_trajectory[0,0,:]))*20

import pickle
with open(f'control_pickles/{lstm_model_name}{linear_model_name}{shot_index}.pkl', 'wb') as file:
    # Pickle the array and write it to the file
    pickle.dump(output_dict, file)

'''controlled_dict = customDatasetMakers.state_to_dic(controlled_state, profiles, parameters, actuators=actuators)
controlled_denormed_dict = get_denormalized_dic(controlled_dict)

real_state = wanted_sample[starting_index + nwarmup + 1:end_index,:].clone()
real_dict = customDatasetMakers.state_to_dic(real_state, profiles, parameters, actuators=actuators)
real_denormed_dict = get_denormalized_dic(real_dict)

output_dict['real'] = real_denormed_dict
output_dict['controlled'] = controlled_denormed_dict
output_dict['latent'] = np.array(latent_trajectory)

import pickle
with open(f'control_pickles/{lstm_model_name}{linear_model_name}{shot_index}.pkl', 'wb') as file:
    # Pickle the array and write it to the file
    pickle.dump(output_dict, file)
'''