mtbo_planner.py

#!/usr/bin/env python

import os, sys
import pickle
import numpy as np

from sklearn.preprocessing import StandardScaler

import torch
import gpytorch
from botorch.models import SingleTaskGP
from botorch.models import MixedSingleTaskGP

from gpytorch.kernels import ScaleKernel
from botorch.models.kernels.categorical import CategoricalKernel

from botorch.fit import fit_gpytorch_model
from botorch.optim import optimize_acqf, optimize_acqf_mixed, optimize_acqf_discrete
from botorch.acquisition import ExpectedImprovement

from olympus.planners import CustomPlanner, AbstractPlanner
from olympus import ParameterVector

from botorch.models.gpytorch import GPyTorchModel
from gpytorch.distributions import MultivariateNormal
from gpytorch.means import ConstantMean
from gpytorch.models import ExactGP
from gpytorch.kernels import RBFKernel, ScaleKernel, MaternKernel
from gpytorch.likelihoods import GaussianLikelihood
from gpytorch.mlls import ExactMarginalLogLikelihood

from botorch.models import MultiTaskGP


from utils import (
	cat_param_to_feat,
	propose_randomly,
	forward_transform,
	reverse_transform,
	infer_problem_type,
	project_to_olymp,
	create_available_options,
	get_bounds,
)


class CategoricalSingleTaskGP(ExactGP, GPyTorchModel):

	_num_outputs = 1

	def __init__(self, train_X, train_Y):
		''' Single task GP with a categorical kernel based on the Hamming distance

		Note: this kernel is NOT differentiable with respect to the inputs
		'''
		# squeeze output dim before passing train_Y to ExactGP
		super().__init__(train_X, train_Y.squeeze(-1), GaussianLikelihood())
		self.mean_module = ConstantMean()
		self.covar_module = ScaleKernel(
			base_kernel = CategoricalKernel(
				ard_num_dims=train_Y.shape[-1] # ARD for all categorical dimensions
			)
		)
		self.to(train_X)

	def forward(self, x):
		mean_x = self.mean_module(x)
		covar_x = self.covar_module(x)
		return MultivariateNormal(mean_x, covar_x)


class MultiTaskBO(CustomPlanner):
	''' Wrapper for mutitask Bayesian optimization using a multitask
	GP as the surrogate model.

	Args:
		goal (str): the optimization goal, "maximize", or "minimize"
		batch_size (int): number of samples to measure per batch (will be fixed at 1 for now)
		random_seed (int): the random seed to use
		num_init_design (int):  number of points to sample using the initial design strategy
		init_design_strategy (str): the inital design strategy, "random" or "sobol"
		tasks (list): list of dictionaries containing the tasks, dictionaties have
			strucure {'params': [...], 'values': [...]} where the values are 2d numpy
			arrays

	'''

	def __init__(
		self,
		goal='minimize',
		batch_size=1,
		random_seed=None,
		num_init_design=5,
		init_design_strategy='random',
		tasks=None,
		**kwargs,
	):
		AbstractPlanner.__init__(**locals())
		self.goal = goal
		self.batch_size = batch_size
		if random_seed is None:
			self.random_seed = np.random.randint(0, int(10e6))
		else:
			self.random_seed = random_seed
		np.random.seed(self.random_seed)
		self.num_init_design = num_init_design
		self.init_design_strategy = init_design_strategy
		self.tasks = tasks

		#>>>>>>>>
		# add the task id to the list of task dictionaries as
		# the task features
		for idx, task in enumerate(self.tasks):
			task['task_idx'] = idx+1.
		#<<<<<<<<


	def _set_param_space(self, param_space):
		''' set the Olympus parameter space (not actually really needed)
		'''
		# make attribute that indicates wether or not we are using descriptors for
		# categorical variables
		descriptors = []
		for p in self.param_space:
			descriptors.extend(p.descriptors)
		if all(d is None for d in descriptors):
			self.has_descriptors = False
		else:
			self.has_descriptors = True

	def build_train_data(self):
		''' build the training dataset at each iteration
		'''
		target_params = []
		target_values = []
		# adapt the target task params first --> change the categorical params to ohe
		for sample_ix, (targ_param, targ_value) in enumerate(zip(self._params, self._values)):
			sample_x = []
			for param_ix, (space_true, element) in enumerate(zip(self.param_space, targ_param)):
				if self.param_space[param_ix].type == 'categorical':
					feat = cat_param_to_feat(space_true, element)
					sample_x.extend(feat)
				else:
					sample_x.append(float(element))
			target_params.append(sample_x)
			target_values.append(targ_value)
		train_x = np.array(target_params)  # (# target obs, # param dim)
		train_y = np.array(target_values)  # (# target obs, 1)

		#>>>>>>>>
		target_task = {'params': train_x, 'values': train_y, 'task_idx': 0.0}
		all_tasks = self.tasks+[target_task]

		# concatenate together all of the tasks params and task idx

		train_x = []
		for task in all_tasks:
			idx = np.repeat(task['task_idx'], task['params'].shape[0]).reshape(-1, 1)
			params_w_idx = np.concatenate((task['params'], idx), axis=1)
			train_x.append(params_w_idx)
		train_x = np.concatenate(train_x)

		# concatenate together all of the tasks values (no task features needed)
		train_y = np.concatenate([task['values'] for task in all_tasks])

		#<<<<<<<<

		self._means_y = np.array([np.mean(train_y[:, ix]) for ix in range(train_y.shape[1])])
		# guard against the case where we have std = 0.0
		self._stds_y = np.array([np.std(train_y[:, ix]) for ix in range(train_y.shape[1])])
		self._stds_y = np.where(self._stds_y==0.0, 1., self._stds_y)

		# forward transform (standardization)
		train_y = forward_transform(train_y, self._means_y, self._stds_y)

		# convert to torch tensors and return
		return torch.tensor(train_x).double(), torch.tensor(train_y).double()


	def _tell(self, observations):
		''' unpack the current observations from Olympus

		Args:
			observations (obj): observations from Olympus
		'''
		self._params = observations.get_params() # string encodings of categorical params
		self._values = observations.get_values(as_array=True, opposite=self.flip_measurements)
		# make values 2d if they are not already
		if len(np.array(self._values).shape)==1:
			self._values = np.array(self._values).reshape(-1, 1)


	def _ask(self):

		# infer the problem type
		problem_type = infer_problem_type(self.param_space)

		if len(self._values) < self.num_init_design:
			# sample using initial design strategy
			sample, raw_sample = propose_randomly(1, self.param_space)
			return_params = ParameterVector().from_array(raw_sample[0], self.param_space)

		else:
			# use GP surrogate to propose the samples
			# get the scaled parameters and values
			self.train_x_scaled, self.train_y_scaled = self.build_train_data()

			# infer the model based on the parameter types
			if problem_type == 'fully_continuous':
				model = SingleTaskGP(self.train_x_scaled, self.train_y_scaled)
			elif problem_type == 'mixed':
				# TODO: implement a method to retrieve the categorical dimensions
				model = MixedSingleTaskGP(self.train_x_scaled, self.train_y_scaled, cat_dims=None)
			elif problem_type == 'fully_categorical':

				#>>>>>>>>
				model = MultiTaskGP(
					self.train_x_scaled,
					self.train_y_scaled,
					task_feature=-1,  # the index of the task feature (last inedx here)
					output_tasks=[0], # a list of task indices to compute the output
				)
				#<<<<<<<<


			# fit the GP
			mll = ExactMarginalLogLikelihood(model.likelihood, model)
			fit_gpytorch_model(mll)

			# get the incumbent point
			#>>>>>>>>
			f_best_argmin = torch.argmin(self.train_y_scaled[-self._values.shape[0]:])
			f_best_scaled = self.train_y_scaled[f_best_argmin][0].float()
			#>>>>>>>>
			#f_best_raw    = self._values[f_best_argmin][0]

			acqf = ExpectedImprovement(model, f_best_scaled, objective=None, maximize=False) # always minimization in Olympus

			bounds = get_bounds(self.param_space, self.has_descriptors)
			choices_feat, choices_cat = None, None

			if problem_type == 'fully_continuous':
				results, _ = optimize_acqf(
					acq_function=acqf,
					bounds=bounds,
					num_restarts=200,
					q=self.batch_size,
					raw_samples=1000
				)
			elif problem_type == 'mixed':
				results, _ = optimize_acqf_mixed(
					acq_function=acqf,
					bounds=bounds,
					num_restarts=200,
					q=self.batch_size,
					raw_samples=1000
				)
			elif problem_type == 'fully_categorical':
				# need to implement the choices input, which is a
				# (num_choices * d) torch.Tensor of the possible choices
				# need to generate fully cartesian product space of possible
				# choices
				choices_feat, choices_cat = create_available_options(self.param_space, self._params)

				results, _ = optimize_acqf_discrete(
					acq_function=acqf,
					q=self.batch_size,
					max_batch_size=1000,
					choices=choices_feat,
					unique=True
				)

			# convert the results form torch tensor to numpy
			results_np = np.squeeze(results.detach().numpy())
			# project the sample back to Olympus format
			sample = project_to_olymp(
				results_np, self.param_space,
				has_descriptors=self.has_descriptors,
				choices_feat=choices_feat, choices_cat=choices_cat,
			)
			return_params = [ParameterVector().from_dict(sample, self.param_space)]

		return return_params


#============
# DEBUGGING
#============

if __name__ == '__main__':

	from olympus.objects import (
		ParameterContinuous,
		ParameterDiscrete,
		ParameterCategorical,
	)
	from olympus.campaigns import Campaign, ParameterSpace
	from olympus.surfaces import Surface

	PARAM_TYPE = 'perovskites_descriptors'

	if PARAM_TYPE == 'continuous':
		pass

	elif PARAM_TYPE == 'perovskites':
		# load in the perovskites dataset
		lookup_df = pickle.load(open('datasets_emulators/perovskites/perovskites.pkl', 'rb'))

		# make a function for measuring the perovskite bandgap
		def measure(param):
			''' lookup the HSEO6 bandgap for given perovskite component
			'''
			match = lookup_df.loc[
							(lookup_df.organic == param['organic']) &
							(lookup_df.anion == param['anion']) &
							(lookup_df.cation == param['cation'])
						]
			assert len(match)==1
			bandgap = match.loc[:, 'hse06'].to_numpy()[0]
			return bandgap

		#>>>>>>>>
		def sample_tasks(num_points, param_space, random_state=None):
			'''  sample some GGA level bandgap measurements
			'''
			samples = lookup_df.sample(
				n=num_points, replace=False, random_state=random_state,
			)
			param_str = samples[['organic', 'anion', 'cation']].values
			params = []
			for sample_ix, targ_param in enumerate(param_str):
				sample_x = []
				for param_ix, (space_true, element) in enumerate(zip(param_space, targ_param)):
					feat = cat_param_to_feat(space_true, element)
					sample_x.extend(feat)

				params.append(sample_x)
			params = torch.tensor(np.array(params))
			values = torch.tensor(samples['gga'].values.reshape(-1, 1))

			return [{'params': params, 'values': values}]
		#<<<<<<<<

		# build the experiment
		organic_options = lookup_df.organic.unique().tolist()
		anion_options = lookup_df.anion.unique().tolist()
		cation_options = lookup_df.cation.unique().tolist()

		# make the parameter space
		param_space = ParameterSpace()

		organic_param = ParameterCategorical(
			name='organic',
			options=organic_options,
			descriptors=[None for _ in organic_options],
		)
		param_space.add(organic_param)

		anion_param = ParameterCategorical(
			name='anion',
			options=anion_options,
			descriptors=[None for _ in anion_options],
		)
		param_space.add(anion_param)

		cation_param = ParameterCategorical(
			name='cation',
			options=cation_options,
			descriptors=[None for _ in cation_options],
		)
		param_space.add(cation_param)

		#>>>>>>>>
		# sample some low-fidelity points
		gga_tasks = sample_tasks(num_points=50, param_space=param_space, random_state=100700)
		planner = MultiTaskBO(
			goal='minimize', tasks=gga_tasks
		)
		planner.set_param_space(param_space)
		#<<<<<<<<

		campaign = Campaign()
		campaign.set_param_space(param_space)

		BUDGET = 192

		OPT = ['hydrazinium', 'I', 'Sn'] # value = 1.5249 eV

		for iter in range(BUDGET):
			samples = planner.recommend(campaign.observations)
			measurement = measure(samples[0])
			print(f'ITER : {iter}\tSAMPLES : {samples}\t MEASUREMENT : {measurement}')
			campaign.add_observation(samples[0], measurement)

			# check for convergence
			if [samples[0]['organic'], samples[0]['anion'], samples[0]['cation']] == OPT:
				print(f'FOUND OPTIMUM AFTER {iter+1} ITERATIONS!')
				break


	elif PARAM_TYPE == 'perovskites_descriptors':
		# load in the perovskites dataset
		lookup_df = pickle.load(open('datasets_emulators/perovskites/perovskites.pkl', 'rb'))

		# make a function for measuring the perovskite bandgap
		def measure(param):
			''' lookup the HSEO6 bandgap for given perovskite component
			'''
			match = lookup_df.loc[
							(lookup_df.organic == param['organic']) &
							(lookup_df.anion == param['anion']) &
							(lookup_df.cation == param['cation'])
						]
			assert len(match)==1
			bandgap = match.loc[:, 'hse06'].to_numpy()[0]
			return bandgap

		#>>>>>>>>
		def sample_tasks(num_points, param_space, random_state=None):
			'''  sample some GGA level bandgap measurements
			'''
			samples = lookup_df.sample(
				n=num_points, replace=False, random_state=random_state,
			)
			param_str = samples[['organic', 'anion', 'cation']].values
			params = []
			for sample_ix, targ_param in enumerate(param_str):
				sample_x = []
				for param_ix, (space_true, element) in enumerate(zip(param_space, targ_param)):
					feat = cat_param_to_feat(space_true, element)
					sample_x.extend(feat)
				params.append(sample_x)
			params = torch.tensor(np.array(params))
			values = torch.tensor(samples['gga'].values.reshape(-1, 1))

			return [{'params': params, 'values': values}]
		#<<<<<<<<

		def get_descriptors(element, kind):
			''' retrive the descriptors for a given element
			'''
			return lookup_df.loc[(lookup_df[kind]==element)].loc[:, lookup_df.columns.str.startswith(f'{kind}-')].values[0].tolist()


		# build the experiment
		organic_options = lookup_df.organic.unique().tolist()
		anion_options = lookup_df.anion.unique().tolist()
		cation_options = lookup_df.cation.unique().tolist()

		# make the parameter space
		param_space = ParameterSpace()

		organic_param = ParameterCategorical(
			name='organic',
			options=organic_options,
			descriptors=[get_descriptors(option, 'organic') for option in organic_options],
		)
		param_space.add(organic_param)

		anion_param = ParameterCategorical(
			name='anion',
			options=anion_options,
			descriptors=[get_descriptors(option, 'anion') for option in anion_options],
		)
		param_space.add(anion_param)

		cation_param = ParameterCategorical(
			name='cation',
			options=cation_options,
			descriptors=[get_descriptors(option, 'cation') for option in cation_options],
		)
		param_space.add(cation_param)

		#>>>>>>>>
		# sample some low-fidelity points
		gga_tasks = sample_tasks(num_points=192, param_space=param_space, random_state=100700)
		planner = MultiTaskBO(
			goal='minimize', tasks=gga_tasks
		)
		planner.set_param_space(param_space)
		#<<<<<<<<

		campaign = Campaign()
		campaign.set_param_space(param_space)

		BUDGET = 192

		OPT = ['hydrazinium', 'I', 'Sn'] # value = 1.5249 eV

		for iter in range(BUDGET):
			samples = planner.recommend(campaign.observations)
			measurement = measure(samples[0])
			print(f'ITER : {iter}\tSAMPLES : {samples}\t MEASUREMENT : {measurement}')
			campaign.add_observation(samples[0], measurement)

			# check for convergence
			if [samples[0]['organic'], samples[0]['anion'], samples[0]['cation']] == OPT:
				print(f'FOUND OPTIMUM AFTER {iter+1} ITERATIONS!')
				break