Spaces:

AccelerationConsortium
/

crabnet-hyperparameter

Running

App Files Files Community

crabnet-hyperparameter / app.py

sgbaird

add open in colab badge for github gist

013d919 verified 11 months ago

raw

history blame contribute delete

11.4 kB

	import numpy as np
	import gradio as gr
	import pandas as pd
	from sklearn.preprocessing import MinMaxScaler
	from surrogate import CrabNetSurrogateModel, PARAM_BOUNDS
	from pydantic import (
	BaseModel,
	ValidationError,
	ValidationInfo,
	field_validator,
	model_validator,
	)

	# Surrogate imported from the local `surrogate` module; it is queried below
	# through `surrogate_evaluate`, which takes a list of parameter dicts.
	model = CrabNetSurrogateModel()

	# Reference parameterization in the ORIGINAL (un-blinded) parameter names.
	# It supplies the default widget values and the example output row.
	example_parameterization = {
	    # Numeric hyperparameters
	    "N": 3,
	    "alpha": 0.5,
	    "d_model": 512,
	    "dim_feedforward": 2048,
	    "dropout": 0.1,
	    "emb_scaler": 0.5,
	    "epochs_step": 10,
	    "eps": 1e-6,
	    "fudge": 0.02,
	    "heads": 4,
	    "k": 6,
	    "lr": 0.001,
	    "pe_resolution": 5000,
	    "ple_resolution": 5000,
	    "pos_scaler": 0.5,
	    "weight_decay": 0,
	    "batch_size": 32,
	    "out_hidden4": 128,
	    "betas1": 0.9,
	    "betas2": 0.999,
	    # Categorical hyperparameters
	    "bias": False,
	    "criterion": "RobustL1",
	    "elem_prop": "mat2vec",
	    # Exposed to users as `fidelity1`
	    "train_frac": 0.5,
	}

	# Evaluate the example once at import time; the single result is reused
	# further down to size and pre-fill the output table.
	example_results = model.surrogate_evaluate([example_parameterization])
	example_result = example_results[0]

	# One MinMaxScaler per "range" parameter, keyed by the original parameter
	# name and fitted on that parameter's bounds. Parameters of any other type
	# get no scaler.
	scalers = {}
	for param_info in PARAM_BOUNDS:
	    if param_info["type"] != "range":
	        continue
	    # Each bound becomes its own single-feature sample.
	    bound_rows = [[bound] for bound in param_info["bounds"]]
	    scaler = MinMaxScaler().fit(bound_rows)
	    scalers[param_info["name"]] = scaler

	# HACK: Hardcoded
	# Blinded search space: twenty unit-interval range parameters x1..x20,
	# three categorical parameters c1..c3, and the fidelity parameter.
	BLINDED_PARAM_BOUNDS = [
	    *(
	        {"name": f"x{position}", "type": "range", "bounds": [0.0, 1.0]}
	        for position in range(1, 21)
	    ),
	    {"name": "c1", "type": "choice", "values": ["c1_0", "c1_1"]},
	    {"name": "c2", "type": "choice", "values": ["c2_0", "c2_1"]},
	    {"name": "c3", "type": "choice", "values": ["c3_0", "c3_1", "c3_2"]},
	    {"name": "fidelity1", "type": "range", "bounds": [0.0, 1.0]},
	]


	class BlindedParameterization(BaseModel):
	    """Validate one parameterization expressed in blinded names.

	    Field-level validation checks every value against the matching entry in
	    ``BLINDED_PARAM_BOUNDS``; model-level validation then enforces the two
	    cross-parameter constraints.

	    The trailing ``# int`` / ``# bool`` comments are kept from the original
	    source; presumably they record the type of the un-blinded
	    hyperparameter (TODO confirm against ``PARAM_BOUNDS``).
	    """

	    x1: float  # int
	    x2: float
	    x3: float  # int
	    x4: float  # int
	    x5: float
	    x6: float
	    x7: float  # int
	    x8: float
	    x9: float
	    x10: float  # int
	    x11: float  # int
	    x12: float
	    x13: float  # int
	    x14: float  # int
	    x15: float
	    x16: float  # int
	    x17: float  # int
	    x18: float  # int
	    x19: float
	    x20: float
	    c1: str  # bool
	    c2: str
	    c3: str
	    fidelity1: float

	    @field_validator("*")
	    @classmethod
	    def check_bounds(cls, v: "float | str", info: ValidationInfo) -> "float | str":
	        """Check a single field against its entry in ``BLINDED_PARAM_BOUNDS``.

	        Args:
	            v: The already type-coerced field value.
	            info: Validation context; only ``info.field_name`` is used.

	        Returns:
	            ``v`` unchanged.

	        Raises:
	            ValueError: If a range value lies outside its bounds or a choice
	                value is not one of the allowed options.
	        """
	        param = next(
	            (item for item in BLINDED_PARAM_BOUNDS if item["name"] == info.field_name),
	            None,
	        )
	        # Fields without a bounds entry are accepted as-is.
	        if param is None:
	            return v

	        if param["type"] == "range":
	            min_val, max_val = param["bounds"]
	            if not min_val <= v <= max_val:
	                raise ValueError(
	                    f"{info.field_name} must be between {min_val} and {max_val}"
	                )
	        elif param["type"] == "choice":
	            if v not in param["values"]:
	                raise ValueError(f"{info.field_name} must be one of {param['values']}")

	        return v

	    @model_validator(mode="after")
	    def check_constraints(self) -> "BlindedParameterization":
	        """Enforce the cross-parameter constraints.

	        Returns:
	            The validated instance itself, as pydantic requires for
	            ``mode="after"`` validators.

	        Raises:
	            ValueError: If ``x19 > x20`` or ``x6 + x15 > 1.0``.
	        """
	        # NOTE(review): equality (x19 == x20) is accepted here although the
	        # message says "less than" -- confirm whether a strict inequality is
	        # intended.
	        if self.x19 > self.x20:
	            raise ValueError(
	                f"Received x19={self.x19} which should be less than x20={self.x20}"
	            )
	        if self.x6 + self.x15 > 1.0:
	            raise ValueError(
	                f"Received x6={self.x6} and x15={self.x15} which should sum to less than or equal to 1.0"  # noqa: E501
	            )
	        # Without this return the validator yields None, which breaks
	        # `model_validate` and triggers a warning on `__init__`.
	        return self


	# Conversion from original to blinded representation
	def convert_to_blinded(params):
	    """Map a parameterization in original names to its blinded form.

	    Iterates ``PARAM_BOUNDS`` in order. Range parameters are rescaled with
	    the matching entry of ``scalers`` and stored under ``x1``, ``x2``, ...
	    (``train_frac`` is stored under ``fidelity1`` and does not consume an
	    ``x`` index). Choice parameters are stored under ``c1``, ``c2``, ... with
	    the value ``"c<k>_<position>"``, where ``position`` is the index of the
	    selected option in the parameter's ``values`` list.

	    Args:
	        params: Mapping from original parameter name to value.

	    Returns:
	        dict mapping blinded names to blinded values.

	    Raises:
	        KeyError: If ``params`` lacks a parameter listed in ``PARAM_BOUNDS``.
	        ValueError: If a choice value is not among the allowed ``values``.
	    """
	    blinded_params = {}
	    numeric_index = 1
	    choice_index = 1
	    for param in PARAM_BOUNDS:
	        name = param["name"]
	        if param["type"] == "range":
	            is_fidelity = name == "train_frac"
	            key = "fidelity1" if is_fidelity else f"x{numeric_index}"
	            blinded_params[key] = scalers[name].transform([[params[name]]])[0][0]
	            if not is_fidelity:
	                numeric_index += 1
	        elif param["type"] == "choice":
	            key = f"c{choice_index}"
	            # Keep the position of the selected option separate from the
	            # running `choice_index` counter. Reusing the counter here made
	            # later choice parameters land on the wrong (or a duplicate) key.
	            value_position = param["values"].index(params[name])
	            blinded_params[key] = f"{key}_{value_position}"
	            choice_index += 1
	    return blinded_params


	# Conversion from blinded to original representation
	def convert_from_blinded(blinded_params):
	    """Map a blinded parameterization back to the original parameter names.

	    Walks ``PARAM_BOUNDS`` in order. Range parameters are read from ``x1``,
	    ``x2``, ... (``train_frac`` from ``fidelity1``, without consuming an
	    ``x`` index) and un-scaled with the matching entry of ``scalers``. Choice
	    parameters are read from ``c1``, ``c2``, ...; the integer after the last
	    underscore selects the option from the parameter's ``values`` list.

	    Args:
	        blinded_params: Mapping from blinded name to blinded value.

	    Returns:
	        dict mapping original parameter names to original-scale values.
	    """
	    restored = {}
	    next_x = 1
	    next_c = 1
	    for spec in PARAM_BOUNDS:
	        name = spec["name"]
	        kind = spec["type"]
	        if kind == "range":
	            is_fidelity = name == "train_frac"
	            blinded_key = "fidelity1" if is_fidelity else f"x{next_x}"
	            unscaled = scalers[name].inverse_transform([[blinded_params[blinded_key]]])
	            restored[name] = unscaled[0][0]
	            if not is_fidelity:
	                next_x += 1
	        elif kind == "choice":
	            blinded_key = f"c{next_c}"
	            option_suffix = blinded_params[blinded_key].split("_")[-1]
	            restored[name] = spec["values"][int(option_suffix)]
	            next_c += 1
	    return restored


	def evaluate(*args):
	    """Evaluate the surrogate for one blinded parameterization.

	    Args:
	        *args: Blinded values, positionally in the order of
	            ``BLINDED_PARAM_BOUNDS``.

	    Returns:
	        A list with one inner list per result returned by
	        ``model.surrogate_evaluate``, holding that result's values.

	    Raises:
	        pydantic.ValidationError: If a value is missing, out of bounds, not
	            an allowed choice, or violates a cross-parameter constraint.
	    """
	    # Assume args are in the order of BLINDED_PARAM_BOUNDS
	    names = [param["name"] for param in BLINDED_PARAM_BOUNDS]
	    blinded_params = dict(zip(names, args))

	    # Validate BEFORE converting, so that bad input is reported by the
	    # validator rather than as an IndexError/KeyError from the conversion.
	    BlindedParameterization(**blinded_params)

	    original_params = convert_from_blinded(blinded_params)
	    results = model.surrogate_evaluate([original_params])
	    return [list(result.values()) for result in results]


	def get_interface(param_info, numeric_index, choice_index):
	    """Build the Gradio input widget for one entry of ``PARAM_BOUNDS``.

	    Range parameters become a ``gr.Slider`` over the scaled bounds, labelled
	    ``x<numeric_index>`` (``fidelity1`` for ``train_frac``). Choice
	    parameters become a ``gr.Radio`` labelled ``c<choice_index>`` whose
	    options are ``c<choice_index>_<position>``. Default values come from
	    ``example_parameterization``.

	    Args:
	        param_info: One parameter spec with ``name``, ``type`` and either
	            ``bounds`` (range) or ``values`` (choice).
	        numeric_index: Next free index for ``x`` labels.
	        choice_index: Next free index for ``c`` labels.

	    Returns:
	        Tuple ``(component, numeric_index, choice_index)`` with the counters
	        advanced for the next call.

	    Raises:
	        ValueError: If ``param_info["type"]`` is neither ``"range"`` nor
	            ``"choice"``.
	    """
	    key = param_info["name"]
	    default_value = example_parameterization[key]
	    if param_info["type"] == "range":
	        # `scalers[key]` was already fitted on these bounds at module level,
	        # so the shared scaler is not refitted here.
	        scaler = scalers[key]
	        scaled_value = scaler.transform([[default_value]])[0][0]
	        scaled_bounds = scaler.transform([[bound] for bound in param_info["bounds"]])
	        lower, upper = scaled_bounds[0][0], scaled_bounds[1][0]
	        is_fidelity = key == "train_frac"
	        slider = gr.Slider(
	            value=scaled_value,
	            minimum=lower,
	            maximum=upper,
	            label="fidelity1" if is_fidelity else f"x{numeric_index}",
	            step=(upper - lower) / 100,
	        )
	        # The fidelity parameter does not consume an `x` index, matching
	        # convert_to_blinded / convert_from_blinded.
	        next_numeric_index = numeric_index if is_fidelity else numeric_index + 1
	        return slider, next_numeric_index, choice_index
	    if param_info["type"] == "choice":
	        options = [f"c{choice_index}_{i}" for i in range(len(param_info["values"]))]
	        radio = gr.Radio(
	            choices=options,
	            label=f"c{choice_index}",
	            value=f"c{choice_index}_{param_info['values'].index(default_value)}",
	        )
	        return radio, numeric_index, choice_index + 1
	    # Fail loudly instead of returning None, which the caller cannot unpack.
	    raise ValueError(f"Unsupported parameter type: {param_info['type']!r}")


	# Smoke-test `evaluate` at import time: 0.5 for each of the twenty x
	# parameters, the first option of every choice parameter, and 0.5 for
	# fidelity1 (positional order follows BLINDED_PARAM_BOUNDS).
	blinded_results = evaluate(*[0.5] * 20, "c1_0", "c2_0", "c3_0", 0.5)

	# Build one input widget per entry of PARAM_BOUNDS, threading the running
	# x / c label counters through get_interface.
	numeric_index = 1
	choice_index = 1
	inputs = []
	for param in PARAM_BOUNDS:
	    # Named `component` rather than `input` to avoid shadowing the builtin.
	    component, numeric_index, choice_index = get_interface(
	        param, numeric_index, choice_index
	    )
	    inputs.append(component)

	# Assemble the Gradio interface: `evaluate` is the callback, `inputs` is the
	# list of widgets built above, and the output is a single numeric table.
	iface = gr.Interface(
	title="Advanced Optimization",
	fn=evaluate,
	inputs=inputs,
	# Output table: one fixed column per objective, headed y1, y2, ..., and
	# pre-filled with the values of `example_result`.
	outputs=gr.Numpy(
	value=np.array([list(example_result.values())]),
	headers=[f"y{i+1}" for i in range(len(example_result))],
	col_count=(len(example_result), "fixed"),
	datatype=["number"] * len(example_result),
	),
	# Markdown text describing the benchmark task to the user.
	# NOTE(review): the text below states x19 < x20 (strict), whereas
	# BlindedParameterization.check_constraints only rejects x19 > x20 --
	# confirm which is intended.
	description="""
	[![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/gist/sgbaird/78fbb50753c1089f487152817779fd74/hf-crabnet-hyperparameter.ipynb)

	## Objectives

	Minimize `y1`, `y2`, `y3`, and `y4`

	### Correlations

	- `y1` and `y2` are correlated
	- `y1` is anticorrelated with `y3`
	- `y2` is anticorrelated with `y3`

	### Noise

	`y1`, `y2`, and `y3` are stochastic with heteroskedastic, parameter-free
	noise, whereas `y4` is deterministic, but still considered 'black-box'. In
	other words, repeat calls with the same input arguments will result in
	different values for `y1`, `y2`, and `y3`, but the same value for `y4`.

	### Objective thresholds

	If `y1` is greater than 0.2, the result is considered "bad" no matter how
	good the other values are. If `y2` is greater than 0.7, the result is
	considered "bad" no matter how good the other values are. If `y3` is greater
	than 1800, the result is considered "bad" no matter how good the other
	values are. If `y4` is greater than 40e6, the result is considered "bad" no
	matter how good the other values are.

	## Search Space

	### Fidelity

	`fidelity1` is a fidelity parameter. The lowest fidelity is 0, and the
	highest fidelity is 1. The higher the fidelity, the more expensive the
	evaluation, and the higher the quality.

	NOTE: `fidelity1` and `y3` are correlated.

	### Constraints

	- x<sub>19</sub> < x<sub>20</sub>
	- x<sub>6</sub> + x<sub>15</sub> ≤ 1.0

	### Parameter bounds

	- 0 ≤ x<sub>i</sub> ≤ 1 for i ∈ {1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13,
	14, 15, 16, 17, 18, 19, 20}
	- c<sub>1</sub> ∈ {c1_0, c1_1}
	- c<sub>2</sub> ∈ {c2_0, c2_1}
	- c<sub>3</sub> ∈ {c3_0, c3_1, c3_2}
	- 0 ≤ fidelity1 ≤ 1

	## Notion of best

	Thresholded Pareto front hypervolume vs. running cost for three different
	budgets, and averaged over 10 search campaigns.

	## References:

	1. Baird, S. G.; Liu, M.; Sparks, T. D. High-Dimensional Bayesian
	Optimization of 23 Hyperparameters over 100 Iterations for an
	Attention-Based Network to Predict Materials Property: A Case Study on
	CrabNet Using Ax Platform and SAASBO. Computational Materials Science
	2022, 211, 111505. https://doi.org/10.1016/j.commatsci.2022.111505.

	2. Baird, S. G.; Parikh, J. N.; Sparks, T. D. Materials Science
	Optimization Benchmark Dataset for High-Dimensional, Multi-Objective,
	Multi-Fidelity Optimization of CrabNet Hyperparameters. ChemRxiv March
	7, 2023. https://doi.org/10.26434/chemrxiv-2023-9s6r7.
	""",
	)
	# Start the app at import time. `show_error=True` presumably surfaces
	# exceptions raised by `evaluate` (e.g. validation failures) in the UI --
	# confirm against the Gradio `launch` documentation.
	iface.launch(show_error=True)