diff --git a/.devcontainer/Dockerfile b/.devcontainer/Dockerfile deleted file mode 100644 index 2300915..0000000 --- a/.devcontainer/Dockerfile +++ /dev/null @@ -1,5 +0,0 @@ -# See here for image contents: https://github.com/microsoft/vscode-dev-containers/tree/v0.245.0/containers/python-3/.devcontainer/base.Dockerfile - -# [Choice] Python version (use -bullseye variants on local arm64/Apple Silicon): 3, 3.10, 3.9, 3.8, 3.7, 3.6, 3-bullseye, 3.10-bullseye, 3.9-bullseye, 3.8-bullseye, 3.7-bullseye, 3.6-bullseye, 3-buster, 3.10-buster, 3.9-buster, 3.8-buster, 3.7-buster, 3.6-buster -ARG VARIANT="3.10-bullseye" -FROM mcr.microsoft.com/vscode/devcontainers/python:0-${VARIANT} \ No newline at end of file diff --git a/.devcontainer/devcontainer.json b/.devcontainer/devcontainer.json deleted file mode 100644 index 684b518..0000000 --- a/.devcontainer/devcontainer.json +++ /dev/null @@ -1,45 +0,0 @@ -// For format details, see https://aka.ms/devcontainer.json. For config options, see the README at: -// https://github.com/microsoft/vscode-dev-containers/tree/v0.245.0/containers/python-3 -{ - "name": "Python 3", - "build": { - "dockerfile": "Dockerfile", - "context": "..", - "args": { - // Update 'VARIANT' to pick a Python version: 3, 3.10, 3.9, 3.8, 3.7, 3.6 - // Append -bullseye or -buster to pin to an OS version. - // Use -bullseye variants on local on arm64/Apple Silicon. - "VARIANT": "3.10-bullseye", - // Options - "NODE_VERSION": "none" - } - }, - // Configure tool-specific properties. - "customizations": { - // Configure properties specific to VS Code. - "vscode": { - // // Set *default* container specific settings.json values on container create. - // "settings": { - // "python.defaultInterpreterPath": "/home/vscode/venv/bin/python" - // }, - // Add the IDs of extensions you want installed when the container is created. 
- "extensions": [ - "ms-python.python", - "ms-python.vscode-pylance", - "GitHub.vscode-github-actions", - "GitHub.copilot", - "GitHub.copilot-chat" - ] - } - }, - // Use 'forwardPorts' to make a list of ports inside the container available locally. - // "forwardPorts": [], - // Use 'postCreateCommand' to run commands after the container is created. - "onCreateCommand": "sudo cp .devcontainer/welcome.txt /usr/local/etc/vscode-dev-containers/first-run-notice.txt", - "postCreateCommand": "sudo -H pip3 install -r requirements.txt" // alternatively, `pip3 install --user -r requirements.txt` - // Comment out to connect as root instead. More info: https://aka.ms/vscode-remote/containers/non-root. - // "remoteUser": "vscode", - // "features": { - // "azure-cli": "latest" - // } -} \ No newline at end of file diff --git a/.devcontainer/welcome.txt b/.devcontainer/welcome.txt deleted file mode 100644 index 8921939..0000000 --- a/.devcontainer/welcome.txt +++ /dev/null @@ -1,5 +0,0 @@ -👋 Welcome to Codespaces! Wait a few seconds for the Python requirements to install. - -📝 In the meantime, begin following the instructions in the README. - -đŸ€” If you have questions, use the GitHub Copilot "Chat" extension along the left panel (note: you may need to click the ellipses (...) 
to see the extension) diff --git a/.github/.keep b/.github/.keep deleted file mode 100644 index e69de29..0000000 diff --git a/.github/workflows/classroom.yml b/.github/workflows/classroom.yml index 92a4edd..b58bdff 100644 --- a/.github/workflows/classroom.yml +++ b/.github/workflows/classroom.yml @@ -16,8 +16,11 @@ jobs: uses: actions/checkout@v4 - name: Hello world test id: hello-world-test - uses: education/autograding-python-grader@v1 + uses: education/autograding-command-grader@v1 with: + test-name: Hello world test + setup-command: sudo -H pip3 install pytest + command: pytest timeout: 5 max-score: 5 - name: Autograding Reporter diff --git a/.github/workflows/docker-image.yml b/.github/workflows/docker-image.yml deleted file mode 100644 index 763a95f..0000000 --- a/.github/workflows/docker-image.yml +++ /dev/null @@ -1,18 +0,0 @@ -name: Docker Image CI - -on: - pull_request: - branches: [ "main" ] - # Allow mannually trigger - workflow_dispatch: - -jobs: - - build: - - runs-on: ubuntu-latest - - steps: - - uses: actions/checkout@v3 - - name: Build the Codespaces container image - run: docker build . --file .devcontainer/Dockerfile diff --git a/.gitignore b/.gitignore deleted file mode 100644 index 4ded053..0000000 --- a/.gitignore +++ /dev/null @@ -1,5 +0,0 @@ -**/__pycache__/ -.pytest_cache/ -*.pyc -.coverage -*.egg-info/ diff --git a/.vscode/launch.json b/.vscode/launch.json deleted file mode 100644 index 948a236..0000000 --- a/.vscode/launch.json +++ /dev/null @@ -1,16 +0,0 @@ -{ - // Use IntelliSense to learn about possible attributes. - // Hover to view descriptions of existing attributes. 
- // For more information, visit: https://go.microsoft.com/fwlink/?linkid=830387 - "version": "0.2.0", - "configurations": [ - { - "name": "Python: Current File", - "type": "python", - "request": "launch", - "program": "${file}", - "console": "integratedTerminal", - "justMyCode": true - } - ] -} \ No newline at end of file diff --git a/.vscode/settings.json b/.vscode/settings.json deleted file mode 100644 index 1f2b0f4..0000000 --- a/.vscode/settings.json +++ /dev/null @@ -1,10 +0,0 @@ -{ - "python.testing.pytestArgs": [ - "." - ], - "python.testing.unittestEnabled": false, - "python.testing.pytestEnabled": true, - "githubPullRequests.ignoredPullRequestBranches": [ - "main" - ] -} \ No newline at end of file diff --git a/LICENSE b/LICENSE new file mode 100644 index 0000000..d07993a --- /dev/null +++ b/LICENSE @@ -0,0 +1,22 @@ +MIT License + +Copyright (c) 2024 Dieter Plessers +Copyright (c) 2024 AC BO Hackathon + +Permission is hereby granted, free of charge, to any person obtaining a copy +of this software and associated documentation files (the "Software"), to deal +in the Software without restriction, including without limitation the rights +to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +copies of the Software, and to permit persons to whom the Software is +furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +SOFTWARE. 
diff --git a/README.md b/README.md index da21a6d..be24328 100644 --- a/README.md +++ b/README.md @@ -1,15 +1,41 @@ -# Autograding Example: Python -This example project is written in Python, and tested with pytest. - -## The assignment -The tests are failing right now because the method isn't outputting the correct string. Fixing this up will make the tests green. - -## Setup command - -See `postCreateCommand` from [`devcontainer.json`](.devcontainer/devcontainer.json). - -## Run command -`pytest` - -## Notes -- pip's install path is not included in the PATH var by default, so without installing via `sudo -H`, pytest would be unaccessible. +# Bayesian Optimisation for Zeolite Synthesis Zeolite + +## Overview +Summarizing poster + +## Scope +This repository was initiated as an entry for the [Bayesian Optimization Hackathon for Chemistry and Materials](https://ac-bo-hackathon.github.io/), held on March 27-28, 2024, and sponsored by the Acceleration Consortium and Merck KGaA. Here, we propose Bayesian optimization within the field of zeolite synthesis. This concept is also explained in a [short video](https://www.youtube.com/watch?v=4lFEUixwkE8). + +Despite their significant industrial applications as catalysts, ion exchangers and adsorbents, the synthesis of zeolites predominantly relies on heuristics, experience and a sprinkle of magic. Employing Bayesian optimization has the potential to swiftly navigate the extensive parameter space in zeolite synthesis research and reduce associated costs. + +## [Introductory text](./zeolite_synthesis_bo_introduction.md) on zeolites, zeolite synthesis and Bayesian optimization +In [zeolite_synthesis_bo_introduction.md](./zeolite_synthesis_bo_introduction.md) we provide an overview of the following topics: +1. **Zeolites:** definition, properties and relevance in industry +2. **Zeolite Synthesis:** typical procedures, ingredients and equipments +3. 
**Zeolite Synthesis Optimization:** the limited literature on active learning for zeolite synthesis is discussed, and considerations regarding BO: + 3.1 Parameter space of a zeolite synthesis + 3.2 Constraints of a zeolite synthesis + 3.3 Objectives that might be pursued in zeolite synthesis + 3.4 Zeolite synthesis datasets that are available in literature +4. **Discussion:** various aspects of BO in zeolite synthesis are discussed, and how they can be tackled +5. **References** + +While numerous references are provided for further exploration, this document is self-contained and aims to be easily understood. We hope it inspires the reader to consider active learning approaches in their zeolite synthesis endeavors. +This introductory text is also provided as [pdf](./zeolite_synthesis_bo_introduction.pdf). + +## [Notebook](./demo_zeolite_synthesis_bo.ipynb) tutorial on Bayesian optimization for zeolite synthesis (with [Ax](https://ax.dev/)) Open In Colab +Within the [demo_zeolite_synthesis_bo.ipynb](./demo_zeolite_synthesis_bo.ipynb) notebook, we illustrate the concepts of the introductory text with code, leveraging real-world literature data acquired through grid search in [Table S4](https://pubs.acs.org/doi/suppl/10.1021/acs.chemmater.9b03738/suppl_file/cm9b03738_si_001.pdf#page=10) and [Table S3](https://pubs.acs.org/doi/suppl/10.1021/jacs.1c07590/suppl_file/ja1c07590_si_001.pdf#page=9) in the Supporting Information of respectively [*Chem. Mater.* **2020**, *32*, 273–285](https://pubs.acs.org/doi/abs/10.1021/acs.chemmater.9b03738) and [*J. Am. Chem. Soc.* **2021**, *143*, 16243–16255](https://pubs.acs.org/doi/10.1021/jacs.1c07590). + +This notebook is divided into two sections: +1. The first section uses Bayesian optimization to **optimize an analytical dummy function** using zeolite synthesis parameters, showing a significant improvement compared to grid search. +2. 
The second section uses Bayesian optimization to **propose a new experiment** based on existing literature data. + +A common overarching objective in zeolite synthesis is to achieve a **high yield** of the desired zeolite product. In the papers under consideration, a more specialized goal involves **maximizing the presence of proximal Al pairs** within synthesized CHA zeolites, which is required for stabilizing Fe2+ sites (so-called divalent cation capacity, DCC). Upon activation, these sites can selectively oxidize methane to **methanol**. Accordingly, we will provide examples with synthesis yield, DCC and methanol yield as optimization objectives for the Bayesian optimization process. + +The various examples touch upon different aspects of Bayesian optimization, including **continuous variables, categorical variables, mixed variable types, parameter constraints, as well as single and multiple objectives**. + + + + + + diff --git a/demo_zeolite_synthesis_bo.ipynb b/demo_zeolite_synthesis_bo.ipynb new file mode 100644 index 0000000..deb1fe9 --- /dev/null +++ b/demo_zeolite_synthesis_bo.ipynb @@ -0,0 +1,2181 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "33956ea9-21bf-41a8-9c4a-d24f89d1d52d", + "metadata": {}, + "source": [ + "# Code Demonstration: Bayesian Optimization for Zeolite Synthesis" + ] + }, + { + "cell_type": "markdown", + "id": "72398f31-f1bc-459f-aca4-6358d7e1a0c8", + "metadata": {}, + "source": [ + "Author: Plessers Dieter \n", + "March 28th, 2024" + ] + }, + { + "cell_type": "markdown", + "id": "e8b0873e-52ee-41ad-8ea6-dda138b77892", + "metadata": {}, + "source": [ + "## Table of Contents \n", + "[Introduction](#Introduction) \n", + "[Import necessary packages](#Packages) \n", + "\n", + "[Part 1: Optimize an Analytical 'Dummy' Function with Zeolite Synthesis Parameters](#Part1)\n", + "* [1.1 Define Dummy Analytical Objective Functions](#Part1.1) \n", + "* [1.2 Define a Function that Optimizes the Dummy Function with Ax 
Package](#Part1.2)\n", + "* [1.3 Single-Objective with 4 Continuous Variables](#Part1.3) \n", + "* [1.4 Multi-Objective with 4 Continuous Variables](#Part1.4)\n", + "* [1.5 Multi-Objective with 4 Continuous Variables and 2 Categorical Variables](#Part1.5) \n", + "* [1.6 Multi-Objective with 4 Continuous Variables, 2 Categorical Variables and Parameter Constraints](#Part1.6)\n", + "* [1.7 Code Example without Using the General `optimize_experiment_ax` Function of Part 1.2](#Part1.7)\n", + " \n", + "[Part 2: Propose a New Experiment Based on a Batch of Prior (Literature) Experiments](#Part2)\n", + "* [2.1 Define a Function that Proposes the Next Best Experiment with Ax Package](#Part2.1) \n", + "* [2.2 Collect the Literature Input and Output Data](#Part2.2)\n", + "* [2.3 Single-Objective (Synthesis Yield) with 3 Continuous Variables and 2 Categorical Variables](#Part2.3) \n", + "* [2.4 Multi-Objective (Synthesis Yield + Methanol Production) with 3 Continuous Variables and 2 Categorical Variables](#Part2.4)\n" + ] + }, + { + "cell_type": "markdown", + "id": "e3c2a160-5c0a-4e9c-bfcd-45491aef19b9", + "metadata": {}, + "source": [ + "## Introduction \n", + "#### Scope \n", + "This Jupyter notebook accompanies an introductory text on Bayesian optimization (BO) for zeolite synthesis. In the text, we outlined a **typical parameter space with tunable variables and constraints, along with possible objectives derived from a zeolite target application**. Within this notebook, we exemplify these concepts with code, leveraging real-world literature data acquired through grid search in [Table S4](https://pubs.acs.org/doi/suppl/10.1021/acs.chemmater.9b03738/suppl_file/cm9b03738_si_001.pdf#page=10) and [Table S3](https://pubs.acs.org/doi/suppl/10.1021/jacs.1c07590/suppl_file/ja1c07590_si_001.pdf#page=9) in the Supporting Information of respectively:\n", + "\n", + "1. Devos, J.; Bols, M. L.; Plessers, D.; Goethem, C. Van; Seo, J. W.; Hwang, S.-J.; Sels, B. F.; Dusselier, M. 
Synthesis–Structure–Activity Relations in Fe-CHA for C–H Activation: Control of Al Distribution by Interzeolite Conversion. [*Chem. Mater.* **2020**, *32*, 273–285](https://pubs.acs.org/doi/abs/10.1021/acs.chemmater.9b03738). \n", + "2. Bols, M. L.; Devos, J.; Rhoda, H. M.; Plessers, D.; Solomon, E. I.; Schoonheydt, R. A.; Sels, B. F.; Dusselier, M. Selective Formation of $\\alpha$-Fe(II) Sites on Fe-Zeolites through One-Pot Synthesis. [*J. Am. Chem. Soc.* **2021**, *143*, 16243–16255](https://pubs.acs.org/doi/10.1021/jacs.1c07590). \n", + "\n", + "A common overarching objective in zeolite synthesis is to achieve a **high yield** of the desired zeolite product. In the papers under consideration, a more specialized goal involves **maximizing the presence of proximal Al pairs** within synthesized CHA zeolites, which is required for stabilizing Fe2+ sites (so-called divalent cation capacity, DCC). Upon activation, these sites can selectively oxidize methane to **methanol**. Accordingly, we will provide examples with synthesis yield, DCC and methanol yield as optimization objectives for the Bayesian optimization process.\n", + "\n", + "This notebook is divided into two sections: \n", + "1. The first section uses Bayesian optimization to optimize an analytical dummy function using zeolite synthesis parameters. \n", + "2. The second section uses Bayesian optimization to propose a new experiment based on existing literature data.\n", + "\n", + "#### [Part 1: Optimize an Analytical 'Dummy' Function with Zeolite Synthesis Parameters](#Part1)\n", + "We create a ['dummy' function](#Part1.1) linking the input parameters of zeolite synthesis to a specific output. 
The Bayesian optimizer operates without knowledge of the underlying analytical function we have defined, but this approach allows us to run a Bayesian optimization scheme as follows: 1) BO suggests parameters for experimentation based on a list of previous experimental outcomes, 2) our analytical function yields the outcome of the suggested experiment, 3) the outcome is added to the list of previous experimental outcomes and 4) this process is iteratively repeated. \n", + "\n", + "We run four different experiment modes to demonstrate various options available with BO:\n", + "\n", + "1. Four **continuous** variables with a **single** objective (high synthesis yield) [[link]](#Part1.3) \n", + "2. Four **continuous** variables with **multiple** objectives (high synthesis yield and high DCC) [[link]](#Part1.4) \n", + "3. **Mixed variable types** (4 continuous and 2 categorical) with **multiple** objectives (high synthesis yield and high DCC) [[link]](#Part1.5) \n", + "4. **Mixed variable types** (4 continuous and 2 categorical) with **parameter constraints** and with **multiple objectives** (high synthesis yield and high DCC) [[link]](#Part1.6) \n", + "\n", + "In the simplest case of 4 continuous variables, a grid search choosing 3 values per variable would require $3^4=81$ experiments, with no guarantee that any of these experiments will come close to the global optimum. In contrast, it can be seen in the code that the Bayesian optimizer reaches close to the global optimum in fewer than 30 iterations. \n", + " \n", + "#### [Part 2: Propose a New Experiment Based on a Batch of Prior (Literature) Experiments](#Part2)\n", + "Here Bayesian optimization is applied within a **real-world context** where the underlying target function remains unknown. We start from a batch of experiments collected from literature, and we allow the Bayesian optimizer to **suggest the next experiment**. This process aims to explore the search space further and/or leverage past results. 
In practice, one would implement the suggested experiment, incorporate its outcome into the existing results, and subsequently rerun the Bayesian optimization algorithm. We provide an example with **mixed variable types** (3 continuous and 2 categorical) with a **single-objective** and **multi-objective** target.\n", + "\r\n", + "\n", + "\n" + ] + }, + { + "cell_type": "markdown", + "id": "293ba810-16e0-4db1-8bd8-ed91705d0fe5", + "metadata": {}, + "source": [ + "## Import necessary packages " + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "id": "bec011d0-be00-428b-b4e3-ace5c2940f3e", + "metadata": {}, + "outputs": [], + "source": [ + "import numpy as np\n", + "\n", + "# Ax (adaptive experimentation) is the package we use for BO: https://ax.dev/\n", + "try:\n", + " import ax\n", + "except: \n", + " %pip install ax-platform\n", + "from ax.service.ax_client import AxClient, ObjectiveProperties\n", + "from ax.modelbridge.generation_strategy import GenerationStrategy, GenerationStep\n", + "from ax.modelbridge.registry import Models\n", + "from ax.service.utils.instantiation import ObjectiveProperties\n", + "\n", + "# We will use plotly to plot the optimization trace of a single-objective experiment\n", + "try: \n", + " import plotly\n", + "except:\n", + " %pip install plotly\n", + "import plotly.graph_objects as go\n", + "\n", + "from IPython.display import display # Enables the display of more than one dataframe per code cell\n", + "import pandas as pd\n", + "pd.set_option('max_colwidth', None) # Show full width Panda columns\n", + "from collections import OrderedDict\n", + "\n", + "# To hide all the info and warning messages of Ax. 
Comment the next lines if you want to see them.\n", + "import logging, sys\n", + "logging.disable(sys.maxsize)\n", + "import warnings\n", + "warnings.filterwarnings('ignore')\n" + ] + }, + { + "cell_type": "markdown", + "id": "4f326992-3de6-443f-875b-d72e35aaab7b", + "metadata": {}, + "source": [ + "## Part 1: Optimize an Analytical 'Dummy' Function with Zeolite Synthesis Parameters " + ] + }, + { + "cell_type": "markdown", + "id": "6c7517af-a5d3-4d5c-b7e9-05af59588548", + "metadata": {}, + "source": [ + "### 1.1 Define Dummy Analytical Objective Functions " + ] + }, + { + "cell_type": "markdown", + "id": "2b43f842-8109-499d-a064-048b377cb9b3", + "metadata": {}, + "source": [ + "Here we will define analytical functions for BO to **minimize**:\n", + "1) The first function has 4 continuous variables with a single objective\n", + "2) The second function has 4 continuous variables with two objectives\n", + "3) The third function has 4 continuous and 2 categorical variables with 2 objectives\n", + "\n", + "We choose a simple function definition that has a **clear global minimum** (both for single and multi-objective) around \n", + "x1 = 0.35 $\\ \\ \\ $ (molar ratio of organic structure directing agents (OSDA) compared to Si) \n", + "x2 = 12.5 $\\ \\ \\ $ (the molar ratio of water compared to Si) \n", + "x3 = 140 $\\ \\ \\ \\ $ (synthesis temperature (°C)) \n", + "x4 = 24 $\\ \\ \\ \\ \\ \\ $ (synthesis time (h)) \n", + "x5 = Static $\\ $ (stirring mode) \n", + "x6 = Fumed (silicon source)" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "fae9fcab-28a4-4245-8354-677b7a4034d1", + "metadata": {}, + "outputs": [], + "source": [ + "def dummy_function_4_continuous_1_objective(x1, x2, x3, x4, obj_name1):\n", + " y1 = float((90*x1- 90*0.35)**2 + (x2-12.5)**2 + (x3-140)**2 + (x4/8-24/8)**2 + np.cos(x1*x2*x3*x4))\n", + " return {obj_name1:y1}\n", + " \n", + "def dummy_function_4_continuous_2_objective(x1, x2, x3, x4, obj_name1, obj_name2):\n", + " y1 = 
float((90*x1- 90*0.35)**2 + (x2-12.5)**2 + (x3-140)**2 + (x4/8-24/8)**2 + np.cos(x1*x2*x3*x4))\n", + " y2 = float((90*x1- 90*0.35)**2 + (x2-12.5)**2 + (x3-140)**2 + (x4/8-24/8)**2 + np.sin(x1*x2*x3*x4))\n", + "\n", + " # In our case, standard error is 0.0, since we are computing a synthetic function.\n", + " # See: https://ax.dev/tutorials/multiobjective_optimization.html\n", + " return {obj_name1:(y1, 0.0), obj_name2 : (y2, 0.0)}\n", + "\n", + "def dummy_function_4_continuous_2_categorical_2_objective(x1, x2, x3, x4, c1, c2, obj_name1, obj_name2):\n", + "\n", + " # The penalty lookup idea comes from https://honegumi.readthedocs.io/en/latest/\n", + " penalty_lookup1 = {\"Stirring\": 5000, \"Tumbling\": 2500, \"Static\": 0.0}\n", + " penalty_lookup2 = {\"Colloidal\": 5000, \"Fumed\": 0.0}\n", + " \n", + " y1 = float((90*x1- 90*0.35)**2 + (x2-12.5)**2 + (x3-140)**2 + (x4/8-24/8)**2 + np.cos(x1*x2*x3*x4))\n", + " y1 += penalty_lookup1[c1] + penalty_lookup2[c2]\n", + " \n", + " y2 = float((90*x1- 90*0.35)**2 + (x2-12.5)**2 + (x3-140)**2 + (x4/8-24/8)**2 + np.sin(x1*x2*x3*x4))\n", + " y2 += penalty_lookup1[c1] + penalty_lookup2[c2]\n", + " \n", + " # In our case, standard error is 0.0, since we are computing a synthetic function.\n", + " # See: https://ax.dev/tutorials/multiobjective_optimization.html\n", + " return {obj_name1:(y1, 0.0), obj_name2 : (y2, 0.0)}\n" + ] + }, + { + "cell_type": "markdown", + "id": "9b4cc353-4c83-42f8-9bfd-bf1d926e97e0", + "metadata": {}, + "source": [ + "### 1.2 Define a Function that Optimizes the Dummy Function with Ax Package " + ] + }, + { + "cell_type": "markdown", + "id": "fdb712df-d17b-4662-a671-ddf0b3335c2c", + "metadata": {}, + "source": [ + "Here we will create a **general function** `optimize_experiment_ax` to run a BO experiment with the Ax package. This general function allows focus on the output of the experiments further on, without repeatedly modifying similar sections of code. 
At the end, we offer a code example not using this general function, which may be employed if only one type of experiment is considered. \n", + "\n", + "The `optimize_experiment_ax` function takes a list of **objective names** (can be any length, so single or multi-objective), an **analytical function** of the objectives (defined in [section 1.1](#Part1.1)), a list of **continuous parameters**, a list of **categorical parameters**, a list of parameter **constraints**, and a number of **iterations**. This function will be used throughout part 1 of the notebook to run different experiments. \n", + "\n", + "\n", + "This function is inspired by the different options provided by **Honegumi** (https://honegumi.readthedocs.io/en/latest/), and can easily be modified to incorporate batch sizes. " + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "5bcfb4b9-c580-4061-9b95-34a66f1667c6", + "metadata": {}, + "outputs": [], + "source": [ + "def to_plotly(axplotconfig):\n", + " \"\"\"Converts AxPlotConfig to plotly Figure.\"\"\"\n", + " data = axplotconfig[0][\"data\"]\n", + " layout = axplotconfig[0][\"layout\"]\n", + " fig = go.Figure({\"data\": data, \"layout\": layout})\n", + " return fig\n", + " \n", + "def optimize_experiment_ax(list_obj_names, objective_function, continuous_parameters_list, categorical_parameters_list, \n", + " parameter_constraints_lists, iterations):\n", + " \"\"\"\n", + " Creates an optimization experiment with the Ax package. 
\n", + " Inputs: \n", + " list_obj_names: list with all the objective names\n", + " objective_function: function used to calculate objectives\n", + " continuous_parameters_list: list of continuous parameters for the objective function\n", + " categorical_parameters_list: list of categorical parameters for the objective function\n", + " parameter_constraints_lists: list of constraints in the parameter space\n", + " iterations: number of iterations for the BO algorithm\n", + "\n", + " Outputs:\n", + " The best parameters and their objective function outputs are printed.\n", + " For single-objective experiments, the optimization trace is plotted. \n", + "\n", + " Source:\n", + " This function is inspired by the different options provided by Honegumi (https://honegumi.readthedocs.io/en/latest/)\n", + " \"\"\"\n", + "\n", + " all_parameters_list = continuous_parameters_list + categorical_parameters_list\n", + " objectives_dictionary={}\n", + " for obj_name in list_obj_names:\n", + " objectives_dictionary[obj_name]=ObjectiveProperties(minimize=True)\n", + " \n", + " ax_client = AxClient(verbose_logging=False)\n", + " ax_client.create_experiment(parameters= all_parameters_list, \n", + " parameter_constraints = parameter_constraints_lists,\n", + " objectives = objectives_dictionary \n", + " )\n", + " \n", + " for _ in range(iterations):\n", + " parameterization, trial_index = ax_client.get_next_trial()\n", + " \n", + " # Extract parameters and collect in dictionary\n", + " dict_extract_parameters={}\n", + " for parameter_info in all_parameters_list:\n", + " parameter_name = parameter_info[\"name\"]\n", + " dict_extract_parameters[parameter_name] = parameterization[parameter_name]\n", + " \n", + " # Calculate the results by plugging the parameters and objective names in the provided objective function\n", + " results = objective_function(*dict_extract_parameters.values(), *list_obj_names)\n", + " ax_client.complete_trial(trial_index=trial_index, raw_data=results)\n", + 
"\n", + " # Create dataframe with details of all experiment iterations\n", + " df_experiments = ax_client.generation_strategy.trials_as_df\n", + " number_of_experiments_to_show= min(iterations, 5)\n", + " print(f'The details of the last {number_of_experiments_to_show} experiments:')\n", + " display(df_experiments.tail())\n", + "\n", + " if len(list_obj_names) == 1:\n", + " # Single-objective optimization\n", + " # Get the AxClient's optimization trace \n", + " optimization_trace = ax_client.get_optimization_trace()\n", + " \n", + " # Convert the optimization trace to a Plotly figure and plot it\n", + " fig = to_plotly(optimization_trace)\n", + " fig.show(renderer='png')\n", + "\n", + " # Output the best parameters and their corresponding objective values\n", + " best_parameters, value = ax_client.get_best_parameters()\n", + " print('The best parameters were:')\n", + " display(best_parameters)\n", + " print('\\nThe objective value for the best parameters was:')\n", + " display(value[0])\n", + "\n", + " else:\n", + " # Multi-objective optimization\n", + " # Output the Pareto optimal parameters and their corresponding objective values\n", + " best_parameters = ax_client.get_pareto_optimal_parameters()\n", + " print('The Pareto optimal parameters were:')\n", + " display(list(best_parameters.values())[0][0])\n", + " print('\\nThe objective values for the Pareto optimal parameters were:')\n", + " display(list(best_parameters.values())[0][1][0])\n", + " \n", + " return None" + ] + }, + { + "cell_type": "markdown", + "id": "e2739dec-a5c4-4a32-bdbb-de0c014cf4dc", + "metadata": {}, + "source": [ + "### 1.3 Single-Objective with 4 Continuous Variables " + ] + }, + { + "cell_type": "markdown", + "id": "2f9df5b9-9b2a-4785-a347-061da3d110fd", + "metadata": {}, + "source": [ + "The first demonstration uses the general function [`optimize_experiment_ax`](#Part1.2) to optimize an experiment with **4 continuous variables** with typical ranges that are based on [Table 
S4](https://pubs.acs.org/doi/suppl/10.1021/acs.chemmater.9b03738/suppl_file/cm9b03738_si_001.pdf#page=10) in the Supporting Information of [reference 1](https://pubs.acs.org/doi/abs/10.1021/acs.chemmater.9b03738): \n", + "* the molar ratio of organic structure directing agents (OSDA) compared to Si \n", + "* the molar ratio of water compared to Si\n", + "* synthesis temperature (°C)\n", + "* synthesis time (h)\n", + "\n", + "The **single target variable** is synthesis yield. We assume that minimizing the above defined [dummy function](#Part1.1) `dummy_function_4_continuous_1_objective` corresponds to maximizing the yield of the zeolite synthesis. We also plot the **optimization trace** of the BO algorithm throughout the different experiment iterations.\n" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "c1825bf3-f5be-4504-834b-f18551cecd63", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The details of the last 5 experiments:\n" + ] + }, + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Generation StepGeneration ModelTrial IndexTrial StatusArm Parameterizations
25GenerationStep_1BoTorch25COMPLETED{'25_0': {'OSDA_molar_ratio': 0.38, 'H2O_molar_ratio': 13.61, 'Synthesis_temperature': 136.78, 'Synthesis_time': 28.85}}
26GenerationStep_1BoTorch26COMPLETED{'26_0': {'OSDA_molar_ratio': 0.38, 'H2O_molar_ratio': 20.35, 'Synthesis_temperature': 143.58, 'Synthesis_time': 2.0}}
27GenerationStep_1BoTorch27COMPLETED{'27_0': {'OSDA_molar_ratio': 0.36, 'H2O_molar_ratio': 11.54, 'Synthesis_temperature': 142.55, 'Synthesis_time': 37.52}}
28GenerationStep_1BoTorch28COMPLETED{'28_0': {'OSDA_molar_ratio': 0.38, 'H2O_molar_ratio': 5.0, 'Synthesis_temperature': 138.76, 'Synthesis_time': 2.0}}
29GenerationStep_1BoTorch29COMPLETED{'29_0': {'OSDA_molar_ratio': 0.35, 'H2O_molar_ratio': 12.39, 'Synthesis_temperature': 138.91, 'Synthesis_time': 25.45}}
\n", + "
" + ], + "text/plain": [ + " Generation Step Generation Model Trial Index Trial Status \\\n", + "25 GenerationStep_1 BoTorch 25 COMPLETED \n", + "26 GenerationStep_1 BoTorch 26 COMPLETED \n", + "27 GenerationStep_1 BoTorch 27 COMPLETED \n", + "28 GenerationStep_1 BoTorch 28 COMPLETED \n", + "29 GenerationStep_1 BoTorch 29 COMPLETED \n", + "\n", + " Arm Parameterizations \n", + "25 {'25_0': {'OSDA_molar_ratio': 0.38, 'H2O_molar_ratio': 13.61, 'Synthesis_temperature': 136.78, 'Synthesis_time': 28.85}} \n", + "26 {'26_0': {'OSDA_molar_ratio': 0.38, 'H2O_molar_ratio': 20.35, 'Synthesis_temperature': 143.58, 'Synthesis_time': 2.0}} \n", + "27 {'27_0': {'OSDA_molar_ratio': 0.36, 'H2O_molar_ratio': 11.54, 'Synthesis_temperature': 142.55, 'Synthesis_time': 37.52}} \n", + "28 {'28_0': {'OSDA_molar_ratio': 0.38, 'H2O_molar_ratio': 5.0, 'Synthesis_temperature': 138.76, 'Synthesis_time': 2.0}} \n", + "29 {'29_0': {'OSDA_molar_ratio': 0.35, 'H2O_molar_ratio': 12.39, 'Synthesis_temperature': 138.91, 'Synthesis_time': 25.45}} " + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "" + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The best parameters were:\n" + ] + }, + { + "data": { + "text/plain": [ + "{'OSDA_molar_ratio': 0.34775812136334816,\n", + " 'H2O_molar_ratio': 12.389732172987166,\n", + " 'Synthesis_temperature': 138.9139401644853,\n", + " 'Synthesis_time': 25.450990377516668}" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "The objective value for the best parameters was:\n" + ] + }, + { + "data": { + "text/plain": [ + "{'Synthesis_yield': 0.8177388940177934}" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "optimize_experiment_ax(list_obj_names = ['Synthesis_yield'],\n", + " objective_function = 
dummy_function_4_continuous_1_objective,\n", + " continuous_parameters_list = [{\"name\": \"OSDA_molar_ratio\", \"type\": \"range\", \"bounds\": [0.1, 1.0]},\n", + " {\"name\": \"H2O_molar_ratio\", \"type\": \"range\", \"bounds\": [5.0, 100.0]},\n", + " {\"name\": \"Synthesis_temperature\", \"type\": \"range\", \"bounds\": [100.0, 200.0]},\n", + " {\"name\": \"Synthesis_time\", \"type\": \"range\", \"bounds\": [2.0, 432.0]},\n", + " ],\n", + " categorical_parameters_list = [],\n", + " parameter_constraints_lists = [],\n", + " iterations=30)" + ] + }, + { + "cell_type": "markdown", + "id": "c1e91c48-fc9c-40c6-9ef5-7a9251db33da", + "metadata": {}, + "source": [ + "### 1.4 Multi-Objective with 4 Continuous Variables " + ] + }, + { + "cell_type": "markdown", + "id": "91b6dbc9-cf6b-4090-99f2-a2a027c188af", + "metadata": {}, + "source": [ + "The second demonstration uses the general function [`optimize_experiment_ax`](#Part1.2) to optimize an experiment with **4 continuous variables** with typical ranges that are based on [Table S4](https://pubs.acs.org/doi/suppl/10.1021/acs.chemmater.9b03738/suppl_file/cm9b03738_si_001.pdf#page=10) in the Supporting Information of [reference 1](https://pubs.acs.org/doi/abs/10.1021/acs.chemmater.9b03738): \n", + "* the molar ratio of organic structure directing agents (OSDA) compared to Si \n", + "* the molar ratio of water compared to Si\n", + "* synthesis temperature (°C)\n", + "* synthesis time (h)\n", + "\n", + "The **2 target variables** are synthesis yield and DCC (divalent cation capacity). We assume that minimizing the above defined [dummy function](#Part1.1) `dummy_function_4_continuous_2_objective` corresponds to maximizing the yield and DCC of the zeolite synthesis. Refer to https://ax.dev/tutorials/multiobjective_optimization.html for more background information." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "498f8715-7d4c-47d6-98d6-2ac1f8dcba15", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The details of the last 5 experiments:\n" + ] + }, + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Generation StepGeneration ModelTrial IndexTrial StatusArm Parameterizations
25GenerationStep_1BoTorch25COMPLETED{'25_0': {'OSDA_molar_ratio': 0.35, 'H2O_molar_ratio': 12.76, 'Synthesis_temperature': 140.14, 'Synthesis_time': 23.7}}
26GenerationStep_1BoTorch26COMPLETED{'26_0': {'OSDA_molar_ratio': 0.38, 'H2O_molar_ratio': 11.41, 'Synthesis_temperature': 140.21, 'Synthesis_time': 23.86}}
27GenerationStep_1BoTorch27COMPLETED{'27_0': {'OSDA_molar_ratio': 0.36, 'H2O_molar_ratio': 13.2, 'Synthesis_temperature': 140.56, 'Synthesis_time': 23.78}}
28GenerationStep_1BoTorch28COMPLETED{'28_0': {'OSDA_molar_ratio': 0.33, 'H2O_molar_ratio': 8.25, 'Synthesis_temperature': 143.34, 'Synthesis_time': 2.0}}
29GenerationStep_1BoTorch29COMPLETED{'29_0': {'OSDA_molar_ratio': 0.35, 'H2O_molar_ratio': 12.67, 'Synthesis_temperature': 139.9, 'Synthesis_time': 30.48}}
\n", + "
" + ], + "text/plain": [ + " Generation Step Generation Model Trial Index Trial Status \\\n", + "25 GenerationStep_1 BoTorch 25 COMPLETED \n", + "26 GenerationStep_1 BoTorch 26 COMPLETED \n", + "27 GenerationStep_1 BoTorch 27 COMPLETED \n", + "28 GenerationStep_1 BoTorch 28 COMPLETED \n", + "29 GenerationStep_1 BoTorch 29 COMPLETED \n", + "\n", + " Arm Parameterizations \n", + "25 {'25_0': {'OSDA_molar_ratio': 0.35, 'H2O_molar_ratio': 12.76, 'Synthesis_temperature': 140.14, 'Synthesis_time': 23.7}} \n", + "26 {'26_0': {'OSDA_molar_ratio': 0.38, 'H2O_molar_ratio': 11.41, 'Synthesis_temperature': 140.21, 'Synthesis_time': 23.86}} \n", + "27 {'27_0': {'OSDA_molar_ratio': 0.36, 'H2O_molar_ratio': 13.2, 'Synthesis_temperature': 140.56, 'Synthesis_time': 23.78}} \n", + "28 {'28_0': {'OSDA_molar_ratio': 0.33, 'H2O_molar_ratio': 8.25, 'Synthesis_temperature': 143.34, 'Synthesis_time': 2.0}} \n", + "29 {'29_0': {'OSDA_molar_ratio': 0.35, 'H2O_molar_ratio': 12.67, 'Synthesis_temperature': 139.9, 'Synthesis_time': 30.48}} " + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The Pareto optimal parameters were:\n" + ] + }, + { + "data": { + "text/plain": [ + "{'OSDA_molar_ratio': 0.3514134608325845,\n", + " 'H2O_molar_ratio': 12.763524283729826,\n", + " 'Synthesis_temperature': 140.14219782729086,\n", + " 'Synthesis_time': 23.698891067110903}" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "The objective values for the Pareto optimal parameters were:\n" + ] + }, + { + "data": { + "text/plain": [ + "{'DCC': 0.24512712912701318, 'Synthesis_yield': 0.04231119590133403}" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "optimize_experiment_ax(list_obj_names = ['DCC', 'Synthesis_yield'],\n", + " objective_function = dummy_function_4_continuous_2_objective,\n", + " 
continuous_parameters_list = [{\"name\": \"OSDA_molar_ratio\", \"type\": \"range\", \"bounds\": [0.1, 1.0]},\n", + " {\"name\": \"H2O_molar_ratio\", \"type\": \"range\", \"bounds\": [5.0, 100.0]},\n", + " {\"name\": \"Synthesis_temperature\", \"type\": \"range\", \"bounds\": [100.0, 200.0]},\n", + " {\"name\": \"Synthesis_time\", \"type\": \"range\", \"bounds\": [2.0, 432.0]},\n", + " ],\n", + " categorical_parameters_list = [],\n", + " parameter_constraints_lists = [],\n", + " iterations=30)" + ] + }, + { + "cell_type": "markdown", + "id": "267ec0c3-0aec-4294-b3ad-9d3c5bfc099e", + "metadata": {}, + "source": [ + "### 1.5 Multi-Objective with 4 Continuous Variables and 2 Categorical Variables " + ] + }, + { + "cell_type": "markdown", + "id": "b11b8976-7a1c-4030-a735-727db98cf320", + "metadata": {}, + "source": [ + "The third demonstration uses the general function [`optimize_experiment_ax`](#Part1.2) to optimize an experiment with **4 continuous variables** with typical ranges that are based on [Table S4](https://pubs.acs.org/doi/suppl/10.1021/acs.chemmater.9b03738/suppl_file/cm9b03738_si_001.pdf#page=10) in the Supporting Information of [reference 1](https://pubs.acs.org/doi/abs/10.1021/acs.chemmater.9b03738): \n", + "* the molar ratio of organic structure directing agents (OSDA) compared to Si \n", + "* the molar ratio of water compared to Si\n", + "* synthesis temperature (°C)\n", + "* synthesis time (h)\n", + "\n", + "We also add **2 categorical variables** that are inspired by [Table S3](https://pubs.acs.org/doi/suppl/10.1021/jacs.1c07590/suppl_file/ja1c07590_si_001.pdf#page=9) in the Supporting Information of [reference 2](https://pubs.acs.org/doi/10.1021/jacs.1c07590): \n", + "* Stirring mode: stirring (600 rpm), tumbling or static. \n", + "* Silicon source: colloidal silica or fumed silica.\n", + "\n", + "The **2 target variables** are synthesis yield and DCC (divalent cation capacity). 
We assume that minimizing the above defined [dummy function](#Part1.1) `dummy_function_4_continuous_2_categorical_2_objective` corresponds to maximizing the yield and DCC of the zeolite synthesis. Refer to https://ax.dev/tutorials/multiobjective_optimization.html for more background information." + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "id": "88f3cbdb-d13b-4875-b86b-7efe5094f6e6", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The details of the last 5 experiments:\n" + ] + }, + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Generation StepGeneration ModelTrial IndexTrial StatusArm Parameterizations
25GenerationStep_1BoTorch25COMPLETED{'25_0': {'OSDA_molar_ratio': 0.35, 'H2O_molar_ratio': 12.04, 'Synthesis_temperature': 139.7, 'Synthesis_time': 27.79, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}}
26GenerationStep_1BoTorch26COMPLETED{'26_0': {'OSDA_molar_ratio': 0.34, 'H2O_molar_ratio': 11.67, 'Synthesis_temperature': 140.26, 'Synthesis_time': 25.62, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}}
27GenerationStep_1BoTorch27COMPLETED{'27_0': {'OSDA_molar_ratio': 0.35, 'H2O_molar_ratio': 12.09, 'Synthesis_temperature': 140.02, 'Synthesis_time': 29.19, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}}
28GenerationStep_1BoTorch28COMPLETED{'28_0': {'OSDA_molar_ratio': 0.34, 'H2O_molar_ratio': 12.8, 'Synthesis_temperature': 140.5, 'Synthesis_time': 26.23, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}}
29GenerationStep_1BoTorch29COMPLETED{'29_0': {'OSDA_molar_ratio': 0.34, 'H2O_molar_ratio': 12.48, 'Synthesis_temperature': 140.3, 'Synthesis_time': 27.02, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}}
\n", + "
" + ], + "text/plain": [ + " Generation Step Generation Model Trial Index Trial Status \\\n", + "25 GenerationStep_1 BoTorch 25 COMPLETED \n", + "26 GenerationStep_1 BoTorch 26 COMPLETED \n", + "27 GenerationStep_1 BoTorch 27 COMPLETED \n", + "28 GenerationStep_1 BoTorch 28 COMPLETED \n", + "29 GenerationStep_1 BoTorch 29 COMPLETED \n", + "\n", + " Arm Parameterizations \n", + "25 {'25_0': {'OSDA_molar_ratio': 0.35, 'H2O_molar_ratio': 12.04, 'Synthesis_temperature': 139.7, 'Synthesis_time': 27.79, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}} \n", + "26 {'26_0': {'OSDA_molar_ratio': 0.34, 'H2O_molar_ratio': 11.67, 'Synthesis_temperature': 140.26, 'Synthesis_time': 25.62, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}} \n", + "27 {'27_0': {'OSDA_molar_ratio': 0.35, 'H2O_molar_ratio': 12.09, 'Synthesis_temperature': 140.02, 'Synthesis_time': 29.19, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}} \n", + "28 {'28_0': {'OSDA_molar_ratio': 0.34, 'H2O_molar_ratio': 12.8, 'Synthesis_temperature': 140.5, 'Synthesis_time': 26.23, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}} \n", + "29 {'29_0': {'OSDA_molar_ratio': 0.34, 'H2O_molar_ratio': 12.48, 'Synthesis_temperature': 140.3, 'Synthesis_time': 27.02, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}} " + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The Pareto optimal parameters were:\n" + ] + }, + { + "data": { + "text/plain": [ + "{'OSDA_molar_ratio': 0.34576462735686786,\n", + " 'H2O_molar_ratio': 12.042266849002447,\n", + " 'Synthesis_temperature': 139.70090696302174,\n", + " 'Synthesis_time': 27.788607802183623,\n", + " 'Stirring': 'Static',\n", + " 'Silicon_source': 'Fumed'}" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "The objective values for the Pareto optimal parameters were:\n" + ] + }, + { + "data": { + "text/plain": [ + 
"{'DCC': 0.468011099197156, 'Synthesis_yield': 0.7500239907244577}" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "optimize_experiment_ax(list_obj_names = ['DCC', 'Synthesis_yield'],\n", + " objective_function = dummy_function_4_continuous_2_categorical_2_objective,\n", + " continuous_parameters_list = [{\"name\": \"OSDA_molar_ratio\", \"type\": \"range\", \"bounds\": [0.1, 1.0]},\n", + " {\"name\": \"H2O_molar_ratio\", \"type\": \"range\", \"bounds\": [5.0, 100.0]},\n", + " {\"name\": \"Synthesis_temperature\", \"type\": \"range\", \"bounds\": [100.0, 200.0]},\n", + " {\"name\": \"Synthesis_time\", \"type\": \"range\", \"bounds\": [2.0, 432.0]},\n", + " ],\n", + " categorical_parameters_list = [{\"name\": \"Stirring\", \"type\": \"choice\", \"is_ordered\": False,\"values\": [\"Stirring\", \"Tumbling\", \"Static\"]},\n", + " {\"name\": \"Silicon_source\", \"type\": \"choice\", \"is_ordered\": False,\"values\": [\"Colloidal\", \"Fumed\"]},\n", + " ],\n", + " parameter_constraints_lists = [],\n", + " iterations=30)" + ] + }, + { + "cell_type": "markdown", + "id": "32a88991-c821-41a3-b317-d4c2af0c817b", + "metadata": {}, + "source": [ + "### 1.6 Multi-Objective with 4 Continuous Variables, 2 Categorical Variables and Parameter Constraints " + ] + }, + { + "cell_type": "markdown", + "id": "5e679fc4-ed26-4d9a-99b7-3b22e56d8a4b", + "metadata": {}, + "source": [ + "The fourth demonstration uses the general function [`optimize_experiment_ax`](#Part1.2) to optimize an experiment with **4 continuous variables** with typical ranges that are based on [Table S4](https://pubs.acs.org/doi/suppl/10.1021/acs.chemmater.9b03738/suppl_file/cm9b03738_si_001.pdf#page=10) in the Supporting Information of [reference 1](https://pubs.acs.org/doi/abs/10.1021/acs.chemmater.9b03738): \n", + "* the molar ratio of organic structure directing agents (OSDA) compared to Si \n", + "* the molar ratio of water compared to Si\n", + "* synthesis temperature (°C)\n", 
+ "* synthesis time (h)\n", + "\n", + "We also add **2 categorical variables** that are inspired by [Table S3](https://pubs.acs.org/doi/suppl/10.1021/jacs.1c07590/suppl_file/ja1c07590_si_001.pdf#page=9) in the Supporting Information of [reference 2](https://pubs.acs.org/doi/10.1021/jacs.1c07590): \n", + "* Stirring mode: stirring (600 rpm), tumbling or static. \n", + "* Silicon source: colloidal silica or fumed silica.\n", + "\n", + "Lastly, we add **one parameter constraint**. In the context of zeolite synthesis, parameter constraints are uncommon (the parameter bounds are sufficient), so we invent a physically meaningless constraint for illustrative purposes. This constraint prevents the optimizer from reaching the global minimum, which lies at approximately H2O_molar_ratio = 12.5 and Synthesis_temperature = 140:\n", + "* (H2O_molar_ratio) + (Synthesis_temperature) <= 145\n", + "\n", + "The **2 target variables** are synthesis yield and DCC (divalent cation capacity). We assume that minimizing the above defined [dummy function](#Part1.1) `dummy_function_4_continuous_2_categorical_2_objective` corresponds to maximizing the yield and DCC of the zeolite synthesis. Refer to https://ax.dev/tutorials/multiobjective_optimization.html for more background information." + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "e5e76038-b015-4ae3-8e90-2ceebff5e44d", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The details of the last 5 experiments:\n" + ] + }, + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Generation StepGeneration ModelTrial IndexTrial StatusArm Parameterizations
25GenerationStep_1BoTorch25COMPLETED{'25_0': {'OSDA_molar_ratio': 0.35, 'H2O_molar_ratio': 8.65, 'Synthesis_temperature': 136.35, 'Synthesis_time': 22.99, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}}
26GenerationStep_1BoTorch26COMPLETED{'26_0': {'OSDA_molar_ratio': 0.34, 'H2O_molar_ratio': 8.55, 'Synthesis_temperature': 136.45, 'Synthesis_time': 23.4, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}}
27GenerationStep_1BoTorch27COMPLETED{'27_0': {'OSDA_molar_ratio': 0.34, 'H2O_molar_ratio': 8.08, 'Synthesis_temperature': 136.92, 'Synthesis_time': 20.49, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}}
28GenerationStep_1BoTorch28COMPLETED{'28_0': {'OSDA_molar_ratio': 0.34, 'H2O_molar_ratio': 8.05, 'Synthesis_temperature': 136.95, 'Synthesis_time': 18.65, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}}
29GenerationStep_1BoTorch29COMPLETED{'29_0': {'OSDA_molar_ratio': 0.34, 'H2O_molar_ratio': 8.49, 'Synthesis_temperature': 136.51, 'Synthesis_time': 23.21, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}}
\n", + "
" + ], + "text/plain": [ + " Generation Step Generation Model Trial Index Trial Status \\\n", + "25 GenerationStep_1 BoTorch 25 COMPLETED \n", + "26 GenerationStep_1 BoTorch 26 COMPLETED \n", + "27 GenerationStep_1 BoTorch 27 COMPLETED \n", + "28 GenerationStep_1 BoTorch 28 COMPLETED \n", + "29 GenerationStep_1 BoTorch 29 COMPLETED \n", + "\n", + " Arm Parameterizations \n", + "25 {'25_0': {'OSDA_molar_ratio': 0.35, 'H2O_molar_ratio': 8.65, 'Synthesis_temperature': 136.35, 'Synthesis_time': 22.99, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}} \n", + "26 {'26_0': {'OSDA_molar_ratio': 0.34, 'H2O_molar_ratio': 8.55, 'Synthesis_temperature': 136.45, 'Synthesis_time': 23.4, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}} \n", + "27 {'27_0': {'OSDA_molar_ratio': 0.34, 'H2O_molar_ratio': 8.08, 'Synthesis_temperature': 136.92, 'Synthesis_time': 20.49, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}} \n", + "28 {'28_0': {'OSDA_molar_ratio': 0.34, 'H2O_molar_ratio': 8.05, 'Synthesis_temperature': 136.95, 'Synthesis_time': 18.65, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}} \n", + "29 {'29_0': {'OSDA_molar_ratio': 0.34, 'H2O_molar_ratio': 8.49, 'Synthesis_temperature': 136.51, 'Synthesis_time': 23.21, 'Stirring': 'Static', 'Silicon_source': 'Fumed'}} " + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The Pareto optimal parameters were:\n" + ] + }, + { + "data": { + "text/plain": [ + "{'OSDA_molar_ratio': 0.34503914342964936,\n", + " 'H2O_molar_ratio': 8.64551286485448,\n", + " 'Synthesis_temperature': 136.35448713516206,\n", + " 'Synthesis_time': 22.991767675435288,\n", + " 'Stirring': 'Static',\n", + " 'Silicon_source': 'Fumed'}" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "The objective values for the Pareto optimal parameters were:\n" + ] + }, + { + "data": { + "text/plain": [ + "{'DCC': 
28.414187472214962, 'Synthesis_yield': 28.29822867583607}" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "optimize_experiment_ax(list_obj_names = ['DCC', 'Synthesis_yield'],\n", + " objective_function = dummy_function_4_continuous_2_categorical_2_objective,\n", + " continuous_parameters_list = [{\"name\": \"OSDA_molar_ratio\", \"type\": \"range\", \"bounds\": [0.1, 1.0]},\n", + " {\"name\": \"H2O_molar_ratio\", \"type\": \"range\", \"bounds\": [5.0, 100.0]},\n", + " {\"name\": \"Synthesis_temperature\", \"type\": \"range\", \"bounds\": [100.0, 200.0]},\n", + " {\"name\": \"Synthesis_time\", \"type\": \"range\", \"bounds\": [2.0, 432.0]},\n", + " ],\n", + " categorical_parameters_list = [{\"name\": \"Stirring\", \"type\": \"choice\", \"is_ordered\": False,\"values\": [\"Stirring\", \"Tumbling\", \"Static\"]},\n", + " {\"name\": \"Silicon_source\", \"type\": \"choice\", \"is_ordered\": False,\"values\": [\"Colloidal\", \"Fumed\"]},\n", + " ],\n", + " parameter_constraints_lists = [\"H2O_molar_ratio + Synthesis_temperature <= 145.0\"],\n", + " iterations=30)" + ] + }, + { + "cell_type": "markdown", + "id": "c396a207-acc7-4771-86aa-3c3510582185", + "metadata": {}, + "source": [ + "### 1.7 Code Example without Using the General `optimize_experiment_ax` Function of Part 1.2 " + ] + }, + { + "cell_type": "markdown", + "id": "71011e62-d53e-4568-8323-c8bcc2a1a0e4", + "metadata": {}, + "source": [ + "The fifth demonstration shows an experiment with **4 continuous variables** with typical ranges that are based on [Table S4](https://pubs.acs.org/doi/suppl/10.1021/acs.chemmater.9b03738/suppl_file/cm9b03738_si_001.pdf#page=10) in the Supporting Information of [reference 1](https://pubs.acs.org/doi/abs/10.1021/acs.chemmater.9b03738), but this time **without using the general function** [`optimize_experiment_ax`](#Part1.2). This is how one would probably use Ax when there is only one type of experiment. 
\n", + "\n", + "* the molar ratio of organic structure directing agents (OSDA) compared to Si \n", + "* the molar ratio of water compared to Si\n", + "* synthesis temperature (°C)\n", + "* synthesis time (h)\n", + "\n", + "The **single target variable** is synthesis yield. We assume that minimizing the above defined [dummy function](#Part1.1) `dummy_function_4_continuous_1_objective` corresponds to maximizing the yield of the zeolite synthesis. We also plot the **optimization trace** of the BO algorithm throughout the different experiment iterations." + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "d6d2d76c-e6ca-481c-bdc9-5c59221f7436", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The details of the last 5 experiment iterations:\n" + ] + }, + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Generation StepGeneration ModelTrial IndexTrial StatusArm Parameterizations
25GenerationStep_1BoTorch25COMPLETED{'25_0': {'OSDA_molar_ratio': 0.36, 'H2O_molar_ratio': 12.41, 'Synthesis_temperature': 140.96, 'Synthesis_time': 21.67}}
26GenerationStep_1BoTorch26COMPLETED{'26_0': {'OSDA_molar_ratio': 0.37, 'H2O_molar_ratio': 11.45, 'Synthesis_temperature': 141.27, 'Synthesis_time': 2.0}}
27GenerationStep_1BoTorch27COMPLETED{'27_0': {'OSDA_molar_ratio': 0.34, 'H2O_molar_ratio': 12.26, 'Synthesis_temperature': 139.76, 'Synthesis_time': 21.9}}
28GenerationStep_1BoTorch28COMPLETED{'28_0': {'OSDA_molar_ratio': 0.1, 'H2O_molar_ratio': 5.0, 'Synthesis_temperature': 200.0, 'Synthesis_time': 2.0}}
29GenerationStep_1BoTorch29COMPLETED{'29_0': {'OSDA_molar_ratio': 0.13, 'H2O_molar_ratio': 5.0, 'Synthesis_temperature': 132.33, 'Synthesis_time': 234.7}}
\n", + "
" + ], + "text/plain": [ + " Generation Step Generation Model Trial Index Trial Status \\\n", + "25 GenerationStep_1 BoTorch 25 COMPLETED \n", + "26 GenerationStep_1 BoTorch 26 COMPLETED \n", + "27 GenerationStep_1 BoTorch 27 COMPLETED \n", + "28 GenerationStep_1 BoTorch 28 COMPLETED \n", + "29 GenerationStep_1 BoTorch 29 COMPLETED \n", + "\n", + " Arm Parameterizations \n", + "25 {'25_0': {'OSDA_molar_ratio': 0.36, 'H2O_molar_ratio': 12.41, 'Synthesis_temperature': 140.96, 'Synthesis_time': 21.67}} \n", + "26 {'26_0': {'OSDA_molar_ratio': 0.37, 'H2O_molar_ratio': 11.45, 'Synthesis_temperature': 141.27, 'Synthesis_time': 2.0}} \n", + "27 {'27_0': {'OSDA_molar_ratio': 0.34, 'H2O_molar_ratio': 12.26, 'Synthesis_temperature': 139.76, 'Synthesis_time': 21.9}} \n", + "28 {'28_0': {'OSDA_molar_ratio': 0.1, 'H2O_molar_ratio': 5.0, 'Synthesis_temperature': 200.0, 'Synthesis_time': 2.0}} \n", + "29 {'29_0': {'OSDA_molar_ratio': 0.13, 'H2O_molar_ratio': 5.0, 'Synthesis_temperature': 132.33, 'Synthesis_time': 234.7}} " + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "" + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The best parameters were:\n" + ] + }, + { + "data": { + "text/plain": [ + "{'OSDA_molar_ratio': 0.34406537118593616,\n", + " 'H2O_molar_ratio': 12.255890900708632,\n", + " 'Synthesis_temperature': 139.7614030816516,\n", + " 'Synthesis_time': 21.90491099424178}" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "The objective value for the best parameters was:\n" + ] + }, + { + "data": { + "text/plain": [ + "{'Synthesis_yield': 0.4317714423295911}" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "obj_name1 = \"Synthesis_yield\"\n", + " \n", + "ax_client = AxClient(verbose_logging=False)\n", + 
"ax_client.create_experiment(parameters=[{\"name\": \"OSDA_molar_ratio\", \"type\": \"range\", \"bounds\": [0.1, 1.0]},\n", + " {\"name\": \"H2O_molar_ratio\", \"type\": \"range\", \"bounds\": [5.0, 100.0]},\n", + " {\"name\": \"Synthesis_temperature\", \"type\": \"range\", \"bounds\": [100.0, 200.0]},\n", + " {\"name\": \"Synthesis_time\", \"type\": \"range\", \"bounds\": [2.0, 432.0]},\n", + " ],\n", + " objectives={obj_name1: ObjectiveProperties(minimize=True),},\n", + " )\n", + "\n", + "for _ in range(30):\n", + " parameterization, trial_index = ax_client.get_next_trial()\n", + "\n", + " # Extract parameters\n", + " x1 = parameterization[\"OSDA_molar_ratio\"]\n", + " x2 = parameterization[\"H2O_molar_ratio\"]\n", + " x3 = parameterization[\"Synthesis_temperature\"]\n", + " x4 = parameterization[\"Synthesis_time\"]\n", + " \n", + " results = dummy_function_4_continuous_1_objective(x1, x2, x3, x4, obj_name1=obj_name1)\n", + " ax_client.complete_trial(trial_index=trial_index, raw_data=results)\n", + "\n", + "best_parameters, value = ax_client.get_best_parameters()\n", + "\n", + "# Create dataframe with details of all experiment iterations\n", + "df_experiments = ax_client.generation_strategy.trials_as_df\n", + "print('The details of the last 5 experiment iterations:')\n", + "display(df_experiments.tail())\n", + "\n", + "# Get the AxClient's optimization trace using the built-in plotting method\n", + "optimization_trace = ax_client.get_optimization_trace()\n", + "\n", + "# Convert the optimization trace to a Plotly figure and plot it\n", + "fig = to_plotly(optimization_trace)\n", + "fig.show(renderer='png')\n", + "\n", + "# Output the best parameters and their corresponding objective values\n", + "print('The best parameters were:')\n", + "display(best_parameters)\n", + "print('\\nThe objective value for the best parameters was:')\n", + "display(value[0])" + ] + }, + { + "cell_type": "markdown", + "id": "e3e390de-f733-4f34-bfdb-2d094e7cbcfb", + "metadata": {}, + 
"source": [ + "## Part 2: Propose a New Experiment Based on a Batch of Prior (Literature) Experiments " + ] + }, + { + "cell_type": "markdown", + "id": "883f3525-fa4a-47b4-b4bb-ce858debf643", + "metadata": {}, + "source": [ + "Here Bayesian optimization is applied within a **real-world context** where the underlying target function remains unknown. We start from a batch of experiments collected from the literature, and we allow the Bayesian optimizer to **suggest the next experiment**. This process aims to explore the search space further and/or leverage past results. In practice, one would carry out the suggested experiment, incorporate its outcome into the existing results, and subsequently rerun the Bayesian optimization algorithm." + ] + }, + { + "cell_type": "markdown", + "id": "d33d5ee3-637c-4cd7-9af5-36ecb0e7e607", + "metadata": {}, + "source": [ + "### 2.1 Define a Function that Proposes the Next Best Experiment with Ax Package " + ] + }, + { + "cell_type": "markdown", + "id": "d36c6596-8c8a-4476-98d7-cf0d0cc4004c", + "metadata": {}, + "source": [ + "Here we will create a **general function** `propose_experiment_ax` to propose the next best experiment with the Ax package. This general function lets us focus on the output of the experiments later on, without repeatedly modifying similar sections of code. \n", + "\n", + "The `propose_experiment_ax` function takes a list of **continuous parameters**, a list of **categorical parameters**, a list of parameter **constraints**, a dataframe with **previous continuous experimental inputs**, a dataframe with **previous categorical experimental inputs** and a dictionary with **previous experimental outcomes (single or multi-objective)**. \n", + "\n", + "This function is inspired by the following GitHub issue: https://github.com/Facebook/ax/issues/743." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 9, + "id": "1c2547c1-beb5-4e29-baa6-c41eff675ece", + "metadata": {}, + "outputs": [], + "source": [ + "def propose_experiment_ax(continuous_parameters_list, categorical_parameters_list, parameter_constraints_lists,\n", + " df_prior_experiments_input_continuous, df_prior_experiments_input_categorical, \n", + " dictionary_prior_experiments_output):\n", + " \"\"\"\n", + " Proposes the next best experiment with the Ax package. \n", + " Inputs: \n", + " continuous_parameters_list: list of continuous parameters for the objective function\n", + " categorical_parameters_list: list of categorical parameters for the objective function\n", + " parameter_constraints_lists: list of constraints in the parameter space\n", + " df_prior_experiments_input_continuous: dataframe with the previous experimental inputs of the continuous parameters\n", + " df_prior_experiments_input_categorical: dataframe with the previous experimental inputs of the categorical parameters\n", + " dictionary_prior_experiments_output: a dictionary {objective_name : objective_result} in which objective_name is a string naming the objective,\n", + " and objective_result is a pandas Series with the previous experimental outcomes \n", + " Outputs:\n", + " A suggestion for the best subsequent experiment to try out.\n", + " For single-objective experiments, the best previous parameters and their objective function output are printed.\n", + "\n", + " Source:\n", + " This function is inspired by the following GitHub issue: https://github.com/Facebook/ax/issues/743 \n", + " \"\"\"\n", + " all_parameters_list = continuous_parameters_list + categorical_parameters_list\n", + " \n", + " df_prior_experiments_input_all = pd.concat([df_prior_experiments_input_continuous, df_prior_experiments_input_categorical], axis=1)\n", + " df_prior_experiments_output_all = pd.concat(dictionary_prior_experiments_output.values(), axis=1)\n", + " 
df_prior_experiments_input_output_all = pd.concat([df_prior_experiments_input_all, df_prior_experiments_output_all], axis=1)\n", + " print('The considered dataset with previous experimental inputs and outputs:')\n", + " display(df_prior_experiments_input_output_all)\n", + "\n", + " objectives_dictionary={}\n", + " for obj_name in dictionary_prior_experiments_output.keys():\n", + " objectives_dictionary[obj_name]=ObjectiveProperties(minimize=False)\n", + " \n", + " # Skip the pseudo-random suggested points by specifying a custom generation strategy\n", + " # See: https://ax.dev/tutorials/generation_strategy.html and\n", + " # https://ax.dev/docs/bayesopt.html#tradeoff-between-parallelism-and-total-number-of-trials\n", + " gs = GenerationStrategy(steps=[GenerationStep(model=Models.GPEI, num_trials=-1, max_parallelism=3)])\n", + "\n", + " # Setup the experiment\n", + " ax_client = AxClient(generation_strategy=gs, verbose_logging=False)\n", + " ax_client.create_experiment(parameters=all_parameters_list, \n", + " parameter_constraints=parameter_constraints_lists, \n", + " objectives=objectives_dictionary)\n", + "\n", + " # Attach the training data\n", + " for i in range(df_prior_experiments_input_all.shape[0]):\n", + " ax_client.attach_trial(df_prior_experiments_input_all.iloc[i, :].to_dict())\n", + "\n", + " result_dictionary={}\n", + " for obj_name in dictionary_prior_experiments_output.keys():\n", + " # We assume standard error is 0.0\n", + " result_dictionary[obj_name] = (dictionary_prior_experiments_output[obj_name][i], 0.0)\n", + " ax_client.complete_trial(trial_index=i, raw_data=result_dictionary)\n", + " \n", + " # Produce a single next suggested experiment\n", + " next_experiment, trial_index = ax_client.get_next_trial()\n", + " print(\"\\nNext suggested experiment:\" )\n", + " display(next_experiment)\n", + "\n", + " if len(dictionary_prior_experiments_output.keys()) == 1 :\n", + " # Single-objective experiment\n", + " # Output the best parameters and their 
corresponding objective values\n", + " best_parameters, value = ax_client.get_best_parameters()\n", + " print('\\nThe best parameters were:')\n", + " display(best_parameters)\n", + " print('\\nThe objective value for the best parameters was:')\n", + " display(value[0])\n", + " \n", + " return None" + ] + }, + { + "cell_type": "markdown", + "id": "dab418c7-4257-45e1-a4f9-a2aabb9ef5e3", + "metadata": {}, + "source": [ + "### 2.2 Collect the Literature Input and Output Data " + ] + }, + { + "cell_type": "markdown", + "id": "c0292d5b-6fe0-4e08-a9aa-d138f0661555", + "metadata": {}, + "source": [ + "The objective of the considered study was to find a one-pot synthesis of Fe-CHA zeolites that maximizes the methanol yield when the synthesized material is activated and reacted with methane. 'One-pot' means that Fe is already added in the zeolite synthesis, instead of being post-synthetically ion-exchanged on the zeolite.\n", + "\n", + "The input literature data are based on [Table S3](https://pubs.acs.org/doi/suppl/10.1021/jacs.1c07590/suppl_file/ja1c07590_si_001.pdf#page=9) in the Supporting Information of [reference 2](https://pubs.acs.org/doi/10.1021/jacs.1c07590). 
A reasonable value was chosen for missing data.\n", + "\n", + "The **continuous** variables are:\n", + "* the molar ratio of organic structure directing agents, OSDA, compared to Si \n", + "* the molar ratio of water compared to Si\n", + "* the molar ratio of Fe compared to Si\n", + "\n", + "The **categorical** variables are:\n", + "* Fe source: iron(III) acetate (A) or iron(III) nitrate (N).\n", + "* Stirring mode: stirring (600 rpm) or static.\n", + "\n", + "The **2 target variables** are based on respectively [Table S3](https://pubs.acs.org/doi/suppl/10.1021/jacs.1c07590/suppl_file/ja1c07590_si_001.pdf#page=9) and [Table S4](https://pubs.acs.org/doi/suppl/10.1021/jacs.1c07590/suppl_file/ja1c07590_si_001.pdf#page=10) in the Supporting Information of [reference 2](https://pubs.acs.org/doi/10.1021/jacs.1c07590):\n", + "* Zeolite synthesis yield \n", + "* Methanol yield (MeOH/Al)\n" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "id": "46777f23-c717-46c2-830b-e929618976c3", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "Literature input data with the experimental Synthesis_yield and Methanol_yield outcome. This will be fed as prior information to BO:\n" + ] + }, + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
OSDA_molar_ratioH2O_molar_ratioFe_molar_ratioFe_SaltStirringSynthesis_yieldMethanol_yield
00.3615.40.019AStatic0.830.089
10.3314.10.016AStatic0.850.085
20.3615.50.018NStatic0.960.084
30.3615.50.017NStatic0.840.108
40.3615.50.035AStatic0.930.116
50.3615.50.037NStirring1.000.063
60.3414.40.039NStirring0.910.108
70.3615.50.055AStatic0.000.053
80.3615.60.055NStatic0.000.013
90.3615.50.090AStatic0.000.020
100.3314.10.016AStirring0.910.062
\n", + "
" + ], + "text/plain": [ + " OSDA_molar_ratio H2O_molar_ratio Fe_molar_ratio Fe_Salt Stirring \\\n", + "0 0.36 15.4 0.019 A Static \n", + "1 0.33 14.1 0.016 A Static \n", + "2 0.36 15.5 0.018 N Static \n", + "3 0.36 15.5 0.017 N Static \n", + "4 0.36 15.5 0.035 A Static \n", + "5 0.36 15.5 0.037 N Stirring \n", + "6 0.34 14.4 0.039 N Stirring \n", + "7 0.36 15.5 0.055 A Static \n", + "8 0.36 15.6 0.055 N Static \n", + "9 0.36 15.5 0.090 A Static \n", + "10 0.33 14.1 0.016 A Stirring \n", + "\n", + " Synthesis_yield Methanol_yield \n", + "0 0.83 0.089 \n", + "1 0.85 0.085 \n", + "2 0.96 0.084 \n", + "3 0.84 0.108 \n", + "4 0.93 0.116 \n", + "5 1.00 0.063 \n", + "6 0.91 0.108 \n", + "7 0.00 0.053 \n", + "8 0.00 0.013 \n", + "9 0.00 0.020 \n", + "10 0.91 0.062 " + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/plain": [ + "OSDA_molar_ratio float64\n", + "H2O_molar_ratio float64\n", + "Fe_molar_ratio float64\n", + "Fe_Salt object\n", + "Stirring object\n", + "Synthesis_yield float64\n", + "Methanol_yield float64\n", + "dtype: object" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "parameter_names = [\"OSDA_molar_ratio\", \"H2O_molar_ratio\", \"Fe_molar_ratio\", \"Fe_Salt\", \"Stirring\"]\n", + "\n", + "X_train = np.array([[0.36, 15.4, 0.019, 'A', 'Static'],\n", + " [0.33, 14.1, 0.016, 'A', 'Static'],\n", + " [0.36, 15.5, 0.018, 'N', 'Static'],\n", + " [0.36, 15.5, 0.017, 'N', 'Static'],\n", + " [0.36, 15.5, 0.035, 'A', 'Static'],\n", + " [0.36, 15.5, 0.037, 'N', 'Stirring'],\n", + " [0.34, 14.4, 0.039, 'N', 'Stirring'],\n", + " [0.36, 15.5, 0.055, 'A', 'Static'],\n", + " [0.36, 15.6, 0.055, 'N', 'Static'],\n", + " [0.36, 15.5, 0.090, 'A', 'Static'],\n", + " [0.33, 14.1, 0.016, 'A', 'Stirring'],\n", + " ])\n", + "\n", + "X_train = pd.DataFrame(X_train, columns=parameter_names)\n", + "dict_types = {'OSDA_molar_ratio': 'float64', 'H2O_molar_ratio': 'float64', 'Fe_molar_ratio': 'float64', \n", + " 
'Fe_Salt': 'object', 'Stirring': 'object' }\n", + "X_train = X_train.astype(dict_types)\n", + "\n", + "y_train_yield = np.array([0.83, 0.85, 0.96, 0.84, 0.93, 1.0, 0.91, 0.0, 0.0, 0.0, 0.91])\n", + "y_train_methanol = np.array([0.089, 0.085, 0.084, 0.108, 0.116, 0.063, 0.108, 0.053, 0.013, 0.020, 0.062])\n", + "\n", + "print('\\nLiterature input data with the experimental Synthesis_yield and Methanol_yield outcome. This will be fed as prior information to BO:')\n", + "X_total = X_train.copy()\n", + "X_total['Synthesis_yield'] = y_train_yield.tolist()\n", + "X_total['Methanol_yield'] = y_train_methanol.tolist()\n", + "display(X_total)\n", + "display(X_total.dtypes)\n" + ] + }, + { + "cell_type": "markdown", + "id": "e69374e8-c314-4614-974b-eb9726fa4978", + "metadata": {}, + "source": [ + "### 2.3 Single-Objective (Synthesis Yield) with 3 Continuous Variables and 2 Categorical Variables " + ] + }, + { + "cell_type": "markdown", + "id": "105100e5-d6ba-4081-9538-16a84692ada9", + "metadata": {}, + "source": [ + "In this scenario, we are interested in **maximizing the zeolite synthesis yield** (single-objective). We run [`propose_experiment_ax`](#Part2.1) to generate the next best experiment to try out in the laboratory. " + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "0a3c541d-7756-48bd-9bdf-90d9cec023ff", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The considered dataset with previous experimental inputs and outputs:\n" + ] + }, + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
OSDA_molar_ratioH2O_molar_ratioFe_molar_ratioFe_SaltStirringSynthesis_yield
00.3615.40.019AStatic0.83
10.3314.10.016AStatic0.85
20.3615.50.018NStatic0.96
30.3615.50.017NStatic0.84
40.3615.50.035AStatic0.93
50.3615.50.037NStirring1.00
60.3414.40.039NStirring0.91
70.3615.50.055AStatic0.00
80.3615.60.055NStatic0.00
90.3615.50.090AStatic0.00
100.3314.10.016AStirring0.91
\n", + "
" + ], + "text/plain": [ + " OSDA_molar_ratio H2O_molar_ratio Fe_molar_ratio Fe_Salt Stirring \\\n", + "0 0.36 15.4 0.019 A Static \n", + "1 0.33 14.1 0.016 A Static \n", + "2 0.36 15.5 0.018 N Static \n", + "3 0.36 15.5 0.017 N Static \n", + "4 0.36 15.5 0.035 A Static \n", + "5 0.36 15.5 0.037 N Stirring \n", + "6 0.34 14.4 0.039 N Stirring \n", + "7 0.36 15.5 0.055 A Static \n", + "8 0.36 15.6 0.055 N Static \n", + "9 0.36 15.5 0.090 A Static \n", + "10 0.33 14.1 0.016 A Stirring \n", + "\n", + " Synthesis_yield \n", + "0 0.83 \n", + "1 0.85 \n", + "2 0.96 \n", + "3 0.84 \n", + "4 0.93 \n", + "5 1.00 \n", + "6 0.91 \n", + "7 0.00 \n", + "8 0.00 \n", + "9 0.00 \n", + "10 0.91 " + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "Next suggested experiment:\n" + ] + }, + { + "data": { + "text/plain": [ + "{'OSDA_molar_ratio': 0.3597986726498765,\n", + " 'H2O_molar_ratio': 15.488919708603255,\n", + " 'Fe_molar_ratio': 0.023291856734901355,\n", + " 'Fe_Salt': 'N',\n", + " 'Stirring': 'Static'}" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "The best parameters were:\n" + ] + }, + { + "data": { + "text/plain": [ + "{'OSDA_molar_ratio': 0.36,\n", + " 'H2O_molar_ratio': 15.5,\n", + " 'Fe_molar_ratio': 0.037,\n", + " 'Fe_Salt': 'N',\n", + " 'Stirring': 'Stirring'}" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "The objective value for the best parameters was:\n" + ] + }, + { + "data": { + "text/plain": [ + "{'Synthesis_yield': 1.0}" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "propose_experiment_ax(continuous_parameters_list = [{\"name\": \"OSDA_molar_ratio\", \"type\": \"range\", \"bounds\": [0.30, 0.40]},\n", + " {\"name\": \"H2O_molar_ratio\", \"type\": \"range\", 
\"bounds\": [14.0, 16.0]},\n", + " {\"name\": \"Fe_molar_ratio\", \"type\": \"range\", \"bounds\": [0.01, 0.10]},\n", + " ],\n", + " categorical_parameters_list = [{\"name\": \"Fe_Salt\", \"type\": \"choice\", \"is_ordered\": False,\"values\": [\"A\", \"N\"]},\n", + " {\"name\": \"Stirring\", \"type\": \"choice\", \"is_ordered\": False, \"values\": [\"Stirring\", \"Static\"]},\n", + " ], \n", + " parameter_constraints_lists = [],\n", + " df_prior_experiments_input_continuous = X_total[[\"OSDA_molar_ratio\", \"H2O_molar_ratio\", \"Fe_molar_ratio\"]],\n", + " df_prior_experiments_input_categorical = X_total[[\"Fe_Salt\", \"Stirring\"]],\n", + " dictionary_prior_experiments_output = {\"Synthesis_yield\" : X_total.loc[:,\"Synthesis_yield\"]} \n", + " )\n", + " " + ] + }, + { + "cell_type": "markdown", + "id": "374d8a9e-df50-4855-b771-ab061603b4cc", + "metadata": {}, + "source": [ + "### 2.4 Multi-Objective (Synthesis Yield + Methanol Production) with 3 Continuous Variables and 2 Categorical Variables " + ] + }, + { + "cell_type": "markdown", + "id": "40fcd82c-648b-4204-8b49-29fdff9960fa", + "metadata": {}, + "source": [ + "In this scenario, we are interested in **maximizing both the zeolite synthesis yield and the methanol production** (multi-objective). We run [`propose_experiment_ax`](#Part2.1) to generate the next best experiment to try out in the laboratory. " + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "23cf5c47-f360-4fc1-9a2a-4586732e2f2b", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The considered dataset with previous experimental inputs and outputs:\n" + ] + }, + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
OSDA_molar_ratioH2O_molar_ratioFe_molar_ratioFe_SaltStirringSynthesis_yieldMethanol_yield
00.3615.40.019AStatic0.830.089
10.3314.10.016AStatic0.850.085
20.3615.50.018NStatic0.960.084
30.3615.50.017NStatic0.840.108
40.3615.50.035AStatic0.930.116
50.3615.50.037NStirring1.000.063
60.3414.40.039NStirring0.910.108
70.3615.50.055AStatic0.000.053
80.3615.60.055NStatic0.000.013
90.3615.50.090AStatic0.000.020
100.3314.10.016AStirring0.910.062
\n", + "
" + ], + "text/plain": [ + " OSDA_molar_ratio H2O_molar_ratio Fe_molar_ratio Fe_Salt Stirring \\\n", + "0 0.36 15.4 0.019 A Static \n", + "1 0.33 14.1 0.016 A Static \n", + "2 0.36 15.5 0.018 N Static \n", + "3 0.36 15.5 0.017 N Static \n", + "4 0.36 15.5 0.035 A Static \n", + "5 0.36 15.5 0.037 N Stirring \n", + "6 0.34 14.4 0.039 N Stirring \n", + "7 0.36 15.5 0.055 A Static \n", + "8 0.36 15.6 0.055 N Static \n", + "9 0.36 15.5 0.090 A Static \n", + "10 0.33 14.1 0.016 A Stirring \n", + "\n", + " Synthesis_yield Methanol_yield \n", + "0 0.83 0.089 \n", + "1 0.85 0.085 \n", + "2 0.96 0.084 \n", + "3 0.84 0.108 \n", + "4 0.93 0.116 \n", + "5 1.00 0.063 \n", + "6 0.91 0.108 \n", + "7 0.00 0.053 \n", + "8 0.00 0.013 \n", + "9 0.00 0.020 \n", + "10 0.91 0.062 " + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "Next suggested experiment:\n" + ] + }, + { + "data": { + "text/plain": [ + "{'OSDA_molar_ratio': 0.3526783041131582,\n", + " 'H2O_molar_ratio': 15.331573897619075,\n", + " 'Fe_molar_ratio': 0.033573534446308506,\n", + " 'Fe_Salt': 'A',\n", + " 'Stirring': 'Static'}" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "propose_experiment_ax(continuous_parameters_list = [{\"name\": \"OSDA_molar_ratio\", \"type\": \"range\", \"bounds\": [0.30, 0.40]},\n", + " {\"name\": \"H2O_molar_ratio\", \"type\": \"range\", \"bounds\": [14.0, 16.0]},\n", + " {\"name\": \"Fe_molar_ratio\", \"type\": \"range\", \"bounds\": [0.01, 0.10]},\n", + " ],\n", + " categorical_parameters_list = [{\"name\": \"Fe_Salt\", \"type\": \"choice\", \"is_ordered\": False,\"values\": [\"A\", \"N\"]},\n", + " {\"name\": \"Stirring\", \"type\": \"choice\", \"is_ordered\": False, \"values\": [\"Stirring\", \"Static\"]},\n", + " ], \n", + " parameter_constraints_lists = [],\n", + " df_prior_experiments_input_continuous = X_total[[\"OSDA_molar_ratio\", \"H2O_molar_ratio\", 
\"Fe_molar_ratio\"]],\n", + " df_prior_experiments_input_categorical = X_total[[\"Fe_Salt\", \"Stirring\"]],\n", + " dictionary_prior_experiments_output = {\"Synthesis_yield\" : X_total.loc[:,\"Synthesis_yield\"], \n", + " \"Methanol_yield\" : X_total.loc[:,\"Methanol_yield\"],\n", + " } \n", + " ) " + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python [conda env:jupyter_vscode]", + "language": "python", + "name": "conda-env-jupyter_vscode-py" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.12.1" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/hello.py b/hello.py deleted file mode 100644 index a025bbf..0000000 --- a/hello.py +++ /dev/null @@ -1,2 +0,0 @@ -def hello_world(): - return "Hello!" diff --git a/hello_test.py b/hello_test.py deleted file mode 100644 index 708a061..0000000 --- a/hello_test.py +++ /dev/null @@ -1,5 +0,0 @@ -import hello - - -def test_hello(): - assert hello.hello_world() == "Hello World!" 
diff --git a/images/BO_Zeolite.png b/images/BO_Zeolite.png new file mode 100644 index 0000000..511ede8 Binary files /dev/null and b/images/BO_Zeolite.png differ diff --git a/images/Poster_BO_Zeolite.png b/images/Poster_BO_Zeolite.png new file mode 100644 index 0000000..518a580 Binary files /dev/null and b/images/Poster_BO_Zeolite.png differ diff --git a/images/Zeolite_rings.png b/images/Zeolite_rings.png new file mode 100644 index 0000000..4b479d7 Binary files /dev/null and b/images/Zeolite_rings.png differ diff --git a/images/Zeolite_synthesis_equipment.png b/images/Zeolite_synthesis_equipment.png new file mode 100644 index 0000000..1226c6c Binary files /dev/null and b/images/Zeolite_synthesis_equipment.png differ diff --git a/images/Zeolite_topologies.png b/images/Zeolite_topologies.png new file mode 100644 index 0000000..d8143a5 Binary files /dev/null and b/images/Zeolite_topologies.png differ diff --git a/pyproject.toml b/pyproject.toml deleted file mode 100644 index c953815..0000000 --- a/pyproject.toml +++ /dev/null @@ -1,2 +0,0 @@ -[build-system] -requires = ["setuptools", "wheel"] \ No newline at end of file diff --git a/requirements.txt b/requirements.txt index 097a011..6843d9e 100644 --- a/requirements.txt +++ b/requirements.txt @@ -1,9 +1,11 @@ --e . 
# package from this repo -# numpy -# scipy -# pandas -# matplotlib -# matplotlib-inline -# ipython -# ipykernel -pytest +numpy +pandas +plotly +ax +ipython +collections + +# optional +logging +sys +warnings diff --git a/setup.cfg b/setup.cfg deleted file mode 100644 index cc93fb7..0000000 --- a/setup.cfg +++ /dev/null @@ -1,11 +0,0 @@ -[metadata] -name = helper_functions -version = 0.1 - -[options] -packages = find: -package_dir = - =src - -[options.packages.find] -where=src \ No newline at end of file diff --git a/src/mock1/__init__.py b/src/mock1/__init__.py deleted file mode 100644 index d98cc4b..0000000 --- a/src/mock1/__init__.py +++ /dev/null @@ -1,2 +0,0 @@ -"""Mock function that gets installed by requirements.txt""" -from mock1._mock1 import Mock1 diff --git a/src/mock1/_mock1.py b/src/mock1/_mock1.py deleted file mode 100644 index 43f32d9..0000000 --- a/src/mock1/_mock1.py +++ /dev/null @@ -1,6 +0,0 @@ -class Mock1: - def __init__(self): - pass - - def mock(self): - print("this is a mock function") diff --git a/src/mock2/__init__.py b/src/mock2/__init__.py deleted file mode 100644 index 9d29bf3..0000000 --- a/src/mock2/__init__.py +++ /dev/null @@ -1,2 +0,0 @@ -"""Mock function that gets installed by requirements.txt""" -from mock2._mock2 import Mock2 diff --git a/src/mock2/_mock2.py b/src/mock2/_mock2.py deleted file mode 100644 index f5b7725..0000000 --- a/src/mock2/_mock2.py +++ /dev/null @@ -1,6 +0,0 @@ -class Mock2: - def __init__(self): - pass - - def mock(self): - print("this is a mock function") diff --git a/zeolite_synthesis_bo_introduction.md b/zeolite_synthesis_bo_introduction.md new file mode 100644 index 0000000..7f24929 --- /dev/null +++ b/zeolite_synthesis_bo_introduction.md @@ -0,0 +1,238 @@ +# Navigating black box zeolite synthesis with Bayesian optimization + +Author: Plessers Dieter +March 28th, 2024 +*Department of Microbial and Molecular Systems, Center for Sustainable Catalysis and Engineering, KU Leuven-University of Leuven, 
Belgium.* + +## 0. Scope + +This introductory document proposes the integration of active learning techniques such as Bayesian optimization into zeolite synthesis research. We first provide an overview of zeolites and their importance. Subsequently, we explore the standard components of zeolite synthesis experiments, including reagents, equipment, and conditions. We then delve into the potential of Bayesian optimization to accelerate zeolite synthesis experiments and reduce associated costs. The optimization problem addressed by Bayesian optimization is outlined, detailing a typical parameter space with tunable variables and constraints, along with possible objectives derived from a target application. Additionally, we briefly highlight a few zeolite synthesis datasets that have recently been compiled from literature. The final discussion section further elaborates on various facets of the Bayesian optimization process and introduces a specific coding example with real-world data, provided in the [accompanying Jupyter notebook](./demo_zeolite_synthesis_bo.ipynb). + +While numerous references are provided for further exploration, this document is self-contained and aims to be easily understood. We hope it inspires the reader to consider active learning approaches in their zeolite synthesis endeavors. + +## 1. Zeolites – Microporous Materials + +Zeolites are porous, crystalline aluminosilicates built from linked \[SiO4\] and \[AlO4\]\- tetrahedra in which every oxygen atom is shared between neighboring Si or Al atoms (i.e. T-atoms).[^1][^2][^3] These T-atoms are arranged together in secondary building units (SBUs), which are connected to form a three-dimensional framework with channels and cages. The existence of multiple SBUs and numerous ways to connect them results in a theoretically enormous number of zeolite topologies.[^4] Topologies observed experimentally or in nature are represented by a three-letter code (e.g. FAU for faujasite, CHA for chabazite). 
All known zeolite topologies can be found on the website of the International Zeolite Association (IZA).[^5] As of March 2024, the website lists 256 distinct topologies, excluding intergrowths. The unique ring, pore and channel system of each zeolite topology determines their potential applications. Figure 1 illustrates the topologies of the most relevant commercial zeolites. + +Relevant zeolite topologies + +**Figure 1.** Framework structures of the most relevant zeolite topologies. Vertices represent T atoms (usually Si and Al) connected via O-atoms (not depicted). Dashed lines demarcate the unit cells. All figures are sourced from the online IZA Database.[^5] + +Pore and channel dimensions, typically in the Ångström scale, are characterized by the number *n* of T-atoms in the limiting ring, denoted as *n*MR (*n*\-membered ring) (Figure 2). Ring sizes vary from 3MR to 24MR, and exhibit various shapes, from circular to elliptical.[^5][^6] This ring and channel system enables zeolites to function as molecular sieves, allowing only molecules smaller than the free diameter to traverse the rings, while larger molecules are excluded.[^1][^2] Zeolites are also known for their shape selectivity, wherein the distribution of products in a reaction system is influenced by how reactants, intermediates, and products fit within the cage and channel structure of the zeolites.[^7] Moreover, atoms beyond the first coordination sphere can impact the reactivity of active sites by guiding substrate approach and/or by (de)stabilizing the active site or transition state. These effects, known as 'second-sphere effects', play a crucial role in zeolite reactivity.[^8][^9] + +Different ring sizes + +**Figure 2.** Different ring sizes in zeolites.[^9][^10] + +A specific zeolite topology is defined by the spatial arrangement of its lattice, regardless of the material’s chemical composition. 
Consequently, even within materials sharing the same zeolite topology, numerous parameters remain adjustable. Among these, the most prevalent is the amount and distribution of aluminum (Al) atoms within the zeolite lattice. Each \[AlO4\]\- tetrahedron introduces one negative lattice charge, which is counterbalanced by exchangeable, extra-framework cations. These cations can be protons, imparting zeolites with their distinctive acidic properties,[^11] or metal cations such as transition metal ions (TMIs), employed in redox reactions.[^9] They can also be combined in bifunctional catalysis.[^12] + +Thanks to their thermal stability, low cost (particularly for commercially available bulk zeolites such as those depicted in Figure 1) and unique chemical properties (acidity, cation exchange capacity, molecular sieving capabilities
), zeolites find extensive use across various industrial sectors. They are integral components in detergents (such as washing powders), they serve as adsorbents and desiccants,[^13] and they play critical roles in petrochemistry, notably as acid catalysts in the fluid catalytic cracking (FCC) process.[^14] Beyond these applications, zeolites demonstrate remarkable versatility, being employed in sensors,[^15] membranes[^16] and redox processes, such as the removal of nitrogen-containing exhaust gases where Cu-exchanged CHA zeolites are at the forefront of selective catalytic reduction (SCR) of NOx gases in vehicles.[^17][^18] The vast applicability of zeolites is evidenced by their annual production of approximately 6 million tons, with a global market valued at around 13 billion USD.[^19] + +In addition to their extensive industrial applications, the favorable properties of zeolites guarantee their continued significance in fundamental research, both within academia and industry. Zeolites persist as one of the most extensively studied materials for various innovative applications, with numerous laboratories worldwide striving to optimize the synthesis process, customize the resulting properties of zeolites, and discover new topologies.[^20] + +## 2. Zeolite Synthesis – Ingredients and Equipment + +The zeolite synthesis research field boasts a rich history,[^21] reflected in the abundance of literature detailing various synthesis recipes for each zeolite topology (and different materials within the topology). These recipes span from straightforward methods with minimal ingredients, resilient to experimental errors, to intricate procedures demanding specialized equipment.[^22] Typically, hydrothermal synthesis methods are employed, involving the mixing of precursors in water followed by crystallization under elevated temperature and pressure conditions. 
+ +A ‘typical’ hydrothermal zeolite synthesis procedure involves combining a silicon source, an aluminum source, an organic structure-directing agent (OSDA) serving as a template to fill the zeolite pores during synthesis (afterwards removed via calcination), inorganic cations (typically alkali metal hydroxides) and water.[^22] These ingredients are mixed within an inert Teflon liner and placed inside a stainless steel autoclave (Figure 3A), which is quite literally a black box for which it is hard to understand, let alone predict, the internal processes.[^23] The synthesis occurs at autogenous pressure in an oven maintained at a certain temperature (typically 100-200°C) for a specific time (typically 3-7 days, though durations may vary). The synthesis can occur under stirring conditions using a magnetic stirring bar within the Teflon liner, by tumbling the autoclave in the oven, or under static conditions without agitation. An optional step prior to hydrothermal synthesis involves stirring the synthesis solution or gel for a period (often a day) at room temperature, known as ‘aging’. + +However, the term ‘typical zeolite synthesis’ is somewhat contradictory since there are numerous variations on this process. While the aforementioned ingredients are common, they are not strictly required. Additionally, many other components could be introduced, such as fluoride as a mineralizer, alternative metals (e.g. B, Fe, Zn) for lattice incorporation alongside or in place of aluminum, a secondary OSDA, or the application of ultrasound or microwaves during synthesis.[^22] Even applying a voltage with electrodes recently emerged as a novel possibility.[^24] However, most of these unconventional conditions are utilized for niche materials with limited industrial significance, often due to the exotic requirements of such conditions. 
+ +Zeolite synthesis equipment + +**Figure 3.** A) Teflon liners and corresponding autoclaves.[^25] B) Multi-autoclave system for high-throughput parallel experiments with a robotic arm.[^26] + +This brief overview of zeolite synthesis highlights the vast parameter space involved and the ongoing challenge of fully understanding the crystallization mechanisms. Consequently, despite the significant industrial importance of zeolites, their synthesis predominantly relies on heuristic approaches, practitioner experience, and an element of serendipity. An experienced zeolite synthesis practitioner can narrow down this parameter space by drawing from literature and past experiences. For instance, they might opt for a fixed set of ingredients and consider a limited range of temperatures and concentrations. Within this confined search space, typically, either a grid search or a random search is conducted. This process can be arduous, especially considering the sensitivity of certain zeolite synthesis processes to small changes in conditions. Fortunately, in many laboratories, parallel experiments using small multi-autoclave synthesis systems accelerate this process (Figure 3B).[^26] Figure 3B also offers a glimpse into a future with fully autonomous systems, where robots handle synthesis solution preparation, oven transfer, and synthesis product characterization. When integrated with ‘intelligent’ experimental design techniques based on active learning, such as Bayesian optimization, this advancement could pave the way for the development of self-driving laboratories, drastically enhancing the pace of discovery and optimization in zeolite synthesis.[^27] + +## 3. Zeolite Synthesis – Optimization + +As discussed in the previous section, active learning has the potential to navigate the extensive parameter space of black box zeolite syntheses. 
This would prove beneficial in both manual and self-driving laboratories, saving time, reducing associated costs, and increasing the likelihood of discovering materials that are close to optimal. + +Nonetheless, conducting a search on Science Direct and Google Scholar using the terms "zeolite Bayesian optimization" and "zeolite active learning" yields only a limited number of relevant examples, excluding cases where active learning is employed to optimize machine learning model hyperparameters: + +1. Bayesian optimization was employed to experimentally find the optimal Si/Al ratio and Cu loading for Cu-CHA zeolites to optimize catalytic activity and selectivity in the partial oxidation of methane to methanol. As the CHA zeolites were commercially purchased, the Si/Al ratio was limited to 4 possibilities (categorical), whereas the in-house Cu ion exchange allowed for a continuous range of Cu loading.[^28] +2. Bayesian optimization was employed to experimentally determine the optimal metal loading of Cu/Fe-CHA catalysts, aiming to maximize their performance in both fresh and hydrothermally aged conditions for the selective catalytic reduction of NOx in diesel engine exhaust.[^29] +3. Bayesian optimization was used to find mechanically superior zeolite structures (in terms of shear and bulk moduli calculated with DFT and machine learning) in an existing database containing approximately 590,000 hypothetical zeolites.[^30] + +However, none of these examples directly relate to zeolite synthesis. The first example effectively illustrates how an optimized in-house synthesis could lead to further improvement of the catalyst. This would involve expanding the feasible range of Si/Al values and considering additional variables such as synthesis temperature and duration, which can impact Al distribution. Thus, it appears that the zeolite synthesis field with its associated large parameter space could benefit from leveraging active learning methods. 
Therefore, the optimization characteristics are explored below, building upon the earlier section detailing zeolite synthesis ingredients and equipment. + +### 3.1 Parameter Space + +Zeolite synthesis involves numerous inherently **continuous** variables, such as the concentrations of the aforementioned ingredients. Typically, syntheses are presented in literature as molar ratios *xi* of ingredient *i* with respect to silicon, e.g., 1 Si: 0.1 Al: 0.5 OSDA: 0.2 Na+: 30 H2O. Given the known synthesis volume in the Teflon liner, these ratios determine the required ingredient masses. Consequently, in Bayesian optimization, it is sufficient to optimize the molar ratio values. Other continuous variables include synthesis temperature, duration, and stirring/tumbling speed. + +The parameter bounds encompass reasonable molar ratio values (ranging from a lower bound of 0 to upper bounds determined by the ingredient and target, such as *xAl* < 0.5), along with constraints linked to equipment specifications. These constraints may include the maximum temperature of the synthesis oven and the predefined maximum speeds for stirring and tumbling systems. Depending on the equipment at hand, certain continuous variables may need to be discretized. For instance, in a setup where only one tumbling speed is available, the tumbling variable would become categorical: {Yes, No}. + +On the other hand, the selection of precursor materials is **categorical**. Even though the difference between certain sources seems minimal, they could have a small difference in solubility or basicity and lead to different crystallization kinetics.[^31] + +Below, we list several standard choices for the typical hydrothermal synthesis outlined above: + +| **Precursor** | **Options** | +| --- | --- | +| | | +| Silicon | Colloidal (Ludox HS-40, Ludox AS-40), fumed (aerosil, Cab-O-Sil), solid (sodium silicates, other zeolites in an interzeolite conversion), liquid (tetraethyl orthosilicate) | +| Aluminum | Aluminum metal, Al(OH)3, Al(NO3)3, Al2(SO4)3, NaAlO2 | +| OSDA | Typically one to a few OSDAs are known to effectively template the pores of a specific zeolite topology. For example, the typical OSDA for CHA synthesis is N,N,N-trimethyladamantylammonium hydroxide, but alternatives like tetraethylammonium hydroxide have also been documented.[^32] However, most often, a fixed OSDA is chosen a priori, and other variables are adjusted, as syntheses with different OSDAs may require entirely different conditions. | +| Inorganic cation | LiOH, NaOH, KOH, CsOH, NaCl | +| Water | Demineralized water is preferred for reproducibility, and further filtration (e.g., Milli-Q purification) is desirable. Therefore, no choices are to be made in this regard. | + +### 3.2 Constraints + +In zeolite synthesis, additional constraints on top of the specified bounds for the parameter space are uncommon. For instance, one might envision rare scenarios where both Al and a small amount of B are desired in the synthesis. Then a constraint could be introduced, e.g.: 10*xB* < *xAl*. Another scenario might involve limiting the total synthesis cost by assigning a monetary value to each parameter. + +### 3.3 Objectives + +Various objectives might be pursued depending on the economic considerations of the process and the specific application requirements: + +**General objectives:** + +- Attaining high crystallinity of the resulting zeolite. +- Ensuring high purity by minimizing the presence of side-products. + +**Economic objectives:** + +- Achieving a high synthesis yield. +- Maintaining low concentrations of expensive ingredients such as the organic structure-directing agent (OSDA), or of potentially harmful ingredients like fluoride. +- Operating at low synthesis temperatures. +- Reducing the synthesis time. + +**Application objectives:** + +- Targeting specific Si/Al ratios, which might be important for acid-catalyzed applications and also influence the zeolite stability.[^33] +- Controlling the distribution of aluminum within the structure, important for ion exchange and catalysis.[^34] +- Adjusting crystal size or morphology to optimize catalysis, adsorption or separation applications.[^35] + +Most of these objectives are correlated in positive or negative ways. For instance, small crystal size is generally accomplished through lower synthesis temperatures, favoring nucleation over crystal growth. 
However, this also results in slow nucleation and crystal growth and – depending on the synthesis time – low yields.[^36] + +### 3.4 Zeolite Synthesis Datasets + +Most zeolite synthesis papers include tables, either in the main text or supplementary information, that contain the molar ratios of the ingredients used in the ‘grid search’ synthesis experiments. The exact procedure and details of the ingredients are often described in textual form in the method sections. Following the recent advancements in materials informatics, some studies have systematically scraped and summarized zeolite synthesis data. The data can be combined with structural parameters available on the IZA website for the respective topologies.[^5] + +Jensen et al. gathered data for 1,200 distinct synthetic pathways for Ge-containing zeolites[^37] and 5,663 synthesis routes specifying OSDAs.[^38] Muraoka et al. compiled a dataset with 686 unique OSDA-free synthesis routes for 23 distinct frameworks, detailing gel compositions and reaction conditions.[^39] However, these datasets are rather small and do not fully encapsulate all parameters essential for zeolite synthesis: synthesis composition, OSDA and reaction conditions. + +In a recent impressive development, Pan et al. introduced ZeoSyn, a comprehensive dataset containing 23,961 zeolite synthesis pathways for 233 distinct zeolite topologies, representing over 80% of synthesized frameworks to date, using 921 unique OSDAs.[^40] Each synthesis route details gel composition (a combination of 51 possible ingredients, including Si, Al, P, Na+, K+, OH−, F−, Ge, Ti, B, OSDA, H2O and additional solvents), reaction conditions and the resulting zeolite structure (or absence thereof, e.g. formation of dense or amorphous phases). In some cases, resulting zeolite properties such as Si/Al ratio, crystal size, crystallinity and BET surface area are reported. 
Each synthesis pathway is cross-referenced with the corresponding article from which it was sourced, alongside its publication year. The dataset is available on GitHub.[^41] + +## 4. Discussion + +Despite the significant industrial importance of zeolites, their synthesis primarily relies on heuristic approaches, domain knowledge, and a degree of serendipity. An experienced researcher can narrow down the extensive zeolite synthesis parameter space by drawing from literature and past experiences. Typically, within this constrained search space, practitioners resort to either a grid search or a random search. However, this procedure can prove time-consuming and costly. Active learning techniques, such as Bayesian optimization, offer the potential to more efficiently navigate the parameter space of black box zeolite syntheses and increase the likelihood of discovering materials that are close to optimal. + +Zeolite synthesis involves numerous continuous and categorical variables (see the Zeolite Synthesis sections). Depending on the considered search space, **mixed variable type** Bayesian optimization becomes necessary.[^42][^43] Additionally, many syntheses are **multi-objective**;[^44] for example, researchers may seek high synthesis yield coupled with a small crystal size. As mentioned earlier, laboratories often conduct parallel experiments using small multi-autoclave synthesis systems. Such setups could benefit from **batch** Bayesian optimization, which involves evaluating multiple candidate solutions simultaneously in each iteration of the optimization process. This can potentially reduce the total number of iterations required to find the desired solution.[^45][^46] + +One advantage of the extensive history of zeolite synthesis is the abundance of recipes available for most interesting topologies. 
Furthermore, unlike in many other fields, failed synthesis attempts are frequently documented in the literature.[^40] Optimization campaigns enriched by **knowledge transfer** from past campaigns could identify desired materials with fewer experiments.[^47] + +Nowadays, various packages, such as Ax[^48], BayBE[^49] and scikit-optimize[^50], readily provide access to these different aspects of Bayesian optimization. In the [accompanying Jupyter notebook](./demo_zeolite_synthesis_bo.ipynb), we illustrate these features using real-world literature data.[^51][^52] One of the objectives of these studies was to maximize the amount of proximal Al pairs in synthesized CHA zeolites, which is required for stabilizing Fe2+ sites. Upon activation, these sites can selectively oxidize methane to methanol. The importance of these proximal Al pairs is underscored by the fact that in Cu-CHA zeolites, conversely, a low concentration of proximal Al pairs is preferred. In this context, these proximal Al pairs stabilize redox-inactive Cu2+ species that do not participate in the oxidation of methane to methanol.[^53][^54] + +Two approaches are followed in the notebook: +1) Optimization of a simulated analytical target function based on synthesis parameters. +2) Existing literature data is fed as prior experimental data to the Bayesian optimization algorithm, which then recommends subsequent experimental conditions to try out. + +This [code demonstration](./demo_zeolite_synthesis_bo.ipynb) showcases the effectiveness of Bayesian optimization in zeolite synthesis, hopefully encouraging the exploration of active learning approaches in similar endeavors. Open In Colab + +## References + +[^1]: Davis, M. E. Zeolites and Molecular Sieves: Not Just Ordinary Catalysts. [*Ind. Eng. Chem. Res.* **1991**, *30*, 1675–1683.](https://doi.org/10.1021/ie00056a001) + +[^2]: Flanigen, E. M. Chapter 2 - Zeolites and Molecular Sieves an Historical Perspective. In *Studies in Surface Science and Catalysis*; Van Bekkum, H., Flanigen, E. M., Jacobs, P. A., Jansen, J. C., Eds.; [Elsevier Science B.V., 2001; Vol. 137, pp 11–35.](https://doi.org/10.1016/S0167-2991(01)80243-3) + +[^3]: Dusselier, M.; Davis, M. E. Small-Pore Zeolites: Synthesis and Catalysis. [*Chem. 
Rev.* **2018**, *118*, 5265–5329.](https://doi.org/10.1021/acs.chemrev.7b00738) + +[^4]: Pophale, R.; Cheeseman, P. A.; Deem, M. W. A Database of New Zeolite-like Materials. [*Phys. Chem. Chem. Phys.* **2011**, *13*, 12407–12412.](https://doi.org/10.1039/C0CP02255A) + +[^5]: Structure Commission of the International Zeolite Association. Database of Zeolite Structures. . + +[^6]: Baerlocher, C.; McCusker, L. B.; Olson, D. H. [*Atlas of Zeolite Framework Types*; Elsevier, 2007.](https://www.sciencedirect.com/book/9780444530646/atlas-of-zeolite-framework-types) + +[^7]: Csicsery, S. M. Shape-Selective Catalysis in Zeolites. [*Zeolites* **1984**, *4*, 116–126.](https://doi.org/10.1016/0144-2449(84)90024-1) + +[^8]: Snyder, B. E. R.; Vanelderen, P.; Schoonheydt, R. A.; Sels, B. F.; Solomon, E. I. Second-Sphere Effects on Methane Hydroxylation in Cu-Zeolites. [*J. Am. Chem. Soc.* **2018**, *140*, 9236–9243.](https://doi.org/10.1021/jacs.8b05320) + +[^9]: Snyder, B. E. R.; Bols, M. L.; Schoonheydt, R. A.; Sels, B. F.; Solomon, E. I. Iron and Copper Active Sites in Zeolites and Their Correlation to Metalloenzymes. [*Chem. Rev.* **2018**, *118*, 2718–2768.](https://doi.org/10.1021/acs.chemrev.7b00344) + +[^10]: Plessers, D.; Bols, M. L.; Rhoda, H. M.; Heyer, A. J.; Solomon, E. I.; Sels, B. F.; Schoonheydt, R. A. Single Site Spectroscopy of Transition Metal Ions and Reactive Oxygen Complexes in Zeolites. [In *Comprehensive Inorganic Chemistry III*; Reedijk, J., Poeppelmeier, K. R., Eds.; Elsevier, 2023; pp 148–164.](https://doi.org/10.1016/B978-0-12-823144-9.00008-X) + +[^11]: Derouane, E. G.; VĂ©drine, J. C.; Ramos Pinto, R.; Borges, P. M.; Costa, L.; Lemos, M. A. N. D. A.; Lemos, F.; RamĂŽa Ribeiro, F. The Acidity of Zeolites: Concepts, Measurements and Relation to Catalysis: A Review on Experimental and Theoretical Methods for the Study of Zeolite Acidity. [*Catal. Rev. - Sci. 
Eng.* **2013**, *55*, 454–515.](https://doi.org/10.1080/01614940.2013.822266) + +[^12]: Zhang, Q.; Gao, S.; Yu, J. Metal Sites in Zeolites: Synthesis, Characterization, and Catalysis. [*Chem. Rev.* **2023**, *123*, 6039–6106.](https://doi.org/10.1021/acs.chemrev.2c00315) + +[^13]: PĂ©rez-Botella, E.; Valencia, S.; Rey, F. Zeolites in Adsorption Processes: State of the Art and Future Prospects. [*Chem. Rev.* **2022**, *122*, 17647–17695.](https://doi.org/10.1021/acs.chemrev.2c00140) + +[^14]: Yilmaz, B.; MĂŒller, U. Catalytic Applications of Zeolites in Chemical Industry. [*Top. Catal.* **2009**, *52*, 888–895.](https://doi.org/10.1007/s11244-009-9226-0) + +[^15]: Xu, X.; Wang, J.; Long, Y. Zeolite-Based Materials for Gas Sensors. [*Sensors* **2006**, *6*, 1751–1764.](https://doi.org/10.3390/s6121751) + +[^16]: Rangnekar, N.; Mittal, N.; Elyassi, B.; Caro, J.; Tsapatsis, M. Zeolite Membranes - a Review and Comparison with MOFs. [*Chem. Soc. Rev.* **2015**, *44*, 7128–7154.](https://doi.org/10.1039/C5CS00292C) + +[^17]: Beale, A. M.; Gao, F.; Lezcano-Gonzalez, I.; Peden, C. H. F.; Szanyi, J. Recent Advances in Automotive Catalysis for NOx Emission Control by Small-Pore Microporous Materials. [*Chem. Soc. Rev.* **2015**, *44*, 7371–7405.](https://doi.org/10.1039/C5CS00108K) + +[^18]: Zhang, R.; Liu, N.; Lei, Z.; Chen, B. Selective Transformation of Various Nitrogen-Containing Exhaust Gases toward N2 over Zeolite Catalysts. [*Chem. Rev.* **2016**, *116*, 3658–3721.](https://doi.org/10.1021/acs.chemrev.5b00474) + +[^19]: Zeolite Market Size, Share & Trends Analysis Report By Application (Catalyst, Adsorbent, Detergent Builder), By Product (Natural, Synthetic), By Region (North America, Europe, APAC, CSA, MEA), And Segment Forecasts, 2022 - 2030. ISBN 978-1-68038-601-1. . + +[^20]: Davis, M. E. Zeolites from a Materials Chemistry Perspective. [*Chem. Mater.* **2014**, *26*, 239–245.](https://doi.org/10.1021/cm401914u) + +[^21]: Cundy, C. S.; Cox, P. A. 
The Hydrothermal Synthesis of Zeolites: History and Development from the Earliest Days to the Present Time. [*Chem. Rev.* **2003**, *103*, 663–701.](https://doi.org/10.1021/cr020060i) + +[^22]: Deneyer, A.; Ke, Q.; Devos, J.; Dusselier, M. Zeolite Synthesis under Nonconventional Conditions: Reagents, Reactors, and Modi Operandi. [*Chem. Mater.* **2020**, *32*, 4884–4919.](https://doi.org/10.1021/acs.chemmater.9b04741) + +[^23]: Asselman, K.; Kirschhock, C.; Breynaert, E. Illuminating the Black Box: A Perspective on Zeolite Crystallization in Inorganic Media. [*Acc. Chem. Res.* **2023**, *56*, 2391–2402.](https://doi.org/10.1021/acs.accounts.3c00269) + +[^24]: Ivanushkin, G.; Dusselier, M. Engineering Lewis Acidity in Zeolite Catalysts by Electrochemical Release of Heteroatoms during Synthesis. [*Chem. Mater.* **2023**, *35*, 5049–5058.](https://doi.org/10.1021/acs.chemmater.3c00552) + +[^25]: Hydrothermal Synthesis. . + +[^26]: Moliner, M.; Serra, J. M.; Corma, A.; Argente, E.; Valero, S.; Botti, V. Application of Artificial Neural Networks to High-Throughput Synthesis of Zeolites. [*Microporous Mesoporous Mater.* **2005**, *78*, 73–81.](https://doi.org/10.1016/j.micromeso.2004.09.018) + +[^27]: Tom, G.; Schmid, S. P.; Baird, S. G.; Cao, Y.; Darvish, K.; Hao, H.; Lo, S.; Pablo-García, S.; Rajaonson, E. M.; Skreta, M.; Yoshikawa, N.; Corapi, S.; Akkoc, G. D.; Strieth-Kalthoff, F.; Seifrid, M.; Aspuru-Guzik, A. Self-Driving Laboratories for Chemistry and Materials Science. [*ChemRxiv* **2024**, doi:10.26434/chemrxiv-2024-rj946.](https://doi.org/10.26434/chemrxiv-2024-rj946) + +[^28]: Ohyama, J.; Tsuchimura, Y.; Yoshida, H.; Machida, M.; Nishimura, S.; Takahashi, K. Bayesian-Optimization-Based Improvement of Cu-CHA Catalysts for Direct Partial Oxidation of CH4. [*J. Phys. Chem. C* **2022**, *126*, 19660–19666.](https://doi.org/10.1021/acs.jpcc.2c04229) + +[^29]: Lim, S.; Lee, H.; Bae, S.; Shin, J. S.; Kim, D. H.; Lee, J. M. 
Bayesian Optimization for Automobile Catalyst Development. [In *14th International Symposium on Process Systems Engineering*; Elsevier, 2022; Vol. 49, pp 1213–1218.](https://doi.org/10.1016/B978-0-323-85159-6.50202-5) + +[^30]: Kim, N.; Min, K. Accelerated Discovery of Zeolite Structures with Superior Mechanical Properties via Active Learning. [*J. Phys. Chem. Lett.* **2021**, *12*, 2334–2339.](https://doi.org/10.1021/acs.jpclett.1c00339) + +[^31]: Liang, D.; Liu, Y.; Zhang, R.; Xie, Q.; Zhang, L. A Review on the Influence Factors in the Synthesis of Zeolites and the Transformation Behavior of Silicon and Aluminum During the Process. [*Comments Inorg. Chem.* **2024**, *00*, 1–37.](https://doi.org/10.1080/02603594.2024.2309878) + +[^32]: MartĂ­n, N.; Moliner, M.; Corma, A. High Yield Synthesis of High-Silica Chabazite by Combining the Role of Zeolite Precursors and Tetraethylammonium: SCR of NOx. [*Chem. Commun.* **2015**, *51*, 9965–9968.](https://doi.org/10.1039/C5CC02670A) + +[^33]: Li, J.; Gao, M.; Yan, W.; Yu, J. Regulation of the Si/Al Ratios and Al Distributions of Zeolites and Their Impact on Properties. [*Chem. Sci.* **2022**, *14*, 1935–1959.](https://doi.org/10.1039/D2SC06010H) + +[^34]: Knott, B. C.; Nimlos, C. T.; Robichaud, D. J.; Nimlos, M. R.; Kim, S.; Gounder, R. Consideration of the Aluminum Distribution in Zeolites in Theoretical and Experimental Catalysis Research. [*ACS Catal.* **2018**, *8*, 770–784.](https://doi.org/10.1021/acscatal.7b03676) + +[^35]: Li, S.; Li, J.; Dong, M.; Fan, S.; Zhao, T.; Wang, J.; Fan, W. Strategies to Control Zeolite Particle Morphology. [*Chem. Soc. Rev.* **2019**, *48*, 885–907.](https://doi.org/10.1039/C8CS00774H) + +[^36]: Larsen, S. C. Nanocrystalline Zeolites and Zeolite Structures: Synthesis, Characterization, and Applications. [*J. Phys. Chem. C* **2007**, *111*, 18464–18474.](https://doi.org/10.1021/jp074980m) + +[^37]: Jensen, Z.; Kim, E.; Kwon, S.; Gani, T. Z. 
H.; RomĂĄn-Leshkov, Y.; Moliner, M.; Corma, A.; Olivetti, E. A Machine Learning Approach to Zeolite Synthesis Enabled by Automatic Literature Data Extraction. [*ACS Cent. Sci.* **2019**.](https://doi.org/10.1021/acscentsci.9b00193) + +[^38]: Jensen, Z.; Kwon, S.; Schwalbe-Koda, D.; Paris, C.; GĂłmez-Bombarelli, R.; RomĂĄn-Leshkov, Y.; Corma, A.; Moliner, M.; Olivetti, E. A. Discovering Relationships between OSDAs and Zeolites through Data Mining and Generative Neural Networks. [*ACS Cent. Sci.* **2021**, *7*, 858–867.](https://doi.org/10.1021/acscentsci.1c00024) + +[^39]: Muraoka, K.; Sada, Y.; Miyazaki, D.; Chaikittisilp, W.; Okubo, T. Linking Synthesis and Structure Descriptors from a Large Collection of Synthetic Records of Zeolite Materials. [*Nat. Commun.* **2019**, *10*, 1–11.](https://doi.org/10.1038/s41467-019-12394-0) + +[^40]: Pan, E.; Kwon, S.; Jensen, Z.; Xie, M.; GĂłmez-Bombarelli, R.; Moliner, M.; RomĂĄn-Leshkov, Y.; Olivetti, E. ZeoSyn: A Comprehensive Zeolite Synthesis Dataset Enabling Machine-Learning Rationalization of Hydrothermal Parameters. [*ACS Cent. Sci.* **2024**.](https://doi.org/10.1021/acscentsci.3c01615) + +[^41]: Pan, E.; Kwon, S.; Jensen, Z.; Xie, M.; GĂłmez-Bombarelli, R.; Moliner, M.; RomĂĄn-Leshkov, Y.; Olivetti, E. ZeoSyn: A Comprehensive Zeolite Synthesis Dataset Enabling Machine-learning Rationalization of Hydrothermal Parameters (ACS Central Science 2024). . + +[^42]: HĂ€se, F.; Aldeghi, M.; Hickman, R. J.; Roch, L. M.; Aspuru-Guzik, A. Gryffin: An Algorithm for Bayesian Optimization of Categorical Variables Informed by Expert Knowledge. [*Appl. Phys. Rev.* **2021**, *8*.](https://doi.org/10.1063/5.0048164) + +[^43]: Aldulaijan, N.; Marsden, J. A.; Manson, J. A.; Clayton, A. D. Adaptive Mixed Variable Bayesian Self-Optimisation of Catalytic Reactions. [*React. Chem. Eng.* **2023**, 308–316.](https://doi.org/10.1039/D3RE00476G) + +[^44]: Torres, J. A. G.; Lau, S. H.; Anchuri, P.; Stevens, J. M.; Tabora, J. 
E.; Li, J.; Borovika, A.; Adams, R. P.; Doyle, A. G. A Multi-Objective Active Learning Platform and Web App for Reaction Optimization. [*J. Am. Chem. Soc.* **2022**, *144*, 19999–20007.](https://doi.org/10.1021/jacs.2c08592) + +[^45]: HĂ€se, F.; Roch, L. M.; Kreisbeck, C.; Aspuru-Guzik, A. Phoenics: A Bayesian Optimizer for Chemistry. [*ACS Cent. Sci.* **2018**, *4*, 1134–1145.](https://doi.org/10.1021/acscentsci.8b00307) + +[^46]: GonzĂĄlez, L. D.; Zavala, V. M. New Paradigms for Exploiting Parallel Experiments in Bayesian Optimization. [*Comput. Chem. Eng.* **2023**, *170*, 108110.](https://doi.org/10.1016/j.compchemeng.2022.108110) + +[^47]: Hickman, R. J.; RuĆŸa, J.; Tribukait, H.; Roch, L. M.; GarcĂ­a-DurĂĄn, A. Equipping Data-Driven Experiment Planning for Self-Driving Laboratories with Semantic Memory: Case Studies of Transfer Learning in Chemical Reaction Optimization. [*React. Chem. Eng.* **2023**, *8*, 2284–2296.](https://doi.org/10.1039/D3RE00008G) + +[^48]: Ax, Adaptive Experimentation Platform. . + +[^49]: BayBE - A Bayesian Back End for Design of Experiments. . + +[^50]: Scikit-optimize, Sequential model-based optimization in Python. . + +[^51]: Devos, J.; Bols, M. L.; Plessers, D.; Goethem, C. Van; Seo, J. W.; Hwang, S.-J.; Sels, B. F.; Dusselier, M. Synthesis–Structure–Activity Relations in Fe-CHA for C–H Activation: Control of Al Distribution by Interzeolite Conversion. [*Chem. Mater.* **2020**, *32*, 273–285.](https://doi.org/10.1021/acs.chemmater.9b03738) + +[^52]: Bols, M. L.; Devos, J.; Rhoda, H. M.; Plessers, D.; Solomon, E. I.; Schoonheydt, R. A.; Sels, B. F.; Dusselier, M. Selective Formation of α-Fe(II) Sites on Fe-Zeolites through One-Pot Synthesis. [*J. Am. Chem. Soc.* **2021**, *143*, 16243–16255.](https://doi.org/10.1021/jacs.1c07590) + +[^53]: Pappas, D. K.; Borfecchia, E.; Dyballa, M.; Pankin, I. A.; Lomachenko, K. A.; Martini, A.; Signorile, M.; Teketel, S.; Arstad, B.; Berlier, G.; Lamberti, C.; Bordiga, S.; Olsbye, U.; Lillerud, K. 
P.; Svelle, S.; Beato, P. Methane to Methanol: Structure–Activity Relationships for Cu-CHA. [*J. Am. Chem. Soc.* **2017**, *139*, 14961–14975.](https://doi.org/10.1021/jacs.7b06472) + +[^54]: Rhoda, H. M.; Plessers, D.; Heyer, A. J.; Bols, M. L.; Schoonheydt, R. A.; Sels, B. F.; Solomon, E. I. Spectroscopic Definition of a Highly Reactive Site in Cu-CHA for Selective Methane Oxidation: Tuning a Mono-ÎŒ-Oxo Dicopper(II) Active Site for Reactivity. [*J. Am. Chem. Soc.* **2021**, *143*, 7531–7540.](https://doi.org/10.1021/jacs.1c02835) diff --git a/zeolite_synthesis_bo_introduction.pdf b/zeolite_synthesis_bo_introduction.pdf new file mode 100644 index 0000000..2745005 Binary files /dev/null and b/zeolite_synthesis_bo_introduction.pdf differ