Scienfitz's picture
Upload 5 files
6c15b97 verified
import gradio as gr
import pandas as pd
# Goal: Maximize
# Data Source: Shields et al. https://www.nature.com/articles/s41586-021-03213-y
def lookup(
concentration: float, temperature: float, solvent: str, ligand: str, base: str
):
data = pd.read_csv("./data.csv", delimiter=",", index_col=None)
other = pd.DataFrame.from_records(
{
"Concentration": concentration,
"Temp_C": temperature,
"Ligand": ligand,
"Solvent": solvent,
"Base": base,
},
index=[0],
)
merged_df = pd.merge(
left=data.reset_index(),
right=other,
on=other.columns.tolist(),
how="right",
sort=False,
).dropna(subset="index")
idxs_matched = pd.Index(merged_df["index"].values)
if len(idxs_matched) < len(other):
raise IndexError(
"When doing exact lookup some rows could not be found. Try "
"approximate lookup or check reference data."
)
if len(idxs_matched) > len(other):
raise IndexError(
"When doing exact lookup some rows in the reference dataframe appear "
"duplicated. Check reference data."
)
return data["yield"][idxs_matched[0]]
solvents = {
"DMAc": r"CC(N(C)C)=O",
"Butyornitrile": r"CCCC#N",
"Butyl Ester": r"CCCCOC(C)=O",
"p-Xylene": r"CC1=CC=C(C)C=C1",
}
ligands = {
"BrettPhos": r"CC(C)C1=CC(C(C)C)=C(C(C(C)C)=C1)C2=C(P(C3CCCCC3)C4CCCCC4)C(OC)=CC=C2OC",
"Di-tert-butylphenylphosphine": r"CC(C)(C)P(C1=CC=CC=C1)C(C)(C)C",
"(t-Bu)PhCPhos": r"CN(C)C1=CC=CC(N(C)C)=C1C2=CC=CC=C2P(C(C)(C)C)C3=CC=CC=C3",
"Tricyclohexylphosphine": r"P(C1CCCCC1)(C2CCCCC2)C3CCCCC3",
"PPh3": r"P(C1=CC=CC=C1)(C2=CC=CC=C2)C3=CC=CC=C3",
"XPhos": r"CC(C1=C(C2=CC=CC=C2P(C3CCCCC3)C4CCCCC4)C(C(C)C)=CC(C(C)C)=C1)C",
"P(2-furyl)3": r"P(C1=CC=CO1)(C2=CC=CO2)C3=CC=CO3",
"Methyldiphenylphosphine": r"CP(C1=CC=CC=C1)C2=CC=CC=C2",
"1268824-69-6": r"CC(OC1=C(P(C2CCCCC2)C3CCCCC3)C(OC(C)C)=CC=C1)C",
"JackiePhos": r"FC(F)(F)C1=CC(P(C2=C(C3=C(C(C)C)C=C(C(C)C)C=C3C(C)C)C(OC)=CC=C2OC)C4=CC(C(F)(F)F)=CC(C(F)(F)F)=C4)=CC(C(F)(F)F)=C1",
"SCHEMBL15068049": r"C[C@]1(O2)O[C@](C[C@]2(C)P3C4=CC=CC=C4)(C)O[C@]3(C)C1",
"Me2PPh": r"CP(C)C1=CC=CC=C1",
}
bases = {
"Potassium acetate": r"O=C([O-])C.[K+]",
"Potassium pivalate": r"O=C([O-])C(C)(C)C.[K+]",
"Cesium acetate": r"O=C([O-])C.[Cs+]",
"Cesium pivalate": r"O=C([O-])C(C)(C)C.[Cs+]",
}
defaults = (0.1, 90, "DMAc", "JackiePhos", "Cesium acetate")
iface = gr.Interface(
fn=lookup,
inputs=[
gr.Radio(label="Concentration", choices=[0.057, 0.1, 0.153], value=defaults[0]),
gr.Radio(label="Temperature", choices=[90, 105, 120], value=defaults[1]),
gr.Radio(label="Solvent", choices=list(solvents.keys()), value=defaults[2]),
gr.Radio(label="Ligand", choices=list(ligands.keys()), value=defaults[3]),
gr.Radio(label="Base", choices=list(bases.keys()), value=defaults[4]),
],
outputs=gr.Number(lookup(*defaults), label="yield value (maximize)"),
)
iface.launch()