Dean
/
Chemformer
mirror of https://github.com/MolecularAI/Chemformer


  
1

	
2

	
3

	
4

	
5

	
6

	
7

	
8

	
9

	
10

	
11

	
12

	
13

	
14

	
15

	
16

	
17

	
18

	
19

	
20

	
21

	
22

	
23

	
24

	
25

	
26

	
27

	
28

	
29

	
30

	
31

	
32

	
33

	
34

	
35

	
36

	
37

	
38

	
39

	
40

	
41

	
42

	
43

	
44

	
45

	
46

	
47

	
48

	
49

	
50

	
51

	
52

	
53

	
54

	
55

	
56

	
57

	
58

	
59

	
60

	
61

	
62

	
63

	
64

	
65

	
66

	
67

	
68

	
69

	
70

	
71

	
72

	
73

	
74

	
75

	
76

	
77

	
78

	
79

	
80

	
81

	
82

	
83

	
84

	
            import os
from typing import List

import omegaconf as oc
from fastapi import FastAPI
from service_utils import calculate_llhs, estimate_compound_llhs, get_predictions

from molbart.models import Chemformer

app = FastAPI()

# Container for data, classes that can be loaded upon startup of the REST API
config = oc.OmegaConf.load("../molbart/config/predict.yaml")

config.batch_size = 64
config.n_gpus = 1
config.model_path = os.environ["CHEMFORMER_MODEL"]
config.model_type = "bart"
config.n_beams = 10
config.task = os.environ["CHEMFORMER_TASK"]
config.vocabulary_path = os.environ["CHEMFORMER_VOCAB"]
config.datamodule = None

global_items = {"chemformer": Chemformer(config)}


@app.post("/chemformer-api/predict")
def predict(smiles_list: List[str], n_beams: int = 10):
    smiles, log_lhs, original_smiles = get_predictions(global_items["chemformer"], smiles_list, n_beams)

    output = []
    for item_pred, item_lhs, item_smiles in zip(smiles, log_lhs, original_smiles):
        output.append(
            {
                "input": item_smiles,
                "output": list(item_pred),
                "lhs": [float(val) for val in item_lhs],
            }
        )
    return output


@app.post("/chemformer-api/log_likelihood")
def log_likelihood(reactants: List[str], products: List[str]):
    log_lhs = calculate_llhs(global_items["chemformer"], reactants, products)

    output = []
    for prod_smi, react_smi, llhs in zip(products, reactants, log_lhs):
        output.append(
            {
                "product_smiles": str(prod_smi),
                "reactant_smiles": str(react_smi),
                "log_likelihood": float(llhs),
            }
        )
    return output


@app.post("/chemformer-api/compound_log_likelihood")
def compound_log_likelihood(reactants: List[str], products: List[str], n_augments: int = 10):
    log_lhs = estimate_compound_llhs(global_items["chemformer"], reactants, products, n_augments=n_augments)

    output = []
    for prod_smi, react_smi, llhs in zip(products, reactants, log_lhs):
        output.append(
            {
                "product_smiles": str(prod_smi),
                "reactant_smiles": str(react_smi),
                "log_likelihood": float(llhs),
            }
        )
    return output


if __name__ == "__main__":
    import uvicorn

    uvicorn.run(
        "chemformer_service:app",
        host="0.0.0.0",
        port=8003,
        log_level="info",
        reload=False,
    )