cole-group · AsmaFeriel000 · Dec 4, 2025 · Dec 4, 2025 · Dec 4, 2025 · Dec 4, 2025
diff --git a/tutorials/auto-fegrow.py b/tutorials/auto-fegrow.py
@@ -0,0 +1,142 @@
+#!/usr/bin/env python
+# coding: utf-8
+
+# # FEgrow: An Open-Source Molecular Builder and Free Energy Preparation Workflow
+#
+# **Authors: Mateusz K Bieniek, Ben Cree, Rachael Pirie, Joshua T. Horton, Natalie J. Tatum, Daniel J. Cole**
+
+# ## Overview
+#
+# Building and scoring molecules can be further streamlined by employing our established protocol. Here we show how to quickly build a library and score the entire library automatically for more than one receptor.
+
+import os  # afk
+from glob import glob  # afk
+
+import prody
+from rdkit import Chem
+
+import fegrow
+from fegrow import ChemSpace
+
+
+from dask.distributed import LocalCluster
+
+
+def main():
+    OUTPUT_DIR = "fegrow_result"
+
+    lc = LocalCluster(processes=True, n_workers=None, threads_per_worker=1)
+
+    counter = 1
+
+    input_folder = "./autofegrow-inputs/receptors_with_hydrogens"
+
+    # Find all .pdb files in the input folder
+    pdb_files = glob(os.path.join(input_folder, "*.pdb"))
+
+    for pdb_file in pdb_files:
+        # Prepare the ligand template
+        print(" pdb file {} read in".format(counter))
+
+        # scaffold = Chem.SDMolSupplier(core_5R83_path)[0]
+        scaffold = Chem.SDMolSupplier("autofegrow-inputs/coreh.sdf")[0]
+
+        with open("autofegrow-inputs/smiles-test-MERS.txt") as f:
+            mols = f.read().splitlines()
+
+            print("loading core finished round {}".format(counter))
+            print("creating chemspace with dask round {}".format(counter))
+
+            # create the chemical space
+            cs = ChemSpace(dask_cluster=lc)
+            cs.add_scaffold(scaffold)
+
+            smiles = mols[0:]
+            cs.add_smiles(smiles, protonate=True)
+            cs
+
+            sys = prody.parsePDB(pdb_file)
+            rec = sys.select("not (nucleic or hetatm or water)")
+            prody.writePDB("rec.pdb", rec)
+
+            os.makedirs(OUTPUT_DIR) if not os.path.exists(OUTPUT_DIR) else None
+            fegrow.fix_receptor(
+                "rec.pdb", "{}/rec_final_{}.pdb".format(OUTPUT_DIR, counter)
+            )
+            print("pdb file into rec_final {}".format(counter))
+
+            cs.add_protein("{}/rec_final_{}.pdb".format(OUTPUT_DIR, counter))
+            print(
+                "successfully added pdb {} to chemspace to evaluate conformers on it".format(
+                    counter
+                )
+            )
+
+            cs.evaluate(
+                num_conf=500, gnina_gpu=False, penalty=0.0, al_ignore_penalty=False
+            )
+
+            cs.to_sdf("cs_optimised_molecules_in_rec_{}.sdf".format(counter))
+
+            for i in range(len(cs)):
+                try:
+                    cs[i].to_file(
+                        "best_conformers_in_rec_{0}_{1}.pdb".format(counter, i)
+                    )  # afk
+                except AttributeError:
+                    print("No conformer for molecule", i)
+
+                for i in range(len(cs)):
+                    pdb_filename = "best_conformers_in_rec_{0}_{1}.pdb".format(
+                        counter, i
+                    )
+                    sdf_filename = os.path.join(
+                        OUTPUT_DIR, "rec_{0}_mol{1}.sdf".format(counter, i)
+                    )
+                    pdb_first_model = "tmp_first_model_{0}_{1}.pdb".format(counter, i)
+
+                    try:
+                        cs[i].to_file(pdb_filename)
+
+                        with open(pdb_filename, "r") as infile:
+                            lines = infile.readlines()
+
+                        inside_model = False
+                        first_model_lines = []
+                        for line in lines:
+                            if line.startswith("MODEL"):
+                                if inside_model:
+                                    break
+                                inside_model = True
+                            if inside_model:
+                                first_model_lines.append(line)
+                            if line.startswith("ENDMDL") and inside_model:
+                                break
+
+                        if not first_model_lines:
+                            first_model_lines = lines
+
+                        with open(pdb_first_model, "w") as outfile:
+                            outfile.writelines(first_model_lines)
+
+                        os.system(
+                            "obabel -ipdb {} -O {}".format(
+                                pdb_first_model, sdf_filename
+                            )
+                        )
+
+                        os.remove(pdb_first_model)
+
+                    except AttributeError:
+                        print("No conformer for molecule", i)
+
+        cs.df.to_csv("MERS-out.csv", index=True)
+
+        counter += 1
+
+
+if __name__ == "__main__":
+    import multiprocessing
+
+    multiprocessing.freeze_support()  # Especially needed for frozen executables
+    main()
diff --git a/tutorials/autofegrow-inputs/coreh.sdf b/tutorials/autofegrow-inputs/coreh.sdf
@@ -0,0 +1,28 @@
+core.pdb
+ OpenBabel05012510463D
+
+ 11 11  0  0  0  0  0  0  0  0999 V2000
+    5.7640    0.2340   17.3690 N   0  0  0  0  0  0  0  0  0  0  0  0
+    6.1040    0.0970   19.7620 C   0  0  0  0  0  0  0  0  0  0  0  0
+    6.4230   -0.2110   18.4440 C   0  0  0  0  0  0  0  0  0  0  0  0
+    4.7290    1.0360   17.5780 C   0  0  0  0  0  0  0  0  0  0  0  0
+    4.2770    1.4340   18.8610 C   0  0  0  0  0  0  0  0  0  0  0  0
+    4.9840    0.9420   19.9950 C   0  0  0  0  0  0  0  0  0  0  0  0
+    6.6621   -0.2757   20.5460 H   0  0  0  0  0  0  0  0  0  0  0  0
+    7.2317   -0.8316   18.2830 H   0  0  0  0  0  0  0  0  0  0  0  0
+    4.2203    1.3931   16.7542 H   0  0  0  0  0  0  0  0  0  0  0  0
+    3.4631    2.0591   18.9697 H   0  0  0  0  0  0  0  0  0  0  0  0
+    4.6934    1.1902   20.9536 H   0  0  0  0  0  0  0  0  0  0  0  0
+  1  3  2  0  0  0  0
+  1  4  1  0  0  0  0
+  2  3  1  0  0  0  0
+  2  6  2  0  0  0  0
+  2  7  1  0  0  0  0
+  3  8  1  0  0  0  0
+  4  5  2  0  0  0  0
+  4  9  1  0  0  0  0
+  5  6  1  0  0  0  0
+  5 10  1  0  0  0  0
+  6 11  1  0  0  0  0
+M  END
+$$$$