From 466fd4f172e667c2be2389ac5f5bebe4a2b59e4e Mon Sep 17 00:00:00 2001 From: Hong-Rui Lin Date: Wed, 10 Apr 2024 02:14:38 +0800 Subject: [PATCH] [feature] receptor preprocessor options, deprecated PDBQT file format as receptor input --- .../application/unidock_pipeline.py | 55 ++++++++++++------- .../unidock_tools/modules/docking/unidock.py | 7 +-- .../receptor_preprocessor_runner.py | 5 +- 3 files changed, 40 insertions(+), 27 deletions(-) diff --git a/unidock_tools/src/unidock_tools/application/unidock_pipeline.py b/unidock_tools/src/unidock_tools/application/unidock_pipeline.py index 81e05cd..5479bcd 100644 --- a/unidock_tools/src/unidock_tools/application/unidock_pipeline.py +++ b/unidock_tools/src/unidock_tools/application/unidock_pipeline.py @@ -49,7 +49,6 @@ "debug": False, } - class UniDock(Base): def __init__(self, receptor: Path, @@ -60,36 +59,54 @@ def __init__(self, size_x: float = 22.5, size_y: float = 22.5, size_z: float = 22.5, - workdir: Path = Path("docking_pipeline"), + kept_ligand_resname_list: Optional[List[str]] = None, + prepared_hydrogen: bool = True, + preserve_original_resname: bool = True, + covalent_residue_atom_info_list: Optional[List[Tuple[str, str]]] = None, + generate_ad4_grids: bool = False, + workdir: Path = Path('docking_pipeline'), ): """ - Initializes a MultiConfDock object. + Initializes a UniDock object. Args: - receptor (Path): Path to the receptor file in pdbqt format. - ligands (List[Path]): List of paths to the ligand files in sdf format. + receptor (Path): Path to the receptor file in PDB format. + ligands (List[Path]): List of paths to the ligand files in SDF format. center_x (float): X-coordinate of the center of the docking box. center_y (float): Y-coordinate of the center of the docking box. center_z (float): Z-coordinate of the center of the docking box. size_x (float, optional): Size of the docking box in the x-dimension. Defaults to 22.5. size_y (float, optional): Size of the docking box in the y-dimension. Defaults to 22.5. size_z (float, optional): Size of the docking box in the z-dimension. Defaults to 22.5. - workdir (Path, optional): Path to the working directory. Defaults to Path("MultiConfDock"). + workdir (Path, optional): Path to the working directory. Defaults to Path("docking_pipeline"). """ self.check_dependencies() self.workdir = workdir self.workdir.mkdir(parents=True, exist_ok=True) - if receptor.suffix == ".pdb": - ###pdb2pdbqt(receptor, workdir.joinpath(receptor.stem + ".pdbqt")) - ###receptor = workdir.joinpath(receptor.stem + ".pdbqt") - receptor_pdbqt_file_name = receptor_preprocessor(str(receptor), working_dir_name=str(workdir)) - self.receptor = receptor_pdbqt_file_name - if receptor.suffix != ".pdbqt": - logging.error("receptor file must be pdb/pdbqt format") + if receptor.suffix != '.pdb': + logging.error('receptor file must be in PDB format!') exit(1) - self.receptor = receptor + else: + receptor_pdbqt_file_name = receptor_preprocessor(str(receptor), + kept_ligand_resname_list=kept_ligand_resname_list, + prepared_hydrogen=prepared_hydrogen, + preserve_original_resname=preserve_original_resname, + target_center=(center_x, center_y, center_z), + box_size=(size_x, size_y, size_z), + covalent_residue_atom_info_list=covalent_residue_atom_info_list, + generate_ad4_grids=generate_ad4_grids, + working_dir_name=str(workdir)) + + self.receptor = receptor_pdbqt_file_name + + if generate_ad4_grids: + receptor_file_dir_name = os.path.dirname(self.receptor) + self.ad4_map_prefix = os.path.join(receptor_file_dir_name, 'protein') + else: + self.ad4_map_prefix = '' + self.mols = sum([read_ligand(ligand) for ligand in ligands], []) self.mols = [PropertyMol(mol) for mol in self.mols] self.center_x = center_x @@ -168,7 +185,7 @@ def docking(self, receptor=self.receptor, ligands=ligand_list, output_dir=output_dir, center_x=self.center_x, center_y=self.center_y, center_z=self.center_z, size_x=self.size_x, size_y=self.size_y, size_z=self.size_z, - scoring=scoring_function, num_modes=num_modes, + scoring=scoring_function, ad4_map_prefix=self.ad4_map_prefix, num_modes=num_modes, search_mode=search_mode, exhaustiveness=exhaustiveness, max_step=max_step, seed=seed, refine_step=refine_step, energy_range=energy_range, score_only=score_only, local_only=local_only, @@ -269,9 +286,9 @@ def get_parser() -> argparse.ArgumentParser: parser = argparse.ArgumentParser(description="UniDock") parser.add_argument("-r", "--receptor", type=str, required=True, - help="Receptor file in pdbqt format.") + help="Receptor file in PDB format.") parser.add_argument("-l", "--ligands", type=lambda s: s.split(','), default=None, - help="Ligand file in sdf format. Specify multiple files separated by commas.") + help="Ligand file in SDF format. Specify multiple files separated by commas.") parser.add_argument("-i", "--ligand_index", type=str, default=None, help="A text file containing the path of ligand files in sdf format.") @@ -336,8 +353,8 @@ def main_cli(): Command line interface for UniDock. Input files: - -r, --receptor: receptor file in pdbqt format - -l, --ligands: ligand file in sdf format, separated by commas(,) + -r, --receptor: receptor file in PDB format + -l, --ligands: ligand file in SDF format, separated by commas(,) -i, --ligand_index: a text file containing the path of ligand files in sdf format Docking box: diff --git a/unidock_tools/src/unidock_tools/modules/docking/unidock.py b/unidock_tools/src/unidock_tools/modules/docking/unidock.py index 279b451..5fb371a 100644 --- a/unidock_tools/src/unidock_tools/modules/docking/unidock.py +++ b/unidock_tools/src/unidock_tools/modules/docking/unidock.py @@ -19,6 +19,7 @@ def __init__(self, size_z: float = 22.5, output_dir: Optional[Union[str, os.PathLike]] = None, scoring: str = "vina", + ad4_map_prefix: str = "", num_modes: int = 10, search_mode: str = "", exhaustiveness: int = 256, @@ -29,9 +30,6 @@ def __init__(self, score_only: bool = False, local_only: bool = False ): - self.mgltools_python_path = "" - self.prepare_gpf4_script_path = "" - self.ad4_map_data_path = "" self.workdir = make_tmp_dir("unidock") cmd = ["unidock"] @@ -42,8 +40,7 @@ def __init__(self, size_z = min(size_z*2, 25) if scoring.lower() == "ad4": - map_prefix = os.path.join(self.workdir, 'receptor_grids', 'protein_conf_0', 'protein') - cmd += ["--maps", str(map_prefix)] + cmd += ["--maps", str(ad4_map_prefix)] else: cmd += ["--receptor", str(receptor)] diff --git a/unidock_tools/src/unidock_tools/modules/protein_prep/receptor_preprocessor_runner.py b/unidock_tools/src/unidock_tools/modules/protein_prep/receptor_preprocessor_runner.py index 1a51a7e..1f691b4 100644 --- a/unidock_tools/src/unidock_tools/modules/protein_prep/receptor_preprocessor_runner.py +++ b/unidock_tools/src/unidock_tools/modules/protein_prep/receptor_preprocessor_runner.py @@ -83,7 +83,7 @@ def receptor_preprocessor( protein_pdb_file_name: str, protein_conf_name: str = 'protein_conf_0', kept_ligand_resname_list: Optional[List[str]] = None, - prepared_hydrogen: bool = False, + prepared_hydrogen: bool = True, preserve_original_resname: bool = True, target_center: Tuple[float, float, float] = (0.0, 0.0, 0.0), box_size: Tuple[float, float, float] = (22.5, 22.5, 22.5), @@ -106,9 +106,8 @@ def receptor_preprocessor( runner.run() protein_pdbqt_file_name = runner.protein_pdbqt_file_name return protein_pdbqt_file_name - - + if __name__ == "__main__": import argparse import shutil