From d214bf78f531d16179882b120e235458b695c486 Mon Sep 17 00:00:00 2001 From: Lester Hedges Date: Mon, 27 Nov 2023 13:20:43 +0000 Subject: [PATCH] Add support for ORCA backend when using Sire interface. --- bin/emle-server | 8 +++ emle/emle.py | 110 +++++++++++++++++++++++++++++++------- emle/sander_calculator.py | 3 +- 3 files changed, 101 insertions(+), 20 deletions(-) diff --git a/bin/emle-server b/bin/emle-server index 51813fa..2a881ab 100755 --- a/bin/emle-server +++ b/bin/emle-server @@ -72,6 +72,7 @@ try: log = int(os.getenv("EMLE_LOG")) except: log = 1 +orca_template = os.getenv("EMLE_ORCA_TEMPLATE") deepmd_model = os.getenv("EMLE_DEEPMD_MODEL") rascal_model = os.getenv("EMLE_RASCAL_MODEL") parm7 = os.getenv("EMLE_PARM7") @@ -126,6 +127,7 @@ env = { "qm_indices": qm_indices, "sqm_theory": sqm_theory, "restart": restart, + "orca_template": orca_template, "log": log, } @@ -256,6 +258,12 @@ parser.add_argument( action=argparse.BooleanOptionalAction, required=False, ) +parser.add_argument( + "--orca-template", + type=str, + help="the path to a template ORCA input file (only used when using the ORCA backend via Sire)", + required=False, +) parser.add_argument( "--log", type=int, diff --git a/emle/emle.py b/emle/emle.py index 813b94e..fecaf80 100644 --- a/emle/emle.py +++ b/emle/emle.py @@ -368,6 +368,7 @@ def __init__( interpolate_steps=None, restart=False, device=None, + orca_template=None, log=1, ): """Constructor. @@ -451,6 +452,10 @@ def __init__( The name of the device to be used by PyTorch. Options are "cpu" or "cuda". + orca_template: str + The path to a template ORCA input file. This is required when using + the ORCA backend when using emle-engine with Sire. + log : int The frequency of logging energies to file. """ @@ -828,6 +833,18 @@ def __init__( else: self._log = log + if orca_template is not None: + if not isinstance(template, str): + raise TypeError("'orca_template' must be of type 'str'") + # Convert to an absolute path. + abs_orca_template = os.path.abspath(orca_template) + + if not os.path.isfile(abs_orca_template): + raise IOError(f"Unable to locate ORCA template file: '{orca_template}'") + self._orca_template = abs_orca_template + else: + self._orca_template = None + # Initialise a null SanderCalculator object. self._sander_calculator = None @@ -939,6 +956,7 @@ def __init__( "interpolate_steps": interpolate_steps, "restart": restart, "device": device, + "orca_template": None if orca_template is None else self._orca_template, "plugin_path": plugin_path, "log": log, } @@ -1396,9 +1414,12 @@ def _sire_callback(self, atomic_numbers, charges_mm, xyz_qm, xyz_mm): # ORCA. elif self._backend == "orca": - raise ValueError( - "Sire interface is currently unsupported when using the ORCA backend!" - ) + try: + E_vac, grad_vac = self._run_orca(orca_input, xyz_file_qm) + except: + raise RuntimeError( + "Failed to calculate in vacuo energies using ORCA backend!" + ) # Sander. elif self._backend == "sander": @@ -2446,7 +2467,9 @@ def _run_deepmd(self, xyz, elements): -(force[0] * EV_TO_HARTREE * BOHR_TO_ANGSTROM) / (x + 1), ) - def _run_orca(self, orca_input, xyz_file_qm): + def _run_orca( + self, orca_input=None, xyz_file_qm=None, atomic_numbers=None, xyz_qm=None + ): """ Internal function to compute in vacuo energies and gradients using ORCA. @@ -2470,16 +2493,61 @@ def _run_orca(self, orca_input, xyz_file_qm): The in vacuo QM gradient in Eh/Bohr. """ - if not isinstance(orca_input, str): + if orca_input is not None and not isinstance(orca_input, str): raise TypeError("'orca_input' must be of type 'str'.") - if not os.path.isfile(orca_input): + if orca_input is not None and not os.path.isfile(orca_input): raise IOError(f"Unable to locate the ORCA input file: {orca_input}") - if not isinstance(xyz_file_qm, str): + if xyz_qm_file is not None and not isinstance(xyz_file_qm, str): raise TypeError("'xyz_file_qm' must be of type 'str'.") - if not os.path.isfile(xyz_file_qm): + if xyz_qm_file is not None and not os.path.isfile(xyz_file_qm): raise IOError(f"Unable to locate the ORCA QM xyz file: {xyz_file_qm}") + if atomic_numbers is not None and not isinstance(atomic_numbers, np.ndarray): + raise TypeError("'atomic_numbers' must be of type 'numpy.ndarray'") + if atomic_numbers is not None and atomic_numbers.dtype != np.int64: + raise TypeError("'atomic_numbers' must have dtype 'int'.") + + if xyz_qm is not None and not isinstance(xyz_qm, np.ndarray): + raise TypeError("'xyz_qm' must be of type 'numpy.ndarray'") + if xyz_qm is not None and xyz_qm.dtype != np.float64: + raise TypeError("'xyz_qm' must have dtype 'float64'.") + + # ORCA input files take precedence. + is_orca_input = True + if orca_input is None or xyz_file_qm is None: + if atomic_numbers is None: + raise ValueError("No atomic numbers specified!") + if xyz_qm is None: + raise ValueError("No QM coordinates specified!") + + is_orca_input = False + + if self._orca_template is None: + raise ValueError("No ORCA template file specified!") + + fd_orca_input, orca_input = tempfile.mkstemp( + prefix="orc_job_", suffix=".inp", text=True + ) + fd_xyz_file_qm, xyz_file_qm = tempfile.mkstemp( + prefix="inpfile_", suffix=".xyz", text=True + ) + + # Copy the template file. + shutil.copyfile(self._orca_template, orca_input) + + # Add the QM coordinate file path. + with open(orca_input, "w") as f: + f.write(f'*xyzfile "{os.path.basename(xyz_file_qm)}"\n') + + # Write the xyz input file. + with open(xyz_file_qm, "w") as f: + f.write(f"{len(atomic_numbers):5d}\n\n") + for num, xyz in zip(atomic_numbers, xyz_qm): + f.write( + f"{num:3d} {xyz[0]:21.17f} {xyz[1]:21.17f} {xyz[2]:21.17f}\n" + ) + # Create a temporary working directory. with tempfile.TemporaryDirectory() as tmp: # Work out the name of the input files. @@ -2487,18 +2555,22 @@ def _run_orca(self, orca_input, xyz_file_qm): xyz_name = f"{tmp}/{os.path.basename(xyz_file_qm)}" # Copy the files to the working directory. - shutil.copyfile(orca_input, inp_name) - shutil.copyfile(xyz_file_qm, xyz_name) + if is_orca_input: + shutil.copyfile(orca_input, inp_name) + shutil.copyfile(xyz_file_qm, xyz_name) - # Edit the input file to remove the point charges. - lines = [] - with open(inp_name, "r") as f: - for line in f: - if not line.startswith("%pointcharges"): - lines.append(line) - with open(inp_name, "w") as f: - for line in lines: - f.write(line) + # Edit the input file to remove the point charges. + lines = [] + with open(inp_name, "r") as f: + for line in f: + if not line.startswith("%pointcharges"): + lines.append(line) + with open(inp_name, "w") as f: + for line in lines: + f.write(line) + else: + shutil.move(orca_input, inp_name) + shutil.move(xyz_file_qm, xyz_name) # Create the ORCA command. command = f"{self._orca_exe} {inp_name}" diff --git a/emle/sander_calculator.py b/emle/sander_calculator.py index 3fdc311..3d0eab9 100644 --- a/emle/sander_calculator.py +++ b/emle/sander_calculator.py @@ -94,7 +94,8 @@ def calculate( self.results = { "energy": energy.tot * KCAL_MOL_TO_HARTREE, "forces": np.array(forces).reshape((-1, 3)) - * KCAL_MOL_TO_HARTREE * BOHR_TO_ANGSTROM, + * KCAL_MOL_TO_HARTREE + * BOHR_TO_ANGSTROM, } @staticmethod