MI-FNO link (#157)

* MI-FNO helper class. Added tests + reconstruction of MI energy, support for building sermonic operators for fragments
sandbox-quantum · Jun 7, 2022 · 2011b87 · 2011b87
1 parent c6e8f41
commit 2011b87
Show file tree

Hide file tree

Showing 13 changed files with 373 additions and 6 deletions.
diff --git a/tangelo/problem_decomposition/__init__.py b/tangelo/problem_decomposition/__init__.py
@@ -14,3 +14,4 @@
 
 from .dmet.dmet_problem_decomposition import DMETProblemDecomposition
 from .oniom.oniom_problem_decomposition import ONIOMProblemDecomposition
+from .incremental.mifno_helper import MIFNOHelper
diff --git a/tangelo/problem_decomposition/incremental/__init__.py b/tangelo/problem_decomposition/incremental/__init__.py
@@ -0,0 +1,13 @@
+# Copyright 2021 Good Chemistry Company.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
diff --git a/tangelo/problem_decomposition/incremental/mifno_helper.py b/tangelo/problem_decomposition/incremental/mifno_helper.py
@@ -0,0 +1,268 @@
+# Copyright 2021 Good Chemistry Company.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""This file provides helpers in order to import data coming from a MI-FNO job
+from QEMIST Cloud, providing the users with both fragment information as well as
+reference results obtained by the classical solvers in QEMIST Cloud. The
+fragments can be passed to a quantum solver or be used for a quantum computing
+experiment.
+
+Currently, the fragment energies can only be recomputed with a quantum
+algorihtms (the interface of MI-FNO fragments and classical algorithms is not
+implemented yet).
+"""
+
+from functools import reduce
+import itertools
+import os
+import requests
+import warnings
+import json
+
+import h5py
+import numpy as np
+import pandas as pd
+
+
+class MIFNOHelper():
+    """Python object to post-process, fetch and manipulate QEMIST Cloud MI-FNO
+    results. The use case for this is to map MI-FNO subproblems into
+    fermionic Hamiltonians acting as inputs. This object keeps track of the
+    classical results.
+
+    Attributes:
+        e_tot (float): Total MI-FNO energy.
+        e_corr (float): Correlation energy (e_tot - e_mf).
+        e_mf (float): Mean-field energy.
+        frag_info (dict): Information about each fragment. The keys are related
+            to the truncation number (int). The nested dictionaries have keys
+            referring to the sampled active space (e.g. '(1,)' or '(0, 2)').
+            They contain information about the correction term, epsilon, list
+            of truncated orbitals and more.
+
+    Properties:
+        to_dataframe (pandas.DataFrame): Converted frag_info dict into a pandas
+            DataFrame.
+        fragment_ids (list of string): List of all fragment identifiers.
+        frag_info_flattened (dictionary): The nested frag_info without the first
+            layer (keys = truncation number).
+    """
+
+    def __init__(self, json_file=None, results_object=None):
+        """Initialization method to process the classical results. A json path
+        or a python dictionary object can be passed to the method (not both).
+
+        Args:
+            json_file (string): Path to a json file containing the results from
+                QEMIST Cloud.
+            results_object (dict): Classical computation results (QEMIST Cloud
+                output).
+
+        Raises:
+            ValueError: If neither or both of json_file and results_object are
+                provided.
+            KeyError: If any fragment result has no "mo_coefficients" entry.
+        """
+
+        # Raise error/warnings if input is not as expected. Only a single input
+        # must be provided to avoid conflicts.
+        if not (bool(json_file) ^ bool(results_object)):
+            raise ValueError(f"A json file path OR a dictionary object must be provided when instantiating {self.__class__.__name__}.")
+
+        if json_file:
+            assert os.path.isfile(json_file), f"The file {json_file} does not exist."
+
+            with open(json_file, "r") as f:
+                results_object = json.load(f)
+
+            # JSON object keys are always strings: restore the integer
+            # truncation numbers used as keys everywhere else in this class.
+            results_object["subproblem_data"] = {int(k): v for k, v in results_object["subproblem_data"].items()}
+
+        # Incremental (problem decomposition) quantities.
+        self.e_tot = results_object["energy_total"]
+        self.e_corr = results_object["energy_correlation"]
+        self.e_mf = results_object["mean_field_energy"]
+
+        relevant_info = {
+            "energy_total",
+            "energy_correlation",
+            "epsilon",
+            "correction",
+            "frozen_orbitals_truncated",
+            "mo_coefficients"
+        }
+
+        # Selecting only the FNO keys found in 'relevant_info'.
+        self.frag_info = dict()
+        for n_body, fragments_per_truncation in results_object["subproblem_data"].items():
+            self.frag_info[n_body] = dict()
+            for frag_id, frag_result in fragments_per_truncation.items():
+                # Verify that the MO coefficients are there for every fragment
+                # (not only the last one of each truncation level), as the
+                # other methods need them for all fragments.
+                if "mo_coefficients" not in frag_result:
+                    raise KeyError(f"MO coefficient not found in the {frag_id} "
+                        "results. Verify that the export_fragment_data flag is set "
+                        "to True for the MI-FNO calculation in QEMIST Cloud.")
+
+                self.frag_info[n_body][frag_id] = {k: frag_result.get(k, None) for k in relevant_info}
+
+    def __repr__(self):
+        """Format the object to print the energies and the fragment information
+        as a pandas.DataFrame.
+        """
+
+        str_rep = "(All the energy values are in hartree)\n" \
+                  f"Total MI-FNO energy = {self.e_tot}\n" \
+                  f"Correlation energy = {self.e_corr}\n" \
+                  f"Mean-field energy = {self.e_mf}\n" \
+                  f"{self.to_dataframe}"
+
+        return str_rep
+
+    @staticmethod
+    def _parse_frag_id(frag_id):
+        """Converts a fragment id string, e.g. "(0, 2)", into the Python
+        literal it represents (expected to be a tuple of fragment indices).
+
+        ast.literal_eval is used instead of eval because fragment ids come from
+        an external results file: only literals are accepted, no code is run.
+        """
+        return ast.literal_eval(frag_id)
+
+    @property
+    def to_dataframe(self):
+        """Outputs the fragment informations as a pandas.DataFrame."""
+        df = pd.DataFrame.from_dict(self.frag_info_flattened, orient="index")
+
+        # Replace frozen_orbitals_truncated=None with an empty list.
+        df["frozen_orbitals_truncated"] = df["frozen_orbitals_truncated"].apply(lambda d: d if isinstance(d, list) else [])
+
+        return df.drop(["mo_coefficients"], axis=1)
+
+    @property
+    def fragment_ids(self):
+        """Outputs the fragment ids in a list."""
+        return list(itertools.chain.from_iterable(self.frag_info.values()))
+
+    @property
+    def frag_info_flattened(self):
+        """Outputs the nested frag_info without the first layer.
+
+        A new dictionary is returned on every access (an empty one if there is
+        no fragment); the per-fragment dictionaries it contains are the ones
+        stored in frag_info, not copies.
+        """
+        flattened = dict()
+        for fragments in self.frag_info.values():
+            flattened.update(fragments)
+        return flattened
+
+    def retrieve_mo_coeff(self, destination_folder=None):
+        """Function to fetch molecular orbital coefficients. A download path can
+        be provided to change the directory where the files will be downloaded.
+        If the files already exist, the function skips the download step. The
+        array is stored in the ["mo_coefficients"]["array"] entry in the
+        frag_info dictionary attribute.
+
+        Args:
+            destination_folder (string): Users can specify a path to a
+                destination folder, where the files containing the coefficients
+                will be downloaded. The default value (None) is the current
+                working directory at the time of the call.
+
+        Raises:
+            FileNotFoundError: If destination_folder is not an existing
+                directory.
+            requests.HTTPError: If a download returns an HTTP error status.
+        """
+        # Resolved here and not in the signature: a default argument would be
+        # evaluated only once, when the module is imported.
+        if destination_folder is None:
+            destination_folder = os.getcwd()
+
+        if not os.path.isdir(destination_folder):
+            raise FileNotFoundError(f"The {destination_folder} path does not exist.")
+        absolute_path = os.path.abspath(destination_folder)
+
+        # For each fragment, fetch the molecular orbital coefficients from the
+        # HDF5 files.
+        n_files = len(self.fragment_ids)
+        i_file = 1
+        for n_body_fragments in self.frag_info.values():
+            for frag in n_body_fragments.values():
+                mo_info = frag["mo_coefficients"]
+                file_path = os.path.join(absolute_path, mo_info["key"] + ".hdf5")
+
+                if not os.path.exists(file_path):
+                    print(f"Downloading and writing MO coefficients file to {file_path} ({i_file} / {n_files})")
+                    response = requests.get(mo_info["s3_url"])
+
+                    # Do not cache an HTTP error page as an HDF5 file: it
+                    # would be unreadable and would block future downloads.
+                    response.raise_for_status()
+
+                    with open(file_path, "wb") as file:
+                        file.write(response.content)
+                    i_file += 1
+
+                with h5py.File(file_path, "r") as file:
+                    mo_coeff = np.array(file["mo_coefficients"])
+
+                mo_info["array"] = mo_coeff
+
+    def compute_fermionoperator(self, molecule, frag_id):
+        """Computes the fermionic Hamiltonian for a MI-FNO fragment.
+
+        Args:
+            molecule (SecondQuantizedMolecule): Full molecule description.
+            frag_id (string): Fragment id, e.g. "(0,)", "(1, 2)", ...
+
+        Returns:
+            FermionOperator: Fermionic operator for the specified fragment id.
+
+        Raises:
+            RuntimeError: If the MO coefficient arrays have not been loaded for
+                all fragments (see retrieve_mo_coeff).
+        """
+
+        if not all("array" in d["mo_coefficients"] for d in self.frag_info_flattened.values()):
+            raise RuntimeError(f"The molecular orbital coefficients are not available. Please call the {self.__class__.__name__}.retrieve_mo_coeff method.")
+
+        # The number of indices in the fragment id is the truncation number
+        # used as the first-level key of frag_info.
+        n_body = len(self._parse_frag_id(frag_id))
+        fragment = self.frag_info[n_body][frag_id]
+        mo_coeff = fragment["mo_coefficients"]["array"]
+        frozen_orbitals = fragment["frozen_orbitals_truncated"]
+
+        # Something is wrong if the molecule provided does not have the same
+        # mean-field energy.
+        assert round(molecule.mf_energy, 6) == round(self.e_mf, 6),  \
+            "The molecule's mean-field energy is different than the one from " \
+            "the results. Please verify that the molecular quantities are "\
+            "the same as the one in the MI-FNO computation."
+
+        # Returning a new molecule with the right frozen orbital.
+        new_molecule = molecule.freeze_mos(frozen_orbitals, inplace=False)
+
+        return new_molecule._get_fermionic_hamiltonian(mo_coeff)
+
+    def mi_summation(self, user_provided_energies=None):
+        r"""Recomputes the total energy for the method of increments (MI).
+        Each increment corresponds to "new" correlation energy from the n-body
+        problem. This method makes computing the total energy with new
+        results possible.
+
+        It computes the epsilons with the MP2 correction:
+        \epsilon_{i} = E_c(i)
+        \epsilon_{ij} = E_c(ij) - \epsilon_{i} - \epsilon_{j}
+        \epsilon_{ijk} = E_c(ijk) - \epsilon_{ij} - \epsilon_{ik}
+            - \epsilon_{jk} - \epsilon_{i} - \epsilon_{j} - \epsilon_{k}
+        etc.
+
+        Args:
+            user_provided_energies (dict): New energy values provided by the
+                user, used instead of the corresponding pre-computed ones. E.g.
+                {"(0,)": -1.234} or {"(1,)": -1.234, "(0, 1)": -5.678}. The
+                stored "correction" of each fragment is added to the provided
+                value.
+
+        Returns:
+            float: Method of increment total energy.
+
+        Raises:
+            KeyError: If a key of user_provided_energies is not a known
+                fragment id.
+        """
+        frag_info_flattened = self.frag_info_flattened
+
+        if user_provided_energies is None:
+            user_provided_energies = dict()
+        else:
+            fragment_correction = {k: v["correction"] for k, v in frag_info_flattened.items()}
+            user_provided_energies = {frag_id: e + fragment_correction[frag_id] for frag_id, e in user_provided_energies.items()}
+
+        fragment_energies = {k: v["energy_total"] for k, v in frag_info_flattened.items()}
+
+        # Update to consider energies taken from a calculation.
+        fragment_energies.update(user_provided_energies)
+
+        n_body_max = max(self.frag_info)
+
+        # Perform the incremental summation. Truncation levels are processed in
+        # increasing order so that the epsilons of all the sub-fragments are
+        # already known when a fragment is treated.
+        epsilons = dict()
+        for n_body in range(1, n_body_max + 1):
+            for frag_id in self.frag_info[n_body]:
+                epsilons[frag_id] = fragment_energies[frag_id] - self.e_mf
+
+                # Remove the increments of every proper, non-empty subset of
+                # the fragment (nothing to remove for 1-body fragments).
+                frag_indices = self._parse_frag_id(frag_id)
+                for n_increment in range(1, n_body):
+                    for frag_increment in itertools.combinations(frag_indices, n_increment):
+                        epsilons[frag_id] -= epsilons[str(frag_increment)]
+
+        # Warn about every epsilon > 0, i.e. a positive correlation energy
+        # increment.
+        for frag_id, eps in epsilons.items():
+            if eps > 0.:
+                warnings.warn(f"Epsilon for frag_id {frag_id} is positive "
+                    f"({eps}). With MI, there is no reason to consider a "
+                    "fragment returning a positive correlation energy. Please "
+                    "check your calculations.", RuntimeWarning)
+
+        return self.e_mf + sum(epsilons.values())
diff --git a/...ts/incremental/data/1c296842b3f2ace38fb7dfa8937cbba87fb286604018adf033df9478d17631a8.hdf5 b/...ts/incremental/data/1c296842b3f2ace38fb7dfa8937cbba87fb286604018adf033df9478d17631a8.hdf5
diff --git a/...ts/incremental/data/266b4d7beccb2d1eae4b28d22608c1c0df99e8989f5d8d5762b34c3c0a7173ab.hdf5 b/...ts/incremental/data/266b4d7beccb2d1eae4b28d22608c1c0df99e8989f5d8d5762b34c3c0a7173ab.hdf5
diff --git a/...ts/incremental/data/415b3a854809ad4f73af4bedfb8972b4f01f48872663b42f8f3980a7ba7aa616.hdf5 b/...ts/incremental/data/415b3a854809ad4f73af4bedfb8972b4f01f48872663b42f8f3980a7ba7aa616.hdf5
Original file line number	Diff line number	Diff line change
Expand Up		@@ -14,3 +14,4 @@

		from .dmet.dmet_problem_decomposition import DMETProblemDecomposition
		from .oniom.oniom_problem_decomposition import ONIOMProblemDecomposition
		from .incremental.mifno_helper import MIFNOHelper