Merge pull request #25 from biomedbigdata/quepistasis_paralleltempering

Adding parallel tempering as a backend for quepistasis
daisybio · Feb 6, 2024 · 6da8f14 · 6da8f14
2 parents 714cdc2 + 1fdcf8f
commit 6da8f14
Show file tree

Hide file tree

Showing 6 changed files with 411 additions and 1 deletion.
diff --git a/quepistasis/header/python_wrapper.h b/quepistasis/header/python_wrapper.h
@@ -25,11 +25,21 @@ class PythonWrapper {
      */
     PyObject *pModuleQAOA = nullptr;
 
+    /**
+     * Object representing the module used to interact with the Parallel Tempering procedure
+     */
+    PyObject *pModuleParallelTempering = nullptr;
+
     /**
      * Object representing the function to call "run_quantum_annealer" function in Python
      */
     PyObject *pFuncQuantumAnnealer = nullptr;
 
+    /**
+     * Object representing the function to call "run_parallel_tempering" function in Python
+     */
+    PyObject *pFuncParallelTempering = nullptr;
+
     /**
      * Object representing the function to call "run_quantum_annealer" function in Python
      */
@@ -145,6 +155,24 @@ class PythonWrapper {
         double rev_annealing_ramp_time, double rev_annealing_pause_time, double rev_annealing_s_target, 
         const char* save_path);
 
+
+    /**
+     * @brief Run the quantum annealer method in Python
+     * @param h: Ising formulation h coefficients (which in Python results in the object np.nparray[float] of shape (N,))
+     * @param j: Ising formulation J coefficients (which - together with start and end params - in Python results in the object dict[tuple(int,int) -> float])
+     * @param start: vector Ising formulation J starting index
+     * @param end: vector Ising formulation J starting index
+     * @param num_chains Number of parallel walkers
+     * @param num_steps Number of operations per walker
+     * @param save_path: Path where to save the file including the first part of the file name
+     * @return solution to the Ising problem or the empty list in case of errors.
+     */
+    std::vector<int> run_parallel_tempering(
+        std::vector<double> h, std::vector<double> J, std::vector<int> start, std::vector<int> end,
+        int num_chains, int num_steps, const char* save_path);
+
+
+
     /**
      * @brief Run the optimizers available of Azure QIO
      * @param h: Ising formulation h coefficients (which in Python results in the object np.nparray[float] of shape (N,))

diff --git a/quepistasis/header/snps_optimization.h b/quepistasis/header/snps_optimization.h
@@ -177,6 +177,16 @@ class snps_qubo_matrix : public matrix {
         char* initial_state = nullptr, const char* save_path = nullptr);
 
 
+    /**
+     * @brief Solve the current QUBO matrix with quantum annealing (call Python then D-Wave devices). In case of errors the return value is the empty vector.
+     * @param num_chains Number of parallel walkers
+     * @param num_steps Number of operations per walker
+     * @param save_path Path where to save the file including the first part of the file name
+     * @return A vector of 'n_cliques' elements, each element represents a suggested SNPs set OR the empty vector in case of errors. 
+     */
+    std::vector<std::vector<int>> solve_cpu_parallel_tempering(int num_chains, int num_steps, const char* save_path);
+
+
     /**
      * @brief Solve the current QUBO matrix with quantum annealing (call Python then D-Wave devices). In case of errors the return value is the empty vector.
      * @param token: D-Wave platform token

diff --git a/quepistasis/parallel_tempering.py b/quepistasis/parallel_tempering.py
@@ -0,0 +1,296 @@
+import numpy as np
+from abc import ABC, abstractmethod
+from utils import Trace
+from joblib import Parallel, delayed
+import random
+
+
+class ParallelTempering(ABC):
+
+    def __init__(self, num_chains, num_steps, betas):
+        """
+        Initialize the ParallelTempering instance.
+
+        Parameters:
+        - num_chains (int): Number of parallel chains.
+        - num_steps (int): Number of MCMC steps for each chain.
+        - betas (array-like): Temperatures for each chain.
+        """
+        self.num_chains = num_chains
+        self.num_steps = num_steps
+        self.betas = betas
+        self.chains = None
+        self.log_likes = None
+
+    @abstractmethod
+    def initial_probability(self):
+        """
+        Abstract method to provide the initial probability configuration for each chain.
+        """
+        pass
+
+    @abstractmethod
+    def log_like(self, x):
+        """
+        Abstract method to provide the log likelihood function for a given configuration.
+
+        Parameters:
+        - x (array-like): Configuration for which to calculate the log likelihood.
+
+        Returns:
+        - float: Log likelihood.
+        """
+        pass
+
+    @abstractmethod
+    def log_prior(self, x):
+        """
+        Abstract method to provide the log prior function for a given configuration.
+
+        Parameters:
+        - x (array-like): Configuration for which to calculate the log prior.
+
+        Returns:
+        - float: Log prior.
+        """
+        pass
+
+    def metropolis_hastings_proposal(self, x, beta):
+        """
+        Metropolis-Hastings proposal for binary variables.
+
+        Parameters:
+        - x (array-like): Current configuration.
+        - beta (float): Inverse temperature for the current chain.
+
+        Returns:
+        - array-like: Proposed configuration.
+        """
+        proposal = np.copy(x)
+        flip_index = np.random.randint(len(x))
+        proposal[flip_index] *= -1
+        return proposal
+
+    def acceptance_probability(self, old_prob, new_prob, beta):
+        """
+        Calculate the acceptance probability for the Metropolis-Hastings step.
+
+        Parameters:
+        - old_prob (float): Log probability of the current configuration.
+        - new_prob (float): Log probability of the proposed configuration.
+        - beta (float): Inverse temperature for the current chain.
+
+        Returns:
+        - float: Acceptance probability.
+        """
+        return min(1, np.exp(beta * (old_prob - new_prob)))
+
+    def initialize_chain(self, i):
+        self.chains[i, 0] = self.initial_probability()
+        self.log_likes[i, 0] = self.log_like(self.chains[i, 0]) + self.log_prior(self.chains[i, 0])
+
+    def step_chain(self, step, i):
+        current_chain = self.chains[i, step - 1]
+        current_log_prob = self.log_like(current_chain) + self.log_prior(current_chain)
+
+        # Perform Metropolis-Hastings proposal
+        proposed_chain = self.metropolis_hastings_proposal(current_chain, self.betas[i])
+
+        # Calculate log likelihood and log prior for proposed chain
+        proposed_log_prob = self.log_like(proposed_chain) + self.log_prior(proposed_chain)
+
+        # Accept or reject the proposed chain
+        if np.log(np.random.uniform()) < self.acceptance_probability(current_log_prob, proposed_log_prob, self.betas[i]):
+            self.chains[i, step] = proposed_chain
+            self.log_likes[i, step] = proposed_log_prob
+        else:
+            self.chains[i, step] = current_chain
+            self.log_likes[i, step] = current_log_prob
+
+    def run(self):
+        """
+        Run the Parallel Tempering MCMC algorithm.
+
+        Returns:
+        - tuple: Chains and log likelihoods.
+        """
+        ndim = len(self.initial_probability())
+        self.chains = np.zeros((self.num_chains, self.num_steps, ndim))
+        self.log_likes = np.zeros((self.num_chains, self.num_steps))
+
+        for i in range(self.num_chains):
+            self.initialize_chain(i)
+
+        for step in range(1, self.num_steps):
+
+            for i in range(self.num_chains):
+                self.step_chain(step, i)
+
+            # Exchange states between adjacent chains
+            for i in range(self.num_chains - 1):
+                diff_prob = self.betas[i + 1] * (self.log_likes[i, step] - self.log_likes[i + 1, step])
+                if np.log(np.random.uniform()) < diff_prob:
+                    # Swap states between chains i and i+1
+                    self.chains[i, step], self.chains[i + 1, step] = self.chains[i + 1, step], self.chains[i, step]
+                    self.log_likes[i, step], self.log_likes[i + 1, step] = self.log_likes[i + 1, step], self.log_likes[i, step]
+
+        return self.chains, self.log_likes
+
+    def run_parallel(self):
+        """
+        Run the Parallel Tempering MCMC algorithm in parallel.
+
+        Returns:
+        - tuple: Chains and log likelihoods.
+        """
+
+        ndim = len(self.initial_probability())
+        self.chains = np.zeros((self.num_chains, self.num_steps, ndim))
+        self.log_likes = np.zeros((self.num_chains, self.num_steps))
+
+        # Initialize chains and log likelihoods for each chain
+        Parallel(n_jobs=self.num_chains, backend="threading")(delayed(self.initialize_chain)(i) for i in range(self.num_chains))
+        print(self.chains)
+
+        for step in range(1, self.num_steps):
+
+            # Run Metropolis-Hastings proposals and updates in parallel
+            Parallel(n_jobs=self.num_chains, backend="threading")(delayed(self.step_chain)(step, i) for i in range(self.num_chains))
+            print(self.chains)
+
+            # Exchange states between adjacent chains
+            for i in range(self.num_chains - 1):
+                diff_prob = self.betas[i + 1] * (self.log_likes[i, step] - self.log_likes[i + 1, step])
+                if np.log(np.random.uniform()) < diff_prob:
+                    # Swap states between chains i and i+1
+                    self.chains[i, step], self.chains[i + 1, step] = self.chains[i + 1, step], self.chains[i, step]
+                    self.log_likes[i, step], self.log_likes[i + 1, step] = self.log_likes[i + 1, step], self.log_likes[i, step]
+
+        return self.chains, self.log_likes
+
+class IsingParallelTempering(ParallelTempering):
+
+    def __init__(self, h, J, num_chains, num_steps, betas):
+        """
+        Initialize the IsingParallelTempering instance.
+
+        Parameters:
+        - h (numpy array): External magnetic field.
+        - J (dictionary): Coupling strengths between spins (interaction matrix).
+        - num_chains (int): Number of parallel chains.
+        - num_steps (int): Number of MCMC steps for each chain.
+        - betas (array-like): Temperatures for each chain.
+        """
+        super().__init__(num_chains, num_steps, betas)
+        self.h = h
+        self.J = J
+        self.ising_upper = np.sum(np.abs(self.h)) + np.sum(np.abs(np.array(list(J.values()))))
+        self.ndim = len(h)
+
+    def initial_probability(self):
+        """
+        Generate the initial spin configuration.
+
+        Returns:
+        - array-like: Initial spin configuration (+1 or -1).
+        """
+        return np.random.choice([-1, 1], size=self.ndim)
+
+    @staticmethod
+    def ising_energy(x, h, J):
+        energy = np.sum(h * x)
+        for (i, j), value in J.items():
+            energy += value * x[i] * x[j]
+        return energy
+
+    def log_like(self, x):
+        """
+        Calculate the log likelihood for a given spin configuration.
+
+        Parameters:
+        - x (array-like): Spin configuration for which to calculate the log likelihood.
+
+        Returns:
+        - float: Log likelihood
+        """
+        energy = self.ising_energy(x, self.h, self.J)
+        return -1 * (self.ising_upper - energy)
+
+    def log_prior(self, x):
+        """
+        Calculate the log prior for a given spin configuration.
+
+        Parameters:
+        - x (array-like): Spin configuration for which to calculate the log prior.
+
+        Returns:
+        - float: Log prior (always 0.0 in this example).
+        """
+        return 0.0
+
+    def get_solution(self):
+        """
+        Return the solution of the optimization problem. 
+        
+        Returns:
+        - np.ndarray: spin configuration of the best solution.
+        - float: Log likelihood of the best solution.
+        - float: Energy of the best solution.
+        """
+
+        best_chain_index, best_step_index = np.unravel_index(np.argmin(self.log_likes), self.log_likes.shape)
+        best_configuration = self.chains[best_chain_index, best_step_index]
+        best_log_likelihood = self.log_likes[best_chain_index, best_step_index]
+        best_energy = self.ising_energy(best_configuration, self.h, self.J)
+        return best_configuration, best_log_likelihood, best_energy
+
+
+def sparsify_solution(spins, MAX_UP_SPIN=10):
+    # delete snps if they are too many
+    indexes_to_one = [i for i, value in enumerate(spins) if value == 1]
+    if len(indexes_to_one) > MAX_UP_SPIN:
+        random.shuffle(indexes_to_one)
+        for idx in indexes_to_one[MAX_UP_SPIN:]:
+            spins[idx] = -1
+    return spins
+
+
+def run_parallel_tempering(h, J, num_chains, num_steps, save_path):
+
+    # trace the input except for the qubo formulation itself which is too large
+    trace = Trace(print=True, path=save_path)
+    trace.add('input', None, 'num_chains', num_chains)
+    trace.add('input', None, 'num_steps', num_steps)
+    trace.add('input', None, 'save_path', save_path)
+    betas = np.geomspace(1, 1e-2, num_chains)
+    ising_pt = IsingParallelTempering(h, J, num_chains, num_steps, betas)
+    ising_pt.run_parallel()
+    spins, loglike, energy = ising_pt.get_solution()
+    spins = [int(i) for i in spins.tolist()]
+    trace.add('solution', 'original', 'spins', spins)
+    trace.add('solution', 'original', 'loglike', loglike)
+    trace.add('solution', 'original', 'energy', energy)
+    spins = sparsify_solution(spins, 10)
+    trace.add('solution', 'sparsified', 'spins', spins)
+    trace.add('solution', 'sparsified', 'loglike', None)
+    trace.add('solution', 'sparsified', 'energy', IsingParallelTempering.ising_energy(spins, h, J))
+    return spins
+
+def test_parallel_tempering(parallel=False):
+    """
+    Run a basic Ising model to check if the code works correctly.
+    """
+    h = np.array([5, 10, -20])
+    J = {(0, 1): 1, (1, 2): 2}
+
+    num_chains = 2
+    num_steps = 3
+    betas = np.geomspace(1, 1e-2, num_chains)
+
+    ising_pt = IsingParallelTempering(h, J, num_chains, num_steps, betas)
+    if parallel:
+        ising_pt.run_parallel()
+    else:
+        ising_pt.run()
+    spins, loglike, energy = ising_pt.get_solution()
+    print(f"{spins=} {loglike=} {energy=}")
diff --git a/quepistasis/quantum_annealer.py b/quepistasis/quantum_annealer.py
@@ -265,7 +265,7 @@ def run_quantum_annealer(token, h, J, num_reads, solver_idx,
     client.close()
     trace.save()
 
-    if best_fw_energy > best_fw_energy:
+    if best_fw_energy > best_rev_energy:
         return best_fw_sample if type(best_fw_sample) == 'list' else best_fw_sample.tolist()
     else:
         return best_rev_sample if type(best_rev_sample) == 'list' else best_rev_sample.tolist()