import openmmtools.cache as cache
import os
import copy
from perses.dispersed.utils import *
from openmmtools.states import ThermodynamicState, CompoundThermodynamicState, SamplerState
import numpy as np
import mdtraj as md
import simtk.unit as unit
import logging
import time
from collections import namedtuple
from perses.annihilation.lambda_protocol import LambdaProtocol
from perses.annihilation.lambda_protocol import RelativeAlchemicalState
from perses.dispersed import *
import random
import pymbar
from perses.dispersed.parallel import Parallelism
from openmmtools import utils
# Instantiate logger
logging.basicConfig(level = logging.NOTSET)
_logger = logging.getLogger("sMC")
_logger.setLevel(logging.INFO)
cache.global_context_cache.platform = configure_platform(utils.get_fastest_platform().getName())
EquilibriumFEPTask = namedtuple('EquilibriumFEPTask', ['sampler_state', 'inputs', 'outputs'])
DISTRIBUTED_ERROR_TOLERANCE = 1e-4
class SequentialMonteCarlo():
"""
This class represents an sMC particle that runs a nonequilibrium switching protocol.
It is a batteries-included engine for conducting sequential Monte Carlo sampling.
    WARNING: take care when writing trajectory files, as saving positions to memory is costly. Either do not write configurations, or save positions sparsely.
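    Examples
    --------
    A minimal usage sketch (not run as a doctest), assuming ``htf`` is a prepared
    HybridTopologyFactory-compatible object; argument values are illustrative only::

        smc = SequentialMonteCarlo(htf, internal_parallelism = None)
        smc.minimize_sampler_states()
        smc.equilibrate(n_equilibration_iterations = 10, decorrelate = True)
        smc.AIS(num_particles = 100)
        print(smc.dg_EXP, smc.dg_BAR)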
"""
supported_resampling_methods = {'multinomial': multinomial_resample}
supported_observables = {'ESS': ESS, 'CESS': CESS}
def __init__(self,
factory,
lambda_protocol = 'default',
temperature = 300 * unit.kelvin,
trajectory_directory = 'test',
trajectory_prefix = 'out',
atom_selection = 'not water',
timestep = 1 * unit.femtoseconds,
collision_rate = 1 / unit.picoseconds,
eq_splitting_string = 'V R O R V',
neq_splitting_string = 'V R O R V',
ncmc_save_interval = None,
measure_shadow_work = False,
neq_integrator = 'langevin',
compute_endstate_correction = True,
external_parallelism = None,
internal_parallelism = {'library': ('dask', 'LSF'),
'num_processes': 2}
):
"""
Parameters
----------
factory : perses.annihilation.relative.HybridTopologyFactory - compatible object
lambda_protocol : str, default 'default'
the flavor of scalar lambda protocol used to control electrostatic, steric, and valence lambdas
temperature : float unit.Quantity
Temperature at which to perform the simulation, default 300K
trajectory_directory : str, default 'test'
Where to write out trajectories resulting from the calculation. If None, no writing is done.
        trajectory_prefix : str, default 'out'
            What prefix to use for this calculation's trajectory files. If None, no writing is done.
atom_selection : str, default not water
MDTraj selection syntax for which atomic coordinates to save in the trajectories. Default strips
all water.
timestep : float unit.Quantity, default 1 * units.femtoseconds
the timestep for running MD
collision_rate : float unit.Quantity, default 1 / unit.picoseconds
the collision rate for running MD
eq_splitting_string : str, default 'V R O R V'
The integrator splitting to use for equilibrium simulation
neq_splitting_string : str, default 'V R O R V'
The integrator splitting to use for nonequilibrium switching simulation
ncmc_save_interval : int, default None
interval with which to write ncmc trajectory. If None, trajectory will not be saved.
            We assert that n_lambdas % ncmc_save_interval == 0; otherwise, the protocol will not be saved completely
measure_shadow_work : bool, default False
whether to measure the shadow work of the integrator.
WARNING : this is not currently supported
neq_integrator : str, default 'langevin'
which integrator to use
compute_endstate_correction : bool, default True
whether to compute the importance weight to the alchemical endstates
external_parallelism : dict('parallelism': perses.dispersed.parallel.Parallelism, 'available_workers': list(str)), default None
an external parallelism dictionary;
external_parallelism is used if the entire SequentialMonteCarlo class is allocated workers by an external client (i.e.
there exists a Parallelism.client object that is allocating distributed workers to several SequentialMonteCarlo classes simultaneously)
internal_parallelism : dict, default {'library': ('dask', 'LSF'), 'num_processes': 2}
            dictionary of parameters used to instantiate a client and run parallel computation internally; internal parallelization is handled by default.
            If None, external worker arguments must be specified; otherwise, no parallel computation is conducted and annealing is run locally.
internal_parallelism is used when the SequentialMonteCarlo class is allowed to create its own Parallelism.client object to allocate workers on a
cluster.
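        Examples
        --------
        A sketch of the two mutually exclusive parallelism arguments (the worker names and the
        ``my_parallelism`` object are placeholders)::

            #internal: the class creates and manages its own Parallelism client
            internal_parallelism = {'library': ('dask', 'LSF'), 'num_processes': 2}

            #external: an already-activated Parallelism object lends a set of named workers
            external_parallelism = {'parallelism': my_parallelism,
                                    'available_workers': ['worker_0', 'worker_1']}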
"""
_logger.info(f"Initializing SequentialMonteCarlo")
#pull necessary attributes from factory
self.factory = factory
#context cache
self.context_cache = cache.global_context_cache
#use default protocol
self.lambda_protocol = lambda_protocol
#handle both eq and neq parameters
self.temperature = temperature
self.timestep = timestep
self.collision_rate = collision_rate
self.measure_shadow_work = measure_shadow_work
self.neq_integrator = neq_integrator
if measure_shadow_work:
raise Exception(f"measure_shadow_work is not currently supported. Aborting!")
#handle equilibrium parameters
self.eq_splitting_string = eq_splitting_string
#handle storage and names
self.trajectory_directory = trajectory_directory
self.trajectory_prefix = trajectory_prefix
self.atom_selection = atom_selection
#handle neq parameters
self.neq_splitting_string = neq_splitting_string
self.ncmc_save_interval = ncmc_save_interval
#lambda states:
self.lambda_endstates = {'forward': [0.0,1.0], 'reverse': [1.0, 0.0]}
#instantiate trajectory filenames
if self.trajectory_directory and self.trajectory_prefix:
self.write_traj = True
self.eq_trajectory_filename = {lambda_state: os.path.join(os.getcwd(), self.trajectory_directory, f"{self.trajectory_prefix}.eq.lambda_{lambda_state}.h5") for lambda_state in self.lambda_endstates['forward']}
self.neq_traj_filename = {direct: os.path.join(os.getcwd(), self.trajectory_directory, f"{self.trajectory_prefix}.neq.lambda_{direct}") for direct in self.lambda_endstates.keys()}
self.topology = self.factory.hybrid_topology
else:
self.write_traj = False
self.eq_trajectory_filename = {0: None, 1: None}
self.neq_traj_filename = {'forward': None, 'reverse': None}
self.topology = None
# subset the topology appropriately:
self.atom_selection_string = atom_selection
if self.atom_selection_string is not None:
atom_selection_indices = self.factory.hybrid_topology.select(self.atom_selection_string)
self.atom_selection_indices = atom_selection_indices
else:
self.atom_selection_indices = None
# instantiating equilibrium file/rp collection dicts
self._eq_dict = {0: [], 1: [], '0_decorrelated': None, '1_decorrelated': None, '0_reduced_potentials': [], '1_reduced_potentials': []}
self._eq_files_dict = {0: [], 1: []}
self._eq_timers = {0: [], 1: []}
self._neq_timers = {'forward': [], 'reverse': []}
#instantiate nonequilibrium work dicts: the keys indicate from which equilibrium thermodynamic state the neq_switching is conducted FROM (as opposed to TO)
self.cumulative_work = {'forward': [], 'reverse': []}
self.incremental_work = copy.deepcopy(self.cumulative_work)
self.shadow_work = copy.deepcopy(self.cumulative_work)
self.nonequilibrium_timers = copy.deepcopy(self.cumulative_work)
self.total_jobs = 0
#self.failures = copy.deepcopy(self.cumulative_work)
self.dg_EXP = copy.deepcopy(self.cumulative_work)
self.dg_BAR = None
#instantiate thermodynamic state
lambda_alchemical_state = RelativeAlchemicalState.from_system(self.factory.hybrid_system)
lambda_alchemical_state.set_alchemical_parameters(0.0, LambdaProtocol(functions = self.lambda_protocol))
self.thermodynamic_state = CompoundThermodynamicState(ThermodynamicState(self.factory.hybrid_system, temperature = self.temperature),composable_states = [lambda_alchemical_state])
# set the SamplerState for the lambda 0 and 1 equilibrium simulations
sampler_state = SamplerState(self.factory.hybrid_positions,
box_vectors=self.factory.hybrid_system.getDefaultPeriodicBoxVectors())
self.sampler_states = {0: copy.deepcopy(sampler_state), 1: copy.deepcopy(sampler_state)}
#endstate corrections?
self.compute_endstate_correction = compute_endstate_correction
#implement the appropriate parallelism
self.implement_parallelism(external_parallelism = external_parallelism,
internal_parallelism = internal_parallelism)
def implement_parallelism(self, external_parallelism, internal_parallelism):
"""
        Function to implement the appropriate parallelism given input arguments.
This is exposed as a method in case the class already exists and the user wants to change the parallelism scheme.
Parameters
----------
external_parallelism : dict('parallelism': perses.dispersed.parallel.Parallelism, 'available_workers': list(str)), default None
an external parallelism dictionary
internal_parallelism : dict, default {'library': ('dask', 'LSF'), 'num_processes': 2}
            dictionary of parameters used to instantiate a client and run parallel computation internally; internal parallelization is handled by default.
            If None, external worker arguments must be specified; otherwise, no parallel computation is conducted and annealing is run locally.
"""
#parallelism implementables
if external_parallelism is not None and internal_parallelism is not None:
raise Exception(f"external parallelism were given, but an internal parallelization scheme was also specified. Aborting!")
if external_parallelism is not None:
self.external_parallelism, self.internal_parallelism = True, False
            self.parallelism, self.workers = external_parallelism['parallelism'], external_parallelism['available_workers']
            self.parallelism_parameters = external_parallelism
            assert self.parallelism.client is not None, f"the external parallelism object does not yet have an activated client."
elif internal_parallelism is not None:
self.external_parallelism, self.internal_parallelism = False, True
self.parallelism, self.workers = Parallelism(), internal_parallelism['num_processes']
self.parallelism_parameters = internal_parallelism
else:
_logger.warning(f"both internal and external parallelisms are unspecified. Defaulting to not_parallel.")
self.external_parallelism, self.internal_parallelism = False, True
self.parallelism_parameters = {'library': None, 'num_processes': None}
self.parallelism, self.workers = Parallelism(), 0
def _activate_annealing_workers(self):
"""
wrapper to distribute workers and create appropriate worker attributes for annealing
"""
_logger.debug(f"activating annealing workers...")
if self.internal_parallelism:
_logger.debug(f"found internal parallelism; activating client with the following parallelism parameters: {self.parallelism_parameters}")
#we have to activate the client
self.parallelism.activate_client(library = self.parallelism_parameters['library'],
num_processes = self.parallelism_parameters['num_processes'])
workers = list(self.parallelism.workers.values())
elif self.external_parallelism:
#the client is already active
workers = self.parallelism_parameters['available_workers']
else:
raise Exception(f"either internal or external parallelism must be True.")
#now client.run to broadcast the vars
broadcast_remote_worker = 'remote' if self.parallelism.client is not None else self
addresses = self.parallelism.run_all(func = activate_LocallyOptimalAnnealing, #func
arguments = (copy.deepcopy(self.thermodynamic_state), #arg: thermodynamic state
broadcast_remote_worker, #arg: remote worker
self.lambda_protocol, #arg: lambda protocol
self.timestep, #arg: timestep
self.collision_rate, #arg: collision_rate
self.temperature, #arg: temperature
self.neq_splitting_string, #arg: neq_splitting string
self.ncmc_save_interval, #arg: ncmc_save_interval
self.topology, #arg: topology
self.atom_selection_indices, #arg: subset atoms
self.measure_shadow_work, #arg: measure_shadow_work
self.neq_integrator, #arg: integrator,
self.compute_endstate_correction #arg: compute_endstate_correction
),
workers = workers) #workers
def _deactivate_annealing_workers(self):
"""
wrapper to deactivate workers and delete appropriate worker attributes for annealing
"""
if self.internal_parallelism:
_logger.debug(f"\t\tfound internal parallelism; deactivating client.")
#we have to deactivate the client
if self.parallelism.client is None:
#then we are running local annealing
deactivate_worker_attributes(remote_worker = self)
self.parallelism.deactivate_client()
elif self.external_parallelism:
#the client is already active; we don't have the authority to deactivate
workers = self.parallelism_parameters['available_workers']
pass_remote_worker = 'remote' if self.parallelism.client is not None else self
deactivate_worker_attributes(remote_worker = pass_remote_worker)
else:
raise Exception(f"either internal or external parallelism must be True.")
def AIS(self,
num_particles,
protocols = {'forward': np.linspace(0,1, 1000), 'reverse': np.linspace(1,0,1000)},
num_integration_steps = 1,
return_timer = False,
rethermalize = False):
"""
Conduct vanilla AIS (i.e. nonequilibrium switching FEP) with a given protocol (for each direction), specified annealing time per lambda, and support for rethermalization (i.e. velocity resampling)
NOTE: AIS is NaN-safe
Parameters
----------
num_particles : int
number of particles to run in each direction
protocols : dict of {direction : np.array}, default {'forward': np.linspace(0,1, 1000), 'reverse': np.linspace(1,0,1000)},
            the dictionary of forward and reverse annealing protocols; unlike sMC, AIS does not support trailblazing, so explicit protocols must be given
num_integration_steps : int
number of integration steps per proposal
return_timer : bool, default False
whether to time the annealing protocol
rethermalize : bool, default False
whether to rethermalize velocities after proposal
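        Examples
        --------
        A minimal sketch (not run as a doctest), assuming ``smc`` is a constructed SequentialMonteCarlo instance
        and decorrelated equilibrium snapshots have already been generated with ``equilibrate(..., decorrelate = True)``;
        the particle count is illustrative::

            smc.AIS(num_particles = 100,
                    protocols = {'forward': np.linspace(0, 1, 1000), 'reverse': np.linspace(1, 0, 1000)},
                    num_integration_steps = 1)
            forward_works = smc.cumulative_work['forward'] #shape: (num_successful_particles, num_lambda_windows)
            dg_forward = smc.dg_EXP['forward'][-1] #EXP estimate (and uncertainty) at the final lambda window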
"""
_logger.debug(f"conducting vanilla AIS")
directions = list(protocols.keys())
for _direction in directions:
assert _direction in ['forward', 'reverse'], f"direction {_direction} is not an appropriate direction"
self.protocols = protocols
self._activate_annealing_workers()
if self.internal_parallelism:
workers = None
elif self.external_parallelism:
workers = self.parallelism_parameters['available_workers']
_logger.debug(f"\tin choosing the remote worker, the parallelism client is: {self.parallelism.client}")
remote_worker = 'remote' if self.parallelism.client is not None else self
_logger.debug(f"\tthe remote worker is: {remote_worker}")
sMC_futures = {_direction: None for _direction in directions} # initialize futures with None objects (we only collect these once)
sMC_sampler_states = {_direction: np.array([self.pull_trajectory_snapshot(int(self.protocols[_direction][0])) for _ in range(num_particles)]) for _direction in directions}
#Note: we can also add functionality to launch jobs on-the-fly, but for now we just randomly pull equilibrium snapshots from a pre-computed equilibrium distribution
self.sMC_timers = {_direction: None for _direction in directions} #the timers are collected once per particle
        sMC_cumulative_works = {_direction : None for _direction in directions} #again, these are only collected once
worker_retrieval = {} #this is an on-the-fly timer for each direction...
self.particle_failures = {_direction: None for _direction in directions} #log the particle failures
self.endstate_corrections = {_direction: None for _direction in directions} # log the endstate corrections
for _direction in directions:
worker_retrieval[_direction] = time.time()
_logger.info(f"entering {_direction} direction to launch annealing jobs.")
#make iterable lists for anneal deployment
iterables = []
iterables.append([remote_worker] * num_particles) #remote_worker
iterables.append(list(sMC_sampler_states[_direction])) #sampler_state
iterables.append([self.protocols[_direction]] * num_particles) #lambdas
iterables.append([None]*num_particles) #noneq_trajectory_filename
iterables.append([num_integration_steps] * num_particles) #num_integration_steps
iterables.append([return_timer] * num_particles) #return timer
            iterables.append([False] * num_particles) #return_sampler_state
iterables.append([rethermalize] * num_particles) #rethermalize
_compute_incremental_works = [True] * num_particles #only compute incremental work remotely if it is AIS
iterables.append(_compute_incremental_works) # whether to compute incremental works
for job in range(num_particles):
if self.ncmc_save_interval is not None: #check if we should make 'trajectory_filename' not None
iterables[3][job] = self.neq_traj_filename[_direction] + f".iteration_{job:04}.h5"
scattered_futures = [self.parallelism.scatter(iterable) for iterable in iterables]
sMC_futures[_direction] = self.parallelism.deploy(func = call_anneal_method,
arguments = tuple(scattered_futures),
workers = workers)
assert len(sMC_futures[_direction]) == num_particles, f"num_particles ({num_particles}) and the length of futures ({len(sMC_futures[_direction])}) do not match"
#collect futures into one list and see progress
all_futures = [item for sublist in list(sMC_futures.values()) for item in sublist]
self.parallelism.progress(futures = all_futures)
#now we collect the finished futures
_collected_observables = {}
for _direction in directions:
_logger.debug(f"collecting annealing jobs in direction {_direction}...")
_futures = self.parallelism.gather_results(futures = sMC_futures[_direction], omit_errors = True)
if remote_worker == 'remote':
assert len(_futures) == num_particles, f"num_particles ({num_particles}) and the length of the collected futures ({len(_futures)}) do not match. _all_anneal_method is supposed to be safe!"
#collect tuple results
_incremental_works = [_iter[0] for _iter in _futures]
_sampler_states = [_iter[1] for _iter in _futures]
_timers = [_iter[2] for _iter in _futures]
_passes = [_iter[3] for _iter in _futures]
return_endstate_corrections = [_iter[4] for _iter in _futures]
pass_indices = [index for index in range(num_particles) if _passes[index] == True]
successful_incremental_works = [item for index, item in enumerate(_incremental_works) if _passes[index] == True]
failed_annealing_jobs = [index for index, item in enumerate(_incremental_works) if _passes[index] == False]
assert all(q is not None for q in successful_incremental_works), f"all passing annealing jobs have been filtered but are still returning NoneType objects"
_logger.debug(f"\tfailed annealing jobs: {failed_annealing_jobs}")
self.particle_failures[_direction] = failed_annealing_jobs if len(failed_annealing_jobs) > 0 else None
self.endstate_corrections[_direction] = [item for index, item in enumerate(return_endstate_corrections) if _passes[index] == True]
#append the incremental works
_logger.debug(f"\tincremental works for direction {_direction}: {np.array(_incremental_works).shape}")
_concatenated_incremental_work = np.concatenate((np.array([np.zeros(len(successful_incremental_works))]).T, np.array(successful_incremental_works)), axis = 1)
sMC_cumulative_works[_direction] = np.cumsum(_concatenated_incremental_work, axis = 1)
_logger.debug(f"\tsMC cumulative works for direction {_direction}: {sMC_cumulative_works[_direction]}")
assert np.std(sMC_cumulative_works[_direction][:,0]) <= np.std(sMC_cumulative_works[_direction][:,-1]), f"the variance of the particle weights is not increasing..."
#append the _timers
self.sMC_timers[_direction] = _timers if return_timer else None
print(f"\t{_direction} retrieval time: {time.time() - worker_retrieval[_direction]}")
_logger.debug(f"deactivating annealing workers...")
self._deactivate_annealing_workers()
self.compute_sMC_free_energy(sMC_cumulative_works)
_logger.debug(f"terminating AIS successfully!")
def sMC(self,
num_particles,
protocols = {'forward': np.linspace(0,1, 1000), 'reverse': np.linspace(1,0,1000)},
trailblaze = None,
resample = None,
directions = ['forward','reverse'],
num_integration_steps = 1,
return_timer = False,
rethermalize = False):
"""
Conduct SequentialMonteCarlo sampling with a trailblazed protocol. Resampling is supported.
Parameters
----------
num_particles : int
number of particles to run in each direction
protocols : dict of {direction : np.array}, default {'forward': np.linspace(0,1, 1000), 'reverse': np.linspace(1,0,1000)},
the dictionary of forward and reverse protocols. if None, the protocols will be trailblazed.
trailblaze : dict, default None
which observable/criterion to use for trailblazing and the threshold
if None, trailblazing is not conducted;
else: the dict must have the following format:
{'criterion': str, 'threshold': float}
resample : dict, default None
the resample dict specifies the resampling criterion and threshold, as well as the resampling method used. if None, no resampling is conduced;
otherwise, the resample dict must take the following form:
{'criterion': str, 'method': str, 'threshold': float}
        directions : list of str, default ['forward', 'reverse']
            the directions to run.
num_integration_steps : int
number of integration steps per proposal
return_timer : bool, default False
whether to time the annealing protocol
rethermalize : bool, default False
whether to rethermalize velocities after proposal
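        Examples
        --------
        Sketches of the expected ``resample`` and ``trailblaze`` dictionaries, assuming ``smc`` is a constructed
        SequentialMonteCarlo instance; the criterion and method strings must be keys of ``supported_observables``
        and ``supported_resampling_methods``::

            #fixed protocol with multinomial resampling at an ESS threshold of 0.5
            resample = {'criterion': 'ESS', 'method': 'multinomial', 'threshold': 0.5}
            smc.sMC(num_particles = 100,
                    protocols = {'forward': np.linspace(0, 1, 100), 'reverse': np.linspace(1, 0, 100)},
                    resample = resample)

            #trailblazed protocol instead of a fixed one (pass protocols = None)
            trailblaze = {'criterion': 'CESS', 'threshold': 0.999}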
"""
_logger.debug(f"conducting generalized sMC...")
_logger.debug(f"conducting argument assertions...")
#direction assertions
for _direction in directions:
assert _direction in ['forward', 'reverse'], f"direction {_direction} is not an appropriate direction"
starting_lines, finish_lines = {}, {}
#check protocols:
if protocols is not None:
assert trailblaze is None, f"neither 'protocols' nor 'trailblaze' is None. Conflict!"
            assert all(_key in directions for _key in protocols), f"'protocols' contains a direction that is not in the supported directions ({directions})"
assert all(type(_val) == np.ndarray for _val in protocols.values()), f"all dictionary values in 'protocols' must be np.ndarrays"
_trailblaze = False
else:
_logger.debug(f"protocols is None; attempting to parse 'trailblaze'")
assert trailblaze is not None, f"both 'protocols' and 'trailblaze' are None; there is no annealing to conduct."
if trailblaze is not None:
assert set(trailblaze.keys()) == set(['criterion', 'threshold']), f"the trailblaze keys are not supported"
assert trailblaze['criterion'] in list(self.supported_observables.keys()), f"the specified trailblazing criterion is not supported"
assert type(trailblaze['threshold']) == float, f"the specified trailblaze threshold is not a float"
_trailblaze = True
#create end-to-ends
_logger.debug(f"conducting end-to-end builds...")
        if 'forward' in directions:
            if protocols is not None:
                assert protocols['forward'][0] == 0.0 and protocols['forward'][-1] == 1.0, f"the forward protocol must start at 0.0 and end at 1.0"
            starting_lines['forward'] = 0.0
            finish_lines['forward'] = 1.0
        if 'reverse' in directions:
            if protocols is not None:
                assert protocols['reverse'][0] == 1.0 and protocols['reverse'][-1] == 0.0, f"the reverse protocol must start at 1.0 and end at 0.0"
            starting_lines['reverse'] = 1.0
            finish_lines['reverse'] = 0.0
#check resample
if resample is not None:
_logger.debug(f"resample is not None; conducting resampling assertions...")
            assert set(resample.keys()) == set(['criterion', 'method', 'threshold']), f"'resample' does not contain the appropriate keys; see documentation"
assert resample['criterion'] in list(self.supported_observables.keys()), f"the specified resampling criterion is not supported"
assert resample['method'] in list(self.supported_resampling_methods), f"the specified resampling method is not supported."
            assert type(resample['threshold']) == float, f"the resampling threshold must be a float"
_resample = True
else:
_logger.debug(f"resampling is None")
_resample = False
#initialize the new protocols
_logger.debug(f"initializing protocols...")
        if _trailblaze:
            self.protocols = {_direction : [starting_lines[_direction]] for _direction in directions}
        else:
            self.protocols = protocols
_logger.debug(f"\tinitial protocols: {self.protocols}")
_logger.debug(f"activating annealing workers")
self._activate_annealing_workers()
if self.internal_parallelism:
workers = None
elif self.external_parallelism:
workers = self.parallelism_parameters['available_workers']
_logger.debug(f"\tin choosing the remote worker, the parallelism client is: {self.parallelism.client}")
remote_worker = 'remote' if self.parallelism.client is not None else self
_logger.debug(f"\tthe remote worker is: {remote_worker}")
sMC_futures = {_direction: None for _direction in directions}
_logger.debug(f"\tsMC_futures: {sMC_futures}")
        sMC_sampler_states = {_direction: None for _direction in directions} #sampler states are pulled from equilibrium at iteration 0
_logger.debug(f"\tsMC_sampler_states: {sMC_sampler_states}")
sMC_timers = {_direction: [] for _direction in directions}
_logger.debug(f"sMC_timers: {sMC_timers}")
sMC_incremental_works = {_direction: None for _direction in directions}
_logger.debug(f"\tsMC_incremental_works: {sMC_incremental_works}")
sMC_cumulative_works = {_direction : [np.zeros(num_particles)] for _direction in directions}
_logger.debug(f"\tsMC_cumulative_works: {sMC_cumulative_works}")
sMC_observables = {_direction : [] for _direction in directions}
_logger.debug(f"\tsMC_observables: {sMC_observables}")
sMC_particle_ancestries = {_direction : [np.arange(num_particles)] for _direction in directions}
_logger.debug(f"\tsMC_particle_ancestries: {sMC_particle_ancestries}")
worker_retrieval = {}
_lambdas = {}
#now we can launch annealing jobs and manage them on-the-fly
        current_lambdas = dict(starting_lines) #copy so that starting_lines is not mutated during annealing
iteration_number = 0
_logger.debug(f"commencing annealing...")
while current_lambdas != finish_lines:
_logger.debug(f"entering iteration {iteration_number}; current_lambdas are {current_lambdas}")
start_timer = time.time()
#sample/resample
_logger.debug(f"\tattempting sampling/resampling...")
for _direction in directions:
if current_lambdas[_direction] == finish_lines[_direction]: #if this direction is done...
_logger.info(f"\tdirection {_direction} is complete. omitting resample.")
continue
if iteration_number == 0: #this is the first iteration and we have to pull sampler states unbiasedly
sMC_sampler_states.update({_direction: np.array([self.pull_trajectory_snapshot(int(self.protocols[_direction][0])) for _ in range(num_particles)])})
elif _resample:
_logger.debug(f"\tattempting to resample particles...")
#Note: the cumulative works we pull for resampling are not the last cumulative works, but the second to last.
#the last cumulative works are the penultimate cumulative works plus the incremental works;
                    #however, the resampling criteria (if conditional) often require the separation of cumulative and incremental works;
#implicitly, self._resample will compute the ultimate cumulative works
normalized_observable_value, resampled_works, resampled_indices, resample_bool = self._resample(incremental_works = sMC_incremental_works[_direction],
cumulative_works = sMC_cumulative_works[_direction][-2],
observable = resample['criterion'],
resampling_method = resample['method'],
resample_observable_threshold = resample['threshold'])
if resample_bool:
_logger.debug(f"\tresample is True")
sMC_observables[_direction][-1] = normalized_observable_value #update the previous observables with the resampled observable
sMC_cumulative_works[_direction][-1] = resampled_works #update the ultimate cumulative work
#we need a deepcopy to prevent annealing over the same sampler state in a single iteration with local annealing
new_sampler_states = np.array([copy.deepcopy(sMC_sampler_states[_direction][i]) for i in resampled_indices])
sMC_sampler_states.update({_direction: new_sampler_states})
else:
#we don't need to update the ultimate observables, cumulative works, or sampler_states
pass
#however, we do need to update the particle ancestries...
new_particle_ancestries = np.array([sMC_particle_ancestries[_direction][-1][i] for i in resampled_indices])
sMC_particle_ancestries[_direction].append(new_particle_ancestries)
else: #we are not resampling
#the sampler states are updated by gathering the workers' sampler states
#the observables are calculated in the trailblaze attempt pass
#the cumulative works are unchanged
#we do not return particle ancestries if no resampling is conducted
_logger.debug(f"not resampling. omitting sMC updates")
#attempt to trailblaze lambdas and launch workers
_logger.debug(f"\tincrementing lambdas...")
for _direction in directions:
if current_lambdas[_direction] == finish_lines[_direction]: #if this direction is done...
_logger.debug(f"\tdirection {_direction} is complete. omitting trailblazing.")
continue
if _trailblaze:
_logger.debug(f"\ttrailblazing lambdas in {_direction} direction")
#gather sampler states and cumulative works in a concurrent manner (i.e. flatten them)
sampler_states = sMC_sampler_states[_direction]
cumulative_works = sMC_cumulative_works[_direction][-1]
if iteration_number == 0:
initial_guess = None
else:
initial_guess = min([2 * self.protocols[_direction][-1] - self.protocols[_direction][-2], 1.0]) if _direction == 'forward' else max([2 * self.protocols[_direction][-1] - self.protocols[_direction][-2], 0.0])
_new_lambda, normalized_observable, incremental_works = self.binary_search(sampler_states = sampler_states,
cumulative_works = cumulative_works,
start_val = current_lambdas[_direction],
end_val = finish_lines[_direction],
observable = self.supported_observables[trailblaze['criterion']],
                                                                                               observable_threshold = trailblaze['threshold'] * (sMC_observables[_direction][-1] if sMC_observables[_direction] else 1.0),
initial_guess = initial_guess)
sMC_incremental_works.update({_direction: incremental_works})
_logger.info(f"\t\tlambda increments: {current_lambdas[_direction]} to {_new_lambda}.")
_logger.info(f"\t\tnormalized observable: {normalized_observable}. Observable threshold is {trailblaze['threshold'] * sMC_observables[_direction][-1]}")
self.protocols[_direction].append(_new_lambda)
sMC_observables[_direction].append(normalized_observable)
_lambdas.update({_direction: np.array([current_lambdas[_direction], _new_lambda])})
#the current lambdas will be updated at the end of the loop
else:
                    start_val, end_val = self.protocols[_direction][iteration_number], self.protocols[_direction][iteration_number + 1]
                    _logger.debug(f"\tnot trailblazing; annealing lambda from {start_val} to {end_val}")
                    self.thermodynamic_state.set_alchemical_parameters(start_val, LambdaProtocol(functions = self.lambda_protocol))
                    current_rps = np.array([compute_reduced_potential(self.thermodynamic_state, sampler_state) for sampler_state in sMC_sampler_states[_direction]])
                    #if we are not trailblazing, the local observable is computed with the resampling criterion (falling back to 'ESS' if no resampling is requested)
                    _observable_function = self.supported_observables[resample['criterion']] if _resample else self.supported_observables['ESS']
                    normalized_observable, incremental_works = self.compute_lambda_increment(end_val, sMC_sampler_states[_direction], _observable_function, current_rps, sMC_cumulative_works[_direction][-1])
                    sMC_incremental_works.update({_direction: incremental_works})
                    sMC_observables[_direction].append(normalized_observable)
                    _lambdas.update({_direction: np.array([start_val, end_val])})
#the current lambdas will be updated at the end of the loop
#now we want to execute distributed/local annealing depending on the remote worker
_logger.debug(f"\tconducting annealing execution...")
for _direction in directions:
if current_lambdas[_direction] == finish_lines[_direction]:
_logger.info(f"\tdirection {_direction} is complete. omitting annealing")
continue
worker_retrieval[_direction] = time.time()
_logger.info(f"\t\tentering {_direction} direction to launch annealing jobs.")
_logger.info(f"\t\tthe current lambdas for annealing are {_lambdas[_direction]}")
#make construct iterable list for distributed annealing
iterables = []
iterables.append([remote_worker] * num_particles) #remote_worker
iterables.append(list(sMC_sampler_states[_direction])) #sampler_state
iterables.append([_lambdas[_direction]] * num_particles) #lambdas
iterables.append([None]*num_particles) #noneq_trajectory_filename
iterables.append([num_integration_steps] * num_particles) #num_integration_steps
iterables.append([return_timer] * num_particles) #return timer
iterables.append([True] * num_particles) #return_sampler_state
iterables.append([rethermalize] * num_particles) #rethermalize
iterables.append([True] * num_particles) # whether to compute incremental works
for job in range(num_particles):
if self.ncmc_save_interval is not None: #check if we should make 'trajectory_filename' not None
                        iterables[3][job] = self.neq_traj_filename[_direction] + f".iteration_{job:04}.h5"
scattered_futures = [self.parallelism.scatter(iterable) for iterable in iterables]
sMC_futures.update({_direction: self.parallelism.deploy(func = call_anneal_method,
arguments = tuple(scattered_futures),
workers = workers)})
#collect futures into one list and see progress
all_futures = [item for sublist in list(sMC_futures.values()) for item in sublist]
self.parallelism.progress(futures = all_futures)
#now we collect the finished futures
_logger.debug(f"\tretreiving annealing executions...")
for _direction in directions:
if current_lambdas[_direction] == finish_lines[_direction]:
_logger.info(f"\tdirection {_direction} is complete. omitting job collection")
continue
_logger.debug(f"\t\tcollecting annealing jobs in direction {_direction}...")
_futures = self.parallelism.gather_results(futures = sMC_futures[_direction])
#collect tuple results
_incremental_works = [_iter[0] for _iter in _futures]
_sampler_states = [_iter[1] for _iter in _futures]
_timers = [_iter[2] for _iter in _futures]
#make sure incremental works are the same on distributed annealing as they are locally with trailblaze/not-trailblaze
assert all(abs(i - j) < DISTRIBUTED_ERROR_TOLERANCE for i, j in zip(np.array(_incremental_works).flatten(), sMC_incremental_works[_direction])), f"the incremental works between the local and distributed platforms do not match"
#if this is true, we can update the cumulative work dict
sMC_cumulative_works[_direction].append(np.add(sMC_cumulative_works[_direction][-1], sMC_incremental_works[_direction]))
#append the sampler_states
sMC_sampler_states[_direction] = np.array(_sampler_states)
#append the _timers
sMC_timers[_direction].append(_timers)
print(f"\t{_direction} retrieval time: {time.time() - worker_retrieval[_direction]}")
#report the updated logger dicts and observables
for _direction in directions:
if current_lambdas[_direction] != finish_lines[_direction]:
current_lambdas[_direction] = _lambdas[_direction][-1] #update the lambda with the current lambda
end_timer = time.time() - start_timer
iteration_number += 1
_logger.info(f"iteration took {end_timer} seconds.")
_logger.debug(f"\n")
_logger.debug(f"deactivating annealing workers...")
self._deactivate_annealing_workers()
for _direction in directions:
_lst = sMC_cumulative_works[_direction]
sMC_cumulative_works.update({_direction: np.array(_lst).T}) #the cumulative work dimensions should be num_particles * num_iterations
self.compute_sMC_free_energy(sMC_cumulative_works)
self.sMC_observables = sMC_observables
if _resample:
_logger.debug(f"computing particle ancestries and survival rates...")
self.survival_rate = compute_survival_rate(sMC_particle_ancestries)
self.particle_ancestries = {_direction : np.array([q.flatten() for q in sMC_particle_ancestries[_direction]]) for _direction in sMC_particle_ancestries.keys()}
else:
_logger.debug(f"omitting particles ancestries and survivial rates (no resampling)...")
self.survival_rate = None
self.particle_ancestries = None
def compute_sMC_free_energy(self, cumulative_work_dict):
"""
        Method to compute the free energy of sMC_anneal-type cumulative work dicts, whether the dicts are constructed
        via AIS or generalized sMC. The self.cumulative_work, self.dg_EXP, and self.dg_BAR (if applicable)
        instance attributes are set.
Parameters
----------
cumulative_work_dict : dict
            dictionary of the form {_direction <str>: np.ndarray of shape (num_particles, num_iterations)},
            where _direction is 'forward' or 'reverse' and each row holds a particle's cumulative work along its protocol
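        Examples
        --------
        A sketch of the expected input shape, assuming ``smc`` is a constructed SequentialMonteCarlo
        instance (the zero-valued works are placeholders)::

            cumulative_work_dict = {'forward': np.zeros((num_particles, num_windows)),
                                    'reverse': np.zeros((num_particles, num_windows))}
            smc.compute_sMC_free_energy(cumulative_work_dict)
            smc.dg_EXP['forward'] #per-window EXP estimates
            smc.dg_BAR #BAR estimate from the terminal forward and reverse works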
"""
_logger.debug(f"computing free energies...")
self.cumulative_work = {}
self.dg_EXP = {}
for _direction, _lst in cumulative_work_dict.items():
self.cumulative_work[_direction] = _lst
self.dg_EXP[_direction] = np.array([pymbar.EXP(_lst[:,i]) for i in range(_lst.shape[1])])
_logger.debug(f"cumulative_work for {_direction}: {self.cumulative_work[_direction]}")
if len(list(self.cumulative_work.keys())) == 2:
self.dg_BAR = pymbar.BAR(self.cumulative_work['forward'][:, -1], self.cumulative_work['reverse'][:, -1])
def minimize_sampler_states(self):
"""
simple wrapper function to minimize the input sampler states
"""
# initialize by minimizing
for state in self.lambda_endstates['forward']: # 0.0, 1.0
self.thermodynamic_state.set_alchemical_parameters(state, LambdaProtocol(functions = self.lambda_protocol))
minimize(self.thermodynamic_state, self.sampler_states[int(state)])
def pull_trajectory_snapshot(self, endstate):
"""
        Randomly draw a single equilibrium snapshot from self._eq_files_dict
Parameters
----------
endstate: int
lambda endstate from which to extract an equilibrated snapshot, either 0 or 1
Returns
-------
sampler_state: openmmtools.SamplerState
sampler state with positions and box vectors if applicable
"""
#pull a random index
assert endstate in [0,1], f"the endstate ({endstate}) is not 0 or 1"
index = random.choice(self._eq_dict[f"{endstate}_decorrelated"])
files = [key for key in self._eq_files_dict[endstate].keys() if index in self._eq_files_dict[endstate][key]]
assert len(files) == 1, f"files: {files} doesn't have one entry; index: {index}, eq_files_dict: {self._eq_files_dict[endstate]}"
file = files[0]
file_index = self._eq_files_dict[endstate][file].index(index)
#now we load file as a traj and create a sampler state with it
traj = md.load_frame(file, file_index)
positions = traj.openmm_positions(0)
box_vectors = traj.openmm_boxes(0)
sampler_state = SamplerState(positions, box_vectors = box_vectors)
return sampler_state
def equilibrate(self,
n_equilibration_iterations = 1,
n_steps_per_equilibration = 5000,
endstates = [0,1],
max_size = 1024*1e3,
decorrelate=False,
timer = False,
minimize = False):
"""
Run the equilibrium simulations a specified number of times at the lambda 0, 1 states. This can be used to equilibrate
the simulation before beginning the free energy calculation.
Parameters
----------
n_equilibration_iterations : int; default 1
number of equilibrium simulations to run, each for lambda = 0, 1.
n_steps_per_equilibration : int, default 5000
number of integration steps to take in an equilibration iteration
endstates : list, default [0,1]
at which endstate(s) to conduct n_equilibration_iterations (either [0] ,[1], or [0,1])
max_size : float, default 1.024e6 (bytes)
            number of bytes allotted to the file currently being written before it is closed and a new equilibrium file is initiated.
decorrelate : bool, default False
whether to parse all written files serially and remove correlated snapshots; this returns an ensemble of iid samples in theory.
timer : bool, default False
whether to trigger the timing in the equilibration; this adds an item to the EquilibriumResult, which is a list of times for various
processes in the feptask equilibration scheme.
minimize : bool, default False
Whether to minimize the sampler state before conducting equilibration. This is passed directly to feptasks.run_equilibration
Returns
-------
        None
            results are stored in place; self._eq_dict, self._eq_files_dict, self.sampler_states, and self._eq_timers are updated
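        Examples
        --------
        A minimal sketch, assuming ``smc`` is a constructed SequentialMonteCarlo instance: run short
        equilibration at both endstates and decorrelate the stored snapshots so that
        ``pull_trajectory_snapshot`` can draw from them (iteration counts are illustrative)::

            smc.minimize_sampler_states()
            smc.equilibrate(n_equilibration_iterations = 100,
                            n_steps_per_equilibration = 250,
                            endstates = [0, 1],
                            decorrelate = True)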
"""
_logger.debug(f"conducting equilibration")
for endstate in endstates:
assert endstate in [0, 1], f"the endstates contains {endstate}, which is not in [0, 1]"
# run a round of equilibrium
_logger.debug(f"iterating through endstates to submit equilibrium jobs")
EquilibriumFEPTask_list = []
for state in endstates: #iterate through the specified endstates (0 or 1) to create appropriate EquilibriumFEPTask inputs
_logger.debug(f"\tcreating lambda state {state} EquilibriumFEPTask")
self.thermodynamic_state.set_alchemical_parameters(float(state), lambda_protocol = LambdaProtocol(functions = self.lambda_protocol))
input_dict = {'thermodynamic_state': copy.deepcopy(self.thermodynamic_state),
'nsteps_equil': n_steps_per_equilibration,
'topology': self.factory.hybrid_topology,
'n_iterations': n_equilibration_iterations,
'splitting': self.eq_splitting_string,
'atom_indices_to_save': None,
'trajectory_filename': None,
'max_size': max_size,
'timer': timer,
'_minimize': minimize,
'file_iterator': 0,
'timestep': self.timestep}
if self.write_traj:
_logger.debug(f"\twriting traj to {self.eq_trajectory_filename[state]}")
equilibrium_trajectory_filename = self.eq_trajectory_filename[state]
input_dict['trajectory_filename'] = equilibrium_trajectory_filename
else:
_logger.debug(f"\tnot writing traj")
if self._eq_dict[state] == []:
_logger.debug(f"\tself._eq_dict[{state}] is empty; initializing file_iterator at 0 ")
else:
last_file_num = int(self._eq_dict[state][-1][0][-7:-3])
_logger.debug(f"\tlast file number: {last_file_num}; initiating file iterator as {last_file_num + 1}")
file_iterator = last_file_num + 1
input_dict['file_iterator'] = file_iterator
task = EquilibriumFEPTask(sampler_state = self.sampler_states[state], inputs = input_dict, outputs = None)
EquilibriumFEPTask_list.append(task)
_logger.debug(f"scattering and mapping run_equilibrium task")
#we need not concern ourselves with _adaptive here since we are only running vanilla MD on 1 or 2 endstates
if self.external_parallelism:
#the client is already active
#we only run a max of 2 parallel runs at once, so we can pull 2 workers
num_available_workers = min(len(endstates), len(self.parallelism_parameters['available_workers']))
workers = np.random.choice(self.parallelism_parameters['available_workers'], size = num_available_workers, replace = False)
scatter_futures = self.parallelism.scatter(EquilibriumFEPTask_list, workers = workers)
futures = self.parallelism.deploy(run_equilibrium, (scatter_futures,), workers = workers)
elif self.internal_parallelism:
#we have to activate the client
if self.parallelism_parameters['library'] is None: #then we are running locally
_parallel_processes = 0
else:
_parallel_processes = min(len(endstates), self.parallelism_parameters['num_processes'])
self.parallelism.activate_client(library = self.parallelism_parameters['library'], num_processes = _parallel_processes)
scatter_futures = self.parallelism.scatter(EquilibriumFEPTask_list)
futures = self.parallelism.deploy(run_equilibrium, (scatter_futures,))
else:
raise Exception(f"either internal or external parallelism must be True.")
self.parallelism.progress(futures)
eq_results = self.parallelism.gather_results(futures)
if self.internal_parallelism:
#deactivte the client
self.parallelism.deactivate_client()
else:
#we do not deactivate the external parallelism because the current class has no authority over it. It simply borrows the allotted workers for a short time
pass
#the rest of the function is independent of the dask workers...
for state, eq_result in zip(endstates, eq_results):
_logger.debug(f"\tcomputing equilibrium task future for state = {state}")
self._eq_dict[state].extend(eq_result.outputs['files'])
self._eq_dict[f"{state}_reduced_potentials"].extend(eq_result.outputs['reduced_potentials'])
self.sampler_states.update({state: eq_result.sampler_state})
self._eq_timers[state].append(eq_result.outputs['timers'])
_logger.debug(f"collections complete.")
if decorrelate: # if we want to decorrelate all sample
_logger.debug(f"decorrelating data")
for state in endstates:
_logger.debug(f"\tdecorrelating lambda = {state} data.")
traj_filename = self.eq_trajectory_filename[state]
if os.path.exists(traj_filename[:-2] + f'0000' + '.h5'):
_logger.debug(f"\tfound traj filename: {traj_filename[:-2] + f'0000' + '.h5'}; proceeding...")
[t0, g, Neff_max, A_t, uncorrelated_indices] = compute_timeseries(np.array(self._eq_dict[f"{state}_reduced_potentials"]))
_logger.debug(f"\tt0: {t0}; Neff_max: {Neff_max}; uncorrelated_indices: {uncorrelated_indices}")
self._eq_dict[f"{state}_decorrelated"] = uncorrelated_indices
#now we just have to turn the file tuples into an array
_logger.debug(f"\treorganizing decorrelated data; files w/ num_snapshots are: {self._eq_dict[state]}")
iterator, corrected_dict = 0, {}
for tupl in self._eq_dict[state]:
new_list = [i + iterator for i in range(tupl[1])]
iterator += len(new_list)
decorrelated_list = [i for i in new_list if i in uncorrelated_indices]
corrected_dict[tupl[0]] = decorrelated_list
self._eq_files_dict[state] = corrected_dict
_logger.debug(f"\t corrected_dict for state {state}: {corrected_dict}")
def _resample(self,
incremental_works,
cumulative_works,
observable = 'ESS',
resampling_method = 'multinomial',
resample_observable_threshold = 0.5):
"""
Attempt to resample particles given an observable diagnostic and a resampling method.
Parameters
----------
incremental_works : np.array() of floats
the incremental work accumulated from importance sampling at time t
cumulative_works : np.array() of floats
the cumulative work accumulated from importance sampling from time t = 1 : t-1
observable : str, default 'ESS'
the observable used as a resampling diagnostic; this calls a key in supported_observables
resampling_method: str, default 'multinomial'
method used to resample, this calls a key in supported_resampling_methods
resample_observable_threshold : float, default 0.5
the threshold to diagnose a resampling event.
If None, will automatically return without observables
Returns
-------
normalized_observable_value: float
the value of the observable
resampled_works : np.array() floats
the resampled total works at iteration t
resampled_indices : np.array() int
resampled particle indices
resample_bool : boolean
whether resampling is actually conducted
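        Examples
        --------
        A sketch of the decision logic with toy work values, assuming ``smc`` is a constructed
        SequentialMonteCarlo instance: if the normalized observable falls at or below the threshold,
        particles are resampled and the observable is reset to 1.0; otherwise the total works and
        identity indices are passed through unchanged::

            obs, works, indices, did_resample = smc._resample(incremental_works = np.array([0.1, 5.0, 0.2]),
                                                              cumulative_works = np.zeros(3),
                                                              observable = 'ESS',
                                                              resampling_method = 'multinomial',
                                                              resample_observable_threshold = 0.5)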
"""
num_particles = incremental_works.shape[0]
normalized_observable_value = self.supported_observables[observable](cumulative_works, incremental_works)
_logger.debug(f"\t\tstart resampled normalized observable value: {normalized_observable_value}")
total_works = np.add(cumulative_works, incremental_works)
#decide whether to resample
_logger.debug(f"\t\tnormalized observable value: {normalized_observable_value}")
if normalized_observable_value <= resample_observable_threshold: #then we resample
resample_bool = True
_logger.debug(f"\t\tnormalized observable value ({normalized_observable_value}) <= {resample_observable_threshold}. Resampling")
#resample
resampled_works, resampled_indices = self.supported_resampling_methods[resampling_method](total_works = total_works,
num_resamples = num_particles)
normalized_observable_value = 1.0
else:
resample_bool = False
_logger.debug(f"\t\tnormalized observable value ({normalized_observable_value}) > {resample_observable_threshold}. Skipping resampling.")
resampled_works = total_works
resampled_indices = np.arange(num_particles)
_logger.debug(f"\t\tfinal resampled normalized observable_value: {normalized_observable_value}")
return normalized_observable_value, resampled_works, resampled_indices, resample_bool
def compute_lambda_increment(self, new_val, sampler_states, observable, current_rps, cumulative_works):
"""
        internal method to compute observables and incremental works locally;
        'observable' is expected to be a callable drawn from self.supported_observables (not a string key)
"""
self.thermodynamic_state.set_alchemical_parameters(new_val, LambdaProtocol(functions = self.lambda_protocol))
new_rps = np.array([compute_reduced_potential(self.thermodynamic_state, sampler_state) for sampler_state in sampler_states])
_observable = observable(cumulative_works, new_rps - current_rps)
incremental_works = new_rps - current_rps
return _observable, incremental_works
def binary_search(self,
sampler_states,
cumulative_works,
start_val,
end_val,