GeoMop · martinspetlik · Aug 8, 2022 · Aug 23, 2022 · May 9, 2023 · Aug 3, 2023
diff --git a/examples/shooting/shooting_1D_mcqmc.py b/examples/shooting/shooting_1D_mcqmc.py
@@ -0,0 +1,252 @@
+import numpy as np
+import mlmc.estimator as est
+from mlmc.estimator import Estimate, estimate_n_samples_for_target_variance
+from mlmc.sampler import Sampler
+from mlmc.sample_storage import Memory
+from mlmc.sampling_pool import OneProcessPool
+from examples.shooting.simulation_shooting_1D import ShootingSimulation1D
+from mlmc.quantity.quantity import make_root_quantity
+from mlmc.quantity.quantity_estimate import moments, estimate_mean
+from mlmc.moments import Legendre
+from mlmc.plot.plots import Distribution
+
+
+# Tutorial class for 1D shooting simulation, includes
+# - samples scheduling
+# - process results:
+#           - create Quantity instance
+#           - approximate density
+class ProcessShooting1D:
+
+    def __init__(self):
+        n_levels = 3
+        # Number of MLMC levels
+        step_range = [1, 1e-3]
+        # step_range [simulation step at the coarsest level, simulation step at the finest level]
+        level_parameters = ProcessShooting1D.determine_level_parameters(n_levels, step_range)
+        # Determine each level parameters (in this case, simulation step at each level), level_parameters should be
+        # simulation dependent
+        self._sample_sleep = 0#30
+        # Time to do nothing just to make sure the simulations aren't constantly checked, useful mainly for PBS run
+        self._sample_timeout = 60
+        # Maximum waiting time for running simulations
+        self._adding_samples_coef = 0.1
+        self._n_moments = 20
+        # number of generalized statistical moments used for MLMC number of samples estimation
+        self._quantile = 0.01
+        # Setting parameters that are utilized when scheduling samples
+        ###
+        # MLMC run
+        ###
+        sampler = self.create_sampler(level_parameters=level_parameters)
+        # Create sampler (mlmc.Sampler instance) - crucial class that controls MLMC run
+        self.generate_samples(sampler, n_samples=None, target_var=1e-3)
+        # Generate MLMC samples, there are two ways:
+        # 1) set exact number of samples at each level,
+        #    e.g. for 5 levels - self.generate_samples(sampler, n_samples=[1000, 500, 250, 100, 50])
+        # 2) set target variance of MLMC estimates,
+        #    e.g. self.generate_samples(sampler, n_samples=None, target_var=1e-6)
+        self.all_collect(sampler)
+        # Check if all samples are finished
+        ###
+        # Postprocessing
+        ###
+        self.process_results(sampler, n_levels)
+        # Postprocessing, MLMC is finished at this point
+
+    def create_sampler(self, level_parameters):
+        """
+        Create:
+        # sampling pool - the way sample simulations are executed
+        # sample storage - stores sample results
+        # sampler - controls MLMC execution
+        :param level_parameters: list of lists
+        :return: mlmc.sampler.Sampler instance
+        """
+        # Create OneProcessPool - all run in the same process
+        sampling_pool = OneProcessPool()
+        # There is another option mlmc.sampling_pool.ProcessPool() - supports local parallel sample simulation run
+        # sampling_pool = ProcessPool(n), n - number of parallel simulations, depends on computer architecture
+
+        # Simulation configuration which is passed to simulation constructor
+        simulation_config = {
+            "start_position": np.array([0, 0]),
+            "start_velocity": np.array([10, 0]),
+            "area_borders":  np.array([-100, 200, -300, 400]),
+            "max_time": 10,
+            "complexity": 2,  # used for initial estimate of number of operations per sample
+            'fields_params': dict(model='gauss', dim=1, sigma=1, corr_length=0.1),
+        }
+
+        # Create simulation factory, instance of class that inherits from mlmc.sim.simulation
+        simulation_factory = ShootingSimulation1D(config=simulation_config)
+
+        # Create simple sample storage
+        # Memory() storage keeps samples in computer main memory
+        sample_storage = Memory()
+        # We support also HDF file storage mlmc.sample_storage_hdf.SampleStorageHDF()
+        # sample_storage = SampleStorageHDF(file_path=path_to_HDF5_file)
+
+        # Create sampler
+        # Controls the execution of MLMC
+        sampler = Sampler(sample_storage=sample_storage, sampling_pool=sampling_pool, sim_factory=simulation_factory,
+                          level_parameters=level_parameters)
+        return sampler
+
+    def generate_samples(self, sampler, n_samples=None, target_var=None):
+        """
+        Generate MLMC samples
+        :param sampler: mlmc.sampler.Sampler instance
+        :param n_samples: None or list, number of samples at each level
+        :param target_var: target variance of MLMC estimates
+        :return: None
+        """
+        # The number of samples is set by user
+        if n_samples is not None:
+            sampler.set_initial_n_samples(n_samples)
+        # The number of initial samples is determined automatically
+        else:
+            sampler.set_initial_n_samples()
+        # Samples are scheduled and the program is waiting for all of them to be completed.
+        sampler.schedule_samples()
+        sampler.ask_sampling_pool_for_samples(sleep=self._sample_sleep, timeout=self._sample_timeout)
+        self.all_collect(sampler)
+
+        # MLMC estimates target variance is set
+        if target_var is not None:
+            # The mlmc.quantity.quantity.Quantity instance is created
+            # parameters 'storage' and 'q_specs' are obtained from sample_storage,
+            # originally 'q_specs' is set in the simulation class
+            root_quantity = make_root_quantity(storage=sampler.sample_storage,
+                                               q_specs=sampler.sample_storage.load_result_format())
+
+            # Moment functions object is created
+            # The MLMC algorithm determines number of samples according to the moments variance,
+            # Type of moment functions (Legendre by default) might affect the total number of MLMC samples
+            moments_fn = self.set_moments(root_quantity, sampler.sample_storage, n_moments=self._n_moments)
+            estimate_obj = Estimate(root_quantity, sample_storage=sampler.sample_storage,
+                                                   moments_fn=moments_fn)
+
+            # Initial estimation of the number of samples at each level
+            variances, n_ops = estimate_obj.estimate_diff_vars_regression(sampler.n_finished_samples)
+            # Firstly, the variance of moments and execution time of samples at each level are calculated from already finished samples
+            n_estimated = estimate_n_samples_for_target_variance(target_var, variances, n_ops,
+                                                                           n_levels=sampler.n_levels)
+
+            #####
+            # MLMC sampling algorithm - gradually schedules samples and refines the total number of samples
+            #####
+            # Loop until number of estimated samples is greater than the number of scheduled samples
+            while not sampler.process_adding_samples(n_estimated, self._sample_sleep, self._adding_samples_coef,
+                                                     timeout=self._sample_timeout):
+                # New estimation according to already finished samples
+                variances, n_ops = estimate_obj.estimate_diff_vars_regression(sampler._n_scheduled_samples)
+                n_estimated = estimate_n_samples_for_target_variance(target_var, variances, n_ops,
+                                                                     n_levels=sampler.n_levels)
+
+    def set_moments(self, quantity, sample_storage, n_moments=25):
+        true_domain = Estimate.estimate_domain(quantity, sample_storage, quantile=self._quantile)
+        return Legendre(n_moments, true_domain)
+
+    def all_collect(self, sampler):
+        """
+        Collect samples, wait until all samples are finished
+        :param sampler: mlmc.sampler.Sampler object
+        :return: None
+        """
+        running = 1
+        while running > 0:
+            running = 0
+            running += sampler.ask_sampling_pool_for_samples()
+            print("N running: ", running)
+
+    def process_results(self, sampler, n_levels):
+        """
+        Process MLMC results
+        :param sampler: mlmc.sampler.Sampler instance
+        :param n_levels: int, number of MLMC levels
+        :return: None
+        """
+        sample_storage = sampler.sample_storage
+        # Load result format from the sample storage
+        result_format = sample_storage.load_result_format()
+        # Create Quantity instance representing our real quantity of interest
+        root_quantity = make_root_quantity(sample_storage, result_format)
+
+        print("N collected ", sample_storage.get_n_collected())
+
+        # It is possible to access items of the quantity according to the result format
+        target = root_quantity['target']
+        time = target[10]
+        position = time['0']
+        q_value = position[0]
+
+        # Compute moments, first estimate domain of moment functions
+        estimated_domain = Estimate.estimate_domain(q_value, sample_storage, quantile=self._quantile)
+        moments_fn = Legendre(self._n_moments, estimated_domain)
+
+        # Create estimator for the quantity
+        estimator = Estimate(quantity=q_value, sample_storage=sample_storage, moments_fn=moments_fn)
+        # Estimate moment means and variances
+        means, vars = estimator.estimate_moments(moments_fn)
+
+        est.plot_checks(quantity=q_value, sample_storage=sample_storage, moments_fn=moments_fn)
+        est.consistency_check(quantity=q_value, sample_storage=sample_storage)
+        estimator.kurtosis_check(q_value)
+
+        # Generally, root quantity has different domain than its items
+        root_quantity_estimated_domain = Estimate.estimate_domain(root_quantity, sample_storage,
+                                                                                 quantile=self._quantile)
+        root_quantity_moments_fn = Legendre(self._n_moments, root_quantity_estimated_domain)
+
+        # There is another possible approach to calculating all moments at once and then select desired quantity
+        moments_quantity = moments(root_quantity, moments_fn=root_quantity_moments_fn, mom_at_bottom=True)
+        moments_mean = estimate_mean(moments_quantity)
+        target_mean = moments_mean['target']
+        time_mean = target_mean[10]  # times: [1]
+        location_mean = time_mean['0']  # locations: ['0']
+        value_mean = location_mean[0]  # result shape: (1,)
+
+        assert value_mean.mean[0] == 1
+        self.approx_distribution(estimator, n_levels, tol=1e-8)
+
+    def approx_distribution(self, estimator, n_levels, tol=1.95):
+        """
+        Probability density function approximation
+        :param estimator: mlmc.estimator.Estimate instance, it contains quantity for which the density is approximated
+        :param n_levels: int, number of MLMC levels
+        :param tol: Tolerance of the fitting problem, with account for variances in moments.
+        :return: None
+        """
+        distr_obj, result, _, _ = estimator.construct_density(tol=tol)
+        distr_plot = Distribution(title="distributions", error_plot=None)
+        distr_plot.add_distribution(distr_obj)
+
+        if n_levels == 1:
+            samples = estimator.get_level_samples(level_id=0)[..., 0]
+            distr_plot.add_raw_samples(np.squeeze(samples))
+        distr_plot.show(None)
+        distr_plot.reset()
+
+    @staticmethod
+    def determine_level_parameters(n_levels, step_range):
+        """
+        Determine level parameters,
+        In this case, a step of fine simulation at each level
+        :param n_levels: number of MLMC levels
+        :param step_range: simulation step range
+        :return: list of lists
+        """
+        assert step_range[0] > step_range[1]
+        level_parameters = []
+        for i_level in range(n_levels):
+            if n_levels == 1:
+                level_param = 1
+            else:
+                level_param = i_level / (n_levels - 1)
+            level_parameters.append([step_range[0] ** (1 - level_param) * step_range[1] ** level_param])
+        return level_parameters
+
+
+if __name__ == "__main__":
+    ProcessShooting1D()