Richardson Lucy Parallelization V2 #274

Open: avalluvan wants to merge 50 commits into base: develop

Changes shown are from 44 of the 50 commits.

Commits (50, all by avalluvan)
79109f3 (Aug 5, 2024) - Added new option "RLparallel" to ImageDeconvolution.deconvolution_alg…
c918ab5 (Aug 5, 2024) - Renamed RLparallel.py to RichardsonLucyParallel.py and adapted code s…
015f648 (Aug 5, 2024) - Installed mpi4py to cosipy venv and added it to skeleton
f259d36 (Aug 12, 2024) - Created subprocess call. Ported MPI to separate script RLparallelscri…
4cde4dd (Aug 13, 2024) - Added code to register results if save_results_flag is set to True
e98fb79 (Aug 14, 2024) - End-to-end working script version commit
cd45e44 (Aug 14, 2024) - Unclear what files are causing conflicts
ef279f4 (Aug 27, 2024) - Add modified files and new RL parallel script
871c9a8 (Aug 27, 2024) - Another tiny change
27c8afe (Aug 29, 2024) - Modified configuration file for RLparallel
f079988 (Oct 18, 2024) - Merge branch 'cositools:develop' into develop
f044589 (Oct 18, 2024) - git fetch changes unclear. Performing a commit to avoid data loss.
3036a7a (Oct 18, 2024) - This merge may result in data losses. Copies of files have been creat…
35b8293 (Oct 24, 2024) - Create LMDR.ipynb and add response creation attempt with h5py.
d04f3c3 (Oct 25, 2024) - Created general code for multidimensional interpolation
ac47f23 (Oct 30, 2024) - Attempted listmode response on the fly generation
c257676 (Nov 3, 2024) - Add ListModeResponse.py
7de27fd (Nov 6, 2024) - Used histpy functions to dramatically simplify the codebase
4c23188 (Nov 7, 2024) - Modified code to accept len(dr.axes) or len(dr.axes)-1 number of inputs.
71085fd (Nov 9, 2024) - Added comments to get_point_source_response()
dc35034 (Nov 11, 2024) - Tested new interpolation scheme on LMDR.ipynb
f8bbaa4 (Nov 11, 2024) - Adhoc fix for interpolated psr calculation with deepcopy
cdcb9b0 (Nov 11, 2024) - Simplified __getitem__ and get_point_source_response()
aaff648 (Nov 11, 2024) - Ported ListModeResponse interpolation functionalities to DetectorResp…
caa2d44 (Nov 11, 2024) - Removed ListModeResponse.py. All developed features incorporated in D…
2c80caa (Nov 11, 2024) - Merge pull request #1 from avalluvan/feature/general_response
dafd4f8 (Nov 21, 2024) - Added code to compress empty axes, i.e., those with axis shape = (1,)
de31c0a (Dec 10, 2024) - Create new file RichardsonLucyWithParallelSupport.py. Stash changes t…
ebdf1ca (Dec 10, 2024) - Skeleton for RLWithParellelSupport.py. Need to update MPI.DOUBLE with…
9aeba42 (Dec 10, 2024) - Looks like RLWithParallelSupport.py is complete. Need to create data …
b1d61a4 (Dec 11, 2024) - Everything up to run_deconvolution works with new data interface WPS
61afc80 (Dec 11, 2024) - Dry run with single MPI process works with RichardsonLucy and dataIFW…
75b0b81 (Dec 11, 2024) - RichardsonLucyWPS.py works with both dataIF_DC2 and dataIFWPS for sin…
5d5eb3e (Dec 12, 2024) - Working set up for small numproc MPI runs
59f9ce8 (Dec 12, 2024) - Syntactically correct. Algorithm has some discrepancies
406cf9a (Dec 12, 2024) - Archive old version of RLparallelscript.py and RichardsonLucyParallel.py
2eb7e25 (Dec 13, 2024) - Single and multi process produce same, exact outputs!
1cd0d2c (Dec 13, 2024) - Replaced old RichardsonLucy.py with new RichardsonLucy.py that now su…
1f4eeed (Dec 13, 2024) - Minor bug in image_deconvolution now that RichardsonLucyParallel.py h…
14c34fd (Dec 13, 2024) - Removed unnecessary imports in new RichardsonLucy.py
860b5ce (Dec 13, 2024) - Added comments. Removed stubs of RLparallel. Ready to rebase and crea…
63527db (Dec 15, 2024) - Migrated RichardsonLucy slicing and message passing to DataIFWithPara…
82fc4f8 (Dec 15, 2024) - Merge branch 'develop' into feature/RLparallel
c085c17 (Dec 15, 2024) - Bug fix in reshaping and concatenating epsilon and C slices
279f6f2 (Dec 16, 2024) - Replacing superfluous edits with files from cositools/develop
04eb674 (Dec 16, 2024) - Undo changes to dataIF_COSI_DC2.py and allskyimage.py
b99ff6a (Dec 16, 2024) - Undoing changes to RichardsonLucy.py Estep structure
cddaa24 (Dec 16, 2024) - Incorporated review suggestions about placement of parallel_computati…
7a2f65c (Dec 16, 2024) - Rename dataIFWithParallel.py to dataIF_Parallel.py. Undo changes to i…
17aae47 (Dec 16, 2024) - Calculate parallel and master_node flags in RLparallelscript.py
61 changes: 61 additions & 0 deletions cosipy/image_deconvolution/RLparallelscript.py
@@ -0,0 +1,61 @@
from pathlib import Path

import logging
logger = logging.getLogger(__name__)

from mpi4py import MPI
from histpy import Histogram

from cosipy.response import FullDetectorResponse
from cosipy.image_deconvolution import ImageDeconvolution, DataIFWithParallel, DataIF_COSI_DC2

# Define MPI variables
MASTER = 0 # Indicates master process
DRM_DIR = Path('/Users/penguin/Documents/Grad School/Research/COSI/COSIpy/docs/tutorials/data')
DATA_DIR = Path('/Users/penguin/Documents/Grad School/Research/COSI/COSIpy/docs/tutorials/image_deconvolution/511keV/GalacticCDS')

def main():
'''
Main script to create a parallel execution-compatible
dataset using DataIFWithParallel and call ImageDeconvolution
'''

# Set up MPI
comm = MPI.COMM_WORLD

# Create dataset
dataset = DataIFWithParallel(name = '511keV',
event_filename = '511keV_dc2_galactic_event.hdf5',
bkg_filename = '511keV_dc2_galactic_bkg.hdf5',
drm_filename = 'psr_gal_511_DC2.h5',
comm = comm) # Convert dataset to a list of datasets before passing to RichardsonLucy class

# bkg = Histogram.open(DATA_DIR / '511keV_dc2_galactic_bkg.hdf5')
# event = Histogram.open(DATA_DIR / '511keV_dc2_galactic_event.hdf5')
# image_response = Histogram.open(DRM_DIR / 'psr_gal_511_DC2.h5')
# dataset = DataIF_COSI_DC2.load(name = "511keV", # Create a dataset compatible with ImageDeconvolution: name (unique identifier), event data, background model, response, coordinate system conversion matrix (if detector response is not in galactic coordinates)
# event_binned_data = event.project(['Em', 'Phi', 'PsiChi']),
# dict_bkg_binned_data = {"total": bkg.project(['Em', 'Phi', 'PsiChi'])},
# rsp = image_response)

# Create image deconvolution object
image_deconvolution = ImageDeconvolution()

# set data_interface to image_deconvolution
image_deconvolution.set_dataset([dataset])

# set a parameter file for the image deconvolution
parameter_filepath = DATA_DIR / 'imagedeconvolution_parfile_gal_511keV.yml'
image_deconvolution.read_parameterfile(parameter_filepath)

# Initialize model
image_deconvolution.initialize(comm=comm)

# Execute deconvolution
image_deconvolution.run_deconvolution()

# MPI Shutdown
MPI.Finalize()

if __name__ == "__main__":
main()
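Note that if this script is started directly with plain `python`, `comm.Get_size()` is 1 and the run degenerates to serial mode; actual parallelism requires an MPI launcher. A hypothetical invocation (the rank count is illustrative, not a configuration tested in this PR):

# mpiexec -n 4 python RLparallelscript.py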
142 changes: 85 additions & 57 deletions cosipy/image_deconvolution/RichardsonLucy.py
@@ -1,11 +1,15 @@
import os
import copy
import numpy as np
import astropy.units as u
import astropy.io.fits as fits
import logging

# logging setup
logger = logging.getLogger(__name__)

# Import third party libraries
import numpy as np
import pandas as pd
import astropy.units as u
from astropy.io import fits
from histpy import Histogram

from .deconvolution_algorithm_base import DeconvolutionAlgorithmBase
@@ -36,7 +40,7 @@ class RichardsonLucy(DeconvolutionAlgorithmBase):

"""

def __init__(self, initial_model, dataset, mask, parameter):
def __init__(self, initial_model:Histogram, dataset:list, mask, parameter, comm=None):

DeconvolutionAlgorithmBase.__init__(self, initial_model, dataset, mask, parameter)

@@ -66,16 +70,26 @@ def __init__(self, initial_model, dataset, mask, parameter):
else:
os.makedirs(self.save_results_directory)

Contributor:
I understand that RL needs to know if it is performed on the master node and needs this kind of parameter. I would suggest preparing two parameters alternatively, something like

  • self.parallel_computation = True / False
  • self.master_node = True / False

I want to prepare a parameter that explicitly tells if the computation is in parallel or not. I will add some suggestions regarding these changes at other lines.

Author:
One of the ideas we discussed in a previous meeting was to let the program directly infer whether it was being run in serial or parallel mode. In fact, the suggested flag variables were what I used in the initial V2 pull request code. Do you recommend making this modification, i.e., inferring self.parallel_computation in image_deconvolution.py or in RichardsonLucy.py? The issue with inferring this in the image deconvolution class is: what happens when we have multiple input datasets? --> [dataset1, dataset2, ...], each dataset will have its own "sub_comm" object.
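A minimal sketch of the reviewer's two-flag proposal (the attribute names follow the suggestion above and are not part of the merged code; `comm` is an optional mpi4py communicator, as in this PR's __init__):

# Hedged sketch: derive both flags from the communicator alone.
if comm is None:
    self.parallel_computation = False   # serial run
    self.master_node = True             # the lone process acts as master
else:
    self.parallel_computation = comm.Get_size() > 1
    self.master_node = comm.Get_rank() == 0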

if comm is None:
self.MASTER = True
elif comm.Get_rank() == 0:
self.MASTER = True
else:
self.MASTER = False

def initialization(self):
"""
initialization before running the image deconvolution
initialization before performing image deconvolution
"""

# Master
if self.MASTER:
# Clear results
self.results.clear()

# clear counter
self.iteration_count = 0

# clear results
self.results.clear()

# copy model
self.model = copy.deepcopy(self.initial_model)

@@ -93,10 +107,6 @@ def initialization(self):
self.response_weighting_filter = (self.summed_exposure_map.contents / np.max(self.summed_exposure_map.contents))**self.response_weighting_index
logger.info("The response weighting filter was calculated.")

# expected count histograms
self.expectation_list = self.calc_expectation_list(model = self.initial_model, dict_bkg_norm = self.dict_bkg_norm)
logger.info("The expected count histograms were calculated with the initial model map.")

Contributor:
Is it possible to keep these lines? To use the updated model for the likelihood calculation, I wanted to perform the expected count calculation at the post-processing and initialization steps and skip it in the Estep.

Author:
I can undo these changes. Do you plan on moving this to Estep() in the future / removing Estep() altogether?

# calculate summed background models for M-step
if self.do_bkg_norm_optimization:
self.dict_summed_bkg_model = {}
@@ -112,9 +122,14 @@ def pre_processing(self):
def Estep(self):
"""
E-step (but it will be skipped).
Note that self.expectation_list is updated in self.post_processing().
"""
pass

# expected count histograms
self.expectation_list = self.calc_expectation_list(model = self.model, dict_bkg_norm = self.dict_bkg_norm)
logger.info("The expected count histograms were calculated with the initial model map.")

# At the end of this function, all processes should have a complete `self.expectation_list`
# to proceed to the Mstep function
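One way to satisfy that invariant is an allgather over the per-rank slices; a minimal standalone sketch (the slice size and the equal partitioning are assumptions, and per the commit history the PR's real exchange lives in DataIFWithParallel):

import numpy as np
from mpi4py import MPI

comm = MPI.COMM_WORLD
slice_size = 1024                               # illustrative, not from the PR
local = np.zeros(slice_size)                    # this rank's expectation slice
full = np.empty(slice_size * comm.Get_size())   # receives every rank's slice
comm.Allgather(local, full)                     # every rank now holds the full array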

def Mstep(self):
"""
@@ -129,7 +144,7 @@ def Mstep(self):

if self.mask is not None:
self.delta_model = self.delta_model.mask_pixels(self.mask)

# background normalization optimization
if self.do_bkg_norm_optimization:
for key in self.dict_bkg_norm.keys():
@@ -146,6 +161,11 @@

self.dict_bkg_norm[key] = bkg_norm

# At the end of this function, all the nodes will have a full
# copy of delta_model. Although this is not necessary, this is
# the easiest way without editing RichardsonLucy.py.
# The same applies for self.dict_bkg_norm

def post_processing(self):
"""
Here three processes will be performed.
@@ -154,6 +174,7 @@
- acceleration of RL algorithm: the normalization of the delta map is increased as long as the updated image has no negative components.
"""

# All
self.processed_delta_model = copy.deepcopy(self.delta_model)

if self.do_response_weighting:
@@ -172,15 +193,15 @@

if self.mask is not None:
self.model = self.model.mask_pixels(self.mask)

# update expectation_list
self.expectation_list = self.calc_expectation_list(self.model, dict_bkg_norm = self.dict_bkg_norm)
logger.debug("The expected count histograms were updated with the new model map.")

# update loglikelihood_list
self.loglikelihood_list = self.calc_loglikelihood_list(self.expectation_list)
logger.debug("The loglikelihood list was updated with the new expected count histograms.")

# At the end of this function, all MPI processes needs to have a full
# copy of updated model. They calculate it from delta_model (which is
# distributed by MPI.Bcast) independently
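The broadcast mentioned in this comment maps directly onto mpi4py's buffer interface; a minimal sketch, with the shape and contents standing in for the real delta model:

import numpy as np
from mpi4py import MPI

comm = MPI.COMM_WORLD
shape = (3072,)                        # illustrative model size
if comm.Get_rank() == 0:
    delta = np.random.rand(*shape)     # stands in for the master's finished update
else:
    delta = np.empty(shape)            # other ranks allocate a receive buffer
comm.Bcast(delta, root=0)              # every rank now holds the same delta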

def register_result(self):
"""
The values below are stored at the end of each iteration.
@@ -193,21 +214,23 @@
- loglikelihood: log-likelihood
"""

this_result = {"iteration": self.iteration_count,
"model": copy.deepcopy(self.model),
"delta_model": copy.deepcopy(self.delta_model),
"processed_delta_model": copy.deepcopy(self.processed_delta_model),
"background_normalization": copy.deepcopy(self.dict_bkg_norm),
"alpha": self.alpha,
"loglikelihood": copy.deepcopy(self.loglikelihood_list)}

# show intermediate results
logger.info(f' alpha: {this_result["alpha"]}')
logger.info(f' background_normalization: {this_result["background_normalization"]}')
logger.info(f' loglikelihood: {this_result["loglikelihood"]}')
# Master
if self.MASTER:
this_result = {"iteration": self.iteration_count,
"model": copy.deepcopy(self.model),
"delta_model": copy.deepcopy(self.delta_model),
"processed_delta_model": copy.deepcopy(self.processed_delta_model),
"background_normalization": copy.deepcopy(self.dict_bkg_norm),
"alpha": self.alpha,
"loglikelihood": copy.deepcopy(self.loglikelihood_list)}

# show intermediate results
logger.info(f' alpha: {this_result["alpha"]}')
logger.info(f' background_normalization: {this_result["background_normalization"]}')
logger.info(f' loglikelihood: {this_result["loglikelihood"]}')

# register this_result in self.results
self.results.append(this_result)
# register this_result in self.results
self.results.append(this_result)

def check_stopping_criteria(self):
"""
@@ -217,6 +240,7 @@
-------
bool
"""

if self.iteration_count < self.iteration_max:
return False
return True
@@ -225,38 +249,41 @@
"""
finalization after running the image deconvolution
"""
if self.save_results == True:
logger.info(f'Saving results in {self.save_results_directory}')

# model
for this_result in self.results:
iteration_count = this_result["iteration"]
# Master
if self.MASTER:
if self.save_results == True:
logger.info(f'Saving results in {self.save_results_directory}')

# model
for this_result in self.results:
iteration_count = this_result["iteration"]

this_result["model"].write(f"{self.save_results_directory}/model_itr{iteration_count}.hdf5", overwrite = True)
this_result["delta_model"].write(f"{self.save_results_directory}/delta_model_itr{iteration_count}.hdf5", overwrite = True)
this_result["processed_delta_model"].write(f"{self.save_results_directory}/processed_delta_model_itr{iteration_count}.hdf5", overwrite = True)
this_result["model"].write(f"{self.save_results_directory}/model_itr{iteration_count}_2.hdf5", overwrite = True)
this_result["delta_model"].write(f"{self.save_results_directory}/delta_model_itr{iteration_count}_2.hdf5", overwrite = True)
this_result["processed_delta_model"].write(f"{self.save_results_directory}/processed_delta_model_itr{iteration_count}_2.hdf5", overwrite = True)

#fits
primary_hdu = fits.PrimaryHDU()
#fits
primary_hdu = fits.PrimaryHDU()

col_iteration = fits.Column(name='iteration', array=[float(result['iteration']) for result in self.results], format='K')
col_alpha = fits.Column(name='alpha', array=[float(result['alpha']) for result in self.results], format='D')
cols_bkg_norm = [fits.Column(name=key, array=[float(result['background_normalization'][key]) for result in self.results], format='D')
for key in self.dict_bkg_norm.keys()]
cols_loglikelihood = [fits.Column(name=f"{self.dataset[i].name}", array=[float(result['loglikelihood'][i]) for result in self.results], format='D')
for i in range(len(self.dataset))]
col_iteration = fits.Column(name='iteration', array=[float(result['iteration']) for result in self.results], format='K')
col_alpha = fits.Column(name='alpha', array=[float(result['alpha']) for result in self.results], format='D')
cols_bkg_norm = [fits.Column(name=key, array=[float(result['background_normalization'][key]) for result in self.results], format='D')
for key in self.dict_bkg_norm.keys()]
cols_loglikelihood = [fits.Column(name=f"{self.dataset[i].name}", array=[float(result['loglikelihood'][i]) for result in self.results], format='D')
for i in range(len(self.dataset))]

table_alpha = fits.BinTableHDU.from_columns([col_iteration, col_alpha])
table_alpha.name = "alpha"
table_alpha = fits.BinTableHDU.from_columns([col_iteration, col_alpha])
table_alpha.name = "alpha"

table_bkg_norm = fits.BinTableHDU.from_columns([col_iteration] + cols_bkg_norm)
table_bkg_norm.name = "bkg_norm"
table_bkg_norm = fits.BinTableHDU.from_columns([col_iteration] + cols_bkg_norm)
table_bkg_norm.name = "bkg_norm"

table_loglikelihood = fits.BinTableHDU.from_columns([col_iteration] + cols_loglikelihood)
table_loglikelihood.name = "loglikelihood"
table_loglikelihood = fits.BinTableHDU.from_columns([col_iteration] + cols_loglikelihood)
table_loglikelihood.name = "loglikelihood"

hdul = fits.HDUList([primary_hdu, table_alpha, table_bkg_norm, table_loglikelihood])
hdul.writeto(f'{self.save_results_directory}/results.fits', overwrite=True)
hdul = fits.HDUList([primary_hdu, table_alpha, table_bkg_norm, table_loglikelihood])
hdul.writeto(f'{self.save_results_directory}/results.fits', overwrite=True)
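The named extensions make the saved tables easy to inspect afterwards; a usage sketch (the path is illustrative and assumes the save directory used above):

from astropy.io import fits

with fits.open('results.fits') as hdul:
    table = hdul['loglikelihood'].data   # one row per iteration
    print(table['iteration'])            # columns are addressable by name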

def calc_alpha(self, delta_model, model):
"""
@@ -267,6 +294,7 @@ def calc_alpha(self, delta_model, model):
float
Acceleration parameter
"""

diff = -1 * (model / delta_model).contents

diff[(diff <= 0) | (delta_model.contents == 0)] = np.inf
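The intent of these two lines is easier to see on a plain array; a worked sketch (the truncation against alpha_max is elided in this hunk, so 10.0 stands in for it):

import numpy as np

model = np.array([1.0, 2.0, 0.5])
delta = np.array([0.5, -1.0, -0.25])
ratio = -1 * (model / delta)                 # step size at which each pixel would hit zero
ratio[(ratio <= 0) | (delta == 0)] = np.inf  # growing pixels never constrain alpha
alpha = min(ratio.min(), 10.0)               # largest safe step, capped at alpha_max
assert np.all(model + alpha * delta >= 0)    # the updated model stays non-negative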
1 change: 1 addition & 0 deletions cosipy/image_deconvolution/__init__.py
@@ -2,6 +2,7 @@

from .image_deconvolution_data_interface_base import ImageDeconvolutionDataInterfaceBase
from .dataIF_COSI_DC2 import DataIF_COSI_DC2
from .dataIFWithParallelSupport import DataIFWithParallel

from .model_base import ModelBase
from .allskyimage import AllSkyImageModel
4 changes: 3 additions & 1 deletion cosipy/image_deconvolution/allskyimage.py
@@ -151,9 +151,11 @@ def set_values_from_parameters(self, parameter):
if algorithm_name == "flat":
unit = u.Unit(algorithm_parameter['unit'])
for idx, value in enumerate(algorithm_parameter['value']):
self[:,idx] = value * unit
self[:,idx] = value * unit # TODO: Why is this indexed as [:, idx] instead of [idx, :]?
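A hedged reading of that TODO, not confirmed by this diff: if AllSkyImageModel orders its axes as (sky pixel, energy bin), then self[:, idx] fills every sky pixel of energy layer idx with a single flat value, which matches the loop over one value per energy bin.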
# elif algorithm_name == ...
# ...
else:
raise ValueError(f'Model algorithm {algorithm_name} not supported')

def set_values_from_extendedmodel(self, extendedmodel):
"""