Compare commits

...

11 Commits

  1. 347
      Analyser/FringeRemoval.py
  2. 156
      Analyser/ImagingAnalyser.py
  3. 445
      DataContainer/MongoDB.py
  4. BIN
      droplet.pdf
  5. BIN
      droplet1.pdf
  6. 4916
      get contrasst of finges.ipynb
  7. 77
      requirements.txt
  8. 1117
      testLoadMongoDB.ipynb

347
Analyser/FringeRemoval.py

@@ -0,0 +1,347 @@
import numpy as np
from scipy.linalg import lu
import xarray as xr


class InvalidDimException(Exception):
    """Raised when the program cannot identify the (index of images, x, y) axes."""
    def __init__(self, dims):
        if len(dims) > 3:
            self.message = 'The input data must have two or three axes: (index of images (optional), x, y)'
        else:
            self.message = 'Cannot identify (index of images (optional), x, y) from ' + str(dims)
        super().__init__(self.message)


class DataSizeException(Exception):
    """Raised when the shape of the data is not correct."""
    def __init__(self):
        self.message = 'The input data size does not match.'
        super().__init__(self.message)
class FringeRemoval():
    """
    FRINGEREMOVAL - Fringe removal and noise reduction from absorption images.

    Creates an optimal reference image for each absorption image in a set as
    a linear combination of reference images, with coefficients chosen to
    minimize the least-squares residuals between each absorption image and
    the optimal reference image. The coefficients are obtained by solving a
    linear set of equations using the matrix inverse obtained by LU decomposition.

    Application of the algorithm is described in C. F. Ockeloen et al., Improved
    detection of small atom numbers through image processing, arXiv:1007.2136 (2010).

    Adapted from a copy of the MATLAB script provided by Guoxian Su.

    Original authors: Shannon Whitlock, Caspar Ockeloen
    Reference: C. F. Ockeloen, A. F. Tauschinsky, R. J. C. Spreeuw, and
               S. Whitlock, Improved detection of small atom numbers through
               image processing, arXiv:1007.2136
    May 2009
    """
    def __init__(self) -> None:
        """Initialize the class."""
        self.nimgsR = 0  # The number of reference images
        self.xdim = 0  # The size of the x axis
        self.ydim = 0  # The size of the y axis
        self._mask = None  # The mask array selecting the region of interest for fringe removal
        self._center = None  # Set the mask array by center and span
        self._span = None
        self.reshape = True  # Whether the data needs to be reshaped from (index of images (optional), x, y) to (y, x, index of images (optional))
        self.P = None
        self.L = None
        self.U = None

    @property
    def center(self):
        """The getter of the center of the region of interest (ROI).

        :return: The center of the region of interest (ROI)
        :rtype: tuple
        """
        return self._center

    @center.setter
    def center(self, value):
        """The setter of the center of the region of interest (ROI).

        :param value: The center of the region of interest (ROI)
        :type value: tuple
        """
        self._mask = None
        self._center = value

    @property
    def span(self):
        """The getter of the span of the region of interest (ROI).

        :return: The span of the region of interest (ROI)
        :rtype: tuple
        """
        return self._span

    @span.setter
    def span(self, value):
        """The setter of the span of the region of interest (ROI).

        :param value: The span of the region of interest (ROI)
        :type value: tuple
        """
        self._mask = None
        self._span = value
    def reshape_data(self, data):
        """Reshape the data to the correct shape.

        To minimize the computation time, the data needs to have a shape of (y, x, index of images (optional)),
        while the input data usually has a shape of (index of images (optional), x, y).
        This function also converts xarray DataArray and Dataset inputs to numpy arrays.

        :param data: The input data.
        :type data: xarray, numpy array or list
        :raises InvalidDimException: Raised when the program cannot identify the (index of images, x, y) axes.
        :return: The data with the correct shape
        :rtype: xarray, numpy array or list
        """
        if data is None:
            return data
        if isinstance(data, type(xr.DataArray())):
            dims = data.dims
            if len(dims) > 3:
                raise InvalidDimException(dims)
            xAxis = None
            yAxis = None
            if len(dims) == 2:
                imageAxis = ''
            else:
                imageAxis = None
            for dim in dims:
                if (dim == 'x') or ('_x' in dim):
                    xAxis = dim
                elif (dim == 'y') or ('_y' in dim):
                    yAxis = dim
                else:
                    imageAxis = dim
            if (xAxis is None) or (yAxis is None) or (imageAxis is None):
                raise InvalidDimException(dims)
            if len(dims) == 2:
                data = data.transpose(yAxis, xAxis)
            else:
                data = data.transpose(yAxis, xAxis, imageAxis)
            data = data.to_numpy()
        else:
            data = np.array(data)
            if len(data.shape) == 3:
                data = np.swapaxes(data, 0, 2)
                # data = np.swapaxes(data, 0, 1)
            elif len(data.shape) == 2:
                data = np.swapaxes(data, 0, 1)
        return data
    def _reshape_absorption_images(self, data):
        if data is None:
            return data
        if isinstance(data, type(xr.DataArray())):
            dims = data.dims
            if len(dims) > 3:
                raise InvalidDimException(dims)
            xAxis = None
            yAxis = None
            if len(dims) == 2:
                imageAxis = ''
            else:
                imageAxis = None
            for dim in dims:
                if (dim == 'x') or ('_x' in dim):
                    xAxis = dim
                elif (dim == 'y') or ('_y' in dim):
                    yAxis = dim
                else:
                    imageAxis = dim
            if (xAxis is None) or (yAxis is None) or (imageAxis is None):
                raise InvalidDimException(dims)
            if len(dims) == 2:
                data = data.transpose(yAxis, xAxis)
            else:
                data = data.transpose(yAxis, xAxis, imageAxis)
                self.nimgs = len(data[imageAxis])
            data = data.stack(axis=[yAxis, xAxis])
        else:
            data = np.array(data)
            if len(data.shape) == 3:
                data = np.swapaxes(data, 0, 2)
                # data = np.swapaxes(data, 0, 1)
            elif len(data.shape) == 2:
                data = np.swapaxes(data, 0, 1)
        return data
    @property
    def referenceImages(self):
        res = self._referenceImages.reshape(self.ydim, self.xdim, self.nimgsR)
        res = np.swapaxes(res, 0, 2)
        return res

    @referenceImages.setter
    def referenceImages(self, value):
        if value is None:
            self._referenceImages = None
            return
        if self.reshape:
            value = self.reshape_data(value)
        elif isinstance(value, type(xr.DataArray())):
            value = value.to_numpy()
        self.nimgsR = value.shape[2]
        self.xdim = value.shape[1]
        self.ydim = value.shape[0]
        self._referenceImages = (value.reshape(self.xdim * self.ydim, self.nimgsR).astype(np.float32))

    def add_reference_images(self, data):
        """Add a new reference image.

        :param data: The new reference image.
        :type data: xarray, numpy array or list
        :raises DataSizeException: Raised when the shape of the data is not correct.
        """
        if self.reshape:
            data = self.reshape_data(data)
        elif isinstance(data, type(xr.DataArray())):
            data = data.to_numpy()
        if not ((data.shape[0] == self.ydim) and (data.shape[1] == self.xdim)):
            raise DataSizeException
        data = data.reshape(self.xdim * self.ydim, 1)  # keep a column shape so np.append can extend along axis=1
        self._referenceImages = np.append(self._referenceImages, data, axis=1)

    def _remove_first_reference_images(self):
        """Remove the first reference image."""
        self._referenceImages = np.delete(self._referenceImages, 0, axis=1)

    def update_reference_images(self, data):
        """Update the reference image set by removing the first image and appending a new one at the end.

        :param data: The new reference image.
        :type data: xarray, numpy array or list
        """
        self._remove_first_reference_images()
        self.add_reference_images(data)
        self.decompose_referenceImages()
    @property
    def mask(self):
        return self._mask

    @mask.setter
    def mask(self, value):
        if self.reshape:
            value = self.reshape_data(value)
        elif isinstance(value, type(xr.DataArray())):
            value = value.to_numpy()
        if not ((value.shape[0] == self.ydim) and (value.shape[1] == self.xdim)):
            raise DataSizeException
        self._mask = value
        self._center = None
        self._span = None
        self.k = np.where(self._mask.flatten() == 1)[0]

    def _auto_mask(self):
        mask = np.ones((self.ydim, self.xdim), dtype=np.uint8)
        if not self._center is None:
            x_start = int(self._center[0] - self._span[0] / 2)
            x_end = int(self._center[0] + self._span[0] / 2)
            y_start = int(self._center[1] - self._span[1] / 2)
            y_end = int(self._center[1] + self._span[1] / 2)
            mask[y_start:y_end, x_start:x_end] = 0
        return mask

    def decompose_referenceImages(self):
        if self._mask is None:
            self.mask = self._auto_mask()
        self.P, self.L, self.U = lu(self._referenceImages[self.k, :].T @ self._referenceImages[self.k, :], permute_l=False, p_indices=True)

    def _fringe_removal(self, absorptionImages):
        b = self.temp @ absorptionImages[self.k]
        c = np.linalg.solve(self.U, np.linalg.solve(self.L[self.P], b))
        optrefimages = self._referenceImages @ c
        return optrefimages
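
    # Note (added annotation, not part of the commit): with R the (pixels, nimgsR)
    # reference matrix restricted to the masked pixel rows k, the least-squares
    # coefficients c of the optimal reference for an absorption image a solve the
    # normal equations (R_k^T R_k) c = R_k^T a_k. decompose_referenceImages() factors
    # R_k^T R_k = L[P] @ U once, so _fringe_removal() only needs the product
    # b = R_k^T a_k and two triangular solves per image.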
    def fringe_removal(self, absorptionImages, referenceImages=None, mask=None, reshape=None, dask='parallelized'):
        """Generate a 'fake' background image for each absorption image, which helps to remove the fringes.

        Important: Please subtract the dark images from both the images with atoms and the images without atoms before using this function!

        :param absorptionImages: A set of images with atoms in absorption imaging
        :type absorptionImages: xarray, numpy array or list
        :param referenceImages: A set of images without atoms in absorption imaging, defaults to None
        :type referenceImages: xarray, numpy array or list, optional
        :param mask: An array selecting the region of interest for fringe removal, defaults to None
        :type mask: numpy array, optional
        :param reshape: Whether the data needs to be reshaped, defaults to None
        :type reshape: bool, optional
        :param dask: Please refer to xarray.apply_ufunc()
        :type dask: {"forbidden", "allowed", "parallelized"}, optional
        :return: The 'fake' background that helps to remove the fringes
        :rtype: xarray array
        """
        if not reshape is None:
            self.reshape = reshape
        if not referenceImages is None:
            self.referenceImages = referenceImages
        if not mask is None:
            self.mask = mask
        if self.P is None:
            self.decompose_referenceImages()
        if self.reshape:
            absorptionImages = self._reshape_absorption_images(absorptionImages)
        self.temp = self._referenceImages[self.k, :].T
        optrefimages = xr.apply_ufunc(self._fringe_removal, absorptionImages, input_core_dims=[['axis']], output_core_dims=[['axis']], dask=dask, vectorize=True, output_dtypes=float)
        return optrefimages.unstack()
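
Note: a minimal usage sketch of FringeRemoval (not part of this commit; the image size, the random data and all variable names are illustrative assumptions):

import numpy as np
import xarray as xr
from Analyser.FringeRemoval import FringeRemoval

rng = np.random.default_rng(0)
# Five dark-subtracted reference images and three absorption images, in the
# (index of images, x, y) layout that reshape_data() expects.
refs = xr.DataArray(rng.normal(size=(5, 100, 100)), dims=['imgIdx', 'x', 'y'])
atoms = xr.DataArray(rng.normal(size=(3, 100, 100)), dims=['imgIdx', 'x', 'y'])

fr = FringeRemoval()
fr.referenceImages = refs  # reshaped internally to (y, x, imgIdx)
fr.center = (50, 50)       # the atom region is excluded from the fit,
fr.span = (20, 20)         # so only the fringe pattern around it is matched
fakeBackground = fr.fringe_removal(atoms)

The returned DataArray has the same layout as the input and can be passed to get_OD_no_dark() below in place of the measured background.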

156
Analyser/ImagingAnalyser.py

@@ -2,6 +2,10 @@ import numpy as np
import xarray as xr
import copy

from DataContainer.ReadData import read_hdf5_file
from Analyser.FringeRemoval import FringeRemoval
from ToolFunction.ToolFunction import get_scanAxis


class ImageAnalyser():
    """A class for operating on and analysing images
@@ -15,11 +19,15 @@ class ImageAnalyser():
            'background': 'background',
            'dark': 'dark',
            'OD': 'OD',
            'optimumBackground': 'optimumBackground',
        }
        self._center = None
        self._span = None
        self._fraction = None
        self._fringeRemoval = FringeRemoval()
        self.fringeRemovalReferenceImages = None

    @property
    def image_name(self):
        """The getter of the names of the three standard images for absorption imaging
@@ -150,7 +158,7 @@ class ImageAnalyser():
        res.attrs = copy.copy(dataArray.attrs)
        return res

-    def crop_image(self, dataSet, center=None, span=None):
    def crop_image(self, dataSet, center=None, span=None, fringeRemoval=False):
        """Crop the image according to the region of interest (ROI).

        :param dataSet: The images
@@ -159,6 +167,8 @@ class ImageAnalyser():
        :type center: tuple, optional
        :param span: The span of the region of interest (ROI), defaults to None
        :type span: tuple, optional
        :param fringeRemoval: Whether to also crop the reference background images for the fringe removal function, defaults to False
        :type fringeRemoval: bool, optional
        :return: The cropped images
        :rtype: xarray DataArray or DataSet
        """
@@ -192,6 +202,13 @@ class ImageAnalyser():
            dataSet[key].attrs['y_center'] = center[1]
            dataSet[key].attrs['x_span'] = span[0]
            dataSet[key].attrs['y_span'] = span[1]

        if fringeRemoval:
            scanAxis = list(get_scanAxis(self.fringeRemovalReferenceImages))
            if not scanAxis[1] is None:
                self._fringeRemoval.referenceImages = self.fringeRemovalReferenceImages.isel(x=slice(x_start, x_end), y=slice(y_start, y_end)).stack(_imgIdx=scanAxis)
            else:
                self._fringeRemoval.referenceImages = self.fringeRemovalReferenceImages.isel(x=slice(x_start, x_end), y=slice(y_start, y_end))

        return dataSet.isel(x=slice(x_start, x_end), y=slice(y_start, y_end))
@@ -220,6 +237,32 @@ class ImageAnalyser():
            return imageOD[0]
        else:
            return imageOD

    def get_OD_no_dark(self, imageAtom, imageBackground):
        """Calculate the OD image for absorption imaging without dark images.

        :param imageAtom: The image with atoms
        :type imageAtom: numpy array
        :param imageBackground: The image without atoms
        :type imageBackground: numpy array
        :return: The OD images
        :rtype: numpy array
        """
        numerator = np.atleast_1d(imageBackground)
        denominator = np.atleast_1d(imageAtom)
        numerator[numerator == 0] = 1
        denominator[denominator == 0] = 1
        imageOD = np.abs(np.divide(denominator, numerator))
        imageOD = -np.log(imageOD)

        if len(imageOD) == 1:
            return imageOD[0]
        else:
            return imageOD
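
    # Note (added annotation, not part of the commit): both OD helpers implement the
    # Beer-Lambert estimate OD = -ln(I_atoms / I_reference). get_OD (unchanged here,
    # body not shown) additionally takes the dark frame as input, while get_OD_no_dark
    # expects dark-subtracted inputs such as the optimal background from FringeRemoval.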
    def get_Ncount(self, dataSet, dim=['x', 'y'], **kwargs):
        """Sum all the values in the image to give the Ncount.

@@ -233,11 +276,13 @@ class ImageAnalyser():
        """
        return dataSet.sum(dim=dim, **kwargs)
-    def get_absorption_images(self, dataSet, dask='allowed', keep_attrs=True, **kwargs):
    def get_absorption_images(self, dataSet, fringeRemoval=False, dask='allowed', keep_attrs=True, **kwargs):
        """Calculate the OD images for absorption imaging.

        :param dataSet: The data from absorption imaging.
        :type dataSet: xarray DataSet
        :param fringeRemoval: Whether to use the fringe removal function, defaults to False
        :type fringeRemoval: bool, optional
        :param dask: Overwrites the same argument in xarray.apply_ufunc, defaults to 'allowed'
        :type dask: str, optional
        :param keep_attrs: Overwrites the same argument in xarray.apply_ufunc, defaults to True
@@ -253,11 +298,33 @@ class ImageAnalyser():
            }
        )

-        dataSet = dataSet.assign(
-            {
-                self._image_name['OD']: xr.apply_ufunc(self.get_OD, dataSet[self._image_name['atoms']], dataSet[self._image_name['background']], dataSet[self._image_name['dark']], **kwargs)
-            }
-        )
        if fringeRemoval:
            dataSetAtoms = dataSet[self._image_name['atoms']] - dataSet[self._image_name['dark']]
            scanAxis = list(get_scanAxis(dataSet))
            if not scanAxis[1] is None:
                OptimumRef = self._fringeRemoval.fringe_removal(dataSetAtoms.stack(_imgIdx=scanAxis))
            else:
                OptimumRef = self._fringeRemoval.fringe_removal(dataSetAtoms)
            dataSet = dataSet.assign(
                {
                    self._image_name['optimumBackground']: OptimumRef
                }
            )
            dataSet = dataSet.assign(
                {
                    self._image_name['OD']: xr.apply_ufunc(self.get_OD_no_dark, dataSetAtoms, dataSet[self._image_name['optimumBackground']], **kwargs)
                }
            )
        else:
            dataSet = dataSet.assign(
                {
                    self._image_name['OD']: xr.apply_ufunc(self.get_OD, dataSet[self._image_name['atoms']], dataSet[self._image_name['background']], dataSet[self._image_name['dark']], **kwargs)
                }
            )
        # dataSet[self._image_name['OD']].attrs.update(dataSet.attrs)
@@ -282,6 +349,77 @@ class ImageAnalyser():
        )

        xr.apply_ufunc(self.get_OD, dataSet[self._image_name['atoms']], dataSet[self._image_name['background']], dataSet[self._image_name['dark']], **kwargs)
    @property
    def fringeRemovalCenter(self):
        """The getter of the center of the region of interest (ROI).

        :return: The center of the region of interest (ROI)
        :rtype: tuple
        """
        return self._fringeRemoval.center

    @fringeRemovalCenter.setter
    def fringeRemovalCenter(self, value):
        """The setter of the center of the region of interest (ROI).

        :param value: The center of the region of interest (ROI)
        :type value: tuple
        """
        self._fringeRemoval.center = value

    @property
    def fringeRemovalSpan(self):
        """The getter of the span of the region of interest (ROI).

        :return: The span of the region of interest (ROI)
        :rtype: tuple
        """
        return self._fringeRemoval.span

    @fringeRemovalSpan.setter
    def fringeRemovalSpan(self, value):
        """The setter of the span of the region of interest (ROI).

        :param value: The span of the region of interest (ROI)
        :type value: tuple
        """
        self._fringeRemoval.span = value
    def load_fringe_removal_background_from_hdf5(self, img_dir, SequenceName, date, shotNum, group, crop=False, load=False, **kwargs):
        """Load the reference background images from the hdf5 files of one single shot.

        :param img_dir: The path of the folder storing the data.
        :type img_dir: str
        :param SequenceName: The name of the sequence
        :type SequenceName: str
        :param date: The date when the shot was taken, in 'YYYY/MM/DD'.
        :type date: str
        :param shotNum: The number of the shot
        :type shotNum: str
        :param group: The name of the group storing the images
        :type group: str
        :param crop: Whether to crop the data, defaults to False
        :type crop: bool, optional
        :param load: Whether to load the data into RAM, defaults to False
        :type load: bool, optional
        """
        folderPath = img_dir + SequenceName + "/" + date
        filePath = folderPath + "/" + shotNum + "/*.h5"

        dataSet = read_hdf5_file(filePath, group, **kwargs)

        scanAxis = dataSet.scanAxis
        dataSet = dataSet[self._image_name['background']] - dataSet[self._image_name['dark']]
        dataSet.attrs['scanAxis'] = scanAxis

        if crop:
            dataSet = self.crop_image(dataSet)

        if load:
            self.fringeRemovalReferenceImages = dataSet.load()
        else:
            self.fringeRemovalReferenceImages = dataSet

    def load_fringe_removal_background_from_database(self):
        pass
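
Note: a sketch of how the new fringe-removal path is meant to be driven end to end (the paths, HDF5 group name, shot numbers and ROI values are placeholders, not values from this commit):

from Analyser.ImagingAnalyser import ImageAnalyser
from DataContainer.ReadData import read_hdf5_file

analyser = ImageAnalyser()

# Region containing the atoms, to be excluded from the fringe fit.
analyser.fringeRemovalCenter = (250, 250)
analyser.fringeRemovalSpan = (100, 100)

# Dark-subtracted backgrounds of an earlier shot serve as the reference set.
analyser.load_fringe_removal_background_from_hdf5(
    img_dir='/path/to/data/', SequenceName='ExampleSequence', date='2023/09/20',
    shotNum='0000', group='images/absorption')

# crop_image(fringeRemoval=True) crops the reference set to the same ROI, and
# get_absorption_images(fringeRemoval=True) then computes the OD against the
# fitted optimal background instead of the measured one.
dataSet = read_hdf5_file('/path/to/data/ExampleSequence/2023/09/20/0001/*.h5', 'images/absorption')
dataSet = analyser.crop_image(dataSet, center=(250, 250), span=(150, 150), fringeRemoval=True)
dataSet = analyser.get_absorption_images(dataSet, fringeRemoval=True)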

445
DataContainer/MongoDB.py

@@ -2,12 +2,17 @@ from collections import OrderedDict
import numpy as np
import pymongo
from pymongo import MongoClient
import xarray_mongodb
import bson
import builtins

import xarray as xr

# import sys
# # sys.path.insert(0, 'C:/Users/Fabrizio Klassen/PycharmProjects/DyLabDataViewer/src/bin/Analyser/AnalyserScript')
# import sys
# sys.path.append('../')
# from bin.Analyser.AnalyserScript.ToolFunction.ToolFunction import get_date
from ToolFunction.ToolFunction import get_date

@@ -18,7 +23,7 @@ npArrayType = type(np.array([0]))

class MongoDB:
    """A class for communicating with our MongoDB.
    """

    def __init__(self, mongoClient, mongoDB, date=None) -> None:
        """Initialize the class with the given handles to our MongoDB client and database.
@@ -32,11 +37,11 @@ class MongoDB:
        self.mongoClient = mongoClient
        self.mongoDB = mongoDB
        self.xdb = xarray_mongodb.XarrayMongoDB(mongoDB)

        if date is None:
            date = get_date()
        self.set_date(date)

    def _convert_numpy_type(self, data):
        """Convert from numpy types to normal python types.

@@ -45,6 +50,10 @@ class MongoDB:
        :return: The converted data
        :rtype: normal python data type
        """
        if data is None:
            return None
        for key in data:
            typeKey = type(data[key])
            if typeKey in npTypeDict:
@@ -57,7 +66,7 @@ class MongoDB:
            except:
                pass
        return data
    def _break_dataSet(self, dataSet, scanAxis=None):
        """Stack the scan axes of the data.

@@ -68,16 +77,16 @@ class MongoDB:
        :return: The stacked xarray DataSet or DataArray storing the data
        :rtype: xarray DataSet or DataArray
        """
        if scanAxis is None:
            scanAxis = dataSet.attrs['scanAxis']

        dataArray = dataSet.shotNum
        stackedDataArray = dataArray.stack(_scanAxis=tuple(scanAxis))

        return stackedDataArray

    def set_date(self, date):
        """Set the date of the data.

@@ -88,8 +97,8 @@ class MongoDB:
        self.year = int(date[0])
        self.month = int(date[1])
        self.day = int(date[2])
-    def create_global(self, shotNum, dataSet=None, date=None):
    def create_global(self, shotNum, dataSet=None, date=None, overwrite=True, runNum=None):
        """Create the global document in MongoDB.

        :param shotNum: The shot number
@@ -98,40 +107,66 @@ class MongoDB:
        :type dataSet: xarray DataSet, optional
        :param date: The date of the data, defaults to None
        :type date: str, optional
        :param overwrite: Whether to overwrite an existing global document, defaults to True
        :type overwrite: bool, optional
        :param runNum: The run number, defaults to None
        :type runNum: int, optional
        """
        if not date is None:
            self.set_date(date)

-        data = {
-            'year': self.year,
-            'month': self.month,
-            'day': self.day,
-            'shotNum': shotNum,
-        }
-        self.mongoDB['global'].delete_many(data)
        if runNum is None:
            data = {
                'year': self.year,
                'month': self.month,
                'day': self.day,
                'shotNum': shotNum,
            }
            runNum = 0
        else:
            data = {
                'year': self.year,
                'month': self.month,
                'day': self.day,
                'shotNum': shotNum,
                'runNum': runNum,
            }

        if overwrite:
            self.mongoDB['global'].delete_many(data)
        else:
            res = self.mongoDB['global'].find_one(data)
            if not res is None:
                if not len(res) == 0:
                    return

        data = {
            'year': self.year,
            'month': self.month,
            'day': self.day,
            'shotNum': shotNum,
-            'runNum': 0,
            'runNum': runNum,
            'global_parameters': {},
        }

-        global_parameters = self._convert_numpy_type(dataSet.attrs)
        if dataSet is None:
            self.mongoDB['global'].insert_one(data)
            return

-        if not dataSet is None:
-            data['global_parameters'].update(global_parameters)
-            data = self._convert_numpy_type(data)
        if ('scanAxis' in dataSet.attrs) and len(dataSet.attrs['scanAxis']) == 0:
            del dataSet.attrs['scanAxis']
            del dataSet.attrs['scanAxisLength']

        global_parameters = self._convert_numpy_type(dataSet.attrs)
        data['global_parameters'].update(global_parameters)
        data = self._convert_numpy_type(data)

        if 'scanAxis' in dataSet.attrs:
            del data['global_parameters']['scanAxis']
            del data['global_parameters']['scanAxisLength']
            scanAxis = dataSet.attrs['scanAxis']
            data['global_parameters'].update(
                {
@@ -139,40 +174,40 @@ class MongoDB:
                    for key in scanAxis
                }
            )
            stackedDataArray = self._break_dataSet(dataSet)
            try:
                stackedDataArray.load()
            except:
                pass
            stackedDataArray = stackedDataArray.groupby('_scanAxis')

            for i in stackedDataArray:
                stackedDataArray_single = i[1]
                data.update(
                    {
                        'runNum': int(stackedDataArray_single.item())
                    }
                )
                data['global_parameters'].update(
                    {
                        key: stackedDataArray_single[key].item()
                        for key in scanAxis
                    }
                )
                if '_id' in data:
                    del data['_id']
                self.mongoDB['global'].insert_one(data)
        else:
            self.mongoDB['global'].insert_one(data)
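
    # Note (added annotation, not part of the commit): every run of a shot gets its own
    # 'global' document keyed by (year, month, day, shotNum, runNum), and the values of
    # the scanned parameters are unpacked into 'global_parameters' per run, so that
    # individual runs can be filtered directly in MongoDB queries.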
    def _add_data_normal(self, shotNum, runNum, data):
        """Write the data directly into the global document.

@@ -183,21 +218,21 @@ class MongoDB:
        :param data: The data to be written
        :type data: normal python data type
        """
        if runNum is None:
            runNum = 0

        filter = {
            'year': self.year,
            'month': self.month,
            'day': self.day,
            'shotNum': shotNum,
            'runNum': runNum,
        }

        self.mongoDB['global'].update_one(filter, {"$set": data}, upsert=False)
-    def _add_data_xarray_dataArray(self, shotNum, dataArray, name=None, scanAxis=None):
    def _add_data_xarray_dataArray(self, shotNum, dataArray, name=None, scanAxis=None, runNum=None):
        """Write data of the type xarray DataArray to the MongoDB.

        :param shotNum: The shot number
@@ -212,13 +247,45 @@ class MongoDB:
        if scanAxis is None:
            scanAxis = list(dataArray.coords)
        if name is None:
            name = dataArray.name
        dataArray.attrs = self._convert_numpy_type(dataArray.attrs)

        if scanAxis is None or len(scanAxis) == 0:
            if runNum is None:
                return
            filter = {
                'year': self.year,
                'month': self.month,
                'day': self.day,
                'shotNum': shotNum,
                'runNum': runNum,
            }
            mongoID, _ = self.xdb.put(dataArray)
            data_label = {
                name:
                {
                    'name': name,
                    'mongoID': mongoID,
                    'engine': 'xarray',
                    'dtype': 'dataArray',
                }
            }
            self.mongoDB['global'].update_one(filter, {"$set": data_label}, upsert=False)
            return

        stackedDataArray = dataArray.stack(_scanAxis=tuple(scanAxis))
        stackedDataArray = stackedDataArray.groupby('_scanAxis')

        filter = {
            'year': self.year,
            'month': self.month,
            'day': self.day,
@@ -226,31 +293,31 @@ class MongoDB:
        }

        for i in stackedDataArray:
            stackedDataArray_single = i[1].drop('_scanAxis')
            global_parameters = {
                'global_parameters.' + key: stackedDataArray_single[key].item()
                for key in scanAxis
            }
            filter.update(global_parameters)
            mongoID, _ = self.xdb.put(stackedDataArray_single)
            data_label = {
-                dataArray.name:
                name:
                {
-                    'name': dataArray.name,
                    'name': name,
                    'mongoID': mongoID,
                    'engine': 'xarray',
                    'dtype': 'dataArray',
                }
            }
            self.mongoDB['global'].update_one(filter, {"$set": data_label}, upsert=False)
-    def _add_data_xarray_dataSet(self, shotNum, dataSet, name, scanAxis=None):
    def _add_data_xarray_dataSet(self, shotNum, dataSet, name, scanAxis=None, runNum=None):
        """Write data of the type xarray DataSet to the MongoDB.

        :param shotNum: The shot number
@@ -262,40 +329,69 @@ class MongoDB:
        :param scanAxis: The scan axes of the data, defaults to None
        :type scanAxis: array like, optional
        """
        if scanAxis is None:
            scanAxis = list(dataSet.coords)
        dataSet.attrs = self._convert_numpy_type(dataSet.attrs)
        for key in list(dataSet.data_vars):
            dataSet[key].attrs = self._convert_numpy_type(dataSet[key].attrs)

        if scanAxis is None or len(scanAxis) == 0:
            if runNum is None:
                return
            filter = {
                'year': self.year,
                'month': self.month,
                'day': self.day,
                'shotNum': shotNum,
                'runNum': runNum,
            }
            mongoID, _ = self.xdb.put(dataSet)
            data_label = {
                name:
                {
                    'name': name,
                    'mongoID': mongoID,
                    'engine': 'xarray',
                    'dtype': 'dataSet',
                }
            }
            self.mongoDB['global'].update_one(filter, {"$set": data_label}, upsert=False)
            return

        stackedDataSet = dataSet.stack(_scanAxis=tuple(scanAxis))
        stackedDataSet = stackedDataSet.groupby('_scanAxis')

        filter = {
            'year': self.year,
            'month': self.month,
            'day': self.day,
            'shotNum': shotNum,
        }

        for i in stackedDataSet:
            stackedDataSet_single = i[1].drop('_scanAxis')
            global_parameters = {
                'global_parameters.' + key: stackedDataSet_single[key].item()
                for key in scanAxis
            }
            filter.update(global_parameters)
-            mongoID, _ = self.xdb.put(dataSet)
            mongoID, _ = self.xdb.put(stackedDataSet_single)
            data_label = {
                name:
                {
                    'name': name,
                    'mongoID': mongoID,
@@ -303,9 +399,9 @@ class MongoDB:
                    'dtype': 'dataSet',
                }
            }
            self.mongoDB['global'].update_one(filter, {"$set": data_label}, upsert=False)
    def _add_data_additional(self, shotNum, runNum, data, name):
        """Write the data into an additional document.

@@ -318,22 +414,22 @@ class MongoDB:
        :param name: The name of the data
        :type name: str
        """
        if runNum is None:
            runNum = 0

        filter = {
            'year': self.year,
            'month': self.month,
            'day': self.day,
            'shotNum': shotNum,
            'runNum': runNum,
        }

        mongoID = self.mongoDB.additional.insert_one(data).inserted_id
        data_label = {
            name:
            {
                'name': name,
                'mongoID': mongoID,
@@ -341,9 +437,9 @@ class MongoDB:
                'dtype': 'dict',
            }
        }
        self.mongoDB['global'].update_one(filter, {"$set": data_label}, upsert=False)
    def add_data(self, shotNum, data, runNum=None, date=None, name=None, engine='normal'):
        """Write new data to the MongoDB.

@@ -362,17 +458,17 @@ class MongoDB:
        """
        if not date is None:
            self.set_date(date)

        if engine == 'normal':
            self._add_data_normal(shotNum=shotNum, runNum=runNum, data=data)
        elif engine == 'xarray':
            if isinstance(data, type(xr.Dataset())):
-                self._add_data_xarray_dataSet(shotNum=shotNum, dataSet=data, name=name)
                self._add_data_xarray_dataSet(shotNum=shotNum, dataSet=data, runNum=runNum, name=name)
            else:
-                self._add_data_xarray_dataArray(shotNum=shotNum, dataArray=data, name=name)
                self._add_data_xarray_dataArray(shotNum=shotNum, dataArray=data, runNum=runNum, name=name)
        elif engine == 'additional':
            self._add_data_additional(shotNum=shotNum, runNum=runNum, data=data, name=name)
    def read_global_single(self, shotNum, runNum, date=None):
        """Read the global document of the specified shot and run from MongoDB.

@@ -385,20 +481,20 @@ class MongoDB:
        :return: The global document
        :rtype: dict
        """
        if not date is None:
            self.set_date(date)

        filter = {
            'year': self.year,
            'month': self.month,
            'day': self.day,
            'shotNum': shotNum,
            'runNum': runNum,
        }

        return self.mongoDB['global'].find_one(filter)
    def read_global_all(self, shotNum, date=None):
        """Read the global documents of all runs of the specified shot from MongoDB, and extract the scan axes.

@@ -409,29 +505,28 @@ class MongoDB:
        :return: The global document
        :rtype: dict
        """
        from xarray.core.utils import equivalent

        if not date is None:
            self.set_date(date)

        filter = {
            'year': self.year,
            'month': self.month,
            'day': self.day,
            'shotNum': shotNum,
        }

        result = {}
        dropped_attrs = OrderedDict()
        docs = self.mongoDB['global'].find(filter).sort('runNum')
        docs = [doc['global_parameters'] for doc in docs]

        for doc in docs:
            global_parameters = doc
            result.update(
                {
                    key: value
@@ -439,34 +534,34 @@ class MongoDB:
                    if key not in result and key not in dropped_attrs.keys()
                }
            )
            result = {
                key: value
                for key, value in result.items()
                if key not in global_parameters or equivalent(global_parameters[key], value)
            }
            dropped_attrs.update(
                {
                    key: []
                    for key in global_parameters if key not in result
                }
            )

        for doc in docs:
            global_parameters = doc
            dropped_attrs.update(
                {
                    key: np.append(dropped_attrs[key], global_parameters[key])
                    for key in dropped_attrs.keys()
                }
            )

        scan_attrs = OrderedDict()
        scan_length = []
        for attrs_key in dropped_attrs.keys():
            flag = True
            for key in scan_attrs.keys():
@@ -495,7 +590,7 @@ class MongoDB:
        )

        return result
    def _load_data_single(self, mongoID, engine):
        """Load the document linked to the given mongoID.

@@ -506,12 +601,12 @@ class MongoDB:
        :return: The loaded document
        :rtype: dict or xarray object
        """
        if engine == 'xarray':
            return self.xdb.get(mongoID)
        if engine == 'additional':
            return self.mongoDB.additional.find_one({'_id': mongoID})

    def load_data_single(self, shotNum=None, runNum=None, globalDict=None, date=None, field=None):
        """Go through the given global document, find all the MongoDB objects, and replace them with the documents they link to.

@@ -528,31 +623,143 @@ class MongoDB:
        :return: The document with the loaded data
        :rtype: dict
        """
        if not date is None:
            self.set_date(date)

        if globalDict is None:
            globalDict = self.read_global_single(shotNum=shotNum, runNum=runNum)
        if field is None:
            field = globalDict

        res = {}
        for key in field:
            if isinstance(globalDict[key], dict) and ('mongoID' in globalDict[key]):
                mongoID = globalDict[key]['mongoID']
                engine = globalDict[key]['engine']
                res.update(
                    {
                        key: self._load_data_single(mongoID=mongoID, engine=engine)
                    }
                )
        return res
-    def load_data(self, shotNum=None, globalDict=None, date=None, field=None):
-        # load all the data of specified shot
-        pass
    def load_data(self, shotNum, data_key=None, globalDict=None, date=None):
        """Load the observables of a given shot.

        The documents of a given shot can carry a variety of data types, e.g. optical density,
        N_count, centerx, etc. In order not to load all the data and use too much RAM, the user
        is presented with a drop-down listing all available observables. Only after the selection
        is the actual data loaded.

        :param shotNum: The shot number
        :type shotNum: str
        :param data_key: The keys of the data to load, defaults to None (load everything)
        :type data_key: list, optional
        :param globalDict: All global parameters plus the scan axes and their lengths, defaults to None
        :type globalDict: dict, optional
        :param date: The date of the data ('YYYY/MM/DD'), defaults to None
        :type date: str, optional
        :return: All the data of the given shot, including the global parameters and the date
        :rtype: dict
        """
        # set the date
        if not date is None:
            self.set_date(date)
        # collect the global parameters and scan axes
        if globalDict is None:
            globalDict = self.read_global_all(shotNum=shotNum, date=date)
        # initialize the output dictionary
        res = {'year': self.year, 'month': self.month, 'day': self.day, 'global_parameters': {}}
        # add all global parameters except the scan axes
        res['global_parameters'].update(
            {
                key: value
                for key, value in globalDict.items()
                if key not in ['scanAxis', 'scanAxisLength']
            }
        )
        # find the matching documents
        filter = {
            'year': self.year,
            'month': self.month,
            'day': self.day,
            'shotNum': shotNum,
        }
        docs = self.mongoDB['global'].find(filter).sort('runNum')
        # default to every data key found in the first document
        if data_key is None:
            data_key = [key for key in docs[0] if not key in ['year', 'month', 'day', 'shotNum', 'runNum', 'global_parameters', '_id']]
        for key in data_key:
            res[key] = self._load_data(shotNum=shotNum, data_key=key, globalDict=globalDict)
        res['global_parameters'].update(
            {
                'scanAxis': globalDict['scanAxis'],
                'scanAxisLength': globalDict['scanAxisLength'],
            }
        )
        return res
    def _load_data(self, shotNum, data_key, globalDict):
        """Load the data stored under one key for all runs of the specified shot.

        Goes through the matching global documents, finds the MongoDB objects stored under
        data_key, and replaces them with the documents they link to.

        :param shotNum: The shot number
        :type shotNum: str
        :param data_key: The key of the data to load
        :type data_key: str
        :param globalDict: All global parameters plus the scan axes and their lengths
        :type globalDict: dict
        :return: The data from all runs of the given shot
        :rtype: xarray object or list
        """
        # collect the data from all documents of the given shot
        filter = {
            'year': self.year,
            'month': self.month,
            'day': self.day,
            'shotNum': shotNum,
        }
        # find the matching documents
        docs = self.mongoDB['global'].find(filter).sort('runNum')
        data = []
        i = 0
        engine = None  # guards the combine step below when no document matches
        for doc in docs:
            key = data_key
            if isinstance(doc[key], dict) and ('mongoID' in doc[key]):
                mongoID = doc[key]['mongoID']
                engine = doc[key]['engine']
                single_data = self._load_data_single(mongoID=mongoID, engine=engine)
                for axis in globalDict['scanAxis']:
                    if not axis in single_data.coords:
                        single_data = single_data.assign_coords({axis: globalDict[axis][i]})
                    if not axis in single_data.dims:
                        single_data = single_data.expand_dims(axis)
            else:
                engine = None
                single_data = doc[key]
            data.append(single_data)
            i = i + 1
        # combine the data along the coordinate axes
        try:
            if engine == 'xarray':
                data = xr.combine_by_coords(data)
        except:
            pass
        return data
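
Note: a sketch of the intended round trip with this class (the connection string, database name and shot identifiers are placeholders; dataSet stands for an analysed xarray Dataset such as the one produced by ImageAnalyser above):

from pymongo import MongoClient
from DataContainer.MongoDB import MongoDB

client = MongoClient('mongodb://localhost:27017/')
mongoDB = MongoDB(client, client['experimentData'], date='2023/09/20')

# One 'global' document per run, with the scanned parameters unpacked per run.
mongoDB.create_global('0000', dataSet=dataSet)

# Attach an xarray object to every run document of the shot.
mongoDB.add_data('0000', dataSet, name='absorption_images', engine='xarray')

# Read back: the scan axes are reconstructed from the per-run documents, and the
# linked objects are only loaded for the requested keys.
globalDict = mongoDB.read_global_all('0000')
result = mongoDB.load_data('0000', data_key=['absorption_images'])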

BIN
droplet.pdf

Binary file not shown.

BIN
droplet1.pdf

Binary file not shown.

4916
get contrasst of finges.ipynb
File diff suppressed because one or more lines are too long

77
requirements.txt

@@ -0,0 +1,77 @@
asteval==0.9.31
asttokens==2.4.0
backcall==0.2.0
bokeh==3.2.2
click==8.1.7
cloudpickle==2.2.1
colorama==0.4.6
comm==0.1.4
contourpy==1.1.1
cycler==0.11.0
dask==2023.9.2
debugpy==1.8.0
decorator==5.1.1
distributed==2023.9.2
dnspython==2.4.2
exceptiongroup==1.1.3
executing==1.2.0
finufft==2.1.0
fonttools==4.42.1
fsspec==2023.9.1
future==0.18.3
h5netcdf==1.2.0
h5py==3.9.0
importlib-metadata==6.8.0
importlib-resources==6.1.0
ipykernel==6.25.2
ipython==8.15.0
jedi==0.19.0
Jinja2==3.1.2
jupyter_client==8.3.1
jupyter_core==5.3.1
kiwisolver==1.4.5
lmfit==1.2.2
locket==1.0.0
MarkupSafe==2.1.3
matplotlib==3.8.0
matplotlib-inline==0.1.6
msgpack==1.0.6
nest-asyncio==1.5.8
numpy==1.26.0
packaging==23.1
pandas==2.1.1
parso==0.8.3
partd==1.4.0
pickleshare==0.7.5
Pillow==10.0.1
platformdirs==3.10.0
prompt-toolkit==3.0.39
psutil==5.9.5
pure-eval==0.2.2
Pygments==2.16.1
pymongo==4.5.0
pyparsing==3.1.1
python-dateutil==2.8.2
pytz==2023.3.post1
pywin32==306
PyYAML==6.0.1
pyzmq==25.1.1
scipy==1.11.2
six==1.16.0
sortedcontainers==2.4.0
stack-data==0.6.2
tblib==2.0.0
toolz==0.12.0
tornado==6.3.3
traitlets==5.10.0
typing_extensions==4.8.0
tzdata==2023.3
uncertainties==3.1.7
urllib3==2.0.5
wcwidth==0.2.6
xarray==2023.8.0
xarray-mongodb==0.2.1
xrft==1.0.1
xyzservices==2023.7.0
zict==3.0.0
zipp==3.17.0

1117
testLoadMongoDB.ipynb
File diff suppressed because it is too large
