Merged latest dev
HagaiHargil committed Aug 13, 2019
2 parents 5828581 + 6233eda commit 8626189
Showing 33 changed files with 4,159 additions and 790 deletions.
4 changes: 4 additions & 0 deletions .style.yapf
@@ -0,0 +1,4 @@
+[style]
+based_on_style = google
+spaces_before_comment = 8,16,24,32,40,48,56,64,72,80
+column_limit = 120
6 changes: 6 additions & 0 deletions .yapfignore
@@ -0,0 +1,6 @@
+# We mostly just want to run yapf on the module code
+docs/
+demos/obsolete/
+sandbox/
+SLURM/
+use_cases/
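
Taken together, these two new files wire yapf into the repository: the [style] block selects Google style with a 120-character line limit and trailing comments aligned to every eighth column (which is what drives both the line joins and the comment-realignment hunks in caiman/cluster.py below), while .yapfignore keeps the formatter away from docs, obsolete demos and one-off scripts. As a minimal sketch of exercising the config programmatically — assuming yapf is installed and a checkout with these files at the repo root:

    # Sketch: check one module against the committed .style.yapf.
    # FormatCode returns the reformatted source plus a flag saying
    # whether anything changed.
    from yapf.yapflib.yapf_api import FormatCode

    with open('caiman/cluster.py') as f:
        source = f.read()

    formatted, changed = FormatCode(source, style_config='.style.yapf')
    print('needs reformatting' if changed else 'already clean')

On the command line, `yapf -r -i .` applies the same style in place; recursive runs are, as far as I know, where .yapfignore is consulted.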
2 changes: 1 addition & 1 deletion README.md
@@ -146,7 +146,7 @@ A list of known issues can be found [here](https://github.com/flatironinstitute/

## Documentation & Wiki

-Documentation of the code can be found [here](http://flatironinstitute.github.io/CaImAn/).
+Documentation of the code can be found [here](https://caiman.readthedocs.io/en/master/).
Moreover, our [wiki page](https://github.com/flatironinstitute/CaImAn/wiki) covers some aspects of the code.

### Installation for behavioral analysis
2 changes: 1 addition & 1 deletion caiman/base/movies.py
@@ -1189,7 +1189,7 @@ def load(file_name:Union[str,List[str]], fr:float=30, start_time:float=0, meta_d
"""
# case we load movie from file
if max(top, bottom, left, right) > 0 and type(file_name) is str:
-file_name = [file_name] # type: ignore # mypy doesn't like that this changes type # type: ignore # mypy doesn't like that this changes type # type: ignore # mypy doesn't like that this changes type # type: ignore # mypy doesn't like that this changes type # type: ignore # mypy doesn't like that this changes type
+file_name = [file_name] # type: ignore # mypy doesn't like that this changes type

if type(file_name) is list:
if shape is not None:
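
The deduplicated comment sits in caiman.base.movies.load: when any crop margin is nonzero, a single filename is rewrapped as a one-element list so the list-handling branch below can serve both call styles, which is what mypy objects to. A hedged sketch of the triggering call — the movie name is hypothetical, and the crop keywords are inferred from the max(top, bottom, left, right) test in the hunk:

    import caiman as cm

    # Passing a str filename together with a nonzero crop margin makes
    # load() rewrap it as [filename] -- the line carrying the
    # "# type: ignore" above.
    m = cm.load('example_movie.tif', fr=30, top=10, bottom=10, left=5, right=5)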
9 changes: 5 additions & 4 deletions caiman/base/rois.py
@@ -22,7 +22,7 @@
from past.utils import old_div
from scipy.ndimage.filters import gaussian_filter
from scipy.ndimage import label, center_of_mass
-from skimage.morphology import remove_small_objects, remove_small_holes, dilation
+from skimage.morphology import remove_small_objects, remove_small_holes, dilation, closing
import scipy
from scipy import ndimage as ndi
from scipy.optimize import linear_sum_assignment
@@ -75,6 +75,7 @@ def com(A:np.ndarray, d1:int, d2:int, d3:Optional[int]=None) -> np.array:
np.outer(np.ones(d3), np.outer(np.arange(d2), np.ones(d1)).ravel()).ravel(),
np.outer(np.arange(d3), np.outer(np.ones(d2), np.ones(d1)).ravel()).ravel()],
dtype=A.dtype)

cm = (Coor * A / A.sum(axis=0)).T
return np.array(cm)

@@ -108,14 +109,14 @@ def extract_binary_masks_from_structural_channel(Y, min_area_size:int=30, min_ho
mean image used to detect cell boundaries
"""

-mR = Y.mean(axis=0)
+mR = Y.mean(axis=0) if Y.ndim == 3 else Y
img = cv2.blur(mR, (gSig, gSig))
img = (img - np.min(img)) / (np.max(img) - np.min(img)) * 255.
img = img.astype(np.uint8)

th = cv2.adaptiveThreshold(img, np.max(
img), cv2.ADAPTIVE_THRESH_GAUSSIAN_C, cv2.THRESH_BINARY, gSig, 0)
-th = remove_small_holes(th > 0, min_size=min_hole_size)
+th = remove_small_holes(th > 0, area_threshold=min_hole_size)
th = remove_small_objects(th, min_size=min_area_size)
areas = label(th)

@@ -126,7 +127,7 @@ def extract_binary_masks_from_structural_channel(Y, min_area_size:int=30, min_ho
if expand_method == 'dilation':
temp = dilation(temp, selem=selem)
elif expand_method == 'closing':
-temp = dilation(temp, selem=selem)
+temp = closing(temp, selem=selem)

A[:, i] = temp.flatten('F')

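
Two behavioral fixes hide among these hunks: remove_small_holes is now called with area_threshold (skimage renamed the old min_size argument for this function, since it measures hole area rather than object size), and the expand_method == 'closing' branch previously ran dilation a second time instead of the closing it advertised. A toy illustration of the difference, using plain skimage primitives on a made-up mask:

    import numpy as np
    from skimage.morphology import dilation, closing, disk

    mask = np.zeros((9, 9), dtype=bool)
    mask[2:7, 2:7] = True
    mask[4, 4] = False                  # a one-pixel hole inside the ROI

    selem = disk(1)
    # dilation grows the ROI outward; closing fills the small hole while
    # leaving the outer boundary essentially unchanged.
    print(dilation(mask, selem).sum())  # larger footprint than the input
    print(closing(mask, selem).sum())   # hole filled, no net growth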
5 changes: 2 additions & 3 deletions caiman/base/timeseries.py
@@ -129,15 +129,14 @@ def save(self,
var_name_hdf5='mov',
sess_desc='some_description',
identifier='some identifier',
-exp_desc='experiment description',
imaging_plane_description='some imaging plane description',
emission_lambda=520.0,
indicator='OGB-1',
location='brain',
starting_time=0.,
experimenter='Dr Who',
-lab_name='',
-institution='',
+lab_name=None,
+institution=None,
experiment_description='Experiment Description',
session_id='Session ID'):
"""
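
The save() signature changes are all about NWB metadata: the unused exp_desc keyword is dropped, and lab_name/institution now default to None so unknown metadata is omitted rather than written as an empty string. A hedged sketch of a call with the new defaults — file names and metadata values are invented, the keyword names are the ones visible in this hunk, and the assumption that a .nwb extension selects the NWB writer comes from context rather than from this diff:

    import caiman as cm

    m = cm.load('example_movie.tif')            # hypothetical input file
    m.save('example_movie.nwb',
           imaging_plane_description='layer 2/3 somata',
           emission_lambda=520.0,
           indicator='OGB-1',
           location='brain',
           starting_time=0.,
           experimenter='Dr Who')               # lab_name/institution omitted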
109 changes: 61 additions & 48 deletions caiman/cluster.py
@@ -1,6 +1,5 @@
#!/usr/bin/env python
# -*- coding: utf-8 -*-

""" functions related to the creation and management of the cluster
We put arrays on disk as raw bytes, extending along the first dimension.
@@ -40,7 +39,12 @@

logger = logging.getLogger(__name__)

-def extract_patch_coordinates(dims:Tuple, rf:Union[List,Tuple], stride:Union[List[int],Tuple], border_pix:int=0, indices=[slice(None)]*2) -> Tuple[List, List]:
+
+def extract_patch_coordinates(dims: Tuple,
+                              rf: Union[List, Tuple],
+                              stride: Union[List[int], Tuple],
+                              border_pix: int = 0,
+                              indices=[slice(None)] * 2) -> Tuple[List, List]:
"""
Partition the FOV in patches
and return the indexed in 2D and 1D (flatten, order='F') formats
@@ -58,25 +62,24 @@ def extract_patch_coordinates(dims:Tuple, rf:Union[List,Tuple], stride:Union[Lis

sl_start = [0 if sl.start is None else sl.start for sl in indices]
sl_stop = [dim if sl.stop is None else sl.stop for (sl, dim) in zip(indices, dims)]
-sl_step = [1 for sl in indices] # not used
+sl_step = [1 for sl in indices]        # not used
dims_large = dims
dims = np.minimum(np.array(dims) - border_pix, sl_stop) - np.maximum(border_pix, sl_start)

coords_flat = []
shapes = []
-iters = [list(range(rf[i], dims[i] - rf[i], 2 * rf[i] - stride[i])) + [dims[i] - rf[i]]
-         for i in range(len(dims))]
+iters = [list(range(rf[i], dims[i] - rf[i], 2 * rf[i] - stride[i])) + [dims[i] - rf[i]] for i in range(len(dims))]

coords = np.empty(list(map(len, iters)) + [len(dims)], dtype=np.object)
for count_0, xx in enumerate(iters[0]):
coords_x = np.arange(xx - rf[0], xx + rf[0] + 1)
coords_x = coords_x[(coords_x >= 0) & (coords_x < dims[0])]
-coords_x += border_pix*0 + np.maximum(sl_start[0], border_pix)
+coords_x += border_pix * 0 + np.maximum(sl_start[0], border_pix)

for count_1, yy in enumerate(iters[1]):
coords_y = np.arange(yy - rf[1], yy + rf[1] + 1)
coords_y = coords_y[(coords_y >= 0) & (coords_y < dims[1])]
-coords_y += border_pix*0 + np.maximum(sl_start[1], border_pix)
+coords_y += border_pix * 0 + np.maximum(sl_start[1], border_pix)

if len(dims) == 2:
idxs = np.meshgrid(coords_x, coords_y)
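
The iters expression above encodes the whole patch layout: along each axis, patch centers advance in steps of 2 * rf - stride starting at rf, and one final center flush with the far border is appended so the FOV is fully covered. A self-contained sketch with made-up numbers:

    # Patch centers along one axis of length d, half-width rf, overlap stride.
    d, rf, stride = 128, 16, 8
    centers = list(range(rf, d - rf, 2 * rf - stride)) + [d - rf]
    patches = [(c - rf, c + rf) for c in centers]
    print(centers)    # [16, 40, 64, 88, 112]
    print(patches)    # [(0, 32), (24, 56), (48, 80), (72, 104), (96, 128)]
    # adjacent patches overlap by exactly `stride` pixels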
@@ -86,7 +89,7 @@ def extract_patch_coordinates(dims:Tuple, rf:Union[List,Tuple], stride:Union[Lis

coords_ = np.ravel_multi_index(idxs, dims_large, order='F')
coords_flat.append(coords_.flatten())
-else: # 3D data
+else:        # 3D data

if border_pix > 0:
raise Exception(
@@ -109,7 +112,8 @@ def extract_patch_coordinates(dims:Tuple, rf:Union[List,Tuple], stride:Union[Lis


#%%
-def apply_to_patch(mmap_file, shape:Tuple[Any,Any,Any], dview, rf, stride, function, *args, **kwargs) -> Tuple[List,Any,Tuple]:
+def apply_to_patch(mmap_file, shape: Tuple[Any, Any, Any], dview, rf, stride, function, *args,
+                   **kwargs) -> Tuple[List, Any, Tuple]:
"""
apply function to patches in parallel or not
@@ -152,11 +156,9 @@ def apply_to_patch(mmap_file, shape:Tuple[Any,Any,Any], dview, rf, stride, funct
stride1 = stride
stride2 = stride

-idx_flat, idx_2d = extract_patch_coordinates(
-    (d1, d2), rf=(rf1, rf2), stride=(stride1, stride2))
+idx_flat, idx_2d = extract_patch_coordinates((d1, d2), rf=(rf1, rf2), stride=(stride1, stride2))

-shape_grid = tuple(np.ceil(
-    (d1 * 1. / (rf1 * 2 - stride1), d2 * 1. / (rf2 * 2 - stride2))).astype(np.int))
+shape_grid = tuple(np.ceil((d1 * 1. / (rf1 * 2 - stride1), d2 * 1. / (rf2 * 2 - stride2))).astype(np.int))
if d1 <= rf1 * 2:
shape_grid = (1, shape_grid[1])
if d2 <= rf2 * 2:
@@ -167,8 +169,7 @@ def apply_to_patch(mmap_file, shape:Tuple[Any,Any,Any], dview, rf, stride, funct
args_in = []

for id_f, id_2d in zip(idx_flat[:], idx_2d[:]):
-args_in.append((mmap_file.filename, id_f,
-                id_2d, function, args, kwargs))
+args_in.append((mmap_file.filename, id_f, id_2d, function, args, kwargs))

logger.debug("Flat index is of length " + str(len(idx_flat)))
if dview is not None:
@@ -184,19 +185,20 @@ def apply_to_patch(mmap_file, shape:Tuple[Any,Any,Any], dview, rf, stride, funct

file_res = list(map(function_place_holder, args_in))
return file_res, idx_flat, shape_grid


#%%


-def function_place_holder(args_in:Tuple) -> np.ndarray:
+def function_place_holder(args_in: Tuple) -> np.ndarray:
#todo: todocument

file_name, idx_, shapes, function, args, kwargs = args_in
Yr, _, _ = load_memmap(file_name)
Yr = Yr[idx_, :]
Yr.filename = file_name
_, T = Yr.shape
-Y = np.reshape(Yr, (shapes[1], shapes[0], T),
-               order='F').transpose([2, 0, 1])
+Y = np.reshape(Yr, (shapes[1], shapes[0], T), order='F').transpose([2, 0, 1])
[T, d1, d2] = Y.shape

res_fun = function(Y, *args, **kwargs)
@@ -208,10 +210,11 @@ def function_place_holder(args_in:Tuple) -> np.ndarray:

return res_fun


#%%


-def start_server(slurm_script:str=None, ipcluster:str="ipcluster", ncpus:int=None) -> None:
+def start_server(slurm_script: str = None, ipcluster: str = "ipcluster", ncpus: int = None) -> None:
"""
programmatically start the ipyparallel server
@@ -220,7 +223,7 @@ def start_server(slurm_script:str=None, ipcluster:str="ipcluster", ncpus:int=Non
number of processors
ipcluster : str
-ipcluster binary file name; requires 4 path separators on Windows. ipcluster="C:\\\\Anaconda2\\\\Scripts\\\\ipcluster.exe"
+ipcluster binary file name; requires 4 path separators on Windows. ipcluster="C:\\\\Anaconda3\\\\Scripts\\\\ipcluster.exe"
Default: "ipcluster"
"""
logger.info("Starting cluster...")
@@ -230,21 +233,21 @@ def start_server(slurm_script:str=None, ipcluster:str="ipcluster", ncpus:int=Non
if slurm_script is None:

if ipcluster == "ipcluster":
-subprocess.Popen(
-    "ipcluster start -n {0}".format(ncpus), shell=True, close_fds=(os.name != 'nt'))
+subprocess.Popen("ipcluster start -n {0}".format(ncpus), shell=True, close_fds=(os.name != 'nt'))
else:
-subprocess.Popen(shlex.split(
-    "{0} start -n {1}".format(ipcluster, ncpus)), shell=True, close_fds=(os.name != 'nt'))
+subprocess.Popen(shlex.split("{0} start -n {1}".format(ipcluster, ncpus)),
+                 shell=True,
+                 close_fds=(os.name != 'nt'))
time.sleep(1.5)
# Check that all processes have started
client = ipyparallel.Client()
time.sleep(1.5)
while len(client) < ncpus:
sys.stdout.write(".") # Give some visual feedback of things starting
sys.stdout.flush() # (de-buffered)
sys.stdout.write(".") # Give some visual feedback of things starting
sys.stdout.flush() # (de-buffered)
time.sleep(0.5)
logger.debug('Making sure everything is up and running')
-client.direct_view().execute('__a=1', block=True) # when done on all, we're set to go
+client.direct_view().execute('__a=1', block=True)        # when done on all, we're set to go
else:
shell_source(slurm_script)
pdir, profile = os.environ['IPPPDIR'], os.environ['IPPPROFILE']
@@ -256,18 +259,18 @@ def start_server(slurm_script:str=None, ipcluster:str="ipcluster", ncpus:int=Non
c.close()
sys.stdout.write("start_server: done\n")

-def shell_source(script:str) -> None:
+
+def shell_source(script: str) -> None:
""" Run a source-style bash script, copy resulting env vars to current process. """
# XXX This function is weird and maybe not a good idea. People easily might expect
# it to handle conditionals. Maybe just make them provide a key-value file
#introduce echo to indicate the end of the output
pipe = subprocess.Popen(". %s; env; echo 'FINISHED_CLUSTER'" %
script, stdout=subprocess.PIPE, shell=True)
pipe = subprocess.Popen(". %s; env; echo 'FINISHED_CLUSTER'" % script, stdout=subprocess.PIPE, shell=True)

env = dict()
while True:
line = pipe.stdout.readline().decode('utf-8').rstrip()
-if 'FINISHED_CLUSTER' in line: # find the keyword set above to determine the end of the output stream
+if 'FINISHED_CLUSTER' in line:        # find the keyword set above to determine the end of the output stream
break
logger.debug("shell_source parsing line[" + str(line) + "]")
lsp = str(line).split("=", 1)
@@ -277,7 +280,8 @@ def shell_source(script:str) -> None:
os.environ.update(env)
pipe.stdout.close()

-def stop_server(ipcluster:str='ipcluster', pdir:str=None, profile:str=None, dview=None) -> None:
+
+def stop_server(ipcluster: str = 'ipcluster', pdir: str = None, profile: str = None, dview=None) -> None:
"""
programmatically stops the ipyparallel server
@@ -315,7 +319,7 @@ def stop_server(ipcluster:str='ipcluster', pdir:str=None, profile:str=None, dvie
try:
shutil.rmtree('./log/')
except:
-logger.info('creating log folder') # FIXME Not what this means
+logger.info('creating log folder')        # FIXME Not what this means

files = glob.glob('*.log')
os.mkdir('./log')
Expand All @@ -325,11 +329,15 @@ def stop_server(ipcluster:str='ipcluster', pdir:str=None, profile:str=None, dvie

else:
if ipcluster == "ipcluster":
-proc = subprocess.Popen(
-    "ipcluster stop", shell=True, stderr=subprocess.PIPE, close_fds=(os.name != 'nt'))
+proc = subprocess.Popen("ipcluster stop",
+                        shell=True,
+                        stderr=subprocess.PIPE,
+                        close_fds=(os.name != 'nt'))
else:
proc = subprocess.Popen(shlex.split(ipcluster + " stop"),
-                        shell=True, stderr=subprocess.PIPE, close_fds=(os.name != 'nt'))
+                        shell=True,
+                        stderr=subprocess.PIPE,
+                        close_fds=(os.name != 'nt'))

line_out = proc.stderr.readline()
if b'CRITICAL' in line_out:
@@ -348,10 +356,15 @@ def stop_server(ipcluster:str='ipcluster', pdir:str=None, profile:str=None, dvie
proc.stderr.close()

logger.info("stop_cluster(): done")


#%%


-def setup_cluster(backend:str='multiprocessing', n_processes:int=None, single_thread:bool=False, ignore_preexisting:bool=False) -> Tuple[Any, Any, Optional[int]]:
+def setup_cluster(backend: str = 'multiprocessing',
+                  n_processes: int = None,
+                  single_thread: bool = False,
+                  ignore_preexisting: bool = False) -> Tuple[Any, Any, Optional[int]]:
"""Setup and/or restart a parallel cluster.
Args:
backend: str
@@ -386,7 +399,7 @@ def setup_cluster(backend:str='multiprocessing', n_processes:int=None, single_th
stop_server()
except:
logger.debug('Nothing to stop')
-slurm_script = '/mnt/home/agiovann/SOFTWARE/CaImAn/SLURM/slurmStart.sh'
+slurm_script = '/mnt/home/agiovann/SOFTWARE/CaImAn/SLURM/slurmStart.sh' # FIXME: Make this a documented environment variable
logger.info([str(n_processes), slurm_script])
start_server(slurm_script=slurm_script, ncpus=n_processes)
pdir, profile = os.environ['IPPPDIR'], os.environ['IPPPROFILE']
Expand All @@ -397,7 +410,7 @@ def setup_cluster(backend:str='multiprocessing', n_processes:int=None, single_th
stop_server()
start_server(ncpus=n_processes)
c = Client()
-logger.info('Started ipyparallel cluster: Using ' + str(len(c)) + ' processes')
+logger.info(f'Started ipyparallel cluster: Using {len(c)} processes')
dview = c[:len(c)]

elif (backend == 'multiprocessing') or (backend == 'local'):
@@ -411,16 +424,16 @@ def setup_cluster(backend:str='multiprocessing', n_processes:int=None, single_th
'A cluster is already runnning. Terminate with dview.terminate() if you want to restart.')
if (platform.system() == 'Darwin') and (sys.version_info > (3, 0)):
try:
-if 'kernel' in get_ipython().trait_names(): # type: ignore
-    # If you're on OSX and you're running under Jupyter or Spyder,
-    # which already run the code in a forkserver-friendly way, this
-    # can eliminate some setup and make this a reasonable approach.
-    # Otherwise, seting VECLIB_MAXIMUM_THREADS=1 or using a different
-    # blas/lapack is the way to avoid the issues.
-    # See https://github.com/flatironinstitute/CaImAn/issues/206 for more
-    # info on why we're doing this (for now).
+if 'kernel' in get_ipython().trait_names():        # type: ignore
+    # If you're on OSX and you're running under Jupyter or Spyder,
+    # which already run the code in a forkserver-friendly way, this
+    # can eliminate some setup and make this a reasonable approach.
+    # Otherwise, seting VECLIB_MAXIMUM_THREADS=1 or using a different
+    # blas/lapack is the way to avoid the issues.
+    # See https://github.com/flatironinstitute/CaImAn/issues/206 for more
+    # info on why we're doing this (for now).
multiprocessing.set_start_method('forkserver', force=True)
-except: # If we're not running under ipython, don't do anything.
+except:        # If we're not running under ipython, don't do anything.
pass
c = None

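
setup_cluster is the usual entry point for everything in this file; based on the signature above and the pattern used in the CaImAn demos (not shown in this diff), a typical session looks roughly like this:

    import caiman as cm

    # n_processes=None lets CaImAn pick a worker count from the CPU count.
    c, dview, n_processes = cm.cluster.setup_cluster(backend='multiprocessing',
                                                     n_processes=None,
                                                     single_thread=False)
    try:
        pass    # patch-parallel processing using dview goes here
    finally:
        cm.stop_server(dview=dview)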
(Diff truncated: the remaining 26 of the 33 changed files are not shown here.)
