
Commit 00f843f
Author: Nick Holschuh
Commit message: Functions generated during the 2023-24 Antarctic Field Season
1 parent: fff971a

19 files changed (+481 -63 lines)

Untitled.ipynb

File mode changed: 100644 → 100755

calculate_flowlines.py

File mode changed: 100644 → 100755
+203 -33
@@ -1,7 +1,22 @@
 import numpy as np
 import matplotlib.pyplot as plt
+import tqdm
+import xarray as xr
 
-def calculate_flowlines(x,y,u,v,seed_points,max_error=0.00001):
+################ This is the import statement required to reference scripts within the package
+import os,sys,glob
+ndh_tools_path_opts = [
+    '/mnt/data01/Code/',
+    '/mnt/l/mnt/data01/Code/',
+    '/home/common/HolschuhLab/Code/'
+]
+for i in ndh_tools_path_opts:
+    if os.path.isdir(i): sys.path.append(i)    # these entries are directories, so isdir is the relevant test
+################################################################################################
+
+import NDH_Tools as ndh
+
+def calculate_flowlines(input_xr,seed_points,uv_varnames=['u','v'],xy_varnames=['x','y'],steps=20000,ds=2,forward0_both1_backward2=1):
     """
     % (C) Nick Holschuh - Amherst College -- 2022 ([email protected])
     %
@@ -10,7 +25,7 @@ def calculate_flowlines(x,y,u,v,seed_points,max_error=0.00001):
     %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
     % The inputs are:
     %
-    % input_array -- array of data to analyze
+    % input_xr -- xarray dataset that contains the flow vector components (u and v) to trace
     %
     %%%%%%%%%%%%%%%
     % The outputs are:
@@ -20,34 +35,189 @@ def calculate_flowlines(x,y,u,v,seed_points,max_error=0.00001):
     %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
     """
 
-    ################# This uses a modified plt.streamline to pass through a user-editable keyword
-    ################# argument "max_error", which goes into the interpolater to guarantee
-    ################# accurate streamline calculation. Copy this version of streamplot
-    ################# into your matplotlib directory to enable the use of streamline
-    ################# calculation from NDH_Tools
-
-
-    sls = []
-
-    if isinstance(seed_points,list):
-        seed_points = np.array(seed_points)
-
-    if len(seed_points.shape) == 1:
-        seed_points = np.expand_dims(seed_points,axis=0)
-
-    fig = plt.figure()
-
-    for ind0, sp in enumerate(seed_points[:,0]):
-        streamlines = plt.streamplot(x,y,u,v,start_points=[seed_points[ind0,:]], max_error=max_error)
-
-
-        ########### Here we extract the coordinate information along the streamline
-        sl = [streamlines.lines.get_paths()[0].vertices[0]]
-        for i in streamlines.lines.get_paths():
-            sl.append(i.vertices[1])
-
-        sls.append(np.array(sl))
-
-    plt.close(fig)
-
-    return sls
+    ##################### Here, we standardize the naming convention within the xarray object
+    input_xr = input_xr.rename({xy_varnames[0]:'x',xy_varnames[1]:'y'})
+    uv_scalar = np.sqrt(input_xr[uv_varnames[0]].values**2 + input_xr[uv_varnames[1]].values**2)
+    input_xr[uv_varnames[0]] = (('y','x'),input_xr[uv_varnames[0]].values/uv_scalar)
+    input_xr[uv_varnames[1]] = (('y','x'),input_xr[uv_varnames[1]].values/uv_scalar)
+
+
+    #################### We initialize the objects for the flowline calculation
+    flowlines = []
+
+    #################### Here is the forward calculation
+    if forward0_both1_backward2 <= 1:
+        temp_xs = np.expand_dims(seed_points[:,0],0)
+        temp_ys = np.expand_dims(seed_points[:,1],0)
+
+        for ind0 in tqdm.tqdm(np.arange(steps)):
+            x_search = xr.DataArray(temp_xs[-1,:],dims=['vector_index'])
+            y_search = xr.DataArray(temp_ys[-1,:],dims=['vector_index'])
+            new_u = input_xr[uv_varnames[0]].sel(x=x_search,y=y_search,method='nearest')
+            new_v = input_xr[uv_varnames[1]].sel(x=x_search,y=y_search,method='nearest')
+
+            ######### This is an order of magnitude slower
+            #new_u = input_xr[uv_varnames[0]].interp(x=x_search,y=y_search)
+            #new_v = input_xr[uv_varnames[1]].interp(x=x_search,y=y_search)
+
+            temp_xs = np.concatenate([temp_xs,temp_xs[-1:,:]+new_u.values.T*ds])
+            temp_ys = np.concatenate([temp_ys,temp_ys[-1:,:]+new_v.values.T*ds])
+
+        xs = temp_xs
+        ys = temp_ys
+    else:
+        xs = np.empty([0,len(seed_points[:,0])])    # zero-row arrays, so the backward pass concatenates cleanly for any number of seeds
+        ys = np.empty([0,len(seed_points[:,0])])
+
+
+    #################### Here is the backward calculation
+    if forward0_both1_backward2 >= 1:
+        temp_xs = np.expand_dims(seed_points[:,0],0)
+        temp_ys = np.expand_dims(seed_points[:,1],0)
+
+        for ind0 in tqdm.tqdm(np.arange(steps)):
+            x_search = xr.DataArray(temp_xs[-1,:],dims=['vector_index'])
+            y_search = xr.DataArray(temp_ys[-1,:],dims=['vector_index'])
+            new_u = input_xr[uv_varnames[0]].sel(x=x_search,y=y_search,method='nearest')
+            new_v = input_xr[uv_varnames[1]].sel(x=x_search,y=y_search,method='nearest')
+
+            ######### This is an order of magnitude slower
+            #new_u = input_xr[uv_varnames[0]].interp(x=x_search,y=y_search)
+            #new_v = input_xr[uv_varnames[1]].interp(x=x_search,y=y_search)
+
+            temp_xs = np.concatenate([temp_xs,temp_xs[-1:,:]-new_u.values.T*ds])
+            temp_ys = np.concatenate([temp_ys,temp_ys[-1:,:]-new_v.values.T*ds])
+
+        xs = np.concatenate([np.flipud(temp_xs),xs])
+        ys = np.concatenate([np.flipud(temp_ys),ys])
+
+
+
+    flowlines = []
+    for ind0 in np.arange(len(xs[0,:])):
+        xy = np.stack([xs[:,ind0],ys[:,ind0]]).T
+        flowlines.append(xy)
+
+    return flowlines
+
+##########################################################################################
+#### This version of the code doesn't work quite right...
+##########################################################################################
+##def calculate_flowlines(x,y,u,v,seed_points,max_error=0.00001,retry_count_threshold=10):
+##    """
+##    % (C) Nick Holschuh - Amherst College -- 2022 ([email protected])
+##    %
+##    % This function prints out the minimum and maximum values of an array
+##    %
+##    %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
+##    % The inputs are:
+##    %
+##    % input_array -- array of data to analyze
+##    %
+##    %%%%%%%%%%%%%%%
+##    % The outputs are:
+##    %
+##    % output -- the min and max in a 1x2 array
+##    %
+##    %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
+##    """
+##
+##    ################# This uses a modified plt.streamline to pass through a user-editable keyword
+##    ################# argument "max_error", which goes into the interpolater to guarantee
+##    ################# accurate streamline calculation. Copy the updated version of streamplot
+##    ################# into your matplotlib directory to enable the use of streamline
+##    ################# calculation from NDH_Tools (in streamline.py, which calls _integrate_rk12)
+##
+##    if isinstance(seed_points,list):
+##        seed_points = np.array(seed_points)
+##
+##    if len(seed_points.shape) == 1:
+##        seed_points = np.expand_dims(seed_points,axis=0)
+##
+##    ###################### Initialize the returned object
+##    final_sls = []
+##    for ind0 in np.arange(len(seed_points[:,0])):
+##        final_sls.append([])
+##
+##    retry_count = 0
+##    retry_inds = np.arange(0,len(seed_points[:,0]))
+##    seed_subset = seed_points
+##
+##    while len(retry_inds) > 0:
+##
+##        sls = []
+##
+##        ################# Calculate the streamlines for all unfound seed points
+##        fig = plt.figure()
+##        if retry_count == 0:
+##            print('The initial streamline calculation -- this can be slow. Finding '+str(len(seed_subset[:,0]))+' streamlines')
+##        try:
+##            streamlines = plt.streamplot(x,y,u,v,start_points=seed_points, max_error=max_error, density=100)
+##        except:
+##            streamlines = plt.streamplot(x,y,u,v,start_points=seed_points, density=100)
+##            if retry_count == 0:
+##                print('Note: You need to update your matplotlib streamline.py and reduce the max error for this to work properly')
+##        plt.close(fig)
+##
+##        ################# Here we extract the coordinate info from the streamlines
+##        sl_deconstruct = []
+##        for i in streamlines.lines.get_paths():
+##            sl_deconstruct.append(i.vertices[1])
+##        sl_deconstruct = np.array(sl_deconstruct)
+##
+##        ################ Here we separate the streamlines based on large breaks in distance
+##        sl_dist = ndh.distance_vector(sl_deconstruct[:,0],sl_deconstruct[:,1],1)
+##        dist_mean = np.mean(sl_dist)
+##        breaks = np.where(sl_dist > (dist_mean+1)*50)[0]
+##        if len(breaks) > 0:
+##            breaks = np.concatenate([np.array([-1]),breaks,np.array([len(sl_deconstruct[:,0])])])+1
+##        else:
+##            breaks = np.array([0,len(sl_deconstruct[:,0])+1])
+##
+##        for ind0 in np.arange(len(breaks)-1):
+##            sls.append(sl_deconstruct[breaks[ind0]:breaks[ind0+1],:])
+##
+##        ################ Here we identify which streamline goes with which seed_point
+##        matching = []
+##        for ind0 in np.arange(len(seed_subset[:,0])):
+##            dists = []
+##            for ind1,sl in enumerate(sls):
+##                comp_vals = ndh.find_nearest_xy(sl,seed_subset[ind0,:])
+##                dists.append(comp_vals['distance'][0])
+##            best = np.where(np.array(dists) < 1e-8)[0]
+##            try:
+##                matching.append(best[0])
+##            except:
+##                matching.append(-1)
+##
+##        ################# populate the final object
+##        for ind0,i in enumerate(matching):
+##            if i != -1:
+##                final_sls[retry_inds[ind0]] = sls[i]
+##
+##        ################# Finally, we identify the new set of streamlines that need to be computed, based on which have no match
+##        new_retry_inds = np.where(np.array(matching) == -1)[0]
+##        seed_subset = seed_points[retry_inds[new_retry_inds],:]
+##        retry_inds = retry_inds[new_retry_inds]
+##
+##        if len(retry_inds) > 0:
+##            retry_count = retry_count+1
+##            print('Recalculating for nearly overlapping points -- try '+str(retry_count)+'. Finding '+str(len(seed_subset[:,0]))+' streamlines')
+##
+##        if retry_count > retry_count_threshold:
+##            break
+##
+##    if 0:
+##        plt.figure()
+##        plt.plot(test_dist)
+##        plt.axhline(dist_median,c='orange')
+##
+##    if 0:
+##        plt.figure()
+##        plt.plot(test[:,0],test[:,1],c='blue')
+##        for i in final_sls:
+##            plt.plot(i[:,0],i[:,1],c='red')
+##        plt.plot(seed_points[:,0],seed_points[:,1],'o')
+##
+##
+##    return final_sls
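
For orientation, here is a minimal usage sketch of the rewritten calculate_flowlines. Everything in it is invented for illustration (the synthetic velocity grid, the names vel and seeds, the step counts), and it assumes the module and NDH_Tools are importable; only the signature comes from the diff above, which expects an xarray Dataset with u/v variables on x/y coordinates and an N x 2 array of (x,y) seed points.

import numpy as np
import xarray as xr
from calculate_flowlines import calculate_flowlines

# Hypothetical velocity field on a 10 km x 10 km grid
x = np.linspace(0,10000,201)
y = np.linspace(0,10000,201)
xx,yy = np.meshgrid(x,y)
vel = xr.Dataset({'u':(('y','x'),np.cos(yy/10000)),
                  'v':(('y','x'),np.sin(yy/10000))},
                 coords={'x':x,'y':y})

seeds = np.array([[2000.0,3000.0],[5000.0,5000.0]])   # N x 2 (x,y) seed points

# 500 steps of 50 map-units each way; forward0_both1_backward2=1 traces both directions
flowlines = calculate_flowlines(vel,seeds,steps=500,ds=50,forward0_both1_backward2=1)
for fl in flowlines:
    print(fl.shape)   # (2*steps+2, 2) array of flowline vertices per seed

Because the function normalizes the field to unit vectors, ds acts as a step length in map units, and the nearest-neighbor lookup simply clamps to the grid edge once a line leaves the domain.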

compare_list.py

File mode changed: 100644 → 100755

edgetrim_mask.py

File mode changed: 100644 → 100755

find_pixelcoords.py

File mode changed: 100644 → 100755
+11 -3
@@ -40,6 +40,7 @@ def find_pixelcoords(im_filename,original_width,original_height,im_pick_params=0
     import NDH_Tools as ndh
     import numpy as np
     import cv2
+    import tqdm
 
 
     im_handle = Image.open(im_filename)
@@ -50,16 +51,16 @@ def find_pixelcoords(im_filename,original_width,original_height,im_pick_params=0
     ######################### This method only works if the image is perfectly white outside of the axes
     if 0:
         im_frame = np.where(np_frame[:,:,3] == 255)
-
+
         cinds = ndh.minmax(im_frame[1])
         rinds = ndh.minmax(im_frame[0])
     else:
         ########################## This is meant to handle some spillover of lines and points outside the image
         row_sum = np.sum(np_frame[:,:,2] == 255,axis=1)
         col_sum = np.sum(np_frame[:,:,2] == 255,axis=0)
 
-        rinds = ndh.minmax(np.where(row_sum > np.mean(row_sum)))
-        cinds = ndh.minmax(np.where(col_sum > np.mean(col_sum)))
+        rinds = ndh.minmax(np.where(row_sum <= np.percentile(row_sum,80)-1))
+        cinds = ndh.minmax(np.where(col_sum <= np.percentile(col_sum,80)-1))
 
     xrange = np.linspace(0,original_width,cinds[1]-cinds[0])
     yrange = np.linspace(0,original_height,rinds[1]-rinds[0])
@@ -89,6 +90,12 @@ def find_pixelcoords(im_filename,original_width,original_height,im_pick_params=0
     ############ Here, we post-process the picks to deal with gaps / multiple layers, etc.
     #######################################################################################
     ########### Finally, we loop through the edge_trims and the picks, and pull out just the relevant info
+
+    #print('--- Total number of contoured objects to process: %d' %len(process_contours))
+    mod_step = 10**np.floor(np.log10(len(process_contours)/10))
+
+
+    #for ind2 in tqdm.tqdm(range(len(process_contours))):
     for ind2 in range(len(process_contours)):
 
         pick_img = np.zeros_like(process_im)
@@ -213,6 +220,7 @@ def find_pixelcoords(im_filename,original_width,original_height,im_pick_params=0
             pick_output.append(pick_temp)
         else:
             pick_output.append(pick_temp)
+
 
 
     return pick_output
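
To make the revised cropping heuristic concrete, here is a small self-contained sketch of the same percentile test on a synthetic frame (the array, sizes, and threshold mirror the diff above but are otherwise invented, and ndh.minmax is replaced by an explicit min/max):

import numpy as np

# Synthetic frame: white (255) margins surrounding a darker plotting area
frame = np.full((100,120),255)
frame[20:80,30:100] = 0                        # the "axes" region

row_sum = np.sum(frame == 255,axis=1)          # white-pixel count per row
col_sum = np.sum(frame == 255,axis=0)          # white-pixel count per column

# Margin rows/columns are almost entirely white, so they dominate the upper
# percentiles; anything at or below (80th percentile - 1) is kept as plot area
rows = np.where(row_sum <= np.percentile(row_sum,80)-1)[0]
cols = np.where(col_sum <= np.percentile(col_sum,80)-1)[0]
rinds = [rows.min(),rows.max()]                # stand-in for ndh.minmax
cinds = [cols.min(),cols.max()]
print(rinds,cinds)                             # [20, 79] and [30, 99]

Unlike a mean-based cutoff, a percentile cutoff tolerates a few lines or points spilling past the axes, which appears to be the motivation for the change.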

generate_pickingpdf.py

File mode changed: 100644 → 100755
+14 -11
@@ -71,20 +71,21 @@ def generate_pickingpdf(fn,picking_root_dir,frame_spacing=25,surf_dir='CSARP_sur
     fn_list[-3] = surf_dir
     fn2 = '/'.join(fn_list)
 
-    try:
-        surfdata = ndh.loadmat(fn2)
-        surf_dims = surfdata['surf']['y'][1].shape
-        bot_ind = ndh.find_nearest(data['Time'],np.max(surfdata['surf']['y'][1]))
-    except:
-        print(fn2+' could not be found')
-        fn2 = 0
-        bot_ind = {'index':[len(data['Time'])-25]}
+    #try:
+    surfdata = ndh.loadmat(fn2)
+    surf_dims = surfdata['surf']['y'][1].shape
+    bot_ind = ndh.find_nearest(data['Time'],np.array([np.max(surfdata['surf']['y'][1])]))
+    bot_ind['index'] = [np.min([bot_ind['index'][0]+150,len(data['Time'])])]
+    #except:
+    #    print(fn2+' could not be found')
+    #    fn2 = 0
+    #    bot_ind = {'index':[len(data['Time'])]}
 
     #### Now we loop through the frames we want to plot and generate an image for
     frame_print = np.arange(0,len(xy['x']),frame_spacing)
     for ind1,i in enumerate(frame_print):
         ndh.remove_image(ax,1,verbose=0)
-        ax.imshow(np.squeeze(np.log10(data['Tomo']['img'][:bot_ind['index'][0]+25,:,i])),cmap='bone_r')
+        ax.imshow(np.squeeze(np.log10(data['Tomo']['img'][:bot_ind['index'][0],:,i])),cmap='bone_r')
         ax.set_aspect('auto')
         if fn2 != 0:
             ndh.remove_line(ax,1,verbose=0)
@@ -95,7 +96,7 @@ def generate_pickingpdf(fn,picking_root_dir,frame_spacing=25,surf_dir='CSARP_sur
             pass
 
         plt.axis('off')
-        plt.savefig('%s%s/%s/Frame_%0.4d_fs_%0.2d_crop_%0.4d.png' %(picking_root_dir,seg,frame,i,frame_spacing,bot_ind['index'][0]+25))
+        plt.savefig('%s%s/%s/Frame_%0.4d_fs_%0.2d_crop_%0.4d.png' %(picking_root_dir,seg,frame,i,frame_spacing,bot_ind['index'][0]))
 
 
     print('Completed the image generation')
@@ -105,7 +106,7 @@ def generate_pickingpdf(fn,picking_root_dir,frame_spacing=25,surf_dir='CSARP_sur
 
     ########## This converts all the images to a single pdf
     pdfroot = picking_root_dir+'To_Pick/'+seg+'/'
-    pdfend = '%s_fs_%0.2d_crop_%0.4d.pdf' %(frame,frame_spacing,bot_ind['index'][0]+25)
+    pdfend = '%s_fs_%0.2d_crop_%0.4d.pdf' %(frame,frame_spacing,bot_ind['index'][0])
     pdfname = pdfroot+pdfend
 
     frames = '%s%s/%s/*.png' % (picking_root_dir,seg,frame)
@@ -145,7 +146,9 @@ def generate_pickingpdf(fn,picking_root_dir,frame_spacing=25,surf_dir='CSARP_sur
     max_num = len(file_list)
     seg = file_list[-1].split('/')[-2]
     froot = seg
+
     num_range = np.arange(1,max_num+1,1)
+    print('Images from '+str(max_num)+' files')
 
 
get_contour_data.py

100644100755
File mode changed.
