PyPI - celldetective - Versions diffs - 1.1.1.post3__py3-none-any.whl → 1.2.0__py3-none-any.whl - Mend

celldetective: 1.1.1.post3-py3-none-any.whl → 1.2.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (42) hide show

celldetective/__init__.py +2 -1
celldetective/__main__.py +17 -0
celldetective/extra_properties.py +62 -34
celldetective/gui/__init__.py +1 -0
celldetective/gui/analyze_block.py +2 -1
celldetective/gui/classifier_widget.py +18 -10
celldetective/gui/control_panel.py +57 -6
celldetective/gui/layouts.py +14 -11
celldetective/gui/neighborhood_options.py +21 -13
celldetective/gui/plot_signals_ui.py +39 -11
celldetective/gui/process_block.py +413 -95
celldetective/gui/retrain_segmentation_model_options.py +17 -4
celldetective/gui/retrain_signal_model_options.py +106 -6
celldetective/gui/signal_annotator.py +110 -30
celldetective/gui/signal_annotator2.py +2708 -0
celldetective/gui/signal_annotator_options.py +3 -1
celldetective/gui/survival_ui.py +15 -6
celldetective/gui/tableUI.py +248 -43
celldetective/io.py +598 -416
celldetective/measure.py +919 -969
celldetective/models/pair_signal_detection/blank +0 -0
celldetective/neighborhood.py +482 -340
celldetective/preprocessing.py +81 -61
celldetective/relative_measurements.py +648 -0
celldetective/scripts/analyze_signals.py +1 -1
celldetective/scripts/measure_cells.py +28 -8
celldetective/scripts/measure_relative.py +103 -0
celldetective/scripts/segment_cells.py +5 -5
celldetective/scripts/track_cells.py +4 -1
celldetective/scripts/train_segmentation_model.py +23 -18
celldetective/scripts/train_signal_model.py +33 -0
celldetective/segmentation.py +67 -29
celldetective/signals.py +402 -8
celldetective/tracking.py +8 -2
celldetective/utils.py +144 -12
{celldetective-1.1.1.post3.dist-info → celldetective-1.2.0.dist-info}/METADATA +8 -8
{celldetective-1.1.1.post3.dist-info → celldetective-1.2.0.dist-info}/RECORD +42 -38
{celldetective-1.1.1.post3.dist-info → celldetective-1.2.0.dist-info}/WHEEL +1 -1
tests/test_segmentation.py +1 -1
{celldetective-1.1.1.post3.dist-info → celldetective-1.2.0.dist-info}/LICENSE +0 -0
{celldetective-1.1.1.post3.dist-info → celldetective-1.2.0.dist-info}/entry_points.txt +0 -0
{celldetective-1.1.1.post3.dist-info → celldetective-1.2.0.dist-info}/top_level.txt +0 -0

celldetective/neighborhood.py CHANGED Viewed

@@ -8,17 +8,15 @@ from mahotas.features import haralick
 from scipy.ndimage import zoom
 import os
 import subprocess
-from celldetective.utils import rename_intensity_column, create_patch_mask, remove_redundant_features
+from celldetective.utils import contour_of_instance_segmentation, rename_intensity_column, create_patch_mask, remove_redundant_features, extract_identity_col
 from scipy.spatial.distance import cdist
-from celldetective.measure import contour_of_instance_segmentation
 from celldetective.io import locate_labels, get_position_pickle, get_position_table
 import re
 abs_path = os.sep.join([os.path.split(os.path.dirname(os.path.realpath(__file__)))[0], 'celldetective'])
-def set_live_status(setA,setB,status, not_status_option):
+def set_live_status(setA, setB, status, not_status_option):
 	"""
 	Updates the live status for cells in two datasets based on specified status columns and options.
@@ -48,45 +46,47 @@ def set_live_status(setA,setB,status, not_status_option):
 	"""
-	if status is None:
+	print(f"Provided statuses: {status}...")
+	if status is None or status==["live_status","live_status"] or status==[None,None]:
 		setA.loc[:,'live_status'] = 1
 		setB.loc[:,'live_status'] = 1
 		status = ['live_status', 'live_status']
 	elif isinstance(status,list):
 		assert len(status)==2,'Please provide only two columns to classify cells as alive or dead.'
-		if status[0] is None:
+		if status[0] is None or status[0]=='live_status':
 			setA.loc[:,'live_status'] = 1
 			status[0] = 'live_status'
-		elif status[0] is not None and isinstance(not_status_option,list):
-			setA.loc[setA[status[0]]==2,status[0]] = 1 #already happened events become event
+		elif status[0] is not None and isinstance(not_status_option, list):
+			setA.loc[setA[status[0]] == 2, status[0]] = 1  # already happened events become event
 			if not_status_option[0]:
 				setA.loc[:,'not_'+status[0]] = [not a if a==0 or a==1 else np.nan for a in setA.loc[:,status[0]].values]
 				status[0] = 'not_'+status[0]
-		if status[1] is None:
+		if status[1] is None or status[1]=='live_status':
 			setB.loc[:,'live_status'] = 1
 			status[1] = 'live_status'
-		elif status[1] is not None and isinstance(not_status_option,list):
-			setB.loc[setB[status[1]]==2,status[1]] = 1 #already happened events become event
+		elif status[1] is not None and isinstance(not_status_option, list):
+			setB.loc[setB[status[1]] == 2, status[1]] = 1  # already happened events become event
 			if not_status_option[1]:
-				setB.loc[:,'not_'+status[1]] = [not a if a==0 or a==1 else np.nan for a in setB.loc[:,status[1]].values]
-				status[1] = 'not_'+status[1]
+				setB.loc[:, 'not_' + status[1]] = [not a if a == 0 or a == 1 else np.nan for a in
+												   setB.loc[:, status[1]].values]
+				status[1] = 'not_' + status[1]
 		assert status[0] in list(setA.columns)
 		assert status[1] in list(setB.columns)
 	setA = setA.reset_index(drop=True)
-	setB = setB.reset_index(drop=True)
+	setB = setB.reset_index(drop=True)
 	return setA, setB, status
-def compute_attention_weight(dist_matrix, cut_distance, opposite_cell_status, opposite_cell_ids, axis=1, include_dead_weight=True):
+def compute_attention_weight(dist_matrix, cut_distance, opposite_cell_status, opposite_cell_ids, axis=1,
+							 include_dead_weight=True):
 	"""
 	Computes the attention weight for each cell based on its proximity to cells of an opposite type within a specified distance.
 	This function calculates the attention weight for cells by considering the distance to the cells of an opposite type
-	within a given cutoff distance. It optionally considers only the 'live' opposite cells based on their status. The function
+	within a given cutoff distance. It optionally considers only the 'live' opposite cells based on their status. The function
 	returns two arrays: one containing the attention weights and another containing the IDs of the closest opposite cells.
 	Parameters
@@ -117,34 +117,36 @@ def compute_attention_weight(dist_matrix, cut_distance, opposite_cell_status, op
 	closest_opposite = np.empty(dist_matrix.shape[axis])
 	for i in range(dist_matrix.shape[axis]):
-		if axis==1:
-			row = dist_matrix[:,i]
-		elif axis==0:
-			row = dist_matrix[i,:]
-		row[row==0.] = 1.0E06
-		nbr_opposite = len(row[row<=cut_distance])
+		if axis == 1:
+			row = dist_matrix[:, i]
+		elif axis == 0:
+			row = dist_matrix[i, :]
+		row[row == 0.] = 1.0E06
+		nbr_opposite = len(row[row <= cut_distance])
 		if not include_dead_weight:
-			stat = opposite_cell_status[np.where(row<=cut_distance)[0]]
-			nbr_opposite = len(stat[stat==1])
-			index_subpop = np.argmin(row[opposite_cell_status==1])
-			closest_opposite[i] = opposite_cell_ids[opposite_cell_status==1][index_subpop]
+			stat = opposite_cell_status[np.where(row <= cut_distance)[0]]
+			nbr_opposite = len(stat[stat == 1])
+			index_subpop = np.argmin(row[opposite_cell_status == 1])
+			closest_opposite[i] = opposite_cell_ids[opposite_cell_status == 1][index_subpop]
 		else:
 			closest_opposite[i] = opposite_cell_ids[np.argmin(row)]
-		if nbr_opposite>0:
-			weight = 1./float(nbr_opposite)
+		if nbr_opposite > 0:
+			weight = 1. / float(nbr_opposite)
 			weights[i] = weight
 	return weights, closest_opposite
-def distance_cut_neighborhood(setA, setB, distance, mode='two-pop', status=None, not_status_option=None, compute_cum_sum=True,
+def distance_cut_neighborhood(setA, setB, distance, mode='two-pop', status=None, not_status_option=None,
+							  compute_cum_sum=True,
 							  attention_weight=True, symmetrize=True, include_dead_weight=True,
-							  column_labels={'track': "TRACK_ID", 'time': 'FRAME', 'x': 'POSITION_X', 'y': 'POSITION_Y'}):
+							  column_labels={'track': "TRACK_ID", 'time': 'FRAME', 'x': 'POSITION_X',
+											 'y': 'POSITION_Y'}):
 	"""
-	Match neighbors in set A and B within a circle of radius d.
+	Match neighbors in set A and B within a circle of radius d.
 	Parameters
 	----------
@@ -154,7 +156,7 @@ def distance_cut_neighborhood(setA, setB, distance, mode='two-pop', status=None,
 		Cut-distance in pixels to match neighboring pairs.
 	mode: str
 		neighboring mode, between 'two-pop' (e.g. target-effector) and 'self' (target-target or effector-effector).
-	status: None or status
+	status: None or status
 		name to look for cells to ignore (because they are dead). By default all cells are kept.
 	compute_cum_sum: bool,
 		compute cumulated time of presence of neighbours (only if trajectories available for both sets)
@@ -170,112 +172,115 @@ def distance_cut_neighborhood(setA, setB, distance, mode='two-pop', status=None,
 	if setA is not None and setB is not None:
 		setA, setB, status = set_live_status(setA, setB, status, not_status_option)
 	else:
-		return None,None
+		return None, None
-	# Check distance option
+	# Check distance option
 	if not isinstance(distance, list):
 		distance = [distance]
 	for d in distance:
 		# loop over each provided distance
-		if mode=='two-pop':
+		if mode == 'two-pop':
 			neigh_col = f'neighborhood_2_circle_{d}_px'
-		elif mode=='self':
+		elif mode == 'self':
 			neigh_col = f'neighborhood_self_circle_{d}_px'
 		cl = []
-		for s in [setA,setB]:
+		for s in [setA, setB]:
 			# Check whether data can be tracked
 			temp_column_labels = column_labels.copy()
-			if not 'TRACK_ID' in list(s.columns):
-				temp_column_labels.update({'track': 'ID'})
-				compute_cum_sum = False # if no tracking data then cum_sum is not relevant
+			id_col = extract_identity_col(s)
+			temp_column_labels.update({'track': id_col})
+			if id_col=='ID':
+				compute_cum_sum = False  # if no tracking data then cum_sum is not relevant
 			cl.append(temp_column_labels)
 			# Remove nan tracks (cells that do not belong to a track)
 			s[neigh_col] = np.nan
 			s[neigh_col] = s[neigh_col].astype(object)
-			s.dropna(subset=[cl[-1]['track']],inplace=True)
+			s.dropna(subset=[cl[-1]['track']], inplace=True)
 		# Loop over each available timestep
-		timeline = np.unique(np.concatenate([setA[cl[0]['time']].to_numpy(), setB[cl[1]['time']].to_numpy()])).astype(int)
+		timeline = np.unique(np.concatenate([setA[cl[0]['time']].to_numpy(), setB[cl[1]['time']].to_numpy()])).astype(
+			int)
 		for t in tqdm(timeline):
-			index_A = list(setA.loc[setA[cl[0]['time']]==t].index)
-			coordinates_A = setA.loc[setA[cl[0]['time']]==t,[cl[0]['x'], cl[0]['y']]].to_numpy()
-			ids_A = setA.loc[setA[cl[0]['time']]==t,cl[0]['track']].to_numpy()
-			status_A = setA.loc[setA[cl[0]['time']]==t,status[0]].to_numpy()
+			index_A = list(setA.loc[setA[cl[0]['time']] == t].index)
+			coordinates_A = setA.loc[setA[cl[0]['time']] == t, [cl[0]['x'], cl[0]['y']]].to_numpy()
+			ids_A = setA.loc[setA[cl[0]['time']] == t, cl[0]['track']].to_numpy()
+			status_A = setA.loc[setA[cl[0]['time']] == t, status[0]].to_numpy()
-			index_B = list(setB.loc[setB[cl[1]['time']]==t].index)
-			coordinates_B = setB.loc[setB[cl[1]['time']]==t,[cl[1]['x'], cl[1]['y']]].to_numpy()
-			ids_B = setB.loc[setB[cl[1]['time']]==t,cl[1]['track']].to_numpy()
-			status_B = setB.loc[setB[cl[1]['time']]==t,status[1]].to_numpy()
+			index_B = list(setB.loc[setB[cl[1]['time']] == t].index)
+			coordinates_B = setB.loc[setB[cl[1]['time']] == t, [cl[1]['x'], cl[1]['y']]].to_numpy()
+			ids_B = setB.loc[setB[cl[1]['time']] == t, cl[1]['track']].to_numpy()
+			status_B = setB.loc[setB[cl[1]['time']] == t, status[1]].to_numpy()
 			if len(ids_A) > 0 and len(ids_B) > 0:
 				# compute distance matrix
 				dist_map = cdist(coordinates_A, coordinates_B, metric="euclidean")
 				if attention_weight:
-					weights, closest_A = compute_attention_weight(dist_map, d, status_A, ids_A, axis=1, include_dead_weight=include_dead_weight)
+					weights, closest_A = compute_attention_weight(dist_map, d, status_A, ids_A, axis=1,
+																  include_dead_weight=include_dead_weight)
 				# Target centric
 				for k in range(dist_map.shape[0]):
-					col = dist_map[k,:]
-					col[col==0.] = 1.0E06
-					neighs_B = np.array([ids_B[i] for i in np.where((col<=d))[0]])
-					status_neigh_B = np.array([status_B[i] for i in np.where((col<=d))[0]])
-					dist_B = [round(col[i],2) for i in np.where((col<=d))[0]]
-					if len(dist_B)>0:
-						closest_B_cell = neighs_B[np.argmin(dist_B)]
+					col = dist_map[k, :]
+					col[col == 0.] = 1.0E06
+					neighs_B = np.array([ids_B[i] for i in np.where((col <= d))[0]])
+					status_neigh_B = np.array([status_B[i] for i in np.where((col <= d))[0]])
+					dist_B = [round(col[i], 2) for i in np.where((col <= d))[0]]
+					if len(dist_B) > 0:
+						closest_B_cell = neighs_B[np.argmin(dist_B)]
 					if symmetrize and attention_weight:
 						n_neighs = float(len(neighs_B))
 						if not include_dead_weight:
-							n_neighs_alive = len(np.where(status_neigh_B==1)[0])
+							n_neighs_alive = len(np.where(status_neigh_B == 1)[0])
 							neigh_count = n_neighs_alive
 						else:
 							neigh_count = n_neighs
-						if neigh_count>0:
-							weight_A = 1./neigh_count
+						if neigh_count > 0:
+							weight_A = 1. / neigh_count
 						else:
 							weight_A = np.nan
-						if not include_dead_weight and status_A[k]==0:
+						if not include_dead_weight and status_A[k] == 0:
 							weight_A = 0
 					neighs = []
 					setA.at[index_A[k], neigh_col] = []
 					for n in range(len(neighs_B)):
 						# index in setB
-						n_index = np.where(ids_B==neighs_B[n])[0][0]
+						n_index = np.where(ids_B == neighs_B[n])[0][0]
 						# Assess if neigh B is closest to A
 						if attention_weight:
-							if closest_A[n_index]==ids_A[k]:
+							if closest_A[n_index] == ids_A[k]:
 								closest = True
 							else:
 								closest = False
 						if symmetrize:
 							# Load neighborhood previous data
 							sym_neigh = setB.loc[index_B[n_index], neigh_col]
-							if neighs_B[n]==closest_B_cell:
-								closest_b=True
+							if neighs_B[n] == closest_B_cell:
+								closest_b = True
 							else:
-								closest_b=False
+								closest_b = False
 							if isinstance(sym_neigh, list):
 								sym_neigh.append({'id': ids_A[k], 'distance': dist_B[n], 'status': status_A[k]})
 							else:
-								sym_neigh = [{'id': ids_A[k], 'distance': dist_B[n],'status': status_A[k]}]
+								sym_neigh = [{'id': ids_A[k], 'distance': dist_B[n], 'status': status_A[k]}]
 							if attention_weight:
 								sym_neigh[-1].update({'weight': weight_A, 'closest': closest_b})
 						# Write the minimum info about neighborhing cell B
 						neigh_dico = {'id': neighs_B[n], 'distance': dist_B[n], 'status': status_neigh_B[n]}
 						if attention_weight:
@@ -283,33 +288,42 @@ def distance_cut_neighborhood(setA, setB, distance, mode='two-pop', status=None,
 						if compute_cum_sum:
 							# Compute the integrated presence of the neighboring cell B
-							assert cl[1]['track'] == 'TRACK_ID','The set B does not seem to contain tracked data. The cumulative time will be meaningless.'
-							past_neighs = [[ll['id'] for ll in l] if len(l)>0 else [None] for l in setA.loc[(setA[cl[0]['track']]==ids_A[k])&(setA[cl[0]['time']]<=t), neigh_col].to_numpy()]
+							assert cl[1][
+									   'track'] == 'TRACK_ID', 'The set B does not seem to contain tracked data. The cumulative time will be meaningless.'
+							past_neighs = [[ll['id'] for ll in l] if len(l) > 0 else [None] for l in setA.loc[
+								(setA[cl[0]['track']] == ids_A[k]) & (setA[cl[0]['time']] <= t), neigh_col].to_numpy()]
 							past_neighs = [item for sublist in past_neighs for item in sublist]
 							if attention_weight:
-								past_weights = [[ll['weight'] for ll in l] if len(l)>0 else [None] for l in setA.loc[(setA[cl[0]['track']]==ids_A[k])&(setA[cl[0]['time']]<=t), neigh_col].to_numpy()]
+								past_weights = [[ll['weight'] for ll in l] if len(l) > 0 else [None] for l in setA.loc[
+									(setA[cl[0]['track']] == ids_A[k]) & (
+												setA[cl[0]['time']] <= t), neigh_col].to_numpy()]
 								past_weights = [item for sublist in past_weights for item in sublist]
-							cum_sum = len(np.where(past_neighs==neighs_B[n])[0])
-							neigh_dico.update({'cumulated_presence': cum_sum+1})
+							cum_sum = len(np.where(past_neighs == neighs_B[n])[0])
+							neigh_dico.update({'cumulated_presence': cum_sum + 1})
 							if attention_weight:
-								cum_sum_weighted = np.sum([w if l==neighs_B[n] else 0 for l,w in zip(past_neighs, past_weights)])
+								cum_sum_weighted = np.sum(
+									[w if l == neighs_B[n] else 0 for l, w in zip(past_neighs, past_weights)])
 								neigh_dico.update({'cumulated_presence_weighted': cum_sum_weighted + weights[n_index]})
 						if symmetrize:
 							setB.at[index_B[n_index], neigh_col] = sym_neigh
 						neighs.append(neigh_dico)
 					setA.at[index_A[k], neigh_col] = neighs
 	return setA, setB
-def compute_neighborhood_at_position(pos, distance, population=['targets','effectors'], theta_dist=None, img_shape=(2048,2048), return_tables=False, clear_neigh=False, event_time_col=None,
-	neighborhood_kwargs={'mode': 'two-pop','status': None, 'not_status_option': None,'include_dead_weight': True,"compute_cum_sum": False,"attention_weight": True, 'symmetrize': True}):
+def compute_neighborhood_at_position(pos, distance, population=['targets', 'effectors'], theta_dist=None,
+									 img_shape=(2048, 2048), return_tables=False, clear_neigh=False,
+									 event_time_col=None,
+									 neighborhood_kwargs={'mode': 'two-pop', 'status': None, 'not_status_option': None,
+														  'include_dead_weight': True, "compute_cum_sum": False,
+														  "attention_weight": True, 'symmetrize': True}):
 	"""
 	Computes neighborhood metrics for specified cell populations within a given position, based on distance criteria and additional parameters.
@@ -347,12 +361,12 @@ def compute_neighborhood_at_position(pos, distance, population=['targets','effec
 	------
 	AssertionError
 		If the specified position path does not exist or if the number of distances and edge thresholds do not match.
 	"""
-	pos = pos.replace('\\','/')
+	pos = pos.replace('\\', '/')
 	pos = rf"{pos}"
-	assert os.path.exists(pos),f'Position {pos} is not a valid path.'
+	assert os.path.exists(pos), f'Position {pos} is not a valid path.'
 	if isinstance(population, str):
 		population = [population, population]
@@ -363,75 +377,116 @@ def compute_neighborhood_at_position(pos, distance, population=['targets','effec
 		theta_dist = [theta_dist]
 	if theta_dist is None:
-		theta_dist = [0.9*d for d in distance]
-	assert len(theta_dist)==len(distance),'Incompatible number of distances and number of edge thresholds.'
+		theta_dist = [0.9 * d for d in distance]
+	assert len(theta_dist) == len(distance), 'Incompatible number of distances and number of edge thresholds.'
-	if population[0]==population[1]:
+	if population[0] == population[1]:
 		neighborhood_kwargs.update({'mode': 'self'})
-	if population[1]!=population[0]:
+	if population[1] != population[0]:
 		neighborhood_kwargs.update({'mode': 'two-pop'})
 	df_A, path_A = get_position_table(pos, population=population[0], return_path=True)
 	df_B, path_B = get_position_table(pos, population=population[1], return_path=True)
+	if clear_neigh:
+		if os.path.exists(path_A.replace('.csv','.pkl')):
+			os.remove(path_A.replace('.csv','.pkl'))
+		if os.path.exists(path_B.replace('.csv','.pkl')):
+			os.remove(path_B.replace('.csv','.pkl'))
+		df_pair, pair_path = get_position_table(pos, population='pairs', return_path=True)
+		if df_pair is not None:
+			os.remove(pair_path)
 	df_A_pkl = get_position_pickle(pos, population=population[0], return_path=False)
 	df_B_pkl = get_position_pickle(pos, population=population[1], return_path=False)
 	if df_A_pkl is not None:
 		pkl_columns = np.array(df_A_pkl.columns)
 		neigh_columns = np.array([c.startswith('neighborhood') for c in pkl_columns])
-		cols = list(pkl_columns[neigh_columns]) + ['TRACK_ID','FRAME']
+		cols = list(pkl_columns[neigh_columns]) + ['FRAME']
+		id_col = extract_identity_col(df_A_pkl)
+		cols.append(id_col)
+		on_cols = [id_col, 'FRAME']
 		print(f'Recover {cols} from the pickle file...')
-		df_A = pd.merge(df_A, df_A_pkl.loc[:,cols], how="outer", on=['TRACK_ID','FRAME'])
-		print(df_A.columns)
+		try:
+			df_A = pd.merge(df_A, df_A_pkl.loc[:,cols], how="outer", on=on_cols)
+			print(df_A.columns)
+		except Exception as e:
+			print(f'Failure to merge pickle and csv files: {e}')
 	if df_B_pkl is not None and df_B is not None:
 		pkl_columns = np.array(df_B_pkl.columns)
 		neigh_columns = np.array([c.startswith('neighborhood') for c in pkl_columns])
-		cols = list(pkl_columns[neigh_columns]) + ['TRACK_ID','FRAME']
+		cols = list(pkl_columns[neigh_columns]) + ['FRAME']
+		id_col = extract_identity_col(df_B_pkl)
+		cols.append(id_col)
+		on_cols = [id_col, 'FRAME']
 		print(f'Recover {cols} from the pickle file...')
-		df_B = pd.merge(df_B, df_B_pkl.loc[:,cols], how="outer", on=['TRACK_ID','FRAME'])
+		try:
+			df_B = pd.merge(df_B, df_B_pkl.loc[:,cols], how="outer", on=on_cols)
+		except Exception as e:
+			print(f'Failure to merge pickle and csv files: {e}')
 	if clear_neigh:
 		unwanted = df_A.columns[df_A.columns.str.contains('neighborhood')]
 		df_A = df_A.drop(columns=unwanted)
 		unwanted = df_B.columns[df_B.columns.str.contains('neighborhood')]
-		df_B = df_B.drop(columns=unwanted)
+		df_B = df_B.drop(columns=unwanted)
-	df_A, df_B = distance_cut_neighborhood(df_A,df_B, distance,**neighborhood_kwargs)
-	if df_A is None or df_B is None:
+	df_A, df_B = distance_cut_neighborhood(df_A, df_B, distance, **neighborhood_kwargs)
+	if df_A is None or df_B is None or len(df_A)==0:
 		return None
-	for td,d in zip(theta_dist, distance):
+	for td, d in zip(theta_dist, distance):
-		if neighborhood_kwargs['mode']=='two-pop':
+		if neighborhood_kwargs['mode'] == 'two-pop':
 			neigh_col = f'neighborhood_2_circle_{d}_px'
-		elif neighborhood_kwargs['mode']=='self':
+		elif neighborhood_kwargs['mode'] == 'self':
 			neigh_col = f'neighborhood_self_circle_{d}_px'
-		edge_filter_A = (df_A['POSITION_X'] > td)&(df_A['POSITION_Y'] > td)&(df_A['POSITION_Y'] < (img_shape[0] - td))&(df_A['POSITION_X'] < (img_shape[1] - td))
-		edge_filter_B = (df_B['POSITION_X'] > td)&(df_B['POSITION_Y'] > td)&(df_B['POSITION_Y'] < (img_shape[0] - td))&(df_B['POSITION_X'] < (img_shape[1] - td))
-		df_A.loc[~edge_filter_A, neigh_col] = np.nan
-		df_B.loc[~edge_filter_B, neigh_col] = np.nan
+		# edge_filter_A = (df_A['POSITION_X'] > td)&(df_A['POSITION_Y'] > td)&(df_A['POSITION_Y'] < (img_shape[0] - td))&(df_A['POSITION_X'] < (img_shape[1] - td))
+		# edge_filter_B = (df_B['POSITION_X'] > td)&(df_B['POSITION_Y'] > td)&(df_B['POSITION_Y'] < (img_shape[0] - td))&(df_B['POSITION_X'] < (img_shape[1] - td))
+		# df_A.loc[~edge_filter_A, neigh_col] = np.nan
+		# df_B.loc[~edge_filter_B, neigh_col] = np.nan
+		print('Count neighborhood...')
 		df_A = compute_neighborhood_metrics(df_A, neigh_col, metrics=['inclusive','exclusive','intermediate'], decompose_by_status=True)
-		if neighborhood_kwargs['symmetrize']:
-			df_B = compute_neighborhood_metrics(df_B, neigh_col, metrics=['inclusive','exclusive','intermediate'], decompose_by_status=True)
-		df_A = mean_neighborhood_before_event(df_A, neigh_col, event_time_col)
-		df_A = mean_neighborhood_after_event(df_A, neigh_col, event_time_col)
-	df_A.to_pickle(path_A.replace('.csv','.pkl'))
-	if not population[0]==population[1]:
-		df_B.to_pickle(path_B.replace('.csv','.pkl'))
+		# if neighborhood_kwargs['symmetrize']:
+		# 	df_B = compute_neighborhood_metrics(df_B, neigh_col, metrics=['inclusive','exclusive','intermediate'], decompose_by_status=True)
+		print('Done...')
+		if 'TRACK_ID' in list(df_A.columns):
+			if not np.all(df_A['TRACK_ID'].isnull()):
+				print('Estimate average neighborhood before/after event...')
+				df_A = mean_neighborhood_before_event(df_A, neigh_col, event_time_col)
+				if event_time_col is not None:
+					df_A = mean_neighborhood_after_event(df_A, neigh_col, event_time_col)
+				print('Done...')
+	df_A.to_pickle(path_A.replace('.csv', '.pkl'))
+	if not population[0] == population[1]:
+		# Remove neighborhood column
+		for td, d in zip(theta_dist, distance):
+			if neighborhood_kwargs['mode'] == 'two-pop':
+				neigh_col = f'neighborhood_2_circle_{d}_px'
+			elif neighborhood_kwargs['mode'] == 'self':
+				neigh_col = f'neighborhood_self_circle_{d}_px'
+			df_B = df_B.drop(columns=[neigh_col])
+		df_B.to_pickle(path_B.replace('.csv', '.pkl'))
 	unwanted = df_A.columns[df_A.columns.str.startswith('neighborhood_')]
 	df_A2 = df_A.drop(columns=unwanted)
 	df_A2.to_csv(path_A, index=False)
-	if not population[0]==population[1]:
+	if not population[0] == population[1]:
 		unwanted = df_B.columns[df_B.columns.str.startswith('neighborhood_')]
 		df_B_csv = df_B.drop(unwanted, axis=1, inplace=False)
-		df_B_csv.to_csv(path_B,index=False)
+		df_B_csv.to_csv(path_B, index=False)
 	if return_tables:
 		return df_A, df_B
@@ -480,17 +535,21 @@ def compute_neighborhood_metrics(neigh_table, neigh_col, metrics=['inclusive','e
 	>>> neigh_col = 'neighborhood_info'
 	>>> updated_neigh_table = compute_neighborhood_metrics(neigh_table, neigh_col, metrics=['inclusive'], decompose_by_status=True)
 	# Computes the inclusive count of neighbors for each cell, decomposed by cell status.
 	"""
 	neigh_table = neigh_table.reset_index(drop=True)
 	if 'position' in list(neigh_table.columns):
-		groupbycols = ['position','TRACK_ID']
+		groupbycols = ['position']
 	else:
-		groupbycols = ['TRACK_ID']
+		groupbycols = []
+	id_col = extract_identity_col(neigh_table)
+	groupbycols.append(id_col)
 	neigh_table.sort_values(by=groupbycols+['FRAME'],inplace=True)
-	for tid,group in neigh_table.groupby(groupbycols):
+	for tid, group in neigh_table.groupby(groupbycols):
 		group = group.dropna(subset=neigh_col)
 		indices = list(group.index)
 		neighbors = group[neigh_col].to_numpy()
@@ -536,49 +595,52 @@ def compute_neighborhood_metrics(neigh_table, neigh_col, metrics=['inclusive','e
 			if 'intermediate' in metrics:
 				n_intermediate[t] = np.sum(weights_at_t)
 			if 'exclusive' in metrics:
-				n_exclusive[t] = sum([c==1.0 for c in closest_at_t])
+				n_exclusive[t] = sum([c == 1.0 for c in closest_at_t])
 			if decompose_by_status:
 				if 'inclusive' in metrics:
-					n_inclusive_status_0[t] = sum([s==0.0 for s in status_at_t])
-					n_inclusive_status_1[t] = sum([s==1.0 for s in status_at_t])
+					n_inclusive_status_0[t] = sum([s == 0.0 for s in status_at_t])
+					n_inclusive_status_1[t] = sum([s == 1.0 for s in status_at_t])
 				if 'intermediate' in metrics:
 					weights_at_t = np.array(weights_at_t)
 					# intermediate
-					weights_status_1 = weights_at_t[np.array([s==1.0 for s in status_at_t],dtype=bool)]
-					weights_status_0 = weights_at_t[np.array([s==0.0 for s in status_at_t],dtype=bool)]
+					weights_status_1 = weights_at_t[np.array([s == 1.0 for s in status_at_t], dtype=bool)]
+					weights_status_0 = weights_at_t[np.array([s == 0.0 for s in status_at_t], dtype=bool)]
 					n_intermediate_status_1[t] = np.sum(weights_status_1)
 					n_intermediate_status_0[t] = np.sum(weights_status_0)
 				if 'exclusive' in metrics:
-					n_exclusive_status_0[t] = sum([c==1.0 if s==0.0 else False for c,s in zip(closest_at_t,status_at_t)])
-					n_exclusive_status_1[t] = sum([c==1.0 if s==1.0 else False for c,s in zip(closest_at_t,status_at_t)])
+					n_exclusive_status_0[t] = sum(
+						[c == 1.0 if s == 0.0 else False for c, s in zip(closest_at_t, status_at_t)])
+					n_exclusive_status_1[t] = sum(
+						[c == 1.0 if s == 1.0 else False for c, s in zip(closest_at_t, status_at_t)])
 		if 'inclusive' in metrics:
-			neigh_table.loc[indices, 'inclusive_count_'+neigh_col] = n_inclusive
+			neigh_table.loc[indices, 'inclusive_count_' + neigh_col] = n_inclusive
 		if 'intermediate' in metrics:
-			neigh_table.loc[indices, 'intermediate_count_'+neigh_col] = n_intermediate
+			neigh_table.loc[indices, 'intermediate_count_' + neigh_col] = n_intermediate
 		if 'exclusive' in metrics:
-			neigh_table.loc[indices, 'exclusive_count_'+neigh_col] = n_exclusive
+			neigh_table.loc[indices, 'exclusive_count_' + neigh_col] = n_exclusive
 		if decompose_by_status:
 			if 'inclusive' in metrics:
-				neigh_table.loc[indices, 'inclusive_count_s0_'+neigh_col] = n_inclusive_status_0
-				neigh_table.loc[indices, 'inclusive_count_s1_'+neigh_col] = n_inclusive_status_1
+				neigh_table.loc[indices, 'inclusive_count_s0_' + neigh_col] = n_inclusive_status_0
+				neigh_table.loc[indices, 'inclusive_count_s1_' + neigh_col] = n_inclusive_status_1
 			if 'intermediate' in metrics:
-				neigh_table.loc[indices, 'intermediate_count_s0_'+neigh_col] = n_intermediate_status_0
-				neigh_table.loc[indices, 'intermediate_count_s1_'+neigh_col] = n_intermediate_status_1
-			if 'exclusive' in metrics:
-				neigh_table.loc[indices, 'exclusive_count_s0_'+neigh_col] = n_exclusive_status_0
-				neigh_table.loc[indices, 'exclusive_count_s1_'+neigh_col] = n_exclusive_status_1
+				neigh_table.loc[indices, 'intermediate_count_s0_' + neigh_col] = n_intermediate_status_0
+				neigh_table.loc[indices, 'intermediate_count_s1_' + neigh_col] = n_intermediate_status_1
+			if 'exclusive' in metrics:
+				neigh_table.loc[indices, 'exclusive_count_s0_' + neigh_col] = n_exclusive_status_0
+				neigh_table.loc[indices, 'exclusive_count_s1_' + neigh_col] = n_exclusive_status_1
 	return neigh_table
-def mean_neighborhood_before_event(neigh_table, neigh_col, event_time_col, metrics=['inclusive','exclusive','intermediate']):
+def mean_neighborhood_before_event(neigh_table, neigh_col, event_time_col,
+								   metrics=['inclusive', 'exclusive', 'intermediate']):
 	"""
 	Computes the mean neighborhood metrics for each cell track before a specified event time.
@@ -607,52 +669,64 @@ def mean_neighborhood_before_event(neigh_table, neigh_col, event_time_col, metri
 	"""
+	neigh_table = neigh_table.reset_index(drop=True)
 	if 'position' in list(neigh_table.columns):
-		groupbycols = ['position','TRACK_ID']
+		groupbycols = ['position']
 	else:
-		groupbycols = ['TRACK_ID']
+		groupbycols = []
+	id_col = extract_identity_col(neigh_table)
+	groupbycols.append(id_col)
 	neigh_table.sort_values(by=groupbycols+['FRAME'],inplace=True)
 	suffix = '_before_event'
 	if event_time_col is None:
 		print('No event time was provided... Estimating the mean neighborhood over the whole observation time...')
-		neigh_table.loc[:,'event_time_temp'] = neigh_table['FRAME'].max()
+		neigh_table.loc[:, 'event_time_temp'] = neigh_table['FRAME'].max()
 		event_time_col = 'event_time_temp'
 		suffix = ''
-	for tid,group in neigh_table.groupby(groupbycols):
+	for tid, group in neigh_table.groupby(groupbycols):
 		group = group.dropna(subset=neigh_col)
 		indices = list(group.index)
 		event_time_values = group[event_time_col].to_numpy()
-		if len(event_time_values)>0:
+		if len(event_time_values) > 0:
 			event_time = event_time_values[0]
 		else:
 			continue
-		if event_time<0.:
+		if event_time < 0.:
 			event_time = group['FRAME'].max()
 		if 'intermediate' in metrics:
-			valid_counts_intermediate = group.loc[group['FRAME']<=event_time,'intermediate_count_s1_'+neigh_col].to_numpy()
-			if len(valid_counts_intermediate[valid_counts_intermediate==valid_counts_intermediate])>0:
-				neigh_table.loc[indices, f'mean_count_intermediate_{neigh_col}{suffix}'] = np.nanmean(valid_counts_intermediate)
+			valid_counts_intermediate = group.loc[
+				group['FRAME'] <= event_time, 'intermediate_count_s1_' + neigh_col].to_numpy()
+			if len(valid_counts_intermediate[valid_counts_intermediate == valid_counts_intermediate]) > 0:
+				neigh_table.loc[indices, f'mean_count_intermediate_{neigh_col}{suffix}'] = np.nanmean(
+					valid_counts_intermediate)
 		if 'inclusive' in metrics:
-			valid_counts_inclusive = group.loc[group['FRAME']<=event_time,'inclusive_count_s1_'+neigh_col].to_numpy()
-			if len(valid_counts_inclusive[valid_counts_inclusive==valid_counts_inclusive])>0:
-				neigh_table.loc[indices, f'mean_count_inclusive_{neigh_col}{suffix}'] = np.nanmean(valid_counts_inclusive)
+			valid_counts_inclusive = group.loc[
+				group['FRAME'] <= event_time, 'inclusive_count_s1_' + neigh_col].to_numpy()
+			if len(valid_counts_inclusive[valid_counts_inclusive == valid_counts_inclusive]) > 0:
+				neigh_table.loc[indices, f'mean_count_inclusive_{neigh_col}{suffix}'] = np.nanmean(
+					valid_counts_inclusive)
 		if 'exclusive' in metrics:
-			valid_counts_exclusive = group.loc[group['FRAME']<=event_time,'exclusive_count_s1_'+neigh_col].to_numpy()
-			if len(valid_counts_exclusive[valid_counts_exclusive==valid_counts_exclusive])>0:
-				neigh_table.loc[indices, f'mean_count_exclusive_{neigh_col}{suffix}'] = np.nanmean(valid_counts_exclusive)
+			valid_counts_exclusive = group.loc[
+				group['FRAME'] <= event_time, 'exclusive_count_s1_' + neigh_col].to_numpy()
+			if len(valid_counts_exclusive[valid_counts_exclusive == valid_counts_exclusive]) > 0:
+				neigh_table.loc[indices, f'mean_count_exclusive_{neigh_col}{suffix}'] = np.nanmean(
+					valid_counts_exclusive)
-	if event_time_col=='event_time_temp':
+	if event_time_col == 'event_time_temp':
 		neigh_table = neigh_table.drop(columns='event_time_temp')
 	return neigh_table
-def mean_neighborhood_after_event(neigh_table, neigh_col, event_time_col, metrics=['inclusive','exclusive','intermediate']):
+def mean_neighborhood_after_event(neigh_table, neigh_col, event_time_col,
+								  metrics=['inclusive', 'exclusive', 'intermediate']):
 	"""
 	Computes the mean neighborhood metrics for each cell track after a specified event time.
@@ -681,54 +755,67 @@ def mean_neighborhood_after_event(neigh_table, neigh_col, event_time_col, metric
 	"""
+	neigh_table = neigh_table.reset_index(drop=True)
 	if 'position' in list(neigh_table.columns):
-		groupbycols = ['position','TRACK_ID']
+		groupbycols = ['position']
 	else:
-		groupbycols = ['TRACK_ID']
+		groupbycols = []
+	id_col = extract_identity_col(neigh_table)
+	groupbycols.append(id_col)
 	neigh_table.sort_values(by=groupbycols+['FRAME'],inplace=True)
 	suffix = '_after_event'
 	if event_time_col is None:
-		neigh_table.loc[:,'event_time_temp'] = None #neigh_table['FRAME'].max()
+		neigh_table.loc[:, 'event_time_temp'] = None  # neigh_table['FRAME'].max()
 		event_time_col = 'event_time_temp'
 		suffix = ''
-	for tid,group in neigh_table.groupby(groupbycols):
+	for tid, group in neigh_table.groupby(groupbycols):
 		group = group.dropna(subset=neigh_col)
 		indices = list(group.index)
 		event_time_values = group[event_time_col].to_numpy()
-		if len(event_time_values)>0:
+		if len(event_time_values) > 0:
 			event_time = event_time_values[0]
 		else:
 			continue
-		if event_time is not None and (event_time>=0.):
+		if event_time is not None and (event_time >= 0.):
 			if 'intermediate' in metrics:
-				valid_counts_intermediate = group.loc[group['FRAME']>event_time,'intermediate_count_s1_'+neigh_col].to_numpy()
-				if len(valid_counts_intermediate[valid_counts_intermediate==valid_counts_intermediate])>0:
-					neigh_table.loc[indices, f'mean_count_intermediate_{neigh_col}{suffix}'] = np.nanmean(valid_counts_intermediate)
+				valid_counts_intermediate = group.loc[
+					group['FRAME'] > event_time, 'intermediate_count_s1_' + neigh_col].to_numpy()
+				if len(valid_counts_intermediate[valid_counts_intermediate == valid_counts_intermediate]) > 0:
+					neigh_table.loc[indices, f'mean_count_intermediate_{neigh_col}{suffix}'] = np.nanmean(
+						valid_counts_intermediate)
 			if 'inclusive' in metrics:
-				valid_counts_inclusive = group.loc[group['FRAME']>event_time,'inclusive_count_s1_'+neigh_col].to_numpy()
-				if len(valid_counts_inclusive[valid_counts_inclusive==valid_counts_inclusive])>0:
-					neigh_table.loc[indices, f'mean_count_inclusive_{neigh_col}{suffix}'] = np.nanmean(valid_counts_inclusive)
+				valid_counts_inclusive = group.loc[
+					group['FRAME'] > event_time, 'inclusive_count_s1_' + neigh_col].to_numpy()
+				if len(valid_counts_inclusive[valid_counts_inclusive == valid_counts_inclusive]) > 0:
+					neigh_table.loc[indices, f'mean_count_inclusive_{neigh_col}{suffix}'] = np.nanmean(
+						valid_counts_inclusive)
 			if 'exclusive' in metrics:
-				valid_counts_exclusive = group.loc[group['FRAME']>event_time,'exclusive_count_s1_'+neigh_col].to_numpy()
-				if len(valid_counts_exclusive[valid_counts_exclusive==valid_counts_exclusive])>0:
-					neigh_table.loc[indices, f'mean_count_exclusive_{neigh_col}{suffix}'] = np.nanmean(valid_counts_exclusive)
+				valid_counts_exclusive = group.loc[
+					group['FRAME'] > event_time, 'exclusive_count_s1_' + neigh_col].to_numpy()
+				if len(valid_counts_exclusive[valid_counts_exclusive == valid_counts_exclusive]) > 0:
+					neigh_table.loc[indices, f'mean_count_exclusive_{neigh_col}{suffix}'] = np.nanmean(
+						valid_counts_exclusive)
-	if event_time_col=='event_time_temp':
+	if event_time_col == 'event_time_temp':
 		neigh_table = neigh_table.drop(columns='event_time_temp')
 	return neigh_table
 # New functions for direct cell-cell contact neighborhood
 def sign(num):
 	return -1 if num < 0 else 1
 def contact_neighborhood(labelsA, labelsB=None, border=3, connectivity=2):
 	labelsA = labelsA.astype(float)
@@ -736,50 +823,50 @@ def contact_neighborhood(labelsA, labelsB=None, border=3, connectivity=2):
 		labelsB = labelsB.astype(float)
 	print(f"Border = {border}")
 	if border > 0:
 		print(labelsA.shape, border * (-1))
 		labelsA_edge = contour_of_instance_segmentation(label=labelsA, distance=border * (-1)).astype(float)
-		labelsA[np.where(labelsA_edge>0)] = labelsA_edge[np.where(labelsA_edge>0)]
+		labelsA[np.where(labelsA_edge > 0)] = labelsA_edge[np.where(labelsA_edge > 0)]
 		if labelsB is not None:
 			labelsB_edge = contour_of_instance_segmentation(label=labelsB, distance=border * (-1)).astype(float)
-			labelsB[np.where(labelsB_edge>0)] = labelsB_edge[np.where(labelsB_edge>0)]
+			labelsB[np.where(labelsB_edge > 0)] = labelsB_edge[np.where(labelsB_edge > 0)]
 	if labelsB is not None:
-		labelsA[labelsA!=0] = -labelsA[labelsA!=0]
+		labelsA[labelsA != 0] = -labelsA[labelsA != 0]
 		labelsAB = merge_labels(labelsA, labelsB)
 		labelsBA = merge_labels(labelsB, labelsA)
 		label_cases = [labelsAB, labelsBA]
 	else:
 		label_cases = [labelsA]
 	coocurrences = []
 	for lbl in label_cases:
 		coocurrences.extend(find_contact_neighbors(lbl, connectivity=connectivity))
-	unique_pairs = np.unique(coocurrences,axis=0)
+	unique_pairs = np.unique(coocurrences, axis=0)
 	if labelsB is not None:
-		neighs = np.unique([tuple(sorted(p)) for p in unique_pairs if p[0]!=p[1] and sign(p[0])!=sign(p[1])],axis=0)
+		neighs = np.unique([tuple(sorted(p)) for p in unique_pairs if p[0] != p[1] and sign(p[0]) != sign(p[1])],
+						   axis=0)
 	else:
-		neighs = np.unique([tuple(sorted(p)) for p in unique_pairs if p[0]!=p[1]],axis=0)
+		neighs = np.unique([tuple(sorted(p)) for p in unique_pairs if p[0] != p[1]], axis=0)
 	return neighs
 def merge_labels(labelsA, labelsB):
 	labelsA = labelsA.astype(float)
 	labelsB = labelsB.astype(float)
 	labelsAB = labelsA.copy()
-	labelsAB[np.where(labelsB!=0)] = labelsB[np.where(labelsB!=0)]
+	labelsAB[np.where(labelsB != 0)] = labelsB[np.where(labelsB != 0)]
 	return labelsAB
 def find_contact_neighbors(labels, connectivity=2):
-	assert labels.ndim==2,"Wrong dimension for labels..."
-	g, nodes = pixel_graph(labels, mask=labels.astype(bool),connectivity=connectivity)
+	assert labels.ndim == 2, "Wrong dimension for labels..."
+	g, nodes = pixel_graph(labels, mask=labels.astype(bool), connectivity=connectivity)
 	g.eliminate_zeros()
 	coo = g.tocoo()
@@ -788,18 +875,19 @@ def find_contact_neighbors(labels, connectivity=2):
 	center_values = labels.ravel()[center_coords]
 	neighbor_values = labels.ravel()[neighbor_coords]
-	touching_masks = np.column_stack((center_values, neighbor_values))
+	touching_masks = np.column_stack((center_values, neighbor_values))
 	return touching_masks
-def mask_contact_neighborhood(setA, setB, labelsA, labelsB, distance, mode='two-pop', status=None, not_status_option=None, compute_cum_sum=True,
+def mask_contact_neighborhood(setA, setB, labelsA, labelsB, distance, mode='two-pop', status=None,
+							  not_status_option=None, compute_cum_sum=True,
 							  attention_weight=True, symmetrize=True, include_dead_weight=True,
-							  column_labels={'track': "TRACK_ID", 'time': 'FRAME', 'x': 'POSITION_X', 'y': 'POSITION_Y', 'mask_id': 'class_id'}):
+							  column_labels={'track': "TRACK_ID", 'time': 'FRAME', 'x': 'POSITION_X', 'y': 'POSITION_Y',
+											 'mask_id': 'class_id'}):
 	"""
-	Match neighbors in set A and B within a circle of radius d.
+	Match neighbors in set A and B within a circle of radius d.
 	Parameters
 	----------
@@ -809,7 +897,7 @@ def mask_contact_neighborhood(setA, setB, labelsA, labelsB, distance, mode='two-
 		Cut-distance in pixels to match neighboring pairs.
 	mode: str
 		neighboring mode, between 'two-pop' (e.g. target-effector) and 'self' (target-target or effector-effector).
-	status: None or status
+	status: None or status
 		name to look for cells to ignore (because they are dead). By default all cells are kept.
 	compute_cum_sum: bool,
 		compute cumulated time of presence of neighbours (only if trajectories available for both sets)
@@ -825,57 +913,59 @@ def mask_contact_neighborhood(setA, setB, labelsA, labelsB, distance, mode='two-
 	if setA is not None and setB is not None:
 		setA, setB, status = set_live_status(setA, setB, status, not_status_option)
 	else:
-		return None,None
+		return None, None
-	# Check distance option
+	# Check distance option
 	if not isinstance(distance, list):
 		distance = [distance]
 	for d in distance:
 		# loop over each provided distance
-		if mode=='two-pop':
+		if mode == 'two-pop':
 			neigh_col = f'neighborhood_2_contact_{d}_px'
-		elif mode=='self':
+		elif mode == 'self':
 			neigh_col = f'neighborhood_self_contact_{d}_px'
 		cl = []
-		for s in [setA,setB]:
+		for s in [setA, setB]:
 			# Check whether data can be tracked
 			temp_column_labels = column_labels.copy()
-			if not 'TRACK_ID' in list(s.columns):
-				temp_column_labels.update({'track': 'ID'})
-				compute_cum_sum = False # if no tracking data then cum_sum is not relevant
+			id_col = extract_identity_col(s)
+			temp_column_labels.update({'track': id_col})
+			if id_col=='ID':
+				compute_cum_sum = False  # if no tracking data then cum_sum is not relevant
 			cl.append(temp_column_labels)
 			# Remove nan tracks (cells that do not belong to a track)
 			s[neigh_col] = np.nan
 			s[neigh_col] = s[neigh_col].astype(object)
-			s.dropna(subset=[cl[-1]['track']],inplace=True)
+			s.dropna(subset=[cl[-1]['track']], inplace=True)
 		# Loop over each available timestep
-		timeline = np.unique(np.concatenate([setA[cl[0]['time']].to_numpy(), setB[cl[1]['time']].to_numpy()])).astype(int)
+		timeline = np.unique(np.concatenate([setA[cl[0]['time']].to_numpy(), setB[cl[1]['time']].to_numpy()])).astype(
+			int)
 		for t in tqdm(timeline):
-			index_A = list(setA.loc[setA[cl[0]['time']]==t].index)
-			coordinates_A = setA.loc[setA[cl[0]['time']]==t,[cl[0]['x'], cl[0]['y']]].to_numpy()
-			ids_A = setA.loc[setA[cl[0]['time']]==t,cl[0]['track']].to_numpy()
-			mask_ids_A = setA.loc[setA[cl[0]['time']]==t,cl[0]['mask_id']].to_numpy()
-			status_A = setA.loc[setA[cl[0]['time']]==t,status[0]].to_numpy()
-			index_B = list(setB.loc[setB[cl[1]['time']]==t].index)
-			coordinates_B = setB.loc[setB[cl[1]['time']]==t,[cl[1]['x'], cl[1]['y']]].to_numpy()
-			ids_B = setB.loc[setB[cl[1]['time']]==t,cl[1]['track']].to_numpy()
-			mask_ids_B = setB.loc[setB[cl[1]['time']]==t,cl[1]['mask_id']].to_numpy()
-			status_B = setB.loc[setB[cl[1]['time']]==t,status[1]].to_numpy()
+			index_A = list(setA.loc[setA[cl[0]['time']] == t].index)
+			coordinates_A = setA.loc[setA[cl[0]['time']] == t, [cl[0]['x'], cl[0]['y']]].to_numpy()
+			ids_A = setA.loc[setA[cl[0]['time']] == t, cl[0]['track']].to_numpy()
+			mask_ids_A = setA.loc[setA[cl[0]['time']] == t, cl[0]['mask_id']].to_numpy()
+			status_A = setA.loc[setA[cl[0]['time']] == t, status[0]].to_numpy()
+			index_B = list(setB.loc[setB[cl[1]['time']] == t].index)
+			coordinates_B = setB.loc[setB[cl[1]['time']] == t, [cl[1]['x'], cl[1]['y']]].to_numpy()
+			ids_B = setB.loc[setB[cl[1]['time']] == t, cl[1]['track']].to_numpy()
+			mask_ids_B = setB.loc[setB[cl[1]['time']] == t, cl[1]['mask_id']].to_numpy()
+			status_B = setB.loc[setB[cl[1]['time']] == t, status[1]].to_numpy()
 			print(f"Frame {t}")
-			print(f"{mask_ids_A=}",f"{mask_ids_B}")
+			print(f"{mask_ids_A=}", f"{mask_ids_B}")
 			if len(ids_A) > 0 and len(ids_B) > 0:
 				# compute distance matrix
 				dist_map = cdist(coordinates_A, coordinates_B, metric="euclidean")
@@ -886,21 +976,21 @@ def mask_contact_neighborhood(setA, setB, labelsA, labelsB, distance, mode='two-
 					lblB = labelsB
 				print(f"Distance {d} for contact as border")
-				contact_pairs = contact_neighborhood(labelsA[t], labelsB=lblB, border=d, connectivity=2)
+				contact_pairs = contact_neighborhood(labelsA[t], labelsB=lblB, border=d, connectivity=2)
 				print(t, f"{np.unique(labelsA[t])=}")
 				print(f"Frame {t}: found the following contact pairs: {contact_pairs}...")
 				# Put infinite distance to all non-contact pairs (something like this)
-				plot_map=False
+				plot_map = False
-				if len(contact_pairs)>0:
+				if len(contact_pairs) > 0:
 					mask = np.ones_like(dist_map).astype(bool)
 					indices_to_keep = []
 					for cp in contact_pairs:
-						if np.any(cp<0):
-							if cp[0]<0:
+						if np.any(cp < 0):
+							if cp[0] < 0:
 								mask_A = cp[1]
 								mask_B = np.abs(cp[0])
 							else:
@@ -912,8 +1002,8 @@ def mask_contact_neighborhood(setA, setB, labelsA, labelsB, distance, mode='two-
 						try:
-							idx_A = np.where(mask_ids_A==int(mask_A))[0][0]
-							idx_B = np.where(mask_ids_B==int(mask_B))[0][0]
+							idx_A = np.where(mask_ids_A == int(mask_A))[0][0]
+							idx_B = np.where(mask_ids_B == int(mask_B))[0][0]
 							print(idx_A, idx_B)
 							indices_to_keep.append([idx_A,idx_B])
 						except Exception as e:
@@ -921,17 +1011,17 @@ def mask_contact_neighborhood(setA, setB, labelsA, labelsB, distance, mode='two-
 							pass
 					print(f'Indices to keep: {indices_to_keep}...')
-					if len(indices_to_keep)>0:
+					if len(indices_to_keep) > 0:
 						indices_to_keep = np.array(indices_to_keep)
-						mask[indices_to_keep[:,0],indices_to_keep[:,1]] = False
-						if mode=='self':
-							mask[indices_to_keep[:,1],indices_to_keep[:,0]] = False
+						mask[indices_to_keep[:, 0], indices_to_keep[:, 1]] = False
+						if mode == 'self':
+							mask[indices_to_keep[:, 1], indices_to_keep[:, 0]] = False
 						dist_map[mask] = 1.0E06
 						plot_map=True
 					else:
 						dist_map[:,:] = 1.0E06
 				else:
-					dist_map[:,:] = 1.0E06
+					dist_map[:, :] = 1.0E06
 				# PROCEED all the same?? --> I guess so
 				# if plot_map:
@@ -943,62 +1033,63 @@ def mask_contact_neighborhood(setA, setB, labelsA, labelsB, distance, mode='two-
 				d_filter = 1.0E05
 				if attention_weight:
-					weights, closest_A = compute_attention_weight(dist_map, d_filter, status_A, ids_A, axis=1, include_dead_weight=include_dead_weight)
+					weights, closest_A = compute_attention_weight(dist_map, d_filter, status_A, ids_A, axis=1,
+																  include_dead_weight=include_dead_weight)
 				# Target centric
 				for k in range(dist_map.shape[0]):
-					col = dist_map[k,:]
-					col[col==0.] = 1.0E06
-					neighs_B = np.array([ids_B[i] for i in np.where((col<=d_filter))[0]])
-					status_neigh_B = np.array([status_B[i] for i in np.where((col<=d_filter))[0]])
-					dist_B = [round(col[i],2) for i in np.where((col<=d_filter))[0]]
-					if len(dist_B)>0:
-						closest_B_cell = neighs_B[np.argmin(dist_B)]
+					col = dist_map[k, :]
+					col[col == 0.] = 1.0E06
+					neighs_B = np.array([ids_B[i] for i in np.where((col <= d_filter))[0]])
+					status_neigh_B = np.array([status_B[i] for i in np.where((col <= d_filter))[0]])
+					dist_B = [round(col[i], 2) for i in np.where((col <= d_filter))[0]]
+					if len(dist_B) > 0:
+						closest_B_cell = neighs_B[np.argmin(dist_B)]
 					if symmetrize and attention_weight:
 						n_neighs = float(len(neighs_B))
 						if not include_dead_weight:
-							n_neighs_alive = len(np.where(status_neigh_B==1)[0])
+							n_neighs_alive = len(np.where(status_neigh_B == 1)[0])
 							neigh_count = n_neighs_alive
 						else:
 							neigh_count = n_neighs
-						if neigh_count>0:
-							weight_A = 1./neigh_count
+						if neigh_count > 0:
+							weight_A = 1. / neigh_count
 						else:
 							weight_A = np.nan
-						if not include_dead_weight and status_A[k]==0:
+						if not include_dead_weight and status_A[k] == 0:
 							weight_A = 0
 					neighs = []
 					setA.at[index_A[k], neigh_col] = []
 					for n in range(len(neighs_B)):
 						# index in setB
-						n_index = np.where(ids_B==neighs_B[n])[0][0]
+						n_index = np.where(ids_B == neighs_B[n])[0][0]
 						# Assess if neigh B is closest to A
 						if attention_weight:
-							if closest_A[n_index]==ids_A[k]:
+							if closest_A[n_index] == ids_A[k]:
 								closest = True
 							else:
 								closest = False
 						if symmetrize:
 							# Load neighborhood previous data
 							sym_neigh = setB.loc[index_B[n_index], neigh_col]
-							if neighs_B[n]==closest_B_cell:
-								closest_b=True
+							if neighs_B[n] == closest_B_cell:
+								closest_b = True
 							else:
-								closest_b=False
+								closest_b = False
 							if isinstance(sym_neigh, list):
 								sym_neigh.append({'id': ids_A[k], 'distance': dist_B[n], 'status': status_A[k]})
 							else:
-								sym_neigh = [{'id': ids_A[k], 'distance': dist_B[n],'status': status_A[k]}]
+								sym_neigh = [{'id': ids_A[k], 'distance': dist_B[n], 'status': status_A[k]}]
 							if attention_weight:
 								sym_neigh[-1].update({'weight': weight_A, 'closest': closest_b})
 						# Write the minimum info about neighborhing cell B
 						neigh_dico = {'id': neighs_B[n], 'distance': dist_B[n], 'status': status_neigh_B[n]}
 						if attention_weight:
@@ -1006,33 +1097,43 @@ def mask_contact_neighborhood(setA, setB, labelsA, labelsB, distance, mode='two-
 						if compute_cum_sum:
 							# Compute the integrated presence of the neighboring cell B
-							assert cl[1]['track'] == 'TRACK_ID','The set B does not seem to contain tracked data. The cumulative time will be meaningless.'
-							past_neighs = [[ll['id'] for ll in l] if len(l)>0 else [None] for l in setA.loc[(setA[cl[0]['track']]==ids_A[k])&(setA[cl[0]['time']]<=t), neigh_col].to_numpy()]
+							assert cl[1][
+									   'track'] == 'TRACK_ID', 'The set B does not seem to contain tracked data. The cumulative time will be meaningless.'
+							past_neighs = [[ll['id'] for ll in l] if len(l) > 0 else [None] for l in setA.loc[
+								(setA[cl[0]['track']] == ids_A[k]) & (setA[cl[0]['time']] <= t), neigh_col].to_numpy()]
 							past_neighs = [item for sublist in past_neighs for item in sublist]
 							if attention_weight:
-								past_weights = [[ll['weight'] for ll in l] if len(l)>0 else [None] for l in setA.loc[(setA[cl[0]['track']]==ids_A[k])&(setA[cl[0]['time']]<=t), neigh_col].to_numpy()]
+								past_weights = [[ll['weight'] for ll in l] if len(l) > 0 else [None] for l in setA.loc[
+									(setA[cl[0]['track']] == ids_A[k]) & (
+												setA[cl[0]['time']] <= t), neigh_col].to_numpy()]
 								past_weights = [item for sublist in past_weights for item in sublist]
-							cum_sum = len(np.where(past_neighs==neighs_B[n])[0])
-							neigh_dico.update({'cumulated_presence': cum_sum+1})
+							cum_sum = len(np.where(past_neighs == neighs_B[n])[0])
+							neigh_dico.update({'cumulated_presence': cum_sum + 1})
 							if attention_weight:
-								cum_sum_weighted = np.sum([w if l==neighs_B[n] else 0 for l,w in zip(past_neighs, past_weights)])
+								cum_sum_weighted = np.sum(
+									[w if l == neighs_B[n] else 0 for l, w in zip(past_neighs, past_weights)])
 								neigh_dico.update({'cumulated_presence_weighted': cum_sum_weighted + weights[n_index]})
 						if symmetrize:
 							setB.at[index_B[n_index], neigh_col] = sym_neigh
 						neighs.append(neigh_dico)
 					setA.at[index_A[k], neigh_col] = neighs
 	return setA, setB
-def compute_contact_neighborhood_at_position(pos, distance, population=['targets','effectors'], theta_dist=None, img_shape=(2048,2048), return_tables=False, clear_neigh=False, event_time_col=None,
-	neighborhood_kwargs={'mode': 'two-pop','status': None, 'not_status_option': None,'include_dead_weight': True,"compute_cum_sum": False,"attention_weight": True, 'symmetrize': True}):
+def compute_contact_neighborhood_at_position(pos, distance, population=['targets', 'effectors'], theta_dist=None,
+											 img_shape=(2048, 2048), return_tables=False, clear_neigh=False,
+											 event_time_col=None,
+											 neighborhood_kwargs={'mode': 'two-pop', 'status': None,
+																  'not_status_option': None,
+																  'include_dead_weight': True, "compute_cum_sum": False,
+																  "attention_weight": True, 'symmetrize': True}):
 	"""
 	Computes neighborhood metrics for specified cell populations within a given position, based on distance criteria and additional parameters.
@@ -1070,12 +1171,12 @@ def compute_contact_neighborhood_at_position(pos, distance, population=['targets
 	------
 	AssertionError
 		If the specified position path does not exist or if the number of distances and edge thresholds do not match.
 	"""
-	pos = pos.replace('\\','/')
+	pos = pos.replace('\\', '/')
 	pos = rf"{pos}"
-	assert os.path.exists(pos),f'Position {pos} is not a valid path.'
+	assert os.path.exists(pos), f'Position {pos} is not a valid path.'
 	if isinstance(population, str):
 		population = [population, population]
@@ -1086,16 +1187,27 @@ def compute_contact_neighborhood_at_position(pos, distance, population=['targets
 		theta_dist = [theta_dist]
 	if theta_dist is None:
-		theta_dist = [0 for d in distance] #0.9*d
-	assert len(theta_dist)==len(distance),'Incompatible number of distances and number of edge thresholds.'
+		theta_dist = [0 for d in distance]  # 0.9*d
+	assert len(theta_dist) == len(distance), 'Incompatible number of distances and number of edge thresholds.'
-	if population[0]==population[1]:
+	if population[0] == population[1]:
 		neighborhood_kwargs.update({'mode': 'self'})
-	if population[1]!=population[0]:
+	if population[1] != population[0]:
 		neighborhood_kwargs.update({'mode': 'two-pop'})
 	df_A, path_A = get_position_table(pos, population=population[0], return_path=True)
 	df_B, path_B = get_position_table(pos, population=population[1], return_path=True)
+	if df_A is None or df_B is None:
+		return None
+	if clear_neigh:
+		if os.path.exists(path_A.replace('.csv','.pkl')):
+			os.remove(path_A.replace('.csv','.pkl'))
+		if os.path.exists(path_B.replace('.csv','.pkl')):
+			os.remove(path_B.replace('.csv','.pkl'))
+		df_pair, pair_path = get_position_table(pos, population='pairs', return_path=True)
+		if df_pair is not None:
+			os.remove(pair_path)
 	df_A_pkl = get_position_pickle(pos, population=population[0], return_path=False)
 	df_B_pkl = get_position_pickle(pos, population=population[1], return_path=False)
@@ -1103,19 +1215,36 @@ def compute_contact_neighborhood_at_position(pos, distance, population=['targets
 	if df_A_pkl is not None:
 		pkl_columns = np.array(df_A_pkl.columns)
 		neigh_columns = np.array([c.startswith('neighborhood') for c in pkl_columns])
-		cols = list(pkl_columns[neigh_columns]) + ['TRACK_ID','FRAME']
+		cols = list(pkl_columns[neigh_columns]) + ['FRAME']
+		id_col = extract_identity_col(df_A_pkl)
+		cols.append(id_col)
+		on_cols = [id_col, 'FRAME']
 		print(f'Recover {cols} from the pickle file...')
-		df_A = pd.merge(df_A, df_A_pkl.loc[:,cols], how="outer", on=['TRACK_ID','FRAME'])
-		print(df_A.columns)
+		try:
+			df_A = pd.merge(df_A, df_A_pkl.loc[:,cols], how="outer", on=on_cols)
+			print(df_A.columns)
+		except Exception as e:
+			print(f'Failure to merge pickle and csv files: {e}')
 	if df_B_pkl is not None and df_B is not None:
 		pkl_columns = np.array(df_B_pkl.columns)
 		neigh_columns = np.array([c.startswith('neighborhood') for c in pkl_columns])
-		cols = list(pkl_columns[neigh_columns]) + ['TRACK_ID','FRAME']
+		cols = list(pkl_columns[neigh_columns]) + ['FRAME']
+		id_col = extract_identity_col(df_B_pkl)
+		cols.append(id_col)
+		on_cols = [id_col, 'FRAME']
 		print(f'Recover {cols} from the pickle file...')
-		df_B = pd.merge(df_B, df_B_pkl.loc[:,cols], how="outer", on=['TRACK_ID','FRAME'])
+		try:
+			df_B = pd.merge(df_B, df_B_pkl.loc[:,cols], how="outer", on=on_cols)
+		except Exception as e:
+			print(f'Failure to merge pickle and csv files: {e}')
 	labelsA = locate_labels(pos, population=population[0])
-	if population[1]==population[0]:
+	if population[1] == population[0]:
 		labelsB = None
 	else:
 		labelsB = locate_labels(pos, population=population[1])
@@ -1124,18 +1253,18 @@ def compute_contact_neighborhood_at_position(pos, distance, population=['targets
 		unwanted = df_A.columns[df_A.columns.str.contains('neighborhood')]
 		df_A = df_A.drop(columns=unwanted)
 		unwanted = df_B.columns[df_B.columns.str.contains('neighborhood')]
-		df_B = df_B.drop(columns=unwanted)
+		df_B = df_B.drop(columns=unwanted)
 	print(f"Distance: {distance} for mask contact")
-	df_A, df_B = mask_contact_neighborhood(df_A, df_B, labelsA, labelsB, distance,**neighborhood_kwargs)
-	if df_A is None or df_B is None:
+	df_A, df_B = mask_contact_neighborhood(df_A, df_B, labelsA, labelsB, distance, **neighborhood_kwargs)
+	if df_A is None or df_B is None or len(df_A)==0:
 		return None
-	for td,d in zip(theta_dist, distance):
+	for td, d in zip(theta_dist, distance):
-		if neighborhood_kwargs['mode']=='two-pop':
+		if neighborhood_kwargs['mode'] == 'two-pop':
 			neigh_col = f'neighborhood_2_contact_{d}_px'
-		elif neighborhood_kwargs['mode']=='self':
+		elif neighborhood_kwargs['mode'] == 'self':
 			neigh_col = f'neighborhood_self_contact_{d}_px'
 		df_A.loc[df_A['class_id'].isnull(),neigh_col] = np.nan
@@ -1145,26 +1274,34 @@ def compute_contact_neighborhood_at_position(pos, distance, population=['targets
 		# df_A.loc[~edge_filter_A, neigh_col] = np.nan
 		# df_B.loc[~edge_filter_B, neigh_col] = np.nan
-		df_A = compute_neighborhood_metrics(df_A, neigh_col, metrics=['inclusive','intermediate'], decompose_by_status=True)
-		if neighborhood_kwargs['symmetrize']:
-			df_B = compute_neighborhood_metrics(df_B, neigh_col, metrics=['inclusive','intermediate'], decompose_by_status=True)
-		df_A = mean_neighborhood_before_event(df_A, neigh_col, event_time_col, metrics=['inclusive','intermediate'])
-		if event_time_col is not None:
-			df_A = mean_neighborhood_after_event(df_A, neigh_col, event_time_col, metrics=['inclusive','intermediate'])
-	df_A.to_pickle(path_A.replace('.csv','.pkl'))
-	if not population[0]==population[1]:
-		df_B.to_pickle(path_B.replace('.csv','.pkl'))
+		df_A = compute_neighborhood_metrics(df_A, neigh_col, metrics=['inclusive', 'intermediate'],
+											decompose_by_status=True)
+		if 'TRACK_ID' in list(df_A.columns):
+			if not np.all(df_A['TRACK_ID'].isnull()):
+				df_A = mean_neighborhood_before_event(df_A, neigh_col, event_time_col, metrics=['inclusive','intermediate'])
+				if event_time_col is not None:
+					df_A = mean_neighborhood_after_event(df_A, neigh_col, event_time_col, metrics=['inclusive', 'intermediate'])
+				print('Done...')
+	df_A.to_pickle(path_A.replace('.csv', '.pkl'))
+	if not population[0] == population[1]:
+		# Remove neighborhood column
+		for td, d in zip(theta_dist, distance):
+			if neighborhood_kwargs['mode'] == 'two-pop':
+				neigh_col = f'neighborhood_2_contact_{d}_px'
+			elif neighborhood_kwargs['mode'] == 'self':
+				neigh_col = f'neighborhood_self_contact_{d}_px'
+			df_B = df_B.drop(columns=[neigh_col])
+		df_B.to_pickle(path_B.replace('.csv', '.pkl'))
 	unwanted = df_A.columns[df_A.columns.str.startswith('neighborhood_')]
 	df_A2 = df_A.drop(columns=unwanted)
 	df_A2.to_csv(path_A, index=False)
-	if not population[0]==population[1]:
+	if not population[0] == population[1]:
 		unwanted = df_B.columns[df_B.columns.str.startswith('neighborhood_')]
 		df_B_csv = df_B.drop(unwanted, axis=1, inplace=False)
-		df_B_csv.to_csv(path_B,index=False)
+		df_B_csv.to_csv(path_B, index=False)
 	if return_tables:
 		return df_A, df_B
@@ -1179,10 +1316,15 @@ if __name__ == "__main__":
 	print('None')
 	pos = "/home/torro/Documents/Experiments/NKratio_Exp/W5/500"
-	test,_ = compute_neighborhood_at_position(pos, [62], population=['targets','effectors'], theta_dist=None, img_shape=(2048,2048), return_tables=True, clear_neigh=True,
-	neighborhood_kwargs={'mode': 'two-pop','status': ['class', None],'not_status_option': [True, False],'include_dead_weight': True,"compute_cum_sum": False,"attention_weight": True, 'symmetrize': False})
-	#test = compute_neighborhood_metrics(test, 'neighborhood_self_circle_150_px', metrics=['inclusive','exclusive','intermediate'], decompose_by_status=True)
+	test, _ = compute_neighborhood_at_position(pos, [62], population=['targets', 'effectors'], theta_dist=None,
+											   img_shape=(2048, 2048), return_tables=True, clear_neigh=True,
+											   neighborhood_kwargs={'mode': 'two-pop', 'status': ['class', None],
+																	'not_status_option': [True, False],
+																	'include_dead_weight': True,
+																	"compute_cum_sum": False, "attention_weight": True,
+																	'symmetrize': False})
+	# test = compute_neighborhood_metrics(test, 'neighborhood_self_circle_150_px', metrics=['inclusive','exclusive','intermediate'], decompose_by_status=True)
 	print(test.columns)
 	#print(segment(None,'test'))

celldetective 1.1.1.post3__py3-none-any.whl → 1.2.0__py3-none-any.whl

celldetective 1.1.1.post3py3-none-any.whl → 1.2.0py3-none-any.whl