From 438cd4c536ae77950981a91b878c51cf6936a462 Mon Sep 17 00:00:00 2001 From: d33bs Date: Wed, 18 May 2022 15:34:51 -0600 Subject: [PATCH 1/2] non-copy/inplace renames for memory performance in merge_single_cells work towards #195 --- pycytominer/cyto_utils/cells.py | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/pycytominer/cyto_utils/cells.py b/pycytominer/cyto_utils/cells.py index debb209d..780749d7 100644 --- a/pycytominer/cyto_utils/cells.py +++ b/pycytominer/cyto_utils/cells.py @@ -713,8 +713,10 @@ def merge_single_cells( sc_df = ( self.image_df.merge(sc_df, on=self.merge_cols, how="right") - .rename(self.linking_col_rename, axis="columns") - .rename(self.full_merge_suffix_rename, axis="columns") + # pandas rename performance may be improved using copy=False, inplace=False + # reference: https://ryanlstevens.github.io/2022-05-06-pandasColumnRenaming/ + .rename(self.linking_col_rename, axis="columns", copy=False, inplace=False) + .rename(self.full_merge_suffix_rename, axis="columns", copy=False, inplace=False) ) if single_cell_normalize: # Infering features is tricky with non-canonical data From 4e53eed7effa6a623752694966372a79dfabbf0b Mon Sep 17 00:00:00 2001 From: d33bs Date: Fri, 20 May 2022 10:07:15 -0600 Subject: [PATCH 2/2] black formatting --- pycytominer/cyto_utils/cells.py | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/pycytominer/cyto_utils/cells.py b/pycytominer/cyto_utils/cells.py index 780749d7..7fd8a7e4 100644 --- a/pycytominer/cyto_utils/cells.py +++ b/pycytominer/cyto_utils/cells.py @@ -715,8 +715,11 @@ def merge_single_cells( self.image_df.merge(sc_df, on=self.merge_cols, how="right") # pandas rename performance may be improved using copy=False, inplace=False # reference: https://ryanlstevens.github.io/2022-05-06-pandasColumnRenaming/ - .rename(self.linking_col_rename, axis="columns", copy=False, inplace=False) - .rename(self.full_merge_suffix_rename, axis="columns", copy=False, inplace=False) + .rename( + self.linking_col_rename, axis="columns", copy=False, inplace=False + ).rename( + self.full_merge_suffix_rename, axis="columns", copy=False, inplace=False + ) ) if single_cell_normalize: # Infering features is tricky with non-canonical data