From 20c8ce2cf73582407a4d9c8902353df571669c90 Mon Sep 17 00:00:00 2001 From: benjijamorris <54606172+benjijamorris@users.noreply.github.com> Date: Wed, 9 Oct 2024 15:29:31 -0700 Subject: [PATCH] Admin/update precommit (#438) * update precommit * style changes with updated precommit * bandit skips * precommit * fix file checking * check if prior is str --------- Co-authored-by: Benjamin Morris --- .pre-commit-config.yaml | 35 +++++++++---------- configs/model/im2im/ijepa.yaml | 2 +- .../api/cyto_dl_model/cyto_dl_base_model.py | 6 ++-- cyto_dl/callbacks/outlier_detection.py | 6 ++-- cyto_dl/dataframe/readers.py | 2 +- .../dataframe/dataframe_datamodule.py | 2 +- .../dataframe/grouped_dataframe_datamodule.py | 2 +- cyto_dl/datamodules/smartcache.py | 19 ++++++---- cyto_dl/image/io/aicsimage_loader.py | 6 ++-- cyto_dl/image/io/monai_bio_reader.py | 5 +-- cyto_dl/image/io/skimage_reader.py | 2 +- .../image/transforms/multiscale_cropper.py | 2 +- cyto_dl/loggers/mlflow.py | 19 +++++----- cyto_dl/models/base_model.py | 2 +- cyto_dl/models/basic_model.py | 4 +-- .../timepoint_classification.py | 2 +- cyto_dl/models/handlers/base_handler.py | 6 ++-- cyto_dl/models/im2im/gan.py | 4 +-- cyto_dl/models/im2im/multi_task.py | 10 +++--- cyto_dl/models/im2im/utils/instance_seg.py | 15 ++++---- cyto_dl/models/vae/base_vae.py | 3 +- cyto_dl/models/vae/image_canon_vae.py | 2 +- cyto_dl/models/vae/image_encoder.py | 3 +- cyto_dl/models/vae/image_vae.py | 2 +- cyto_dl/models/vae/priors/gaussian.py | 9 ++--- .../discriminators/n_layer_discriminator.py | 2 +- cyto_dl/nn/head/base_head.py | 24 +++++++------ cyto_dl/nn/head/gan_head.py | 22 ++++++------ cyto_dl/nn/head/mae_head.py | 22 ++++++------ cyto_dl/nn/head/mask_head.py | 22 ++++++------ cyto_dl/nn/losses/gan_loss.py | 3 +- cyto_dl/nn/losses/gaussian_nll_loss.py | 14 +++++--- cyto_dl/nn/mlp.py | 2 +- cyto_dl/nn/point_cloud/dgcnn.py | 10 +++--- cyto_dl/nn/point_cloud/folding_net.py | 6 ++-- cyto_dl/nn/point_cloud/graph_functions.py | 4 +-- cyto_dl/nn/spatial_transformer.py | 3 +- cyto_dl/nn/vits/blocks/cross_attention.py | 19 +++++----- cyto_dl/nn/vits/seg.py | 10 +++--- cyto_dl/utils/checkpoint.py | 4 ++- cyto_dl/utils/rich_utils.py | 12 ++++--- cyto_dl/utils/spharm/rotation.py | 2 +- scripts/publish_bumpver_handler.py | 1 - 43 files changed, 184 insertions(+), 168 deletions(-) diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml index 06880e5f0..0d39192bd 100644 --- a/.pre-commit-config.yaml +++ b/.pre-commit-config.yaml @@ -9,7 +9,7 @@ ci: repos: - repo: https://github.com/pre-commit/pre-commit-hooks - rev: v4.3.0 + rev: v5.0.0 hooks: # list of supported hooks: https://pre-commit.com/hooks.html - id: trailing-whitespace @@ -26,35 +26,35 @@ repos: # python code formatting - repo: https://github.com/psf/black - rev: 22.6.0 + rev: 24.10.0 hooks: - id: black args: [--line-length, "99"] # python import sorting - repo: https://github.com/PyCQA/isort - rev: 5.12.0 + rev: 5.13.2 hooks: - id: isort args: ["--profile", "black", "--filter-files"] # python upgrading syntax to newer version - repo: https://github.com/asottile/pyupgrade - rev: v2.32.1 + rev: v3.17.0 hooks: - id: pyupgrade args: [--py38-plus] # python docstring formatting - repo: https://github.com/myint/docformatter - rev: v1.4 + rev: v1.7.5 hooks: - id: docformatter args: [--in-place, --wrap-summaries=99, --wrap-descriptions=99] # python check (PEP8), programming errors and code complexity - repo: https://github.com/PyCQA/flake8 - rev: 4.0.1 + rev: 7.1.1 hooks: - id: flake8 args: @@ -67,14 +67,14 @@ repos: # python security linter - repo: https://github.com/PyCQA/bandit - rev: "1.7.1" + rev: "1.7.10" hooks: - id: bandit args: ["-s", "B101"] # yaml formatting - repo: https://github.com/pre-commit/mirrors-prettier - rev: v2.7.1 + rev: v4.0.0-alpha.8 hooks: - id: prettier types: [yaml] @@ -82,13 +82,13 @@ repos: # shell scripts linter - repo: https://github.com/shellcheck-py/shellcheck-py - rev: v0.8.0.4 + rev: v0.10.0.1 hooks: - id: shellcheck # md formatting - repo: https://github.com/executablebooks/mdformat - rev: 0.7.14 + rev: 0.7.17 hooks: - id: mdformat args: ["--number"] @@ -96,12 +96,10 @@ repos: - mdformat-gfm - mdformat-tables - mdformat_frontmatter - # - mdformat-toc - # - mdformat-black # word spelling linter - repo: https://github.com/codespell-project/codespell - rev: v2.1.0 + rev: v2.3.0 hooks: - id: codespell args: @@ -110,13 +108,13 @@ repos: # jupyter notebook cell output clearing - repo: https://github.com/kynan/nbstripout - rev: 0.5.0 + rev: 0.7.1 hooks: - id: nbstripout # jupyter notebook linting - repo: https://github.com/nbQA-dev/nbQA - rev: 1.4.0 + rev: 1.8.7 hooks: - id: nbqa-black args: ["--line-length=99"] @@ -130,17 +128,18 @@ repos: ] - repo: https://github.com/dosisod/refurb - rev: v1.3.0 + rev: v2.0.0 hooks: - id: refurb language_version: python3.10 args: - --ignore - FURB120 + - --ignore + - FURB123 - repo: https://github.com/asottile/blacken-docs - rev: v1.12.1 + rev: 1.19.0 hooks: - id: blacken-docs args: [--line-length=120] - additional_dependencies: [black==21.12b0] diff --git a/configs/model/im2im/ijepa.yaml b/configs/model/im2im/ijepa.yaml index 40ea24201..0ae285162 100644 --- a/configs/model/im2im/ijepa.yaml +++ b/configs/model/im2im/ijepa.yaml @@ -6,7 +6,7 @@ save_dir: ${paths.output_dir} encoder: _target_: cyto_dl.nn.vits.encoder.JEPAEncoder - patch_size: 2 # patch_size * num_patches should equl data._aux.patch_shape + patch_size: 2 # patch_size * num_patches should equal data._aux.patch_shape num_patches: ${model._aux.num_patches} emb_dim: 16 num_layer: 2 diff --git a/cyto_dl/api/cyto_dl_model/cyto_dl_base_model.py b/cyto_dl/api/cyto_dl_model/cyto_dl_base_model.py index a06c4a740..31cb8347c 100644 --- a/cyto_dl/api/cyto_dl_model/cyto_dl_base_model.py +++ b/cyto_dl/api/cyto_dl_model/cyto_dl_base_model.py @@ -36,9 +36,9 @@ def _get_experiment_type(cls) -> ExperimentType: def from_existing_config(cls, config_filepath: Path): """Returns a model from an existing config. - :param config_filepath: path to a .yaml config file that will be used as the basis - for this CytoDLBaseModel (must be generated by the CytoDLBaseModel subclass that wants - to use it). + :param config_filepath: path to a .yaml config file that will be used as the basis for this + CytoDLBaseModel (must be generated by the CytoDLBaseModel subclass that wants to use + it). """ return cls(OmegaConf.load(config_filepath)) diff --git a/cyto_dl/callbacks/outlier_detection.py b/cyto_dl/callbacks/outlier_detection.py index 9e66694f2..d80f05982 100644 --- a/cyto_dl/callbacks/outlier_detection.py +++ b/cyto_dl/callbacks/outlier_detection.py @@ -64,7 +64,7 @@ def fn(_, __, output): return fn def _update_covariance(self, output, layer_name): - """record spatial mean and cov of channel activations per image in batch.""" + """Record spatial mean and cov of channel activations per image in batch.""" output = self.flatten_activations(output) if self.mu[layer_name] is None: self.mu[layer_name] = np.zeros(output.shape[1]) @@ -76,7 +76,7 @@ def _update_covariance(self, output, layer_name): self.n += 1 def on_train_epoch_start(self, trainer, pl_module): - """set forward hook.""" + """Set forward hook.""" if trainer.current_epoch == trainer.max_epochs - self.n_epochs: named_modules = dict([*pl_module.backbone.named_modules()]) for layer_name in self.layer_names: @@ -101,7 +101,7 @@ def _calculate_mahalanobis(self, output, layer_name): self.activations[layer_name].append(out) def _inference_start(self, pl_module): - """add mahalanobis calculation hook and calculate inverse covariance matrix.""" + """Add mahalanobis calculation hook and calculate inverse covariance matrix.""" if self._run: named_modules = dict([*pl_module.backbone.named_modules()]) for layer_name in self.layer_names: diff --git a/cyto_dl/dataframe/readers.py b/cyto_dl/dataframe/readers.py index 03305178a..9f1b54ce5 100644 --- a/cyto_dl/dataframe/readers.py +++ b/cyto_dl/dataframe/readers.py @@ -149,7 +149,7 @@ def read_dataframe( include_columns = sorted(list(include_columns)) required_columns = sorted(list(required_columns)) - if len(include_columns) == 0: + if not include_columns: include_columns = None if isinstance(dataframe, str): diff --git a/cyto_dl/datamodules/dataframe/dataframe_datamodule.py b/cyto_dl/datamodules/dataframe/dataframe_datamodule.py index 384aba2db..9c2fcfe14 100644 --- a/cyto_dl/datamodules/dataframe/dataframe_datamodule.py +++ b/cyto_dl/datamodules/dataframe/dataframe_datamodule.py @@ -163,7 +163,7 @@ def get_dataset(self, split): return self.datasets[split][sample] def make_dataloader(self, split): - kwargs = dict(**self.dataloader_kwargs) + kwargs = {**self.dataloader_kwargs} kwargs["shuffle"] = kwargs.get("shuffle", True) and split == "train" kwargs["batch_size"] = self.batch_size diff --git a/cyto_dl/datamodules/dataframe/grouped_dataframe_datamodule.py b/cyto_dl/datamodules/dataframe/grouped_dataframe_datamodule.py index 288abb0c8..37a2aa0de 100644 --- a/cyto_dl/datamodules/dataframe/grouped_dataframe_datamodule.py +++ b/cyto_dl/datamodules/dataframe/grouped_dataframe_datamodule.py @@ -116,7 +116,7 @@ def __init__( self.target_columns = target_columns def make_dataloader(self, split): - kwargs = dict(**self.dataloader_kwargs) + kwargs = {**self.dataloader_kwargs} kwargs["shuffle"] = kwargs.get("shuffle", True) and split == "train" subset = self.get_dataset(split) diff --git a/cyto_dl/datamodules/smartcache.py b/cyto_dl/datamodules/smartcache.py index db9ddad80..f1787a0c1 100644 --- a/cyto_dl/datamodules/smartcache.py +++ b/cyto_dl/datamodules/smartcache.py @@ -1,3 +1,4 @@ +from itertools import chain from pathlib import Path from typing import Optional, Union @@ -118,14 +119,18 @@ def _get_file_args(self, row): for timepoint in timepoints: img_data.append( { - "dimension_order_out": "ZYX"[-self.spatial_dims :] - if not use_neighbors - else "T" + "ZYX"[-self.spatial_dims :], + "dimension_order_out": ( + "ZYX"[-self.spatial_dims :] + if not use_neighbors + else "T" + "ZYX"[-self.spatial_dims :] + ), "C": row[self.channel_column], "scene": scene, - "T": timepoint - if not use_neighbors - else [timepoint + i for i in range(self.num_neighbors + 1)], + "T": ( + timepoint + if not use_neighbors + else [timepoint + i for i in range(self.num_neighbors + 1)] + ), "original_path": row[self.img_path_column], } ) @@ -136,7 +141,7 @@ def get_per_file_args(self, df): timepoints/channels/scenes for each file in the dataframe.""" with ProgressBar(): img_data = dask.compute(*[self._get_file_args(row) for row in df.itertuples()]) - img_data = [item for sublist in img_data for item in sublist] + img_data = list(chain.from_iterable(img_data)) return img_data def prepare_data(self): diff --git a/cyto_dl/image/io/aicsimage_loader.py b/cyto_dl/image/io/aicsimage_loader.py index 0ca9b6ea8..4c7b5a220 100644 --- a/cyto_dl/image/io/aicsimage_loader.py +++ b/cyto_dl/image/io/aicsimage_loader.py @@ -9,9 +9,9 @@ class AICSImageLoaderd(Transform): """Enumerates scenes and timepoints for dictionary with format. - {path_key: path, channel_key: channel, scene_key: scene, timepoint_key: timepoint}. - Differs from monai_bio_reader in that reading kwargs are passed in the dictionary, instead of - fixed at initialization. + {path_key: path, channel_key: channel, scene_key: scene, timepoint_key: timepoint}. Differs + from monai_bio_reader in that reading kwargs are passed in the dictionary, instead of fixed at + initialization. """ def __init__( diff --git a/cyto_dl/image/io/monai_bio_reader.py b/cyto_dl/image/io/monai_bio_reader.py index 89e7e0726..88d11c318 100644 --- a/cyto_dl/image/io/monai_bio_reader.py +++ b/cyto_dl/image/io/monai_bio_reader.py @@ -30,10 +30,7 @@ def __init__(self, dask_load: bool = True, **reader_kwargs): def read(self, data: Union[Sequence[PathLike], PathLike]): filenames: Sequence[PathLike] = ensure_tuple(data) - img_ = [] - for name in filenames: - img_.append(BioImage(f"{name}")) - + img_ = [BioImage(name) for name in filenames] return img_ if len(filenames) > 1 else img_[0] def get_data(self, img) -> Tuple[np.ndarray, Dict]: diff --git a/cyto_dl/image/io/skimage_reader.py b/cyto_dl/image/io/skimage_reader.py index 5844a0e46..c2a6ee6a4 100644 --- a/cyto_dl/image/io/skimage_reader.py +++ b/cyto_dl/image/io/skimage_reader.py @@ -25,7 +25,7 @@ def read(self, data: Union[Sequence[PathLike], PathLike]): filenames: Sequence[PathLike] = ensure_tuple(data) img_ = [] for name in filenames: - this_im = imread(f"{name}") + this_im = imread(name) if self.channels: this_im = this_im[self.channels] diff --git a/cyto_dl/image/transforms/multiscale_cropper.py b/cyto_dl/image/transforms/multiscale_cropper.py index 5cd999fa6..1f05b38b9 100644 --- a/cyto_dl/image/transforms/multiscale_cropper.py +++ b/cyto_dl/image/transforms/multiscale_cropper.py @@ -92,7 +92,7 @@ def _apply_slice(data, slicee): @staticmethod def _generate_slice(start_coords: Sequence[int], roi_size: Sequence[int]) -> slice: """Creates slice starting at `start_coords` of size `roi_size`""" - return [slice(None, None)] + [ + return [slice(None, None)] + [ # noqa: FURB140 slice(start, end) for start, end in zip(start_coords, start_coords + roi_size) ] diff --git a/cyto_dl/loggers/mlflow.py b/cyto_dl/loggers/mlflow.py index e23f6a2a8..9b2fd2df3 100644 --- a/cyto_dl/loggers/mlflow.py +++ b/cyto_dl/loggers/mlflow.py @@ -55,7 +55,7 @@ def log_hyperparams(self, params: Union[Dict[str, Any], Namespace], mode="train" with tempfile.TemporaryDirectory() as tmp_dir: conf_path = Path(tmp_dir) / f"{mode}.yaml" - with open(conf_path, "w") as f: + with conf_path.open("w") as f: config = OmegaConf.create(params) OmegaConf.save(config=config, f=f) @@ -133,7 +133,7 @@ def _after_save_checkpoint(self, ckpt_callback: ModelCheckpoint) -> None: self.run_id, local_path=best_path, artifact_path=artifact_path ) - os.unlink(best_path) + best_path.unlink() else: filepath = ckpt_callback.best_model_path @@ -149,7 +149,7 @@ def _after_save_checkpoint(self, ckpt_callback: ModelCheckpoint) -> None: self.run_id, local_path=last_path, artifact_path=artifact_path ) - os.unlink(last_path) + last_path.unlink() else: self.experiment.log_artifact( self.run_id, local_path=filepath, artifact_path=artifact_path @@ -157,9 +157,12 @@ def _after_save_checkpoint(self, ckpt_callback: ModelCheckpoint) -> None: def _delete_local_artifact(repo, artifact_path): - artifact_path = local_file_uri_to_path( - os.path.join(repo._artifact_dir, artifact_path) if artifact_path else repo._artifact_dir + artifact_path = Path( + local_file_uri_to_path( + os.path.join(repo._artifact_dir, artifact_path) + if artifact_path + else repo._artifact_dir + ) ) - - if os.path.isfile(artifact_path): - os.remove(artifact_path) + if artifact_path.is_file(): + artifact_path.unlink() diff --git a/cyto_dl/models/base_model.py b/cyto_dl/models/base_model.py index 3dedcba35..8ef795252 100644 --- a/cyto_dl/models/base_model.py +++ b/cyto_dl/models/base_model.py @@ -23,7 +23,7 @@ def _is_primitive(value): - if isinstance(value, (type(None), bool, str, int, float)): + if value is None or isinstance(value, (bool, str, int, float)): return True if isinstance(value, (tuple, list)): diff --git a/cyto_dl/models/basic_model.py b/cyto_dl/models/basic_model.py index 14560b34c..52a3834eb 100644 --- a/cyto_dl/models/basic_model.py +++ b/cyto_dl/models/basic_model.py @@ -59,11 +59,11 @@ def __init__( super().__init__(metrics=metrics) - if network is None and pretrained_weights is None: + if network is pretrained_weights is None: raise ValueError("`network` and `pretrained_weights` can't both be None.") if pretrained_weights is not None: - pretrained_weights = torch.load(pretrained_weights) + pretrained_weights = torch.load(pretrained_weights) # nosec B614 if network is not None: self.network = network diff --git a/cyto_dl/models/classification/timepoint_classification.py b/cyto_dl/models/classification/timepoint_classification.py index dbd70c553..e20bc0e8d 100644 --- a/cyto_dl/models/classification/timepoint_classification.py +++ b/cyto_dl/models/classification/timepoint_classification.py @@ -50,7 +50,7 @@ def predict_step(self, batch, batch_idx): batch, "predict", logits, - name=f"{batch['track_id'].cpu().item()}", + name=str(batch["track_id"].cpu().item()), ) timepoints = np.array(batch["timepoints"][0][1:-1].split(",")).astype(int) diff --git a/cyto_dl/models/handlers/base_handler.py b/cyto_dl/models/handlers/base_handler.py index bdbff8226..90759927f 100644 --- a/cyto_dl/models/handlers/base_handler.py +++ b/cyto_dl/models/handlers/base_handler.py @@ -76,12 +76,12 @@ def postprocess(self, data): mode = self.config["return"].get("mode", "network") if mode == "path": - path = self.config["return"].get("path", "/tmp") # nosec: B108 + path = self.config["return"].get("path", "/tmp") # nosec B108 response_path = Path(path) / f"{uuid.uuid4()}.pt" - torch.save(data, response_path) + torch.save(data, response_path) # nosec B614 return [str(response_path)] buf = io.BytesIO() - torch.save(data, buf) + torch.save(data, buf) # nosec B614 buf.seek(0) return [buf.read()] diff --git a/cyto_dl/models/im2im/gan.py b/cyto_dl/models/im2im/gan.py index 30d8a704a..00fceeda2 100644 --- a/cyto_dl/models/im2im/gan.py +++ b/cyto_dl/models/im2im/gan.py @@ -95,7 +95,7 @@ def configure_optimizers(self): return (opts, scheds) def _train_forward(self, batch, stage, save_image, run_heads): - """during training we are only dealing with patches,so we can calculate per-patch loss, + """During training we are only dealing with patches,so we can calculate per-patch loss, metrics, postprocessing etc.""" z = self.backbone(batch[self.hparams.x_key]) return { @@ -106,7 +106,7 @@ def _train_forward(self, batch, stage, save_image, run_heads): } def _inference_forward(self, batch, stage, save_image, run_heads): - """during inference, we need to calculate per-fov loss/metrics/postprocessing. + """During inference, we need to calculate per-fov loss/metrics/postprocessing. To avoid storing and passing to each head the intermediate results of the backbone, we need to run backbone + taskheads patch by patch, then do saving/postprocessing/etc on the entire diff --git a/cyto_dl/models/im2im/multi_task.py b/cyto_dl/models/im2im/multi_task.py index 9ac05c05b..d8b8f0d13 100644 --- a/cyto_dl/models/im2im/multi_task.py +++ b/cyto_dl/models/im2im/multi_task.py @@ -111,7 +111,7 @@ def configure_optimizers(self): return (opts, scheds) def _train_forward(self, batch, stage, n_postprocess, run_heads): - """during training we are only dealing with patches,so we can calculate per-patch loss, + """During training we are only dealing with patches,so we can calculate per-patch loss, metrics, postprocessing etc.""" z = self.backbone(batch[self.hparams.x_key]) return { @@ -124,7 +124,7 @@ def forward(self, x, run_heads): return {task: self.task_heads[task](z) for task in run_heads} def _inference_forward(self, batch, stage, n_postprocess, run_heads): - """during inference, we need to calculate per-fov loss/metrics/postprocessing. + """During inference, we need to calculate per-fov loss/metrics/postprocessing. To avoid storing and passing to each head the intermediate results of the backbone, we need to run backbone + taskheads patch by patch, then do saving/postprocessing/etc on the entire @@ -173,7 +173,7 @@ def _sum_losses(self, losses): return losses def _get_unrun_heads(self, io_map): - """returns heads that don't have outputs yet.""" + """Returns heads that don't have outputs yet.""" updated_run_heads = [] # check that all output files exist for each head for head, head_io_map in io_map.items(): @@ -184,7 +184,7 @@ def _get_unrun_heads(self, io_map): return updated_run_heads def _combine_io_maps(self, io_maps): - """aggregate io_maps from per-head to per-input image.""" + """Aggregate io_maps from per-head to per-input image.""" io_map = {} # create input-> per head output mapping for head, head_io_map in io_maps.items(): @@ -218,7 +218,7 @@ def _get_run_heads(self, batch, stage, batch_idx): return run_heads, io_map def _to_tensor(self, batch): - """convert monai metatensors to tensors.""" + """Convert monai metatensors to tensors.""" for k, v in batch.items(): if isinstance(v, MetaTensor): batch[k] = v.as_tensor() diff --git a/cyto_dl/models/im2im/utils/instance_seg.py b/cyto_dl/models/im2im/utils/instance_seg.py index 9223321ff..78a9fd971 100644 --- a/cyto_dl/models/im2im/utils/instance_seg.py +++ b/cyto_dl/models/im2im/utils/instance_seg.py @@ -90,10 +90,7 @@ def skeleton_tall(self, img, max_label): return tall_skeleton def label_2d(self, img): - """ - dim = 2: return labeled image - dim = 3: label each z slice separately - """ + """Dim = 2: return labeled image dim = 3: label each z slice separately.""" if self.dim == 2: out, _ = label(img) return out @@ -185,9 +182,9 @@ def embed_from_skel(self, skel: np.ndarray, iseg: np.ndarray): if len(object_points) == 2: crop_embedding[:, object_points[0], object_points[1]] = point_embeddings elif len(object_points) == 3: - crop_embedding[ - :, object_points[0], object_points[1], object_points[2] - ] = point_embeddings + crop_embedding[:, object_points[0], object_points[1], object_points[2]] = ( + point_embeddings + ) crop_embedding = torch.from_numpy(self.smooth_embedding(crop_embedding)) @@ -432,7 +429,7 @@ def _get_point_embeddings(self, object_points, skeleton_points): return dist, tree.data[idx].T.astype(int) def kd_clustering(self, embeddings, skel): - """assign embedded points to closest skeleton.""" + """Assign embedded points to closest skeleton.""" skel = find_boundaries(skel, mode="inner") * skel # propagate labels to boundaries skel_points = np.stack(skel.nonzero()).T embed_points = np.stack(embeddings).T @@ -446,7 +443,7 @@ def kd_clustering(self, embeddings, skel): return embedding_labels def remove_small_skeletons(self, skel): - """remove small skeletons below self.min_size that are not touching the edge of the + """Remove small skeletons below self.min_size that are not touching the edge of the image.""" skel_removed = skel.copy() regions = find_objects(skel) diff --git a/cyto_dl/models/vae/base_vae.py b/cyto_dl/models/vae/base_vae.py index d2eda552c..b167464b9 100644 --- a/cyto_dl/models/vae/base_vae.py +++ b/cyto_dl/models/vae/base_vae.py @@ -30,6 +30,7 @@ def __init__( **base_kwargs, ): """Instantiate a basic VAE model. + Parameters ---------- encoder: nn.Module @@ -107,7 +108,7 @@ def __init__( super().__init__(metrics=metrics, **base_kwargs) for key in prior.keys(): - if isinstance(prior[key], (str, type(None))): + if prior[key] is None or isinstance(prior[key], str): if prior[key] == "gaussian": prior[key] = IsotropicGaussianPrior(dimensionality=latent_dim) else: diff --git a/cyto_dl/models/vae/image_canon_vae.py b/cyto_dl/models/vae/image_canon_vae.py index a67396788..2d1429354 100644 --- a/cyto_dl/models/vae/image_canon_vae.py +++ b/cyto_dl/models/vae/image_canon_vae.py @@ -124,7 +124,7 @@ def __init__( ) ) - if isinstance(prior, (str, type(None))): + if prior is None or isinstance(prior, str): if prior == "gaussian": encoder_out_size = 2 * latent_dim else: diff --git a/cyto_dl/models/vae/image_encoder.py b/cyto_dl/models/vae/image_encoder.py index 1374c43c7..c97fd85e4 100644 --- a/cyto_dl/models/vae/image_encoder.py +++ b/cyto_dl/models/vae/image_encoder.py @@ -143,8 +143,7 @@ def forward(self, x): y = self.net(x) pool_dims = (2, 3) if self.spatial_dims == 2 else (2, 3, 4) - y = y.tensor - y = y.mean(dim=pool_dims) + y = y.tensor.mean(dim=pool_dims) y_embedding = y[:, : self.out_dim] diff --git a/cyto_dl/models/vae/image_vae.py b/cyto_dl/models/vae/image_vae.py index 5d65d398f..a64e82e82 100644 --- a/cyto_dl/models/vae/image_vae.py +++ b/cyto_dl/models/vae/image_vae.py @@ -175,7 +175,7 @@ def __init__( _Scale(last_scale), ) - if isinstance(prior, (str, type(None))): + if prior is None or isinstance(prior, str): if prior == "gaussian": encoder_out_size = 2 * latent_dim else: diff --git a/cyto_dl/models/vae/priors/gaussian.py b/cyto_dl/models/vae/priors/gaussian.py index 01e1482c3..12b807736 100644 --- a/cyto_dl/models/vae/priors/gaussian.py +++ b/cyto_dl/models/vae/priors/gaussian.py @@ -51,8 +51,8 @@ def kl_divergence(cls, mean, logvar, tc_penalty_weight=None, reduction="sum"): @classmethod def sample(cls, mean, logvar): std = torch.exp(0.5 * logvar) - eps = torch.randn_like(std) - return eps.mul(std).add(mean) + eps = torch.randn_like(std).mul(std).add(mean) + return eps def forward(self, z, mode="kl", inference=False, **kwargs): mean_logvar = z @@ -130,8 +130,9 @@ def param_size(self): @classmethod def kl_divergence(cls, mu1, mu2, logvar1, logvar2, tc_penalty_weight=None, reduction="sum"): - """Computes the Kullback-Leibler divergence between two diagonal - gaussians (not necessarily isotropic). It also works batch-wise. + """Computes the Kullback-Leibler divergence between two diagonal gaussians (not necessarily + isotropic). It also works batch-wise. + Parameters ---------- mu1: torch.Tensor diff --git a/cyto_dl/nn/discriminators/n_layer_discriminator.py b/cyto_dl/nn/discriminators/n_layer_discriminator.py index 0cb021fac..bf8ed8ea2 100644 --- a/cyto_dl/nn/discriminators/n_layer_discriminator.py +++ b/cyto_dl/nn/discriminators/n_layer_discriminator.py @@ -33,7 +33,7 @@ def __init__( super().__init__() if dim not in (2, 3): raise ValueError(f"dim must be 2 or 3, got {dim}") - if type(norm_layer) == functools.partial: + if isinstance(norm_layer, functools.partial): use_bias = norm_layer.func != nn.BatchNorm3d else: use_bias = norm_layer != nn.BatchNorm3d diff --git a/cyto_dl/nn/head/base_head.py b/cyto_dl/nn/head/base_head.py index 8737f8fed..cc8621e6b 100644 --- a/cyto_dl/nn/head/base_head.py +++ b/cyto_dl/nn/head/base_head.py @@ -39,7 +39,7 @@ def _postprocess(self, img, img_type, n_postprocess=1): return [self.postprocess[img_type](img[i]) for i in range(n_postprocess)] def generate_io_map(self, input_filenames): - """generates map between input files and output files for a head. + """Generates map between input files and output files for a head. Only used for prediction """ @@ -80,14 +80,16 @@ def run_head( return { "loss": loss, "pred": self._postprocess(y_hat, img_type="prediction", n_postprocess=n_postprocess), - "target": self._postprocess( - batch[self.head_name], img_type="input", n_postprocess=n_postprocess - ) - if stage != "predict" - else None, - "input": self._postprocess( - batch[self.x_key], img_type="input", n_postprocess=n_postprocess - ) - if stage != "predict" - else None, + "target": ( + self._postprocess( + batch[self.head_name], img_type="input", n_postprocess=n_postprocess + ) + if stage != "predict" + else None + ), + "input": ( + self._postprocess(batch[self.x_key], img_type="input", n_postprocess=n_postprocess) + if stage != "predict" + else None + ), } diff --git a/cyto_dl/nn/head/gan_head.py b/cyto_dl/nn/head/gan_head.py index 9072bb9bb..164db32ed 100644 --- a/cyto_dl/nn/head/gan_head.py +++ b/cyto_dl/nn/head/gan_head.py @@ -81,14 +81,16 @@ def run_head( "loss_D": loss_D, "loss_G": loss_G, "pred": self._postprocess(y_hat, img_type="prediction", n_postprocess=n_postprocess), - "target": self._postprocess( - batch[self.head_name], img_type="input", n_postprocess=n_postprocess - ) - if stage != "predict" - else None, - "input": self._postprocess( - batch[self.x_key], img_type="input", n_postprocess=n_postprocess - ) - if stage != "predict" - else None, + "target": ( + self._postprocess( + batch[self.head_name], img_type="input", n_postprocess=n_postprocess + ) + if stage != "predict" + else None + ), + "input": ( + self._postprocess(batch[self.x_key], img_type="input", n_postprocess=n_postprocess) + if stage != "predict" + else None + ), } diff --git a/cyto_dl/nn/head/mae_head.py b/cyto_dl/nn/head/mae_head.py index a630855bf..693d10be5 100644 --- a/cyto_dl/nn/head/mae_head.py +++ b/cyto_dl/nn/head/mae_head.py @@ -27,14 +27,16 @@ def run_head( return { "loss": loss, "pred": self._postprocess(y_hat, img_type="prediction", n_postprocess=n_postprocess), - "target": self._postprocess( - batch[self.head_name], img_type="input", n_postprocess=n_postprocess - ) - if stage != "predict" - else None, - "input": self._postprocess( - batch[self.x_key], img_type="input", n_postprocess=n_postprocess - ) - if stage != "predict" - else None, + "target": ( + self._postprocess( + batch[self.head_name], img_type="input", n_postprocess=n_postprocess + ) + if stage != "predict" + else None + ), + "input": ( + self._postprocess(batch[self.x_key], img_type="input", n_postprocess=n_postprocess) + if stage != "predict" + else None + ), } diff --git a/cyto_dl/nn/head/mask_head.py b/cyto_dl/nn/head/mask_head.py index a255ec2d0..fa3de7117 100644 --- a/cyto_dl/nn/head/mask_head.py +++ b/cyto_dl/nn/head/mask_head.py @@ -56,14 +56,16 @@ def run_head( return { "loss": loss, "pred": self._postprocess(y_hat, img_type="prediction", n_postprocess=n_postprocess), - "target": self._postprocess( - batch[self.head_name], img_type="input", n_postprocess=n_postprocess - ) - if stage != "predict" - else None, - "input": self._postprocess( - batch[self.x_key], img_type="input", n_postprocess=n_postprocess - ) - if stage != "predict" - else None, + "target": ( + self._postprocess( + batch[self.head_name], img_type="input", n_postprocess=n_postprocess + ) + if stage != "predict" + else None + ), + "input": ( + self._postprocess(batch[self.x_key], img_type="input", n_postprocess=n_postprocess) + if stage != "predict" + else None + ), } diff --git a/cyto_dl/nn/losses/gan_loss.py b/cyto_dl/nn/losses/gan_loss.py index f21657418..bb703da90 100644 --- a/cyto_dl/nn/losses/gan_loss.py +++ b/cyto_dl/nn/losses/gan_loss.py @@ -55,7 +55,8 @@ def get_target_tensor(self, prediction: torch.Tensor, target_is_real: bool): A label tensor filled with ground truth label, and with the size of input """ target_tensor = self.real_label if target_is_real else self.fake_label - return target_tensor.expand_as(prediction) + target_tensor = target_tensor.expand_as(prediction) # noqa: FURB184 + return target_tensor def __call__(self, prediction: torch.Tensor, target_is_real: bool): """Calculate loss given Discriminator's output and grount truth labels. diff --git a/cyto_dl/nn/losses/gaussian_nll_loss.py b/cyto_dl/nn/losses/gaussian_nll_loss.py index a15ca62c8..7f78371b8 100644 --- a/cyto_dl/nn/losses/gaussian_nll_loss.py +++ b/cyto_dl/nn/losses/gaussian_nll_loss.py @@ -21,9 +21,13 @@ def forward(self, input: Tensor, target: Tensor) -> Tensor: log_sigma = (sigma + self.eps).log().detach() loss = ( - 0.5 * torch.pow((target - input) / log_sigma.exp(), 2) - + log_sigma - + 0.5 * np.log(2 * np.pi) - ).reshape(input.shape[0], -1) + ( + 0.5 * torch.pow((target - input) / log_sigma.exp(), 2) + + log_sigma + + 0.5 * np.log(2 * np.pi) + ) + .reshape(input.shape[0], -1) + .sum(dim=1, keepdim=True) + ) - return loss.sum(dim=1, keepdim=True) + return loss diff --git a/cyto_dl/nn/mlp.py b/cyto_dl/nn/mlp.py index 0cbc221fb..96703ebe5 100644 --- a/cyto_dl/nn/mlp.py +++ b/cyto_dl/nn/mlp.py @@ -30,7 +30,7 @@ def __init__( net = [_make_block(sum(self.input_dims), hidden_layers[0])] - net += [ + net += [ # noqa: FURB140 _make_block(input_dim, output_dim) for (input_dim, output_dim) in zip(hidden_layers[0:], hidden_layers[1:]) ] diff --git a/cyto_dl/nn/point_cloud/dgcnn.py b/cyto_dl/nn/point_cloud/dgcnn.py index ce801d8bc..e34ad17e1 100644 --- a/cyto_dl/nn/point_cloud/dgcnn.py +++ b/cyto_dl/nn/point_cloud/dgcnn.py @@ -254,8 +254,9 @@ def _generate_plane_features(self, points, cond, plane="xz"): # scatter plane features from points fea_plane = cond.new_zeros(*view_dims1) cond = cond.permute(*permute_dims1) # B x 512 x T - fea_plane = scatter_mean(cond, index, out=fea_plane) # B x 512 x reso^2 - fea_plane = fea_plane.reshape(*view_dims2) # sparce matrix (B x 512 x reso x reso) + fea_plane = scatter_mean(cond, index, out=fea_plane).reshape( + *view_dims2 + ) # sparse matrix (B x 512 x reso x reso) # process the plane features with UNet if self.unet is not None: @@ -269,10 +270,9 @@ def _generate_grid_features(self, p, c): # scatter grid features from points fea_grid = c.new_zeros(p.size(0), self.num_features, self.reso_grid**3) c = c.permute(0, 2, 1) - fea_grid = scatter_mean(c, index, out=fea_grid) # B x C x reso^3 - fea_grid = fea_grid.reshape( + fea_grid = scatter_mean(c, index, out=fea_grid).reshape( p.size(0), self.num_features, self.reso_grid, self.reso_grid, self.reso_grid - ) # sparce matrix (B x 512 x reso x reso) + ) # sparse matrix (B x 512 x reso x reso) if self.unet3d is not None: fea_grid = self.unet3d(fea_grid) diff --git a/cyto_dl/nn/point_cloud/folding_net.py b/cyto_dl/nn/point_cloud/folding_net.py index 574efa626..91012183c 100644 --- a/cyto_dl/nn/point_cloud/folding_net.py +++ b/cyto_dl/nn/point_cloud/folding_net.py @@ -71,10 +71,8 @@ def __init__( def forward(self, x): x = self.project(x) - grid = self.grid.unsqueeze(0).expand(x.shape[0], -1, -1) - grid = grid.type_as(x) - x = x.unsqueeze(1) - cw_exp = x.expand(-1, grid.shape[1], -1) + grid = self.grid.unsqueeze(0).expand(x.shape[0], -1, -1).type_as(x) + cw_exp = x.unsqueeze(1).expand(-1, grid.shape[1], -1) cat1 = torch.cat((cw_exp, grid), dim=2) folding_result1 = self.folding1(cat1) diff --git a/cyto_dl/nn/point_cloud/graph_functions.py b/cyto_dl/nn/point_cloud/graph_functions.py index 9b51fd717..c71048c17 100644 --- a/cyto_dl/nn/point_cloud/graph_functions.py +++ b/cyto_dl/nn/point_cloud/graph_functions.py @@ -24,9 +24,7 @@ def knn(x, k): if idx_base.device != idx.device: idx_base = idx_base.to(idx.device) - idx = idx + idx_base - idx = idx.view(-1) - + idx = (idx + idx_base).view(-1) return idx diff --git a/cyto_dl/nn/spatial_transformer.py b/cyto_dl/nn/spatial_transformer.py index 1fa9ab86c..556903513 100644 --- a/cyto_dl/nn/spatial_transformer.py +++ b/cyto_dl/nn/spatial_transformer.py @@ -56,8 +56,7 @@ def __init__(self, n_input_ch=2, patch_shape=(64, 256, 512), n_conv_filters=32): self.fc_loc[2].bias.data.copy_(torch.tensor([0, 0, 0], dtype=torch.float)) def forward(self, x): - xs = self.localization(x) - xs = xs.view(-1, self.output_shape) + xs = self.localization(x).view(-1, self.output_shape) offsets = self.fc_loc(xs).squeeze() # create identity transformation matrix with only shifts theta = torch.eye(3, 4).reshape(1, 3, 4).repeat(x.shape[0], 1, 1) diff --git a/cyto_dl/nn/vits/blocks/cross_attention.py b/cyto_dl/nn/vits/blocks/cross_attention.py index a9dc47d38..d583e6d75 100644 --- a/cyto_dl/nn/vits/blocks/cross_attention.py +++ b/cyto_dl/nn/vits/blocks/cross_attention.py @@ -49,7 +49,7 @@ def __init__( self.proj_drop = nn.Dropout(proj_drop) def forward(self, x, y): - """query from decoder (x), key and value from encoder (y)""" + """Query from decoder (x), key and value from encoder (y)""" B, N, C = x.shape Ny = y.shape[1] q = self.q(x).reshape(B, N, self.num_heads, C // self.num_heads).permute(0, 2, 1, 3) @@ -60,15 +60,18 @@ def forward(self, x, y): ) k, v = kv[0], kv[1] - attn = F.scaled_dot_product_attention( - q, - k, - v, - dropout_p=self.attn_drop, + attn = ( + F.scaled_dot_product_attention( + q, + k, + v, + dropout_p=self.attn_drop, + ) + .transpose(1, 2) + .reshape(B, N, C) ) - x = attn.transpose(1, 2).reshape(B, N, C) - x = self.proj(x) + x = self.proj(attn) x = self.proj_drop(x) return x diff --git a/cyto_dl/nn/vits/seg.py b/cyto_dl/nn/vits/seg.py index ca36e465d..3e10e91a1 100644 --- a/cyto_dl/nn/vits/seg.py +++ b/cyto_dl/nn/vits/seg.py @@ -11,10 +11,8 @@ class EncodedSkip(torch.nn.Module): def __init__(self, spatial_dims, num_patches, emb_dim, n_decoder_filters, layer): super().__init__() - """ - layer = 0 is the smallest resolution, n is the highest - as the layer increases, the image size increases and the number of filters decreases - """ + """Layer = 0 is the smallest resolution, n is the highest as the layer increases, the image + size increases and the number of filters decreases.""" upsample = 2**layer self.n_out_channels = n_decoder_filters // (upsample**spatial_dims) @@ -50,7 +48,7 @@ def forward(self, features): class SuperresDecoder(torch.nn.Module): - """create unet-like decoder where each decoder layer is a fed a skip connection consisting of a + """Create unet-like decoder where each decoder layer is a fed a skip connection consisting of a different weighted sum of intermediate layer features.""" def __init__( @@ -223,7 +221,7 @@ def __init__( **encoder_kwargs, ) if encoder_ckpt is not None: - model = torch.load(encoder_ckpt, map_location="cuda:0") + model = torch.load(encoder_ckpt, map_location="cuda:0") # nosec B614 enc_state_dict = { k.replace("backbone.encoder.", ""): v for k, v in model["state_dict"].items() diff --git a/cyto_dl/utils/checkpoint.py b/cyto_dl/utils/checkpoint.py index e6f98aaea..597251869 100644 --- a/cyto_dl/utils/checkpoint.py +++ b/cyto_dl/utils/checkpoint.py @@ -7,7 +7,9 @@ def load_checkpoint(model, load_params): "ckpt_path" ), "ckpt_path must be provided to with argument weights_only=True" # load model from state dict to get around trainer.max_epochs limit, useful for resuming model training from existing weights - state_dict = torch.load(load_params["ckpt_path"], map_location="cpu")["state_dict"] + state_dict = torch.load(load_params["ckpt_path"], map_location="cpu")[ + "state_dict" + ] # nosec B614 model.load_state_dict(state_dict, strict=load_params.get("strict", True)) # set ckpt_path to None to avoid loading checkpoint again with model.fit/model.test load_params["ckpt_path"] = None diff --git a/cyto_dl/utils/rich_utils.py b/cyto_dl/utils/rich_utils.py index 3fc5815d4..79e20ab92 100644 --- a/cyto_dl/utils/rich_utils.py +++ b/cyto_dl/utils/rich_utils.py @@ -45,8 +45,12 @@ def print_config_tree( # add fields from `print_order` to queue for field in print_order: - queue.append(field) if field in cfg else log.warning( - f"Field '{field}' not found in config. Skipping '{field}' config printing..." + ( + queue.append(field) + if field in cfg + else log.warning( + f"Field '{field}' not found in config. Skipping '{field}' config printing..." + ) ) # add all the other fields to queue (not specified in `print_order`) @@ -71,7 +75,7 @@ def print_config_tree( # save config tree to file if save_to_file: - with open(Path(cfg.paths.output_dir, "config_tree.log"), "w") as file: + with Path(cfg.paths.output_dir, "config_tree.log").open("w") as file: rich.print(tree, file=file) @@ -93,7 +97,7 @@ def enforce_tags(cfg: DictConfig, save_to_file: bool = False) -> None: log.info(f"Tags: {cfg.tags}") if save_to_file: - with open(Path(cfg.paths.output_dir, "tags.log"), "w") as file: + with Path(cfg.paths.output_dir, "tags.log").open("w") as file: rich.print(cfg.tags, file=file) diff --git a/cyto_dl/utils/spharm/rotation.py b/cyto_dl/utils/spharm/rotation.py index 06549ca73..991d415c7 100644 --- a/cyto_dl/utils/spharm/rotation.py +++ b/cyto_dl/utils/spharm/rotation.py @@ -96,7 +96,7 @@ def flip_spharm(input, paired_indices, flips=-1): def get_band_indices(columns, max_band, prefix="", flat=False): - """get the tensor indices for each band, based on the column order of the batch loader (given + """Get the tensor indices for each band, based on the column order of the batch loader (given by `columns`, assuming that it is in the same order). this is passed to `rotate_spharm` later, to rotate the spherical harmonics around the z axis diff --git a/scripts/publish_bumpver_handler.py b/scripts/publish_bumpver_handler.py index 0b2a51ada..7061eef0e 100644 --- a/scripts/publish_bumpver_handler.py +++ b/scripts/publish_bumpver_handler.py @@ -1,7 +1,6 @@ # this file is intended to be called by a github workflow (.github/workflows/publish_to_pypi.yaml) # it makes decisions based on the current version and the component specified for bumping, # which the workflow cannot do - """ TESTING: - add and commit any changes (keep track of this commit hash)