Skip to content

Commit

Permalink
Admin/update precommit (#438)
Browse files Browse the repository at this point in the history
* update precommit

* style changes with updated precommit

* bandit skips

* precommit

* fix file checking

* check if prior is str

---------

Co-authored-by: Benjamin Morris <[email protected]>
  • Loading branch information
benjijamorris and Benjamin Morris authored Oct 9, 2024
1 parent 5cafa7a commit 20c8ce2
Show file tree
Hide file tree
Showing 43 changed files with 184 additions and 168 deletions.
35 changes: 17 additions & 18 deletions .pre-commit-config.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,7 @@ ci:

repos:
- repo: https://github.com/pre-commit/pre-commit-hooks
rev: v4.3.0
rev: v5.0.0
hooks:
# list of supported hooks: https://pre-commit.com/hooks.html
- id: trailing-whitespace
Expand All @@ -26,35 +26,35 @@ repos:

# python code formatting
- repo: https://github.com/psf/black
rev: 22.6.0
rev: 24.10.0
hooks:
- id: black
args: [--line-length, "99"]

# python import sorting
- repo: https://github.com/PyCQA/isort
rev: 5.12.0
rev: 5.13.2
hooks:
- id: isort
args: ["--profile", "black", "--filter-files"]

# python upgrading syntax to newer version
- repo: https://github.com/asottile/pyupgrade
rev: v2.32.1
rev: v3.17.0
hooks:
- id: pyupgrade
args: [--py38-plus]

# python docstring formatting
- repo: https://github.com/myint/docformatter
rev: v1.4
rev: v1.7.5
hooks:
- id: docformatter
args: [--in-place, --wrap-summaries=99, --wrap-descriptions=99]

# python check (PEP8), programming errors and code complexity
- repo: https://github.com/PyCQA/flake8
rev: 4.0.1
rev: 7.1.1
hooks:
- id: flake8
args:
Expand All @@ -67,41 +67,39 @@ repos:

# python security linter
- repo: https://github.com/PyCQA/bandit
rev: "1.7.1"
rev: "1.7.10"
hooks:
- id: bandit
args: ["-s", "B101"]

# yaml formatting
- repo: https://github.com/pre-commit/mirrors-prettier
rev: v2.7.1
rev: v4.0.0-alpha.8
hooks:
- id: prettier
types: [yaml]
language_version: 17.9.0

# shell scripts linter
- repo: https://github.com/shellcheck-py/shellcheck-py
rev: v0.8.0.4
rev: v0.10.0.1
hooks:
- id: shellcheck

# md formatting
- repo: https://github.com/executablebooks/mdformat
rev: 0.7.14
rev: 0.7.17
hooks:
- id: mdformat
args: ["--number"]
additional_dependencies:
- mdformat-gfm
- mdformat-tables
- mdformat_frontmatter
# - mdformat-toc
# - mdformat-black

# word spelling linter
- repo: https://github.com/codespell-project/codespell
rev: v2.1.0
rev: v2.3.0
hooks:
- id: codespell
args:
Expand All @@ -110,13 +108,13 @@ repos:

# jupyter notebook cell output clearing
- repo: https://github.com/kynan/nbstripout
rev: 0.5.0
rev: 0.7.1
hooks:
- id: nbstripout

# jupyter notebook linting
- repo: https://github.com/nbQA-dev/nbQA
rev: 1.4.0
rev: 1.8.7
hooks:
- id: nbqa-black
args: ["--line-length=99"]
Expand All @@ -130,17 +128,18 @@ repos:
]

- repo: https://github.com/dosisod/refurb
rev: v1.3.0
rev: v2.0.0
hooks:
- id: refurb
language_version: python3.10
args:
- --ignore
- FURB120
- --ignore
- FURB123

- repo: https://github.com/asottile/blacken-docs
rev: v1.12.1
rev: 1.19.0
hooks:
- id: blacken-docs
args: [--line-length=120]
additional_dependencies: [black==21.12b0]
2 changes: 1 addition & 1 deletion configs/model/im2im/ijepa.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -6,7 +6,7 @@ save_dir: ${paths.output_dir}

encoder:
_target_: cyto_dl.nn.vits.encoder.JEPAEncoder
patch_size: 2 # patch_size * num_patches should equl data._aux.patch_shape
patch_size: 2 # patch_size * num_patches should equal data._aux.patch_shape
num_patches: ${model._aux.num_patches}
emb_dim: 16
num_layer: 2
Expand Down
6 changes: 3 additions & 3 deletions cyto_dl/api/cyto_dl_model/cyto_dl_base_model.py
Original file line number Diff line number Diff line change
Expand Up @@ -36,9 +36,9 @@ def _get_experiment_type(cls) -> ExperimentType:
def from_existing_config(cls, config_filepath: Path):
"""Returns a model from an existing config.
:param config_filepath: path to a .yaml config file that will be used as the basis
for this CytoDLBaseModel (must be generated by the CytoDLBaseModel subclass that wants
to use it).
:param config_filepath: path to a .yaml config file that will be used as the basis for this
CytoDLBaseModel (must be generated by the CytoDLBaseModel subclass that wants to use
it).
"""
return cls(OmegaConf.load(config_filepath))

Expand Down
6 changes: 3 additions & 3 deletions cyto_dl/callbacks/outlier_detection.py
Original file line number Diff line number Diff line change
Expand Up @@ -64,7 +64,7 @@ def fn(_, __, output):
return fn

def _update_covariance(self, output, layer_name):
"""record spatial mean and cov of channel activations per image in batch."""
"""Record spatial mean and cov of channel activations per image in batch."""
output = self.flatten_activations(output)
if self.mu[layer_name] is None:
self.mu[layer_name] = np.zeros(output.shape[1])
Expand All @@ -76,7 +76,7 @@ def _update_covariance(self, output, layer_name):
self.n += 1

def on_train_epoch_start(self, trainer, pl_module):
"""set forward hook."""
"""Set forward hook."""
if trainer.current_epoch == trainer.max_epochs - self.n_epochs:
named_modules = dict([*pl_module.backbone.named_modules()])
for layer_name in self.layer_names:
Expand All @@ -101,7 +101,7 @@ def _calculate_mahalanobis(self, output, layer_name):
self.activations[layer_name].append(out)

def _inference_start(self, pl_module):
"""add mahalanobis calculation hook and calculate inverse covariance matrix."""
"""Add mahalanobis calculation hook and calculate inverse covariance matrix."""
if self._run:
named_modules = dict([*pl_module.backbone.named_modules()])
for layer_name in self.layer_names:
Expand Down
2 changes: 1 addition & 1 deletion cyto_dl/dataframe/readers.py
Original file line number Diff line number Diff line change
Expand Up @@ -149,7 +149,7 @@ def read_dataframe(
include_columns = sorted(list(include_columns))
required_columns = sorted(list(required_columns))

if len(include_columns) == 0:
if not include_columns:
include_columns = None

if isinstance(dataframe, str):
Expand Down
2 changes: 1 addition & 1 deletion cyto_dl/datamodules/dataframe/dataframe_datamodule.py
Original file line number Diff line number Diff line change
Expand Up @@ -163,7 +163,7 @@ def get_dataset(self, split):
return self.datasets[split][sample]

def make_dataloader(self, split):
kwargs = dict(**self.dataloader_kwargs)
kwargs = {**self.dataloader_kwargs}
kwargs["shuffle"] = kwargs.get("shuffle", True) and split == "train"
kwargs["batch_size"] = self.batch_size

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -116,7 +116,7 @@ def __init__(
self.target_columns = target_columns

def make_dataloader(self, split):
kwargs = dict(**self.dataloader_kwargs)
kwargs = {**self.dataloader_kwargs}
kwargs["shuffle"] = kwargs.get("shuffle", True) and split == "train"
subset = self.get_dataset(split)

Expand Down
19 changes: 12 additions & 7 deletions cyto_dl/datamodules/smartcache.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,4 @@
from itertools import chain
from pathlib import Path
from typing import Optional, Union

Expand Down Expand Up @@ -118,14 +119,18 @@ def _get_file_args(self, row):
for timepoint in timepoints:
img_data.append(
{
"dimension_order_out": "ZYX"[-self.spatial_dims :]
if not use_neighbors
else "T" + "ZYX"[-self.spatial_dims :],
"dimension_order_out": (
"ZYX"[-self.spatial_dims :]
if not use_neighbors
else "T" + "ZYX"[-self.spatial_dims :]
),
"C": row[self.channel_column],
"scene": scene,
"T": timepoint
if not use_neighbors
else [timepoint + i for i in range(self.num_neighbors + 1)],
"T": (
timepoint
if not use_neighbors
else [timepoint + i for i in range(self.num_neighbors + 1)]
),
"original_path": row[self.img_path_column],
}
)
Expand All @@ -136,7 +141,7 @@ def get_per_file_args(self, df):
timepoints/channels/scenes for each file in the dataframe."""
with ProgressBar():
img_data = dask.compute(*[self._get_file_args(row) for row in df.itertuples()])
img_data = [item for sublist in img_data for item in sublist]
img_data = list(chain.from_iterable(img_data))
return img_data

def prepare_data(self):
Expand Down
6 changes: 3 additions & 3 deletions cyto_dl/image/io/aicsimage_loader.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,9 +9,9 @@
class AICSImageLoaderd(Transform):
"""Enumerates scenes and timepoints for dictionary with format.
{path_key: path, channel_key: channel, scene_key: scene, timepoint_key: timepoint}.
Differs from monai_bio_reader in that reading kwargs are passed in the dictionary, instead of
fixed at initialization.
{path_key: path, channel_key: channel, scene_key: scene, timepoint_key: timepoint}. Differs
from monai_bio_reader in that reading kwargs are passed in the dictionary, instead of fixed at
initialization.
"""

def __init__(
Expand Down
5 changes: 1 addition & 4 deletions cyto_dl/image/io/monai_bio_reader.py
Original file line number Diff line number Diff line change
Expand Up @@ -30,10 +30,7 @@ def __init__(self, dask_load: bool = True, **reader_kwargs):

def read(self, data: Union[Sequence[PathLike], PathLike]):
filenames: Sequence[PathLike] = ensure_tuple(data)
img_ = []
for name in filenames:
img_.append(BioImage(f"{name}"))

img_ = [BioImage(name) for name in filenames]
return img_ if len(filenames) > 1 else img_[0]

def get_data(self, img) -> Tuple[np.ndarray, Dict]:
Expand Down
2 changes: 1 addition & 1 deletion cyto_dl/image/io/skimage_reader.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@ def read(self, data: Union[Sequence[PathLike], PathLike]):
filenames: Sequence[PathLike] = ensure_tuple(data)
img_ = []
for name in filenames:
this_im = imread(f"{name}")
this_im = imread(name)
if self.channels:
this_im = this_im[self.channels]

Expand Down
2 changes: 1 addition & 1 deletion cyto_dl/image/transforms/multiscale_cropper.py
Original file line number Diff line number Diff line change
Expand Up @@ -92,7 +92,7 @@ def _apply_slice(data, slicee):
@staticmethod
def _generate_slice(start_coords: Sequence[int], roi_size: Sequence[int]) -> slice:
"""Creates slice starting at `start_coords` of size `roi_size`"""
return [slice(None, None)] + [
return [slice(None, None)] + [ # noqa: FURB140
slice(start, end) for start, end in zip(start_coords, start_coords + roi_size)
]

Expand Down
19 changes: 11 additions & 8 deletions cyto_dl/loggers/mlflow.py
Original file line number Diff line number Diff line change
Expand Up @@ -55,7 +55,7 @@ def log_hyperparams(self, params: Union[Dict[str, Any], Namespace], mode="train"

with tempfile.TemporaryDirectory() as tmp_dir:
conf_path = Path(tmp_dir) / f"{mode}.yaml"
with open(conf_path, "w") as f:
with conf_path.open("w") as f:
config = OmegaConf.create(params)
OmegaConf.save(config=config, f=f)

Expand Down Expand Up @@ -133,7 +133,7 @@ def _after_save_checkpoint(self, ckpt_callback: ModelCheckpoint) -> None:
self.run_id, local_path=best_path, artifact_path=artifact_path
)

os.unlink(best_path)
best_path.unlink()

else:
filepath = ckpt_callback.best_model_path
Expand All @@ -149,17 +149,20 @@ def _after_save_checkpoint(self, ckpt_callback: ModelCheckpoint) -> None:
self.run_id, local_path=last_path, artifact_path=artifact_path
)

os.unlink(last_path)
last_path.unlink()
else:
self.experiment.log_artifact(
self.run_id, local_path=filepath, artifact_path=artifact_path
)


def _delete_local_artifact(repo, artifact_path):
artifact_path = local_file_uri_to_path(
os.path.join(repo._artifact_dir, artifact_path) if artifact_path else repo._artifact_dir
artifact_path = Path(
local_file_uri_to_path(
os.path.join(repo._artifact_dir, artifact_path)
if artifact_path
else repo._artifact_dir
)
)

if os.path.isfile(artifact_path):
os.remove(artifact_path)
if artifact_path.is_file():
artifact_path.unlink()
2 changes: 1 addition & 1 deletion cyto_dl/models/base_model.py
Original file line number Diff line number Diff line change
Expand Up @@ -23,7 +23,7 @@


def _is_primitive(value):
if isinstance(value, (type(None), bool, str, int, float)):
if value is None or isinstance(value, (bool, str, int, float)):
return True

if isinstance(value, (tuple, list)):
Expand Down
4 changes: 2 additions & 2 deletions cyto_dl/models/basic_model.py
Original file line number Diff line number Diff line change
Expand Up @@ -59,11 +59,11 @@ def __init__(

super().__init__(metrics=metrics)

if network is None and pretrained_weights is None:
if network is pretrained_weights is None:
raise ValueError("`network` and `pretrained_weights` can't both be None.")

if pretrained_weights is not None:
pretrained_weights = torch.load(pretrained_weights)
pretrained_weights = torch.load(pretrained_weights) # nosec B614

if network is not None:
self.network = network
Expand Down
2 changes: 1 addition & 1 deletion cyto_dl/models/classification/timepoint_classification.py
Original file line number Diff line number Diff line change
Expand Up @@ -50,7 +50,7 @@ def predict_step(self, batch, batch_idx):
batch,
"predict",
logits,
name=f"{batch['track_id'].cpu().item()}",
name=str(batch["track_id"].cpu().item()),
)

timepoints = np.array(batch["timepoints"][0][1:-1].split(",")).astype(int)
Expand Down
6 changes: 3 additions & 3 deletions cyto_dl/models/handlers/base_handler.py
Original file line number Diff line number Diff line change
Expand Up @@ -76,12 +76,12 @@ def postprocess(self, data):
mode = self.config["return"].get("mode", "network")

if mode == "path":
path = self.config["return"].get("path", "/tmp") # nosec: B108
path = self.config["return"].get("path", "/tmp") # nosec B108
response_path = Path(path) / f"{uuid.uuid4()}.pt"
torch.save(data, response_path)
torch.save(data, response_path) # nosec B614
return [str(response_path)]

buf = io.BytesIO()
torch.save(data, buf)
torch.save(data, buf) # nosec B614
buf.seek(0)
return [buf.read()]
Loading

0 comments on commit 20c8ce2

Please sign in to comment.