From 921537b108d8f4523ec682fdb755a4c31abd206b Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Wed, 12 Jul 2023 11:17:45 -0700 Subject: [PATCH 01/50] adding platforms for build and push --- .github/workflows/publish-to-docker-hub.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/publish-to-docker-hub.yml b/.github/workflows/publish-to-docker-hub.yml index d2ea7d23..764de922 100644 --- a/.github/workflows/publish-to-docker-hub.yml +++ b/.github/workflows/publish-to-docker-hub.yml @@ -27,9 +27,10 @@ jobs: password: ${{ secrets.DOCKERHUB_TOKEN }} - name: Build and push id: docker_build - uses: docker/build-push-action@v2.7.0 + uses: docker/build-push-action@v4 # prev 2.7.0 with: context: . + platforms: linux/amd64,linux/arm64 # new line for m1/m2 macs push: true tags: | pathml/pathml:latest From 092402f7a3b94412ccc52d6460ade522bdeb3d9b Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Fri, 14 Jul 2023 09:34:35 -0700 Subject: [PATCH 02/50] updating push action version and adding platforms for mac support --- .github/workflows/publish-to-docker-hub.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/publish-to-docker-hub.yml b/.github/workflows/publish-to-docker-hub.yml index 764de922..e7424d4f 100644 --- a/.github/workflows/publish-to-docker-hub.yml +++ b/.github/workflows/publish-to-docker-hub.yml @@ -27,10 +27,10 @@ jobs: password: ${{ secrets.DOCKERHUB_TOKEN }} - name: Build and push id: docker_build - uses: docker/build-push-action@v4 # prev 2.7.0 + uses: docker/build-push-action@v4 with: context: . 
- platforms: linux/amd64,linux/arm64 # new line for m1/m2 macs + platforms: linux/amd64,linux/arm64 push: true tags: | pathml/pathml:latest From a6ee90339fd208e4fc666514e1f98c5fbf584005 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Mon, 17 Jul 2023 06:28:33 -0700 Subject: [PATCH 03/50] changing openslide version in environ yml --- environment.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/environment.yml b/environment.yml index 3910502f..457f49b2 100644 --- a/environment.yml +++ b/environment.yml @@ -24,7 +24,7 @@ dependencies: - protobuf==3.20.1 - deepcell==0.11.0 - opencv-contrib-python==4.5.3.56 - - openslide-python==1.1.2 + - openslide-python==1.2.0 - scanpy==1.8.2 - anndata==0.7.8 - tqdm==4.62.3 From e6bd53bc66c04858f6e43e0b3adb376fba4a145c Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Mon, 17 Jul 2023 06:34:40 -0700 Subject: [PATCH 04/50] adding adjusted openslide dependency in yml --- environment.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/environment.yml b/environment.yml index 457f49b2..c140b04d 100644 --- a/environment.yml +++ b/environment.yml @@ -24,7 +24,7 @@ dependencies: - protobuf==3.20.1 - deepcell==0.11.0 - opencv-contrib-python==4.5.3.56 - - openslide-python==1.2.0 + - openslide-python==1.2.0 - scanpy==1.8.2 - anndata==0.7.8 - tqdm==4.62.3 From a57b7f66225b94a2414e585d9f5d20a2cd77cf89 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Fri, 11 Aug 2023 10:07:14 -0700 Subject: [PATCH 05/50] adding inference to init file --- pathml/__init__.py | 1 + 1 file changed, 1 insertion(+) diff --git a/pathml/__init__.py b/pathml/__init__.py index bd878e09..8c1bcc84 100644 --- a/pathml/__init__.py +++ b/pathml/__init__.py @@ -6,6 +6,7 @@ from . import datasets as ds from . import ml from . 
import preprocessing as pp +from .inference import * from ._logging import PathMLLogger from ._version import __version__ from .core import * # noqa: F403 From 6c8cf28915bcc61f015316d8e9ad4f9ae22402ea Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Fri, 11 Aug 2023 10:08:23 -0700 Subject: [PATCH 06/50] add inference classes and functions --- pathml/inference/__init__.py | 6 + pathml/inference/inference.py | 314 ++++++++++++++++++++++++++++++++++ 2 files changed, 320 insertions(+) create mode 100644 pathml/inference/__init__.py create mode 100644 pathml/inference/inference.py diff --git a/pathml/inference/__init__.py b/pathml/inference/__init__.py new file mode 100644 index 00000000..84f56e04 --- /dev/null +++ b/pathml/inference/__init__.py @@ -0,0 +1,6 @@ +""" +Copyright 2023, Dana-Farber Cancer Institute and Weill Cornell Medicine +License: GNU GPL 2.0 +""" + +from .inference import * \ No newline at end of file diff --git a/pathml/inference/inference.py b/pathml/inference/inference.py new file mode 100644 index 00000000..d94915da --- /dev/null +++ b/pathml/inference/inference.py @@ -0,0 +1,314 @@ +""" +Copyright 2023, Dana-Farber Cancer Institute and Weill Cornell Medicine +License: GNU GPL 2.0 +""" + +import os +import numpy as np +from pathml.core import SlideData, Tile +from pathml.preprocessing import Pipeline +import pathml.preprocessing.transforms as Transforms +import onnx +import onnxruntime as ort +import pathml + + +def remove_initializer_from_input(model_path, new_path): + """Removes initializers from HaloAI ONNX models + Taken from https://github.com/microsoft/onnxruntime/blob/main/tools/python/remove_initializer_from_input.py + + Args: + model_path (str): path to ONNX model, + new_path (str): path to save adjusted model w/o initializers, + + Returns: + ONNX model w/o initializers to run inference using PathML + """ + + model = onnx.load(model_path) + + inputs = model.graph.input + name_to_input = {} + for onnx_input in inputs: + 
name_to_input[onnx_input.name] = onnx_input + + for initializer in model.graph.initializer: + if initializer.name in name_to_input: + inputs.remove(name_to_input[initializer.name]) + + onnx.save(model, new_path) + + +def check_onnx_clean(model_path): + """Checks if the model has had it's initalizers removed from input graph. + Adapted from from https://github.com/microsoft/onnxruntime/blob/main/tools/python/remove_initializer_from_input.py + + Args: + model_path (str): path to ONNX model, + + Returns: + Boolean if there are initializers in input graph. + """ + + model = onnx.load(model_path) + + inputs = model.graph.input + name_to_input = {} + for onnx_input in inputs: + name_to_input[onnx_input.name] = onnx_input + + for initializer in model.graph.initializer: + if initializer.name in name_to_input: + return True + +# Base class +# I think this should still inherit from Transforms to make the tiling easier/so we don't have to rewrite so much existing code +class InferenceBase(Transforms.Transform): + """ + Base class for all ONNX Models. + Each transform must operate on a Tile. 
+ """ + + def __init__(self): + self.model_card = { + 'name' : None, + 'num_classes' : None, + 'model_type' : None, + 'notes' : None, + 'model_input_notes': None, + 'model_output_notes' : None, + 'citation': None + } + + def __repr__(self): + return "Base class for all ONNX models" + + + def get_model_card(self): + return self.model_card + + def set_name(self, name): + self.model_card['name'] = name + + def set_num_classes(self, num): + self.model_card['num_classes'] = num + + def set_model_type(self, model_type): + self.model_card['model_type'] = model_type + + def set_notes(self, note): + self.model_card['notes'] = note + + def set_model_input_notes(self, note): + self.model_card['model_input_notes'] = note + + def set_model_output_notes(self, note): + self.model_card['model_output_notes'] = note + + def set_citation(self, citation): + self.model_card['citation'] = citation + + + def reshape(self, image): + """standard reshaping of tile image""" + # flip dimensions + # follows convention used here https://github.com/Dana-Farber-AIOS/pathml/blob/master/pathml/ml/dataset.py + + if image.ndim == 3: + # swap axes from HWC to CHW + image = image.transpose(2, 0, 1) + # add a dimesion bc onnx models usually have batch size as first dim: e.g. (1, channel, height, width) + image = np.expand_dims(image, axis = 0) + + return image + else: + # in this case, we assume that we have XYZCT channel order + # so we swap axes to TCZYX for batching + # note we are not adding a dim here for batch bc we assume that subsetting will create a batch "placeholder" dim + image = image.T + + return image + + def F(self, target): + """functional implementation""" + raise NotImplementedError + + def apply(self, tile): + """modify Tile object in-place""" + raise NotImplementedError + +# class to handle local onnx models +class Inference(InferenceBase): + """Transformation to run inferrence on ONNX model. 
+ + Assumptions: + - The ONNX model has been cleaned by `remove_initializer_from_input` first + + Args: + model_path (str): path to ONNX model w/o initializers, + input_name (str): name of the input the ONNX model accepts + """ + def __init__(self, model_path = None, input_name = 'data', num_classes = None, model_type = None, local = True): + super().__init__() + + + self.input_name = input_name + self.num_classes = num_classes + self.model_type = model_type + self.local = local + + if self.local: + # using a local onnx model + self.model_path = model_path + else: + # if using a model from the model zoo, set the local path to a temp file + self.model_path = 'temp.onnx' + + # fill in parts of the model_card with the following info + self.model_card['num_classes'] = self.num_classes + self.model_card['model_type'] = self.model_type + + + # check if there are initializers in input graph if using a local model + if local: + if check_onnx_clean(model_path): + raise ValueError("The ONNX model still has graph initializers in the input graph. Use `remove_initializer_from_input` to remove them.") + else: + pass + + + def __repr__(self): + if self.local: + return f"Class to handle ONNX model locally stored at {self.model_path}" + else: + return f"Class to handle a {self.model_card['model_name']} from the PathML model zoo." 
+ + def inference(self, image): + + # reshape the image + image = self.reshape(image) + + # load fixed model + onnx_model = onnx.load(self.model_path) + + # check tile dimensions match ONNX input dimensions + input_node = onnx_model.graph.input + + dimensions = [] + for input in input_node: + if input.name == self.input_name: + input_shape = input.type.tensor_type.shape.dim + for dim in input_shape: + dimensions.append(dim.dim_value) + + assert image.shape[-1] == dimensions[-1] and image.shape[-2] == dimensions[-2], f'expecting tile shape of {dimensions[-2]} by {dimensions[-1]}, got {image.shape[-2]} by {image.shape[-1]}' + + # check onnx model + onnx.checker.check_model(onnx_model) + + # start an inference session + ort_sess = ort.InferenceSession(self.model_path) + + # create model output, returns a list + model_output = ort_sess.run(None, {self.input_name: image.astype('f')}) + + return model_output + + def F(self, image): + + # run inference function + prediction_map = self.inference(image) + + # single task model + if len(prediction_map) == 1: + # return first and only prediction array in the list + return prediction_map[0] + + # multi task model + else: + # concatenate prediction results + # assumes that the tasks all output prediction arrays of same dimension on H and W + # To Do: figure out solution for way different tasks such as if a model does both segmentation and classification + result_array = np.concatenate(prediction_map, axis = 1) + return result_array + + def apply(self, tile): + tile.image = self.F(tile.image) + +class HaloAIInference(Inference): + """Transformation to run inferrence on HALO AI ONNX model. 
+ + Assumptions: + - Assumes that the ONNX model returns a tensor in which there is one prediction map for each class + - For example, if there are 5 classes, the ONNX model will output a (1, 5, Height, Weight) tensor + - If you select to argmax the classes, the class assumes a softmax or sigmoid has already been applied + - HaloAI ONNX models always have 20 class maps so you need to index into the first x maps if you have x classes + + + Args: + model_path (str): path to ONNX model w/o initializers, + num_classes (int): number of classes in the data, + input_name (str): name of the input the ONNX model accepts + """ + def __init__(self, model_path = None, input_name = 'data', num_classes = None, model_type = None, local = True): + super().__init__(model_path, input_name, num_classes, model_type, local) + + self.model_card['num_classes'] = self.num_classes + self.model_card['model_type'] = self.model_type + + + def __repr__(self): + return f"Class to handle HALO AI ONNX model locally stored at {self.model_path}" + + def F(self, image): + + prediction_map = self.inference(image) + + prediction_map = prediction_map[0][:, 0 : self.num_classes, :, :] + + return prediction_map + + def apply(self, tile): + tile.image = self.F(tile.image) + +# class to handle remote onnx models +# ToDo create function to remove model after tiling is done would be a sep line in workflow +class RemoteTestHoverNet(Inference): + """Transformation to run inferrence on ONNX model. + + Citation for model: + Pocock J, Graham S, Vu QD, Jahanifar M, Deshpande S, Hadjigeorghiou G, Shephard A, Bashir RM, Bilal M, Lu W, Epstein D. + TIAToolbox as an end-to-end library for advanced tissue image analytics. Communications medicine. 2022 Sep 24;2(1):120. 
+ + Args: + model_path (str): temp file name to download onnx from huggingface, + input_name (str): name of the input the ONNX model accepts + """ + def __init__(self, model_path = 'temp.onnx', input_name = 'data', num_classes = 5, model_type = 'Segmentation', local = False): + super().__init__(model_path, input_name, num_classes, model_type, local) + + # specify URL of the model in PathML public repository + url = 'https://huggingface.co/pathml/test/resolve/main/hovernet_fast_tiatoolbox_fixed.onnx' + + # download model, save as temp.onnx + with open(self.model_path, 'wb') as out_file: + content = requests.get(url, stream=True).content + out_file.write(content) + + + self.model_card['num_classes'] = self.num_classes + self.model_card['model_type'] = self.model_type + self.model_card['name'] = 'Tiabox HoverNet Test' + self.model_card['model_input_notes'] = 'Accepts tiles of 256 x 256' + self.model_card['citation'] = 'Pocock J, Graham S, Vu QD, Jahanifar M, Deshpande S, Hadjigeorghiou G, Shephard A, Bashir RM, Bilal M, Lu W, Epstein D. TIAToolbox as an end-to-end library for advanced tissue image analytics. Communications medicine. 2022 Sep 24;2(1):120.' + + + def __repr__(self): + return "Class to handle remote TIAToolBox HoverNet test ONNX. See model card for citation." 
+ + def apply(self, tile): + tile.image = self.F(tile.image) + + def remove(self): + # remove the temp.onnx model + os.remove(self.model_path) \ No newline at end of file From 34237f2f1695a94305102566572a145c6adc1c37 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Fri, 11 Aug 2023 10:08:50 -0700 Subject: [PATCH 07/50] add tests for inference --- tests/inference_tests/test_inference.py | 136 ++++++++++++++++++++++++ 1 file changed, 136 insertions(+) create mode 100644 tests/inference_tests/test_inference.py diff --git a/tests/inference_tests/test_inference.py b/tests/inference_tests/test_inference.py new file mode 100644 index 00000000..950bdce4 --- /dev/null +++ b/tests/inference_tests/test_inference.py @@ -0,0 +1,136 @@ +import os +import numpy as np +import onnx +import onnxruntime as ort +import pytest + +from pathml.inference import * + + +def test_remove_initializer_from_input(): + # Create a temporary ONNX model file + model_path = "test_model.onnx" + # temp_file = tempfile.NamedTemporaryFile(delete=False) + # temp_file.close() + + # Create a sample ONNX model with initializer and graph input + model = onnx.ModelProto() + model.ir_version = 4 + + # Add inputs to the graph + input_1 = model.graph.input.add() + input_1.name = "input_1" + + input_2 = model.graph.input.add() + input_2.name = "input_2" + + # Add an initializer that matches one of the inputs + initializer = model.graph.initializer.add() + initializer.name = "input_2" + + # Save the model to a file + onnx.save(model, model_path) + + # Call the function to remove initializers + new_model_path = "new_model.onnx" + remove_initializer_from_input(model_path, new_model_path) + + # Assert that the initializer has been removed from the new model + new_model = onnx.load(new_model_path) + input_names = [input.name for input in new_model.graph.input] + assert initializer.name not in input_names + + # Clean up the temporary files + os.remove(model_path) + os.remove(new_model_path) + +def test_check_onnx_clean(): 
+ # Create a temporary ONNX model file + model_path = "test_model.onnx" + # temp_file = tempfile.NamedTemporaryFile(delete=False) + # temp_file.close() + + # Create a sample ONNX model with initializer and graph input + model = onnx.ModelProto() + model.ir_version = 4 + + # Add inputs to the graph + input_1 = model.graph.input.add() + input_1.name = "input_1" + + input_2 = model.graph.input.add() + input_2.name = "input_2" + + # Add an initializer that matches one of the inputs + initializer = model.graph.initializer.add() + initializer.name = "input_2" + + # Save the model to a file + onnx.save(model, model_path) + + if check_onnx_clean(model_path): + pass + else: + raise ValueError('check_onnx_clean function is not working') + + # Clean up the temporary files + os.remove(model_path) + +def test_InferenceBase(): + + # initialize InferenceBase + test = InferenceBase() + + # test setter functions + test.set_name('name') + + test.set_num_classes('num_classes') + + test.set_model_type('model_type') + + test.set_notes('notes') + + test.set_model_input_notes('model_input_notes') + + test.set_model_output_notes('model_output_notes') + + test.set_citation('citation') + + for key in test.model_card: + assert key == test.model_card[key], f"function for {key} is not working" + + # test reshape function + random = np.random.rand(1,2,3) + assert test.reshape(random).shape == (1, 3, 1, 2), "reshape function is not working on 3d arrays" + + random = np.random.rand(1,2,3,4,5) + assert test.reshape(random).shape == (5,4,3,2,1), "reshape function is not working on 5d arrays" + +def test_Inference(tileHE): + + new_path = '../random_model.onnx' + + inference = Inference(model_path = new_path, input_name = 'data', num_classes = 1, model_type = 'segmentation') + + orig_im = tileHE.image + inference.apply(tileHE) + assert np.array_equal(tileHE.image, inference.F(orig_im)) + +def test_HaloAIInference(tileHE): + + new_path = '../random_model.onnx' + + inference = 
HaloAIInference(model_path = new_path, input_name = 'data', num_classes = 1, model_type = 'segmentation') + orig_im = tileHE.image + inference.apply(tileHE) + assert np.array_equal(tileHE.image, inference.F(orig_im)) + +def test_RemoteTestHoverNet(tileHE): + + inference = RemoteTestHoverNet() + + orig_im = tileHE.image + inference.apply(tileHE) + assert np.array_equal(tileHE.image, inference.F(orig_im)) + + inference.remove() \ No newline at end of file From 980c6620f87a22034017aa44104bbb9f25685abd Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Fri, 11 Aug 2023 10:15:15 -0700 Subject: [PATCH 08/50] fixed import statements --- pathml/inference/__init__.py | 9 ++++++++- pathml/inference/inference.py | 2 +- 2 files changed, 9 insertions(+), 2 deletions(-) diff --git a/pathml/inference/__init__.py b/pathml/inference/__init__.py index 84f56e04..b4b9c58e 100644 --- a/pathml/inference/__init__.py +++ b/pathml/inference/__init__.py @@ -3,4 +3,11 @@ License: GNU GPL 2.0 """ -from .inference import * \ No newline at end of file +from .inference import ( + remove_initializer_from_input, + check_onnx_clean, + InferenceBase, + Inference, + HaloAIInference, + RemoteTestHoverNet +) \ No newline at end of file diff --git a/pathml/inference/inference.py b/pathml/inference/inference.py index d94915da..3020320e 100644 --- a/pathml/inference/inference.py +++ b/pathml/inference/inference.py @@ -11,7 +11,7 @@ import onnx import onnxruntime as ort import pathml - +import requests def remove_initializer_from_input(model_path, new_path): """Removes initializers from HaloAI ONNX models From 77d5d4d82c27f3dcbf5b31a1e179a0f924387bd9 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Fri, 11 Aug 2023 10:20:26 -0700 Subject: [PATCH 09/50] fixing import statements in the init and the test inference --- pathml/__init__.py | 2 +- tests/inference_tests/test_inference.py | 9 ++++++++- 2 files changed, 9 insertions(+), 2 deletions(-) diff --git a/pathml/__init__.py b/pathml/__init__.py index 
8c1bcc84..0ae82c6b 100644 --- a/pathml/__init__.py +++ b/pathml/__init__.py @@ -6,7 +6,7 @@ from . import datasets as ds from . import ml from . import preprocessing as pp -from .inference import * +import .inference from ._logging import PathMLLogger from ._version import __version__ from .core import * # noqa: F403 diff --git a/tests/inference_tests/test_inference.py b/tests/inference_tests/test_inference.py index 950bdce4..d6b99cc8 100644 --- a/tests/inference_tests/test_inference.py +++ b/tests/inference_tests/test_inference.py @@ -4,7 +4,14 @@ import onnxruntime as ort import pytest -from pathml.inference import * +from pathml.inference import ( + remove_initializer_from_input, + check_onnx_clean, + InferenceBase, + Inference, + HaloAIInference, + RemoteTestHoverNet +) def test_remove_initializer_from_input(): From b3d295a8ae2547551e0c3d3635e13c02f7d551f4 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Fri, 11 Aug 2023 10:24:33 -0700 Subject: [PATCH 10/50] fixing init files --- pathml/__init__.py | 4 ++-- pathml/inference/__init__.py | 8 ++++---- 2 files changed, 6 insertions(+), 6 deletions(-) diff --git a/pathml/__init__.py b/pathml/__init__.py index 0ae82c6b..1889e4be 100644 --- a/pathml/__init__.py +++ b/pathml/__init__.py @@ -6,7 +6,7 @@ from . import datasets as ds from . import ml from . import preprocessing as pp -import .inference +from . 
import inference from ._logging import PathMLLogger from ._version import __version__ -from .core import * # noqa: F403 +from .core import * # noqa: F403 \ No newline at end of file diff --git a/pathml/inference/__init__.py b/pathml/inference/__init__.py index b4b9c58e..59b2e4fe 100644 --- a/pathml/inference/__init__.py +++ b/pathml/inference/__init__.py @@ -5,9 +5,9 @@ from .inference import ( remove_initializer_from_input, - check_onnx_clean, - InferenceBase, - Inference, - HaloAIInference, + check_onnx_clean, + InferenceBase + Inference, + HaloAIInference, RemoteTestHoverNet ) \ No newline at end of file From d144d918529fee58603add10733d236abbc1b07b Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Fri, 11 Aug 2023 10:28:43 -0700 Subject: [PATCH 11/50] fixing comma in inference init --- pathml/inference/__init__.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/pathml/inference/__init__.py b/pathml/inference/__init__.py index 59b2e4fe..aca4d69b 100644 --- a/pathml/inference/__init__.py +++ b/pathml/inference/__init__.py @@ -6,7 +6,7 @@ from .inference import ( remove_initializer_from_input, check_onnx_clean, - InferenceBase + InferenceBase, Inference, HaloAIInference, RemoteTestHoverNet From 51841aa54893701433db2c382a11a3accd7008d8 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Fri, 11 Aug 2023 10:35:21 -0700 Subject: [PATCH 12/50] getting rid of unused packages --- pathml/inference/inference.py | 7 ++----- tests/inference_tests/test_inference.py | 2 -- 2 files changed, 2 insertions(+), 7 deletions(-) diff --git a/pathml/inference/inference.py b/pathml/inference/inference.py index 3020320e..15c094da 100644 --- a/pathml/inference/inference.py +++ b/pathml/inference/inference.py @@ -5,12 +5,9 @@ import os import numpy as np -from pathml.core import SlideData, Tile -from pathml.preprocessing import Pipeline import pathml.preprocessing.transforms as Transforms import onnx -import onnxruntime as ort -import pathml +import onnxruntime import requests 
def remove_initializer_from_input(model_path, new_path): @@ -207,7 +204,7 @@ def inference(self, image): onnx.checker.check_model(onnx_model) # start an inference session - ort_sess = ort.InferenceSession(self.model_path) + ort_sess = onnxruntime.InferenceSession(self.model_path) # create model output, returns a list model_output = ort_sess.run(None, {self.input_name: image.astype('f')}) diff --git a/tests/inference_tests/test_inference.py b/tests/inference_tests/test_inference.py index d6b99cc8..0d1b6ec1 100644 --- a/tests/inference_tests/test_inference.py +++ b/tests/inference_tests/test_inference.py @@ -1,8 +1,6 @@ import os import numpy as np import onnx -import onnxruntime as ort -import pytest from pathml.inference import ( remove_initializer_from_input, From 6044024243c555b3e74bcd16ada06796723ca247 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Fri, 11 Aug 2023 10:53:37 -0700 Subject: [PATCH 13/50] fixed files via black --- pathml/inference/__init__.py | 2 +- pathml/inference/inference.py | 312 +++++++++++++----------- tests/inference_tests/test_inference.py | 116 +++++---- 3 files changed, 236 insertions(+), 194 deletions(-) diff --git a/pathml/inference/__init__.py b/pathml/inference/__init__.py index aca4d69b..bf14de1f 100644 --- a/pathml/inference/__init__.py +++ b/pathml/inference/__init__.py @@ -9,5 +9,5 @@ InferenceBase, Inference, HaloAIInference, - RemoteTestHoverNet + RemoteTestHoverNet, ) \ No newline at end of file diff --git a/pathml/inference/inference.py b/pathml/inference/inference.py index 15c094da..880a4cbf 100644 --- a/pathml/inference/inference.py +++ b/pathml/inference/inference.py @@ -4,24 +4,25 @@ """ import os -import numpy as np +import numpy as np import pathml.preprocessing.transforms as Transforms import onnx -import onnxruntime -import requests +import onnxruntime +import requests + def remove_initializer_from_input(model_path, new_path): """Removes initializers from HaloAI ONNX models Taken from 
https://github.com/microsoft/onnxruntime/blob/main/tools/python/remove_initializer_from_input.py - + Args: model_path (str): path to ONNX model, new_path (str): path to save adjusted model w/o initializers, Returns: ONNX model w/o initializers to run inference using PathML - """ - + """ + model = onnx.load(model_path) inputs = model.graph.input @@ -35,18 +36,18 @@ def remove_initializer_from_input(model_path, new_path): onnx.save(model, new_path) - + def check_onnx_clean(model_path): - """Checks if the model has had it's initalizers removed from input graph. + """Checks if the model has had it's initalizers removed from input graph. Adapted from from https://github.com/microsoft/onnxruntime/blob/main/tools/python/remove_initializer_from_input.py - + Args: model_path (str): path to ONNX model, Returns: - Boolean if there are initializers in input graph. - """ - + Boolean if there are initializers in input graph. + """ + model = onnx.load(model_path) inputs = model.graph.input @@ -56,75 +57,74 @@ def check_onnx_clean(model_path): for initializer in model.graph.initializer: if initializer.name in name_to_input: - return True + return True + # Base class -# I think this should still inherit from Transforms to make the tiling easier/so we don't have to rewrite so much existing code +# I think this should still inherit from Transforms to make the tiling easier/so we don't have to rewrite so much existing code class InferenceBase(Transforms.Transform): """ Base class for all ONNX Models. Each transform must operate on a Tile. 
""" - - def __init__(self): + + def __init__(self): self.model_card = { - 'name' : None, - 'num_classes' : None, - 'model_type' : None, - 'notes' : None, - 'model_input_notes': None, - 'model_output_notes' : None, - 'citation': None - } + "name": None, + "num_classes": None, + "model_type": None, + "notes": None, + "model_input_notes": None, + "model_output_notes": None, + "citation": None, + } def __repr__(self): return "Base class for all ONNX models" - - + def get_model_card(self): return self.model_card - + def set_name(self, name): - self.model_card['name'] = name - + self.model_card["name"] = name + def set_num_classes(self, num): - self.model_card['num_classes'] = num - + self.model_card["num_classes"] = num + def set_model_type(self, model_type): - self.model_card['model_type'] = model_type - + self.model_card["model_type"] = model_type + def set_notes(self, note): - self.model_card['notes'] = note - + self.model_card["notes"] = note + def set_model_input_notes(self, note): - self.model_card['model_input_notes'] = note - + self.model_card["model_input_notes"] = note + def set_model_output_notes(self, note): - self.model_card['model_output_notes'] = note - + self.model_card["model_output_notes"] = note + def set_citation(self, citation): - self.model_card['citation'] = citation - - + self.model_card["citation"] = citation + def reshape(self, image): """standard reshaping of tile image""" - # flip dimensions + # flip dimensions # follows convention used here https://github.com/Dana-Farber-AIOS/pathml/blob/master/pathml/ml/dataset.py - + if image.ndim == 3: - # swap axes from HWC to CHW + # swap axes from HWC to CHW image = image.transpose(2, 0, 1) - # add a dimesion bc onnx models usually have batch size as first dim: e.g. (1, channel, height, width) - image = np.expand_dims(image, axis = 0) - - return image + # add a dimesion bc onnx models usually have batch size as first dim: e.g. 
(1, channel, height, width) + image = np.expand_dims(image, axis=0) + + return image else: # in this case, we assume that we have XYZCT channel order # so we swap axes to TCZYX for batching # note we are not adding a dim here for batch bc we assume that subsetting will create a batch "placeholder" dim image = image.T - - return image + + return image def F(self, target): """functional implementation""" @@ -133,179 +133,203 @@ def F(self, target): def apply(self, tile): """modify Tile object in-place""" raise NotImplementedError - -# class to handle local onnx models + + +# class to handle local onnx models class Inference(InferenceBase): """Transformation to run inferrence on ONNX model. - + Assumptions: - - The ONNX model has been cleaned by `remove_initializer_from_input` first - + - The ONNX model has been cleaned by `remove_initializer_from_input` first + Args: model_path (str): path to ONNX model w/o initializers, input_name (str): name of the input the ONNX model accepts - """ - def __init__(self, model_path = None, input_name = 'data', num_classes = None, model_type = None, local = True): - super().__init__() - - - self.input_name = input_name + """ + + def __init__( + self, + model_path=None, + input_name="data", + num_classes=None, + model_type=None, + local=True, + ): + super().__init__() + + self.input_name = input_name self.num_classes = num_classes self.model_type = model_type self.local = local - + if self.local: # using a local onnx model self.model_path = model_path - else: + else: # if using a model from the model zoo, set the local path to a temp file - self.model_path = 'temp.onnx' - + self.model_path = "temp.onnx" + # fill in parts of the model_card with the following info - self.model_card['num_classes'] = self.num_classes - self.model_card['model_type'] = self.model_type - - + self.model_card["num_classes"] = self.num_classes + self.model_card["model_type"] = self.model_type + # check if there are initializers in input graph if using a local 
model if local: if check_onnx_clean(model_path): - raise ValueError("The ONNX model still has graph initializers in the input graph. Use `remove_initializer_from_input` to remove them.") + raise ValueError( + "The ONNX model still has graph initializers in the input graph. Use `remove_initializer_from_input` to remove them." + ) else: - pass + pass - def __repr__(self): if self.local: return f"Class to handle ONNX model locally stored at {self.model_path}" else: return f"Class to handle a {self.model_card['model_name']} from the PathML model zoo." - + def inference(self, image): - # reshape the image - image = self.reshape(image) - - # load fixed model + image = self.reshape(image) + + # load fixed model onnx_model = onnx.load(self.model_path) - - # check tile dimensions match ONNX input dimensions + + # check tile dimensions match ONNX input dimensions input_node = onnx_model.graph.input - + dimensions = [] - for input in input_node: - if input.name == self.input_name: + for input in input_node: + if input.name == self.input_name: input_shape = input.type.tensor_type.shape.dim for dim in input_shape: - dimensions.append(dim.dim_value) - - assert image.shape[-1] == dimensions[-1] and image.shape[-2] == dimensions[-2], f'expecting tile shape of {dimensions[-2]} by {dimensions[-1]}, got {image.shape[-2]} by {image.shape[-1]}' - + dimensions.append(dim.dim_value) + + assert ( + image.shape[-1] == dimensions[-1] and image.shape[-2] == dimensions[-2] + ), f"expecting tile shape of {dimensions[-2]} by {dimensions[-1]}, got {image.shape[-2]} by {image.shape[-1]}" + # check onnx model onnx.checker.check_model(onnx_model) - + # start an inference session ort_sess = onnxruntime.InferenceSession(self.model_path) - - # create model output, returns a list - model_output = ort_sess.run(None, {self.input_name: image.astype('f')}) - + + # create model output, returns a list + model_output = ort_sess.run(None, {self.input_name: image.astype("f")}) + return model_output - + def 
F(self, image): - # run inference function - prediction_map = self.inference(image) - + prediction_map = self.inference(image) + # single task model if len(prediction_map) == 1: - # return first and only prediction array in the list - return prediction_map[0] - + # return first and only prediction array in the list + return prediction_map[0] + # multi task model else: # concatenate prediction results # assumes that the tasks all output prediction arrays of same dimension on H and W # To Do: figure out solution for way different tasks such as if a model does both segmentation and classification - result_array = np.concatenate(prediction_map, axis = 1) - return result_array - + result_array = np.concatenate(prediction_map, axis=1) + return result_array + def apply(self, tile): tile.image = self.F(tile.image) + class HaloAIInference(Inference): """Transformation to run inferrence on HALO AI ONNX model. - + Assumptions: - Assumes that the ONNX model returns a tensor in which there is one prediction map for each class - For example, if there are 5 classes, the ONNX model will output a (1, 5, Height, Weight) tensor - If you select to argmax the classes, the class assumes a softmax or sigmoid has already been applied - HaloAI ONNX models always have 20 class maps so you need to index into the first x maps if you have x classes - - + + Args: model_path (str): path to ONNX model w/o initializers, - num_classes (int): number of classes in the data, + num_classes (int): number of classes in the data, input_name (str): name of the input the ONNX model accepts - """ - def __init__(self, model_path = None, input_name = 'data', num_classes = None, model_type = None, local = True): - super().__init__(model_path, input_name, num_classes, model_type, local) - - self.model_card['num_classes'] = self.num_classes - self.model_card['model_type'] = self.model_type - - + """ + + def __init__( + self, + model_path=None, + input_name="data", + num_classes=None, + model_type=None, + 
local=True, + ): + super().__init__(model_path, input_name, num_classes, model_type, local) + + self.model_card["num_classes"] = self.num_classes + self.model_card["model_type"] = self.model_type + def __repr__(self): return f"Class to handle HALO AI ONNX model locally stored at {self.model_path}" - + def F(self, image): - prediction_map = self.inference(image) - + prediction_map = prediction_map[0][:, 0 : self.num_classes, :, :] - + return prediction_map - + def apply(self, tile): tile.image = self.F(tile.image) - -# class to handle remote onnx models + + +# class to handle remote onnx models # ToDo create function to remove model after tiling is done would be a sep line in workflow class RemoteTestHoverNet(Inference): """Transformation to run inferrence on ONNX model. - + Citation for model: - Pocock J, Graham S, Vu QD, Jahanifar M, Deshpande S, Hadjigeorghiou G, Shephard A, Bashir RM, Bilal M, Lu W, Epstein D. + Pocock J, Graham S, Vu QD, Jahanifar M, Deshpande S, Hadjigeorghiou G, Shephard A, Bashir RM, Bilal M, Lu W, Epstein D. TIAToolbox as an end-to-end library for advanced tissue image analytics. Communications medicine. 2022 Sep 24;2(1):120. 
- + Args: model_path (str): temp file name to download onnx from huggingface, input_name (str): name of the input the ONNX model accepts - """ - def __init__(self, model_path = 'temp.onnx', input_name = 'data', num_classes = 5, model_type = 'Segmentation', local = False): + """ + + def __init__( + self, + model_path="temp.onnx", + input_name="data", + num_classes=5, + model_type="Segmentation", + local=False, + ): super().__init__(model_path, input_name, num_classes, model_type, local) - + # specify URL of the model in PathML public repository - url = 'https://huggingface.co/pathml/test/resolve/main/hovernet_fast_tiatoolbox_fixed.onnx' - - # download model, save as temp.onnx - with open(self.model_path, 'wb') as out_file: + url = "https://huggingface.co/pathml/test/resolve/main/hovernet_fast_tiatoolbox_fixed.onnx" + + # download model, save as temp.onnx + with open(self.model_path, "wb") as out_file: content = requests.get(url, stream=True).content out_file.write(content) - - - self.model_card['num_classes'] = self.num_classes - self.model_card['model_type'] = self.model_type - self.model_card['name'] = 'Tiabox HoverNet Test' - self.model_card['model_input_notes'] = 'Accepts tiles of 256 x 256' - self.model_card['citation'] = 'Pocock J, Graham S, Vu QD, Jahanifar M, Deshpande S, Hadjigeorghiou G, Shephard A, Bashir RM, Bilal M, Lu W, Epstein D. TIAToolbox as an end-to-end library for advanced tissue image analytics. Communications medicine. 2022 Sep 24;2(1):120.' - - + + self.model_card["num_classes"] = self.num_classes + self.model_card["model_type"] = self.model_type + self.model_card["name"] = "Tiabox HoverNet Test" + self.model_card["model_input_notes"] = "Accepts tiles of 256 x 256" + self.model_card[ + "citation" + ] = "Pocock J, Graham S, Vu QD, Jahanifar M, Deshpande S, Hadjigeorghiou G, Shephard A, Bashir RM, Bilal M, Lu W, Epstein D. TIAToolbox as an end-to-end library for advanced tissue image analytics. Communications medicine. 2022 Sep 24;2(1):120." 
+ def __repr__(self): return "Class to handle remote TIAToolBox HoverNet test ONNX. See model card for citation." - + def apply(self, tile): tile.image = self.F(tile.image) - + def remove(self): - # remove the temp.onnx model - os.remove(self.model_path) \ No newline at end of file + # remove the temp.onnx model + os.remove(self.model_path) \ No newline at end of file diff --git a/tests/inference_tests/test_inference.py b/tests/inference_tests/test_inference.py index 0d1b6ec1..a91bb1b7 100644 --- a/tests/inference_tests/test_inference.py +++ b/tests/inference_tests/test_inference.py @@ -1,14 +1,16 @@ import os import numpy as np import onnx +import onnxruntime as ort +import pytest -from pathml.inference import ( +from pathml.inference import ( remove_initializer_from_input, - check_onnx_clean, - InferenceBase, - Inference, - HaloAIInference, - RemoteTestHoverNet + check_onnx_clean, + InferenceBase, + Inference, + HaloAIInference, + RemoteTestHoverNet, ) @@ -43,12 +45,13 @@ def test_remove_initializer_from_input(): # Assert that the initializer has been removed from the new model new_model = onnx.load(new_model_path) input_names = [input.name for input in new_model.graph.input] - assert initializer.name not in input_names + assert initializer.name not in input_names # Clean up the temporary files os.remove(model_path) os.remove(new_model_path) - + + def test_check_onnx_clean(): # Create a temporary ONNX model file model_path = "test_model.onnx" @@ -76,66 +79,81 @@ def test_check_onnx_clean(): if check_onnx_clean(model_path): pass else: - raise ValueError('check_onnx_clean function is not working') + raise ValueError("check_onnx_clean function is not working") # Clean up the temporary files os.remove(model_path) - -def test_InferenceBase(): - + + +def test_InferenceBase(): # initialize InferenceBase test = InferenceBase() - - # test setter functions - test.set_name('name') - - test.set_num_classes('num_classes') - - test.set_model_type('model_type') - - 
test.set_notes('notes') - - test.set_model_input_notes('model_input_notes') - - test.set_model_output_notes('model_output_notes') - - test.set_citation('citation') - + + # test setter functions + test.set_name("name") + + test.set_num_classes("num_classes") + + test.set_model_type("model_type") + + test.set_notes("notes") + + test.set_model_input_notes("model_input_notes") + + test.set_model_output_notes("model_output_notes") + + test.set_citation("citation") + for key in test.model_card: assert key == test.model_card[key], f"function for {key} is not working" - - # test reshape function - random = np.random.rand(1,2,3) - assert test.reshape(random).shape == (1, 3, 1, 2), "reshape function is not working on 3d arrays" - - random = np.random.rand(1,2,3,4,5) - assert test.reshape(random).shape == (5,4,3,2,1), "reshape function is not working on 5d arrays" - -def test_Inference(tileHE): - - new_path = '../random_model.onnx' - - inference = Inference(model_path = new_path, input_name = 'data', num_classes = 1, model_type = 'segmentation') - + + # test reshape function + random = np.random.rand(1, 2, 3) + assert test.reshape(random).shape == ( + 1, + 3, + 1, + 2, + ), "reshape function is not working on 3d arrays" + + random = np.random.rand(1, 2, 3, 4, 5) + assert test.reshape(random).shape == ( + 5, + 4, + 3, + 2, + 1, + ), "reshape function is not working on 5d arrays" + + +def test_Inference(tileHE): + new_path = "../random_model.onnx" + + inference = Inference( + model_path=new_path, input_name="data", num_classes=1, model_type="segmentation" + ) + orig_im = tileHE.image inference.apply(tileHE) assert np.array_equal(tileHE.image, inference.F(orig_im)) - -def test_HaloAIInference(tileHE): - new_path = '../random_model.onnx' - inference = HaloAIInference(model_path = new_path, input_name = 'data', num_classes = 1, model_type = 'segmentation') +def test_HaloAIInference(tileHE): + new_path = "../random_model.onnx" + + inference = HaloAIInference( + model_path=new_path, 
input_name="data", num_classes=1, model_type="segmentation" + ) orig_im = tileHE.image inference.apply(tileHE) assert np.array_equal(tileHE.image, inference.F(orig_im)) -def test_RemoteTestHoverNet(tileHE): +def test_RemoteTestHoverNet(tileHE): inference = RemoteTestHoverNet() orig_im = tileHE.image inference.apply(tileHE) assert np.array_equal(tileHE.image, inference.F(orig_im)) - - inference.remove() \ No newline at end of file + + inference.remove() \ No newline at end of file From e6002d2c3e0ad0e38b9d867b956025db2b76f11a Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Fri, 11 Aug 2023 11:03:56 -0700 Subject: [PATCH 14/50] fixed spacing and alpha order --- pathml/__init__.py | 7 +++---- pathml/inference/__init__.py | 10 +++++----- pathml/inference/inference.py | 7 +++++-- tests/inference_tests/test_inference.py | 14 +++++++------- 4 files changed, 20 insertions(+), 18 deletions(-) diff --git a/pathml/__init__.py b/pathml/__init__.py index 1889e4be..5865c6ea 100644 --- a/pathml/__init__.py +++ b/pathml/__init__.py @@ -1,12 +1,11 @@ """ -Copyright 2021, Dana-Farber Cancer Institute and Weill Cornell Medicine +Copyright 2023, Dana-Farber Cancer Institute and Weill Cornell Medicine License: GNU GPL 2.0 """ from . import datasets as ds -from . import ml +from . import inference, ml from . import preprocessing as pp -from . 
import inference from ._logging import PathMLLogger from ._version import __version__ -from .core import * # noqa: F403 \ No newline at end of file +from .core import * # noqa: F403 diff --git a/pathml/inference/__init__.py b/pathml/inference/__init__.py index bf14de1f..dd2b9a39 100644 --- a/pathml/inference/__init__.py +++ b/pathml/inference/__init__.py @@ -4,10 +4,10 @@ """ from .inference import ( - remove_initializer_from_input, - check_onnx_clean, - InferenceBase, - Inference, HaloAIInference, + Inference, + InferenceBase, RemoteTestHoverNet, -) \ No newline at end of file + check_onnx_clean, + remove_initializer_from_input, +) diff --git a/pathml/inference/inference.py b/pathml/inference/inference.py index 880a4cbf..4274bc35 100644 --- a/pathml/inference/inference.py +++ b/pathml/inference/inference.py @@ -4,12 +4,15 @@ """ import os + import numpy as np -import pathml.preprocessing.transforms as Transforms import onnx import onnxruntime import requests +import pathml.preprocessing.transforms as Transforms + + def remove_initializer_from_input(model_path, new_path): """Removes initializers from HaloAI ONNX models @@ -332,4 +335,4 @@ def apply(self, tile): def remove(self): # remove the temp.onnx model - os.remove(self.model_path) \ No newline at end of file + os.remove(self.model_path) diff --git a/tests/inference_tests/test_inference.py b/tests/inference_tests/test_inference.py index a91bb1b7..4fef292e 100644 --- a/tests/inference_tests/test_inference.py +++ b/tests/inference_tests/test_inference.py @@ -1,19 +1,19 @@ import os + import numpy as np import onnx -import onnxruntime as ort -import pytest from pathml.inference import ( - remove_initializer_from_input, - check_onnx_clean, - InferenceBase, - Inference, HaloAIInference, + Inference, + InferenceBase, RemoteTestHoverNet, + check_onnx_clean, + remove_initializer_from_input, ) + def test_remove_initializer_from_input(): # Create a temporary ONNX model file model_path = "test_model.onnx" @@ -156,4 +156,4 
@@ def test_RemoteTestHoverNet(tileHE): inference.apply(tileHE) assert np.array_equal(tileHE.image, inference.F(orig_im)) - inference.remove() \ No newline at end of file + inference.remove() From 35a3df1611e8b85dd942ca27f06f20c3e4ee9c2a Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Fri, 11 Aug 2023 11:25:06 -0700 Subject: [PATCH 15/50] added dependencies --- environment.yml | 2 ++ pathml/inference/inference.py | 1 - 2 files changed, 2 insertions(+), 1 deletion(-) diff --git a/environment.yml b/environment.yml index c140b04d..fc11831e 100644 --- a/environment.yml +++ b/environment.yml @@ -23,6 +23,8 @@ dependencies: - python-javabridge==4.0.0 - protobuf==3.20.1 - deepcell==0.11.0 + - onnx==1.14.0 + - onnxruntime==1.15.1 - opencv-contrib-python==4.5.3.56 - openslide-python==1.2.0 - scanpy==1.8.2 diff --git a/pathml/inference/inference.py b/pathml/inference/inference.py index 4274bc35..83ec0093 100644 --- a/pathml/inference/inference.py +++ b/pathml/inference/inference.py @@ -13,7 +13,6 @@ import pathml.preprocessing.transforms as Transforms - def remove_initializer_from_input(model_path, new_path): """Removes initializers from HaloAI ONNX models Taken from https://github.com/microsoft/onnxruntime/blob/main/tools/python/remove_initializer_from_input.py From c015ff866faf0a3a669404ee9c8845686291fb79 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Fri, 11 Aug 2023 11:33:40 -0700 Subject: [PATCH 16/50] re black the test inference file --- tests/inference_tests/test_inference.py | 1 - 1 file changed, 1 deletion(-) diff --git a/tests/inference_tests/test_inference.py b/tests/inference_tests/test_inference.py index 4fef292e..27446324 100644 --- a/tests/inference_tests/test_inference.py +++ b/tests/inference_tests/test_inference.py @@ -13,7 +13,6 @@ ) - def test_remove_initializer_from_input(): # Create a temporary ONNX model file model_path = "test_model.onnx" From 0dd09b8a3dda2420eaa607e61aac7f464cb8c1aa Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Mon, 14 Aug 2023 
07:47:53 -0700 Subject: [PATCH 17/50] update protobuf version in envi yml --- environment.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/environment.yml b/environment.yml index fc11831e..2cfddff9 100644 --- a/environment.yml +++ b/environment.yml @@ -21,7 +21,7 @@ dependencies: - pip: - python-bioformats==4.0.0 - python-javabridge==4.0.0 - - protobuf==3.20.1 + - protobuf==3.20.2 - deepcell==0.11.0 - onnx==1.14.0 - onnxruntime==1.15.1 From 5657efbe2b4444012c9d25895baf3354313143df Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Mon, 14 Aug 2023 08:01:11 -0700 Subject: [PATCH 18/50] changing numpy version --- environment.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/environment.yml b/environment.yml index 2cfddff9..2541b9b5 100644 --- a/environment.yml +++ b/environment.yml @@ -6,7 +6,7 @@ channels: dependencies: - pip==21.3.1 - - numpy==1.19.5 + - numpy==1.21.6 - scipy==1.7.3 - scikit-image==0.18.3 - matplotlib==3.5.1 From 0b7df6b827ffa3ce72cdcc42417fb47168737705 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Mon, 14 Aug 2023 08:35:04 -0700 Subject: [PATCH 19/50] adjusting deepcel version --- environment.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/environment.yml b/environment.yml index 2541b9b5..258ed401 100644 --- a/environment.yml +++ b/environment.yml @@ -22,7 +22,8 @@ dependencies: - python-bioformats==4.0.0 - python-javabridge==4.0.0 - protobuf==3.20.2 - - deepcell==0.11.0 + # - deepcell==0.11.0 + - deepcell==0.12.7 - onnx==1.14.0 - onnxruntime==1.15.1 - opencv-contrib-python==4.5.3.56 From 4612a68396c9ef125ca8df4928339dfc2956b22f Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Mon, 14 Aug 2023 09:03:00 -0700 Subject: [PATCH 20/50] deleted comment from yml file --- environment.yml | 1 - 1 file changed, 1 deletion(-) diff --git a/environment.yml b/environment.yml index 258ed401..cc4308a6 100644 --- a/environment.yml +++ b/environment.yml @@ -22,7 +22,6 @@ dependencies: - 
python-bioformats==4.0.0 - python-javabridge==4.0.0 - protobuf==3.20.2 - # - deepcell==0.11.0 - deepcell==0.12.7 - onnx==1.14.0 - onnxruntime==1.15.1 From 4cd57a5844cf2219daf09bffb98db139a28a27f1 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Mon, 14 Aug 2023 09:24:16 -0700 Subject: [PATCH 21/50] updating pytest version --- environment.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/environment.yml b/environment.yml index cc4308a6..d00aca02 100644 --- a/environment.yml +++ b/environment.yml @@ -15,7 +15,8 @@ dependencies: - h5py==3.1.0 - dask==2021.12.0 - pydicom==2.2.2 - - pytest==6.2.5 + # - pytest==6.2.5 + - pytest==7.4.0 - pre-commit==2.16.0 - coverage==5.5 - pip: From 05f19e76ed83e83ee549024147af47d28222ea75 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Mon, 14 Aug 2023 09:51:04 -0700 Subject: [PATCH 22/50] setting pandas version --- environment.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/environment.yml b/environment.yml index d00aca02..a8c7a5b9 100644 --- a/environment.yml +++ b/environment.yml @@ -27,7 +27,8 @@ dependencies: - onnx==1.14.0 - onnxruntime==1.15.1 - opencv-contrib-python==4.5.3.56 - - openslide-python==1.2.0 + - openslide-python==1.2.0 + - pandas==1.5.2 - scanpy==1.8.2 - anndata==0.7.8 - tqdm==4.62.3 From ddb1b07d537f419f3a64e7453cc9b0077704c50b Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Mon, 14 Aug 2023 10:11:04 -0700 Subject: [PATCH 23/50] adding test onnx and fixing path in test file --- tests/inference_tests/test_inference.py | 4 ++-- tests/testdata/random_model.onnx | 23 +++++++++++++++++++++++ 2 files changed, 25 insertions(+), 2 deletions(-) create mode 100644 tests/testdata/random_model.onnx diff --git a/tests/inference_tests/test_inference.py b/tests/inference_tests/test_inference.py index 27446324..03e1cdc3 100644 --- a/tests/inference_tests/test_inference.py +++ b/tests/inference_tests/test_inference.py @@ -126,7 +126,7 @@ def test_InferenceBase(): def test_Inference(tileHE): 
- new_path = "../random_model.onnx" + new_path = "../testdata/andom_model.onnx" inference = Inference( model_path=new_path, input_name="data", num_classes=1, model_type="segmentation" @@ -138,7 +138,7 @@ def test_Inference(tileHE): def test_HaloAIInference(tileHE): - new_path = "../random_model.onnx" + new_path = "../testdata/andom_model.onnx" inference = HaloAIInference( model_path=new_path, input_name="data", num_classes=1, model_type="segmentation" diff --git a/tests/testdata/random_model.onnx b/tests/testdata/random_model.onnx new file mode 100644 index 00000000..3f028573 --- /dev/null +++ b/tests/testdata/random_model.onnx @@ -0,0 +1,23 @@ +pytorch2.0.0:ÿ +‘ +data + conv.weight + conv.bias3 +/conv/Conv"Conv* + dilations@@ * +group * + kernel_shape@@ * +pads@@@@ * +strides@@  torch_jit*…B conv.weightJlÚã>½¦=ãŒ*½…&¬= R¼N¹½Qp€=R·.¾p&r½Dè2>Ì4Å=d2#½ÝS½é‡?>˜ä<}2r½ù).<|V~;¾±ý@½HE8¾@Ó>ÅLô½/¶/>Ëñ~½Æ…˼s. ¾*B conv.biasJ œA¾Z +data + + + +ô +ôb +3 + + + +ô +ôB \ No newline at end of file From af07fb0922080d5a033e9641158816d86b6ee500 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Mon, 14 Aug 2023 11:05:50 -0700 Subject: [PATCH 24/50] fixing remote test --- tests/inference_tests/test_inference.py | 24 ++++++++++++++++++------ 1 file changed, 18 insertions(+), 6 deletions(-) diff --git a/tests/inference_tests/test_inference.py b/tests/inference_tests/test_inference.py index 03e1cdc3..2a5d9d3d 100644 --- a/tests/inference_tests/test_inference.py +++ b/tests/inference_tests/test_inference.py @@ -3,6 +3,7 @@ import numpy as np import onnx +from pathml.core import SlideData from pathml.inference import ( HaloAIInference, Inference, @@ -126,7 +127,7 @@ def test_InferenceBase(): def test_Inference(tileHE): - new_path = "../testdata/andom_model.onnx" + new_path = "../testdata/random_model.onnx" inference = Inference( model_path=new_path, input_name="data", num_classes=1, model_type="segmentation" @@ -138,7 +139,7 @@ def test_Inference(tileHE): def test_HaloAIInference(tileHE): - 
new_path = "../testdata/andom_model.onnx" + new_path = "../testdata/random_model.onnx" inference = HaloAIInference( model_path=new_path, input_name="data", num_classes=1, model_type="segmentation" @@ -148,11 +149,22 @@ def test_HaloAIInference(tileHE): assert np.array_equal(tileHE.image, inference.F(orig_im)) -def test_RemoteTestHoverNet(tileHE): +def test_RemoteTestHoverNet(): inference = RemoteTestHoverNet() - orig_im = tileHE.image - inference.apply(tileHE) - assert np.array_equal(tileHE.image, inference.F(orig_im)) + wsi = SlideData("../testdata/small_HE.svs") + + tiles = wsi.generate_tiles(shape=(256, 256), pad=False) + a = 0 + test_tile = None + + while a == 0: + for tile in tiles: + test_tile = tile + a += 1 + + orig_im = test_tile.image + inference.apply(test_tile) + assert np.array_equal(test_tile.image, inference.F(orig_im)) inference.remove() From 7048a4e3566eeb88a4109b79c37d33dd3c204ab1 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Mon, 14 Aug 2023 11:26:57 -0700 Subject: [PATCH 25/50] fixing path to onnx model in test data --- tests/inference_tests/test_inference.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/tests/inference_tests/test_inference.py b/tests/inference_tests/test_inference.py index 2a5d9d3d..8d812865 100644 --- a/tests/inference_tests/test_inference.py +++ b/tests/inference_tests/test_inference.py @@ -127,7 +127,7 @@ def test_InferenceBase(): def test_Inference(tileHE): - new_path = "../testdata/random_model.onnx" + new_path = "tests/testdata/random_model.onnx" inference = Inference( model_path=new_path, input_name="data", num_classes=1, model_type="segmentation" @@ -139,7 +139,7 @@ def test_Inference(tileHE): def test_HaloAIInference(tileHE): - new_path = "../testdata/random_model.onnx" + new_path = "tests/testdata/random_model.onnx" inference = HaloAIInference( model_path=new_path, input_name="data", num_classes=1, model_type="segmentation" @@ -152,7 +152,7 @@ def test_HaloAIInference(tileHE): def 
test_RemoteTestHoverNet(): inference = RemoteTestHoverNet() - wsi = SlideData("../testdata/small_HE.svs") + wsi = SlideData("tests/testdata/small_HE.svs") tiles = wsi.generate_tiles(shape=(256, 256), pad=False) a = 0 From f76314a8f6d43e864f2b408ff58a01c76bf6cb41 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Tue, 15 Aug 2023 11:08:31 -0700 Subject: [PATCH 26/50] changing numpy to latest version --- environment.yml | 9 ++++----- 1 file changed, 4 insertions(+), 5 deletions(-) diff --git a/environment.yml b/environment.yml index a8c7a5b9..e7a65761 100644 --- a/environment.yml +++ b/environment.yml @@ -6,7 +6,7 @@ channels: dependencies: - pip==21.3.1 - - numpy==1.21.6 + - numpy==1.25.2 # orig = 1.19.5 - scipy==1.7.3 - scikit-image==0.18.3 - matplotlib==3.5.1 @@ -15,20 +15,19 @@ dependencies: - h5py==3.1.0 - dask==2021.12.0 - pydicom==2.2.2 - # - pytest==6.2.5 - - pytest==7.4.0 + - pytest==7.4.0 # orig = 6.2.5 - pre-commit==2.16.0 - coverage==5.5 - pip: - python-bioformats==4.0.0 - python-javabridge==4.0.0 - protobuf==3.20.2 - - deepcell==0.12.7 + - deepcell==0.12.7 # orig = 0.11.0 - onnx==1.14.0 - onnxruntime==1.15.1 - opencv-contrib-python==4.5.3.56 - openslide-python==1.2.0 - - pandas==1.5.2 + - pandas==1.5.2 # orig no req - scanpy==1.8.2 - anndata==0.7.8 - tqdm==4.62.3 From 69c8ce623c854cd65a6bf075a880f8b5f81dc919 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Tue, 15 Aug 2023 11:32:07 -0700 Subject: [PATCH 27/50] adjusting numpy to 1.24.0 --- environment.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/environment.yml b/environment.yml index e7a65761..bdbfdcf7 100644 --- a/environment.yml +++ b/environment.yml @@ -6,7 +6,7 @@ channels: dependencies: - pip==21.3.1 - - numpy==1.25.2 # orig = 1.19.5 + - numpy==1.24.0 # orig = 1.19.5 - scipy==1.7.3 - scikit-image==0.18.3 - matplotlib==3.5.1 From a5d28ac82a6f1a4a2f7379bb7c808881ce70808b Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Tue, 15 Aug 2023 11:44:34 -0700 Subject: [PATCH 28/50] switching 
to numpy 1.22.4 --- environment.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/environment.yml b/environment.yml index bdbfdcf7..43d65319 100644 --- a/environment.yml +++ b/environment.yml @@ -6,7 +6,7 @@ channels: dependencies: - pip==21.3.1 - - numpy==1.24.0 # orig = 1.19.5 + - numpy==1.22.4 # orig = 1.19.5 - scipy==1.7.3 - scikit-image==0.18.3 - matplotlib==3.5.1 From c84cc247e83875eca7ab8c8af8d4565bde15a306 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Thu, 17 Aug 2023 13:28:36 -0700 Subject: [PATCH 29/50] adding pandas --- environment.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/environment.yml b/environment.yml index 43d65319..e8a5469e 100644 --- a/environment.yml +++ b/environment.yml @@ -27,8 +27,8 @@ dependencies: - onnxruntime==1.15.1 - opencv-contrib-python==4.5.3.56 - openslide-python==1.2.0 - - pandas==1.5.2 # orig no req - scanpy==1.8.2 - anndata==0.7.8 - tqdm==4.62.3 - loguru==0.5.3 + - pandas==1.5.2 # orig no req From 6c7268e59504d21119514e791e66b0586d9fd75e Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Wed, 6 Sep 2023 10:32:52 -0700 Subject: [PATCH 30/50] adding repr tests --- tests/inference_tests/test_inference.py | 16 ++++++++++++++++ 1 file changed, 16 insertions(+) diff --git a/tests/inference_tests/test_inference.py b/tests/inference_tests/test_inference.py index 8d812865..806bef7f 100644 --- a/tests/inference_tests/test_inference.py +++ b/tests/inference_tests/test_inference.py @@ -107,6 +107,10 @@ def test_InferenceBase(): for key in test.model_card: assert key == test.model_card[key], f"function for {key} is not working" + assert "Base class for all ONNX models" == repr(test) + + assert test.model_card == test.get_model_card() + # test reshape function random = np.random.rand(1, 2, 3) assert test.reshape(random).shape == ( @@ -137,6 +141,8 @@ def test_Inference(tileHE): inference.apply(tileHE) assert np.array_equal(tileHE.image, inference.F(orig_im)) + assert repr(inference) == "Class to 
handle ONNX model locally stored at {new_path}" + def test_HaloAIInference(tileHE): new_path = "tests/testdata/random_model.onnx" @@ -148,6 +154,11 @@ def test_HaloAIInference(tileHE): inference.apply(tileHE) assert np.array_equal(tileHE.image, inference.F(orig_im)) + assert ( + repr(inference) + == "Class to handle HALO AI ONNX model locally stored at {new_path}" + ) + def test_RemoteTestHoverNet(): inference = RemoteTestHoverNet() @@ -167,4 +178,9 @@ def test_RemoteTestHoverNet(): inference.apply(test_tile) assert np.array_equal(test_tile.image, inference.F(orig_im)) + assert ( + repr(inference) + == "Class to handle remote TIAToolBox HoverNet test ONNX. See model card for citation." + ) + inference.remove() From c4c2795dc826f4cdfb582e64ae723237e339a76b Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Wed, 6 Sep 2023 10:37:05 -0700 Subject: [PATCH 31/50] fixing print statements in repr tests --- tests/inference_tests/test_inference.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/tests/inference_tests/test_inference.py b/tests/inference_tests/test_inference.py index 806bef7f..dd3c51fa 100644 --- a/tests/inference_tests/test_inference.py +++ b/tests/inference_tests/test_inference.py @@ -141,7 +141,7 @@ def test_Inference(tileHE): inference.apply(tileHE) assert np.array_equal(tileHE.image, inference.F(orig_im)) - assert repr(inference) == "Class to handle ONNX model locally stored at {new_path}" + assert repr(inference) == f"Class to handle ONNX model locally stored at {new_path}" def test_HaloAIInference(tileHE): @@ -156,7 +156,7 @@ def test_HaloAIInference(tileHE): assert ( repr(inference) - == "Class to handle HALO AI ONNX model locally stored at {new_path}" + == f"Class to handle HALO AI ONNX model locally stored at {new_path}" ) From 2b0263ef818b58b3c20179282c0f64c49bfe95d2 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Thu, 7 Sep 2023 08:03:50 -0700 Subject: [PATCH 32/50] adding example notebook and fixing comments in inference file --- 
examples/InferenceOnnx_tutorial.ipynb | 805 ++++++++++++++++++++++++++ pathml/inference/inference.py | 3 - 2 files changed, 805 insertions(+), 3 deletions(-) create mode 100644 examples/InferenceOnnx_tutorial.ipynb diff --git a/examples/InferenceOnnx_tutorial.ipynb b/examples/InferenceOnnx_tutorial.ipynb new file mode 100644 index 00000000..98c67052 --- /dev/null +++ b/examples/InferenceOnnx_tutorial.ipynb @@ -0,0 +1,805 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "c4e08d2c-f53e-4366-888d-ab72819b4c2f", + "metadata": {}, + "source": [ + "# PathML ONNX Tutorial\n", + "\n", + "Written by James Wen. James_Wen@dfci.harvard.edu. \n", + "\n", + "[![View on GitHub](https://img.shields.io/badge/View-on%20GitHub-lightgrey?logo=github)](https://github.com/Dana-Farber-AIOS/pathml/blob/master/examples/)\n", + "\n", + "## Updates\n", + "August 09, 2023\n", + "- Simplified the class name structure\n", + "- Added \"model cards\" via base class\n", + "- Added setter functions to the base class to edit model card\n", + "- New fxn to check if model is clean (without initializers in the input graph) \n", + "\n", + "## Introduction\n", + "\n", + "This notebook is a tutorial on how to use the future ONNX `inference` feature in PathML. \n", + "\n", + "Some notes:\n", + "- The ONNX inference pipeline uses the existing PathML Pipeline and Transforms infrastructure.\n", + " - ONNX labels are saved to a `pathml.core.slide_data.SlideData` object as `tiles`.\n", + " - Users can iterate over the tiles as they would when using this feature for preprocessing. \n", + "- Preprocessing images before inference\n", + " - Users will need to create their own bespoke `pathml.preprocessing.transforms.transform` method to preprocess images before inference if necessary.\n", + " - A guide on how to create preprocessing pipelines is [here](https://pathml.readthedocs.io/en/latest/creating_pipelines.html). 
\n", + " - A guide on how to run preprocessing pipelines is [here](https://pathml.readthedocs.io/en/latest/running_pipelines.html). \n", + "- ONNX Model Initializers \n", + " - ONNX models often have neural network initializers stored in the input graph. This means that the user is expected to specify initializer values when running inference. To solve this issue, we have a function that removes the network initializers from the input graph. This functions is adopted from the `onnxruntime` [github](https://github.com/microsoft/onnxruntime/blob/main/tools/python/remove_initializer_from_input.py). \n", + " - We also have a function that checks if the initializers have been removed from the input graph before running inference. Both of these functions are described more below. \n", + "- When using a model stored remotely on HuggingFace, the model is *downloaded locally* before being used. The user will need to delete the model after running `Pipeline` with a method that comes with the model class. An example of how to do this is below. \n", + "\n", + "## Quick Sample Code\n", + "- Below is an example of how users would use the ONNX inference feature in PathML with a locally stored model.\n", + "```python\n", + "# load packages\n", + "from pathml.core import SlideData\n", + "\n", + "from pathml.preprocessing import Pipeline\n", + "import pathml.preprocessing.transforms as Transforms\n", + "\n", + "from pathml.inference import Inference, remove_initializer_from_input\n", + "\n", + "# Define slide path\n", + "slide_path = 'PATH TO SLIDE'\n", + "\n", + "# Set path to model \n", + "model_path = 'PATH TO ONNX MODEL'\n", + "# Define path to export fixed model\n", + "new_path = 'PATH TO SAVE NEW ONNX MODEL'\n", + "\n", + "# Fix the ONNX model by removing initializers. Save new model to `new_path`. 
\n", + "remove_initializer_from_input(model_path, new_path) \n", + "\n", + "inference = Inference(model_path = new_path, input_name = 'data', num_classes = 8, model_type = 'segmentation')\n", + "\n", + "# Create a transformation list\n", + "transformation_list = [\n", + " inference\n", + "] \n", + "\n", + "# Initialize pathml.core.slide_data.SlideData object\n", + "wsi = SlideData(slide_path, stain = 'Fluor')\n", + "\n", + "# Set up PathML pipeline\n", + "pipeline = Pipeline(transformation_list)\n", + "\n", + "# Run Inference\n", + "wsi.run(pipeline, tile_size = 1280, level = 0)\n", + "```\n", + "\n", + "- Below is an example of how users would use the ONNX inference feature in PathML with a model stored in the public HuggingFace repository.\n", + "```python\n", + "# load packages\n", + "from pathml.core import SlideData\n", + "\n", + "from pathml.preprocessing import Pipeline\n", + "import pathml.preprocessing.transforms as Transforms\n", + "\n", + "from pathml.inference import RemoteTestHoverNet\n", + "\n", + "# Define slide path\n", + "slide_path = 'PATH TO SLIDE'\n", + "\n", + "inference = RemoteTestHoverNet()\n", + "\n", + "# Create a transformation list\n", + "transformation_list = [\n", + " inference\n", + "] \n", + "\n", + "# Initialize pathml.core.slide_data.SlideData object\n", + "wsi = SlideData(slide_path)\n", + "\n", + "# Set up PathML pipeline\n", + "pipeline = Pipeline(transformation_list)\n", + "\n", + "# Run Inference\n", + "wsi.run(pipeline, tile_size = 256)\n", + "\n", + "# DELETE ONNX MODEL DOWNLOADED FROM HUGGINGFACE\n", + "inference.remove() \n", + "```" + ] + }, + { + "cell_type": "markdown", + "id": "886a74a3-b905-40dd-9b3e-4e1b90918f9b", + "metadata": {}, + "source": [ + "## Load Packages\n", + "\n", + "**NOTE**\n", + "- Please put in your environment name in the following line if you are using a jupyter notebook. If not, you may remove this line. 
\n", + " `os.environ[\"JAVA_HOME\"] = \"/opt/conda/envs/YOUR ENVIRONMENET NAME\"` " + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "id": "436b91f3-6338-4043-8742-496b354544aa", + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "os.environ[\"JAVA_HOME\"] = \"/opt/conda/envs/YOUR ENVIRONMENET NAME\" # TO DO: CHANGE THIS TO YOUR ENVIRONMENT NAME\n", + "import numpy as np \n", + "import onnx\n", + "import onnxruntime as ort \n", + "import requests\n", + "\n", + "from pathml.core import SlideData, Tile\n", + "from dask.distributed import Client\n", + "from pathml.preprocessing import Pipeline\n", + "import pathml.preprocessing.transforms as Transforms\n", + "\n", + "from pathml.inference import (\n", + " HaloAIInference,\n", + " Inference,\n", + " InferenceBase,\n", + " RemoteTestHoverNet,\n", + " check_onnx_clean,\n", + " remove_initializer_from_input,\n", + ")" + ] + }, + { + "cell_type": "markdown", + "id": "34e9fb8c-0148-4184-ba6b-cf5dae63a869", + "metadata": {}, + "source": [ + "## ONNX Inference Class and ONNX Model Fixer\n", + "\n", + "- Here is the raw code for the functions that handle the initializers in the ONNX model and the classes that run the inference.\n", + "\n", + "### Functions to remove initializers and check that initializers have been removed.\n", + "\n", + "- `remove_initializer_from_input`\n", + " - This function removes any initializers from the input graph of the ONNX model.\n", + " - Without removing the initializers from the input graph, users will not be able to run inference.\n", + " - Adapted from the `onnxruntime` [github](https://github.com/microsoft/onnxruntime/blob/main/tools/python/remove_initializer_from_input.py). 
\n", + " - Users specify:\n", + " - `model_path` (str): path to ONNX model,\n", + " - `new_path` (str): path to save adjusted model w/o initializers\n", + " - We will run this function on all models placed in our model zoo, so users will not have to run it unless they are working with their own local models.\n", + " \n", + "
\n", + " \n", + "- `check_onnx_clean`\n", + " - Checks if the initializers are in the input graph\n", + " - Returns `True` if there are initializers in the input graph (the `Inference` class raises a `ValueError` in that case)\n", + " - Adapted from the `onnxruntime` [github](https://github.com/microsoft/onnxruntime/blob/main/tools/python/remove_initializer_from_input.py). \n", + " - Users specify:\n", + " - `model_path` (str): path to ONNX model\n", + "\n", + "### Inference Classes\n", + "\n", + "
\n", + "\n", + "- `InferenceBase`\n", + " - This class inherits from `pathml.preprocessing.transforms.transform`, similar to all of the preprocessing transformations. Inheriting from `transforms.transform` allows us to use the existing `Pipeline` function in PathML which users should be familiar with. \n", + " - This is the base class for all Inference classes for ONNX modeling\n", + " - Each instance of a class also comes with a `model_card` which specifies certain details of the model in dictionary form. The default parameters are:\n", + " - ```python \n", + " self.model_card = {\n", + " 'name' : None, \n", + " 'num_classes' : None,\n", + " 'model_type' : None, \n", + " 'notes' : None, \n", + " 'model_input_notes': None, \n", + " 'model_output_notes' : None,\n", + " 'citation': None \n", + " } \n", + " ``` \n", + " - Model cards are where important information about the model should be kept. Since they are in dictionary form, the user can add keys and values as they see fit. \n", + " - This class also has getter and setter functions to adjust the `model_card`. Certain functions include `get_model_card`, `set_name`, `set_num_classes`, etc. \n", + " \n", + "
\n", + " \n", + "- `Inference` \n", + " - This class is for when the user wants to use an ONNX model stored locally. \n", + " - Calls the `check_onnx_clean` function to check if the model is clean.\n", + " - Users specify:\n", + " - `model_path` (str): path to ONNX model,\n", + " - `input_name` (str): name of input for ONNX model, *defaults to `data`* \n", + " - `num_classes` (int): number of outcome classes, \n", + " - `model_type` (str): type of model (classification, segmentation) \n", + " - `local` (bool): if you are using a local model or a remote model, *defaults to `True`* \n", + " \n", + "
\n", + " \n", + "- `HaloAIInference`\n", + " - This class inherits from `Inference`\n", + " - HaloAI ONNX models always return 20 prediction maps: this class will subset and return the necessary ones. \n", + "\n", + "
\n", + "\n", + "- `RemoteTestHoverNet` \n", + " - This class inherits from `Inference` and is the test class for public models hosted on `HuggingFace`. \n", + " - `local` is automatically set to `False` \n", + " - Our current test model is a HoverNet from [TIAToolbox](https://github.com/TissueImageAnalytics/tiatoolbox)\n", + " - Pocock J, Graham S, Vu QD, Jahanifar M, Deshpande S, Hadjigeorghiou G, Shephard A, Bashir RM, Bilal M, Lu W, Epstein D. TIAToolbox as an end-to-end library for advanced tissue image analytics. Communications medicine. 2022 Sep 24;2(1):120.\n", + " - Its `model_card` is:\n", + " - ```python \n", + " {'name': 'Tiabox HoverNet Test',\n", + " 'num_classes': 5,\n", + " 'model_type': 'Segmentation',\n", + " 'notes': None,\n", + " 'model_input_notes': 'Accepts tiles of 256 x 256',\n", + " 'model_output_notes': None,\n", + " 'citation': 'Pocock J, Graham S, Vu QD, Jahanifar M, Deshpande S, Hadjigeorghiou G, Shephard A, Bashir RM, Bilal M, Lu W, Epstein D. TIAToolbox as an end-to-end library for advanced tissue image analytics. Communications medicine. 2022 Sep 24;2(1):120.'}\n", + " ```\n", + " \n", + "### Raw Code\n", + "\n", + "Below is the raw code for your convenience. You can also find the raw code on our github. 
\n", + "[![View on GitHub](https://img.shields.io/badge/View-on%20GitHub-lightgrey?logo=github)](https://github.com/Dana-Farber-AIOS/pathml/tree/master/pathml)" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "3339cf66-8de6-4af1-9d3e-7312cd69eb33", + "metadata": {}, + "outputs": [], + "source": [ + "def remove_initializer_from_input(model_path, new_path):\n", + " \"\"\"Removes initializers from HaloAI ONNX models\n", + " Taken from https://github.com/microsoft/onnxruntime/blob/main/tools/python/remove_initializer_from_input.py\n", + "\n", + " Args:\n", + " model_path (str): path to ONNX model,\n", + " new_path (str): path to save adjusted model w/o initializers,\n", + "\n", + " Returns:\n", + " ONNX model w/o initializers to run inference using PathML\n", + " \"\"\"\n", + "\n", + " model = onnx.load(model_path)\n", + "\n", + " inputs = model.graph.input\n", + " name_to_input = {}\n", + " for onnx_input in inputs:\n", + " name_to_input[onnx_input.name] = onnx_input\n", + "\n", + " for initializer in model.graph.initializer:\n", + " if initializer.name in name_to_input:\n", + " inputs.remove(name_to_input[initializer.name])\n", + "\n", + " onnx.save(model, new_path)\n", + "\n", + "\n", + "def check_onnx_clean(model_path):\n", + " \"\"\"Checks if the model has had it's initalizers removed from input graph.\n", + " Adapted from from https://github.com/microsoft/onnxruntime/blob/main/tools/python/remove_initializer_from_input.py\n", + "\n", + " Args:\n", + " model_path (str): path to ONNX model,\n", + "\n", + " Returns:\n", + " Boolean if there are initializers in input graph.\n", + " \"\"\"\n", + "\n", + " model = onnx.load(model_path)\n", + "\n", + " inputs = model.graph.input\n", + " name_to_input = {}\n", + " for onnx_input in inputs:\n", + " name_to_input[onnx_input.name] = onnx_input\n", + "\n", + " for initializer in model.graph.initializer:\n", + " if initializer.name in name_to_input:\n", + " return True\n", + "\n", + "\n", + "# Base 
class\n", + "class InferenceBase(Transforms.Transform):\n", + " \"\"\"\n", + " Base class for all ONNX Models.\n", + " Each transform must operate on a Tile.\n", + " \"\"\"\n", + "\n", + " def __init__(self):\n", + " self.model_card = {\n", + " \"name\": None,\n", + " \"num_classes\": None,\n", + " \"model_type\": None,\n", + " \"notes\": None,\n", + " \"model_input_notes\": None,\n", + " \"model_output_notes\": None,\n", + " \"citation\": None,\n", + " }\n", + "\n", + " def __repr__(self):\n", + " return \"Base class for all ONNX models\"\n", + "\n", + " def get_model_card(self):\n", + " return self.model_card\n", + "\n", + " def set_name(self, name):\n", + " self.model_card[\"name\"] = name\n", + "\n", + " def set_num_classes(self, num):\n", + " self.model_card[\"num_classes\"] = num\n", + "\n", + " def set_model_type(self, model_type):\n", + " self.model_card[\"model_type\"] = model_type\n", + "\n", + " def set_notes(self, note):\n", + " self.model_card[\"notes\"] = note\n", + "\n", + " def set_model_input_notes(self, note):\n", + " self.model_card[\"model_input_notes\"] = note\n", + "\n", + " def set_model_output_notes(self, note):\n", + " self.model_card[\"model_output_notes\"] = note\n", + "\n", + " def set_citation(self, citation):\n", + " self.model_card[\"citation\"] = citation\n", + "\n", + " def reshape(self, image):\n", + " \"\"\"standard reshaping of tile image\"\"\"\n", + " # flip dimensions\n", + " # follows convention used here https://github.com/Dana-Farber-AIOS/pathml/blob/master/pathml/ml/dataset.py\n", + "\n", + " if image.ndim == 3:\n", + " # swap axes from HWC to CHW\n", + " image = image.transpose(2, 0, 1)\n", + " # add a dimesion bc onnx models usually have batch size as first dim: e.g. 
(1, channel, height, width)\n", + " image = np.expand_dims(image, axis=0)\n", + "\n", + " return image\n", + " else:\n", + " # in this case, we assume that we have XYZCT channel order\n", + " # so we swap axes to TCZYX for batching\n", + " # note we are not adding a dim here for batch bc we assume that subsetting will create a batch \"placeholder\" dim\n", + " image = image.T\n", + "\n", + " return image\n", + "\n", + " def F(self, target):\n", + " \"\"\"functional implementation\"\"\"\n", + " raise NotImplementedError\n", + "\n", + " def apply(self, tile):\n", + " \"\"\"modify Tile object in-place\"\"\"\n", + " raise NotImplementedError\n", + "\n", + "\n", + "# class to handle local onnx models\n", + "class Inference(InferenceBase):\n", + " \"\"\"Transformation to run inferrence on ONNX model.\n", + "\n", + " Assumptions:\n", + " - The ONNX model has been cleaned by `remove_initializer_from_input` first\n", + "\n", + " Args:\n", + " model_path (str): path to ONNX model w/o initializers,\n", + " input_name (str): name of the input the ONNX model accepts\n", + " \"\"\"\n", + "\n", + " def __init__(\n", + " self,\n", + " model_path=None,\n", + " input_name=\"data\",\n", + " num_classes=None,\n", + " model_type=None,\n", + " local=True,\n", + " ):\n", + " super().__init__()\n", + "\n", + " self.input_name = input_name\n", + " self.num_classes = num_classes\n", + " self.model_type = model_type\n", + " self.local = local\n", + "\n", + " if self.local:\n", + " # using a local onnx model\n", + " self.model_path = model_path\n", + " else:\n", + " # if using a model from the model zoo, set the local path to a temp file\n", + " self.model_path = \"temp.onnx\"\n", + "\n", + " # fill in parts of the model_card with the following info\n", + " self.model_card[\"num_classes\"] = self.num_classes\n", + " self.model_card[\"model_type\"] = self.model_type\n", + "\n", + " # check if there are initializers in input graph if using a local model\n", + " if local:\n", + " if 
check_onnx_clean(model_path):\n", + " raise ValueError(\n", + " \"The ONNX model still has graph initializers in the input graph. Use `remove_initializer_from_input` to remove them.\"\n", + " )\n", + " else:\n", + " pass\n", + "\n", + " def __repr__(self):\n", + " if self.local:\n", + " return f\"Class to handle ONNX model locally stored at {self.model_path}\"\n", + " else:\n", + " return f\"Class to handle a {self.model_card['model_name']} from the PathML model zoo.\"\n", + "\n", + " def inference(self, image):\n", + " # reshape the image\n", + " image = self.reshape(image)\n", + "\n", + " # load fixed model\n", + " onnx_model = onnx.load(self.model_path)\n", + "\n", + " # check tile dimensions match ONNX input dimensions\n", + " input_node = onnx_model.graph.input\n", + "\n", + " dimensions = []\n", + " for input in input_node:\n", + " if input.name == self.input_name:\n", + " input_shape = input.type.tensor_type.shape.dim\n", + " for dim in input_shape:\n", + " dimensions.append(dim.dim_value)\n", + "\n", + " assert (\n", + " image.shape[-1] == dimensions[-1] and image.shape[-2] == dimensions[-2]\n", + " ), f\"expecting tile shape of {dimensions[-2]} by {dimensions[-1]}, got {image.shape[-2]} by {image.shape[-1]}\"\n", + "\n", + " # check onnx model\n", + " onnx.checker.check_model(onnx_model)\n", + "\n", + " # start an inference session\n", + " ort_sess = onnxruntime.InferenceSession(self.model_path)\n", + "\n", + " # create model output, returns a list\n", + " model_output = ort_sess.run(None, {self.input_name: image.astype(\"f\")})\n", + "\n", + " return model_output\n", + "\n", + " def F(self, image):\n", + " # run inference function\n", + " prediction_map = self.inference(image)\n", + "\n", + " # single task model\n", + " if len(prediction_map) == 1:\n", + " # return first and only prediction array in the list\n", + " return prediction_map[0]\n", + "\n", + " # multi task model\n", + " else:\n", + " # concatenate prediction results\n", + " # assumes that the 
tasks all output prediction arrays of same dimension on H and W\n", + " result_array = np.concatenate(prediction_map, axis=1)\n", + " return result_array\n", + "\n", + " def apply(self, tile):\n", + " tile.image = self.F(tile.image)\n", + "\n", + "\n", + "class HaloAIInference(Inference):\n", + " \"\"\"Transformation to run inferrence on HALO AI ONNX model.\n", + "\n", + " Assumptions:\n", + " - Assumes that the ONNX model returns a tensor in which there is one prediction map for each class\n", + " - For example, if there are 5 classes, the ONNX model will output a (1, 5, Height, Weight) tensor\n", + " - If you select to argmax the classes, the class assumes a softmax or sigmoid has already been applied\n", + " - HaloAI ONNX models always have 20 class maps so you need to index into the first x maps if you have x classes\n", + "\n", + "\n", + " Args:\n", + " model_path (str): path to ONNX model w/o initializers,\n", + " num_classes (int): number of classes in the data,\n", + " input_name (str): name of the input the ONNX model accepts\n", + " \"\"\"\n", + "\n", + " def __init__(\n", + " self,\n", + " model_path=None,\n", + " input_name=\"data\",\n", + " num_classes=None,\n", + " model_type=None,\n", + " local=True,\n", + " ):\n", + " super().__init__(model_path, input_name, num_classes, model_type, local)\n", + "\n", + " self.model_card[\"num_classes\"] = self.num_classes\n", + " self.model_card[\"model_type\"] = self.model_type\n", + "\n", + " def __repr__(self):\n", + " return f\"Class to handle HALO AI ONNX model locally stored at {self.model_path}\"\n", + "\n", + " def F(self, image):\n", + " prediction_map = self.inference(image)\n", + "\n", + " prediction_map = prediction_map[0][:, 0 : self.num_classes, :, :]\n", + "\n", + " return prediction_map\n", + "\n", + " def apply(self, tile):\n", + " tile.image = self.F(tile.image)\n", + "\n", + "\n", + "# class to handle remote onnx models\n", + "class RemoteTestHoverNet(Inference):\n", + " \"\"\"Transformation to 
run inferrence on ONNX model.\n", + "\n", + " Citation for model:\n", + " Pocock J, Graham S, Vu QD, Jahanifar M, Deshpande S, Hadjigeorghiou G, Shephard A, Bashir RM, Bilal M, Lu W, Epstein D.\n", + " TIAToolbox as an end-to-end library for advanced tissue image analytics. Communications medicine. 2022 Sep 24;2(1):120.\n", + "\n", + " Args:\n", + " model_path (str): temp file name to download onnx from huggingface,\n", + " input_name (str): name of the input the ONNX model accepts\n", + " \"\"\"\n", + "\n", + " def __init__(\n", + " self,\n", + " model_path=\"temp.onnx\",\n", + " input_name=\"data\",\n", + " num_classes=5,\n", + " model_type=\"Segmentation\",\n", + " local=False,\n", + " ):\n", + " super().__init__(model_path, input_name, num_classes, model_type, local)\n", + "\n", + " # specify URL of the model in PathML public repository\n", + " url = \"https://huggingface.co/pathml/test/resolve/main/hovernet_fast_tiatoolbox_fixed.onnx\"\n", + "\n", + " # download model, save as temp.onnx\n", + " with open(self.model_path, \"wb\") as out_file:\n", + " content = requests.get(url, stream=True).content\n", + " out_file.write(content)\n", + "\n", + " self.model_card[\"num_classes\"] = self.num_classes\n", + " self.model_card[\"model_type\"] = self.model_type\n", + " self.model_card[\"name\"] = \"Tiabox HoverNet Test\"\n", + " self.model_card[\"model_input_notes\"] = \"Accepts tiles of 256 x 256\"\n", + " self.model_card[\n", + " \"citation\"\n", + " ] = \"Pocock J, Graham S, Vu QD, Jahanifar M, Deshpande S, Hadjigeorghiou G, Shephard A, Bashir RM, Bilal M, Lu W, Epstein D. TIAToolbox as an end-to-end library for advanced tissue image analytics. Communications medicine. 2022 Sep 24;2(1):120.\"\n", + "\n", + " def __repr__(self):\n", + " return \"Class to handle remote TIAToolBox HoverNet test ONNX. 
See model card for citation.\"\n", + "\n", + " def apply(self, tile):\n", + " tile.image = self.F(tile.image)\n", + "\n", + " def remove(self):\n", + " # remove the temp.onnx model\n", + " os.remove(self.model_path)\n" + ] + }, + { + "cell_type": "markdown", + "id": "8b28c79e-2453-42e5-9280-6c0d3ee082c0", + "metadata": {}, + "source": [ + "## Try it Yourself!\n", + "\n", + "- What you need:\n", + " - An ONNX model stored locally\n", + " - An image with which you want to run inference stored locally\n", + " - PathML already downloaded \n", + "\n", + "- Make sure to define the `Inference` class and `remove_initializer_from_input` above in the previous seciton if you have not downloaded the latest version of PathML.\n", + "\n", + "- You will need to define the following variables: \n", + " - `slide_path`: 'PATH TO SLIDE'\n", + " - `model_path`: 'PATH TO ONNX MODEL'\n", + " - `new_path`: 'PATH TO SAVE FIXED ONNX MODEL'\n", + " - `num_classes`: 'NUMBER OF CLASSES IN YOUR DATASET'\n", + " - `tile_size`: 'TILE SIZE THAT YOUR ONNX MODEL ACCEPTS'\n", + " \n", + "- The code in the cell below assumes you want the images passed in as is. If you need to select channels, you will need to add another `transform` method to do so before the inference transform. The following code provides an example if you want to subset into the first channel of an image. *Remember that PathML reads images in as XYZCT.* \n", + "\n", + "```python \n", + "class convert_format(Transforms.Transform):\n", + " def F(self, image):\n", + " # orig = (1280, 1280, 1, 6, 1) = (XYZCT)\n", + " image = image[:, :, :, 0, ...] 
# this will make the tile (1280, 1280, 1, 1)\n", + " return image\n", + "\n", + " def apply(self, tile):\n", + " tile.image = self.F(tile.image)\n", + " \n", + "convert = convert_format()\n", + "inference = Inference(\n", + " model_path = 'PATH TO LOCAL MODEL', \n", + " input_name = 'data', \n", + " num_classes = 'NUMBER OF CLASSES' , \n", + " model_type = 'CLASSIFICATION OR SEGMENTATION', \n", + " local = True)\n", + "\n", + "transformation_list = [convert, inference] \n", + "\n", + "```" + ] + }, + { + "cell_type": "markdown", + "id": "bcdeaac3-80ae-4e67-8aa9-8f4c637a92eb", + "metadata": {}, + "source": [ + "### Local ONNX Model Using the `Inference` Class" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0bc2f84e-e554-4770-aad9-c51fa1890ea6", + "metadata": {}, + "outputs": [], + "source": [ + "# Define slide path\n", + "slide_path = 'PATH TO SLIDE'\n", + "\n", + "# Set path to model \n", + "model_path = 'PATH TO ONNX MODEL'\n", + "# Define path to export fixed model\n", + "new_path = 'PATH TO SAVE NEW ONNX MODEL'\n", + "\n", + "\n", + "# Fix the ONNX model\n", + "remove_initializer_from_input(model_path, new_path) \n", + "\n", + "inference = Inference(model_path = new_path, input_name = 'data', num_classes = 'NUMBER OF CLASSES' , model_type = 'CLASSIFICATION OR SEGMENTATION', local = True)\n", + "\n", + "transformation_list = [inference] \n", + "\n", + "# Initialize pathml.core.slide_data.SlideData object\n", + "wsi = SlideData(slide_path)\n", + "\n", + "# Set up PathML pipeline\n", + "pipeline = Pipeline(transformation_list)\n", + "\n", + "# Run Inference\n", + "# Level is equal to 0 for highest resolution (Note that this is the default setting)\n", + "wsi.run(pipeline, tile_size = 'TILE SIZE THAT YOUR ONNX MODEL ACCEPTS', level = 0)" + ] + }, + { + "cell_type": "markdown", + "id": "bc7902dc-0113-4604-abe4-6f3a8588c0b5", + "metadata": {}, + "source": [ + "### Local ONNX Model Using the `HaloAIInference` Class" + ] + }, + { + "cell_type": 
"code", + "execution_count": null, + "id": "d2eedbf1-be61-440e-a044-6dce4c8de04e", + "metadata": {}, + "outputs": [], + "source": [ + "# Define slide path\n", + "slide_path = 'PATH TO SLIDE'\n", + "\n", + "# Set path to model \n", + "model_path = 'PATH TO ONNX MODEL'\n", + "# Define path to export fixed model\n", + "new_path = 'PATH TO SAVE NEW ONNX MODEL'\n", + "\n", + "\n", + "# Fix the ONNX model\n", + "remove_initializer_from_input(model_path, new_path) \n", + "\n", + "inference = HaloAIInference(model_path = new_path, input_name = 'data', num_classes = 'NUMBER OF CLASSES' , model_type = 'CLASSIFICATION OR SEGMENTATION', local = True)\n", + "\n", + "transformation_list = [inference] \n", + "\n", + "# Initialize pathml.core.slide_data.SlideData object\n", + "wsi = SlideData(slide_path)\n", + "\n", + "# Set up PathML pipeline\n", + "pipeline = Pipeline(transformation_list)\n", + "\n", + "# Run Inference\n", + "# Level is equal to 0 for highest resolution (Note that this is the default setting)\n", + "wsi.run(pipeline, tile_size = 'TILE SIZE THAT YOUR ONNX MODEL ACCEPTS', level = 0)" + ] + }, + { + "cell_type": "markdown", + "id": "431abad0-10ff-44fe-ba56-eb6402ce8e4c", + "metadata": {}, + "source": [ + "### Remote ONNX Using our `RemoteTestHoverNet` Class\n", + "- Uses a Hovernet from [TIAToolbox](https://github.com/TissueImageAnalytics/tiatoolbox) \n", + "- Note that the purpose of this model is to illustrate how PathML will handle future remote models. We plan on release more public models to our model zoo on HuggingFace in the future.\n", + "- Citation for model:\n", + " - Pocock J, Graham S, Vu QD, Jahanifar M, Deshpande S, Hadjigeorghiou G, Shephard A, Bashir RM, Bilal M, Lu W, Epstein D. TIAToolbox as an end-to-end library for advanced tissue image analytics. Communications medicine. 2022 Sep 24;2(1):120.\n", + "- Make sure your image has 3 channels! 
\n", + "- When the `RemoteTestHoverNet` is first initialized, it downloads the HoverNet from HuggingFace and saves it locally on your own system as `temp.onnx`. \n", + " - **You will need to remove it manually by calling the `remove()` method** An example of how to call this method is in the last line in the code below. " + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8976d60b-6e78-42ca-a52d-489911e580f4", + "metadata": {}, + "outputs": [], + "source": [ + "# Define slide path\n", + "slide_path = 'PATH TO SLIDE'\n", + "\n", + "inference = RemoteTestHoverNet()\n", + "\n", + "# Create a transformation list\n", + "transformation_list = [\n", + " inference\n", + "] \n", + "\n", + "# Initialize pathml.core.slide_data.SlideData object\n", + "wsi = SlideData(slide_path)\n", + "\n", + "# Set up PathML pipeline\n", + "pipeline = Pipeline(transformation_list)\n", + "\n", + "# Run Inference\n", + "wsi.run(pipeline, tile_size = 256)\n", + "\n", + "# DELETE ONNX MODEL DOWNLOADED FROM HUGGINGFACE\n", + "inference.remove() " + ] + }, + { + "cell_type": "markdown", + "id": "318ae957-73d8-4c7f-b87c-b012750eda10", + "metadata": {}, + "source": [ + "## Iterate over the tiles\n", + "\n", + "Now that you have your tiles saved to your SlideData object, you can now iterate over them.\n", + "\n", + "For example, if you wanted to check the shape of the tiles you could run the following code: \n", + "\n", + "```python\n", + "for tile in wsi.tiles: \n", + " print(tile.image.shape) \n", + "```" + ] + }, + { + "cell_type": "markdown", + "id": "fc5c89ae-400e-4380-a717-12800fb77d97", + "metadata": {}, + "source": [ + "## References\n", + "\n", + "- Pocock J, Graham S, Vu QD, Jahanifar M, Deshpande S, Hadjigeorghiou G, Shephard A, Bashir RM, Bilal M, Lu W, Epstein D. TIAToolbox as an end-to-end library for advanced tissue image analytics. Communications medicine. 
2022 Sep 24;2(1):120.\n", + "\n", + "- https://github.com/microsoft/onnxruntime/blob/main/tools/python/remove_initializer_from_input.py" + ] + } + ], + "metadata": { + "environment": { + "kernel": "james_test2", + "name": "pytorch-gpu.1-13.m105", + "type": "gcloud", + "uri": "gcr.io/deeplearning-platform-release/pytorch-gpu.1-13:m105" + }, + "kernelspec": { + "display_name": "james_test2", + "language": "python", + "name": "james_test2" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.8.15" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/pathml/inference/inference.py b/pathml/inference/inference.py index 83ec0093..958f97d6 100644 --- a/pathml/inference/inference.py +++ b/pathml/inference/inference.py @@ -63,7 +63,6 @@ def check_onnx_clean(model_path): # Base class -# I think this should still inherit from Transforms to make the tiling easier/so we don't have to rewrite so much existing code class InferenceBase(Transforms.Transform): """ Base class for all ONNX Models. @@ -235,7 +234,6 @@ def F(self, image): else: # concatenate prediction results # assumes that the tasks all output prediction arrays of same dimension on H and W - # To Do: figure out solution for way different tasks such as if a model does both segmentation and classification result_array = np.concatenate(prediction_map, axis=1) return result_array @@ -287,7 +285,6 @@ def apply(self, tile): # class to handle remote onnx models -# ToDo create function to remove model after tiling is done would be a sep line in workflow class RemoteTestHoverNet(Inference): """Transformation to run inferrence on ONNX model. 
From 1c462d2137f705e66017c362d72b1ff30fbba94c Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Thu, 7 Sep 2023 10:20:10 -0700 Subject: [PATCH 33/50] adding model w/ initializers, modified tests and notebook --- examples/InferenceOnnx_tutorial.ipynb | 33 +++++++++++----------- tests/inference_tests/test_inference.py | 10 +++++++ tests/testdata/model_with_initalizers.onnx | 3 ++ 3 files changed, 30 insertions(+), 16 deletions(-) create mode 100644 tests/testdata/model_with_initalizers.onnx diff --git a/examples/InferenceOnnx_tutorial.ipynb b/examples/InferenceOnnx_tutorial.ipynb index 98c67052..c2787b7a 100644 --- a/examples/InferenceOnnx_tutorial.ipynb +++ b/examples/InferenceOnnx_tutorial.ipynb @@ -1,6 +1,7 @@ { "cells": [ { + "attachments": {}, "cell_type": "markdown", "id": "c4e08d2c-f53e-4366-888d-ab72819b4c2f", "metadata": {}, @@ -11,13 +12,6 @@ "\n", "[![View on GitHub](https://img.shields.io/badge/View-on%20GitHub-lightgrey?logo=github)](https://github.com/Dana-Farber-AIOS/pathml/blob/master/examples/)\n", "\n", - "## Updates\n", - "August 09, 2023\n", - "- Simplified the class name structure\n", - "- Added \"model cards\" via base class\n", - "- Added setter functions to the base class to edit model card\n", - "- New fxn to check if model is clean (without initializers in the input graph) \n", - "\n", "## Introduction\n", "\n", "This notebook is a tutorial on how to use the future ONNX `inference` feature in PathML. \n", @@ -109,6 +103,7 @@ ] }, { + "attachments": {}, "cell_type": "markdown", "id": "886a74a3-b905-40dd-9b3e-4e1b90918f9b", "metadata": {}, @@ -150,6 +145,7 @@ ] }, { + "attachments": {}, "cell_type": "markdown", "id": "34e9fb8c-0148-4184-ba6b-cf5dae63a869", "metadata": {}, @@ -187,15 +183,14 @@ " - This is the base class for all Inference classes for ONNX modeling\n", " - Each instance of a class also comes with a `model_card` which specifies certain details of the model in dictionary form. 
The default parameters are:\n", " - ```python \n", - " self.model_card = {\n", - " 'name' : None, \n", - " 'num_classes' : None,\n", - " 'model_type' : None, \n", - " 'notes' : None, \n", - " 'model_input_notes': None, \n", - " 'model_output_notes' : None,\n", - " 'citation': None \n", - " } \n", + " self.model_card = {\n", + " 'name' : None, \n", + " 'num_classes' : None,\n", + " 'model_type' : None, \n", + " 'notes' : None, \n", + " 'model_input_notes': None, \n", + " 'model_output_notes' : None,\n", + " 'citation': None } \n", " ``` \n", " - Model cards are where important information about the model should be kept. Since they are in dictionary form, the user can add keys and values as they see fit. \n", " - This class also has getter and setter functions to adjust the `model_card`. Certain functions include `get_model_card`, `set_name`, `set_num_classes`, etc. \n", @@ -571,6 +566,7 @@ ] }, { + "attachments": {}, "cell_type": "markdown", "id": "8b28c79e-2453-42e5-9280-6c0d3ee082c0", "metadata": {}, @@ -617,6 +613,7 @@ ] }, { + "attachments": {}, "cell_type": "markdown", "id": "bcdeaac3-80ae-4e67-8aa9-8f4c637a92eb", "metadata": {}, @@ -659,6 +656,7 @@ ] }, { + "attachments": {}, "cell_type": "markdown", "id": "bc7902dc-0113-4604-abe4-6f3a8588c0b5", "metadata": {}, @@ -701,6 +699,7 @@ ] }, { + "attachments": {}, "cell_type": "markdown", "id": "431abad0-10ff-44fe-ba56-eb6402ce8e4c", "metadata": {}, @@ -746,6 +745,7 @@ ] }, { + "attachments": {}, "cell_type": "markdown", "id": "318ae957-73d8-4c7f-b87c-b012750eda10", "metadata": {}, @@ -763,6 +763,7 @@ ] }, { + "attachments": {}, "cell_type": "markdown", "id": "fc5c89ae-400e-4380-a717-12800fb77d97", "metadata": {}, diff --git a/tests/inference_tests/test_inference.py b/tests/inference_tests/test_inference.py index dd3c51fa..8a8c64fd 100644 --- a/tests/inference_tests/test_inference.py +++ b/tests/inference_tests/test_inference.py @@ -104,11 +104,14 @@ def test_InferenceBase(): test.set_citation("citation") + # test 
model card for key in test.model_card: assert key == test.model_card[key], f"function for {key} is not working" + # test repr function assert "Base class for all ONNX models" == repr(test) + # test get model card fxn assert test.model_card == test.get_model_card() # test reshape function @@ -143,6 +146,13 @@ def test_Inference(tileHE): assert repr(inference) == f"Class to handle ONNX model locally stored at {new_path}" + # test initializer catching + new_path = "tests/testdata/model_with_initalizers.onnx" + try: + inference = Inference(model_path=model_path, input_name="data", num_classes=1, model_type="segmentation") + except Exception as e: + assert str(e) == "The ONNX model still has graph initializers in the input graph. Use `remove_initializer_from_input` to remove them." + def test_HaloAIInference(tileHE): new_path = "tests/testdata/random_model.onnx" diff --git a/tests/testdata/model_with_initalizers.onnx b/tests/testdata/model_with_initalizers.onnx new file mode 100644 index 00000000..36e68494 --- /dev/null +++ b/tests/testdata/model_with_initalizers.onnx @@ -0,0 +1,3 @@ +:!* Binput_2Z +input_1Z +input_2 \ No newline at end of file From 640de9eade160e6fd1c40d3de7b5e28ae541cd1e Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Thu, 7 Sep 2023 10:20:48 -0700 Subject: [PATCH 34/50] fixed test format --- tests/inference_tests/test_inference.py | 33 ++++++++++++++++++++++--- 1 file changed, 29 insertions(+), 4 deletions(-) diff --git a/tests/inference_tests/test_inference.py b/tests/inference_tests/test_inference.py index 8a8c64fd..6fefa48c 100644 --- a/tests/inference_tests/test_inference.py +++ b/tests/inference_tests/test_inference.py @@ -147,11 +147,36 @@ def test_Inference(tileHE): assert repr(inference) == f"Class to handle ONNX model locally stored at {new_path}" # test initializer catching - new_path = "tests/testdata/model_with_initalizers.onnx" - try: - inference = Inference(model_path=model_path, input_name="data", num_classes=1, 
model_type="segmentation") + bad_model = "tests/testdata/model_with_initalizers.onnx" + try: + inference = Inference( + model_path=bad_model, + input_name="data", + num_classes=1, + model_type="segmentation", + ) except Exception as e: - assert str(e) == "The ONNX model still has graph initializers in the input graph. Use `remove_initializer_from_input` to remove them." + assert ( + str(e) + == "The ONNX model still has graph initializers in the input graph. Use `remove_initializer_from_input` to remove them." + ) + + # test repr function with local set to False + inference = Inference( + model_path=new_path, + input_name="data", + num_classes=1, + model_type="segmentation", + local=False, + ) + + fake_model_name = "test model" + inference.set_name(fake_model_name) + + assert ( + repr(inference) + == f"Class to handle a {fake_model_name} from the PathML model zoo." + ) def test_HaloAIInference(tileHE): From 575ff2b7e11f44cd2859fd73b3dd79c796f8a5bb Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Thu, 7 Sep 2023 11:10:40 -0700 Subject: [PATCH 35/50] fixing name in card --- pathml/inference/inference.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/pathml/inference/inference.py b/pathml/inference/inference.py index 958f97d6..b360dda2 100644 --- a/pathml/inference/inference.py +++ b/pathml/inference/inference.py @@ -187,7 +187,7 @@ def __repr__(self): if self.local: return f"Class to handle ONNX model locally stored at {self.model_path}" else: - return f"Class to handle a {self.model_card['model_name']} from the PathML model zoo." + return f"Class to handle a {self.model_card['name']} from the PathML model zoo." 
def inference(self, image): # reshape the image From e1ffa6261403af7705a64941fc89107d016b71c3 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Tue, 17 Oct 2023 10:22:46 -0700 Subject: [PATCH 36/50] adding comment to adj openslide --- environment.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/environment.yml b/environment.yml index e8a5469e..bb83d68a 100644 --- a/environment.yml +++ b/environment.yml @@ -32,3 +32,4 @@ dependencies: - tqdm==4.62.3 - loguru==0.5.3 - pandas==1.5.2 # orig no req + # to do: adjust openslide From 4f1fea50da5ed95acb2f41ded84bcef107b520d7 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Wed, 18 Oct 2023 10:34:20 -0700 Subject: [PATCH 37/50] changing readthedocs recs --- docs/readthedocs-requirements.txt | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/docs/readthedocs-requirements.txt b/docs/readthedocs-requirements.txt index b672810f..342675b2 100644 --- a/docs/readthedocs-requirements.txt +++ b/docs/readthedocs-requirements.txt @@ -1,8 +1,7 @@ -sphinx==4.3.2 +sphinx==6.2.1 nbsphinx==0.8.8 nbsphinx-link==1.3.0 sphinx-rtd-theme==1.0.0 -sphinx-autoapi==1.8.4 +sphinx-autoapi==3.0.0 ipython==8.10.0 sphinx-copybutton==0.4.0 - From 0f2b1935f676e15194bd1431d1c010c28197eb0c Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Wed, 18 Oct 2023 11:37:32 -0700 Subject: [PATCH 38/50] chaning mamba to miniforge --- .github/workflows/tests-conda.yml | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/.github/workflows/tests-conda.yml b/.github/workflows/tests-conda.yml index 53a8d93a..c93c4213 100644 --- a/.github/workflows/tests-conda.yml +++ b/.github/workflows/tests-conda.yml @@ -40,7 +40,10 @@ jobs: auto-activate-base: false activate-environment: pathml environment-file: environment.yml - mamba-version: "*" + # mamba-version: "*" + miniforge-version: latest + use-mamba: true + channels: conda-forge python-version: ${{ matrix.python-version }} - name: Debugging run: | From 7e165eaacc4715ff35d803dfcfa329ef1a8df5e0 
Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Wed, 18 Oct 2023 11:57:54 -0700 Subject: [PATCH 39/50] addjusting sphinx version --- docs/readthedocs-requirements.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/readthedocs-requirements.txt b/docs/readthedocs-requirements.txt index 342675b2..ba3a28a5 100644 --- a/docs/readthedocs-requirements.txt +++ b/docs/readthedocs-requirements.txt @@ -1,4 +1,4 @@ -sphinx==6.2.1 +sphinx==7.2.6 nbsphinx==0.8.8 nbsphinx-link==1.3.0 sphinx-rtd-theme==1.0.0 From 2730b7e92e2227bb2a16dd86f94ae06c850dbf46 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Wed, 18 Oct 2023 12:36:20 -0700 Subject: [PATCH 40/50] changing sphinx-rtd-theme version --- docs/readthedocs-requirements.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/readthedocs-requirements.txt b/docs/readthedocs-requirements.txt index ba3a28a5..1efef52e 100644 --- a/docs/readthedocs-requirements.txt +++ b/docs/readthedocs-requirements.txt @@ -1,7 +1,7 @@ sphinx==7.2.6 nbsphinx==0.8.8 nbsphinx-link==1.3.0 -sphinx-rtd-theme==1.0.0 +sphinx-rtd-theme==1.3.0 sphinx-autoapi==3.0.0 ipython==8.10.0 sphinx-copybutton==0.4.0 From 5e0f0f935293f7a6fa0af064d7148be272549968 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Wed, 18 Oct 2023 12:55:30 -0700 Subject: [PATCH 41/50] adjusting sphynx --- docs/readthedocs-requirements.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/readthedocs-requirements.txt b/docs/readthedocs-requirements.txt index 1efef52e..0e8f22d3 100644 --- a/docs/readthedocs-requirements.txt +++ b/docs/readthedocs-requirements.txt @@ -1,4 +1,4 @@ -sphinx==7.2.6 +sphinx==7.1.2 nbsphinx==0.8.8 nbsphinx-link==1.3.0 sphinx-rtd-theme==1.3.0 From 995409c86085fb829771738fd0c6b1a6c2f28767 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Wed, 1 Nov 2023 16:53:32 +0100 Subject: [PATCH 42/50] adding pytorch to onnx function --- pathml/inference/__init__.py | 1 + pathml/inference/inference.py | 41 +++++++++++++++++++ 
tests/inference_tests/test_inference.py | 51 ++++++++++++++++++++++++ tests/testdata/test.pt | Bin 0 -> 2310 bytes 4 files changed, 93 insertions(+) create mode 100644 tests/testdata/test.pt diff --git a/pathml/inference/__init__.py b/pathml/inference/__init__.py index dd2b9a39..3ee73dac 100644 --- a/pathml/inference/__init__.py +++ b/pathml/inference/__init__.py @@ -9,5 +9,6 @@ InferenceBase, RemoteTestHoverNet, check_onnx_clean, + convert_pytorch_onnx, remove_initializer_from_input, ) diff --git a/pathml/inference/inference.py b/pathml/inference/inference.py index b360dda2..a63fd6de 100644 --- a/pathml/inference/inference.py +++ b/pathml/inference/inference.py @@ -9,6 +9,7 @@ import onnx import onnxruntime import requests +import torch import pathml.preprocessing.transforms as Transforms @@ -62,6 +63,46 @@ def check_onnx_clean(model_path): return True +def convert_pytorch_onnx( + model, dummy_tensor, model_name, opset_version=10, input_name="data" +): + """Converts a Pytorch Model to ONNX + Adjusted from https://pytorch.org/tutorials/advanced/super_resolution_with_onnxruntime.html + + You need to define the model class and load the weights before exporting. See URL above for full steps. + + Args: + model_path (torch.nn.Module Model): Pytorch model to be converted, + dummy_tensor (torch.tensor): dummy input tensor that is an example of what will be passed into the model, + model_name (str): name of ONNX model created with .onnx at the end, + opset_version (int): which opset version you want to use to export + input_name (str): name assigned to dummy_tensor + + Returns: + Exports ONNX model converted from Pytorch + """ + + if not isinstance(model, torch.nn.Module): + raise ValueError( + f"The model is not of type torch.nn.Module. Received {type(model)}." + ) + + if not torch.is_tensor(dummy_tensor): + raise ValueError( + f"The dummy tensor needs to be a torch tensor. Received {type(dummy_tensor)}." 
+ ) + + torch.onnx.export( + model, + dummy_tensor, + model_name, + export_params=True, + opset_version=opset_version, + do_constant_folding=True, + input_names=[input_name], + ) + + # Base class class InferenceBase(Transforms.Transform): """ diff --git a/tests/inference_tests/test_inference.py b/tests/inference_tests/test_inference.py index 6fefa48c..535e3f4d 100644 --- a/tests/inference_tests/test_inference.py +++ b/tests/inference_tests/test_inference.py @@ -2,6 +2,7 @@ import numpy as np import onnx +import torch from pathml.core import SlideData from pathml.inference import ( @@ -10,6 +11,7 @@ InferenceBase, RemoteTestHoverNet, check_onnx_clean, + convert_pytorch_onnx, remove_initializer_from_input, ) @@ -219,3 +221,52 @@ def test_RemoteTestHoverNet(): ) inference.remove() + + +def test_convert_pytorch_onnx(): + class SimpleModel(torch.nn.Module): + def __init__(self): + super(SimpleModel, self).__init__() + self.linear = torch.nn.Linear(10, 1) + torch.nn.init.xavier_uniform_(self.linear.weight) + + def forward(self, x): + y = self.linear(x) + return y + + test_tensor = torch.randn(1, 10) + model_test = torch.load("tests/testdata/test.pt") + + model_test.eval() + + convert_pytorch_onnx( + model=model_test, dummy_tensor=test_tensor, model_name="test_export.onnx" + ) + + os.remove("test_export.onnx") + + # test Value Error Statements + + # test lines to check model input + try: + convert_pytorch_onnx( + model=None, dummy_tensor=test_tensor, model_name="test_export.onnx" + ) + + except Exception as e: + assert ( + str(e) + == f"The model is not of type torch.nn.Module. Received {type(None)}." + ) + + # test lines to check model dummy input + try: + convert_pytorch_onnx( + model=model_test, dummy_tensor=None, model_name="test_export.onnx" + ) + + except Exception as e: + assert ( + str(e) + == f"The dummy tensor needs to be a torch tensor. Received {type(None)}." 
+ ) diff --git a/tests/testdata/test.pt b/tests/testdata/test.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4047a54695774620baab6726947d43e70480d37 GIT binary patch literal 2310 zcmb7GOK%%h6duQUb@FJFHi0%JEwA8|#2!DA*d=kODW)(@>N*sLNYya*+~kfj@%YT# zX;h?2Ae1I_2Lg#zS7p-`8xRXb5PO8W;1{rC&qHFveb^a4;s}m(<;*?b`OdlbeD~fI z)Nr>X_4i9{HYANn1bHN88pMcJx9ogwL|SjP54*~`zHL|)U61Y=(k=qTw@y%xd}vNkb+nHq)e6U+8w-9=0+R0?%n$}rmjLZ#+8u6`#WLo^c6`e zMacVD9HBSx2~1DKwOx3#2ybDbd=(3oU&o`XSm<^I3t_Hep}QMc2&{mGdTwH&lOh&s zSi_>-Z)4HUTUd1P9e(iXY1}{t@m<>4cU4&%r0a5g5=?4p$S-+*DOynb`u{OM{(7A* zosB}rn`&6PByOtGU4k5Tf8=vh?N?Rn)y2PUix3;JT)RuZon;zhqjRnS=}K@b#*}<+ z=|3hqGW+^^-{XaY_rL!uyZ7x+KdcOWvv~RUsioUbl;y7;{F43o)Ti0Mv2?KfdFp^w z_@ymOe*jj_?0dr-;=?mO(#bt?H>_Biqm zYi^uQ$}Ibnhnu&$Xl6D#XP=PfMD{3ql42fmEyK1xFxbPPTV_5N|Nq6rlZpAHGM}E$ zq%+C%TvACZbBdzSuXrYz%48PO>68*rq*#@!e-8f`?0<+Ad-!rTDs_lCnyl#^EvU_* zjlyHEM_`X>H+blwuv=prCBfd+z{Y!Ov3#$T*1*PoHwS*#6c}#}Y-|-fyn&seCx=&C z6Gv-gYK`_Fuv8Qqcea literal 0 HcmV?d00001 From 8c6ab73d8c94ca92d5923c010e6028d5688d863b Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Wed, 1 Nov 2023 17:36:05 +0100 Subject: [PATCH 43/50] attempt to get pytorch class to load --- examples/InferenceOnnx_tutorial.ipynb | 102 ++++++++++++++++++++++++ tests/inference_tests/test_inference.py | 13 +-- tests/testdata/simple_model.py | 12 +++ 3 files changed, 117 insertions(+), 10 deletions(-) create mode 100644 tests/testdata/simple_model.py diff --git a/examples/InferenceOnnx_tutorial.ipynb b/examples/InferenceOnnx_tutorial.ipynb index c2787b7a..5d1bb2b9 100644 --- a/examples/InferenceOnnx_tutorial.ipynb +++ b/examples/InferenceOnnx_tutorial.ipynb @@ -128,6 +128,7 @@ "import onnx\n", "import onnxruntime as ort \n", "import requests\n", + "import torch\n", "\n", "from pathml.core import SlideData, Tile\n", "from dask.distributed import Client\n", @@ -174,6 +175,19 @@ " - Users specify:\n", " - `model_path` (str): path to ONNX model\n", "\n", + "
\n", + "\n", + " - `convert_pytorch_onnx` \n", + " - Converts a PyTorch `.pt` file to `.onnx`\n", + " - Wrapper function of the [PyTorch](https://pytorch.org/tutorials/advanced/super_resolution_with_onnxruntime.html) function to handle the conversion.\n", + " - Users specify:\n", + " - model_path (torch.nn.Module Model): Pytorch model to be converted,\n", + " - dummy_tensor (torch.tensor): dummy input tensor that is an example of what will be passed into the model,\n", + " - model_name (str): name of ONNX model created with .onnx at the end,\n", + " - opset_version (int): which opset version you want to use to export\n", + " - input_name (str): name assigned to dummy_tensor\n", + " - Note that the model class must be defined before loading the `.pt` file and set to eval before calling this function. \n", + "\n", "### Inference Classes\n", "\n", "
\n", @@ -293,6 +307,46 @@ " return True\n", "\n", "\n", + "def convert_pytorch_onnx(\n", + " model, dummy_tensor, model_name, opset_version=10, input_name=\"data\"\n", + "):\n", + " \"\"\"Converts a Pytorch Model to ONNX\n", + " Adjusted from https://pytorch.org/tutorials/advanced/super_resolution_with_onnxruntime.html\n", + "\n", + " You need to define the model class and load the weights before exporting. See URL above for full steps.\n", + "\n", + " Args:\n", + " model_path (torch.nn.Module Model): Pytorch model to be converted,\n", + " dummy_tensor (torch.tensor): dummy input tensor that is an example of what will be passed into the model,\n", + " model_name (str): name of ONNX model created with .onnx at the end,\n", + " opset_version (int): which opset version you want to use to export\n", + " input_name (str): name assigned to dummy_tensor\n", + "\n", + " Returns:\n", + " Exports ONNX model converted from Pytorch\n", + " \"\"\"\n", + "\n", + " if not isinstance(model, torch.nn.Module):\n", + " raise ValueError(\n", + " f\"The model is not of type torch.nn.Module. Received {type(model)}.\"\n", + " )\n", + "\n", + " if not torch.is_tensor(dummy_tensor):\n", + " raise ValueError(\n", + " f\"The dummy tensor needs to be a torch tensor. Received {type(dummy_tensor)}.\"\n", + " )\n", + "\n", + " torch.onnx.export(\n", + " model,\n", + " dummy_tensor,\n", + " model_name,\n", + " export_params=True,\n", + " opset_version=opset_version,\n", + " do_constant_folding=True,\n", + " input_names=[input_name],\n", + " )\n", + "\n", + "\n", "# Base class\n", "class InferenceBase(Transforms.Transform):\n", " \"\"\"\n", @@ -612,6 +666,54 @@ "```" ] }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "afe45989", + "metadata": {}, + "source": [ + "### Converting a Pytorch Model to ONNX\n", + "\n", + "Note the following:\n", + "- Similar to PyTorch, you will need to define and create an instance of you model class before loading the `.pt` file. 
Then you will need to set it to eval mode before calling the conversion function. The code to do these steps is below." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "aa8f41f7", + "metadata": {}, + "outputs": [], + "source": [ + "# Define your model class\n", + "class SimpleModel(torch.nn.Module):\n", + " def __init__(self):\n", + " super(SimpleModel, self).__init__()\n", + " self.linear = torch.nn.Linear(10, 1)\n", + " torch.nn.init.xavier_uniform_(self.linear.weight)\n", + " def forward(self, x):\n", + " y = self.linear(x)\n", + " return y\n", + "\n", + "# Define your model var\n", + "model = SimpleModel()\n", + "\n", + "# Export model as .pt if you haven't already done so\n", + "# If you have already exported a .pt file, you will still need to define a model class, initialize it, and set it to eval mode. \n", + "torch.save(model, \"test.pt\")\n", + "\n", + "# Load .pt file\n", + "model_test = torch.load(\"test.pt\")\n", + "# Set model to eval mode\n", + "model_test.eval()\n", + "\n", + "# Define a dummy tensor (this is an example of what the ONNX should expect during inference)\n", + "x = torch.randn(1, 10)\n", + "\n", + "# Run conversion function\n", + "convert_pytorch_onnx(model = model_test, dummy_tensor = x, model_name = \"NAME_OF_OUTPUT_MODEL_HERE.onnx\")" + ] + }, { "attachments": {}, "cell_type": "markdown", diff --git a/tests/inference_tests/test_inference.py b/tests/inference_tests/test_inference.py index 535e3f4d..bbb8e013 100644 --- a/tests/inference_tests/test_inference.py +++ b/tests/inference_tests/test_inference.py @@ -14,6 +14,7 @@ convert_pytorch_onnx, remove_initializer_from_input, ) +from pathml.tests.testdata.simple_model import SimpleModel def test_remove_initializer_from_input(): @@ -224,18 +225,10 @@ def test_RemoteTestHoverNet(): def test_convert_pytorch_onnx(): - class SimpleModel(torch.nn.Module): - def __init__(self): - super(SimpleModel, self).__init__() - self.linear = torch.nn.Linear(10, 1) - 
torch.nn.init.xavier_uniform_(self.linear.weight) - - def forward(self, x): - y = self.linear(x) - return y + model_test = SimpleModel() test_tensor = torch.randn(1, 10) - model_test = torch.load("tests/testdata/test.pt") + model_test.load_state_dict(torch.load("tests/testdata/test.pt")) model_test.eval() diff --git a/tests/testdata/simple_model.py b/tests/testdata/simple_model.py new file mode 100644 index 00000000..bd9a0219 --- /dev/null +++ b/tests/testdata/simple_model.py @@ -0,0 +1,12 @@ +import torch + + +class SimpleModel(torch.nn.Module): + def __init__(self): + super(SimpleModel, self).__init__() + self.linear = torch.nn.Linear(10, 1) + torch.nn.init.xavier_uniform_(self.linear.weight) + + def forward(self, x): + y = self.linear(x) + return y From 1ae9f8c78ce31d68247240c6e6eac01256bcfc6a Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Wed, 1 Nov 2023 18:12:23 +0100 Subject: [PATCH 44/50] deleting simple model module --- tests/testdata/simple_model.py | 12 ------------ 1 file changed, 12 deletions(-) delete mode 100644 tests/testdata/simple_model.py diff --git a/tests/testdata/simple_model.py b/tests/testdata/simple_model.py deleted file mode 100644 index bd9a0219..00000000 --- a/tests/testdata/simple_model.py +++ /dev/null @@ -1,12 +0,0 @@ -import torch - - -class SimpleModel(torch.nn.Module): - def __init__(self): - super(SimpleModel, self).__init__() - self.linear = torch.nn.Linear(10, 1) - torch.nn.init.xavier_uniform_(self.linear.weight) - - def forward(self, x): - y = self.linear(x) - return y From 8fa3bebb317c5d3d7d09b41815fb63e4ae990437 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Wed, 1 Nov 2023 18:15:59 +0100 Subject: [PATCH 45/50] adding new .pt file and new test --- tests/inference_tests/test_inference.py | 5 +---- tests/testdata/test.pt | Bin 2310 -> 3646 bytes 2 files changed, 1 insertion(+), 4 deletions(-) diff --git a/tests/inference_tests/test_inference.py b/tests/inference_tests/test_inference.py index bbb8e013..d8106d43 100644 --- 
a/tests/inference_tests/test_inference.py +++ b/tests/inference_tests/test_inference.py @@ -14,7 +14,6 @@ convert_pytorch_onnx, remove_initializer_from_input, ) -from pathml.tests.testdata.simple_model import SimpleModel def test_remove_initializer_from_input(): @@ -225,10 +224,8 @@ def test_RemoteTestHoverNet(): def test_convert_pytorch_onnx(): - model_test = SimpleModel() - test_tensor = torch.randn(1, 10) - model_test.load_state_dict(torch.load("tests/testdata/test.pt")) + model_test = torch.jit.load("tests/testdata/test.pt") model_test.eval() diff --git a/tests/testdata/test.pt b/tests/testdata/test.pt index a4047a54695774620baab6726947d43e70480d37..f52fcb123abbfc92f9982bb5f86ec4395d12ac21 100644 GIT binary patch literal 3646 zcmbtX3se(V8lDg|5FP@`%SaW)5`pGH!XqLmS%|hH$U`&=b__`%kz~Ro6D*HivAhvj zq}F9ug@p>NRTL0vX?d(*RXC{C)y0a4^#!i09;6gpD(nm)5)fECdvorYN#=gvcjtfI zKS3Z-9{>ytfOm!wU=5&R6-pNgPywC6<1PkvzB_i;GMY=+cI)>y7c`CiVOjH4k1v{h z9}PF9gb|yMxp_1%{Y~MsmS*b{1d7hT9bG1mOPNVmyOTqe#p`hH zyxdp{_96g2XXiEnd?&eSu`x0p*LyB@t;+1zWIZ7Sp$er?0zouLdn*^f(K0c_B!^1n zu`+RhLL`=v5n#>!-&6UxsZpgs3QOT=gpkR%!oEXN6%?hG$)HGqFlMhnDS{*lMGT@B z$X|#(l}TZ-K#34_l*SclFievxL~5B>MboSyZysMtM)b#}aPVHSG+Kfp3xpa7q(-GO z6&X^BBh^xw2tviMN}+_}T*=5nDwR*d5Grh?AXhqwF*=C`WiBCPO7sHNk%$F07t?UpBdg>E z`>;*n6LDP``+JV(@$h3;ppxtoiFqSa9*4Y3Gq!=Jb`F9b?zpz^WvdmIvbH zm-j@OebE=|%dR_O*0J@h-@whno;x+s4y3@^f6G@^Cwe@LIV$sH{d_Kd1U_;F7&0|o zQYtZm)<3%)7G-iarAF-?Zdg_;Nq%Bj_eA}sDJ^aQvm43a-bIh@OPEjm=d`0MU^{O+ z(nMI4MML9xW;wG(z1z2dsT*uA^}a(4GI+UsRbX2m z%j-tMGk1m8m;BG}@9*gyiP@N#nxE16_u{nvk#$MgJuSOOU)f}w?dnZ*2)ya)d-9qM z7=N)Q**b&PwgEbYP4IqXJ*`J7_!T`ZE1F^q`CXF z->treL#Ok@D!W;G*Lq*6Y3q+yGCB3&QHu-Nsr!%$P|uMa+P=vh!vTt~gZ-?S^U zto+-@NuCj;4aqjk2G4kpU2gXx7|Cpar`h&7#xOC3NIcyC@>J3>%JGXMMBK(UnLbv} zFdLiAX=56|nbF4MDNKi9`b5^#HCaC%v2HWlclOGqd7=*b9&TkA-yN__b)>|m#ku9@ z9lI0w)8`xVR>B-qm_x2i^W|;h1r1#Tm;T4>yIg>-|neDe`jGd$n5^jlAkeqQ2fo7+~$Jvfno3 zUUH5|FaF(8tI99^{ExqQ_4)CJBtQ8dpVohW6#_@=OH(R3z3o!F&-ifbwuP@wUDn*{ 
zX3bc6=Hsf|?x?y4Jui8Uzo;`5xDOgE0~20iKKSdLKJc8SUd-+T-Dsb8{qPO|16vtp z>X0T50i=hXs5`)4p(gBEz0)Z)pX*TL8|)J(+;j9cvQ?dO`?XDkrQ@MIUIJ^tXW%(+ zJCOVXSXGqP-{q8)1GVlRY{+T->9?o8dh2W0`GM?eK>oNk*}p6iWaAZQrz|yYsg@IaiwvpKT9^7wvV@ed!D^1V%RrKILP}nKe2{=!R^`d zignq!4eUN^+(R*u!u#f!ceYJw3A_?*3aG1aO^#-m~dex&~Y`Z6hs z%Eb5{(!3wq;tc~nXWs(_U}`Kt8*d9$Vx?3dlO_o8a~_h4c-)WP&mc^u2Z!y+WU<}Z zOivGNaM&D%JA=vMxH6d>Hp`Rk;l^ZeT=5-}xVA2n{UZT4*4xfix3@IHA50lKeQXdo z6{y=dP6d93QA`4v(}B8ehshMRo4PzC`z=#b0Q0T*F>!Tyq{>%5+xUv&D6i z61%g;B7459lT~awzi!>6P2o>mFf;$`wQ@SQZpM2~;U2@{ai+b`&OQANCWAyb$t|X+ zlwb|xgo;ir(d=>(ubZaEQ}9a+C-4)6VLDPbxlE@Z3$)0$Nj)8_8}^hbSS#{`>deU) z1TI|YG6DF2_|aRaHq5nG2fUNV#N*sLNYya*+~kfj@%YT# zX;h?2Ae1I_2Lg#zS7p-`8xRXb5PO8W;1{rC&qHFveb^a4;s}m(<;*?b`OdlbeD~fI z)Nr>X_4i9{HYANn1bHN88pMcJx9ogwL|SjP54*~`zHL|)U61Y=(k=qTw@y%xd}vNkb+nHq)e6U+8w-9=0+R0?%n$}rmjLZ#+8u6`#WLo^c6`e zMacVD9HBSx2~1DKwOx3#2ybDbd=(3oU&o`XSm<^I3t_Hep}QMc2&{mGdTwH&lOh&s zSi_>-Z)4HUTUd1P9e(iXY1}{t@m<>4cU4&%r0a5g5=?4p$S-+*DOynb`u{OM{(7A* zosB}rn`&6PByOtGU4k5Tf8=vh?N?Rn)y2PUix3;JT)RuZon;zhqjRnS=}K@b#*}<+ z=|3hqGW+^^-{XaY_rL!uyZ7x+KdcOWvv~RUsioUbl;y7;{F43o)Ti0Mv2?KfdFp^w z_@ymOe*jj_?0dr-;=?mO(#bt?H>_Biqm zYi^uQ$}Ibnhnu&$Xl6D#XP=PfMD{3ql42fmEyK1xFxbPPTV_5N|Nq6rlZpAHGM}E$ zq%+C%TvACZbBdzSuXrYz%48PO>68*rq*#@!e-8f`?0<+Ad-!rTDs_lCnyl#^EvU_* zjlyHEM_`X>H+blwuv=prCBfd+z{Y!Ov3#$T*1*PoHwS*#6c}#}Y-|-fyn&seCx=&C z6Gv-gYK`_Fuv8Qqcea From 2e84cf7f0a6629568e46a79acfc710d748ed35e2 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Wed, 1 Nov 2023 18:36:25 +0100 Subject: [PATCH 46/50] adding new tutorial --- examples/InferenceOnnx_tutorial.ipynb | 9 ++++++--- 1 file changed, 6 insertions(+), 3 deletions(-) diff --git a/examples/InferenceOnnx_tutorial.ipynb b/examples/InferenceOnnx_tutorial.ipynb index 5d1bb2b9..fe4de75a 100644 --- a/examples/InferenceOnnx_tutorial.ipynb +++ b/examples/InferenceOnnx_tutorial.ipynb @@ -672,7 +672,7 @@ "id": "afe45989", "metadata": {}, "source": [ - "### Converting a Pytorch Model to ONNX\n", + "### Converting a Pytorch Model 
to ONNX Using the `convert_pytorch_onnx` Function\n", "\n", "Note the following:\n", "- Similar to PyTorch, you will need to define and create an instance of you model class before loading the `.pt` file. Then you will need to set it to eval mode before calling the conversion function. The code to do these steps is below." @@ -686,10 +686,12 @@ "outputs": [], "source": [ "# Define your model class\n", + "num_input, num_output, batch_size = 10, 1, 1\n", + "\n", "class SimpleModel(torch.nn.Module):\n", " def __init__(self):\n", " super(SimpleModel, self).__init__()\n", - " self.linear = torch.nn.Linear(10, 1)\n", + " self.linear = torch.nn.Linear(num_input, num_output)\n", " torch.nn.init.xavier_uniform_(self.linear.weight)\n", " def forward(self, x):\n", " y = self.linear(x)\n", @@ -700,6 +702,7 @@ "\n", "# Export model as .pt if you haven't already done so\n", "# If you have already exported a .pt file, you will still need to define a model class, initialize it, and set it to eval mode. 
\n", + "# If you saved your model using `torch.jit.script`, you will not need to define your model class and instead load it using `torch.jit.load` then set it to eval mode.\n", "torch.save(model, \"test.pt\")\n", "\n", "# Load .pt file\n", @@ -708,7 +711,7 @@ "model_test.eval()\n", "\n", "# Define a dummy tensor (this is an example of what the ONNX should expect during inference)\n", - "x = torch.randn(1, 10)\n", + "x = torch.randn(batch_size, num_input)\n", "\n", "# Run conversion function\n", "convert_pytorch_onnx(model = model_test, dummy_tensor = x, model_name = \"NAME_OF_OUTPUT_MODEL_HERE.onnx\")" From 91d8f41b49d1b2b21a274db7c3fbabe187430f21 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Mon, 6 Nov 2023 15:51:16 +0100 Subject: [PATCH 47/50] new example book --- examples/InferenceOnnx_tutorial.ipynb | 574 +++++++++----------------- 1 file changed, 188 insertions(+), 386 deletions(-) diff --git a/examples/InferenceOnnx_tutorial.ipynb b/examples/InferenceOnnx_tutorial.ipynb index fe4de75a..9e1d8f19 100644 --- a/examples/InferenceOnnx_tutorial.ipynb +++ b/examples/InferenceOnnx_tutorial.ipynb @@ -117,7 +117,7 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": 8, "id": "436b91f3-6338-4043-8742-496b354544aa", "metadata": {}, "outputs": [], @@ -126,7 +126,7 @@ "os.environ[\"JAVA_HOME\"] = \"/opt/conda/envs/YOUR ENVIRONMENET NAME\" # TO DO: CHANGE THIS TO YOUR ENVIRONMENT NAME\n", "import numpy as np \n", "import onnx\n", - "import onnxruntime as ort \n", + "import onnxruntime\n", "import requests\n", "import torch\n", "\n", @@ -135,14 +135,11 @@ "from pathml.preprocessing import Pipeline\n", "import pathml.preprocessing.transforms as Transforms\n", "\n", - "from pathml.inference import (\n", - " HaloAIInference,\n", - " Inference,\n", - " InferenceBase,\n", - " RemoteTestHoverNet,\n", - " check_onnx_clean,\n", - " remove_initializer_from_input,\n", - ")" + "import matplotlib.pyplot as plt\n", + "import matplotlib \n", + "\n", + "from PIL 
import Image\n", + "\n" ] }, { @@ -243,380 +240,7 @@ " 'model_input_notes': 'Accepts tiles of 256 x 256',\n", " 'model_output_notes': None,\n", " 'citation': 'Pocock J, Graham S, Vu QD, Jahanifar M, Deshpande S, Hadjigeorghiou G, Shephard A, Bashir RM, Bilal M, Lu W, Epstein D. TIAToolbox as an end-to-end library for advanced tissue image analytics. Communications medicine. 2022 Sep 24;2(1):120.'}\n", - " ```\n", - " \n", - "### Raw Code\n", - "\n", - "Below is the raw code for your convenience. You can also find the raw code on our github. \n", - "[![View on GitHub](https://img.shields.io/badge/View-on%20GitHub-lightgrey?logo=github)](https://github.com/Dana-Farber-AIOS/pathml/tree/master/pathml)" - ] - }, - { - "cell_type": "code", - "execution_count": 2, - "id": "3339cf66-8de6-4af1-9d3e-7312cd69eb33", - "metadata": {}, - "outputs": [], - "source": [ - "def remove_initializer_from_input(model_path, new_path):\n", - " \"\"\"Removes initializers from HaloAI ONNX models\n", - " Taken from https://github.com/microsoft/onnxruntime/blob/main/tools/python/remove_initializer_from_input.py\n", - "\n", - " Args:\n", - " model_path (str): path to ONNX model,\n", - " new_path (str): path to save adjusted model w/o initializers,\n", - "\n", - " Returns:\n", - " ONNX model w/o initializers to run inference using PathML\n", - " \"\"\"\n", - "\n", - " model = onnx.load(model_path)\n", - "\n", - " inputs = model.graph.input\n", - " name_to_input = {}\n", - " for onnx_input in inputs:\n", - " name_to_input[onnx_input.name] = onnx_input\n", - "\n", - " for initializer in model.graph.initializer:\n", - " if initializer.name in name_to_input:\n", - " inputs.remove(name_to_input[initializer.name])\n", - "\n", - " onnx.save(model, new_path)\n", - "\n", - "\n", - "def check_onnx_clean(model_path):\n", - " \"\"\"Checks if the model has had it's initalizers removed from input graph.\n", - " Adapted from from 
https://github.com/microsoft/onnxruntime/blob/main/tools/python/remove_initializer_from_input.py\n", - "\n", - " Args:\n", - " model_path (str): path to ONNX model,\n", - "\n", - " Returns:\n", - " Boolean if there are initializers in input graph.\n", - " \"\"\"\n", - "\n", - " model = onnx.load(model_path)\n", - "\n", - " inputs = model.graph.input\n", - " name_to_input = {}\n", - " for onnx_input in inputs:\n", - " name_to_input[onnx_input.name] = onnx_input\n", - "\n", - " for initializer in model.graph.initializer:\n", - " if initializer.name in name_to_input:\n", - " return True\n", - "\n", - "\n", - "def convert_pytorch_onnx(\n", - " model, dummy_tensor, model_name, opset_version=10, input_name=\"data\"\n", - "):\n", - " \"\"\"Converts a Pytorch Model to ONNX\n", - " Adjusted from https://pytorch.org/tutorials/advanced/super_resolution_with_onnxruntime.html\n", - "\n", - " You need to define the model class and load the weights before exporting. See URL above for full steps.\n", - "\n", - " Args:\n", - " model_path (torch.nn.Module Model): Pytorch model to be converted,\n", - " dummy_tensor (torch.tensor): dummy input tensor that is an example of what will be passed into the model,\n", - " model_name (str): name of ONNX model created with .onnx at the end,\n", - " opset_version (int): which opset version you want to use to export\n", - " input_name (str): name assigned to dummy_tensor\n", - "\n", - " Returns:\n", - " Exports ONNX model converted from Pytorch\n", - " \"\"\"\n", - "\n", - " if not isinstance(model, torch.nn.Module):\n", - " raise ValueError(\n", - " f\"The model is not of type torch.nn.Module. Received {type(model)}.\"\n", - " )\n", - "\n", - " if not torch.is_tensor(dummy_tensor):\n", - " raise ValueError(\n", - " f\"The dummy tensor needs to be a torch tensor. 
Received {type(dummy_tensor)}.\"\n", - " )\n", - "\n", - " torch.onnx.export(\n", - " model,\n", - " dummy_tensor,\n", - " model_name,\n", - " export_params=True,\n", - " opset_version=opset_version,\n", - " do_constant_folding=True,\n", - " input_names=[input_name],\n", - " )\n", - "\n", - "\n", - "# Base class\n", - "class InferenceBase(Transforms.Transform):\n", - " \"\"\"\n", - " Base class for all ONNX Models.\n", - " Each transform must operate on a Tile.\n", - " \"\"\"\n", - "\n", - " def __init__(self):\n", - " self.model_card = {\n", - " \"name\": None,\n", - " \"num_classes\": None,\n", - " \"model_type\": None,\n", - " \"notes\": None,\n", - " \"model_input_notes\": None,\n", - " \"model_output_notes\": None,\n", - " \"citation\": None,\n", - " }\n", - "\n", - " def __repr__(self):\n", - " return \"Base class for all ONNX models\"\n", - "\n", - " def get_model_card(self):\n", - " return self.model_card\n", - "\n", - " def set_name(self, name):\n", - " self.model_card[\"name\"] = name\n", - "\n", - " def set_num_classes(self, num):\n", - " self.model_card[\"num_classes\"] = num\n", - "\n", - " def set_model_type(self, model_type):\n", - " self.model_card[\"model_type\"] = model_type\n", - "\n", - " def set_notes(self, note):\n", - " self.model_card[\"notes\"] = note\n", - "\n", - " def set_model_input_notes(self, note):\n", - " self.model_card[\"model_input_notes\"] = note\n", - "\n", - " def set_model_output_notes(self, note):\n", - " self.model_card[\"model_output_notes\"] = note\n", - "\n", - " def set_citation(self, citation):\n", - " self.model_card[\"citation\"] = citation\n", - "\n", - " def reshape(self, image):\n", - " \"\"\"standard reshaping of tile image\"\"\"\n", - " # flip dimensions\n", - " # follows convention used here https://github.com/Dana-Farber-AIOS/pathml/blob/master/pathml/ml/dataset.py\n", - "\n", - " if image.ndim == 3:\n", - " # swap axes from HWC to CHW\n", - " image = image.transpose(2, 0, 1)\n", - " # add a dimesion bc onnx 
models usually have batch size as first dim: e.g. (1, channel, height, width)\n", - " image = np.expand_dims(image, axis=0)\n", - "\n", - " return image\n", - " else:\n", - " # in this case, we assume that we have XYZCT channel order\n", - " # so we swap axes to TCZYX for batching\n", - " # note we are not adding a dim here for batch bc we assume that subsetting will create a batch \"placeholder\" dim\n", - " image = image.T\n", - "\n", - " return image\n", - "\n", - " def F(self, target):\n", - " \"\"\"functional implementation\"\"\"\n", - " raise NotImplementedError\n", - "\n", - " def apply(self, tile):\n", - " \"\"\"modify Tile object in-place\"\"\"\n", - " raise NotImplementedError\n", - "\n", - "\n", - "# class to handle local onnx models\n", - "class Inference(InferenceBase):\n", - " \"\"\"Transformation to run inferrence on ONNX model.\n", - "\n", - " Assumptions:\n", - " - The ONNX model has been cleaned by `remove_initializer_from_input` first\n", - "\n", - " Args:\n", - " model_path (str): path to ONNX model w/o initializers,\n", - " input_name (str): name of the input the ONNX model accepts\n", - " \"\"\"\n", - "\n", - " def __init__(\n", - " self,\n", - " model_path=None,\n", - " input_name=\"data\",\n", - " num_classes=None,\n", - " model_type=None,\n", - " local=True,\n", - " ):\n", - " super().__init__()\n", - "\n", - " self.input_name = input_name\n", - " self.num_classes = num_classes\n", - " self.model_type = model_type\n", - " self.local = local\n", - "\n", - " if self.local:\n", - " # using a local onnx model\n", - " self.model_path = model_path\n", - " else:\n", - " # if using a model from the model zoo, set the local path to a temp file\n", - " self.model_path = \"temp.onnx\"\n", - "\n", - " # fill in parts of the model_card with the following info\n", - " self.model_card[\"num_classes\"] = self.num_classes\n", - " self.model_card[\"model_type\"] = self.model_type\n", - "\n", - " # check if there are initializers in input graph if using a 
local model\n", - " if local:\n", - " if check_onnx_clean(model_path):\n", - " raise ValueError(\n", - " \"The ONNX model still has graph initializers in the input graph. Use `remove_initializer_from_input` to remove them.\"\n", - " )\n", - " else:\n", - " pass\n", - "\n", - " def __repr__(self):\n", - " if self.local:\n", - " return f\"Class to handle ONNX model locally stored at {self.model_path}\"\n", - " else:\n", - " return f\"Class to handle a {self.model_card['model_name']} from the PathML model zoo.\"\n", - "\n", - " def inference(self, image):\n", - " # reshape the image\n", - " image = self.reshape(image)\n", - "\n", - " # load fixed model\n", - " onnx_model = onnx.load(self.model_path)\n", - "\n", - " # check tile dimensions match ONNX input dimensions\n", - " input_node = onnx_model.graph.input\n", - "\n", - " dimensions = []\n", - " for input in input_node:\n", - " if input.name == self.input_name:\n", - " input_shape = input.type.tensor_type.shape.dim\n", - " for dim in input_shape:\n", - " dimensions.append(dim.dim_value)\n", - "\n", - " assert (\n", - " image.shape[-1] == dimensions[-1] and image.shape[-2] == dimensions[-2]\n", - " ), f\"expecting tile shape of {dimensions[-2]} by {dimensions[-1]}, got {image.shape[-2]} by {image.shape[-1]}\"\n", - "\n", - " # check onnx model\n", - " onnx.checker.check_model(onnx_model)\n", - "\n", - " # start an inference session\n", - " ort_sess = onnxruntime.InferenceSession(self.model_path)\n", - "\n", - " # create model output, returns a list\n", - " model_output = ort_sess.run(None, {self.input_name: image.astype(\"f\")})\n", - "\n", - " return model_output\n", - "\n", - " def F(self, image):\n", - " # run inference function\n", - " prediction_map = self.inference(image)\n", - "\n", - " # single task model\n", - " if len(prediction_map) == 1:\n", - " # return first and only prediction array in the list\n", - " return prediction_map[0]\n", - "\n", - " # multi task model\n", - " else:\n", - " # concatenate 
prediction results\n", - " # assumes that the tasks all output prediction arrays of same dimension on H and W\n", - " result_array = np.concatenate(prediction_map, axis=1)\n", - " return result_array\n", - "\n", - " def apply(self, tile):\n", - " tile.image = self.F(tile.image)\n", - "\n", - "\n", - "class HaloAIInference(Inference):\n", - " \"\"\"Transformation to run inferrence on HALO AI ONNX model.\n", - "\n", - " Assumptions:\n", - " - Assumes that the ONNX model returns a tensor in which there is one prediction map for each class\n", - " - For example, if there are 5 classes, the ONNX model will output a (1, 5, Height, Weight) tensor\n", - " - If you select to argmax the classes, the class assumes a softmax or sigmoid has already been applied\n", - " - HaloAI ONNX models always have 20 class maps so you need to index into the first x maps if you have x classes\n", - "\n", - "\n", - " Args:\n", - " model_path (str): path to ONNX model w/o initializers,\n", - " num_classes (int): number of classes in the data,\n", - " input_name (str): name of the input the ONNX model accepts\n", - " \"\"\"\n", - "\n", - " def __init__(\n", - " self,\n", - " model_path=None,\n", - " input_name=\"data\",\n", - " num_classes=None,\n", - " model_type=None,\n", - " local=True,\n", - " ):\n", - " super().__init__(model_path, input_name, num_classes, model_type, local)\n", - "\n", - " self.model_card[\"num_classes\"] = self.num_classes\n", - " self.model_card[\"model_type\"] = self.model_type\n", - "\n", - " def __repr__(self):\n", - " return f\"Class to handle HALO AI ONNX model locally stored at {self.model_path}\"\n", - "\n", - " def F(self, image):\n", - " prediction_map = self.inference(image)\n", - "\n", - " prediction_map = prediction_map[0][:, 0 : self.num_classes, :, :]\n", - "\n", - " return prediction_map\n", - "\n", - " def apply(self, tile):\n", - " tile.image = self.F(tile.image)\n", - "\n", - "\n", - "# class to handle remote onnx models\n", - "class 
RemoteTestHoverNet(Inference):\n", - " \"\"\"Transformation to run inferrence on ONNX model.\n", - "\n", - " Citation for model:\n", - " Pocock J, Graham S, Vu QD, Jahanifar M, Deshpande S, Hadjigeorghiou G, Shephard A, Bashir RM, Bilal M, Lu W, Epstein D.\n", - " TIAToolbox as an end-to-end library for advanced tissue image analytics. Communications medicine. 2022 Sep 24;2(1):120.\n", - "\n", - " Args:\n", - " model_path (str): temp file name to download onnx from huggingface,\n", - " input_name (str): name of the input the ONNX model accepts\n", - " \"\"\"\n", - "\n", - " def __init__(\n", - " self,\n", - " model_path=\"temp.onnx\",\n", - " input_name=\"data\",\n", - " num_classes=5,\n", - " model_type=\"Segmentation\",\n", - " local=False,\n", - " ):\n", - " super().__init__(model_path, input_name, num_classes, model_type, local)\n", - "\n", - " # specify URL of the model in PathML public repository\n", - " url = \"https://huggingface.co/pathml/test/resolve/main/hovernet_fast_tiatoolbox_fixed.onnx\"\n", - "\n", - " # download model, save as temp.onnx\n", - " with open(self.model_path, \"wb\") as out_file:\n", - " content = requests.get(url, stream=True).content\n", - " out_file.write(content)\n", - "\n", - " self.model_card[\"num_classes\"] = self.num_classes\n", - " self.model_card[\"model_type\"] = self.model_type\n", - " self.model_card[\"name\"] = \"Tiabox HoverNet Test\"\n", - " self.model_card[\"model_input_notes\"] = \"Accepts tiles of 256 x 256\"\n", - " self.model_card[\n", - " \"citation\"\n", - " ] = \"Pocock J, Graham S, Vu QD, Jahanifar M, Deshpande S, Hadjigeorghiou G, Shephard A, Bashir RM, Bilal M, Lu W, Epstein D. TIAToolbox as an end-to-end library for advanced tissue image analytics. Communications medicine. 2022 Sep 24;2(1):120.\"\n", - "\n", - " def __repr__(self):\n", - " return \"Class to handle remote TIAToolBox HoverNet test ONNX. 
See model card for citation.\"\n", - "\n", - " def apply(self, tile):\n", - " tile.image = self.F(tile.image)\n", - "\n", - " def remove(self):\n", - " # remove the temp.onnx model\n", - " os.remove(self.model_path)\n" + " ```" ] }, { @@ -811,6 +435,7 @@ "source": [ "### Remote ONNX Using our `RemoteTestHoverNet` Class\n", "- Uses a Hovernet from [TIAToolbox](https://github.com/TissueImageAnalytics/tiatoolbox) \n", + "- This version of Hovernet was trained on the [MoNuSAC](https://monusac-2020.grand-challenge.org/) dataset.\n", "- Note that the purpose of this model is to illustrate how PathML will handle future remote models. We plan on release more public models to our model zoo on HuggingFace in the future.\n", "- Citation for model:\n", " - Pocock J, Graham S, Vu QD, Jahanifar M, Deshpande S, Hadjigeorghiou G, Shephard A, Bashir RM, Bilal M, Lu W, Epstein D. TIAToolbox as an end-to-end library for advanced tissue image analytics. Communications medicine. 2022 Sep 24;2(1):120.\n", @@ -864,7 +489,180 @@ "```python\n", "for tile in wsi.tiles: \n", " print(tile.image.shape) \n", - "```" + "```\n", + "\n", + "To see how to use these tiles to make visualizations, see below." + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "251a9099-8e6f-4e4c-b685-7087191fe9fe", + "metadata": {}, + "source": [ + "## Full Example With Visualization of Output\n", + "\n", + "The `RemoteTestHoverNet()` uses a pretrained HoverNet from TIAToolBox trained on the [MoNuSAC](https://monusac-2020.grand-challenge.org/) dataset. **The model was trained to accept tiles of 256x256 to create a prediction matrix of size 164x164 with 9 channels.** The first 5 channels correspond to the Nuclei Types (TP), the next two channels correspond to the Nuclei Pixels (NP), and the last two channels correspond to the Hover (HV).
The documention for these channels can be found here on TIAToolBox's [website](https://tia-toolbox.readthedocs.io/en/v1.0.1/_modules/tiatoolbox/models/architecture/hovernet.html#HoVerNet.infer_batch). \n", + "\n", + "In this example we use an taken from the [MoNuSAC](https://monusac-2020.grand-challenge.org/) dataset. See citation in the `References` section.\n", + "\n", + "See citation in the `References` section.\n", + "\n", + "### Load Packages" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "925d4ebd-3803-409a-82be-780115ffb152", + "metadata": {}, + "source": [ + "### Run Code as Demonstrated Above\n", + "\n", + "Note that to run the following code, you will need to download and save the image titled `TCGA-5P-A9K0-01Z-00-DX1_1.svs` in the same directory as the notebook." + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "23951050-b47f-4b38-b0b6-786081fc69f0", + "metadata": {}, + "outputs": [], + "source": [ + "# Define slide path\n", + "slide_path = 'TCGA-5P-A9K0-01Z-00-DX1_1.svs'\n", + "\n", + "inference = RemoteTestHoverNet()\n", + "\n", + "# Create a transformation list\n", + "transformation_list = [\n", + " inference\n", + "] \n", + "\n", + "# Initialize pathml.core.slide_data.SlideData object\n", + "wsi = SlideData(slide_path)\n", + "\n", + "# Set up PathML pipeline\n", + "pipeline = Pipeline(transformation_list)\n", + "\n", + "# Run Inference\n", + "wsi.run(pipeline, tile_size = 256, tile_stride = 164, tile_pad=True)\n", + "\n", + "# DELETE ONNX MODEL DOWNLOADED FROM HUGGINGFACE\n", + "inference.remove() " + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "2921a180-20bc-4ce1-960d-7005892f4585", + "metadata": {}, + "source": [ + "Let's look at the first tile which comes from the top left corner (0,0) and Nucleus Pixel predictions." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "a607bb7d-de3e-4444-8829-75d7da9505fb", + "metadata": {}, + "outputs": [], + "source": [ + "for tile in wsi.tiles:\n", + " # Create empty numpy array\n", + " a = np.empty((2, 164, 164), dtype=object)\n", + " # Get Nucleus Predictions\n", + " classes = tile.image[0, 5:7, :, :] \n", + " a = classes\n", + " # Take the argmax to make the predictions binary\n", + " image = np.argmax(a, axis = 0) \n", + " # Multiply values by 255 to make the array image friendly\n", + " image = image * (255/1) \n", + " # Make a grey scale image\n", + " img = Image.fromarray(image.astype('uint8'), \"L\")\n", + " # Save Image\n", + " img.save('test_array_1.png')\n", + " # Can break after one iteration since we are only using the tile at (0, 0).\n", + " break " + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "aa6fbb49-7173-4a65-9b1f-e7b90a5228c5", + "metadata": {}, + "source": [ + "Let's visualize the tile vs the tile predictions. Since the model uses a 256x256 tile to create a prediction map of size 164x164, we need to take our tile located at (0,0) and crop it down to the center 164x164 pixels. 
" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "e29e98f3-c04c-4d77-8681-c837181bf415", + "metadata": {}, + "outputs": [], + "source": [ + "prediction_dim = 164\n", + "tile_dim = 256\n", + "crop_amount = int((256 - 164) / 2) \n", + "wsi = SlideData(slide_path)\n", + "\n", + "generator = wsi.generate_tiles(shape = (tile_dim, tile_dim), level = 0)\n", + "\n", + "for tile in generator:\n", + " # Extract array from tile\n", + " image = tile.image\n", + " # Crop tile\n", + " image = image[crop_amount: crop_amount + prediction_dim, crop_amount: crop_amount + prediction_dim] \n", + " # Convert array to image\n", + " img = Image.fromarray(image)\n", + " # Save Image\n", + " img.save('raw_tile.png')\n", + " break" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "98ab9eb0-455d-4353-b760-3d65820e81de", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Set figure size\n", + "plt.rcParams['figure.figsize'] = 11 ,8\n", + "\n", + "# Read images\n", + "img_A = matplotlib.image.imread('raw_tile.png')\n", + "img_B = matplotlib.image.imread('test_array_1.png')\n", + "\n", + "# Set up plots\n", + "fig, ax = plt.subplots(1,2)\n", + "plt.xticks([])\n", + "plt.yticks([])\n", + "ax[0].imshow(img_A)\n", + "ax[1].imshow(img_B, cmap='gray')\n", + "ax[0].set_title(\"Original Image\")\n", + "ax[1].set_title(\"Model Predictions\")\n", + "plt.tight_layout()\n", + "\n", + "# Get rid of tick marks\n", + "for a in ax.ravel():\n", + " a.set_xticks([])\n", + " a.set_yticks([])\n", + "\n", + "# Show images\n", + "plt.show()" ] }, { @@ -877,7 +675,11 @@ "\n", "- Pocock J, Graham S, Vu QD, Jahanifar M, Deshpande S, Hadjigeorghiou G, Shephard A, Bashir RM, Bilal M, Lu W, Epstein D. TIAToolbox as an end-to-end library for advanced tissue image analytics. Communications medicine. 2022 Sep 24;2(1):120.\n", "\n", - "- https://github.com/microsoft/onnxruntime/blob/main/tools/python/remove_initializer_from_input.py" + "- R. Verma, et al.
\"MoNuSAC2020: A Multi-organ Nuclei Segmentation and Classification Challenge.\" IEEE Transactions on Medical Imaging (2021).\n", + "\n", + "- https://github.com/microsoft/onnxruntime/blob/main/tools/python/remove_initializer_from_input.py\n", + "\n", + "- https://pytorch.org/tutorials/advanced/super_resolution_with_onnxruntime.html" ] } ], From c69e4a28949cfd376b4e0509e66ad54fc740e475 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Wed, 8 Nov 2023 21:43:17 +0100 Subject: [PATCH 48/50] further edits --- examples/InferenceOnnx_tutorial.ipynb | 2 -- 1 file changed, 2 deletions(-) diff --git a/examples/InferenceOnnx_tutorial.ipynb b/examples/InferenceOnnx_tutorial.ipynb index 9e1d8f19..2245643f 100644 --- a/examples/InferenceOnnx_tutorial.ipynb +++ b/examples/InferenceOnnx_tutorial.ipynb @@ -506,8 +506,6 @@ "\n", "In this example we use an taken from the [MoNuSAC](https://monusac-2020.grand-challenge.org/) dataset. See citation in the `References` section.\n", "\n", - "See citation in the `References` section.\n", - "\n", "### Load Packages" ] }, From a3011b318e157eebe86a6d8eff38266cd6e1f9a9 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Wed, 22 Nov 2023 08:44:14 -0800 Subject: [PATCH 49/50] changing torch version --- environment.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/environment.yml b/environment.yml index bb83d68a..1b8973df 100644 --- a/environment.yml +++ b/environment.yml @@ -11,7 +11,7 @@ dependencies: - scikit-image==0.18.3 - matplotlib==3.5.1 - openjdk==8.0.152 - - pytorch==1.10.1 + - pytorch==1.13.1 # orig = 1.10.1 - h5py==3.1.0 - dask==2021.12.0 - pydicom==2.2.2 From 591caaf930717d8a59aedb70f138fb2164081ac5 Mon Sep 17 00:00:00 2001 From: jamesgwen Date: Thu, 30 Nov 2023 12:02:16 -0800 Subject: [PATCH 50/50] fixed typos in example notebook --- examples/InferenceOnnx_tutorial.ipynb | 9 ++------- 1 file changed, 2 insertions(+), 7 deletions(-) diff --git a/examples/InferenceOnnx_tutorial.ipynb b/examples/InferenceOnnx_tutorial.ipynb 
index 2245643f..23452c56 100644 --- a/examples/InferenceOnnx_tutorial.ipynb +++ b/examples/InferenceOnnx_tutorial.ipynb @@ -8,8 +8,6 @@ "source": [ "# PathML ONNX Tutorial\n", "\n", - "Written by James Wen. James_Wen@dfci.harvard.edu. \n", - "\n", "[![View on GitHub](https://img.shields.io/badge/View-on%20GitHub-lightgrey?logo=github)](https://github.com/Dana-Farber-AIOS/pathml/blob/master/examples/)\n", "\n", "## Introduction\n", @@ -138,8 +136,7 @@ "import matplotlib.pyplot as plt\n", "import matplotlib \n", "\n", - "from PIL import Image\n", - "\n" + "from PIL import Image" ] }, { @@ -504,9 +501,7 @@ "\n", "The `RemoteTestHoverNet()` uses a pretrained HoverNet from TIAToolBox trained on the [MoNuSAC](https://monusac-2020.grand-challenge.org/) dataset. **The model was trained to accept tiles of 256x256 to create a prediction matrix of size 164x164 with 9 channels.** The first 5 channels correspond to the Nuclei Types (TP), the next two channels correspond to the Nuclei Pixels (NP), and the last two channels correspond to the Hover (HV). The documention for these channels can be found here on TIAToolBox's [website](https://tia-toolbox.readthedocs.io/en/v1.0.1/_modules/tiatoolbox/models/architecture/hovernet.html#HoVerNet.infer_batch). \n", "\n", - "In this example we use an taken from the [MoNuSAC](https://monusac-2020.grand-challenge.org/) dataset. See citation in the `References` section.\n", - "\n", - "### Load Packages" + "In this example we use an image taken from the [MoNuSAC](https://monusac-2020.grand-challenge.org/) dataset. See citation in the `References` section." ] }, {