Merge pull request #44 from DARPA-CRITICALMAAS/polymer_no_label_fix

Fix to Allow duplicate label and no label map units
DARPA-CRITICALMAAS · Nov 6, 2024 · 4b21685 · 4b21685
2 parents 2d41cfc + bfb718a
commit 4b21685
Show file tree

Hide file tree

Showing 5 changed files with 55 additions and 104 deletions.
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -5,6 +5,7 @@ The format is based on [Keep a Changelog](http://keepachangelog.com/)
 and this project adheres to [Semantic Versioning](http://semver.org/).
 
 ## [Unreleased]
+- Fixed a bug where map units from polymer with no label or duplicate labels would get dropped from results.
 
 ## [0.4.6] - 2024-10-23
 

diff --git a/src/models/golden_muscat_model.py b/src/models/golden_muscat_model.py
@@ -51,17 +51,21 @@ def my_norm(self, data):
 
     # @override
     def inference(self, image, legend_images, data_id=-1):
-        """Image data is in CHW format. legend_images is a dictionary of label to map_unit label images in CHW format."""         
+        """
+        Args:
+            image (np.array): Image data in CHW format.
+            legend_images (list): List of map_unit swatch images in CHW format.
+            data_id (int): Data id for logging purposes.
+        
+        Returns:
+            np.array: Prediction mask in CHW format.
+        """           
         # For profiling memory usage 
         #torch.cuda.memory._record_memory_history()
 
         # Get the size of the map
         map_channels, map_height, map_width = image.shape
 
-        # Reshape maps with 1 channel images (greyscale) to 3 channels for inference
-        if map_channels == 1: # This is tmp fix!    
-            image = np.concatenate([image,image,image], axis=0)
-
         # Generate patches
         # Pad image so we get a size that can be evenly divided into patches.
         right_pad = self.patch_size - (map_width % self.patch_size)
@@ -81,15 +85,7 @@ def inference(self, image, legend_images, data_id=-1):
         map_prediction = np.zeros((1, map_height, map_width), dtype=np.float32)
         map_confidence = np.zeros((1, map_height, map_width), dtype=np.float32)
         legend_index = 1
-        for label, legend_img in legend_images.items():
-            # Debugging GPU memory usage
-            # device_num = 0
-            # alloc_mem = torch.cuda.max_memory_allocated(device_num)/(1024**3)
-            # resev_mem = torch.cuda.memory_reserved(device_num)/(1024**3)
-            # free_mem = torch.cuda.mem_get_info(device_num)[0]/(1024**3)
-            # pipeline_manager.log_to_monitor(data_id, {'GPU Mem (Alloc/Reserve/Avail)' : f'{alloc_mem:.2f}/{resev_mem:.2f}/{free_mem:.2f} GB'})
-
-            # pipeline_manager.log(logging.DEBUG, f'\t\tInferencing legend: {label}')
+        for legend_img in legend_images:
             lgd_stime = time()
             # Reshape maps with 1 channel legends (greyscale) to 3 channels for inference
             if legend_img.shape[0] == 1:

diff --git a/src/models/icy_resin_model.py b/src/models/icy_resin_model.py
@@ -51,17 +51,21 @@ def my_norm(self, data):
 
     # @override
     def inference(self, image, legend_images, data_id=-1):
-        """Image data is in CHW format. legend_images is a dictionary of label to map_unit label images in CHW format."""         
+        """
+        Args:
+            image (np.array): Image data in CHW format.
+            legend_images (list): List of map_unit swatch images in CHW format.
+            data_id (int): Data id for logging purposes.
+        
+        Returns:
+            np.array: Prediction mask in CHW format.
+        """          
         # For profiling memory usage 
         #torch.cuda.memory._record_memory_history()
 
         # Get the size of the map
         map_channels, map_height, map_width = image.shape
 
-        # Reshape maps with 1 channel images (greyscale) to 3 channels for inference
-        if map_channels == 1: # This is tmp fix!    
-            image = np.concatenate([image,image,image], axis=0)
-
         # Generate patches
         # Pad image so we get a size that can be evenly divided into patches.
         right_pad = self.patch_size - (map_width % self.patch_size)
@@ -81,15 +85,7 @@ def inference(self, image, legend_images, data_id=-1):
         map_prediction = np.zeros((1, map_height, map_width), dtype=np.float32)
         map_confidence = np.zeros((1, map_height, map_width), dtype=np.float32)
         legend_index = 1
-        for label, legend_img in legend_images.items():
-            # Debugging GPU memory usage
-            # device_num = 0
-            # alloc_mem = torch.cuda.max_memory_allocated(device_num)/(1024**3)
-            # resev_mem = torch.cuda.memory_reserved(device_num)/(1024**3)
-            # free_mem = torch.cuda.mem_get_info(device_num)[0]/(1024**3)
-            # pipeline_manager.log_to_monitor(data_id, {'GPU Mem (Alloc/Reserve/Avail)' : f'{alloc_mem:.2f}/{resev_mem:.2f}/{free_mem:.2f} GB'})
-
-            # pipeline_manager.log(logging.DEBUG, f'\t\tInferencing legend: {label}')
+        for legend_img in legend_images:
             lgd_stime = time()
             # Reshape maps with 1 channel legends (greyscale) to 3 channels for inference
             if legend_img.shape[0] == 1:

diff --git a/src/models/pipeline_pytorch_model.py b/src/models/pipeline_pytorch_model.py
@@ -35,14 +35,18 @@ def load_model(self):
 
     # Optional to override this method
     def inference(self, image, legend_images, data_id=-1):
-        """Image data is in CHW format. legend_images is a dictionary of label to map_unit label images in CHW format."""         
+        """
+        Args:
+            image (np.array): Image data in CHW format.
+            legend_images (list): List of map_unit swatch images in CHW format.
+            data_id (int): Data id for logging purposes.
+        
+        Returns:
+            np.array: Prediction mask in CHW format.
+        """        
 
         # Get the size of the map
-        map_channels, map_height, map_width = image.shape
-
-        # Reshape maps with 1 channel images (greyscale) to 3 channels for inference
-        if map_channels == 1: # This is tmp fix!
-            image = np.concatenate([image,image,image], axis=0)        
+        map_channels, map_height, map_width = image.shape   
 
         # Generate patches
         # Pad image so we get a size that can be evenly divided into patches.
@@ -63,7 +67,7 @@ def inference(self, image, legend_images, data_id=-1):
         map_prediction = np.zeros((1, map_height, map_width), dtype=np.float32)
         map_confidence = np.zeros((1, map_height, map_width), dtype=np.float32)
         legend_index = 1
-        for label, legend_img in legend_images.items():
+        for legend_img in legend_images:
             # pipeline_manager.log(logging.DEBUG, f'\t\tInferencing legend: {label}')
             lgd_stime = time()
 

diff --git a/src/pipeline_steps.py b/src/pipeline_steps.py
@@ -32,6 +32,7 @@ def load_data(data_id, image_path:str, legend_dir:str=None, layout_dir:str=None)
         if not os.path.exists(layout_path):
             layout_path = None
     map_data = io.loadCMAASMapFromFiles(image_path, legend_path, layout_path)
+    pipeline_manager.log(logging.WARNING, f'Map loaded with {len(map_data.legend.features)} Map units')
     pipeline_manager.log_to_monitor(data_id, {'Shape': map_data.image.shape})
     return map_data
 
@@ -78,11 +79,13 @@ def gen_legend(data_id, map_data:CMAAS_Map, model, max_legends=300, drab_volcano
             map_data.legend = model.inference(map_data.image, map_data.layout, data_id=data_id)
 
     # Reduce duplicates
-    legend_features = {}
-    for feature in map_data.legend.features:
-        legend_features[feature.label] = feature
-
-    map_data.legend.features = list(legend_features.values())
+    if map_data.legend.provenance.name != 'polymer': # Skip de-duplication for polymer legends
+        legend_features = {}
+        for feature in map_data.legend.features:
+            legend_features[feature.label] = feature
+    if isinstance(map_data.legend.features, dict):
+        map_data.legend.features = list(legend_features.values())
+    pipeline_manager.log(logging.WARNING, f'Map features after de duplication : {len(map_data.legend.features)} Map units')
 
     # TMP solution for maps with too many features (most likely from bad legend extraction)
     if len(map_data.legend.features) > max_legends:
@@ -105,71 +108,15 @@ def gen_legend(data_id, map_data:CMAAS_Map, model, max_legends=300, drab_volcano
 
     return map_data
 
-# def old_gen_legend(data_id, map_data:CMAAS_Map, max_legends=300, drab_volcano_legend:bool=False):
-#     from submodules.legend_extraction.src.extraction import extractLegends
-#     def convertLegendtoCMASS(legend):
-#         from cmaas_utils.types import Legend, MapUnit
-#         features = []
-#         for feature in legend:
-#             features.append(MapUnit(type=MapUnitType.POLYGON, label=feature['label'], bounding_box=feature['points']))
-#         return Legend(provenance=Provenance(name='UIUC Heuristic Model', version='0.1'), features=features)
-
-#     if map_data.legend is None:
-#         if drab_volcano_legend:
-#             map_data.legend = io.loadLegendJson('src/models/drab_volcano_legend.json')
-#         else:
-#             # Mask legend area before prediction.
-#             if map_data.layout is not None and map_data.layout.polygon_legend is not None:
-#                 image = map_data.image.transpose(1,2,0).copy()
-#                 mask = np.zeros_like(image)
-#                 cv2.fillPoly(mask, pts=[map_data.layout.polygon_legend], color=(255,255,255))
-#                 image = cv2.bitwise_and(image, mask)
-#                 image = image.transpose(2,0,1)
-#             else:
-#                 image = map_data.image
-
-#             # Generate legend
-#             pipeline_manager.log(logging.DEBUG, f'{map_data.name} - No legend data found, generating legend', pid=mp.current_process().pid)
-#             lgd = extractLegends(image.transpose(1,2,0))
-#             map_data.legend = convertLegendtoCMASS(lgd)
-
-#     # Reduce duplicates
-#     legend_features = {}
-#     for feature in map_data.legend.features:
-#         legend_features[feature.label] = feature
-
-#     map_data.legend.features = list(legend_features.values())
-
-#     # Count distribution of map units for log.
-#     pt, ln, py, un = 0,0,0,0
-#     for feature in map_data.legend.features:
-#         if feature.type == MapUnitType.POINT:
-#             pt += 1
-#         if feature.type == MapUnitType.LINE:
-#             ln += 1
-#         if feature.type == MapUnitType.POLYGON:
-#             py += 1
-#         if feature.type == MapUnitType.UNKNOWN:
-#             un += 1
-
-#     # TMP solution for maps with too many features (most likely from bad legend extraction)
-#     if len(map_data.legend.features) > max_legends:
-#         raise Exception(f'{map_data.name} - Too many features found in legend. Found {len(map_data.legend.features)} features. Max is {max_legends}')
-
-#     pipeline_manager.log(logging.DEBUG, f'{map_data.name} - Found {len(map_data.legend.features)} Total map units. ({pt} pt, {ln} ln, {py} poly, {un} unknown)', pid=mp.current_process().pid)
-#     pipeline_manager.log_to_monitor(data_id, {'Map Units': len(map_data.legend.features)})
-
-#     return map_data
-
 def save_legend(data_id, map_data:CMAAS_Map, feedback_dir:str, legend_feedback_mode:str = 'single_image'):
     # Create directory for that map
     os.makedirs(os.path.join(feedback_dir, map_data.name), exist_ok=True)
 
     # Cutout map unit labels from image
-    legend_images = {}
+    legend_images = []
     for feature in map_data.legend.features:
         min_pt, max_pt = boundingBox(feature.label_bbox) # Need this as points order can be reverse or could have quad
-        legend_images[feature.label] = map_data.image[:,min_pt[1]:max_pt[1], min_pt[0]:max_pt[0]]
+        legend_images.append((feature.label, map_data.image[:,min_pt[1]:max_pt[1], min_pt[0]:max_pt[0]]))
 
     # Save preview of legend labels
     if len(legend_images) > 0:
@@ -178,19 +125,21 @@ def save_legend(data_id, map_data:CMAAS_Map, feedback_dir:str, legend_feedback_m
             with open(os.path.join(feedback_dir, map_data.name, sanitize_filename(map_data.name + '_legend.json')), 'w') as fh:
                 fh.write(map_data.legend.model_dump_json())
         if legend_feedback_mode == 'individual_images':
-            legend_save_path = os.path.join(feedback_dir, map_data.name, sanitize_filename('lgd_' + map_data.name + '_' + feature.label + '.tif'))
-            io.saveGeoTiff(legend_save_path, legend_images[feature.label], None, None)
+            for label, image in legend_images:
+                legend_save_path = os.path.join(feedback_dir, map_data.name, sanitize_filename('lgd_' + map_data.name + '_' + label + '.tif'))
+                io.saveGeoTiff(legend_save_path, image, None, None)
         if legend_feedback_mode == 'single_image':
             cols = 4
             rows = ceil(len(legend_images)/cols)
             fig, ax = plt.subplots(rows, cols, figsize=(16,16))
             ax = ax.reshape(rows, cols) # Force 2d shape if less the 4 items
             for r,c in np.ndindex(ax.shape):
                 ax[r][c].axis('off')
-            for i, label in enumerate(legend_images):
+            for i, f_tuple in enumerate(legend_images):
+                label, image = f_tuple
                 row, col  = floor(i/cols), i%cols
                 ax[row][col].set_title(label)
-                ax[row][col].imshow(legend_images[label].transpose(1,2,0))
+                ax[row][col].imshow(image.transpose(1,2,0))
             legend_save_path = os.path.join(feedback_dir, map_data.name, sanitize_filename(map_data.name + '_labels'  + '.png'))
             fig.savefig(legend_save_path)
             plt.close(fig)
@@ -208,11 +157,11 @@ def segmentation_inference(data_id, map_data:CMAAS_Map, model, devices=None):
         model.model.to(target_device)
 
     # Cutout Legends
-    legend_images = {}
+    legend_images = []
     for feature in map_data.legend.features:
         if feature.type == model.feature_type:
             min_pt, max_pt = boundingBox(feature.label_bbox) # Need this as points order can be reverse or could have quad
-            legend_images[feature.label] = map_data.image[:,min_pt[1]:max_pt[1], min_pt[0]:max_pt[0]]
+            legend_images.append(map_data.image[:,min_pt[1]:max_pt[1], min_pt[0]:max_pt[0]])
         # else:
         #     pipeline_manager.log(logging.DEBUG, f'{map_data.name} - Skipping inference for {feature.label} as it is not a {model.feature_type.name} feature', pid=mp.current_process().pid)
 
@@ -223,6 +172,11 @@ def segmentation_inference(data_id, map_data:CMAAS_Map, model, devices=None):
         image = map_data.image
         offset = (0,0)
 
+    # Reshape maps with 1 channel images (greyscale) to 3 channels for inference
+    map_channels, map_height, map_width = image.shape
+    if map_channels == 1: 
+        image = np.concatenate([image,image,image], axis=0)
+
     # Log how many map units are being processed and the estimated time to perform inference
     est_patches = ceil(image.shape[1]/model.patch_size)*ceil(image.shape[2]/model.patch_size)
     est_time = (est_patches*len(legend_images))/model.est_patches_per_sec