refactor: cleanup describe people skill.
jws-1 committed Apr 18, 2024
1 parent 26e4db1 commit aa1d956
Showing 1 changed file with 47 additions and 143 deletions.
190 changes: 47 additions & 143 deletions skills/src/lasr_skills/describe_people.py
100755 → 100644
@@ -6,49 +6,11 @@
 import cv2_img
 import numpy as np
 
-# from colour_estimation import closest_colours, RGB_COLOURS
+from colour_estimation import closest_colours, RGB_COLOURS
 from lasr_vision_msgs.msg import BodyPixMaskRequest, ColourPrediction, FeatureWithColour
-from lasr_vision_msgs.srv import YoloDetection, BodyPixDetection, TorchFaceFeatureDetection, TorchFaceFeatureDetectionDescription
-from numpy2message import numpy2message
+from lasr_vision_msgs.srv import YoloDetection, BodyPixDetection, TorchFaceFeatureDetection
 
-from .vision import GetImage, ImageMsgToCv2, Get3DImage, PclMsgToCv2, Get2DAnd3DImages
-
-import actionlib
-import numpy as np
-from sensor_msgs.msg import PointCloud2
-from control_msgs.msg import PointHeadAction, PointHeadGoal
-from geometry_msgs.msg import PointStamped
-from pal_common_msgs.msg import DisableActionGoal, DisableAction
-
-
-# rospy.init_node('point_head_client')
-client = actionlib.SimpleActionClient("/head_controller/point_head_action", PointHeadAction) #
-rospy.logwarn('making client')
-
-def point_head_client(xyz_array, u, v, client):
-    u = 480 - 1 if u > 480 else u
-    v = 640 - 1 if v > 640 else u
-    target_point = xyz_array[v, u]
-
-    point_camera = PointStamped()
-    point_camera.header.frame_id = "xtion_rgb_optical_frame"
-    # point_camera.header.stamp = rospy.Time.now()
-    point_camera.point.x = target_point[0] if target_point[0] != np.nan else 0
-    point_camera.point.y = target_point[1] if target_point[1] != np.nan else 0
-    point_camera.point.z = target_point[2] if target_point[2] != np.nan else 0
-
-    goal = PointHeadGoal()
-    goal.target = point_camera
-    goal.max_velocity = 0.3
-    # goal.min_duration = rospy.Duration(1.0)
-    goal.pointing_frame = "head_2_link"
-    goal.pointing_axis.x = 1.0
-    goal.pointing_axis.y = 0.0
-    goal.pointing_axis.z = 0.0
-
-    rospy.logwarn('sending the goal and waiting, moving to: %s' % str(list(target_point)))
-    client.send_goal(goal)
-    rospy.logwarn('end')
+from .vision import GetImage, ImageMsgToCv2
 
 
 class DescribePeople(smach.StateMachine):
@@ -58,21 +20,16 @@ def __init__(self):
             self, outcomes=['succeeded', 'failed'], input_keys=[], output_keys=['people'])
 
         with self:
-            # smach.StateMachine.add('GET_IMAGE', GetImage(), transitions={
-            #     'succeeded': 'CONVERT_IMAGE'})
-            # smach.StateMachine.add('CONVERT_IMAGE', ImageMsgToCv2(), transitions={
-            #     'succeeded': 'SEGMENT'})
-
-            smach.StateMachine.add('GET_IMAGE', Get2DAnd3DImages(), transitions={
+            smach.StateMachine.add('GET_IMAGE', GetImage(), transitions={
                 'succeeded': 'CONVERT_IMAGE'})
-            smach.StateMachine.add('CONVERT_IMAGE', PclMsgToCv2(), transitions={
+            smach.StateMachine.add('CONVERT_IMAGE', ImageMsgToCv2(), transitions={
                 'succeeded': 'SEGMENT'})
 
             sm_con = smach.Concurrence(outcomes=['succeeded', 'failed'],
                                        default_outcome='failed',
                                        outcome_map={'succeeded': {
                                            'SEGMENT_YOLO': 'succeeded', 'SEGMENT_BODYPIX': 'succeeded'}},
-                                       input_keys=['img', 'img_msg_2d', 'img_msg_3d', 'xyz'],
+                                       input_keys=['img', 'img_msg'],
                                        output_keys=['people_detections', 'bodypix_masks'])
 
             with sm_con:
@@ -83,7 +40,7 @@ def __init__(self):
                 'succeeded': 'FEATURE_EXTRACTION'})
             smach.StateMachine.add('FEATURE_EXTRACTION', self.FeatureExtraction(), transitions={
                 'succeeded': 'succeeded'})
-
+
     class SegmentYolo(smach.State):
         '''
         Segment using YOLO
@@ -93,13 +50,13 @@ class SegmentYolo(smach.State):
 
         def __init__(self):
             smach.State.__init__(self, outcomes=['succeeded', 'failed'], input_keys=[
-                'img_msg_2d'], output_keys=['people_detections'])
+                'img_msg'], output_keys=['people_detections'])
             self.yolo = rospy.ServiceProxy('/yolov8/detect', YoloDetection)
 
         def execute(self, userdata):
             try:
                 result = self.yolo(
-                    userdata.img_msg_2d, "yolov8n-seg.pt", 0.5, 0.3)
+                    userdata.img_msg, "yolov8n-seg.pt", 0.5, 0.3)
                 userdata.people_detections = [
                     det for det in result.detected_objects if det.name == "person"]
                 return 'succeeded'
@@ -116,7 +73,7 @@ class SegmentBodypix(smach.State):
 
         def __init__(self):
             smach.State.__init__(self, outcomes=['succeeded', 'failed'], input_keys=[
-                'img_msg_2d', 'xyz'], output_keys=['bodypix_masks'])
+                'img_msg'], output_keys=['bodypix_masks'])
             self.bodypix = rospy.ServiceProxy(
                 '/bodypix/detect', BodyPixDetection)
 
@@ -130,18 +87,8 @@ def execute(self, userdata):
 
                 masks = [torso, head]
 
-                result = self.bodypix(userdata.img_msg_2d, "resnet50", 0.7, masks)
+                result = self.bodypix(userdata.img_msg, "resnet50", 0.7, masks)
                 userdata.bodypix_masks = result.masks
-                rospy.loginfo("Found:::%s" % str(len(result.poses)))
-                try:
-                    neck_coord = (int(result.poses[0].coord[0]), int(result.poses[0].coord[1]))
-                except Exception:
-                    neck_coord = (240, 320)
-                rospy.loginfo("COORD_XY:::%s" % str(neck_coord))
-                xyz = userdata.xyz
-                # xyz = np.nanmean(xyz, axis=2)
-                # rospy.loginfo("COORD_Z:::%s" % str(xyz[neck_coord[0]][neck_coord[1]]))
-                # point_head_client(xyz, neck_coord[0], neck_coord[1], client)
                 return 'succeeded'
             except rospy.ServiceException as e:
                 rospy.logwarn(f"Unable to perform inference. ({str(e)})")
@@ -158,10 +105,9 @@ def __init__(self):
             smach.State.__init__(self, outcomes=['succeeded', 'failed'], input_keys=[
                 'img', 'people_detections', 'bodypix_masks'], output_keys=['people'])
             self.torch_face_features = rospy.ServiceProxy(
-                '/torch/detect/face_features', TorchFaceFeatureDetectionDescription)
+                '/torch/detect/face_features', TorchFaceFeatureDetection)
 
         def execute(self, userdata):
-            #try:
             if len(userdata.people_detections) == 0:
                 rospy.logerr("Couldn't find anyone!")
                 return 'failed'
@@ -187,14 +133,14 @@ def execute(self, userdata):
                     [contours]), color=(255, 255, 255))
                 mask_bin = mask_image > 128
 
-                # # keep track
-                # features = []
+                # keep track
+                features = []
 
                 # process part masks
                 for (bodypix_mask, part) in zip(userdata.bodypix_masks, ['torso', 'head']):
                     part_mask = np.array(bodypix_mask.mask).reshape(
                         bodypix_mask.shape[0], bodypix_mask.shape[1])
 
                     # filter out part for current person segmentation
                     try:
                         part_mask[mask_bin == 0] = 0
@@ -209,82 +155,42 @@ def execute(self, userdata):
                             f'|> Person does not have {part} visible')
                         continue
 
                     # do colour processing on the torso
                     if part == 'torso':
-                        torso_mask = part_mask
-                    elif part == 'head':
-                        head_mask = part_mask
-
-                torso_mask_data, torso_mask_shape, torso_mask_dtype = numpy2message(torso_mask)
-                head_mask_data, head_mask_shape, head_mask_dtype = numpy2message(head_mask)
-
-                full_frame = cv2_img.cv2_img_to_msg(img)
-                # features.extend(self.torch_face_features(
-                #     full_frame,
-                #     head_mask_data, head_mask_shape, head_mask_dtype,
-                #     torso_mask_data, torso_mask_shape, torso_mask_dtype,
-                # ).detected_features)
-
-                rst = self.torch_face_features(
-                    full_frame,
-                    head_mask_data, head_mask_shape, head_mask_dtype,
-                    torso_mask_data, torso_mask_shape, torso_mask_dtype,
-                ).description
-
-                # # process part masks
-                # for (bodypix_mask, part) in zip(userdata.bodypix_masks, ['torso', 'head']):
-                #     part_mask = np.array(bodypix_mask.mask).reshape(
-                #         bodypix_mask.shape[0], bodypix_mask.shape[1])
-
-                #     # filter out part for current person segmentation
-                #     try:
-                #         part_mask[mask_bin == 0] = 0
-                #     except Exception:
-                #         rospy.logdebug('|> Failed to check {part} is visible')
-                #         continue
-
-                #     if part_mask.any():
-                #         rospy.logdebug(f'|> Person has {part} visible')
-                #     else:
-                #         rospy.logdebug(
-                #             f'|> Person does not have {part} visible')
-                #         continue
-
-                #     # do colour processing on the torso
-                #     if part == 'torso':
-                #         try:
-                #             features.append(FeatureWithColour("torso", [
-                #                 ColourPrediction(colour, distance)
-                #                 for colour, distance
-                #                 in closest_colours(np.median(img[part_mask == 1], axis=0), RGB_COLOURS)
-                #             ]))
-                #         except Exception as e:
-                #             rospy.logerr(f"Failed to process colour: {e}")
-
-                #     # do feature extraction on the head
-                #     if part == 'head':
-                #         try:
-                #             # crop out face
-                #             face_mask = np.array(userdata.bodypix_masks[1].mask).reshape(
-                #                 userdata.bodypix_masks[1].shape[0], userdata.bodypix_masks[1].shape[1])
-
-                #             mask_image_only_face = mask_image.copy()
-                #             mask_image_only_face[face_mask == 0] = 0
-
-                #             face_region = cv2_img.extract_mask_region(
-                #                 img, mask_image_only_face)
-                #             if face_region is None:
-                #                 raise Exception(
-                #                     "Failed to extract mask region")
-
-                #             msg = cv2_img.cv2_img_to_msg(face_region)
-                #             features.extend(self.torch_face_features(
-                #                 msg, False).detected_features)
-                #         except Exception as e:
-                #             rospy.logerr(f"Failed to process extraction: {e}")
+                        try:
+                            features.append(FeatureWithColour("torso", [
+                                ColourPrediction(colour, distance)
+                                for colour, distance
+                                in closest_colours(np.median(img[part_mask == 1], axis=0), RGB_COLOURS)
+                            ]))
+                        except Exception as e:
+                            rospy.logerr(f"Failed to process colour: {e}")
+
+                    # do feature extraction on the head
+                    if part == 'head':
+                        try:
+                            # crop out face
+                            face_mask = np.array(userdata.bodypix_masks[1].mask).reshape(
+                                userdata.bodypix_masks[1].shape[0], userdata.bodypix_masks[1].shape[1])
+
+                            mask_image_only_face = mask_image.copy()
+                            mask_image_only_face[face_mask == 0] = 0
+
+                            face_region = cv2_img.extract_mask_region(
+                                img, mask_image_only_face)
+                            if face_region is None:
+                                raise Exception(
+                                    "Failed to extract mask region")
+
+                            msg = cv2_img.cv2_img_to_msg(face_region)
+                            features.extend(self.torch_face_features(
+                                msg).detected_features)
+                        except Exception as e:
+                            rospy.logerr(f"Failed to process extraction: {e}")
+
                 people.append({
                     'detection': person,
-                    'features': rst
+                    'features': features
                 })
 
             # Userdata:
@@ -295,6 +201,4 @@ def execute(self, userdata):
             #         - mask
 
             userdata['people'] = people
-            # except Exception:
-            #     return 'failed'
             return 'succeeded'
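
For context, a minimal sketch of how the cleaned-up skill might be invoked from a ROS node; the import path, node name, and logging below are illustrative assumptions, not code from this commit:

# Usage sketch (assumptions: a ROS master is running, lasr_skills exports
# DescribePeople, and the /yolov8, /bodypix and /torch services are up).
import rospy
from lasr_skills import DescribePeople

rospy.init_node('describe_people_demo')  # hypothetical node name

sm = DescribePeople()
outcome = sm.execute()  # GET_IMAGE -> CONVERT_IMAGE -> SEGMENT -> FEATURE_EXTRACTION

if outcome == 'succeeded':
    # 'people' is the state machine's declared output key
    for person in sm.userdata.people:
        rospy.loginfo("person features: %s" % str(person['features']))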
