From 2bd11f3de315775da6347b5010cc135aeec735b7 Mon Sep 17 00:00:00 2001
From: yichao-liang <yichao-liang>
Date: Thu, 12 Dec 2024 08:42:29 -0500
Subject: [PATCH] plug + make coffee working

---
 predicators/envs/coffee.py                    |  10 +-
 predicators/envs/pybullet_coffee.py           | 179 +++++++++++++++---
 .../ground_truth_models/coffee/nsrts.py       |   7 +-
 .../ground_truth_models/coffee/options.py     |  76 +++++++-
 predicators/option_model.py                   |   4 +-
 predicators/planning.py                       |   1 +
 predicators/utils.py                          |   4 +-
 7 files changed, 241 insertions(+), 40 deletions(-)
diff --git a/predicators/envs/coffee.py b/predicators/envs/coffee.py
index d58b803a1..4ebc0c486 100644
--- a/predicators/envs/coffee.py
+++ b/predicators/envs/coffee.py
@@ -484,8 +484,13 @@ def _get_tasks(self,
                 num_cups = num_cups_lst[rng.choice(len(num_cups_lst))]
             cups = [Object(f"cup{i}", self._cup_type) for i in range(num_cups)]
             if CFG.coffee_simple_tasks:
-                # goal = {GroundAtom(self._JugFilled, [self._jug])}
-                goal = {GroundAtom(self._PluggedIn, [self._plug])}
+                # goal = {
+                # }
+                goal = {
+                    GroundAtom(self._JugFilled, [self._jug]),
+                    # GroundAtom(self._PluggedIn, [self._plug]),
+                    # GroundAtom(self._JugInMachine, [self._jug, self._machine]),
+                    }
             else:
                 goal = {GroundAtom(self._CupFilled, [c]) for c in cups}
             # Sample initial positions for cups, making sure to keep them
@@ -671,6 +676,7 @@ def _NotAboveCup_holds(self, state: State,
     def _PressingButton_holds(self, state: State,
                               objects: Sequence[Object]) -> bool:
         robot, _ = objects
+        # have a tighter threshold for x, z than y
         button_pos = (self.button_x, self.button_y, self.button_z)
         x = state.get(robot, "x")
         y = state.get(robot, "y")
diff --git a/predicators/envs/pybullet_coffee.py b/predicators/envs/pybullet_coffee.py
index 5069898b2..801c5a88d 100644
--- a/predicators/envs/pybullet_coffee.py
+++ b/predicators/envs/pybullet_coffee.py
@@ -28,7 +28,7 @@
 python predicators/main.py --env pybullet_coffee --approach oracle --seed 0 \
 --coffee_rotated_jug_ratio 0.5 \
 --sesame_check_expected_atoms False --coffee_jug_pickable_pred True \
---pybullet_control_mode "reset" --coffee_twist_sampler False \
+--coffee_twist_sampler False \
 --make_test_videos --num_test_tasks 1 --video_fps 20 \
 --pybullet_camera_height 300 --pybullet_camera_width 300 \
 --coffee_render_grid_world False --coffee_simple_tasks True \
@@ -36,7 +36,8 @@
 --coffee_move_back_after_place_and_push True \
 --coffee_machine_has_plug True --sesame_max_skeletons_optimized 1 \
 --make_failure_videos \
---debug --horizon 50 --option_model_terminate_on_repeat False
+--debug --horizon 100 --option_model_terminate_on_repeat False \
+--pybullet_sim_steps_per_action 100 --max_num_steps_option_rollout 50
 """
 import math
 import logging
@@ -99,7 +100,7 @@ class PyBulletCoffeeEnv(PyBulletEnv, CoffeeEnv):
     machine_y_len: ClassVar[float] = 0.15 * (y_ub - y_lb)
     machine_z_len: ClassVar[float] = 0.5 * (z_ub - z_lb)
     machine_top_y_len: ClassVar[float] = 1.3 * machine_y_len
-    machine_x: ClassVar[float] = x_ub - machine_x_len / 2 - init_padding
+    machine_x: ClassVar[float] = x_ub - machine_x_len / 2 - init_padding 
     machine_y: ClassVar[float] = y_ub - machine_y_len / 2 - init_padding
     button_radius: ClassVar[float] = 0.6 * machine_y_len
     button_height = button_radius / 4
@@ -107,7 +108,7 @@ class PyBulletCoffeeEnv(PyBulletEnv, CoffeeEnv):
     button_y: ClassVar[float] =\
         machine_y - machine_y_len / 2 - machine_top_y_len - button_height/2
     button_z: ClassVar[float] = z_lb + machine_z_len - button_radius
-    button_press_threshold: ClassVar[float] = 1e-3
+    button_press_threshold: ClassVar[float] = 1e-2
     machine_color: ClassVar[Tuple[float, float, float, float]] =\
         (0.1, 0.1, 0.1, 1) # Black
     button_color_on: ClassVar[Tuple[float, float, float,
@@ -115,11 +116,14 @@ class PyBulletCoffeeEnv(PyBulletEnv, CoffeeEnv):
     plate_color_on: ClassVar[Tuple[float, float, float, float]] = machine_color
     button_color_off: ClassVar[Tuple[float, float, float,
                                      float]] = (0.5, 0.2, 0.2, 1.0)
+    button_color_power_off: ClassVar[Tuple[float, float, float,
+                                     float]] = (.25, .25, .25, 1.0)
     plate_color_off: ClassVar[Tuple[float, float, float,
                                     float]] = machine_color
     # Jug setting
     jug_radius: ClassVar[float] = 0.3 * machine_y_len
-    jug_height: ClassVar[float] = 0.15 * (z_ub - z_lb)  # kettle urdf
+    jug_height: ClassVar[float] = 0.19 * (z_ub - z_lb)  # kettle urdf
+    # jug_height: ClassVar[float] = 0.z_lb)  # kettle urdf
     jug_init_x_lb: ClassVar[
         float] = machine_x - machine_x_len / 2 + init_padding
     jug_init_x_ub: ClassVar[
@@ -141,7 +145,7 @@ class PyBulletCoffeeEnv(PyBulletEnv, CoffeeEnv):
     dispense_area_x: ClassVar[float] = machine_x
     dispense_area_y: ClassVar[float] = machine_y - 5 * jug_radius
     dispense_radius = 2 * jug_radius
-    dispense_height = 0.005
+    dispense_height = 0.0001
     # Cup settings.
     cup_radius: ClassVar[float] = 0.6 * jug_radius
     cup_init_x_lb: ClassVar[float] = x_lb + cup_radius + init_padding
@@ -173,7 +177,7 @@ class PyBulletCoffeeEnv(PyBulletEnv, CoffeeEnv):
     plug_z = cord_start_z
     # Socket settings.
     socket_height: ClassVar[float] = 0.1
-    socket_width: ClassVar[float] = 0.1
+    socket_width: ClassVar[float] = 0.05
     socket_depth: ClassVar[float] = 0.01
     socket_x: ClassVar[float] = (x_lb + x_ub) / 2
     socket_y: ClassVar[float] = machine_y
@@ -204,11 +208,13 @@ def __init__(self, use_gui: bool = True) -> None:
             # Camera parameters -- standard
             self._camera_distance: ClassVar[float] = 1.3
             if CFG.coffee_machine_has_plug:
-                # self._camera_yaw: ClassVar[float] = -70
-                self._camera_yaw: ClassVar[float] = -100
+                self._camera_yaw: ClassVar[float] = -60
+                # self._camera_yaw: ClassVar[float] = -100
+                # self._camera_yaw: ClassVar[float] = -180
             else:
                 self._camera_yaw: ClassVar[float] = 70
             self._camera_pitch: ClassVar[float] = -38  # lower
+            # self._camera_pitch: ClassVar[float] = 0  # even lower
             self._camera_target: ClassVar[Pose3D] = (0.75, 1.25, 0.42)
 
         # Camera font view parameters.
@@ -405,8 +411,14 @@ def _reset_state(self, state: State) -> None:
             button_color = self.button_color_on
             plate_color = self.plate_color_on
         else:
-            button_color = self.button_color_off
-            plate_color = self.plate_color_off
+            if CFG.coffee_machine_has_plug and \
+                self._PluggedIn_holds(state, [self._plug]):
+                button_color = self.button_color_off
+                plate_color = self.plate_color_off
+            else:
+                button_color = self.button_color_power_off
+                plate_color = self.plate_color_off
+
         p.changeVisualShape(self._button_id,
                             -1,
                             rgbaColor=button_color,
@@ -562,7 +574,8 @@ def step(self, action: Action, render_obs: bool = False) -> State:
                 quat,
                 physicsClientId=self._physics_client_id)
         
-        if self._PluggedIn_holds(state, [self._plug]) and \
+        if CFG.coffee_machine_has_plug and \
+            self._PluggedIn_holds(state, [self._plug]) and \
             self._machine_plugged_in_id is None:
             # logging.debug("[env] plug in the machine")
             # Create a constraint between plug and socket
@@ -576,6 +589,14 @@ def step(self, action: Action, render_obs: bool = False) -> State:
                 parentFramePosition=[0, 0, 0],
                 childFramePosition=[0, 0, 0],
             )
+            p.changeVisualShape(self._button_id,
+                                -1,
+                                rgbaColor=self.button_color_off,
+                                physicsClientId=self._physics_client_id)
+            p.changeVisualShape(self._button_id,
+                                0,
+                                rgbaColor=self.button_color_off,
+                                physicsClientId=self._physics_client_id)
 
         # If the robot is sufficiently close to the button, turn on the machine
         # and update the status of the jug.
@@ -666,7 +687,10 @@ def _load_task_from_json(self, json_file: Path) -> EnvironmentTask:
         return self._add_pybullet_state_to_tasks([task])[0]
 
     def _get_object_ids_for_held_check(self) -> List[int]:
-        return [self._jug_id, self._plug_id]
+        if CFG.coffee_machine_has_plug:
+            return [self._jug_id, self._plug_id]
+        else:
+            return [self._jug_id]
 
     def _get_expected_finger_normals(self) -> Dict[int, Array]:
         if CFG.pybullet_robot == "fetch":
@@ -769,8 +793,8 @@ def _create_pybullet_liquid_for_cup(self, cup: Object,
                                  physicsClientId=self._physics_client_id)
 
     def _create_pybullet_liquid_for_jug(self) -> Optional[int]:
-        liquid_height = self.jug_height * 0.7
-        liquid_radius = self.jug_radius * 1.5
+        liquid_height = self.jug_height * 0.6
+        liquid_radius = self.jug_radius * 1.3
 
         collision_id = p.createCollisionShape(
             p.GEOM_CYLINDER,
@@ -783,7 +807,7 @@ def _create_pybullet_liquid_for_jug(self) -> Optional[int]:
             radius=liquid_radius,
             length=liquid_height,
             # rgbaColor=(0.2 * 1.5, 0.05 * 1.5, 0.0, 1.0), # brown
-            rgbaColor=(0.8, 0, 0, 1.0), # red
+            rgbaColor=(0.35, 0.1, 0.0, 1.0),
             physicsClientId=self._physics_client_id)
 
         pose, orientation = p.getBasePositionAndOrientation(
@@ -845,7 +869,8 @@ def _add_pybullet_coffee_machine(cls, physics_client_id) -> int:
         # Define the dimensions for the dispense area
         half_extents_dispense_base = (cls.machine_x_len,
                                       1.1 * cls.dispense_radius + cls.jug_radius +
-                                      0.003, cls.dispense_height)
+                                      0.003, 
+                                      cls.dispense_height)
         collision_id_dispense_base = p.createCollisionShape(
             p.GEOM_BOX,
             halfExtents=half_extents_dispense_base,
@@ -950,7 +975,8 @@ def _add_pybullet_machine_button(cls, physics_client_id) -> int:
             p.GEOM_CYLINDER,
             radius=cls.button_radius,
             length=cls.button_height,
-            rgbaColor=cls.button_color_off,
+            rgbaColor=cls.button_color_power_off if \
+                CFG.coffee_machine_has_plug else cls.button_color_off,
             physicsClientId=physics_client_id)
 
         if CFG.coffee_machine_have_light_bar:
@@ -1012,9 +1038,8 @@ def _add_pybullet_jug(cls, physics_client_id) -> int:
         p.configureDebugVisualizer(p.COV_ENABLE_RENDERING, 0)
         jug_id = p.loadURDF(
             utils.get_env_asset_path("urdf/kettle.urdf"),
-            useFixedBase=True,
-            # globalScaling=0.075, # original jug
             globalScaling=0.09,  # enlarged jug
+            useFixedBase=False,
             physicsClientId=physics_client_id)
 
         p.changeVisualShape(jug_id,
@@ -1026,13 +1051,110 @@ def _add_pybullet_jug(cls, physics_client_id) -> int:
                             1,
                             rgbaColor=[1, 1, 1, 0],
                             physicsClientId=physics_client_id)
+        p.changeDynamics(
+            bodyUniqueId=jug_id,
+            linkIndex=-1,  # -1 for the base link
+            mass=0.1,
+            physicsClientId=physics_client_id
+        )
+
+        # new cup
+        # jug_id = cls.create_cup(physics_client_id)
         p.resetBasePositionAndOrientation(jug_id,
                                           jug_pose,
                                           jug_orientation,
                                           physicsClientId=physics_client_id)
+
         return jug_id
 
     @classmethod
+    def create_cup(cls, physics_client_id, scale=0.16):
+        # Parameters
+        cup_thickness = 0.1 * scale # Wall thickness
+        cup_width = 5 * cup_thickness  # Width of the cup
+        cup_height = 4 * cup_thickness  # Height of the cup
+        handle_x_len = 3 * cup_thickness
+        handle_y_len = cup_thickness
+        handle_z_len = 3 * cup_thickness
+        handle_x = cup_width / 2 + handle_x_len / 2  # Offset for the handle
+        handle_z = cup_height / 2 # Offset for the handle
+
+        # Base position
+        base_position = [0, 0, 0]
+
+        # Shape IDs for different parts
+        visual_shapes = []
+        collision_shapes = []
+        base_positions = []
+
+        # Base of the cup
+        visual_shapes.append(
+            p.createVisualShape(
+                p.GEOM_BOX,
+                halfExtents=[cup_width / 2, cup_width / 2, cup_thickness / 2]))
+        collision_shapes.append(
+            p.createCollisionShape(
+                p.GEOM_BOX,
+                halfExtents=[cup_width / 2, cup_width / 2, cup_thickness / 2]))
+        base_positions.append(base_position)
+
+        # Walls
+        wall_half_extents = [cup_width / 2, cup_thickness / 2, cup_height / 2]
+        visual_shapes.extend([
+            p.createVisualShape(p.GEOM_BOX, halfExtents=wall_half_extents),
+            p.createVisualShape(p.GEOM_BOX, halfExtents=wall_half_extents),
+            p.createVisualShape(
+                p.GEOM_BOX,
+                halfExtents=[cup_thickness / 2, cup_width / 2, cup_height / 2]),
+            p.createVisualShape(
+                p.GEOM_BOX,
+                halfExtents=[cup_thickness / 2, cup_width / 2, cup_height / 2]),
+        ])
+        collision_shapes.extend([
+            p.createCollisionShape(p.GEOM_BOX, halfExtents=wall_half_extents),
+            p.createCollisionShape(p.GEOM_BOX, halfExtents=wall_half_extents),
+            p.createCollisionShape(
+                p.GEOM_BOX,
+                halfExtents=[cup_thickness / 2, cup_width / 2, cup_height / 2]),
+            p.createCollisionShape(
+                p.GEOM_BOX,
+                halfExtents=[cup_thickness / 2, cup_width / 2, cup_height / 2]),
+        ])
+        base_positions.extend([
+            [0, -cup_width / 2 + cup_thickness / 2, cup_height / 2],
+            [0, cup_width / 2 - cup_thickness / 2, cup_height / 2],
+            [-cup_width / 2 + cup_thickness / 2, 0, cup_height / 2],
+            [cup_width / 2 - cup_thickness / 2, 0, cup_height / 2],
+        ])
+
+        # Handle
+        handle_extents = [handle_x_len / 2, handle_y_len / 2, handle_z_len / 2]
+        visual_shapes.append(
+            p.createVisualShape(p.GEOM_BOX, halfExtents=handle_extents))
+        collision_shapes.append(
+            p.createCollisionShape(p.GEOM_BOX, halfExtents=handle_extents))
+        base_positions.append([handle_x, 0, handle_z])
+
+        # Combine all into a single multi-body object
+        cup_id = p.createMultiBody(
+            baseMass=0.02,
+            baseCollisionShapeIndex=-1,  # No collision for the base
+            baseVisualShapeIndex=-1,  # No visual for the base
+            basePosition=[0, 0, 0],
+            linkMasses=[0.02] * len(collision_shapes),  # Static links
+            linkCollisionShapeIndices=collision_shapes,
+            linkVisualShapeIndices=visual_shapes,
+            linkPositions=base_positions,
+            linkOrientations=[[0, 0, 0, 1]] * len(collision_shapes),
+            linkInertialFramePositions=[[0, 0, 0]] * len(collision_shapes),
+            linkInertialFrameOrientations=[[0, 0, 0, 1]] * len(collision_shapes),
+            linkParentIndices=[0] * len(collision_shapes),
+            linkJointTypes=[p.JOINT_FIXED] * len(collision_shapes),
+            linkJointAxis=[[0, 0, 0]] * len(collision_shapes),
+            physicsClientId=physics_client_id
+        )
+        return cup_id
+    @classmethod
     def _add_pybullet_table(cls, physics_client_id) -> int:
         table_id = p.loadURDF(utils.get_env_asset_path("urdf/table.urdf"),
                               useFixedBase=True,
@@ -1068,11 +1190,12 @@ def _add_pybullet_cord(cls, physics_client_id) -> List[int]:
             # Set color: Red for the first link, Blue for the last link, and 
             # Black for others
             if i == 0:
-                color = [1, 0, 0, 1]  # Red
+                color = [0, 0, 0, 1]  # Black
             elif i == cls.num_cord_links - 1:
-                color = [0, 0, 1, 1]  # Blue
+                # color = [0, 0, 1, 1]  # Blue
+                color = [1, 0, 0, 1]  # Red
             else:
-                color = [0, 0, 0, 1]  # Black
+                color = [139/255, 0, 0, 1]  # Black
 
             # Create collision and visual shapes
             segment = p.createCollisionShape(p.GEOM_BOX, 
@@ -1114,11 +1237,11 @@ def _add_pybullet_cord(cls, physics_client_id) -> List[int]:
                 childFramePosition=[cls.cord_link_length / 2 + half_gap, 0, 0]
             )
             # Adjust constraint parameters for softness
-            p.changeConstraint(
-                constraint_id,
-                maxForce=0.1,    # Lower max force for flexibility
-                erp=0.1         # Adjust error reduction parameter
-            )
+            # p.changeConstraint(
+            #     constraint_id,
+            #     maxForce=0.1,    # Lower max force for flexibility
+            #     erp=0.1         # Adjust error reduction parameter
+            # )
         # for i in range(len(segments) - 1):
         #     p.createConstraint(
         #         parentBodyUniqueId=segments[i],
diff --git a/predicators/ground_truth_models/coffee/nsrts.py b/predicators/ground_truth_models/coffee/nsrts.py
index 2d847e6fc..c6b3292df 100644
--- a/predicators/ground_truth_models/coffee/nsrts.py
+++ b/predicators/ground_truth_models/coffee/nsrts.py
@@ -63,11 +63,14 @@ def get_nsrts(env_name: str, types: Dict[str, Type],
             # PlugIn
             plug = Variable("?plug", plug_type)
             robot = Variable("?robot", robot_type)
-            parameters = [robot, plug]
+            jug = Variable("?jug", jug_type)
+            parameters = [robot, plug, jug]
             option_vars = [robot, plug]
             option = options["PlugIn"]
             preconditions = {
-                LiftedAtom(HandEmpty, [robot])
+                LiftedAtom(HandEmpty, [robot]),
+                LiftedAtom(OnTable, [jug]), 
+                # just a limitation of the current controller
             }
             add_effects = {
                 LiftedAtom(PluggedIn, [plug]),
diff --git a/predicators/ground_truth_models/coffee/options.py b/predicators/ground_truth_models/coffee/options.py
index 63f92e061..7a473f268 100644
--- a/predicators/ground_truth_models/coffee/options.py
+++ b/predicators/ground_truth_models/coffee/options.py
@@ -167,7 +167,17 @@ def _TurnMachineOn_terminal(state: State, memory: Dict,
             terminal=_TurnMachineOn_terminal)
         cls.TurnMachineOn = TurnMachineOn
 
+
         if CFG.coffee_machine_has_plug:
+
+            RestoreForPlugIn = ParameterizedOption(
+                "RestoreForPlugIn",
+                types=[robot_type, plug_type],
+                params_space=Box(0, 1, (0, )),
+                policy=cls._create_move_to_initial_position_policy(),
+                initiable=lambda s, m, o, p: True,
+                terminal=cls._Restore_terminal)
+
             # Plug in the plug to the socket
             def _PlugIn_initiable(state: State, memory: Dict,
                             objects: Sequence[Object], params: Array) -> bool:
@@ -183,7 +193,7 @@ def _PlugIn_terminal(state: State, memory: Dict,
                     finger_open = state.get(robot, "fingers") > 0.3
                     return PluggedIn.holds(state, [plug]) and finger_open
 
-            PlugIn = ParameterizedOption(
+            _PlugIn = ParameterizedOption(
                 "PlugIn",
                 types=[robot_type, plug_type],
                 params_space=Box(0, 1, (0, )),
@@ -191,6 +201,12 @@ def _PlugIn_terminal(state: State, memory: Dict,
                 initiable=_PlugIn_initiable,
                 terminal=_PlugIn_terminal)
 
+            PlugIn = utils.LinearChainParameterizedOption(
+                "PlugIn", [RestoreForPlugIn, _PlugIn, RestoreForPlugIn])
+            
+            
+
+
 
         # Pour
         def _Pour_initiable(state: State, memory: Dict,
@@ -213,10 +229,27 @@ def _Pour_terminal(state: State, memory: Dict,
             initiable=_Pour_initiable,
             terminal=_Pour_terminal)
 
-        return {
+        options = {
             PickJug, PlaceJugInMachine, TurnMachineOn, Pour, MoveToTwistJug,
-            TwistJug, PlugIn
+            TwistJug
         }
+        if CFG.coffee_machine_has_plug:
+            options.add(PlugIn)
+        return options
+
+    @classmethod
+    def _Restore_terminal(cls, state: State, memory: Dict,
+                                objects: Sequence[Object],
+                                params: Array) -> bool:
+        del memory, params
+        robot = objects[0]
+        robot_pos = (state.get(robot, "x"),
+                        state.get(robot, "y"),
+                        state.get(robot, "z"))
+        robot_init_pos = (cls.env_cls.robot_init_x,
+                            cls.env_cls.robot_init_y,
+                            cls.env_cls.robot_init_z)
+        return np.allclose(robot_pos, robot_init_pos, atol=1e-2)
 
     @classmethod
     def _create_move_to_twist_policy(cls) -> ParameterizedPolicy:
@@ -386,6 +419,30 @@ def policy(state: State, memory: Dict, objects: Sequence[Object],
                                         robot_pos)
 
         return policy
+    
+    @classmethod
+    def _create_move_to_initial_position_policy(cls) -> ParameterizedPolicy:
+
+        def policy(state: State, memory: Dict, objects: Sequence[Object],
+                   params: Array) -> Action:
+            # This policy moves the robot to the initial position
+            del memory, params
+            robot = objects[0]
+            robot_pos = (state.get(robot, "x"),
+                            state.get(robot, "y"),
+                            state.get(robot, "z"))
+            target_pos = (cls.env_cls.robot_init_x,
+                            cls.env_cls.robot_init_y,
+                            cls.env_cls.robot_init_z)
+            robot_tilt = state.get(robot, "tilt")
+            robot_wrists = state.get(robot, "wrist")
+            target_tilt = cls.env_cls.robot_init_tilt
+            target_wrists = cls.env_cls.robot_init_wrist
+            return cls._get_move_action(state, target_pos, robot_pos,
+                                        dtilt=target_tilt - robot_tilt,
+                                        dwrist=target_wrists - robot_wrists,
+                                        finger_status="open")
+        return policy
 
     @classmethod
     def _create_pour_policy(cls) -> ParameterizedPolicy:
@@ -711,8 +768,14 @@ def policy(state: State, memory: Dict, objects: Sequence[Object],
                                             finger_status="closed",
                                             dwrist=dwrist)
 
+            # When moving toward the plug, first map to the correct x-y location
+            # at the initial height(z), then move down to pick up the plug
+            xy_sq_dist = np.sum(np.subtract(plug_pos[:2], robot_pos[:2])**2)
+            if xy_sq_dist > 0.01:
+                target_robot_pos = (plug_x, plug_y, cls.env_cls.socket_z)
+            else:
+                target_robot_pos = plug_pos
             # When the gripper is far away from the plug, move to it
-            target_robot_pos = plug_pos
             target_wrist = 0
             dwrist = np.clip(target_wrist - wrist, 
                              -cls.env_cls.max_angular_vel,
@@ -738,6 +801,8 @@ def policy(state: State, memory: Dict, objects: Sequence[Object],
             x = state.get(robot, "x")
             y = state.get(robot, "y")
             z = state.get(robot, "z")
+            wrist = state.get(robot, "wrist")
+            dwrist = cls.env_cls.robot_init_wrist - wrist
             robot_pos = (x, y, z)
             # target_x = cls.env_cls.robot_init_x
             target_x = x
@@ -746,7 +811,8 @@ def policy(state: State, memory: Dict, objects: Sequence[Object],
             # target_z = cls.env_cls.robot_init_z
             target_z = z
             target_pos = (target_x, target_y, target_z)
-            return cls._get_move_action(state, target_pos, robot_pos)
+            return cls._get_move_action(state, target_pos, robot_pos, 
+                                        dwrist=dwrist)
 
         return policy
 
diff --git a/predicators/option_model.py b/predicators/option_model.py
index 908792c21..59529b4a6 100644
--- a/predicators/option_model.py
+++ b/predicators/option_model.py
@@ -105,10 +105,10 @@ def get_next_state_and_num_actions(self, state: State,
             def _terminal(s: State) -> bool:
                 nonlocal last_state
                 if option_copy.terminal(s):
-                    # logging.debug("Option reached terminal state.")
+                    logging.debug("Option reached terminal state.")
                     return True
                 if last_state is not DefaultState and last_state.allclose(s):
-                    # logging.debug("Option got stuck.")
+                    logging.debug("Option got stuck.")
                     raise utils.OptionExecutionFailure("Option got stuck.")
                 last_state = s
                 return False
diff --git a/predicators/planning.py b/predicators/planning.py
index ab4022226..20d1e7c9b 100644
--- a/predicators/planning.py
+++ b/predicators/planning.py
@@ -681,6 +681,7 @@ def run_low_level_search(
                                     longest_failed_refinement
                                 })
                     return longest_failed_refinement, False
+        logging.debug("Option succeed!")
     # Should only get here if the skeleton was empty.
     assert not skeleton
     return [], True
diff --git a/predicators/utils.py b/predicators/utils.py
index 7e629680f..b7f9efb2b 100644
--- a/predicators/utils.py
+++ b/predicators/utils.py
@@ -1202,7 +1202,8 @@ def run_policy_with_simulator(
     actions: List[Action] = []
     exception_raised_in_step = False
     if not termination_function(state):
-        for _ in range(max_num_steps):
+        for i in range(max_num_steps):
+            logging.debug(f"Step {i}")
             # logging.debug(f"State: {state.pretty_str()}")
             monitor_observed = False
             exception_raised_in_step = False
@@ -1216,6 +1217,7 @@ def run_policy_with_simulator(
                 actions.append(act)
                 states.append(state)
             except Exception as e:
+                logging.debug(f"Exception during running policy: {e}")
                 if exceptions_to_break_on is not None and \
                     type(e) in exceptions_to_break_on:
                     if monitor_observed: