예제 #1
0
class HandDrawerEnv(BaseEnv):
    def __init__(self,
                 config_file,
                 model_id=None,
                 mode='headless',
                 action_timestep=1 / 10.0,
                 physics_timestep=1 / 240.0,
                 automatic_reset=False,
                 device_idx=0,
                 render_to_tensor=False):
        """
        :param config_file: config_file path
        :param model_id: override model_id in config file
        :param mode: headless or gui mode
        :param action_timestep: environment executes action per action_timestep second
        :param physics_timestep: physics timestep for pybullet
        :param device_idx: device_idx: which GPU to run the simulation and rendering on
        """
        self.config = parse_config(config_file)
        if model_id is not None:
            self.config['model_id'] = model_id

        # gibson external camera
        self.initial_pos = np.array([0, 1.3, 4])
        self.initial_view_direction = np.array([0, 0, -1])
        self.up = np.array([0, 1, 0])

        # output res for RL
        self.out_image_height = 84
        self.out_image_width = 84

        # class: stadium=0, robot=1, drawer=2, handle=3
        self.num_object_classes = 4
        self.automatic_reset = automatic_reset
        self.mode = mode
        self.action_timestep = action_timestep
        self.physics_timestep = physics_timestep
        self.simulator = Simulator(
            mode=mode,
            gravity=0,
            timestep=physics_timestep,
            use_fisheye=self.config.get('fisheye', False),
            image_width=self.config.get('image_width', 128),
            image_height=self.config.get('image_height', 128),
            vertical_fov=self.config.get('vertical_fov', 90),
            device_idx=device_idx,
            render_to_tensor=render_to_tensor,
            auto_sync=False)
        self.simulator_loop = int(self.action_timestep /
                                  self.simulator.timestep)
        self.load()
        self.hand_start_pos = [0.05, 1, 1.05]
        self.hand_start_orn = p.getQuaternionFromEuler([-np.pi / 2, 0, np.pi])
        self.set_robot_pos_orn(self.robots[0], self.hand_start_pos,
                               self.hand_start_orn)

        # load drawer
        self.drawer_start_pos = [0, 2.2, 1]
        self.drawer_start_orn = p.getQuaternionFromEuler([0, 0, -np.pi / 2])
        self.handle_idx = 3
        self.drawer = InteractiveObj(
            os.path.join(gibson2.assets_path, 'models', 'drawer',
                         'drawer_one_sided_handle.urdf'))
        self.import_drawer_handle()
        self.drawer.set_position_orientation(self.drawer_start_pos,
                                             self.drawer_start_orn)
        self.handle_init_pos = p.getLinkState(self.drawer_id,
                                              self.handle_idx)[0][1]
        self.simulator.sync()
        self._state_id = p.saveState()

    """
    modify import_articulated_object() in simulator.py to
    render drawer and drawer handle separately for semantic inforamtion
    """

    def import_drawer_handle(self):
        self.drawer_id = self.drawer.load()

        # render drawer
        class_id = self.simulator.next_class_id
        self.simulator.next_class_id += 1
        visual_objects = []
        link_ids = []
        poses_rot = []
        poses_trans = []
        for shape in p.getVisualShapeData(self.drawer_id):
            id, link_id, type, dimensions, filename, rel_pos, rel_orn, color = shape[:
                                                                                     8]
            link_name = p.getJointInfo(self.drawer_id, link_id)[12]
            if link_name != b'handle_left' and link_name != b'handle_right' and link_name != b'handle_grip':
                filename = os.path.join(gibson2.assets_path,
                                        'models/mjcf_primitives/cube.obj')
                self.simulator.renderer.load_object(filename,
                                                    transform_orn=rel_orn,
                                                    transform_pos=rel_pos,
                                                    input_kd=color[:3],
                                                    scale=np.array(dimensions))
                visual_objects.append(
                    len(self.simulator.renderer.visual_objects) - 1)
                link_ids.append(link_id)
                _, _, _, _, pos, orn = p.getLinkState(id, link_id)
                poses_rot.append(
                    np.ascontiguousarray(quat2rotmat(xyzw2wxyz(orn))))
                poses_trans.append(np.ascontiguousarray(xyz2mat(pos)))
        self.simulator.renderer.add_instance_group(
            object_ids=visual_objects,
            link_ids=link_ids,
            pybullet_uuid=self.drawer_id,
            class_id=class_id,
            poses_rot=poses_rot,
            poses_trans=poses_trans,
            dynamic=True,
            robot=None)

        # render drawer handle
        class_id = self.simulator.next_class_id
        self.simulator.next_class_id += 1
        visual_objects = []
        link_ids = []
        poses_rot = []
        poses_trans = []
        for shape in p.getVisualShapeData(self.drawer_id):
            id, link_id, type, dimensions, filename, rel_pos, rel_orn, color = shape[:
                                                                                     8]
            link_name = p.getJointInfo(self.drawer_id, link_id)[12]
            if link_name == b'handle_left' or link_name == b'handle_right' or link_name == b'handle_grip':
                filename = os.path.join(gibson2.assets_path,
                                        'models/mjcf_primitives/cube.obj')
                self.simulator.renderer.load_object(filename,
                                                    transform_orn=rel_orn,
                                                    transform_pos=rel_pos,
                                                    input_kd=color[:3],
                                                    scale=np.array(dimensions))
                visual_objects.append(
                    len(self.simulator.renderer.visual_objects) - 1)
                link_ids.append(link_id)
                _, _, _, _, pos, orn = p.getLinkState(id, link_id)
                poses_rot.append(
                    np.ascontiguousarray(quat2rotmat(xyzw2wxyz(orn))))
                poses_trans.append(np.ascontiguousarray(xyz2mat(pos)))
        self.simulator.renderer.add_instance_group(
            object_ids=visual_objects,
            link_ids=link_ids,
            pybullet_uuid=self.drawer_id,
            class_id=class_id,
            poses_rot=poses_rot,
            poses_trans=poses_trans,
            dynamic=True,
            robot=None)

    def set_robot_pos_orn(self, robot, pos, orn):
        robot.set_position_orientation(pos, orn)

    def get_drawer_handle_pos(self):
        return np.array(p.getLinkState(self.drawer_id, self.handle_idx)[0])

    # legacy get state from gibson
    def get_state_legacy(self):
        state = OrderedDict()
        if 'rgb' in self.output:
            state['rgb'] = self.get_rgb()
        if 'depth' in self.output:
            state['depth'] = self.get_depth()
        if 'normal' in self.output:
            state['normal'] = self.get_normal()
        if 'seg' in self.output:
            state['seg'] = self.get_seg()
        return state

    def get_state(self):
        state = np.empty((0, self.image_height, self.image_width),
                         dtype=np.uint8)
        if 'depth' in self.output:
            depth = self.get_depth_external()[..., None].transpose(2, 0, 1)
            state = np.concatenate((state, depth), axis=0)
        if 'seg' in self.output:
            seg = self.get_seg_external()[..., None].transpose(2, 0, 1)
            state = np.concatenate((state, seg), axis=0)
        return state.astype(np.uint8)

    def _sigmoids(self, x, value_at_1, sigmoid):
        if sigmoid in ('cosine', 'linear', 'quadratic'):
            if not 0 <= value_at_1 < 1:
                raise ValueError(
                    '`value_at_1` must be nonnegative and smaller than 1, '
                    'got {}.'.format(value_at_1))
        else:
            if not 0 < value_at_1 < 1:
                raise ValueError(
                    '`value_at_1` must be strictly between 0 and 1, '
                    'got {}.'.format(value_at_1))

        if sigmoid == 'gaussian':
            scale = np.sqrt(-2 * np.log(value_at_1))
            return np.exp(-0.5 * (x * scale)**2)

        elif sigmoid == 'hyperbolic':
            scale = np.arccosh(1 / value_at_1)
            return 1 / np.cosh(x * scale)

        elif sigmoid == 'long_tail':
            scale = np.sqrt(1 / value_at_1 - 1)
            return 1 / ((x * scale)**2 + 1)

        elif sigmoid == 'cosine':
            scale = np.arccos(2 * value_at_1 - 1) / np.pi
            scaled_x = x * scale
            return np.where(
                abs(scaled_x) < 1, (1 + np.cos(np.pi * scaled_x)) / 2, 0.0)

        elif sigmoid == 'linear':
            scale = 1 - value_at_1
            scaled_x = x * scale
            return np.where(abs(scaled_x) < 1, 1 - scaled_x, 0.0)

        elif sigmoid == 'quadratic':
            scale = np.sqrt(1 - value_at_1)
            scaled_x = x * scale
            return np.where(abs(scaled_x) < 1, 1 - scaled_x**2, 0.0)

        elif sigmoid == 'tanh_squared':
            scale = np.arctanh(np.sqrt(1 - value_at_1))
            return 1 - np.tanh(x * scale)**2

        else:
            raise ValueError('Unknown sigmoid type {!r}.'.format(sigmoid))

    def is_close_reward(self,
                        x,
                        bounds=(0.0, 0.0),
                        margin=0.0,
                        sigmoid='gaussian',
                        value_at_margin=_DEFAULT_VALUE_AT_MARGIN):
        lower, upper = bounds
        if lower > upper:
            raise ValueError('Lower bound must be <= upper bound.')
        if margin < 0:
            raise ValueError('`margin` must be non-negative.')
        in_bounds = np.logical_and(lower <= x, x <= upper)
        if margin == 0:
            value = np.where(in_bounds, 1.0, 0.0)
        else:
            d = np.where(x < lower, lower - x, x - upper) / margin
            value = np.where(in_bounds, 1.0,
                             self._sigmoids(d, value_at_margin, sigmoid))

        return float(value) if np.isscalar(x) else value

    def get_reward_new(self):
        handle_center = self.get_drawer_handle_pos()
        grip_center = self.robots[0].get_palm_position()
        reach_dist = np.linalg.norm(grip_center - handle_center)
        pull_dist = self.max_pull_dist - (self.handle_init_pos -
                                          handle_center[1])
        close_threshold = 0.05
        reach_reward = -self.reach_reward_factor * reach_dist
        pull_reward = self.is_close_reward(pull_dist, (0, close_threshold),
                                           close_threshold * 2)
        return reach_reward + pull_reward

    def get_reward(self):
        handle_center = self.get_drawer_handle_pos()
        grip_center = self.robots[0].get_palm_position()
        reach_dist = np.linalg.norm(grip_center - handle_center)
        pull_dist = self.handle_init_pos - handle_center[1]
        reach_rew = -self.reach_reward_factor * reach_dist
        if reach_dist < 0.05:
            self.reach_completed = True
        else:
            self.reach_completed = False

        def pull_reward():
            if self.reach_completed:
                pull_rew = self.pull_reward_factor * pull_dist
                return pull_rew
            else:
                return 0

        pull_rew = pull_reward()
        reward = reach_rew + pull_rew
        return reward

    def is_goal_pulled(self):
        epsilon = 0.01
        return (self.handle_init_pos -
                self.get_drawer_handle_pos()[1]) > self.max_pull_dist - epsilon

    def get_termination(self, info={}):
        done = False

        # if self.is_goal_pulled() and self.reach_completed:
        #     done = True
        #     info['success'] = True
        if self.current_step >= self.max_step:
            done = True
            # info['success'] = False

        if done:
            info['episode_length'] = self.current_step

        return done, info

    def get_depth(self):
        """
        :return: depth sensor reading, normalized to [0.0, 1.0]
        """
        depth = -self.simulator.renderer.render_robot_cameras(
            modes=('3d'))[0][:, :, 2:3]
        # 0.0 is a special value for invalid entries
        depth[depth < self.depth_low] = 0.0
        depth[depth > self.depth_high] = 0.0

        # re-scale depth to [0.0, 1.0]
        depth /= self.depth_high
        return depth

    def get_rgb(self):
        """
        :return: RGB sensor reading, normalized to [0.0, 1.0]
        """
        return self.simulator.renderer.render_robot_cameras(
            modes=('rgb'))[0][:, :, :3]

    def get_normal(self):
        """
        :return: surface normal reading
        """
        return self.simulator.renderer.render_robot_cameras(
            modes='normal')[0][:, :, :3]

    def get_seg(self):
        """
        :return: semantic segmentation mask, normalized to [0.0, 1.0]
        """
        seg = self.simulator.renderer.render_robot_cameras(
            modes='seg')[0][:, :, 0:1]
        if self.num_object_classes is not None:
            seg = np.clip(seg * 255.0 / self.num_object_classes, 0.0, 1.0)
        return seg

    def get_depth_external(self):
        self.simulator.renderer.set_camera(
            self.initial_pos, self.initial_pos + self.initial_view_direction,
            self.up)
        depth = -self.simulator.renderer.render(modes=('3d'))[0][:, :, 2:3]
        depth[depth < self.depth_low] = 0.0
        depth[depth > self.depth_high] = 0.0
        depth /= self.depth_high
        return (depth * 255).astype(np.uint8)[:, :, 0]

    def get_seg_external(self):
        self.simulator.renderer.set_camera(
            self.initial_pos, self.initial_pos + self.initial_view_direction,
            self.up)
        seg = self.simulator.renderer.render(modes='seg')[0][:, :, 0:1]
        if self.num_object_classes is not None:
            seg = seg * 255
            # only mask handle
            seg[seg < 3.1] = 0
            seg = np.clip(seg / self.num_object_classes, 0.0, 1.0)
        return (seg * 255).astype(np.uint8)[:, :, 0]

    def get_external_camera(self):
        """
        pybullet external view rendering
        """
        # pybullet external camera position
        self._view_matrix = [
            0.5708255171775818, -0.6403688788414001, 0.5138930082321167, 0.0,
            0.821071445941925, 0.4451974034309387, -0.3572688400745392, 0.0,
            -0.0, 0.6258810758590698, 0.7799185514450073, 0.0,
            -1.0701078176498413, -0.883043646812439, -1.8267910480499268, 1.0
        ]
        self._projection_matrix = [
            0.7499999403953552, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0,
            -1.0000200271606445, -1.0, 0.0, 0.0, -0.02000020071864128, 0.0
        ]
        self._external_width = 1024
        self._external_height = 768

        (_, _, px, _,
         _) = p.getCameraImage(width=self._external_width,
                               height=self._external_height,
                               renderer=p.ER_BULLET_HARDWARE_OPENGL,
                               viewMatrix=self._view_matrix,
                               projectionMatrix=self._projection_matrix)
        rgb_array = np.array(px, dtype=np.uint8)
        rgb_array = np.reshape(
            np.array(px), (self._external_height, self._external_width, -1))
        rgb_array = rgb_array[:, :, :3]
        return rgb_array

    def render(self, mode='rgb_array'):
        self._view_matrix = [
            0.5708255171775818, -0.6403688788414001, 0.5138930082321167, 0.0,
            0.821071445941925, 0.4451974034309387, -0.3572688400745392, 0.0,
            -0.0, 0.6258810758590698, 0.7799185514450073, 0.0,
            -1.0701078176498413, -0.883043646812439, -1.8267910480499268, 1.0
        ]
        self._projection_matrix = [
            0.7499999403953552, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0,
            -1.0000200271606445, -1.0, 0.0, 0.0, -0.02000020071864128, 0.0
        ]
        self._external_width = 1024
        self._external_height = 768

        (_, _, px, _,
         _) = p.getCameraImage(width=self._external_width,
                               height=self._external_height,
                               renderer=p.ER_BULLET_HARDWARE_OPENGL,
                               viewMatrix=self._view_matrix,
                               projectionMatrix=self._projection_matrix)
        rgb_array = np.array(px, dtype=np.uint8)
        rgb_array = np.reshape(
            np.array(px), (self._external_height, self._external_width, -1))
        rgb_array = rgb_array[:, :, :3]
        return rgb_array

    def save_rgb_image(self, path):
        rgb = self.get_rgb()
        Image.fromarray((rgb * 255).astype(np.uint8)).save(path)

    def save_depth_image(self, path):
        depth = self.get_depth()
        Image.fromarray((depth * 255).astype(np.uint8)[:, :, 0]).save(path)

    def save_seg_image(self, path):
        seg = self.get_seg()
        Image.fromarray((seg * 255).astype(np.uint8)[:, :, 0]).save(path)

    def save_normal_image(self, path):
        normal = self.get_normal()
        Image.fromarray((normal * 255).astype(np.uint8)).save(path)

    def save_external_image(self, path):
        external = self.get_external_camera()
        Image.fromarray(external).save(path)

    def save_depth_image_external(self, path):
        depth = self.get_depth_external()
        Image.fromarray(depth).save(path)

    def save_seg_image_external(self, path):
        seg = self.get_seg_external()
        Image.fromarray(seg).save(path)

    def load_task_setup(self):
        self.max_pull_dist = 0.5
        self.reach_reward_factor = 1.0
        self.pull_reward_factor = 1.0
        self.max_step = self.config.get('max_step', 500)
        # interface for drq
        self._max_episode_steps = self.max_step

    # legacy observation space from gibson
    def load_observation_space_legacy(self):
        self.output = self.config['output']
        self.image_width = self.config.get('image_width', 128)
        self.image_height = self.config.get('image_height', 128)
        observation_space = OrderedDict()
        if 'rgb' in self.output:
            self.rgb_space = gym.spaces.Box(low=0.0,
                                            high=1.0,
                                            shape=(self.image_height,
                                                   self.image_width, 3),
                                            dtype=np.float32)
            observation_space['rgb'] = self.rgb_space
        if 'depth' in self.output:
            self.depth_low = self.config.get('depth_low', 0.5)
            self.depth_high = self.config.get('depth_high', 5.0)
            self.depth_space = gym.spaces.Box(low=0.0,
                                              high=1.0,
                                              shape=(self.image_height,
                                                     self.image_width, 1),
                                              dtype=np.float32)
            observation_space['depth'] = self.depth_space
        if 'seg' in self.output:
            self.seg_space = gym.spaces.Box(low=0.0,
                                            high=1.0,
                                            shape=(self.image_height,
                                                   self.image_width, 1),
                                            dtype=np.float32)
            observation_space['seg'] = self.seg_space
        if 'normal' in self.output:
            self.normal_space = gym.spaces.Box(low=0.0,
                                               high=1.0,
                                               shape=(self.image_height,
                                                      self.image_width, 3),
                                               dtype=np.float32)
            observation_space['normal'] = self.normal_space

        self.observation_space = gym.spaces.Dict(observation_space)

    # observation space for drq
    def load_observation_space(self):
        self.output = self.config['output']
        self.image_width = self.config.get('image_width', 128)
        self.image_height = self.config.get('image_height', 128)
        self.depth_low = self.config.get('depth_low', 0.5)
        self.depth_high = self.config.get('depth_high', 5.0)
        channels = 0
        if 'rgb' in self.output: channels += 3
        if 'depth' in self.output: channels += 1
        if 'seg' in self.output: channels += 1
        if 'normal' in self.output: channels += 3
        shape = [channels, self.image_height, self.image_width]
        self.observation_space = gym.spaces.Box(low=0,
                                                high=255,
                                                shape=shape,
                                                dtype=np.uint8)

    def load_action_space(self):
        self.action_space = self.robots[0].action_space

    def load_miscellaneous_variables(self):
        self.current_step = 0
        self.current_episode = 0

    def load(self):
        super(HandDrawerEnv, self).load()
        self.load_task_setup()
        self.load_observation_space()
        self.load_action_space()
        self.load_miscellaneous_variables()

    def reset_variables(self):
        self.current_episode += 1
        self.current_step = 0

    def reset(self):
        p.restoreState(self._state_id)
        self.simulator.sync()
        self.reset_variables()
        return self.get_state()

    def run_simulation(self):
        for _ in range(self.simulator_loop):
            self.simulator_step()
        self.simulator.sync()

    def step(self, action):
        self.current_step += 1
        if action is not None:
            self.robots[0].apply_action(action)
        self.run_simulation()

        state = self.get_state()
        info = {}
        reward = self.get_reward()
        done, info = self.get_termination()

        if done and self.automatic_reset:
            info['last_observation'] = state
            state = self.reset()
        return state, reward, done, info
예제 #2
0
파일: sim.py 프로젝트: hongyunnchen/HMS
class ContainerObjectsEnv(object):
    def __init__(self, show_gui=False):
        # set up our initial configurations
        self.image_height = 480
        self.image_width = 640
        self.camera_height = 0.9
        self.camera_x = 0.0
        self.camera_y = -0.8

        self.objects = {}

        if show_gui:
            self.simulator = Simulator(image_width=self.image_width,
                                       image_height=self.image_height)
        else:
            self.simulator = Simulator(image_width=self.image_width,
                                       image_height=self.image_height,
                                       mode='headless',
                                       timestep=0.001)
        pb.setAdditionalSearchPath(pybullet_data.getDataPath())
        pb.loadURDF('plane.urdf')

        # set up renderer
        self.adjust_camera([self.camera_x, self.camera_y, self.camera_height],
                           [0, 0, 0], [-1, 0, 0])
        self.simulator.renderer.set_light_pos([0.65, 0.0, 10.0])
        self.simulator.renderer.set_fov(53)

    def reset(self, container):
        with suppress_stdout_stderr():
            self.simulator.reload()
            self.container = container
            self.simulator.import_object(container)
            container.set_position([0, 0, container.size[2] / 2.0])
            self.objects = {}

    def adjust_camera(self,
                      camera_eye_position,
                      camera_target_position,
                      camera_up_vector,
                      randomize=False):
        if randomize:
            self.simulator.renderer.set_camera(
                camera_eye_position + np.random.random(3) * 0.1,
                camera_target_position + np.random.random(3) * 0.1,
                camera_up_vector)
        else:
            self.simulator.renderer.set_camera(camera_eye_position,
                                               camera_target_position,
                                               camera_up_vector)

    def __del__(self):
        self.simulator.renderer.release()
        del self.simulator.renderer

    def get_renderer_rgb_depth(self):
        rgb, im3d = self.simulator.renderer.render(modes=('rgb', '3d'))
        depth = im3d[:, :, 2]

        return rgb, -depth

    def get_renderer_rgb(self):
        rgb = self.simulator.renderer.render(modes=('rgb'))[0]
        return rgb

    def get_renderer_depth(self):
        rgb, im3d = self.simulator.renderer.render(modes=('rgb', '3d'))
        depth = im3d[:, :, 2]

        return -depth

    # selected_object should be an object id
    def get_renderer_segmask(self, selected_object_id, with_occlusion=True):
        all_instances = self.simulator.renderer.instances.copy()
        # get unoccluded segmask
        self.simulator.renderer.instances = []
        selected_object = self.get_body(selected_object_id)

        for instance in all_instances:
            if selected_object is not None and isinstance(
                    instance,
                    Instance) and instance.pybullet_uuid == selected_object:
                self.simulator.renderer.instances.append(instance)
            elif isinstance(
                    instance,
                    Instance) and instance.pybullet_uuid == selected_object_id:
                self.simulator.renderer.instances.append(instance)
        target_segmask = np.sum(
            self.simulator.renderer.render(modes=('seg'))[0][:, :, :3], axis=2)

        target_segmask, target_depth = self.simulator.renderer.render(
            modes=('seg', '3d'))
        target_segmask = np.sum(target_segmask[:, :, :3], axis=2)
        target_depth = target_depth[:, :, 2]

        self.simulator.renderer.instances = all_instances
        if not with_occlusion:
            return target_segmask

        all_depth = self.simulator.renderer.render(modes=('3d'))[0][:, :, 2]
        occluded_segmask = np.logical_and(
            np.abs(target_depth - all_depth) < 0.01, target_segmask)

        return occluded_segmask

    def set_camera_point_at(self, position, randomize=False, dist=0.3):
        camera_eye_position = np.asarray(
            [position[0], position[1] - dist, position[2] + 0.1])
        camera_target_position = np.asarray(
            [position[0], position[1], position[2]])
        self.adjust_camera(camera_eye_position,
                           camera_target_position, [0, 0, 1],
                           randomize=randomize)
        self.simulator.sync()

    def get_observation(self,
                        segmak_object_id=None,
                        visualize=False,
                        save=False,
                        demo=False,
                        randomize_camera=False):
        rgb_im, depth_im = self.get_renderer_rgb_depth()
        if segmak_object_id:
            segmask_im = self.get_renderer_segmask(segmak_object_id)

        if visualize:
            plt.imshow(segmask_im)
            plt.title('segmask')
            plt.show()
            plt.close()

            plt.imshow(rgb_im)
            plt.title('rgb')
            plt.show()
            plt.close()

            plt.imshow(depth_im)
            plt.title('depth')
            plt.show()
            plt.close()

        if save:
            save_dir = './rendered_images/'
            save_time = str(time.time())
            plt.imshow(segmask_im)
            plt.title('segmask')
            plt.savefig(save_dir + "segmask_im_" + save_time + '_.png')
            plt.close()

            plt.imshow(rgb_im)
            plt.title('rgb')
            plt.savefig(save_dir + "rgb_im_" + save_time + '_.png')
            plt.close()

            plt.imshow(depth_im)
            plt.title('depth')
            plt.savefig(save_dir + "depth_im_" + save_time + '_.png')
            plt.close()

        if segmak_object_id:
            return rgb_im, depth_im, segmask_im
        return rgb_im, depth_im

    def get_obj_ids(self):
        return list(self.objects.keys())

    def remove_object(self, obj):
        with suppress_stdout_stderr():
            obj_id = obj.body_id
            pb.removeBody(bodyUniqueId=obj_id)
            del self.objects[obj_id]
            self.simulator.sync()

    def add_object(self, obj):
        with suppress_stdout_stderr():
            new_obj_id = self.simulator.import_object(obj)
            self.objects[new_obj_id] = obj
            return new_obj_id

    def get_object(self, body_id):
        return self.get_body(body_id)

    def get_body(self, body_id):
        if body_id in self.objects:
            return self.objects[body_id]
        return None

    def gentle_drop(self, body_id, threshold=0.1):
        start_time = time.time()

        lvel = pb.getBaseVelocity(bodyUniqueId=body_id)[0]
        avel = pb.getBaseVelocity(bodyUniqueId=body_id)[1]
        pos, _ = pb.getBasePositionAndOrientation(body_id)
        while np.linalg.norm(lvel) < threshold:
            pb.stepSimulation()
            lvel = pb.getBaseVelocity(bodyUniqueId=body_id)[0]
            avel = pb.getBaseVelocity(bodyUniqueId=body_id)[1]
        for _ in range(100000):
            if time.time() > start_time + 5:
                return False
            pos, _ = pb.getBasePositionAndOrientation(body_id)
            if pos[2] < 0:
                return False
            for _ in range(10):
                pb.stepSimulation()
            lvel = pb.getBaseVelocity(bodyUniqueId=body_id)[0]
            avel = pb.getBaseVelocity(bodyUniqueId=body_id)[1]
            # return if it's basically stable
            if np.linalg.norm(lvel) < threshold * 0.5 and np.linalg.norm(
                    avel) < threshold:
                return True
            # modify linear velocity if too large, else leave the same
            if np.linalg.norm(lvel) > threshold:
                new_lvel = np.array(lvel) * (threshold / np.linalg.norm(lvel))
            else:
                new_lvel = lvel
            # modify angular velocity if too large, else leave the same
            if np.linalg.norm(avel) > threshold:
                new_avel = np.array(avel) * (threshold / np.linalg.norm(avel))
            else:
                new_avel = avel
            pb.resetBaseVelocity(objectUniqueId=body_id,
                                 angularVelocity=list(new_avel),
                                 linearVelocity=list(new_lvel))

        return True

    def load_container_setup(self, obj_file, container_id=None):
        abs_path = os.path.join(os.getcwd() + '/', obj_file)

        with open(abs_path, 'rb') as file:
            data = pickle.load(file)

        self.add_objects(data, container_id)

    def get_obj_img(self, color_obs, segmask, zoom_factor=1.2, save=False):
        np_any = np.any(segmask)
        if not np_any:
            return None
        rows = np.any(segmask, axis=0)
        cols = np.any(segmask, axis=1)
        rmin, rmax = np.where(rows)[0][[0, -1]]
        cmin, cmax = np.where(cols)[0][[0, -1]]
        rmean = (rmin + rmax) / 2
        cmean = (cmin + cmax) / 2
        rlen = rmax - rmin
        clen = cmax - cmin
        maxlen = max([rlen, clen]) * zoom_factor
        rmin = int((rmean - maxlen / 2))
        rmax = int((rmean + maxlen / 2))
        cmin = int((cmean - maxlen / 2))
        cmax = int((cmean + maxlen / 2))
        obj_color = color_obs[cmin:cmax, rmin:rmax]
        try:
            if save:
                save_dir = './sim_images/'
                plt.imshow(obj_color)
                save_time = str(time.time())
                plt.savefig(save_dir + "im_" + save_time + '_.png')
        except:
            pass
        return obj_color