# CustomEnv.py

# -*- coding: utf-8 -*-
"""
Wrap gym and Carla into common interface
"""
import random
import numpy as np
from carla.client import CarlaClient
from carla.sensor import Camera, Lidar
from carla.settings import CarlaSettings
import config
import utils


class CarlaEnv:
    """Gym-style environment wrapper around a CARLA client connection.

    The environment remembers the previous and the current measurement dicts
    so that the reward can be computed from their difference, and offers
    helpers that map a control to / from a compact integer action id.

    Action id layout (see ``action_discretize`` / ``reverse_action``):
        bits 0-1: gas code -- 0 = full brake, 1 / 2 / 3 = throttle 0.0 / 0.5 / 1.0
        bits 2-9: steering bucket 0..200, i.e. steer -1.00..1.00 in 0.01 steps
    """

    _GAS_BITS = 2                # number of low bits holding the gas code
    _GAS_MASK = 0b11             # selects the gas code
    _STEER_MASK = 0b1111111100   # selects the 8-bit steering bucket
    _STEER_SCALE = 100           # steering buckets per unit of steer
    _THROTTLE_STEP = 0.5         # throttle value represented by one level
    _MAX_THROTTLE_LEVEL = 2      # highest throttle level (throttle == 1.0)

    def __init__(self, target):
        """
        Connect to the CARLA server configured in ``config``.

        :param target: target position (x, y); it is subtracted from a
            length-2 numpy array to compute the remaining distance
        """
        self.carla_client = CarlaClient(
            config.CARLA_HOST_ADDRESS, config.CARLA_HOST_PORT, timeout=100)
        self.carla_client.connect()
        self.target = target
        self._clear_history()

    def _clear_history(self):
        """Forget the images and measurements of the previous / current step."""
        self.pre_image = None
        self.cur_image = None
        self.pre_measurements = None
        self.cur_measurements = None

    def step(self, action):
        """
        Send one control command, read the resulting data and score it.

        :param action: either a dict of control signals, such as
            {'steer':0, 'throttle':0.2}, which is expanded into keyword
            arguments, or a single control object passed to the client as-is
        :return: tuple (cur_measurements, cur_image, reward, done, measurements)
            where cur_measurements is the dict built by extract_measurements,
            cur_image is the second value returned by the client's
            read_data(), and measurements is the raw measurement object
        """
        if isinstance(action, dict):
            self.carla_client.send_control(**action)
            print(action)
        else:
            self.carla_client.send_control(action)

        measurements, self.cur_image = self.carla_client.read_data()
        self.cur_measurements = self.extract_measurements(measurements)
        # Todo: Checkup the reward function with the images
        reward, done = self.cal_reward()
        # The current observation becomes the reference for the next reward.
        self.pre_measurements = self.cur_measurements
        self.pre_image = self.cur_image
        return self.cur_measurements, self.cur_image, reward, done, measurements

    def reset(self):
        """
        Load fresh simulator settings and start a new episode at a random
        player start spot.

        :return: None (the initial observation is not read yet, see TODO)
        """
        settings = CarlaSettings()
        settings.set(
            SynchronousMode=True,
            SendNonPlayerAgentsInfo=True,
            NumberOfVehicles=20,
            NumberOfPedestrians=40,
            WeatherId=random.choice([1, 3, 7, 8, 14]),
            QualityLevel='Epic')

        # CAMERA
        camera0 = Camera('CameraRGB', PostProcessing='SceneFinal')
        # Set image resolution in pixels.
        camera0.set_image_size(800, 600)
        # Set its position relative to the car in meters.
        camera0.set_position(0.30, 0, 1.30)
        settings.add_sensor(camera0)

        # Let's add another camera producing ground-truth depth.
        # camera1 = Camera('CameraDepth', PostProcessing='Depth')
        # camera1.set_image_size(800, 600)
        # camera1.set_position(0.30, 0, 1.30)
        # settings.add_sensor(camera1)

        # LIDAR
        # lidar = Lidar('Lidar32')
        # lidar.set_position(0, 0, 2.50)
        # lidar.set_rotation(0, 0, 0)
        # lidar.set(
        #     Channels=32,
        #     Range=50,
        #     PointsPerSecond=100000,
        #     RotationFrequency=10,
        #     UpperFovLimit=10,
        #     LowerFovLimit=-30)
        # settings.add_sensor(lidar)

        scene = self.carla_client.load_settings(settings)
        self._clear_history()

        # Pick a random starting point for the agent so that training sees
        # varied situations; max(0, ...) keeps randint valid for an empty list.
        number_of_player_starts = len(scene.player_start_spots)
        player_start = random.randint(0, max(0, number_of_player_starts - 1))
        # player_start = 140
        self.carla_client.start_episode(player_start)
        print('Starting new episode at %r, %d...' %
              (scene.map_name, player_start))

        # TODO: read and return status after reset
        return

    def extract_measurements(self, measurements):
        """
        Extract custom measurement data from a carla measurement.

        :param measurements: object exposing ``player_measurements`` and
            ``non_player_agents``
        :return: custom measurement data dict with the keys pos_x, pos_y,
            speed (km/h), col_damage (sum of the three collision values),
            other_lane and offroad (intersection values scaled by 100),
            agents_num and distance (Euclidean distance to self.target)
        """
        p_meas = measurements.player_measurements
        pos_x = p_meas.transform.location.x
        pos_y = p_meas.transform.location.y
        speed = p_meas.forward_speed * 3.6  # m/s -> km/h
        col_cars = p_meas.collision_vehicles
        col_ped = p_meas.collision_pedestrians
        col_other = p_meas.collision_other
        other_lane = 100 * p_meas.intersection_otherlane
        if other_lane:
            print('Intersection into other lane %.2f' % other_lane)
        offroad = 100 * p_meas.intersection_offroad
        if offroad:
            print('offroad %.2f' % offroad)
        agents_num = len(measurements.non_player_agents)
        distance = np.linalg.norm(np.array([pos_x, pos_y]) - self.target)

        return {
            'pos_x': pos_x,
            'pos_y': pos_y,
            'speed': speed,
            'col_damage': col_cars + col_ped + col_other,
            'other_lane': other_lane,
            'offroad': offroad,
            'agents_num': agents_num,
            'distance': distance,
        }

    def cal_reward(self):
        """
        Compute the reward from the change between the previous and the
        current measurements.

        :return: reward, done -- reward is 0.0 when there is no previous
            measurement; done is True once the distance to the target
            drops below 1
        """
        def delta(key):
            return self.cur_measurements[key] - self.pre_measurements[key]

        if self.pre_measurements is None:
            reward = 0.0
        else:
            # Reward acceleration, penalize new collision damage and any
            # increase of the off-road / other-lane intersection.
            reward = 0.05 * delta('speed') - 0.002 * delta('col_damage') \
                   - 2 * delta('offroad') - 2 * delta('other_lane')

        # 1000 * delta('distance') +  ignore the distance for auto-pilot

        # check distance to target
        done = self.cur_measurements['distance'] < 1  # final state arrived or not

        return reward, done

    def action_discretize(self, control):
        """
        Discretize a control and encode it as an integer action id.

        The control object is modified in place so that its steer, throttle
        and brake hold exactly the values that ``reverse_action`` yields for
        the returned id.

        :param control: object with numeric ``steer``, ``throttle`` and
            ``brake`` attributes; out-of-range values are clamped to
            steer [-1, 1] and throttle [0, 1]
        :return: (action_no, control) -- the integer id and the same,
            now discretized, control object
        """
        action = control

        # Steering: 201 buckets of width 0.01. round() is required here:
        # 100 * 0.29 is 28.999999999999996 in binary floating point, so a
        # plain int() would truncate it into bucket 28 instead of 29.
        steer_value = min(1.0, max(-1.0, action.steer))
        steer = int(round(self._STEER_SCALE * steer_value)) + self._STEER_SCALE

        # Throttle level 0, 1 or 2 (0.0, 0.5 or 1.0); clamped so that the
        # gas code always fits into its two bits.
        throttle = int(action.throttle / self._THROTTLE_STEP)
        throttle = min(self._MAX_THROTTLE_LEVEL, max(0, throttle))

        # Brake is binary: engaged only when the pedal value reaches 1.
        brake = 1 if action.brake >= 1 else 0

        if brake:
            # The id has a single code for braking, so no throttle is kept.
            throttle = 0
            gas = 0
        else:
            gas = throttle + 1   # 1, 2, 3

        # map the action combination into a numerical value
        action_no = steer << self._GAS_BITS | gas

        action.steer = (steer - self._STEER_SCALE) / float(self._STEER_SCALE)
        action.throttle = throttle * self._THROTTLE_STEP
        action.brake = brake * 1.0
        return action_no, action

    def reverse_action(self, action_no):
        """
        Map the action number back to the discretized action control.

        :param action_no: integer id produced by action_discretize
        :return: dict with the keys 'steer', 'throttle' and 'brake'
        """
        gas = action_no & self._GAS_MASK
        throttle = 0.0
        brake = 0.0

        if gas:
            throttle = (gas - 1) * self._THROTTLE_STEP
        else:
            # gas code 0 is reserved for full brake
            brake = 1.0

        steer_bucket = (action_no & self._STEER_MASK) >> self._GAS_BITS
        steer = (steer_bucket - self._STEER_SCALE) / float(self._STEER_SCALE)

        return {'steer': steer, 'throttle': throttle, 'brake': brake}

    def close(self):
        """
        Disconnect from the CARLA server.

        :return: None
        """
        self.carla_client.disconnect()