Advanced workshops/reInvent2019-400/customize/deepracer_racetrack_env_lidar_5cars.py [24:1242]:
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
del_path = []
for p in reversed(sys.path):
    if 'python2.7' in p:
        sys.path.remove(p)
        del_path.append(p)
# print(sys.path)
import cv2
for p in del_path:
    sys.path.append(p)
# print(sys.path)

logger = utils.Logger(__name__, logging.INFO).get_logger()
logger.info("*********** ENV from SRC SAHIKA **********************")

# Type of worker
SIMULATION_WORKER = "SIMULATION_WORKER"
SAGEMAKER_TRAINING_WORKER = "SAGEMAKER_TRAINING_WORKER"

node_type = os.environ.get("NODE_TYPE", SIMULATION_WORKER)
if node_type == SIMULATION_WORKER:
    import rospy
    from std_msgs.msg import Float64
    from gazebo_msgs.msg import ModelState
    from gazebo_msgs.srv import GetLinkState, GetModelState, JointRequest, SetModelState, SpawnModel
    from geometry_msgs.msg import Pose
    from scipy.spatial.transform import Rotation
    from rosgraph_msgs.msg import Clock as clock
    from sensor_msgs.msg import Image as sensor_image
    from sensor_msgs.msg import LaserScan
    from shapely.geometry import Point, Polygon
    from shapely.geometry.polygon import LinearRing, LineString
    from deepracer_simulation_environment.srv import GetWaypointSrv, ResetCarSrv
    # from markov.s3_simdata_upload import DeepRacerRacetrackSimTraceData

# Type of job
TRAINING_JOB = 'TRAINING'
EVALUATION_JOB = 'EVALUATION'

# Dimensions of the input training image
TRAINING_IMAGE_SIZE = (160, 120)

# Local offset of the front of the car
RELATIVE_POSITION_OF_FRONT_OF_CAR = [0.14, 0, 0]

# Normalized track distance to move with each reset
# ROUND_ROBIN_ADVANCE_DIST = 0.05

# Reward to give the car when it "crashes"
CRASHED = 1e-8

# Size of the image queue buffer, we want this to be one so that we consume 1 image
# at a time, but may want to change this as we add more algorithms
IMG_QUEUE_BUF_SIZE = 1

# List of required velocity topics, one topic per wheel
VELOCITY_TOPICS = ['/racecar/left_rear_wheel_velocity_controller/command',
                   '/racecar/right_rear_wheel_velocity_controller/command',
                   '/racecar/left_front_wheel_velocity_controller/command',
                   '/racecar/right_front_wheel_velocity_controller/command']

# List of required steering hinges
STEERING_TOPICS = ['/racecar/left_steering_hinge_position_controller/command',
                   '/racecar/right_steering_hinge_position_controller/command']

# List of all effort joints
EFFORT_JOINTS = ['/racecar/left_rear_wheel_joint', '/racecar/right_rear_wheel_joint',
                 '/racecar/left_front_wheel_joint','/racecar/right_front_wheel_joint',
                 '/racecar/left_steering_hinge_joint','/racecar/right_steering_hinge_joint']
# Radius of the wheels of the car in meters
WHEEL_RADIUS = 0.1

# The number of steps to wait before checking if the car is stuck
# This number should corespond to the camera FPS, since it is pacing the
# step rate.
NUM_STEPS_TO_CHECK_STUCK = 15

#Defines to upload SIM_TRACE data in S3
TRAINING_SIMTRACE_DATA_S3_OBJECT_KEY = "sim_inference_logs/TrainingSimTraceData.csv"
EVALUATION_SIMTRACE_DATA_S3_OBJECT_KEY = "sim_inference_logs/EvaluationSimTraceData.csv"
SIMAPP_DATA_UPLOAD_TIME_TO_S3 = 300 #in seconds
simapp_data_upload_timer = None

def simapp_shutdown():
    #This function is called on simapp exit. This is called on:
    #  -robomaker expiry shutdown
    #  -an unexpected exception in the simapp leading to system exit.
    #  -cancel_simulation_job
    #  -simulation data upload timer expiry
    logger.info("deepracer_racetrack_env - Shutdown simapp, close the running processes.")
    stack_trace = traceback.format_exc()
    logger.info ("deepracer_racetrack_env - callstack={}".format(stack_trace))
    # if node_type == SIMULATION_WORKER:
        # simtrace_data = DeepRacerRacetrackSimTraceData.getInstance()
        # simtrace_data.complete_upload_to_s3()

def simapp_data_upload_timer_expiry():
    logger.info("deepracer_racetrack_env - simapp_data_upload timer expired")
    simapp_data_upload_timer.cancel()
    simapp_shutdown()

# class BotCarController(object):
#     def __init__(self, car_id, start_dist, speed, lanes_list_np, change_lane_freq_sec=0):

#         # Wait for ros services
#         rospy.wait_for_service('/gazebo/set_model_state')
#         rospy.wait_for_service('/gazebo/spawn_urdf_model')
#         self.set_model_state = rospy.ServiceProxy('/gazebo/set_model_state', SetModelState)
#         self.spawn_model_client = rospy.ServiceProxy('gazebo/spawn_urdf_model', SpawnModel)

#         # Spawn the new car
#         robot_description = rospy.get_param('robot_description_bot')

#         car_initial_pose = Pose()
#         car_initial_pose.position.x = 0
#         car_initial_pose.position.y = 0
#         car_initial_pose.position.z = 0
#         self.car_name = "racecar_{}".format(car_id)
#         self.car_section = car_id    # car_id should be 1, 2 and 3
#         self.resp = self.spawn_model_client(self.car_name,
#                                             robot_description,
#                                             '/{}'.format(self.car_name),
#                                             car_initial_pose, '')
#         logger.info('Spawn status: {}'.format(self.resp.status_message))

#         # Initialize member data and reset car
#         self.car_speed = speed

#         # Initializing the lane that the bot car runs
#         self.lanes_list_np = lanes_list_np
#         self.lanes_one_hot = np.zeros(len(lanes_list_np), dtype=bool)
#         self.lanes_one_hot[0] = True
#         self.shapely_lane = lanes_list_np[self.lanes_one_hot][0]
#         print('self.shapely_lane.length = ', self.shapely_lane.length)

#         # Change the lanes after certain time
#         self.change_lane_freq_sec = change_lane_freq_sec
#         self.reverse_dir = False

#         self.car_model_state = ModelState()
#         self.reset_sim(start_dist)

#     def reset_sim(self, start_dist):
#         rostime = rospy.get_rostime()
#         self.car_initial_dist = start_dist
#         self.car_initial_time = rostime.secs + 1.e-9*rostime.nsecs
#         self.next_change_lane_time = self.car_initial_time + self.change_lane_freq_sec
#         self.position_bot_car(start_dist)

#     def update_bot_sim(self, sim_time):
#         current_time = sim_time.clock.secs + 1.e-9*sim_time.clock.nsecs
#         seconds_elapsed = current_time - self.car_initial_time
#         traveled_dist = seconds_elapsed * self.car_speed
#         if self.reverse_dir:
#             current_dist = (self.car_initial_dist - traveled_dist) % self.shapely_lane.length
#         else:
#             current_dist = (self.car_initial_dist + traveled_dist) % self.shapely_lane.length

#         # Check for lane change
#         if self.change_lane_freq_sec > 0 and current_time > self.next_change_lane_time:
#             # Get the next lane index
#             tmp_lane_np = np.zeros(len(self.lanes_list_np), dtype=bool)
#             next_lane_idx = (int(np.argwhere(self.lanes_one_hot==True)) + 1) % len(self.lanes_list_np)
#             tmp_lane_np[next_lane_idx] = True
#             self.lanes_one_hot = tmp_lane_np

#             #
#             # Interpolate the x, y point and project on the new lane.
#             # So it does fall behind/move ahead when it changes lane
#             #
#             car_position = self.shapely_lane.interpolate(current_dist)
#             point = Point(car_position.x, car_position.y)

#             # Assigns the next lane that the bot car as to travel
#             self.shapely_lane = self.lanes_list_np[self.lanes_one_hot][0]
#             current_dist = self.shapely_lane.project(point)
#             self.reset_sim(current_dist)
#         else:
#             # Position the car on the lane
#             self.position_bot_car(current_dist)

#     def position_bot_car(self, car_dist):
#         # Set the position of the second car
#         _, next_index = self.find_prev_next_lane_points(car_dist, self.reverse_dir)
#         car_position = self.shapely_lane.interpolate(car_dist)
#         car_yaw = math.atan2(self.shapely_lane.coords[next_index][1] - car_position.y,
#                              self.shapely_lane.coords[next_index][0] - car_position.x)
#         car_quaternion = Rotation.from_euler('zyx', [car_yaw, 0, 0]).as_quat()
#         self.car_model_state.model_name = self.car_name
#         self.car_model_state.pose.position.x = car_position.x
#         self.car_model_state.pose.position.y = car_position.y
#         self.car_model_state.pose.position.z = 0
#         self.car_model_state.pose.orientation.x = car_quaternion[0]
#         self.car_model_state.pose.orientation.y = car_quaternion[1]
#         self.car_model_state.pose.orientation.z = car_quaternion[2]
#         self.car_model_state.pose.orientation.w = car_quaternion[3]
#         self.car_model_state.twist.linear.x = 0
#         self.car_model_state.twist.linear.y = 0
#         self.car_model_state.twist.linear.z = 0
#         self.car_model_state.twist.angular.x = 0
#         self.car_model_state.twist.angular.y = 0
#         self.car_model_state.twist.angular.z = 0
#         self.set_model_state(self.car_model_state)

#     def get_lane_dists(self, lane):
#         return [lane.project(Point(p)) for p in lane.coords[:-1]] + [1.0]
    
#     def find_prev_next_lane_points(self, ndist, reverse_dir):
#         lane_dist = self.get_lane_dists(self.shapely_lane)
#         if reverse_dir:
#             next_index = bisect.bisect_left(lane_dist, ndist) - 1
#             prev_index = next_index + 1
#             if next_index == -1: next_index = len(lane_dist) - 1
#         else:
#             next_index = bisect.bisect_right(lane_dist, ndist)
#             prev_index = next_index - 1
#             if next_index == len(lane_dist): next_index = 0
#         return prev_index, next_index


class BotCarController(object):
    def __init__(self, car_id, is_inner, speed, lanes_list_np, world_name):
        
        if 'base' in world_name:
            self.sec_map = [[[0.1, 2.8], [8.5, 11.8], [15.6]], [[0.1, 2.8], [7.3, 10.6], [13.9]]]    # base
            self.stat_sec = [2]
        elif 'inch' in world_name:
            self.sec_map = [[[0.4, 3.0], [6.2], [11.2, 13.6]], [[0, 2.6], [5.1], [8.9, 11.3]]]    # 36inch
            self.stat_sec = [1]
        elif 'mirror' in world_name:
            self.sec_map = [[[4.9], [9.8, 14.6], [21.1, 23.1]], [[4.3], [8.5, 13.3], [18.5, 20.8]]]    # mirror
            self.stat_sec = [0]
        else:
            self.sec_map = [[[8.1, 9.9], [11.8, 13.7], [18.8, 21.8], [0.8, 0.8], [3.8, 6.1]], 
                            [[6.9, 8.1], [10.2, 11.5], [15.8, 18.6], [0.8, 0.8], [3.2, 5]]]    # 2019
            self.stat_sec = [3]

        # Wait for ros services
        rospy.wait_for_service('/gazebo/set_model_state')
        rospy.wait_for_service('/gazebo/spawn_urdf_model')
        self.set_model_state = rospy.ServiceProxy('/gazebo/set_model_state', SetModelState)
        self.spawn_model_client = rospy.ServiceProxy('gazebo/spawn_urdf_model', SpawnModel)

        # Spawn the new car
        robot_description = rospy.get_param('robot_description_bot')

        car_initial_pose = Pose()
        car_initial_pose.position.x = 0
        car_initial_pose.position.y = 0
        car_initial_pose.position.z = 0
        self.car_name = "racecar_{}".format(car_id)
        self.car_section = car_id - 1    # car_id should be 1, 2 and 3
        self.is_inner = is_inner
        self.resp = self.spawn_model_client(self.car_name,
                                            robot_description,
                                            '/{}'.format(self.car_name),
                                            car_initial_pose, '')
        logger.info('Spawn status: {}'.format(self.resp.status_message))

        # Initialize member data and reset car
        self.car_speed = speed

        # Initializing the lane that the bot car runs
        self.lanes_list_np = lanes_list_np
        self.lanes_one_hot = np.zeros(len(lanes_list_np), dtype=bool)
        if is_inner:
            self.lanes_one_hot[0] = True
            self.shapely_lane = lanes_list_np[self.lanes_one_hot][0]
        else:
            self.lanes_one_hot[1] = True
            self.shapely_lane = lanes_list_np[self.lanes_one_hot][0]

        # Change the lanes after certain time
        self.change_lane_freq_sec = 30 if self.car_section==self.stat_sec else 0
        self.reverse_dir = False

        self.car_model_state = ModelState()
        self.reset_sim(self.sec_map[self.is_inner][self.car_section][0])

    def reset_sim(self, start_dist):
        rostime = rospy.get_rostime()
        self.car_initial_dist = start_dist
        self.car_initial_time = rostime.secs + 1.e-9*rostime.nsecs
        self.next_change_lane_time = self.car_initial_time + self.change_lane_freq_sec
        self.position_bot_car(start_dist)

    def update_bot_sim(self, sim_time):
        current_time = sim_time.clock.secs + 1.e-9*sim_time.clock.nsecs
        seconds_elapsed = current_time - self.car_initial_time
        traveled_dist = seconds_elapsed * self.car_speed
        if self.reverse_dir:
            current_dist = (self.car_initial_dist - traveled_dist) % self.shapely_lane.length
        else:
            current_dist = (self.car_initial_dist + traveled_dist) % self.shapely_lane.length

        
        # Check for lane change and section reset
        if self.car_section == self.stat_sec and current_time > self.next_change_lane_time:
            # Get the next lane index
            tmp_lane_np = np.zeros(len(self.lanes_list_np), dtype=bool)
            next_lane_idx = (int(np.argwhere(self.lanes_one_hot==True)) + 1) % len(self.lanes_list_np)
            tmp_lane_np[next_lane_idx] = True
            self.lanes_one_hot = tmp_lane_np
            self.is_inner = not self.is_inner

            # Assigns the next lane that the bot car as to travel
            self.shapely_lane = self.lanes_list_np[self.lanes_one_hot][0]
            self.reset_sim(self.sec_map[self.is_inner][self.car_section][0])
        elif self.car_section != self.stat_sec and current_dist >= self.sec_map[self.is_inner][self.car_section][1]:
            tmp_lane_np = np.zeros(len(self.lanes_list_np), dtype=bool)
            next_lane_idx = (int(np.argwhere(self.lanes_one_hot==True)) + 1) % len(self.lanes_list_np)
            tmp_lane_np[next_lane_idx] = True
            self.lanes_one_hot = tmp_lane_np
            self.is_inner = not self.is_inner
            
            self.shapely_lane = self.lanes_list_np[self.lanes_one_hot][0]
            self.reset_sim(self.sec_map[self.is_inner][self.car_section][0])
        else:
            # Position the car on the lane
            self.position_bot_car(current_dist)

    def position_bot_car(self, car_dist):
        # Set the position of the second car
        _, next_index = self.find_prev_next_lane_points(car_dist, self.reverse_dir)
        car_position = self.shapely_lane.interpolate(car_dist)
        car_yaw = math.atan2(self.shapely_lane.coords[next_index][1] - car_position.y,
                             self.shapely_lane.coords[next_index][0] - car_position.x)
        car_quaternion = Rotation.from_euler('zyx', [car_yaw, 0, 0]).as_quat()
        self.car_model_state.model_name = self.car_name
        self.car_model_state.pose.position.x = car_position.x
        self.car_model_state.pose.position.y = car_position.y
        self.car_model_state.pose.position.z = 0
        self.car_model_state.pose.orientation.x = car_quaternion[0]
        self.car_model_state.pose.orientation.y = car_quaternion[1]
        self.car_model_state.pose.orientation.z = car_quaternion[2]
        self.car_model_state.pose.orientation.w = car_quaternion[3]
        self.car_model_state.twist.linear.x = 0
        self.car_model_state.twist.linear.y = 0
        self.car_model_state.twist.linear.z = 0
        self.car_model_state.twist.angular.x = 0
        self.car_model_state.twist.angular.y = 0
        self.car_model_state.twist.angular.z = 0
        self.set_model_state(self.car_model_state)

    def get_lane_dists(self, lane):
        return [lane.project(Point(p)) for p in lane.coords[:-1]] + [1.0]
    
    def find_prev_next_lane_points(self, ndist, reverse_dir):
        lane_dist = self.get_lane_dists(self.shapely_lane)
        if reverse_dir:
            next_index = bisect.bisect_left(lane_dist, ndist) - 1
            prev_index = next_index + 1
            if next_index == -1: next_index = len(lane_dist) - 1
        else:
            next_index = bisect.bisect_right(lane_dist, ndist)
            prev_index = next_index - 1
            if next_index == len(lane_dist): next_index = 0
        return prev_index, next_index
    
### Gym Env ###
class DeepRacerRacetrackEnv(gym.Env):

    def __init__(self):

        # Create the observation space
#         self.observation_space = spaces.Box(low=0, high=255,
#                                             shape=(TRAINING_IMAGE_SIZE[1], TRAINING_IMAGE_SIZE[0], 3),
#                                             dtype=np.uint8)
#         self.observation_space = spaces.Dict({
# #                 'left_camera': spaces.Box(low=0, high=255,
# #                                         shape=(TRAINING_IMAGE_SIZE[1], TRAINING_IMAGE_SIZE[0], 3),
# #                                         dtype=np.uint8),
#                 'stereo': spaces.Box(low=0, high=255,
#                                         shape=(TRAINING_IMAGE_SIZE[1], TRAINING_IMAGE_SIZE[0], 2),
#                                         dtype=np.uint8)
#         })
    
        self.observation_space = spaces.Dict({
#                 'left_camera': spaces.Box(low=0, high=255,
#                                         shape=(TRAINING_IMAGE_SIZE[1], TRAINING_IMAGE_SIZE[0], 3),
#                                         dtype=np.uint8),
                'STEREO_CAMERAS': spaces.Box(low=0, high=255,
                                        shape=(TRAINING_IMAGE_SIZE[1], TRAINING_IMAGE_SIZE[0], 2),
                                        dtype=np.uint8),
                'LIDAR': spaces.Box(low=0.15, high=1.0, shape=(64,))
        })
    
        # Create the action space
        self.action_space = spaces.Box(low=np.array([-1, 0]), high=np.array([+1, +1]), dtype=np.float32)

        if node_type == SIMULATION_WORKER:

            # ROS initialization
            rospy.init_node('rl_coach', anonymous=True)

            # wait for required services
            rospy.wait_for_service('/deepracer_simulation_environment/get_waypoints')
            rospy.wait_for_service('/deepracer_simulation_environment/reset_car')
            rospy.wait_for_service('/gazebo/get_model_state')
            rospy.wait_for_service('/gazebo/get_link_state')
            rospy.wait_for_service('/gazebo/clear_joint_forces')
            rospy.wait_for_service('/gazebo/spawn_urdf_model')

            self.get_model_state = rospy.ServiceProxy('/gazebo/get_model_state', GetModelState)
            self.get_link_state = rospy.ServiceProxy('/gazebo/get_link_state', GetLinkState)
            self.clear_forces_client = rospy.ServiceProxy('/gazebo/clear_joint_forces', JointRequest)
            self.reset_car_client = rospy.ServiceProxy('/deepracer_simulation_environment/reset_car', ResetCarSrv)
            get_waypoints_client = rospy.ServiceProxy('/deepracer_simulation_environment/get_waypoints', GetWaypointSrv)

            # Create the publishers for sending speed and steering info to the car
            self.velocity_pub_dict = OrderedDict()
            self.steering_pub_dict = OrderedDict()

            for topic in VELOCITY_TOPICS:
                self.velocity_pub_dict[topic] = rospy.Publisher(topic, Float64, queue_size=1)

            for topic in STEERING_TOPICS:
                self.steering_pub_dict[topic] = rospy.Publisher(topic, Float64, queue_size=1)

            # Read in parameters
            self.world_name = rospy.get_param('WORLD_NAME')
            self.job_type = rospy.get_param('JOB_TYPE')
            self.aws_region = rospy.get_param('AWS_REGION')
            self.metrics_s3_bucket = rospy.get_param('METRICS_S3_BUCKET')
            self.metrics_s3_object_key = rospy.get_param('METRICS_S3_OBJECT_KEY')
            self.metrics = []
            self.simulation_job_arn = 'arn:aws:robomaker:' + self.aws_region + ':' + \
                                      rospy.get_param('ROBOMAKER_SIMULATION_JOB_ACCOUNT_ID') + \
                                      ':simulation-job/' + rospy.get_param('AWS_ROBOMAKER_SIMULATION_JOB_ID')

            # Setup SIM_TRACE_LOG data upload to s3
            # self.setup_simtrace_data_upload_to_s3()

            if self.job_type == TRAINING_JOB:
                from custom_files.customer_reward_function import reward_function
                self.reward_function = reward_function
                self.target_number_of_episodes = rospy.get_param('NUMBER_OF_EPISODES')
                self.target_reward_score = rospy.get_param('TARGET_REWARD_SCORE')
            else:
                from markov.defaults import reward_function
                self.reward_function = reward_function
                self.number_of_trials = 0
                self.target_number_of_trials = rospy.get_param('NUMBER_OF_TRIALS')

            # Request the waypoints
            waypoints = None
            try:
                resp = get_waypoints_client()
                waypoints = np.array(resp.waypoints).reshape(resp.row, resp.col)
            except Exception as ex:
                utils.json_format_logger("Unable to retrieve waypoints: {}".format(ex),
                             **utils.build_system_error_dict(utils.SIMAPP_ENVIRONMENT_EXCEPTION,
                                                             utils.SIMAPP_EVENT_ERROR_CODE_500))

            is_loop = np.all(waypoints[0,:] == waypoints[-1,:])
            if 'inch' in self.world_name:
                coef = 0.5
            else:
                coef = 0.6
            if is_loop:
                self.center_line = LinearRing(waypoints[:,0:2])
                self.inner_border = LinearRing(waypoints[:,2:4])
                self.outer_border = LinearRing(waypoints[:,4:6])
                self.left_lane = LinearRing(waypoints[:, 2:4]*coef + waypoints[:, 0:2]*(1-coef))
                self.right_lane = LinearRing(waypoints[:, 4:6]*coef + waypoints[:, 0:2]*(1-coef))
                self.road_poly = Polygon(self.outer_border, [self.inner_border])
            else:
                self.center_line = LineString(waypoints[:,0:2])
                self.inner_border = LineString(waypoints[:,2:4])
                self.outer_border = LineString(waypoints[:,4:6])
                self.left_lane = LinearRing(waypoints[:, 2:4]*coef + waypoints[:, 0:2]*(1-coef))
                self.right_lane = LinearRing(waypoints[:, 4:6]*coef + waypoints[:, 0:2]*(1-coef))
                self.road_poly = Polygon(np.vstack((self.outer_border, np.flipud(self.inner_border))))
            self.center_dists = [self.center_line.project(Point(p), normalized=True) for p in self.center_line.coords[:-1]] + [1.0]
            self.track_length = self.center_line.length
            
            self.safe_angle = 30
            
            # Queue used to maintain image consumption synchronicity
            self.image_queue_left_camera = queue.Queue(IMG_QUEUE_BUF_SIZE)
            rospy.Subscriber('/racecar/camera/zed/rgb/image_rect_color', sensor_image, self.callback_image_left_camera)
            self.image_queue_right_camera = queue.Queue(IMG_QUEUE_BUF_SIZE)
            rospy.Subscriber('/racecar/camera/zed_right/rgb/image_rect_color_right', sensor_image, self.callback_image_right_camera)
            print(self)

            # Initialize state data
            self.episodes = 0
            self.reverse_dir = False
#             if self.reverse_dir:
#                 self.start_ndist_map = [0.28, 0.5, 0.97]
#             else:
#                 self.start_ndist_map = [0.2, 0.42, 0.78]    # 36inch
# #                 self.start_ndist_map = [0.19, 0.67, 0.87]    # base

            if 'base' in self.world_name:
                self.start_ndist_map = [0.19, 0.67, 0.87]
            elif 'inch' in self.world_name:
                self.start_ndist_map = [0.23, 0.45, 0.93]
            elif 'mirror' in self.world_name:
                self.start_ndist_map = [0.12, 0.34, 0.83]
            else:
                self.start_ndist_map = [0.08, 0.27, 0.41, 0.57, 0.96]
    
            self.start_ndist_index = 0
#             self.start_ndist = 0.0
            self.start_ndist = self.start_ndist_map[0]
            # self.change_start = rospy.get_param('CHANGE_START_POSITION', (self.job_type == TRAINING_JOB))
            self.change_start = bool(rospy.get_param('CHANGE_START_POSITION', True))

            self.alternate_dir = rospy.get_param('ALTERNATE_DRIVING_DIRECTION')
#             if self.job_type == TRAINING_JOB:
#                 self.alternate_dir = True
#             else:
#                 self.alternate_dir = True
            print("Alternate direction is set to:", self.alternate_dir)
            
            self.is_simulation_done = False
            self.steering_angle = 0
            self.speed = 0
            self.action_taken = 0
            self.prev_progress = 0
            self.prev_point = Point(0, 0)
            self.prev_point_2 = Point(0, 0)
            self.next_state = None
            self.reward = None
            self.reward_in_episode = 0
            self.done = False
            self.steps = 0
            self.simulation_start_time = 0
            self.allow_servo_step_signals = False
            self.checkpoint_num = 0
            
            # Creating bot cars
            self.lanes_list_np_inner = np.array([self.left_lane, self.right_lane], dtype=object)
            self.lanes_list_np_outer = np.array([self.right_lane, self.left_lane], dtype=object)
            self.lanes_list_np_center = np.array([self.center_line, self.left_lane], dtype=object)
            self.lanes_list_np = np.array([self.left_lane, self.right_lane], dtype=object)

#             self.bot_cars = [
#                 BotCarController(car_id=1, start_dist=0.1, speed=0, lanes_list_np=self.lanes_list_np_inner, change_lane_freq_sec=0),
#                 BotCarController(car_id=2, start_dist=2.9, speed=0, lanes_list_np=self.lanes_list_np_inner, change_lane_freq_sec=0),
#                 BotCarController(car_id=3, start_dist=7.3, speed=0, lanes_list_np=self.lanes_list_np_inner, change_lane_freq_sec=0),
#                 BotCarController(car_id=4, start_dist=10.8, speed=0, lanes_list_np=self.lanes_list_np_inner, change_lane_freq_sec=0),
#                 BotCarController(car_id=5, start_dist=14, speed=0, lanes_list_np=self.lanes_list_np_inner, change_lane_freq_sec=0)
#             ]
#             # reinvent 36inch
#             # inner_lane: 14.7032; outer_lane: 18.1877; ratio=1.237
#             # forward dir: inner lane: 0-2.6, 5.1, 7.6-11. outer lane: 0.4-3, 6.2, 9.6-13.3
#             # reverse dir: inner lane: 14.2032-1.8, 4.4, 7.3-10.5. outer lane: 0.1-2.5, 5.8, 9.9-12.7
#             # reinvent_base
#             # inner_lane: 16.5382; outer_lane: 18.8032; ratio=1.137
#             # inner lane: 0.1-2.8, 7.3-10.6, 13.9. outer lane: 0.1-2.8, 8.5-11.8, 15.6
            
#             # 36inch
#             self.bot_cars = [
#                 BotCarController(car_id=1, is_inner=True, speed=0.1, lanes_list_np=self.lanes_list_np),
#                 BotCarController(car_id=2, is_inner=False, speed=0, lanes_list_np=self.lanes_list_np),
#                 BotCarController(car_id=3, is_inner=True, speed=0.1, lanes_list_np=self.lanes_list_np)
#             ]
        
            if 'base' in self.world_name:
                # base
                self.bot_cars = [
                    BotCarController(car_id=1, is_inner=True, speed=0.1, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=2, is_inner=False, speed=0.1, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=3, is_inner=True, speed=0, lanes_list_np=self.lanes_list_np, world_name=self.world_name)
                ]
            elif 'inch' in self.world_name:
                # 36inch
                self.bot_cars = [
                    BotCarController(car_id=1, is_inner=True, speed=0.1, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=2, is_inner=False, speed=0, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=3, is_inner=True, speed=0.1, lanes_list_np=self.lanes_list_np, world_name=self.world_name)
                ]
            elif 'mirror' in self.world_name:
                # mirror
                self.bot_cars = [
                    BotCarController(car_id=1, is_inner=True, speed=0, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=2, is_inner=False, speed=0.2, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=3, is_inner=True, speed=0.1, lanes_list_np=self.lanes_list_np, world_name=self.world_name)
                ]
            else:
                # 2019
                self.bot_cars = [
                    BotCarController(car_id=1, is_inner=True, speed=0.08, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=2, is_inner=False, speed=0.1, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=3, is_inner=True, speed=0.1, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=4, is_inner=False, speed=0, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=5, is_inner=True, speed=0.08, lanes_list_np=self.lanes_list_np, world_name=self.world_name)
                ]
            
#             print(self.bot_cars[0].shapely_lane.length)
#             print(self.bot_cars[1].shapely_lane.length)

            self.bot_reset_callback = []
            for bot in self.bot_cars:
                self.bot_reset_callback.append(rospy.Subscriber('/clock', clock, bot.update_bot_sim))
#             for bot in self.bot_cars:
#                 rospy.Subscriber('/clock', clock, bot.update_bot_sim)

    def setup_simtrace_data_upload_to_s3(self):
        if node_type == SIMULATION_WORKER:
            #start timer to upload SIM_TRACE data to s3 when simapp exits
            #There is not enough time to upload data to S3 when robomaker shuts down
            #Set up timer to upload data to S3 300 seconds before the robomaker quits
            # - 300 seocnds is randomly chosen number based on various jobs launched that
            #   provides enough time to upload data to S3
            global simapp_data_upload_timer
            session = boto3.session.Session()
            robomaker_client = session.client('robomaker', region_name=self.aws_region)
            result = robomaker_client.describe_simulation_job(
                job=self.simulation_job_arn
            )
            logger.info("robomaker job description: {}".format(result))
            self.simapp_upload_duration = result['maxJobDurationInSeconds'] - SIMAPP_DATA_UPLOAD_TIME_TO_S3
            start = 0
            if self.job_type == TRAINING_JOB:
                logger.info("simapp training job started_at={}".format(result['lastStartedAt']))
                start = result['lastStartedAt']
                self.simtrace_s3_bucket = rospy.get_param('SAGEMAKER_SHARED_S3_BUCKET')
                self.simtrace_s3_key = os.path.join(rospy.get_param('SAGEMAKER_SHARED_S3_PREFIX'), TRAINING_SIMTRACE_DATA_S3_OBJECT_KEY)
            else:
                logger.info("simapp evaluation job started_at={}".format(result['lastUpdatedAt']))
                start = result['lastUpdatedAt']
                self.simtrace_s3_bucket = rospy.get_param('MODEL_S3_BUCKET')
                self.simtrace_s3_key = os.path.join(rospy.get_param('MODEL_S3_PREFIX'), EVALUATION_SIMTRACE_DATA_S3_OBJECT_KEY)
            end = start + datetime.timedelta(seconds=self.simapp_upload_duration)
            now = datetime.datetime.now(tz=end.tzinfo) # use tzinfo as robomaker
            self.simapp_data_upload_time = (end - now).total_seconds()
            logger.info("simapp job started_at={} now={} end={} upload_data_in={} sec".format(start, now, end, self.simapp_data_upload_time))
            simapp_data_upload_timer = threading.Timer(self.simapp_data_upload_time, simapp_data_upload_timer_expiry)
            simapp_data_upload_timer.daemon = True
            simapp_data_upload_timer.start()
            logger.info("Timer with {} seconds is {}".format(self.simapp_data_upload_time, simapp_data_upload_timer.is_alive()))

            #setup to upload SIM_TRACE_DATA to S3
            self.simtrace_data = DeepRacerRacetrackSimTraceData(self.simtrace_s3_bucket, self.simtrace_s3_key)

    def reset(self):
        if node_type == SAGEMAKER_TRAINING_WORKER:
            return self.observation_space.sample()

        # Simulation is done - so RoboMaker will start to shut down the app.
        # Till RoboMaker shuts down the app, do nothing more else metrics may show unexpected data.
        if (node_type == SIMULATION_WORKER) and self.is_simulation_done:
            while True:
                time.sleep(1)

        self.steering_angle = 0
        self.speed = 0
        self.action_taken = 0
        self.prev_progress = 0
        self.prev_point = Point(0, 0)
        self.prev_point_2 = Point(0, 0)
        self.next_state = None
        self.reward = None
        self.reward_in_episode = 0
        self.done = False
        # Reset the car and record the simulation start time
        if self.allow_servo_step_signals:
            self.send_action(0, 0)

        self.racecar_reset()
        self.steps = 0
        self.simulation_start_time = time.time()
        self.infer_reward_state(0, 0)

        return self.next_state

    def set_next_state(self):
#         # Make sure the first image is the starting image
#         image_data = self.image_queue.get(block=True, timeout=None)
#         # Read the image and resize to get the state
#         image = Image.frombytes('RGB', (image_data.width, image_data.height), image_data.data, 'raw', 'RGB', 0, 1)
#         image = image.resize(TRAINING_IMAGE_SIZE, resample=2)
#         self.next_state = np.array(image)
        
        next_states = {}
        
        data = rospy.wait_for_message('/scan', LaserScan)
        next_states['LIDAR'] = np.array(data.ranges)
        
        # Make sure the first image is the starting image
        image_data = self.image_queue_left_camera.get(block=True, timeout=None)
        # Read the image and resize to get the state
        imgL = Image.frombytes('RGB', (image_data.width, image_data.height), image_data.data, 'raw', 'RGB', 0, 1)
        imgL = imgL.resize(TRAINING_IMAGE_SIZE, resample=2)
#         next_states['left_camera'] = np.array(imgL)
        
        image_data = self.image_queue_right_camera.get(block=True, timeout=None)
        imgR = Image.frombytes('RGB', (image_data.width, image_data.height), image_data.data, 'raw', 'RGB', 0, 1)
        imgR = imgR.resize(TRAINING_IMAGE_SIZE, resample=2)

        imgL = imgL.convert('L')
        imgR = imgR.convert('L')
        imgConcat = np.stack((imgL, imgR), axis=2)
        next_states['STEREO_CAMERAS'] = np.array(imgConcat)

        self.next_state = next_states

    def racecar_reset(self):
        try:
            for joint in EFFORT_JOINTS:
                self.clear_forces_client(joint)
            prev_index, next_index = self.find_prev_next_waypoints(self.start_ndist)
            self.reset_car_client(self.start_ndist, next_index)
            # First clear the queue so that we set the state to the start image
#             _ = self.image_queue.get(block=True, timeout=None)
            _ = self.image_queue_left_camera.get(block=True, timeout=None)
            _ = self.image_queue_right_camera.get(block=True, timeout=None)
            self.set_next_state()

        except Exception as ex:
            utils.json_format_logger("Unable to reset the car: {}".format(ex),
                         **utils.build_system_error_dict(utils.SIMAPP_ENVIRONMENT_EXCEPTION,
                                                         utils.SIMAPP_EVENT_ERROR_CODE_500))

    def set_allow_servo_step_signals(self, allow_servo_step_signals):
        self.allow_servo_step_signals = allow_servo_step_signals

    def step(self, action):
        if node_type == SAGEMAKER_TRAINING_WORKER:
            return self.observation_space.sample(), 0, False, {}

        # Initialize next state, reward, done flag
        self.next_state = None
        self.reward = None
        self.done = False

        # Send this action to Gazebo and increment the step count
        # if self.job_type == EVALUATION_JOB:
        noise_fraction = 0.1
        delta_steering = float(action[0]) * noise_fraction
        self.steering_angle = np.random.uniform(float(action[0])-delta_steering, float(action[0])+delta_steering)
        delta_speed = float(action[1]) * noise_fraction
        self.speed = max(0, np.random.uniform(float(action[1])-delta_speed, float(action[1])+delta_speed))
        # else:
        #     self.steering_angle = float(action[0])
        #     self.speed = float(action[1])

        if self.allow_servo_step_signals:
            self.send_action(self.steering_angle, self.speed)
        self.steps += 1

        # Compute the next state and reward
        self.infer_reward_state(self.steering_angle, self.speed)
        return self.next_state, self.reward, self.done, {}

#     def callback_image(self, data):
#         try:
#             self.image_queue.put_nowait(data)
#         except queue.Full:
#             pass
#         except Exception as ex:
#             utils.json_format_logger("Error retrieving frame from gazebo: {}".format(ex),
#                        **utils.build_system_error_dict(utils.SIMAPP_ENVIRONMENT_EXCEPTION, utils.SIMAPP_EVENT_ERROR_CODE_500))
            
    def callback_image_left_camera(self, data):
        try:
            self.image_queue_left_camera.put_nowait(data)
        except queue.Full:
            pass
        except Exception as ex:
            utils.json_format_logger("Error retrieving frame from gazebo: {}".format(ex),
                       **utils.build_system_error_dict(utils.SIMAPP_ENVIRONMENT_EXCEPTION, utils.SIMAPP_EVENT_ERROR_CODE_500))
            
    def callback_image_right_camera(self, data):
        try:
            self.image_queue_right_camera.put_nowait(data)
        except queue.Full:
            pass
        except Exception as ex:
            utils.json_format_logger("Error retrieving frame from gazebo: {}".format(ex),
                       **utils.build_system_error_dict(utils.SIMAPP_ENVIRONMENT_EXCEPTION, utils.SIMAPP_EVENT_ERROR_CODE_500))

    def send_action(self, steering_angle, speed):
        # Simple v/r to computes the desired rpm
        wheel_rpm = speed/WHEEL_RADIUS

        for _, pub in self.velocity_pub_dict.items():
            pub.publish(wheel_rpm)

        for _, pub in self.steering_pub_dict.items():
            pub.publish(steering_angle)

    def infer_reward_state(self, steering_angle, speed):
        try:
            self.set_next_state()
        except Exception as ex:
            utils.json_format_logger("Unable to retrieve image from queue: {}".format(ex),
                       **utils.build_system_error_dict(utils.SIMAPP_ENVIRONMENT_EXCEPTION, utils.SIMAPP_EVENT_ERROR_CODE_500))

        # Read model state from Gazebo
        model_state = self.get_model_state('racecar', '')
        model_orientation = Rotation.from_quat([
            model_state.pose.orientation.x,
            model_state.pose.orientation.y,
            model_state.pose.orientation.z,
            model_state.pose.orientation.w])
        model_location = np.array([
            model_state.pose.position.x,
            model_state.pose.position.y,
            model_state.pose.position.z]) + \
            model_orientation.apply(RELATIVE_POSITION_OF_FRONT_OF_CAR)
        model_point = Point(model_location[0], model_location[1])
        model_heading = model_orientation.as_euler('zyx')[0]

        # Read the wheel locations from Gazebo
        left_rear_wheel_state = self.get_link_state('racecar::left_rear_wheel', '')
        left_front_wheel_state = self.get_link_state('racecar::left_front_wheel', '')
        right_rear_wheel_state = self.get_link_state('racecar::right_rear_wheel', '')
        right_front_wheel_state = self.get_link_state('racecar::right_front_wheel', '')
        wheel_points = [
            Point(left_rear_wheel_state.link_state.pose.position.x,
                  left_rear_wheel_state.link_state.pose.position.y),
            Point(left_front_wheel_state.link_state.pose.position.x,
                  left_front_wheel_state.link_state.pose.position.y),
            Point(right_rear_wheel_state.link_state.pose.position.x,
                  right_rear_wheel_state.link_state.pose.position.y),
            Point(right_front_wheel_state.link_state.pose.position.x,
                  right_front_wheel_state.link_state.pose.position.y)
        ]

        # Project the current location onto the center line and find nearest points
        current_ndist = self.center_line.project(model_point, normalized=True)
        prev_index, next_index = self.find_prev_next_waypoints(current_ndist)
        distance_from_prev = model_point.distance(Point(self.center_line.coords[prev_index]))
        distance_from_next = model_point.distance(Point(self.center_line.coords[next_index]))
        closest_waypoint_index = (prev_index, next_index)[distance_from_next < distance_from_prev]

        # Compute distance from center and road width
        nearest_point_center = self.center_line.interpolate(current_ndist, normalized=True)
        nearest_point_inner = self.inner_border.interpolate(self.inner_border.project(nearest_point_center))
        nearest_point_outer = self.outer_border.interpolate(self.outer_border.project(nearest_point_center))
        distance_from_center = nearest_point_center.distance(model_point)
        distance_from_inner = nearest_point_inner.distance(model_point)
        distance_from_outer = nearest_point_outer.distance(model_point)
        track_width = nearest_point_inner.distance(nearest_point_outer)
        is_left_of_center = (distance_from_outer < distance_from_inner) if self.reverse_dir \
            else (distance_from_inner < distance_from_outer)
        
        # Compute the distance to the closest bot car
        is_crashed = False
        dist_closest_bot_car = 1e3 # large number
        closest_bot = -1           # index of closest bot car
        for kk in range(len(self.bot_cars)):
            dist_to_bot_car = np.sqrt((model_state.pose.position.x - self.bot_cars[kk].car_model_state.pose.position.x) ** 2
                                      + (model_state.pose.position.y - self.bot_cars[kk].car_model_state.pose.position.y) ** 2)
            if dist_to_bot_car < dist_closest_bot_car:
                dist_closest_bot_car = dist_to_bot_car
                closest_bot = kk
                
#         if self.bot_cars[closest_bot].shapely_lane.length < 16:
#             is_left_lane_bot = False if self.bot_cars[closest_bot].reverse_dir else True
#         else:
#             is_left_lane_bot = True if self.bot_cars[closest_bot].reverse_dir else False
                
        botcar = self.bot_cars[closest_bot].car_model_state
        botcar_orientation = Rotation.from_quat([
            botcar.pose.orientation.x,
            botcar.pose.orientation.y,
            botcar.pose.orientation.z,
            botcar.pose.orientation.w])
        botcar_heading = botcar_orientation.as_euler('zyx')[0]
        
        botcar_location = np.array([
            botcar.pose.position.x,
            botcar.pose.position.y,
            botcar.pose.position.z]) + \
            botcar_orientation.apply(RELATIVE_POSITION_OF_FRONT_OF_CAR)
        botcar_point = Point(botcar_location[0], botcar_location[1])
        botcar_current_ndist = self.center_line.project(botcar_point, normalized=True)
        botcar_prev_index, botcar_next_index = self.find_prev_next_waypoints(botcar_current_ndist)
        
        if next_index <= botcar_next_index:    # corner case: last few waypoints
            flag_model_car_behind = True
        else:
            flag_model_car_behind = False
            
        if flag_model_car_behind:
            behind_car_heading = model_heading * 180.0 / math.pi
            angle_to_front_car = math.atan2(botcar_point.y - model_point.y, botcar_point.x - model_point.x)
            angle_to_front_car = angle_to_front_car * 180.0 / math.pi
        else:
            behind_car_heading = botcar_heading * 180.0 / math.pi
            angle_to_front_car = math.atan2(model_point.y - botcar_point.y, model_point.x - botcar_point.x)
            angle_to_front_car = angle_to_front_car * 180.0 / math.pi
            
        abs_diff = abs(angle_to_front_car - behind_car_heading)
        if abs_diff > 180:
            abs_diff = 360 - abs_diff
            
        if abs_diff < self.safe_angle:
            flag_unsafe = True
        else:
            flag_unsafe = False
        
        if flag_unsafe and flag_model_car_behind and dist_closest_bot_car < 0.4:
            is_crashed = True
        elif flag_unsafe and not flag_model_car_behind and dist_closest_bot_car < 0.3:
            is_crashed = True
        elif not flag_unsafe and dist_closest_bot_car < 0.25:
            is_crashed = True

        # SAHIKA: Quantize the shapely projections to 2 digits
        current_ndist = np.around(current_ndist, decimals=2)
        self.start_ndist = np.around(self.start_ndist, decimals=2)

        # Convert current progress to be [0,100] starting at the initial waypoint
        if self.reverse_dir:
            current_progress = self.start_ndist - current_ndist
        else:
            current_progress = current_ndist - self.start_ndist
        
        # SAHIKA: adding the error margin because due to quantization errors some close points results in negative error
        #if current_progress < 0.0: current_progress = current_progress + 1.0
        if current_progress < 0.0: 
            if abs(current_progress) < 0.011:
                current_progress = 0.0
            else:
                current_progress = current_progress + 1.0
            
        
        current_progress = 100 * current_progress
        
        if current_progress < self.prev_progress:
            # Either: (1) we wrapped around and have finished the track,
            delta1 = current_progress + 100 - self.prev_progress
            # or (2) for some reason the car went backwards (this should be rare)
            delta2 = self.prev_progress - current_progress
            current_progress = (self.prev_progress, 100)[delta1 < delta2]

        # Car is off track if all wheels are outside the borders
        wheel_on_track = [self.road_poly.contains(p) for p in wheel_points]
        all_wheels_on_track = all(wheel_on_track)
        any_wheels_on_track = any(wheel_on_track)
        
        # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
        # SAHIKA 
        # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
        learner_car_position = Point(model_state.pose.position.x, model_state.pose.position.y)
        learner_car_progress = self.center_line.project(learner_car_position)
        learner_car_lane = self.center_line.contains(learner_car_position)
        
        bot_car_progress = list()
        bot_car_lane_match = list()
        for kk in range(len(self.bot_cars)):
            bot_car_position = Point(self.bot_cars[kk].car_model_state.pose.position.x, self.bot_cars[kk].car_model_state.pose.position.y)
            bot_car_progress.append(self.center_line.project(bot_car_position) - learner_car_progress)
            
            bot_car_lane = self.center_line.contains(bot_car_position)
            if learner_car_lane == bot_car_lane:
                bot_car_lane_match.append(True)
            else:
                bot_car_lane_match.append(False)
        # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
        
        bot_car_progress = np.array(bot_car_progress)
        if all(bot_car_progress < 0):
            ahead_bot_index = np.argmin(bot_car_progress)
            ahead_bot_lane_match = bot_car_lane_match[ahead_bot_index]
        else:
            ahead_bot_index = np.where(bot_car_progress > 0, bot_car_progress, np.inf).argmin()
            ahead_bot_lane_match = bot_car_lane_match[ahead_bot_index]
            
        THRESHOLD1, THRESHOLD2 = 5, 50

        is_bot_in_left_camera = False
        _, thr1 = cv2.threshold(self.next_state['STEREO_CAMERAS'][:,:,0], THRESHOLD1, 1, cv2.THRESH_BINARY)
        _, thr2 = cv2.threshold(self.next_state['STEREO_CAMERAS'][:,:,0], THRESHOLD2, 1, cv2.THRESH_BINARY)
        thr = cv2.bitwise_xor(thr1, thr2)
        thr = cv2.convertScaleAbs(thr)
        contours, hierarchy = cv2.findContours(thr, cv2.RETR_TREE, cv2.CHAIN_APPROX_SIMPLE)
        bot_size_in_left_camera = float('nan')
        for c in contours:
            x, y, w, h = cv2.boundingRect(c)
            if w * h > 70:
                is_bot_in_left_camera = True
                bot_size_in_left_camera = w*h
                break
                
        is_bot_in_right_camera = False
        _, thr1 = cv2.threshold(self.next_state['STEREO_CAMERAS'][:,:,1], THRESHOLD1, 1, cv2.THRESH_BINARY)
        _, thr2 = cv2.threshold(self.next_state['STEREO_CAMERAS'][:,:,1], THRESHOLD2, 1, cv2.THRESH_BINARY)
        thr = cv2.bitwise_xor(thr1, thr2)
        thr = cv2.convertScaleAbs(thr)
        contours, hierarchy = cv2.findContours(thr, cv2.RETR_TREE, cv2.CHAIN_APPROX_SIMPLE)
        bot_size_in_right_camera = float('nan')
        for c in contours:
            x, y, w, h = cv2.boundingRect(c)
            if w * h > 70:
                is_bot_in_right_camera = True
                bot_size_in_right_camera = w*h
                break
                
        is_bot_in_camera = is_bot_in_left_camera or is_bot_in_right_camera
        
        # Compute the reward
        reward = 0.0
        if (not is_crashed) and any_wheels_on_track:
            done = False
            params = {
                'all_wheels_on_track': all_wheels_on_track,
                'x': model_point.x,
                'y': model_point.y,
                'heading': model_heading * 180.0 / math.pi,
                'distance_from_center': distance_from_center,
                'progress': current_progress,
                'steps': self.steps,
                'speed': speed,
                'steering_angle': steering_angle * 180.0 / math.pi,
                'track_width': track_width,
                'waypoints': list(self.center_line.coords),
                'closest_waypoints': [prev_index, next_index],
                'is_left_of_center': is_left_of_center,
                'is_reversed': self.reverse_dir,
                'is_crashed': is_crashed,
                'dist_closest_bot': dist_closest_bot_car,
                'flag_unsafe': flag_unsafe,
                'bot_car_progress': bot_car_progress,
                'bot_car_lane_match': ahead_bot_lane_match,
                'is_bot_in_camera': is_bot_in_camera,
                'bot_size_in_left_camera': bot_size_in_left_camera,
                'bot_size_in_right_camera': bot_size_in_right_camera
            }
            try:
                reward = float(self.reward_function(params))
            except Exception as e:
                utils.json_format_logger("Exception {} in customer reward function. Job failed!".format(e),
                                         **utils.build_user_error_dict(utils.SIMAPP_SIMULATION_WORKER_EXCEPTION,
                                                                       utils.SIMAPP_EVENT_ERROR_CODE_400))
                traceback.print_exc()
                utils.simapp_exit_gracefully()
        else:
            done = True
            reward = CRASHED

        # Reset if the car position hasn't changed in the last 2 steps
        prev_pnt_dist = min(model_point.distance(self.prev_point), model_point.distance(self.prev_point_2))

        if prev_pnt_dist <= 0.0001 and self.steps % NUM_STEPS_TO_CHECK_STUCK == 0:
            done = True
            reward = CRASHED  # stuck

        # Simulation jobs are done when progress reaches 100
        if current_progress >= 100:
            done = True
#             reward = 1e3

        # Keep data from the previous step around
        self.prev_point_2 = self.prev_point
        self.prev_point = model_point
        self.prev_progress = current_progress

        # Set the reward and done flag
        self.reward = reward
        self.reward_in_episode += reward
        self.done = done

        # Trace logs to help us debug and visualize the training runs
        # btown TODO: This should be written to S3, not to CWL.
        logger.info('SIM_TRACE_LOG:%d,%d,%.4f,%.4f,%.4f,%.2f,%.2f,%d,%.4f,%s,%s,%.4f,%d,%.2f,%s,%s,%.2f\n' % (
            self.episodes, self.steps, model_location[0], model_location[1], model_heading,
            self.steering_angle,
            self.speed,
            self.action_taken,
            self.reward,
            self.done,
            all_wheels_on_track,
            current_progress,
            closest_waypoint_index,
            self.track_length,
            time.time(),
            is_crashed,
            dist_closest_bot_car))

        #build json record of the reward metrics
        reward_metrics = OrderedDict()
        reward_metrics['episode'] = self.episodes
        reward_metrics['steps'] = self.steps
        reward_metrics['X'] = model_location[0]
        reward_metrics['Y'] = model_location[1]
        reward_metrics['yaw'] = model_heading
        reward_metrics['steer'] = self.steering_angle
        reward_metrics['throttle'] = self.speed
        reward_metrics['action'] = self.action_taken
        reward_metrics['reward'] = self.reward
        reward_metrics['done'] = self.done
        reward_metrics['all_wheels_on_track'] = all_wheels_on_track
        reward_metrics['progress'] = current_progress
        reward_metrics['closest_waypoint'] = closest_waypoint_index
        reward_metrics['track_len'] = self.track_length
        reward_metrics['tstamp'] = time.time()
        # self.simtrace_data.write_simtrace_data(reward_metrics)

        # Terminate this episode when ready
        if done and node_type == SIMULATION_WORKER:
            self.finish_episode(current_progress)

    def find_prev_next_waypoints(self, ndist):
        if self.reverse_dir:
            next_index = bisect.bisect_left(self.center_dists, ndist) - 1
            prev_index = next_index + 1
            if next_index == -1: next_index = len(self.center_dists) - 1
        else:
            next_index = bisect.bisect_right(self.center_dists, ndist)
            prev_index = next_index - 1
            if next_index == len(self.center_dists): next_index = 0
        return prev_index, next_index

    def stop_car(self):
        self.steering_angle = 0
        self.speed = 0
        self.action_taken = 0
        self.send_action(0, 0)
        self.racecar_reset()

    def finish_episode(self, progress):
        # Increment episode count, update start position and direction
        self.episodes += 1            
#         if self.change_start:
#             if self.job_type == TRAINING_JOB:
#                 self.start_ndist = (self.start_ndist + ROUND_ROBIN_ADVANCE_DIST) % 1.0
#             else:
#                 self.start_ndist = (self.start_ndist + 2*ROUND_ROBIN_ADVANCE_DIST) % 1.0
        if self.change_start:
#             if self.checkpoint_num < 20 or progress > 40 or self.job_type == EVALUATION_JOB:
            self.start_ndist_index = (self.start_ndist_index + 1) % len(self.start_ndist_map)
            self.start_ndist = self.start_ndist_map[self.start_ndist_index]
        if self.alternate_dir:
            self.reverse_dir = not self.reverse_dir

        # Reset the car
        self.stop_car()

        # upload SIM_TRACE data to S3
        # self.simtrace_data.upload_to_s3(self.episodes)

        # Update metrics based on job type
        if self.job_type == TRAINING_JOB:
            self.update_training_metrics(progress)
            self.write_metrics_to_s3()
            if self.is_training_done():
                self.cancel_simulation_job()
        elif self.job_type == EVALUATION_JOB:
            self.number_of_trials += 1
            self.update_eval_metrics(progress)
            self.write_metrics_to_s3()

    def set_checkpoint_num(self, current_checkpoint):
        self.checkpoint_num = current_checkpoint

    def update_eval_metrics(self, progress):
        eval_metric = {}
        eval_metric['checkpoint_num'] = self.checkpoint_num
        eval_metric['completion_percentage'] = int(progress)
        eval_metric['metric_time'] = int(round(time.time() * 1000))
        eval_metric['start_time'] = int(round(self.simulation_start_time * 1000))
        eval_metric['elapsed_time_in_milliseconds'] = int(round((time.time() - self.simulation_start_time) * 1000))
        eval_metric['trial'] = int(self.number_of_trials)
        self.metrics.append(eval_metric)

    def update_training_metrics(self, progress):
        training_metric = {}
        training_metric['checkpoint_num'] = self.checkpoint_num
        training_metric['reward_score'] = int(round(self.reward_in_episode))
        training_metric['metric_time'] = int(round(time.time() * 1000))
        training_metric['start_time'] = int(round(self.simulation_start_time * 1000))
        training_metric['elapsed_time_in_milliseconds'] = int(round((time.time() - self.simulation_start_time) * 1000))
        training_metric['episode'] = int(self.episodes)
        training_metric['completion_percentage'] = int(progress)
        self.metrics.append(training_metric)

    def write_metrics_to_s3(self):
        session = boto3.session.Session()
        s3_client = session.client('s3', region_name=self.aws_region)
        metrics_body = json.dumps({'metrics': self.metrics})
        s3_client.put_object(
            Bucket=self.metrics_s3_bucket,
            Key=self.metrics_s3_object_key,
            Body=bytes(metrics_body, encoding='utf-8')
        )

    def is_training_done(self):
        if ((self.target_number_of_episodes > 0) and (self.target_number_of_episodes == self.episodes)) or \
           ((isinstance(self.target_reward_score, (int, float))) and (self.target_reward_score <= self.reward_in_episode)):
            self.is_simulation_done = True
        return self.is_simulation_done

    def cancel_simulation_job(self):
        logger.info ("cancel_simulation_job: make sure to shutdown simapp first")
        simapp_shutdown()

        session = boto3.session.Session()
        robomaker_client = session.client('robomaker', region_name=self.aws_region)
        robomaker_client.cancel_simulation_job(
            job=self.simulation_job_arn
        )

class DeepRacerRacetrackCustomActionSpaceEnv(DeepRacerRacetrackEnv):
    def __init__(self):
        DeepRacerRacetrackEnv.__init__(self)
        try:
            # Try loading the custom model metadata (may or may not be present)
            with open('custom_files/model_metadata.json', 'r') as f:
                model_metadata = json.load(f)
                self.json_actions = model_metadata['action_space']
            logger.info("Loaded action space from file: {}".format(self.json_actions))
        except Exception as ex:
            # Failed to load, fall back on the default action space
            from markov.defaults import model_metadata
            self.json_actions = model_metadata['action_space']
            logger.info("Exception {} on loading custom action space, using default: {}".format(ex, self.json_actions))
        self.action_space = spaces.Discrete(len(self.json_actions))

    def step(self, action):
        self.steering_angle = float(self.json_actions[action]['steering_angle']) * math.pi / 180.0
        self.speed = float(self.json_actions[action]['speed'])
        self.action_taken = action
        return super().step([self.steering_angle, self.speed])
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -


Advanced workshops/reInvent2019-400/src/markov/environments/deepracer_racetrack_env.py [24:1121]:
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
del_path = []
for p in reversed(sys.path):
    if 'python2.7' in p:
        sys.path.remove(p)
        del_path.append(p)
# print(sys.path)
import cv2
for p in del_path:
    sys.path.append(p)
# print(sys.path)

logger = utils.Logger(__name__, logging.INFO).get_logger()
logger.info("*********** ENV from SRC SAHIKA **********************")

# Type of worker
SIMULATION_WORKER = "SIMULATION_WORKER"
SAGEMAKER_TRAINING_WORKER = "SAGEMAKER_TRAINING_WORKER"

node_type = os.environ.get("NODE_TYPE", SIMULATION_WORKER)
if node_type == SIMULATION_WORKER:
    import rospy
    from std_msgs.msg import Float64
    from gazebo_msgs.msg import ModelState
    from gazebo_msgs.srv import GetLinkState, GetModelState, JointRequest, SetModelState, SpawnModel
    from geometry_msgs.msg import Pose
    from scipy.spatial.transform import Rotation
    from rosgraph_msgs.msg import Clock as clock
    from sensor_msgs.msg import Image as sensor_image
    from sensor_msgs.msg import LaserScan
    from shapely.geometry import Point, Polygon
    from shapely.geometry.polygon import LinearRing, LineString
    from deepracer_simulation_environment.srv import GetWaypointSrv, ResetCarSrv
    # from markov.s3_simdata_upload import DeepRacerRacetrackSimTraceData

# Type of job
TRAINING_JOB = 'TRAINING'
EVALUATION_JOB = 'EVALUATION'

# Dimensions of the input training image
TRAINING_IMAGE_SIZE = (160, 120)

# Local offset of the front of the car
RELATIVE_POSITION_OF_FRONT_OF_CAR = [0.14, 0, 0]

# Normalized track distance to move with each reset
# ROUND_ROBIN_ADVANCE_DIST = 0.05

# Reward to give the car when it "crashes"
CRASHED = 1e-8

# Size of the image queue buffer, we want this to be one so that we consume 1 image
# at a time, but may want to change this as we add more algorithms
IMG_QUEUE_BUF_SIZE = 1

# List of required velocity topics, one topic per wheel
VELOCITY_TOPICS = ['/racecar/left_rear_wheel_velocity_controller/command',
                   '/racecar/right_rear_wheel_velocity_controller/command',
                   '/racecar/left_front_wheel_velocity_controller/command',
                   '/racecar/right_front_wheel_velocity_controller/command']

# List of required steering hinges
STEERING_TOPICS = ['/racecar/left_steering_hinge_position_controller/command',
                   '/racecar/right_steering_hinge_position_controller/command']

# List of all effort joints
EFFORT_JOINTS = ['/racecar/left_rear_wheel_joint', '/racecar/right_rear_wheel_joint',
                 '/racecar/left_front_wheel_joint','/racecar/right_front_wheel_joint',
                 '/racecar/left_steering_hinge_joint','/racecar/right_steering_hinge_joint']
# Radius of the wheels of the car in meters
WHEEL_RADIUS = 0.1

# The number of steps to wait before checking if the car is stuck
# This number should corespond to the camera FPS, since it is pacing the
# step rate.
NUM_STEPS_TO_CHECK_STUCK = 15

#Defines to upload SIM_TRACE data in S3
TRAINING_SIMTRACE_DATA_S3_OBJECT_KEY = "sim_inference_logs/TrainingSimTraceData.csv"
EVALUATION_SIMTRACE_DATA_S3_OBJECT_KEY = "sim_inference_logs/EvaluationSimTraceData.csv"
SIMAPP_DATA_UPLOAD_TIME_TO_S3 = 300 #in seconds
simapp_data_upload_timer = None

def simapp_shutdown():
    #This function is called on simapp exit. This is called on:
    #  -robomaker expiry shutdown
    #  -an unexpected exception in the simapp leading to system exit.
    #  -cancel_simulation_job
    #  -simulation data upload timer expiry
    logger.info("deepracer_racetrack_env - Shutdown simapp, close the running processes.")
    stack_trace = traceback.format_exc()
    logger.info ("deepracer_racetrack_env - callstack={}".format(stack_trace))
    # if node_type == SIMULATION_WORKER:
        # simtrace_data = DeepRacerRacetrackSimTraceData.getInstance()
        # simtrace_data.complete_upload_to_s3()

def simapp_data_upload_timer_expiry():
    logger.info("deepracer_racetrack_env - simapp_data_upload timer expired")
    simapp_data_upload_timer.cancel()
    simapp_shutdown()


class BotCarController(object):
    def __init__(self, car_id, is_inner, speed, lanes_list_np, world_name):
        
        if 'base' in world_name:
            self.sec_map = [[[0.1, 2.8], [8.5, 11.8], [15.6]], [[0.1, 2.8], [7.3, 10.6], [13.9]]]    # base
            self.stat_sec = [2]
        elif 'inch' in world_name:
            self.sec_map = [[[0.4, 3.0], [6.2], [11.2, 13.6]], [[0, 2.6], [5.1], [8.9, 11.3]]]    # 36inch
            self.stat_sec = [1]
        elif 'mirror' in world_name:
            self.sec_map = [[[4.9], [9.8, 14.6], [21.1, 23.1]], [[4.3], [8.5, 13.3], [18.5, 20.8]]]    # mirror
            self.stat_sec = [0]
        else:
            self.sec_map = [[[8.1, 9.9], [11.8, 13.7], [18.8, 21.8], [0.8, 0.8], [3.8, 6.1]], 
                            [[6.9, 8.1], [10.2, 11.5], [15.8, 18.6], [0.8, 0.8], [3.2, 5]]]    # 2019
            self.stat_sec = [3]

        # Wait for ros services
        rospy.wait_for_service('/gazebo/set_model_state')
        rospy.wait_for_service('/gazebo/spawn_urdf_model')
        self.set_model_state = rospy.ServiceProxy('/gazebo/set_model_state', SetModelState)
        self.spawn_model_client = rospy.ServiceProxy('gazebo/spawn_urdf_model', SpawnModel)

        # Spawn the new car
        robot_description = rospy.get_param('robot_description_bot')

        car_initial_pose = Pose()
        car_initial_pose.position.x = 0
        car_initial_pose.position.y = 0
        car_initial_pose.position.z = 0
        self.car_name = "racecar_{}".format(car_id)
        self.car_section = car_id - 1    # car_id should be 1, 2 and 3
        self.is_inner = is_inner
        self.resp = self.spawn_model_client(self.car_name,
                                            robot_description,
                                            '/{}'.format(self.car_name),
                                            car_initial_pose, '')
        logger.info('Spawn status: {}'.format(self.resp.status_message))

        # Initialize member data and reset car
        self.car_speed = speed

        # Initializing the lane that the bot car runs
        self.lanes_list_np = lanes_list_np
        self.lanes_one_hot = np.zeros(len(lanes_list_np), dtype=bool)
        if is_inner:
            self.lanes_one_hot[0] = True
            self.shapely_lane = lanes_list_np[self.lanes_one_hot][0]
        else:
            self.lanes_one_hot[1] = True
            self.shapely_lane = lanes_list_np[self.lanes_one_hot][0]

        # Change the lanes after certain time
        self.change_lane_freq_sec = 30 if self.car_section==self.stat_sec else 0
        self.reverse_dir = False

        self.car_model_state = ModelState()
        self.reset_sim(self.sec_map[self.is_inner][self.car_section][0])

    def reset_sim(self, start_dist):
        rostime = rospy.get_rostime()
        self.car_initial_dist = start_dist
        self.car_initial_time = rostime.secs + 1.e-9*rostime.nsecs
        self.next_change_lane_time = self.car_initial_time + self.change_lane_freq_sec
        self.position_bot_car(start_dist)

    def update_bot_sim(self, sim_time):
        current_time = sim_time.clock.secs + 1.e-9*sim_time.clock.nsecs
        seconds_elapsed = current_time - self.car_initial_time
        traveled_dist = seconds_elapsed * self.car_speed
        if self.reverse_dir:
            current_dist = (self.car_initial_dist - traveled_dist) % self.shapely_lane.length
        else:
            current_dist = (self.car_initial_dist + traveled_dist) % self.shapely_lane.length

        
        # Check for lane change and section reset
        if self.car_section == self.stat_sec and current_time > self.next_change_lane_time:
            # Get the next lane index
            tmp_lane_np = np.zeros(len(self.lanes_list_np), dtype=bool)
            next_lane_idx = (int(np.argwhere(self.lanes_one_hot==True)) + 1) % len(self.lanes_list_np)
            tmp_lane_np[next_lane_idx] = True
            self.lanes_one_hot = tmp_lane_np
            self.is_inner = not self.is_inner

            # Assigns the next lane that the bot car as to travel
            self.shapely_lane = self.lanes_list_np[self.lanes_one_hot][0]
            self.reset_sim(self.sec_map[self.is_inner][self.car_section][0])
        elif self.car_section != self.stat_sec and current_dist >= self.sec_map[self.is_inner][self.car_section][1]:
            tmp_lane_np = np.zeros(len(self.lanes_list_np), dtype=bool)
            next_lane_idx = (int(np.argwhere(self.lanes_one_hot==True)) + 1) % len(self.lanes_list_np)
            tmp_lane_np[next_lane_idx] = True
            self.lanes_one_hot = tmp_lane_np
            self.is_inner = not self.is_inner
            
            self.shapely_lane = self.lanes_list_np[self.lanes_one_hot][0]
            self.reset_sim(self.sec_map[self.is_inner][self.car_section][0])
        else:
            # Position the car on the lane
            self.position_bot_car(current_dist)

    def position_bot_car(self, car_dist):
        # Set the position of the second car
        _, next_index = self.find_prev_next_lane_points(car_dist, self.reverse_dir)
        car_position = self.shapely_lane.interpolate(car_dist)
        car_yaw = math.atan2(self.shapely_lane.coords[next_index][1] - car_position.y,
                             self.shapely_lane.coords[next_index][0] - car_position.x)
        car_quaternion = Rotation.from_euler('zyx', [car_yaw, 0, 0]).as_quat()
        self.car_model_state.model_name = self.car_name
        self.car_model_state.pose.position.x = car_position.x
        self.car_model_state.pose.position.y = car_position.y
        self.car_model_state.pose.position.z = 0
        self.car_model_state.pose.orientation.x = car_quaternion[0]
        self.car_model_state.pose.orientation.y = car_quaternion[1]
        self.car_model_state.pose.orientation.z = car_quaternion[2]
        self.car_model_state.pose.orientation.w = car_quaternion[3]
        self.car_model_state.twist.linear.x = 0
        self.car_model_state.twist.linear.y = 0
        self.car_model_state.twist.linear.z = 0
        self.car_model_state.twist.angular.x = 0
        self.car_model_state.twist.angular.y = 0
        self.car_model_state.twist.angular.z = 0
        self.set_model_state(self.car_model_state)

    def get_lane_dists(self, lane):
        return [lane.project(Point(p)) for p in lane.coords[:-1]] + [1.0]
    
    def find_prev_next_lane_points(self, ndist, reverse_dir):
        lane_dist = self.get_lane_dists(self.shapely_lane)
        if reverse_dir:
            next_index = bisect.bisect_left(lane_dist, ndist) - 1
            prev_index = next_index + 1
            if next_index == -1: next_index = len(lane_dist) - 1
        else:
            next_index = bisect.bisect_right(lane_dist, ndist)
            prev_index = next_index - 1
            if next_index == len(lane_dist): next_index = 0
        return prev_index, next_index
    
### Gym Env ###
class DeepRacerRacetrackEnv(gym.Env):

    def __init__(self):

        # Create the observation space
#         self.observation_space = spaces.Box(low=0, high=255,
#                                             shape=(TRAINING_IMAGE_SIZE[1], TRAINING_IMAGE_SIZE[0], 3),
#                                             dtype=np.uint8)
#         self.observation_space = spaces.Dict({
# #                 'left_camera': spaces.Box(low=0, high=255,
# #                                         shape=(TRAINING_IMAGE_SIZE[1], TRAINING_IMAGE_SIZE[0], 3),
# #                                         dtype=np.uint8),
#                 'stereo': spaces.Box(low=0, high=255,
#                                         shape=(TRAINING_IMAGE_SIZE[1], TRAINING_IMAGE_SIZE[0], 2),
#                                         dtype=np.uint8)
#         })
    
        self.observation_space = spaces.Dict({
                'STEREO_CAMERAS': spaces.Box(low=0, high=255,
                                        shape=(TRAINING_IMAGE_SIZE[1], TRAINING_IMAGE_SIZE[0], 2),
                                        dtype=np.uint8),
                'LIDAR': spaces.Box(low=0.15, high=1.0, shape=(64,))
        })
    
        # Create the action space
        self.action_space = spaces.Box(low=np.array([-1, 0]), high=np.array([+1, +1]), dtype=np.float32)

        if node_type == SIMULATION_WORKER:

            # ROS initialization
            rospy.init_node('rl_coach', anonymous=True)

            # wait for required services
            rospy.wait_for_service('/deepracer_simulation_environment/get_waypoints')
            rospy.wait_for_service('/deepracer_simulation_environment/reset_car')
            rospy.wait_for_service('/gazebo/get_model_state')
            rospy.wait_for_service('/gazebo/get_link_state')
            rospy.wait_for_service('/gazebo/clear_joint_forces')
            rospy.wait_for_service('/gazebo/spawn_urdf_model')

            self.get_model_state = rospy.ServiceProxy('/gazebo/get_model_state', GetModelState)
            self.get_link_state = rospy.ServiceProxy('/gazebo/get_link_state', GetLinkState)
            self.clear_forces_client = rospy.ServiceProxy('/gazebo/clear_joint_forces', JointRequest)
            self.reset_car_client = rospy.ServiceProxy('/deepracer_simulation_environment/reset_car', ResetCarSrv)
            get_waypoints_client = rospy.ServiceProxy('/deepracer_simulation_environment/get_waypoints', GetWaypointSrv)

            # Create the publishers for sending speed and steering info to the car
            self.velocity_pub_dict = OrderedDict()
            self.steering_pub_dict = OrderedDict()

            for topic in VELOCITY_TOPICS:
                self.velocity_pub_dict[topic] = rospy.Publisher(topic, Float64, queue_size=1)

            for topic in STEERING_TOPICS:
                self.steering_pub_dict[topic] = rospy.Publisher(topic, Float64, queue_size=1)

            # Read in parameters
            self.world_name = rospy.get_param('WORLD_NAME')
            self.job_type = rospy.get_param('JOB_TYPE')
            self.aws_region = rospy.get_param('AWS_REGION')
            self.metrics_s3_bucket = rospy.get_param('METRICS_S3_BUCKET')
            self.metrics_s3_object_key = rospy.get_param('METRICS_S3_OBJECT_KEY')
            self.metrics = []
            self.simulation_job_arn = 'arn:aws:robomaker:' + self.aws_region + ':' + \
                                      rospy.get_param('ROBOMAKER_SIMULATION_JOB_ACCOUNT_ID') + \
                                      ':simulation-job/' + rospy.get_param('AWS_ROBOMAKER_SIMULATION_JOB_ID')

            # Setup SIM_TRACE_LOG data upload to s3
            # self.setup_simtrace_data_upload_to_s3()

            if self.job_type == TRAINING_JOB:
                from custom_files.customer_reward_function import reward_function
                self.reward_function = reward_function
                self.target_number_of_episodes = rospy.get_param('NUMBER_OF_EPISODES')
                self.target_reward_score = rospy.get_param('TARGET_REWARD_SCORE')
            else:
                from markov.defaults import reward_function
                self.reward_function = reward_function
                self.number_of_trials = 0
                self.target_number_of_trials = rospy.get_param('NUMBER_OF_TRIALS')

            # Request the waypoints
            waypoints = None
            try:
                resp = get_waypoints_client()
                waypoints = np.array(resp.waypoints).reshape(resp.row, resp.col)
            except Exception as ex:
                utils.json_format_logger("Unable to retrieve waypoints: {}".format(ex),
                             **utils.build_system_error_dict(utils.SIMAPP_ENVIRONMENT_EXCEPTION,
                                                             utils.SIMAPP_EVENT_ERROR_CODE_500))

            is_loop = np.all(waypoints[0,:] == waypoints[-1,:])
            if 'inch' in self.world_name:
                coef = 0.5
            else:
                coef = 0.6
            if is_loop:
                self.center_line = LinearRing(waypoints[:,0:2])
                self.inner_border = LinearRing(waypoints[:,2:4])
                self.outer_border = LinearRing(waypoints[:,4:6])
                self.left_lane = LinearRing(waypoints[:, 2:4]*coef + waypoints[:, 0:2]*(1-coef))
                self.right_lane = LinearRing(waypoints[:, 4:6]*coef + waypoints[:, 0:2]*(1-coef))
                self.road_poly = Polygon(self.outer_border, [self.inner_border])
            else:
                self.center_line = LineString(waypoints[:,0:2])
                self.inner_border = LineString(waypoints[:,2:4])
                self.outer_border = LineString(waypoints[:,4:6])
                self.left_lane = LinearRing(waypoints[:, 2:4]*coef + waypoints[:, 0:2]*(1-coef))
                self.right_lane = LinearRing(waypoints[:, 4:6]*coef + waypoints[:, 0:2]*(1-coef))
                self.road_poly = Polygon(np.vstack((self.outer_border, np.flipud(self.inner_border))))
            self.center_dists = [self.center_line.project(Point(p), normalized=True) for p in self.center_line.coords[:-1]] + [1.0]
            self.track_length = self.center_line.length
            
            self.safe_angle = 30
            
            # Queue used to maintain image consumption synchronicity
            self.image_queue_left_camera = queue.Queue(IMG_QUEUE_BUF_SIZE)
            rospy.Subscriber('/racecar/camera/zed/rgb/image_rect_color', sensor_image, self.callback_image_left_camera)
            self.image_queue_right_camera = queue.Queue(IMG_QUEUE_BUF_SIZE)
            rospy.Subscriber('/racecar/camera/zed_right/rgb/image_rect_color_right', sensor_image, self.callback_image_right_camera)
            print(self)

            # Initialize state data
            self.episodes = 0
            self.reverse_dir = False
#             if self.reverse_dir:
#                 self.start_ndist_map = [0.28, 0.5, 0.97]
#             else:
#                 self.start_ndist_map = [0.2, 0.42, 0.78]    # 36inch
# #                 self.start_ndist_map = [0.19, 0.67, 0.87]    # base

            if 'base' in self.world_name:
                self.start_ndist_map = [0.19, 0.67, 0.87]
            elif 'inch' in self.world_name:
                self.start_ndist_map = [0.23, 0.45, 0.93]
            elif 'mirror' in self.world_name:
                self.start_ndist_map = [0.12, 0.34, 0.83]
            else:
                self.start_ndist_map = [0.08, 0.27, 0.41, 0.57, 0.96]
    
            self.start_ndist_index = 0
#             self.start_ndist = 0.0
            self.start_ndist = self.start_ndist_map[0]
            # self.change_start = rospy.get_param('CHANGE_START_POSITION', (self.job_type == TRAINING_JOB))
            self.change_start = bool(rospy.get_param('CHANGE_START_POSITION', True))

            self.alternate_dir = rospy.get_param('ALTERNATE_DRIVING_DIRECTION')
#             if self.job_type == TRAINING_JOB:
#                 self.alternate_dir = True
#             else:
#                 self.alternate_dir = True
            print("Alternate direction is set to:", self.alternate_dir)
            
            self.is_simulation_done = False
            self.steering_angle = 0
            self.speed = 0
            self.action_taken = 0
            self.prev_progress = 0
            self.prev_point = Point(0, 0)
            self.prev_point_2 = Point(0, 0)
            self.next_state = None
            self.reward = None
            self.reward_in_episode = 0
            self.done = False
            self.steps = 0
            self.simulation_start_time = 0
            self.allow_servo_step_signals = False
            self.checkpoint_num = 0
            
            # Creating bot cars
            self.lanes_list_np_inner = np.array([self.left_lane, self.right_lane], dtype=object)
            self.lanes_list_np_outer = np.array([self.right_lane, self.left_lane], dtype=object)
            self.lanes_list_np_center = np.array([self.center_line, self.left_lane], dtype=object)
            self.lanes_list_np = np.array([self.left_lane, self.right_lane], dtype=object)

#             self.bot_cars = [
#                 BotCarController(car_id=1, start_dist=0.1, speed=0, lanes_list_np=self.lanes_list_np_inner, change_lane_freq_sec=0),
#                 BotCarController(car_id=2, start_dist=2.9, speed=0, lanes_list_np=self.lanes_list_np_inner, change_lane_freq_sec=0),
#                 BotCarController(car_id=3, start_dist=7.3, speed=0, lanes_list_np=self.lanes_list_np_inner, change_lane_freq_sec=0),
#                 BotCarController(car_id=4, start_dist=10.8, speed=0, lanes_list_np=self.lanes_list_np_inner, change_lane_freq_sec=0),
#                 BotCarController(car_id=5, start_dist=14, speed=0, lanes_list_np=self.lanes_list_np_inner, change_lane_freq_sec=0)
#             ]
#             # reinvent 36inch
#             # inner_lane: 14.7032; outer_lane: 18.1877; ratio=1.237
#             # forward dir: inner lane: 0-2.6, 5.1, 7.6-11. outer lane: 0.4-3, 6.2, 9.6-13.3
#             # reverse dir: inner lane: 14.2032-1.8, 4.4, 7.3-10.5. outer lane: 0.1-2.5, 5.8, 9.9-12.7
#             # reinvent_base
#             # inner_lane: 16.5382; outer_lane: 18.8032; ratio=1.137
#             # inner lane: 0.1-2.8, 7.3-10.6, 13.9. outer lane: 0.1-2.8, 8.5-11.8, 15.6
            
#             # 36inch
#             self.bot_cars = [
#                 BotCarController(car_id=1, is_inner=True, speed=0.1, lanes_list_np=self.lanes_list_np),
#                 BotCarController(car_id=2, is_inner=False, speed=0, lanes_list_np=self.lanes_list_np),
#                 BotCarController(car_id=3, is_inner=True, speed=0.1, lanes_list_np=self.lanes_list_np)
#             ]
        
            if 'base' in self.world_name:
                # base
                self.bot_cars = [
                    BotCarController(car_id=1, is_inner=True, speed=0.1, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=2, is_inner=False, speed=0.1, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=3, is_inner=True, speed=0, lanes_list_np=self.lanes_list_np, world_name=self.world_name)
                ]
            elif 'inch' in self.world_name:
                # 36inch
                self.bot_cars = [
                    BotCarController(car_id=1, is_inner=True, speed=0.1, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=2, is_inner=False, speed=0, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=3, is_inner=True, speed=0.1, lanes_list_np=self.lanes_list_np, world_name=self.world_name)
                ]
            elif 'mirror' in self.world_name:
                # mirror
                self.bot_cars = [
                    BotCarController(car_id=1, is_inner=True, speed=0, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=2, is_inner=False, speed=0.2, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=3, is_inner=True, speed=0.1, lanes_list_np=self.lanes_list_np, world_name=self.world_name)
                ]
            else:
                # 2019
                self.bot_cars = [
                    BotCarController(car_id=1, is_inner=True, speed=0.08, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=2, is_inner=False, speed=0.1, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=3, is_inner=True, speed=0.1, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=4, is_inner=False, speed=0, lanes_list_np=self.lanes_list_np, world_name=self.world_name),
                    BotCarController(car_id=5, is_inner=True, speed=0.08, lanes_list_np=self.lanes_list_np, world_name=self.world_name)
                ]
            
#             print(self.bot_cars[0].shapely_lane.length)
#             print(self.bot_cars[1].shapely_lane.length)

            self.bot_reset_callback = []
            for bot in self.bot_cars:
                self.bot_reset_callback.append(rospy.Subscriber('/clock', clock, bot.update_bot_sim))
#             for bot in self.bot_cars:
#                 rospy.Subscriber('/clock', clock, bot.update_bot_sim)

    def setup_simtrace_data_upload_to_s3(self):
        if node_type == SIMULATION_WORKER:
            #start timer to upload SIM_TRACE data to s3 when simapp exits
            #There is not enough time to upload data to S3 when robomaker shuts down
            #Set up timer to upload data to S3 300 seconds before the robomaker quits
            # - 300 seocnds is randomly chosen number based on various jobs launched that
            #   provides enough time to upload data to S3
            global simapp_data_upload_timer
            session = boto3.session.Session()
            robomaker_client = session.client('robomaker', region_name=self.aws_region)
            result = robomaker_client.describe_simulation_job(
                job=self.simulation_job_arn
            )
            logger.info("robomaker job description: {}".format(result))
            self.simapp_upload_duration = result['maxJobDurationInSeconds'] - SIMAPP_DATA_UPLOAD_TIME_TO_S3
            start = 0
            if self.job_type == TRAINING_JOB:
                logger.info("simapp training job started_at={}".format(result['lastStartedAt']))
                start = result['lastStartedAt']
                self.simtrace_s3_bucket = rospy.get_param('SAGEMAKER_SHARED_S3_BUCKET')
                self.simtrace_s3_key = os.path.join(rospy.get_param('SAGEMAKER_SHARED_S3_PREFIX'), TRAINING_SIMTRACE_DATA_S3_OBJECT_KEY)
            else:
                logger.info("simapp evaluation job started_at={}".format(result['lastUpdatedAt']))
                start = result['lastUpdatedAt']
                self.simtrace_s3_bucket = rospy.get_param('MODEL_S3_BUCKET')
                self.simtrace_s3_key = os.path.join(rospy.get_param('MODEL_S3_PREFIX'), EVALUATION_SIMTRACE_DATA_S3_OBJECT_KEY)
            end = start + datetime.timedelta(seconds=self.simapp_upload_duration)
            now = datetime.datetime.now(tz=end.tzinfo) # use tzinfo as robomaker
            self.simapp_data_upload_time = (end - now).total_seconds()
            logger.info("simapp job started_at={} now={} end={} upload_data_in={} sec".format(start, now, end, self.simapp_data_upload_time))
            simapp_data_upload_timer = threading.Timer(self.simapp_data_upload_time, simapp_data_upload_timer_expiry)
            simapp_data_upload_timer.daemon = True
            simapp_data_upload_timer.start()
            logger.info("Timer with {} seconds is {}".format(self.simapp_data_upload_time, simapp_data_upload_timer.is_alive()))

            #setup to upload SIM_TRACE_DATA to S3
            self.simtrace_data = DeepRacerRacetrackSimTraceData(self.simtrace_s3_bucket, self.simtrace_s3_key)

    def reset(self):
        if node_type == SAGEMAKER_TRAINING_WORKER:
            return self.observation_space.sample()

        # Simulation is done - so RoboMaker will start to shut down the app.
        # Till RoboMaker shuts down the app, do nothing more else metrics may show unexpected data.
        if (node_type == SIMULATION_WORKER) and self.is_simulation_done:
            while True:
                time.sleep(1)

        self.steering_angle = 0
        self.speed = 0
        self.action_taken = 0
        self.prev_progress = 0
        self.prev_point = Point(0, 0)
        self.prev_point_2 = Point(0, 0)
        self.next_state = None
        self.reward = None
        self.reward_in_episode = 0
        self.done = False
        # Reset the car and record the simulation start time
        if self.allow_servo_step_signals:
            self.send_action(0, 0)

        self.racecar_reset()
        self.steps = 0
        self.simulation_start_time = time.time()
        self.infer_reward_state(0, 0)

        return self.next_state

    def set_next_state(self):
#         # Make sure the first image is the starting image
#         image_data = self.image_queue.get(block=True, timeout=None)
#         # Read the image and resize to get the state
#         image = Image.frombytes('RGB', (image_data.width, image_data.height), image_data.data, 'raw', 'RGB', 0, 1)
#         image = image.resize(TRAINING_IMAGE_SIZE, resample=2)
#         self.next_state = np.array(image)
        
        next_states = {}
        
        data = rospy.wait_for_message('/scan', LaserScan)
        next_states['LIDAR'] = np.array(data.ranges)
        
        # Make sure the first image is the starting image
        image_data = self.image_queue_left_camera.get(block=True, timeout=None)
        # Read the image and resize to get the state
        imgL = Image.frombytes('RGB', (image_data.width, image_data.height), image_data.data, 'raw', 'RGB', 0, 1)
        imgL = imgL.resize(TRAINING_IMAGE_SIZE, resample=2)
#         next_states['left_camera'] = np.array(imgL)
        
        image_data = self.image_queue_right_camera.get(block=True, timeout=None)
        imgR = Image.frombytes('RGB', (image_data.width, image_data.height), image_data.data, 'raw', 'RGB', 0, 1)
        imgR = imgR.resize(TRAINING_IMAGE_SIZE, resample=2)

        imgL = imgL.convert('L')
        imgR = imgR.convert('L')
        imgConcat = np.stack((imgL, imgR), axis=2)
        next_states['STEREO_CAMERAS'] = np.array(imgConcat)

        self.next_state = next_states

    def racecar_reset(self):
        try:
            for joint in EFFORT_JOINTS:
                self.clear_forces_client(joint)
            prev_index, next_index = self.find_prev_next_waypoints(self.start_ndist)
            self.reset_car_client(self.start_ndist, next_index)
            # First clear the queue so that we set the state to the start image
#             _ = self.image_queue.get(block=True, timeout=None)
            _ = self.image_queue_left_camera.get(block=True, timeout=None)
            _ = self.image_queue_right_camera.get(block=True, timeout=None)
            self.set_next_state()

        except Exception as ex:
            utils.json_format_logger("Unable to reset the car: {}".format(ex),
                         **utils.build_system_error_dict(utils.SIMAPP_ENVIRONMENT_EXCEPTION,
                                                         utils.SIMAPP_EVENT_ERROR_CODE_500))

    def set_allow_servo_step_signals(self, allow_servo_step_signals):
        self.allow_servo_step_signals = allow_servo_step_signals

    def step(self, action):
        if node_type == SAGEMAKER_TRAINING_WORKER:
            return self.observation_space.sample(), 0, False, {}

        # Initialize next state, reward, done flag
        self.next_state = None
        self.reward = None
        self.done = False

        # Send this action to Gazebo and increment the step count
        # if self.job_type == EVALUATION_JOB:
        noise_fraction = 0.1
        delta_steering = float(action[0]) * noise_fraction
        self.steering_angle = np.random.uniform(float(action[0])-delta_steering, float(action[0])+delta_steering)
        delta_speed = float(action[1]) * noise_fraction
        self.speed = max(0, np.random.uniform(float(action[1])-delta_speed, float(action[1])+delta_speed))
        # else:
        #     self.steering_angle = float(action[0])
        #     self.speed = float(action[1])

        if self.allow_servo_step_signals:
            self.send_action(self.steering_angle, self.speed)
        self.steps += 1

        # Compute the next state and reward
        self.infer_reward_state(self.steering_angle, self.speed)
        return self.next_state, self.reward, self.done, {}

#     def callback_image(self, data):
#         try:
#             self.image_queue.put_nowait(data)
#         except queue.Full:
#             pass
#         except Exception as ex:
#             utils.json_format_logger("Error retrieving frame from gazebo: {}".format(ex),
#                        **utils.build_system_error_dict(utils.SIMAPP_ENVIRONMENT_EXCEPTION, utils.SIMAPP_EVENT_ERROR_CODE_500))
            
    def callback_image_left_camera(self, data):
        try:
            self.image_queue_left_camera.put_nowait(data)
        except queue.Full:
            pass
        except Exception as ex:
            utils.json_format_logger("Error retrieving frame from gazebo: {}".format(ex),
                       **utils.build_system_error_dict(utils.SIMAPP_ENVIRONMENT_EXCEPTION, utils.SIMAPP_EVENT_ERROR_CODE_500))
            
    def callback_image_right_camera(self, data):
        try:
            self.image_queue_right_camera.put_nowait(data)
        except queue.Full:
            pass
        except Exception as ex:
            utils.json_format_logger("Error retrieving frame from gazebo: {}".format(ex),
                       **utils.build_system_error_dict(utils.SIMAPP_ENVIRONMENT_EXCEPTION, utils.SIMAPP_EVENT_ERROR_CODE_500))

    def send_action(self, steering_angle, speed):
        # Simple v/r to computes the desired rpm
        wheel_rpm = speed/WHEEL_RADIUS

        for _, pub in self.velocity_pub_dict.items():
            pub.publish(wheel_rpm)

        for _, pub in self.steering_pub_dict.items():
            pub.publish(steering_angle)

    def infer_reward_state(self, steering_angle, speed):
        try:
            self.set_next_state()
        except Exception as ex:
            utils.json_format_logger("Unable to retrieve image from queue: {}".format(ex),
                       **utils.build_system_error_dict(utils.SIMAPP_ENVIRONMENT_EXCEPTION, utils.SIMAPP_EVENT_ERROR_CODE_500))

        # Read model state from Gazebo
        model_state = self.get_model_state('racecar', '')
        model_orientation = Rotation.from_quat([
            model_state.pose.orientation.x,
            model_state.pose.orientation.y,
            model_state.pose.orientation.z,
            model_state.pose.orientation.w])
        model_location = np.array([
            model_state.pose.position.x,
            model_state.pose.position.y,
            model_state.pose.position.z]) + \
            model_orientation.apply(RELATIVE_POSITION_OF_FRONT_OF_CAR)
        model_point = Point(model_location[0], model_location[1])
        model_heading = model_orientation.as_euler('zyx')[0]

        # Read the wheel locations from Gazebo
        left_rear_wheel_state = self.get_link_state('racecar::left_rear_wheel', '')
        left_front_wheel_state = self.get_link_state('racecar::left_front_wheel', '')
        right_rear_wheel_state = self.get_link_state('racecar::right_rear_wheel', '')
        right_front_wheel_state = self.get_link_state('racecar::right_front_wheel', '')
        wheel_points = [
            Point(left_rear_wheel_state.link_state.pose.position.x,
                  left_rear_wheel_state.link_state.pose.position.y),
            Point(left_front_wheel_state.link_state.pose.position.x,
                  left_front_wheel_state.link_state.pose.position.y),
            Point(right_rear_wheel_state.link_state.pose.position.x,
                  right_rear_wheel_state.link_state.pose.position.y),
            Point(right_front_wheel_state.link_state.pose.position.x,
                  right_front_wheel_state.link_state.pose.position.y)
        ]

        # Project the current location onto the center line and find nearest points
        current_ndist = self.center_line.project(model_point, normalized=True)
        prev_index, next_index = self.find_prev_next_waypoints(current_ndist)
        distance_from_prev = model_point.distance(Point(self.center_line.coords[prev_index]))
        distance_from_next = model_point.distance(Point(self.center_line.coords[next_index]))
        closest_waypoint_index = (prev_index, next_index)[distance_from_next < distance_from_prev]

        # Compute distance from center and road width
        nearest_point_center = self.center_line.interpolate(current_ndist, normalized=True)
        nearest_point_inner = self.inner_border.interpolate(self.inner_border.project(nearest_point_center))
        nearest_point_outer = self.outer_border.interpolate(self.outer_border.project(nearest_point_center))
        distance_from_center = nearest_point_center.distance(model_point)
        distance_from_inner = nearest_point_inner.distance(model_point)
        distance_from_outer = nearest_point_outer.distance(model_point)
        track_width = nearest_point_inner.distance(nearest_point_outer)
        is_left_of_center = (distance_from_outer < distance_from_inner) if self.reverse_dir \
            else (distance_from_inner < distance_from_outer)
        
        # Compute the distance to the closest bot car
        is_crashed = False
        dist_closest_bot_car = 1e3 # large number
        closest_bot = -1           # index of closest bot car
        for kk in range(len(self.bot_cars)):
            dist_to_bot_car = np.sqrt((model_state.pose.position.x - self.bot_cars[kk].car_model_state.pose.position.x) ** 2
                                      + (model_state.pose.position.y - self.bot_cars[kk].car_model_state.pose.position.y) ** 2)
            if dist_to_bot_car < dist_closest_bot_car:
                dist_closest_bot_car = dist_to_bot_car
                closest_bot = kk
                
#         if self.bot_cars[closest_bot].shapely_lane.length < 16:
#             is_left_lane_bot = False if self.bot_cars[closest_bot].reverse_dir else True
#         else:
#             is_left_lane_bot = True if self.bot_cars[closest_bot].reverse_dir else False
                
        botcar = self.bot_cars[closest_bot].car_model_state
        botcar_orientation = Rotation.from_quat([
            botcar.pose.orientation.x,
            botcar.pose.orientation.y,
            botcar.pose.orientation.z,
            botcar.pose.orientation.w])
        botcar_heading = botcar_orientation.as_euler('zyx')[0]
        
        botcar_location = np.array([
            botcar.pose.position.x,
            botcar.pose.position.y,
            botcar.pose.position.z]) + \
            botcar_orientation.apply(RELATIVE_POSITION_OF_FRONT_OF_CAR)
        botcar_point = Point(botcar_location[0], botcar_location[1])
        botcar_current_ndist = self.center_line.project(botcar_point, normalized=True)
        botcar_prev_index, botcar_next_index = self.find_prev_next_waypoints(botcar_current_ndist)
        
        if next_index <= botcar_next_index:    # corner case: last few waypoints
            flag_model_car_behind = True
        else:
            flag_model_car_behind = False
            
        if flag_model_car_behind:
            behind_car_heading = model_heading * 180.0 / math.pi
            angle_to_front_car = math.atan2(botcar_point.y - model_point.y, botcar_point.x - model_point.x)
            angle_to_front_car = angle_to_front_car * 180.0 / math.pi
        else:
            behind_car_heading = botcar_heading * 180.0 / math.pi
            angle_to_front_car = math.atan2(model_point.y - botcar_point.y, model_point.x - botcar_point.x)
            angle_to_front_car = angle_to_front_car * 180.0 / math.pi
            
        abs_diff = abs(angle_to_front_car - behind_car_heading)
        if abs_diff > 180:
            abs_diff = 360 - abs_diff
            
        if abs_diff < self.safe_angle:
            flag_unsafe = True
        else:
            flag_unsafe = False
        
        if flag_unsafe and flag_model_car_behind and dist_closest_bot_car < 0.4:
            is_crashed = True
        elif flag_unsafe and not flag_model_car_behind and dist_closest_bot_car < 0.3:
            is_crashed = True
        elif not flag_unsafe and dist_closest_bot_car < 0.25:
            is_crashed = True

        # SAHIKA: Quantize the shapely projections to 2 digits
        current_ndist = np.around(current_ndist, decimals=2)
        self.start_ndist = np.around(self.start_ndist, decimals=2)

        # Convert current progress to be [0,100] starting at the initial waypoint
        if self.reverse_dir:
            current_progress = self.start_ndist - current_ndist
        else:
            current_progress = current_ndist - self.start_ndist
        
        # SAHIKA: adding the error margin because due to quantization errors some close points results in negative error
        #if current_progress < 0.0: current_progress = current_progress + 1.0
        if current_progress < 0.0: 
            if abs(current_progress) < 0.011:
                current_progress = 0.0
            else:
                current_progress = current_progress + 1.0
            
        
        current_progress = 100 * current_progress
        
        if current_progress < self.prev_progress:
            # Either: (1) we wrapped around and have finished the track,
            delta1 = current_progress + 100 - self.prev_progress
            # or (2) for some reason the car went backwards (this should be rare)
            delta2 = self.prev_progress - current_progress
            current_progress = (self.prev_progress, 100)[delta1 < delta2]

        # Car is off track if all wheels are outside the borders
        wheel_on_track = [self.road_poly.contains(p) for p in wheel_points]
        all_wheels_on_track = all(wheel_on_track)
        any_wheels_on_track = any(wheel_on_track)
        
        # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
        # SAHIKA 
        # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
        learner_car_position = Point(model_state.pose.position.x, model_state.pose.position.y)
        learner_car_progress = self.center_line.project(learner_car_position)
        learner_car_lane = self.center_line.contains(learner_car_position)
        
        bot_car_progress = list()
        bot_car_lane_match = list()
        for kk in range(len(self.bot_cars)):
            bot_car_position = Point(self.bot_cars[kk].car_model_state.pose.position.x, self.bot_cars[kk].car_model_state.pose.position.y)
            bot_car_progress.append(self.center_line.project(bot_car_position) - learner_car_progress)
            
            bot_car_lane = self.center_line.contains(bot_car_position)
            if learner_car_lane == bot_car_lane:
                bot_car_lane_match.append(True)
            else:
                bot_car_lane_match.append(False)
        # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
        
        bot_car_progress = np.array(bot_car_progress)
        if all(bot_car_progress < 0):
            ahead_bot_index = np.argmin(bot_car_progress)
            ahead_bot_lane_match = bot_car_lane_match[ahead_bot_index]
        else:
            ahead_bot_index = np.where(bot_car_progress > 0, bot_car_progress, np.inf).argmin()
            ahead_bot_lane_match = bot_car_lane_match[ahead_bot_index]
            
        THRESHOLD1, THRESHOLD2 = 5, 50

        is_bot_in_left_camera = False
        _, thr1 = cv2.threshold(self.next_state['STEREO_CAMERAS'][:,:,0], THRESHOLD1, 1, cv2.THRESH_BINARY)
        _, thr2 = cv2.threshold(self.next_state['STEREO_CAMERAS'][:,:,0], THRESHOLD2, 1, cv2.THRESH_BINARY)
        thr = cv2.bitwise_xor(thr1, thr2)
        thr = cv2.convertScaleAbs(thr)
        contours, hierarchy = cv2.findContours(thr, cv2.RETR_TREE, cv2.CHAIN_APPROX_SIMPLE)
        bot_size_in_left_camera = float('nan')
        for c in contours:
            x, y, w, h = cv2.boundingRect(c)
            if w * h > 70:
                is_bot_in_left_camera = True
                bot_size_in_left_camera = w*h
                break
                
        is_bot_in_right_camera = False
        _, thr1 = cv2.threshold(self.next_state['STEREO_CAMERAS'][:,:,1], THRESHOLD1, 1, cv2.THRESH_BINARY)
        _, thr2 = cv2.threshold(self.next_state['STEREO_CAMERAS'][:,:,1], THRESHOLD2, 1, cv2.THRESH_BINARY)
        thr = cv2.bitwise_xor(thr1, thr2)
        thr = cv2.convertScaleAbs(thr)
        contours, hierarchy = cv2.findContours(thr, cv2.RETR_TREE, cv2.CHAIN_APPROX_SIMPLE)
        bot_size_in_right_camera = float('nan')
        for c in contours:
            x, y, w, h = cv2.boundingRect(c)
            if w * h > 70:
                is_bot_in_right_camera = True
                bot_size_in_right_camera = w*h
                break
                
        is_bot_in_camera = is_bot_in_left_camera or is_bot_in_right_camera
        
        # Compute the reward
        reward = 0.0
        if (not is_crashed) and any_wheels_on_track:
            done = False
            params = {
                'all_wheels_on_track': all_wheels_on_track,
                'x': model_point.x,
                'y': model_point.y,
                'heading': model_heading * 180.0 / math.pi,
                'distance_from_center': distance_from_center,
                'progress': current_progress,
                'steps': self.steps,
                'speed': speed,
                'steering_angle': steering_angle * 180.0 / math.pi,
                'track_width': track_width,
                'waypoints': list(self.center_line.coords),
                'closest_waypoints': [prev_index, next_index],
                'is_left_of_center': is_left_of_center,
                'is_reversed': self.reverse_dir,
                'is_crashed': is_crashed,
                'dist_closest_bot': dist_closest_bot_car,
                'flag_unsafe': flag_unsafe,
                'bot_car_progress': bot_car_progress,
                'bot_car_lane_match': ahead_bot_lane_match,
                'is_bot_in_camera': is_bot_in_camera,
                'bot_size_in_left_camera': bot_size_in_left_camera,
                'bot_size_in_right_camera': bot_size_in_right_camera
            }
            try:
                reward = float(self.reward_function(params))
            except Exception as e:
                utils.json_format_logger("Exception {} in customer reward function. Job failed!".format(e),
                                         **utils.build_user_error_dict(utils.SIMAPP_SIMULATION_WORKER_EXCEPTION,
                                                                       utils.SIMAPP_EVENT_ERROR_CODE_400))
                traceback.print_exc()
                utils.simapp_exit_gracefully()
        else:
            done = True
            reward = CRASHED

        # Reset if the car position hasn't changed in the last 2 steps
        prev_pnt_dist = min(model_point.distance(self.prev_point), model_point.distance(self.prev_point_2))

        if prev_pnt_dist <= 0.0001 and self.steps % NUM_STEPS_TO_CHECK_STUCK == 0:
            done = True
            reward = CRASHED  # stuck

        # Simulation jobs are done when progress reaches 100
        if current_progress >= 100:
            done = True
#             reward = 1e3

        # Keep data from the previous step around
        self.prev_point_2 = self.prev_point
        self.prev_point = model_point
        self.prev_progress = current_progress

        # Set the reward and done flag
        self.reward = reward
        self.reward_in_episode += reward
        self.done = done

        # Trace logs to help us debug and visualize the training runs
        # btown TODO: This should be written to S3, not to CWL.
        logger.info('SIM_TRACE_LOG:%d,%d,%.4f,%.4f,%.4f,%.2f,%.2f,%d,%.4f,%s,%s,%.4f,%d,%.2f,%s,%s,%.2f\n' % (
            self.episodes, self.steps, model_location[0], model_location[1], model_heading,
            self.steering_angle,
            self.speed,
            self.action_taken,
            self.reward,
            self.done,
            all_wheels_on_track,
            current_progress,
            closest_waypoint_index,
            self.track_length,
            time.time(),
            is_crashed,
            dist_closest_bot_car))

        #build json record of the reward metrics
        reward_metrics = OrderedDict()
        reward_metrics['episode'] = self.episodes
        reward_metrics['steps'] = self.steps
        reward_metrics['X'] = model_location[0]
        reward_metrics['Y'] = model_location[1]
        reward_metrics['yaw'] = model_heading
        reward_metrics['steer'] = self.steering_angle
        reward_metrics['throttle'] = self.speed
        reward_metrics['action'] = self.action_taken
        reward_metrics['reward'] = self.reward
        reward_metrics['done'] = self.done
        reward_metrics['all_wheels_on_track'] = all_wheels_on_track
        reward_metrics['progress'] = current_progress
        reward_metrics['closest_waypoint'] = closest_waypoint_index
        reward_metrics['track_len'] = self.track_length
        reward_metrics['tstamp'] = time.time()
        # self.simtrace_data.write_simtrace_data(reward_metrics)

        # Terminate this episode when ready
        if done and node_type == SIMULATION_WORKER:
            self.finish_episode(current_progress)

    def find_prev_next_waypoints(self, ndist):
        if self.reverse_dir:
            next_index = bisect.bisect_left(self.center_dists, ndist) - 1
            prev_index = next_index + 1
            if next_index == -1: next_index = len(self.center_dists) - 1
        else:
            next_index = bisect.bisect_right(self.center_dists, ndist)
            prev_index = next_index - 1
            if next_index == len(self.center_dists): next_index = 0
        return prev_index, next_index

    def stop_car(self):
        self.steering_angle = 0
        self.speed = 0
        self.action_taken = 0
        self.send_action(0, 0)
        self.racecar_reset()

    def finish_episode(self, progress):
        # Increment episode count, update start position and direction
        self.episodes += 1            
#         if self.change_start:
#             if self.job_type == TRAINING_JOB:
#                 self.start_ndist = (self.start_ndist + ROUND_ROBIN_ADVANCE_DIST) % 1.0
#             else:
#                 self.start_ndist = (self.start_ndist + 2*ROUND_ROBIN_ADVANCE_DIST) % 1.0
        if self.change_start:
#             if self.checkpoint_num < 20 or progress > 40 or self.job_type == EVALUATION_JOB:
            self.start_ndist_index = (self.start_ndist_index + 1) % len(self.start_ndist_map)
            self.start_ndist = self.start_ndist_map[self.start_ndist_index]
        if self.alternate_dir:
            self.reverse_dir = not self.reverse_dir

        # Reset the car
        self.stop_car()

        # upload SIM_TRACE data to S3
        # self.simtrace_data.upload_to_s3(self.episodes)

        # Update metrics based on job type
        if self.job_type == TRAINING_JOB:
            self.update_training_metrics(progress)
            self.write_metrics_to_s3()
            if self.is_training_done():
                self.cancel_simulation_job()
        elif self.job_type == EVALUATION_JOB:
            self.number_of_trials += 1
            self.update_eval_metrics(progress)
            self.write_metrics_to_s3()

    def set_checkpoint_num(self, current_checkpoint):
        self.checkpoint_num = current_checkpoint

    def update_eval_metrics(self, progress):
        eval_metric = {}
        eval_metric['checkpoint_num'] = self.checkpoint_num
        eval_metric['completion_percentage'] = int(progress)
        eval_metric['metric_time'] = int(round(time.time() * 1000))
        eval_metric['start_time'] = int(round(self.simulation_start_time * 1000))
        eval_metric['elapsed_time_in_milliseconds'] = int(round((time.time() - self.simulation_start_time) * 1000))
        eval_metric['trial'] = int(self.number_of_trials)
        self.metrics.append(eval_metric)

    def update_training_metrics(self, progress):
        training_metric = {}
        training_metric['checkpoint_num'] = self.checkpoint_num
        training_metric['reward_score'] = int(round(self.reward_in_episode))
        training_metric['metric_time'] = int(round(time.time() * 1000))
        training_metric['start_time'] = int(round(self.simulation_start_time * 1000))
        training_metric['elapsed_time_in_milliseconds'] = int(round((time.time() - self.simulation_start_time) * 1000))
        training_metric['episode'] = int(self.episodes)
        training_metric['completion_percentage'] = int(progress)
        self.metrics.append(training_metric)

    def write_metrics_to_s3(self):
        session = boto3.session.Session()
        s3_client = session.client('s3', region_name=self.aws_region)
        metrics_body = json.dumps({'metrics': self.metrics})
        s3_client.put_object(
            Bucket=self.metrics_s3_bucket,
            Key=self.metrics_s3_object_key,
            Body=bytes(metrics_body, encoding='utf-8')
        )

    def is_training_done(self):
        if ((self.target_number_of_episodes > 0) and (self.target_number_of_episodes == self.episodes)) or \
           ((isinstance(self.target_reward_score, (int, float))) and (self.target_reward_score <= self.reward_in_episode)):
            self.is_simulation_done = True
        return self.is_simulation_done

    def cancel_simulation_job(self):
        logger.info ("cancel_simulation_job: make sure to shutdown simapp first")
        simapp_shutdown()

        session = boto3.session.Session()
        robomaker_client = session.client('robomaker', region_name=self.aws_region)
        robomaker_client.cancel_simulation_job(
            job=self.simulation_job_arn
        )

class DeepRacerRacetrackCustomActionSpaceEnv(DeepRacerRacetrackEnv):
    def __init__(self):
        DeepRacerRacetrackEnv.__init__(self)
        try:
            # Try loading the custom model metadata (may or may not be present)
            with open('custom_files/model_metadata.json', 'r') as f:
                model_metadata = json.load(f)
                self.json_actions = model_metadata['action_space']
            logger.info("Loaded action space from file: {}".format(self.json_actions))
        except Exception as ex:
            # Failed to load, fall back on the default action space
            from markov.defaults import model_metadata
            self.json_actions = model_metadata['action_space']
            logger.info("Exception {} on loading custom action space, using default: {}".format(ex, self.json_actions))
        self.action_space = spaces.Discrete(len(self.json_actions))

    def step(self, action):
        self.steering_angle = float(self.json_actions[action]['steering_angle']) * math.pi / 180.0
        self.speed = float(self.json_actions[action]['speed'])
        self.action_taken = action
        return super().step([self.steering_angle, self.speed])
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -