main_image_gen.py

# Created By Aaron Brown
# January 20, 2017
# Udacity Self-Driving Car Nanodegree

# Main class to generate image output

import numpy as np
import cv2
import pickle
import glob
from LineTracker import Tracker

# Read in the saved objpoints and imgpoints
dist_pickle = pickle.load( open( "camera_cal/calibration_pickle.p", "rb" ) )
mtx = dist_pickle["mtx"]
dist = dist_pickle["dist"]

# Useful functions for producing the binary pixel of interest images to feed into the LaneTracker Algorithm
def abs_sobel_thresh(img, orient='x', sobel_kernel=3, thresh=(0, 255)):
    # Calculate directional gradient
    gray = cv2.cvtColor(img, cv2.COLOR_RGB2GRAY)
    if orient == 'x':
        abs_sobel = np.absolute(cv2.Sobel(gray, cv2.CV_64F, 1, 0))
    if orient == 'y':
        abs_sobel = np.absolute(cv2.Sobel(gray, cv2.CV_64F, 0, 1))
    scaled_sobel = np.uint8(255*abs_sobel/np.max(abs_sobel))
    binary_output = np.zeros_like(scaled_sobel)
    # Apply threshold
    binary_output[(scaled_sobel >= thresh[0]) & (scaled_sobel <= thresh[1])] = 1
    return binary_output

def mag_thresh(image, sobel_kernel=3, mag_thresh=(0, 255)):
    # Calculate gradient magnitude
    gray = cv2.cvtColor(img, cv2.COLOR_RGB2GRAY)
    sobelx = cv2.Sobel(gray, cv2.CV_64F, 1, 0, ksize=sobel_kernel)
    sobely = cv2.Sobel(gray, cv2.CV_64F, 0, 1, ksize=sobel_kernel)
    gradmag = np.sqrt(sobelx**2 + sobely**2)
    scale_factor = np.max(gradmag)/255 
    gradmag = (gradmag/scale_factor).astype(np.uint8)
    binary_output = np.zeros_like(gradmag)
    # Apply threshold
    binary_output[(gradmag >= mag_thresh[0]) & (gradmag <= mag_thresh[1])] = 1
    return binary_output

def dir_threshold(image, sobel_kernel=3, thresh=(0, np.pi/2)):
    # Calculate gradient direction
    gray = cv2.cvtColor(img, cv2.COLOR_RGB2GRAY)
    sobelx = cv2.Sobel(gray, cv2.CV_64F, 1, 0, ksize=sobel_kernel)
    sobely = cv2.Sobel(gray, cv2.CV_64F, 0, 1, ksize=sobel_kernel)
    with np.errstate(divide='ignore', invalid='ignore'):
        absgraddir = np.absolute(np.arctan(sobely/sobelx))
        binary_output =  np.zeros_like(absgraddir)
        # Apply threshold
        binary_output[(absgraddir >= thresh[0]) & (absgraddir <= thresh[1])] = 1
    return binary_output

def color_threshold(image, sthresh=(0,255), vthresh=(0,255)):
	hls = cv2.cvtColor(image, cv2.COLOR_RGB2HLS)
	s_channel = hls[:,:,2]
	s_binary = np.zeros_like(s_channel)
	s_binary[(s_channel >= sthresh[0]) & (s_channel <= sthresh[1])  ] = 1

	hsv = cv2.cvtColor(image, cv2.COLOR_RGB2HSV)
	v_channel = hsv[:,:,2]
	v_binary = np.zeros_like(v_channel)
	v_binary[(v_channel >= vthresh[0]) & (v_channel <= vthresh[1])  ] = 1

	output = np.zeros_like(s_channel)
	output[(s_binary == 1) & (v_binary == 1)] = 1
	return output

def window_mask(width, height, img_ref, center,level):
		output = np.zeros_like(img_ref)
		output[int(img_ref.shape[0]-(level+1)*height):int(img_ref.shape[0]-level*height),max(0,int(center-width)):min(int(center+width),img_ref.shape[1])] = 1
		return output

# Make a list of test images
images = glob.glob('./test_images/test*.jpg')

for idx, fname in enumerate(images):
	# read in image
	img = cv2.imread(fname)
	# undistort the image
	img = cv2.undistort(img,mtx,dist,None,mtx)

	# process image and generate binary pixel of interests
	preprocessImage = np.zeros_like(img[:,:,0])
	gradx = abs_sobel_thresh(img, orient='x', thresh=(25,255)) # 12
	grady = abs_sobel_thresh(img, orient='y', thresh=(10,255)) # 25
	c_binary = color_threshold(img, sthresh=(100,255), vthresh=(200,255)) 
	preprocessImage[((gradx == 1) & (grady == 1) | (c_binary == 1) )] = 255


	# work on defining perspective transformation area
	img_size = (img.shape[1],img.shape[0])
	bot_width = .76 # percent of bottom trapizoid height
	mid_width = .16 # percent of middle trapizoid height
	height_pct = .66 # percent for trapizoid height
	bottom_trim = .935 # percent from top to bottom to avoid car hood 
	src = np.float32([[img.shape[1]*(.5-mid_width/2),img.shape[0]*height_pct],[img.shape[1]*(.5+mid_width/2),img.shape[0]*height_pct],[img.shape[1]*(.5+bot_width/2),img.shape[0]*bottom_trim],[img.shape[1]*(.5-bot_width/2),img.shape[0]*bottom_trim]])
	offset = img_size[0]*.33
	dst = np.float32([[offset, 0], [img_size[0]-offset, 0],[img_size[0]-offset, img_size[1]], [offset ,img_size[1]]])

	# perform the transform
	M = cv2.getPerspectiveTransform(src,dst)
	Minv = cv2.getPerspectiveTransform(dst,src)
	warped = cv2.warpPerspective(preprocessImage,M,img_size,flags=cv2.INTER_LINEAR)

	# Set up the overall class to do all the tracking
	curve_centers = Tracker(Mycenter_dis = .275*1280, Mywindow_width = 25, Mywindow_height = 40, Mypadding = 25, Myslide_res = 5, Myframe_ps = 1, My_ym = 10/720, My_xm = 4/384)

	# find the best line centers based on the binary pixel of interest input
	frame_centers = curve_centers.track_line(warped)
	# need these parameters to draw the graphic overlay illustraing the window convolution matching
	window_width = curve_centers.window_width 
	window_height = curve_centers.window_height
	# points used for graphic overlay 
	l_points = np.zeros_like(warped)
	r_points = np.zeros_like(warped)

	# points used to find the left and right lanes
	rightx = []
	leftx = []

	res_yvals = np.arange(warped.shape[0]-(window_height+window_height/2),0,-window_height)
	
	for level in range(1,len(frame_centers)):
		l_mask = window_mask(window_width,window_height,warped,frame_centers[level][0],level)
		r_mask = window_mask(window_width,window_height,warped,frame_centers[level][1],level)
		# add center value found in frame to the list of lane points per left,right
		leftx.append(frame_centers[level][0])
		rightx.append(frame_centers[level][1])
		# fill in graphic points here if pixels fit inside the specificed window from l/r mask
		l_points[(l_points == 255) | ((l_mask == 1) ) ] = 255
		r_points[(r_points == 255) | ((r_mask == 1) ) ] = 255

	# drawing the graphic overlay to represents the results found for tracking window centers
	template = np.array(r_points+l_points,np.uint8)
	zero_channel = np.zeros_like(template)
	template = np.array(cv2.merge((zero_channel,zero_channel,template)),np.uint8)
	warpage = np.array(cv2.merge((warped,warped,warped)),np.uint8)
	graphic_measure = cv2.addWeighted(warpage, 0.2, template, 0.75, 0.0)
	
	# fit the lane boundaries to the left,right center positions found
	yvals = range(0,warped.shape[0])

	left_fit = np.polyfit(res_yvals, leftx, 3)
	left_fitx = left_fit[0]*yvals*yvals*yvals + left_fit[1]*yvals*yvals + left_fit[2]*yvals+left_fit[3]
	left_fitx = np.array(left_fitx,np.int32)
	
	right_fit = np.polyfit(res_yvals, rightx, 3)
	right_fitx = right_fit[0]*yvals*yvals*yvals + right_fit[1]*yvals*yvals + right_fit[2]*yvals+right_fit[3]
	right_fitx = np.array(right_fitx,np.int32)

	# used to find center curve
	curve_xpts = [(right_fitx[0]+left_fitx[0])/2,(right_fitx[len(right_fitx)/2]+left_fitx[len(left_fitx)/2])/2,(right_fitx[-1]+left_fitx[-1])/2]
	curve_ypts = [yvals[0],yvals[(int)(len(yvals)/2)],yvals[-1]]
	curve_fit = np.polyfit(curve_ypts, curve_xpts, 2)
	curve_fitx = curve_fit[0]*yvals*yvals + curve_fit[1]*yvals+ curve_fit[2]

	# used to format everything so its ready for cv2 draw functions
	left_lane = np.array(list(zip(np.concatenate((left_fitx-window_width/2,left_fitx[::-1]+window_width/2), axis=0),np.concatenate((yvals,yvals[::-1]),axis=0))),np.int32)
	right_lane = np.array(list(zip(np.concatenate((right_fitx-window_width/2,right_fitx[::-1]+window_width/2), axis=0),np.concatenate((yvals,yvals[::-1]),axis=0))),np.int32)
	inner_lane = np.array(list(zip(np.concatenate((left_fitx+window_width/2,right_fitx[::-1]-window_width/2), axis=0),np.concatenate((yvals,yvals[::-1]),axis=0))),np.int32)
	curve_pts = np.array([list(zip(curve_fitx,yvals))],np.int32)

	# draw lane lines, middle curve, road background on two different blank overlays
	road = np.zeros_like(template)
	road_bkg = np.zeros_like(template)
	cv2.fillPoly(road,[left_lane],color=[9, 67, 109])
	cv2.fillPoly(road,[right_lane],color=[9, 67, 109])
	cv2.polylines(road,[curve_pts],isClosed=False, color=[5, 176, 249], thickness=3)
	for horz_line_y in curve_centers.horz_lines:
		cv2.line(road,(left_fitx[(int)(horz_line_y)],(int)(horz_line_y)),(right_fitx[(int)(horz_line_y)],(int)(horz_line_y)),color=[5, 176, 249], thickness=3)

	cv2.fillPoly(road_bkg,[inner_lane],color=[38, 133, 197])

	# after done drawing all the marking effects, warp back image to its orginal perspective.
	# Note for the two different overlays, just seperating road_warped and road_warped_bkg to get two different alpha values, its just for astetics...
	road_warped = cv2.warpPerspective(road,Minv,img_size,flags=cv2.INTER_LINEAR)
	road_warped_bkg = cv2.warpPerspective(road_bkg,Minv,img_size,flags=cv2.INTER_LINEAR)

	# merging all the different overlays, basically make things look pretty!
	lane_template = np.array(cv2.merge((road_warped[:,:,2],road_warped[:,:,2],road_warped[:,:,2])),np.uint8)
	bkg_template = np.array(cv2.merge((road_warped_bkg[:,:,2],road_warped_bkg[:,:,2],road_warped_bkg[:,:,2])),np.uint8)
	base = cv2.addWeighted(img, 1.0, bkg_template, -0.6, 0.0)
	base = cv2.addWeighted(base, 1.0, road_warped_bkg, 0.6, 0.0)
	base = cv2.addWeighted(base, 1.0, lane_template, -1.8, 0.0)
	result = cv2.addWeighted(base, 1.0, road_warped, 0.9, 0.0)
	
	# calcuate the middle line curvature
	ym_per_pix = curve_centers.ym_per_pix # meters per pixel in y dimension
	xm_per_pix = curve_centers.xm_per_pix # meteres per pixel in x dimension
	curve_fit_cr = np.polyfit(np.array(curve_ypts,np.float32)*ym_per_pix, np.array(curve_xpts,np.float32)*xm_per_pix, 2)
	curverad = ((1 + (2*curve_fit_cr[0]*curve_ypts[1]*ym_per_pix + curve_fit_cr[1])**2)**1.5) /np.absolute(2*curve_fit_cr[0])
	curve_centers.curvatures.append(curverad)
	curverad = curve_centers.SmoothCurve()

	# calculate the offset of the car on the road
	camera_center = (left_fitx[-1] + right_fitx[-1])/2
	center_diff = (camera_center-warped.shape[1]/2)*xm_per_pix
	side_pos = 'left'
	if center_diff <= 0:
		side_pos = 'right'
	
	# add text backdrop
	txt_bkg = np.zeros_like(result)
	txt_bkg_pts = np.array([(0,0),((int)(result.shape[1]*.5),0),((int)(result.shape[1]*.5),(int)(result.shape[0]*.25)),(0,(int)(result.shape[0]*.25))])
	cv2.fillPoly(txt_bkg,[txt_bkg_pts],color=[200, 200, 200])
	result = cv2.addWeighted(result, 1.0, txt_bkg, -1.0, 0.0)
	# draw the text showing curvature, offset, and speed
	cv2.putText(result,'Radius of Curvature = '+str(round(curverad,3))+'(m)',(50,50) , cv2.FONT_HERSHEY_SIMPLEX, 1,(5, 176, 249),2)
	cv2.putText(result,'Vehicle is '+str(abs(round(center_diff,3)))+'m '+side_pos+' of center',(50,100) , cv2.FONT_HERSHEY_SIMPLEX, 1,(5, 176, 249),2)

	# insert graphic overlay map
	graphic_bkg = np.zeros_like(result)
	# scale the graphic measure that we generated near the start for finding window centers, by some constant factor in both axis
	g_scale = 0.4
	graphic_overlay = cv2.resize(graphic_measure, (0,0), fx=g_scale, fy=g_scale) 
	g_xoffset = result.shape[1]-graphic_overlay.shape[1]
	# overlay the graphic measure in the result image at the top right corner
	result[:graphic_overlay.shape[0], g_xoffset:g_xoffset+graphic_overlay.shape[1]] = graphic_overlay

	write_name = './test_images/tracked'+str(idx)+'.jpg'
	cv2.imwrite(write_name, result)