···· 1.讲解Udacity的CarND-LaneLines-P1-master项目
···· 2.讲解Udacity的CarND-Advanced-Lane-Lines-master项目
···· 3.讲解我在这基础上改进的multi-lane-lines-detection项目
详细代码见 https://github.com/wisdom-bob/CarND-Advanced-Lane-Lines-master
如上图所示为标定的图片,通过以下代码,基于cv2.findChessboardCorners找到对标像素点,这里的像素坐标精确到小数点后3位(ps,事实上这里并不是简单的图像捕捉点,也是统计得到的结果,精确度算不得准,只是当单张表格点较多时结果更可信),对标点对应的ground_truth point,即objp点集,相当于标定板不动,相机移动,由于标定板间隔相同,这里直接简单设定间距为单位1.
# Object points for a chessboard with 9x6 inner corners, laid out on the
# z = 0 plane with unit spacing: (0,0,0), (1,0,0), (2,0,0) ..., (8,5,0).
objp = np.zeros((6 * 9, 3), np.float32)
objp[:, :2] = np.mgrid[0:9, 0:6].T.reshape(-1, 2)

# Arrays to store object points and image points from all the images.
objpoints = []  # 3d points in real world space
imgpoints = []  # 2d points in image plane.
img_with_corners = []  # calibration images with the detected corners drawn on

# Make a list of calibration images
images = glob.glob('./camera_cal/calibration*.jpg')

# Step through the list and search for chessboard corners
for fname in images:
    img = cv2.imread(fname)
    gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
    ret, corners = cv2.findChessboardCorners(gray, (9, 6), None)

    # If found, add object points, image points
    if ret:
        # Every successful detection contributes one (object, image) pair;
        # without these appends calibrateCamera below receives empty lists.
        objpoints.append(objp)
        imgpoints.append(corners)

        # Draw the corners and keep the annotated image for later display
        img = cv2.drawChessboardCorners(img, (9, 6), corners, ret)
        img_with_corners.append(img)

# mtx is the camera matrix, dist is the distortion parameter vector.
# Both are plain module-level names (a `global` statement is a no-op at
# module scope) and are read later by cal_undistort.
# Calculate mtx and dist with cv2.calibrateCamera; the image size is taken
# from the first calibration image.
img = cv2.imread('camera_cal/calibration1.jpg')
gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
img_size = gray.shape[::-1]
ret, mtx, dist, rvecs, tvecs = cv2.calibrateCamera(objpoints, imgpoints, img_size, None, None)
cv2.calibrateCamera,基于objpoints和imgpoints计算结果,当然数据是越多越好,它会逐渐趋向稳定,这里推荐cv2.projectPoints配合筛选原图像数据。另外说一下cv2.calibrateCamera最末尾参数 criteria,用于设定迭代终止条件,算法依据最小二乘法,利用输入的对应点集进行循环计算,不断修正结果,但偶尔也会碰到无法计算的情况,即使findChessboardCorners没有剔除图像,但是在标定计算的过程中,也有一些图像缺陷会被暴露出来需要剔除,这些都需要在调试中慢慢进行。
def cal_undistort(img):
    """Return an undistorted copy of *img*.

    Uses the module-level camera matrix ``mtx`` and distortion coefficients
    ``dist``; ``mtx`` is also passed as the new camera matrix.
    """
    undist = cv2.undistort(img, mtx, dist, None, mtx)
    return undist
# Undistort the most recently loaded `img` using the calibration results.
undist = cal_undistort(img)
# Visualize undistortion: create two side-by-side axes and title them.
# NOTE(review): no imshow call is visible in this snippet, so the axes are
# only titled here — confirm the images are drawn elsewhere.
f, (ax1, ax2) = plt.subplots(1, 2, figsize=(20,10))
ax1.set_title('Original Image', fontsize=30)
ax2.set_title('Undistorted Image', fontsize=30)
# Stretch the subplots to the figure edges, leaving room at the top for titles.
plt.subplots_adjust(left=0., right=1, top=0.9, bottom=0.)
····如上图所示为图像的RGB,HLS通道成像及在各自方向上做二值化特征提取的结果图,二值化的目的是希望尽可能保留道路特征,而其他干扰特征尽可能少,那么对比以上各图我们发现[X sobel on hls],[Y sobel on hls],[X sobel]都是不错的结果,于是这里考虑取[X sobel on hls]和[X sobel]交集,再与[R_channel]作为背景进行取交,得到一个更稳定的结果,从而完成二值化,这里使用的是cv2.Sobel,详细可见上篇文章中的转载[4],本文使用sobel算子(ps.canny算子中也同样用到了sobel算子)。结果如图所示。
def rgb_select(img, thresh=(0, 255)):
    """Return a binary mask of channel 0 of *img* thresholded by *thresh*.

    Channel 0 is treated as the R channel, i.e. the image is presumed to be
    in RGB order (verify against the caller).

    Args:
        img: array indexable as ``img[:, :, 0]``.
        thresh: ``(low, high)`` pair; a pixel is selected when
            ``low < value <= high``.

    Returns:
        Array shaped like one channel of *img*, holding 1 where the pixel is
        selected and 0 elsewhere.
    """
    R = img[:, :, 0]
    binary = np.zeros_like(R)
    # Lower bound is exclusive, upper bound inclusive.
    binary[(R > thresh[0]) & (R <= thresh[1])] = 1
    return binary
def abs_sobel_thresh(img, orient='x', thresh=(0, 255)):
    """Threshold the absolute Sobel gradient of the grayscale image.

    Args:
        img: colour image, converted to grayscale with ``COLOR_RGB2GRAY``.
        orient: ``'x'`` for the x-direction derivative; any other value
            selects the y-direction derivative.
        thresh: ``(low, high)`` pair applied to the gradient after scaling
            to 0..255; a pixel is selected when ``low < value <= high``.

    Returns:
        uint8 array holding 1 where the scaled gradient is inside the
        threshold and 0 elsewhere.
    """
    gray = cv2.cvtColor(img, cv2.COLOR_RGB2GRAY)
    # The two derivatives are mutually exclusive; without the else branch the
    # y-derivative would always overwrite the x-derivative.
    if orient == 'x':
        sobel = cv2.Sobel(gray, cv2.CV_64F, 1, 0)
    else:
        sobel = cv2.Sobel(gray, cv2.CV_64F, 0, 1)
    abs_sobel = np.absolute(sobel)
    peak = np.max(abs_sobel)
    if peak > 0:
        scaled_sobel = np.uint8(255 * abs_sobel / peak)
    else:
        # A completely flat image has no gradient; avoid dividing by zero.
        scaled_sobel = np.zeros(abs_sobel.shape, dtype=np.uint8)
    binary_output = np.zeros_like(scaled_sobel)
    binary_output[(scaled_sobel > thresh[0]) & (scaled_sobel <= thresh[1])] = 1
    return binary_output
def abs_sobel_thresh_hls(img, orient='x', thresh=(0, 255)):
    """Threshold the absolute Sobel gradient of the HLS S channel.

    Args:
        img: colour image, converted with ``COLOR_RGB2HLS``; channel index 2
            (saturation) of the result is used.
        orient: ``'x'`` for the x-direction derivative; any other value
            selects the y-direction derivative.
        thresh: ``(low, high)`` pair applied to the gradient after scaling
            to 0..255; a pixel is selected when ``low < value <= high``.

    Returns:
        uint8 array holding 1 where the scaled gradient is inside the
        threshold and 0 elsewhere.
    """
    hls = cv2.cvtColor(img, cv2.COLOR_RGB2HLS)[:, :, 2]
    # The two derivatives are mutually exclusive; without the else branch the
    # y-derivative would always overwrite the x-derivative.
    if orient == 'x':
        sobel = cv2.Sobel(hls, cv2.CV_64F, 1, 0)
    else:
        sobel = cv2.Sobel(hls, cv2.CV_64F, 0, 1)
    abs_sobel = np.absolute(sobel)
    peak = np.max(abs_sobel)
    if peak > 0:
        scaled_sobel = np.uint8(255 * abs_sobel / peak)
    else:
        # A channel with no variation has no gradient; avoid dividing by zero.
        scaled_sobel = np.zeros(abs_sobel.shape, dtype=np.uint8)
    binary_output = np.zeros_like(scaled_sobel)
    binary_output[(scaled_sobel > thresh[0]) & (scaled_sobel <= thresh[1])] = 1
    return binary_output
def make_binary(img):
    """Build the binary lane mask for *img* from three thresholded features.

    Returns:
        ``(combined_binary, color_binary)`` where ``combined_binary`` is 1
        wherever any of the three masks fired, and ``color_binary`` stacks
        the three masks (R threshold, grayscale x-Sobel, S-channel x-Sobel)
        as channels scaled by 255 for visual inspection.
    """
    # Threshold colour channel
    r_binary = rgb_select(img, (220, 255))
    # Threshold based on Sobel edge detection on the grayscale image
    sobel = abs_sobel_thresh(img, 'x', (40, 255))
    # Threshold based on Sobel edge detection on the S channel
    c_binary = abs_sobel_thresh_hls(img, 'x', (50, 255))
    # Stack each mask as one channel
    color_binary = np.dstack((r_binary, sobel, c_binary)) * 255
    # Combine the three binary thresholds with a logical OR.
    # NOTE(review): the accompanying article text talks about taking an
    # intersection, while this code takes the union — confirm which is intended.
    combined_binary = np.zeros_like(sobel)
    combined_binary[(c_binary == 1) | (sobel == 1) | (r_binary == 1)] = 1
    return (combined_binary, color_binary)
# Undistort `img`, then derive the combined mask and the stacked per-feature
# image from the undistorted result.
undist = cal_undistort(img)
(comb_bin, col_bin) = make_binary(undist)
def perspective_transform(img, M):
    """Warp *img* with the perspective matrix *M*.

    The output size is the module-level ``img_size``; linear interpolation
    is used.
    """
    warped = cv2.warpPerspective(img, M, (img_size), flags=cv2.INTER_LINEAR)
    return warped
# Source quadrilateral in the camera image and the destination rectangle
# (x from 280 to 1000, full image height) it is mapped onto.
# NOTE(review): the source points are presumably hand-picked around the lane
# for this camera setup — confirm before reusing with other footage.
src = np.float32([[185, img_size[1]],[580, 460], [705, 460], [1200, img_size[1]]])
dst = np.float32([[280, img_size[1]], [280, 0], [1000, 0], [1000, img_size[1]]])
# Calculate the perspective matrix and its inverse (dst back to src)
M = cv2.getPerspectiveTransform(src, dst)
M_inv = cv2.getPerspectiveTransform(dst, src)
# Warp the combined binary mask with M
warped = perspective_transform(comb_bin,M)
# Plot the result: expand each mask to three channels scaled by 255, then
# outline the src polygon on the unwarped image and the dst polygon on the
# warped one.
colored_comb_bin = np.dstack((comb_bin, comb_bin, comb_bin)) * 255
cv2.polylines(colored_comb_bin, [np.array(src,dtype=np.int32).reshape((-1, 1, 2))], True, (255,255,0), thickness = 2)
colored_warped = np.dstack((warped, warped, warped)) * 255
cv2.polylines(colored_warped, [np.array(dst, dtype=np.int32).reshape((-1, 1, 2))], True, (255,255,0), thickness=2)
def find_lane_pixels(binary_warped):
    """Locate left and right lane pixels with a sliding-window search.

    The column histogram of the bottom half of *binary_warped* gives the
    starting x position of each lane line. A stack of windows is then walked
    from the bottom of the image to the top; each window collects the
    nonzero pixels inside it and, when enough were found, recentres the next
    window on their mean x position.

    Args:
        binary_warped: 2-D binary image.

    Returns:
        ``(leftx, lefty, rightx, righty, out_img, left_lane_inds,
        right_lane_inds)``: pixel coordinates of both lines, a 3-channel
        visualization image with the search windows drawn on it, and the
        indices of the selected pixels within the nonzero-pixel arrays.
    """
    height = binary_warped.shape[0]

    # Take a histogram of the bottom half of the image
    histogram = np.sum(binary_warped[height // 2:, :], axis=0)
    # Create an output image to draw on and visualize the result
    out_img = np.dstack((binary_warped, binary_warped, binary_warped))

    # Find the peak of the left and right halves of the histogram.
    # These will be the starting point for the left and right lines.
    midpoint = int(histogram.shape[0] // 2)
    leftx_base = np.argmax(histogram[:midpoint])
    rightx_base = np.argmax(histogram[midpoint:]) + midpoint

    nwindows = 10  # Choose the number of sliding windows
    margin = 80  # Set the width of the windows +/- margin
    minpix = 40  # Set minimum number of pixels found to recenter window
    # Set height of windows - based on nwindows above and image shape
    window_height = int(height // nwindows)

    # Identify the x and y positions of all nonzero pixels in the image
    nonzero = binary_warped.nonzero()
    nonzeroy = np.array(nonzero[0])
    nonzerox = np.array(nonzero[1])

    # Current positions to be updated later for each window in nwindows.
    # Plain Python ints keep the rectangle corner tuples free of NumPy scalars.
    leftx_current = int(leftx_base)
    rightx_current = int(rightx_base)

    # Create empty lists to receive left and right lane pixel indices
    left_lane_inds = []
    right_lane_inds = []

    # Step through the windows one by one
    for window in range(nwindows):
        # Identify window boundaries in y (shared) and x (per line)
        win_y_low = height - (window + 1) * window_height
        win_y_high = height - window * window_height
        win_xleft_low = leftx_current - margin
        win_xleft_high = leftx_current + margin
        win_xright_low = rightx_current - margin
        win_xright_high = rightx_current + margin

        # Draw the windows on the visualization image
        cv2.rectangle(out_img, (win_xleft_low, win_y_low), (win_xleft_high, win_y_high), (0, 255, 0), 2)
        cv2.rectangle(out_img, (win_xright_low, win_y_low), (win_xright_high, win_y_high), (0, 255, 0), 2)

        # Identify the nonzero pixels in x and y within the window
        in_rows = (nonzeroy >= win_y_low) & (nonzeroy < win_y_high)
        good_left_inds = (in_rows &
                          (nonzerox >= win_xleft_low) & (nonzerox < win_xleft_high)).nonzero()[0]
        good_right_inds = (in_rows &
                           (nonzerox >= win_xright_low) & (nonzerox < win_xright_high)).nonzero()[0]

        # Append these indices to the lists; without this step the lists
        # stay empty and no lane pixel is ever returned.
        left_lane_inds.append(good_left_inds)
        right_lane_inds.append(good_right_inds)

        # If found > minpix pixels, recenter next window on their mean position
        if len(good_left_inds) > minpix:
            leftx_current = int(np.mean(nonzerox[good_left_inds]))
        if len(good_right_inds) > minpix:
            rightx_current = int(np.mean(nonzerox[good_right_inds]))

    # Concatenate the arrays of indices (previously was a list of arrays)
    try:
        left_lane_inds = np.concatenate(left_lane_inds)
        right_lane_inds = np.concatenate(right_lane_inds)
    except ValueError:
        # np.concatenate rejects an empty list; fall back to "no pixels"
        # so the indexing below still works.
        left_lane_inds = np.array([], dtype=np.intp)
        right_lane_inds = np.array([], dtype=np.intp)

    # Extract left and right line pixel positions
    leftx = nonzerox[left_lane_inds]
    lefty = nonzeroy[left_lane_inds]
    rightx = nonzerox[right_lane_inds]
    righty = nonzeroy[right_lane_inds]
    return leftx, lefty, rightx, righty, out_img, left_lane_inds, right_lane_inds
def fit_polynomial(binary_warped, vis, chose=1):
    """Fit a second-order polynomial x = f(y) to each lane line.

    Args:
        binary_warped: 2-D binary image passed on to find_lane_pixels.
        vis: when truthy, colour the detected pixels in the visualization
            image and plot both fitted curves with matplotlib.
        chose: selects the return form (see Returns).

    Returns:
        ``(ploty, left_fit, right_fit, left_fitx, right_fitx)`` when
        ``chose == 1``; otherwise ``(left_fit, right_fit, left_lane_inds,
        right_lane_inds)``. ``left_fit`` / ``right_fit`` are ``None`` when
        no pixels were found for that line.
    """
    # Find our lane pixels first
    leftx, lefty, rightx, righty, out_img, left_lane_inds, right_lane_inds = find_lane_pixels(binary_warped)

    # Fit a second order polynomial to each line that has any pixels
    left_fit, right_fit = (None, None)
    if len(leftx) != 0:
        left_fit = np.polyfit(lefty, leftx, 2)
    if len(rightx) != 0:
        right_fit = np.polyfit(righty, rightx, 2)

    # Generate x and y values for plotting
    ploty = np.linspace(0, binary_warped.shape[0] - 1, binary_warped.shape[0])
    try:
        left_fitx = left_fit[0] * ploty**2 + left_fit[1] * ploty + left_fit[2]
        right_fitx = right_fit[0] * ploty**2 + right_fit[1] * ploty + right_fit[2]
    except TypeError:
        # Subscripting a fit that is still None raises TypeError; fall back
        # to placeholder curves for both lines so plotting still works.
        left_fitx = 1 * ploty**2 + 1 * ploty
        right_fitx = 1 * ploty**2 + 1 * ploty

    ## Visualization ##
    if vis:
        # Colors in the left and right lane regions
        # NOTE(review): out_img is coloured here but not displayed or
        # returned in this function — confirm whether an imshow is expected.
        out_img[lefty, leftx] = [255, 0, 0]
        out_img[righty, rightx] = [0, 0, 255]
        # Plots the left and right polynomials on the lane lines
        plt.figure(figsize=(15, 15))
        plt.plot(left_fitx, ploty, color='yellow')
        plt.plot(right_fitx, ploty, color='yellow')

    if chose == 1:
        return (ploty, left_fit, right_fit, left_fitx, right_fitx)
    return left_fit, right_fit, left_lane_inds, right_lane_inds
# Fit both lane lines on the warped binary image with visualization enabled;
# `chose` keeps its default of 1, so the five-element form is returned.
(ploty, left_fit, right_fit, left_fitx, right_fitx) = fit_polynomial(warped, True)
····通过测试,在时间占比上:二值化41%,去畸变22.7%,绘制19.7%,拟合车道线13%,透视变换5%…。可以考虑去掉r-channel,只考虑[X sobel on hls]和[X sobel],或者换种二值化方法;此外绘制也可以简化,从而提高帧率。
