watchGo.py

#_*_coding:utf8_*_
import numpy as np
import cv2
from math import sqrt
from os.path import exists

#设置gstreamer管道参数
def gstreamer_pipeline(
    capture_width=1280,  #摄像头预捕获的图像宽度
    capture_height=720,  #摄像头预捕获的图像高度
    display_width=1280,  #窗口显示的图像宽度
    display_height=720,  #窗口显示的图像高度
    framerate=60,       #捕获帧率
    flip_method=0,      #是否旋转图像
):
    return (
        "nvarguscamerasrc ! "
        "video/x-raw(memory:NVMM), "
        "width=(int)%d, height=(int)%d, "
        "format=(string)NV12, framerate=(fraction)%d/1 ! "
        "nvvidconv flip-method=%d ! "
        "video/x-raw, width=(int)%d, height=(int)%d, format=(string)BGRx ! "
        "videoconvert ! "
        "video/x-raw, format=(string)BGR ! appsink"
        % (
            capture_width,
            capture_height,
            framerate,
            flip_method,
            display_width,
            display_height,
        )
    )


# # variables
# capture_width = 1280
# capture_height = 720
# display_width = 1280
# display_height = 720
# framerate = 60
# flip_method = 0

#     # 创建管道
# print(gstreamer_pipeline(capture_width,capture_height,display_width,display_height,framerate,flip_method))

#     #管道与视频流绑定
# cap = cv2.VideoCapture(gstreamer_pipeline(flip_method=0), cv2.CAP_GSTREAMER)
#cap = cv2.VideoCapture(0)
#cap.set(cv2.CAP_PROP_FRAME_WIDTH, 3280)
#cap.set(cv2.CAP_PROP_FRAME_HEIGHT, 2464)
# #cap.set(cv2.CAP_PROP_FOURCC, cv2.VideoWriter_fourcc(*'MJPG'))
#cap.set(cv2.CAP_PROP_FPS, 30) 

boardSize = 19 # might also be 9 or 13
frameSize = None # watchBoard will set this to the size of the video frame

# important file locations:

calibrationFile = "./calibration.npy"
blackCascadeFile = "./blackCascade.xml"
whiteCascadeFile = "./whiteCascade.xml"
emptyCascadeFile = "./emptyCascade.xml"

# camera calibration

# This is an optional step that loads two remapping matrices from
# a file. readImage() below can then use those to remove camera pinhole
# distortion from the video feed.
# to make your own calibration file, see, e.g.:
# https://opencv-python-tutroals.readthedocs.org/en/latest/py_tutorials/py_calib3d/py_calibration/py_calibration.html
# and when you have mapx, mapy, use numpy to save them like this:
# np.save(filename, np.array([mapx, mapy]))

mapx = None
mapy = None

def loadCalibration(filename):
    global mapx, mapy
    if exists(filename):
        loaded = np.load(filename)
        mapx = loaded[0]
        mapy = loaded[1]

loadCalibration(calibrationFile)

# video input and display

# closing the windows that opencv makes is a slightly hacky proposition:
def closeWindow(win="video"):
    cv2.destroyWindow(win)
    for i in range(4):
        cv2.waitKey(1)

def readImage():
    global cap
    
    # read image from cap, remapping it if we have mapx, mapy
    # assumes camera is already open
    retval, img = cap.read()
    img = undistort(img)
# 图像太大需要调整
    height, width = img.shape[0:2]
    #print("height=",height,"width=",width)
    if width > 800:
            new_width = 640
            new_height = int(new_width/width*height)
            img = cv2.resize(img, (new_width, new_height))
    #print("new_height=",new_height,"new_width=",new_width)
    

    # print(height,width,mapx,mapy)
    # if mapx is not None and mapy is not None:
    #     return cv2.remap(img, mapx, mapy, cv2.INTER_LINEAR)
      
    # else:
    #     return img
    return img            

# finding and watching a go board

# open the cascade classifiers:
empty_cascade = cv2.CascadeClassifier(emptyCascadeFile)
black_cascade = cv2.CascadeClassifier(blackCascadeFile)
white_cascade = cv2.CascadeClassifier(whiteCascadeFile)

def avgImages(images): # average an array of images to remove some video noise
    output = np.zeros(images[0].shape, dtype="float32")
    for i in images:
        output += i
    output /= len(images)
    return output.astype("uint8")

def readBoard(image):
    # search the image for a go board whose size is set by the global variable boardSize
    # this function returns a numpy array that represents a go position: 0 is an empty
    # intersection, 1 is a black stone, 2 is a white stone
    # readBoard also returns an array of the board's corners' coordinates in image 

    output = np.zeros((boardSize, boardSize), dtype="uint8")
    imgCorners = None

    # use the cascade classifiers to find anything that looks like
    # an empty intersection:
    emptyRectangles = empty_cascade.detectMultiScale(image, 1.08, 1)
    # a black stone:
    blackRectangles = black_cascade.detectMultiScale(image, 1.1, 1)
    # or a white stone:
    whiteRectangles = white_cascade.detectMultiScale(image, 1.1, 1)

    # cascade classifiers return a rectangle around the found object;
    # the center points of these rectangles are what we actually want:
    empties = []
    blacks = []
    whites = []
    for (ex, wy, w, h) in emptyRectangles:
        x = ex + w / 2.0
        y = wy + w / 2.0
        empties.append([x, y])
    for (ex, wy, w, h) in blackRectangles:
        x = ex + w / 2.0
        y = wy + w / 2.0
        blacks.append([x, y])
    for (ex, wy, w, h) in whiteRectangles:
        x = ex + w / 2.0
        y = wy + w / 2.0
        whites.append([x, y])

    # for diagnostic purposes, it can be useful to draw all the points
    # noted by the cascade classifier. uncomment the following to do this:
    for c in empties:
        cv2.circle(image,
                   (int(round(c[0])), int(round(c[1]))),
                   3,
                   (0, 255, 255),
                   -1)
    for c in blacks:
        cv2.circle(image,
                   (int(round(c[0])), int(round(c[1]))),
                   3,
                   (0, 255, 0),
                   -1)
    for c in whites:
        cv2.circle(image,
                   (int(round(c[0])), int(round(c[1]))),
                   3,
                   (0, 0, 255),
                   -1)
    cv2.imshow("dots", image)

    # now find the corners of a rectangle around those spots
    # that seem most likely to be the board & any stones on it
    group = findGroup(empties + blacks + whites)
    print(empties,blacks,whites)
    print(group)
    if group is None:
        return output, imgCorners
    hull = cv2.convexHull(np.array(group, dtype="int32"))
    epsilon = 0.001*cv2.arcLength(hull, True)
    approx = cv2.approxPolyDP(hull, epsilon, True)
    # approx returns maybe a rectangle with a corner or two lopped off
    imgCorners = fourCorners(approx) # so un-lop those corners

    if imgCorners is not None and len(imgCorners) > 3:
        # unwarp the stone positions and mark them in the output
        flatCorners = np.array([[0, 0],
                                [boardSize - 1, 0],
                                [boardSize - 1, boardSize - 1],
                                [0, boardSize - 1]],
                               dtype="float32")
        persp = cv2.getPerspectiveTransform(imgCorners, flatCorners)
        if len(blacks) > 0:
            blacks = np.array(blacks, dtype="float32")
            blacks = np.array([blacks])
            blacksFlat = cv2.perspectiveTransform(blacks, persp)
            for i in blacksFlat[0]:
                x = int(round(i[0]))
                y = int(round(i[1]))
                if x >= 0 and x < boardSize and y >= 0 and y < boardSize:
                    output[x][y] = 1
        if len(whites) > 0:
            whites = np.array(whites, dtype="float32")
            whites = np.array([whites])
            whitesFlat = cv2.perspectiveTransform(whites, persp)
            for i in whitesFlat[0]:
                x = int(round(i[0]))
                y = int(round(i[1]))
                if x >= 0 and x < boardSize and y >= 0 and y < boardSize:
                    output[x][y] = 2
        #print(output)
        print(imgCorners)

    return output, imgCorners


def findGroupMembers(maxDistance, i, distances, group):
    # recursively search for all the spots that are close enough to i,
    # or are close enough to a spot that's close enough, etc.
    for j in range(len(group)):
        if group[j]:
            pass
        elif distances[i][j] < maxDistance:
            group[j] = True
            findGroupMembers(maxDistance, j, distances, group)

def findGroup(spots):
    # find the spots that are bunched together

    # make an array of every spot's distance to every other spot
    length = len(spots)
    distances = np.zeros((length, length), dtype="float32")
    distanceList = []
    for i in range(length):
        for j in range(length):
            d = sqrt((spots[i][0] - spots[j][0])**2 + (spots[i][1] - spots[j][1])**2)
            distances[i][j] = d
            if d > 0:
                distanceList.append(d)

    # get the maximum distance to be considered in the main group
    distanceList.sort()
    numDistances = int((boardSize - 1)**2 * 1.8) # number of distances that should be between spots on a board
    maxDistance = np.mean(distanceList[0:numDistances]) * 1.75 # a little bigger than that, for luck

    # find a big enough group
    minGroup = int(boardSize**2 * 0.75)
    group = np.zeros((length), dtype="bool_")
    for i in range(length):
        findGroupMembers(maxDistance, i, distances, group)
        if group.sum() >= minGroup:
            outPoints = []
            for k in range(length):
                if group[k]:
                    outPoints.append(spots[k])
            return outPoints
        else:
            group = np.zeros((length), dtype="bool_")

def sortPoints(box):
    # sort the four points of a box so they're in the same order every time
    # for perspective mapping
    rect = np.zeros((4, 2), dtype = "float32")

    s = box.sum(axis = 1)
    rect[0] = box[np.argmin(s)]
    rect[2] = box[np.argmax(s)]

    diff = np.diff(box, axis = 1)
    rect[1] = box[np.argmin(diff)]
    rect[3] = box[np.argmax(diff)]

    return rect

def fourCorners(hull):
    # hull is an approximation of a quadrilateral that may have a corner or two lopped off
    # the assumption is that the four longest lines in that hull will be segments
    # of the sides of that un-lopped ideal quadrilateral
    length = len(hull)

    if len < 4:
        return []
    
    # make a list of [line, length]
    allLines = []
    for i in range(length):
        if i == (length - 1):
            line = [[hull[i][0][0], hull[i][0][1]], [hull[0][0][0], hull[0][0][1]]]
        else:
            line = [[hull[i][0][0], hull[i][0][1]], [hull[i + 1][0][0], hull[i + 1][0][1]]]
        d = sqrt((line[0][0] - line[1][0])**2 + (line[0][1] - line[1][1])**2)
        allLines.append([line, d])

    # get the four longest lines
    allLines.sort(key=lambda x: x[1], reverse=True)
    lines = []
    for i in range(4):
        lines.append(allLines[i][0])

    # make equations for each line of the form: y = m*x + c
    equations = []
    for i in lines:
        x_coords, y_coords = zip(*i)
        A = np.vstack([x_coords, np.ones(len(x_coords))]).T
        m, c = np.linalg.lstsq(A, y_coords)[0]
        equations.append([m, c])

    # find intersections of each line with each other line
    # as long as it's in the frame
    intersections = []
    for i in equations:
        for j in equations:
            if i[0] == j[0]:
                pass
            else:
                a = np.array([[i[0] * -1, 1], [j[0] * -1, 1]])
                b = np.array([i[1], j[1]])
                solution = np.linalg.solve(a, b)
                if solution[0] > 0 and solution[1] > 0 and solution[0] < frameSize[0] and solution[1] < frameSize[1]:
                    intersections.append([solution[0], solution[1]])

    intersections.sort()
    
    if len(intersections) > 6:
        output = [intersections[0],
                  intersections[2],
                  intersections[4],
                  intersections[6]]
        box = sortPoints(np.array(output, dtype="float32"))
        return box
    else:
        return []

# displaying the board

# make a blank board
def blankBoard(boardBlockSize):
    yellow = [75, 215, 255]
    black = [0, 0, 0]
    white = [255, 255, 255]
    halfBoardBlock = int(round((boardBlockSize / 2.0)))
    boardSide = boardBlockSize * boardSize
    blankBoard = np.zeros((boardSide, boardSide, 3),
                     dtype="uint8")
    cv2.rectangle(blankBoard, (0, 0), (boardSide, boardSide), yellow, -1)
    for i in range(boardSize):
        spot = i * boardBlockSize + halfBoardBlock
        cv2.line(blankBoard,
                 (spot, halfBoardBlock),
                 (spot, boardSide - halfBoardBlock),
                 black,
                 int(boardBlockSize / 10))
        cv2.line(blankBoard,
                 (halfBoardBlock, spot),
                 (boardSide - halfBoardBlock, spot),
                 black,
                  int(boardBlockSize / 10))
    if boardSize == 19:
        spots = [[3, 3], [9, 3], [15, 3],
                 [3, 9], [9, 9], [15, 9],
                 [3, 15], [9, 15], [15, 15]]
    else:
        spots = []

    for s in spots:
        cv2.circle(blankBoard,
                   (s[0] * boardBlockSize + halfBoardBlock,
                    s[1] * boardBlockSize + halfBoardBlock),
                   int(boardBlockSize * .15),
                   black,
                   -1)

    return blankBoard

def drawBoard(board, size=(500, 500)):
    black = [0, 0, 0]
    white = [255, 255, 255]
    
    boardBlockSize = 100
    halfBoardBlock = int(round(boardBlockSize / 2.0))
    output =  blankBoard(100)
    (w, h) = board.shape
    for x in range(w):
        for y in range(h):
            if board[x][y] == 1:
                cv2.circle(output,
                           ((x * boardBlockSize) + halfBoardBlock,
                            (y * boardBlockSize) + halfBoardBlock),
                           boardBlockSize / 2,
                           black,
                           -1)
            elif board[x][y] == 2:
                cv2.circle(output,
                           ((x * boardBlockSize) + halfBoardBlock,
                            (y * boardBlockSize) + halfBoardBlock),
                           boardBlockSize / 2,
                           white,
                           -1)
    output = cv2.resize(output, size, output, 0, 0, cv2.INTER_AREA)
    return output

def watchBoard():
    global frameSize
    global cap
    capture_width = 1280
    capture_height = 720
    display_width = 1280
    display_height = 720
    framerate = 60
    flip_method = 0

    # 创建管道
    print(gstreamer_pipeline(capture_width,capture_height,display_width,display_height,framerate,flip_method))

    #管道与视频流绑定
    cap = cv2.VideoCapture(gstreamer_pipeline(flip_method=0), cv2.CAP_GSTREAMER)
    #cap.open(0)
    #cap = cv2.VideoCapture(gstreamer_pipeline(flip_method=0), cv2.CAP_GSTREAMER)


    imgCorners = None

    # initialize the video display
    #ret_val, img = cap.read()
    img = readImage()
    (h, w, d) = img.shape
    frameSize = (w, h)
    videoSize = (int(round(w / 2.0)), int(round(h / 2.0)))
    cv2.imshow("camera", cv2.resize(img, videoSize, 0, 0, cv2.INTER_AREA))

    # show a grayed-out blank board to begin with
    board = np.zeros((boardSize, boardSize), dtype="uint8")
    print(board)
    cv2.imshow("board", cv2.cvtColor(drawBoard(board), cv2.COLOR_BGR2GRAY))
    
    # fill a buffer with video frames
    bufSize = 10
    buf = []
    for i in range(bufSize):
        buf.append(readImage())
    i = 0

    # to start with, look for movement in the whole video frame:
    roi = np.zeros((h, w), dtype="uint8") # Region Of Interest
    cv2.rectangle(roi, (0, 0), (w, h), 1, -1)
    movementThreshold = int(w * h * 0.1)
    stillFrames = 0
    moving = True

    
    while cv2.waitKey(1) == -1:
        new = readImage()
        bkg = avgImages(buf)
        motion = cv2.absdiff(cv2.GaussianBlur(new, (11, 11), 0),
                             cv2.GaussianBlur(bkg, (11, 11), 0))
        motion = cv2.cvtColor(motion, cv2.COLOR_BGR2GRAY)
        motion *= roi
        retval, motion = cv2.threshold(motion, 32, 1, cv2.THRESH_BINARY)
        motionSum = motion.sum()
        buf[i] = new
        i = (i + 1) % bufSize

        if motionSum > movementThreshold:
            if not moving: # if the video starts moving, gray out the board
                cv2.imshow("board", cv2.cvtColor(drawBoard(board), cv2.COLOR_BGR2GRAY))
                moving = True
                stillFrames = 0
        else:
            moving = False
            stillFrames += 1
            if stillFrames == (bufSize + 1): # if the video stands still for long enough, read the board
                board, imgCorners = readBoard(bkg)
                print(board)
                cv2.imshow("board", drawBoard(board))
                if imgCorners is not None and len(imgCorners) > 3: # look for movement around where the board is:
                    roi = np.zeros((h, w), dtype="uint8")
                    cv2.fillConvexPoly(roi, np.array(imgCorners, dtype="int32"), 1)
                    kernel = cv2.getStructuringElement(cv2.MORPH_ELLIPSE, (27, 27))
                    roi = cv2.dilate(roi, kernel)
                    movementThreshold = int(cv2.contourArea(imgCorners) / (boardSize**2))

        # draw the board corners to the video display:
        image = new.copy()
        if imgCorners is not None:
            for c in imgCorners:
                cv2.circle(image,
                           (int(round(c[0])), int(round(c[1]))),
                           6,
                           (0, 0, 255),
                           -1)
        cv2.imshow("camera", cv2.resize(image, videoSize, 0, 0, cv2.INTER_AREA))

    cap.release()
    closeWindow("camera")
    closeWindow("board")


def undistort(frame): 
    fx = 783.7093 
    cx = 653.2896 
    fy = 783.5000 
    cy = 393.6671 
    k1, k2, p1, p2, k3 = -0.3500, 0.1379, 0.0, 0.0, 0.0 
    # 相机坐标系到像素坐标系的转换矩阵 
    k = np.array([ [fx, 0, cx], [0, fy, cy], [0, 0, 1] ]) 
    # 畸变系数 
    d = np.array([ k1, k2, p1, p2, k3 ]) 
    h, w = frame.shape[:2] 
    mapx, mapy = cv2.initUndistortRectifyMap(k, d, None, k, (w, h), 5) 
    return cv2.remap(frame, mapx, mapy, cv2.INTER_LINEAR)

if __name__ == "__main__":
    watchBoard()