feat: add perspective correction code but not working

2026-04-09 07:26:45 +08:00
parent 5392084f0f
commit 1cf5afcd0f
1 changed files with 94 additions and 5 deletions
--- a/mv-and-ip/car_plate.py
+++ b/mv-and-ip/car_plate.py
@@ -118,6 +118,72 @@ def _analyse_car_plate_connection(
    return best
@dataclass
 class PerspectiveData:
    top_left: tuple[int, int]
    top_right: tuple[int, int]
    bottom_left: tuple[int, int]
    bottom_right: tuple[int, int]
    new_width: int
    new_height: int
 def _extract_perspective_data(
    gray: cv.typing.MatLike,
 ) -> typing.Optional[PerspectiveData]:
    """ """
    # Histogram balance to increase contrast
    hist_gray = cv.equalizeHist(gray)
    # Apply Gaussian blur to reduce noise
    blurred = cv.GaussianBlur(hist_gray, (5, 5), 0)
    # Edge detection using Canny
    edges = cv.Canny(blurred, 50, 150)
    # Find contours
    contours, _ = cv.findContours(edges, cv.RETR_EXTERNAL, cv.CHAIN_APPROX_SIMPLE)
    if not contours:
        return None
    # Find the largest one because all image is car plate
    max_area_contour = max(contours, key=lambda contour: cv.contourArea(contour))
    # Approximate the contour
    peri = cv.arcLength(max_area_contour, True)
    approx = cv.approxPolyDP(max_area_contour, 0.02 * peri, True)
    if len(approx) != 4:
        return None
    # Perspective transformation to get front view
    # Order points: top-left, top-right, bottom-right, bottom-left
    pts = approx.reshape(4, 2)
    rect = np.zeros((4, 2), dtype="float32")
    # Sum and difference of coordinates to find corners
    s = pts.sum(axis=1)
    top_left = pts[np.argmin(s)]  # Top-left has smallest sum
    bottom_right = pts[np.argmax(s)]  # Bottom-right has largest sum
    diff = np.diff(pts, axis=1)
    top_right = pts[np.argmin(diff)]  # Top-right has smallest difference
    bottom_left = pts[np.argmax(diff)]  # Bottom-left has largest difference
    # Calculate width and height of new image
    width_a = np.linalg.norm(rect[0] - rect[1])
    width_b = np.linalg.norm(rect[2] - rect[3])
    max_width = max(int(width_a), int(width_b))
    height_a = np.linalg.norm(rect[0] - rect[3])
    height_b = np.linalg.norm(rect[1] - rect[2])
    max_height = max(int(height_a), int(height_b))
    # Return value
    return PerspectiveData(
        top_left, top_right, bottom_left, bottom_right, max_width, max_height
    )
 def extract_car_plate(img: cv.typing.MatLike) -> typing.Optional[cv.typing.MatLike]:
    """
    Extract the car plate part from given image.
@@ -136,10 +202,11 @@ def extract_car_plate(img: cv.typing.MatLike) -> typing.Optional[cv.typing.MatLi
        # 连通域分析，筛选最符合车牌长宽比的区域作为车牌
        candidate = _analyse_car_plate_connection(mask)
        # 找到任意一个就退出
-        if candidate is not None: break
+        if candidate is not None:
            break
    if candidate is None:
-        logging.error('Can not find any car plate.')
+        logging.error("Can not find any car plate.")
        return None
    # 稍微扩边获取最终车牌区域
@@ -149,13 +216,13 @@ def extract_car_plate(img: cv.typing.MatLike) -> typing.Optional[cv.typing.MatLi
    y1 = max(candidate.y - pad, 0)
    x2 = min(candidate.x + candidate.w + pad, w_img)
    y2 = min(candidate.y + candidate.h + pad, h_img)
-    logging.info(f'车牌区域: x={x1}, y={y1}, w={x2 - x1}, h={y2 - y1}')
+    logging.info(f"车牌区域: x={x1}, y={y1}, w={x2 - x1}, h={y2 - y1}")
    # # 在原图上标记（仅供调试）
    # debug = img.copy()
    # cv.rectangle(debug, (x1, y1), (x2, y2), (0, 255, 0), 3)
    # cv.imwrite('./debug_detected.jpg', debug)
-    
+
    # 二值化：文字/边缘 → 黑色，背景 → 白色
    gray = cv.cvtColor(img[y1:y2, x1:x2], cv.COLOR_BGR2GRAY)
@@ -171,7 +238,29 @@ def extract_car_plate(img: cv.typing.MatLike) -> typing.Optional[cv.typing.MatLi
    kernel_denoise = cv.getStructuringElement(cv.MORPH_RECT, (2, 2))
    binary = cv.morphologyEx(binary, cv.MORPH_OPEN, kernel_denoise)
-    #return binary
+    # 尝试获取视角矫正数据
    perspective_data = _extract_perspective_data(gray)
    if perspective_data is None:
        logging.warning(f'Can not fetch perspective data. The output image has no perspective correction.')
        return binary
    # 执行视角矫正
    perspective_src = np.array([
        list(perspective_data.top_left),
        list(perspective_data.top_right),
        list(perspective_data.bottom_right),
        list(perspective_data.bottom_left)
    ], dtype="float32")
    perspective_dst = np.array([
        [0, 0],
        [perspective_data.new_width - 1, 0],
        [perspective_data.new_width - 1, perspective_data.new_height - 1],
        [0, perspective_data.new_height - 1]
    ], dtype="float32")
    M = cv.getPerspectiveTransform(perspective_src, perspective_dst)
    warped = cv.warpPerspective(binary, M, (perspective_data.new_width, perspective_data.new_height))
    return warped
    # cv.imwrite('./plate_binary.png', binary)
    # print("二值化结果已保存: plate_binary.png")