临时提交

2025-08-01 22:10:53 +08:00
parent 1269cf0573
commit aaf371a001
11 changed files with 191 additions and 82 deletions
--- a/resources/add.jpg
+++ b/resources/add.jpg
--- a/resources/bgv.jpg
+++ b/resources/bgv.jpg
--- a/resources/bgv.png
+++ b/resources/bgv.png
--- a/resources/comment.jpg
+++ b/resources/comment.jpg
--- a/resources/like.jpg
+++ b/resources/like.jpg
--- a/resources/like.png
+++ b/resources/like.png
--- a/resources/more.jpg
+++ b/resources/more.jpg
--- a/resources/search.jpg
+++ b/resources/search.jpg
--- a/script/AiTools.py
+++ b/script/AiTools.py
@@ -1,109 +1,218 @@
 import os
-import time
 import cv2
 import numpy as np
-from PIL import Image
+import imutils


 # 工具类
 class AiTools(object):

    @classmethod
-    def find_image_in_image(
-            cls,
-            smallImageUrl,
-            bigImageUrl,
-            match_threshold=0.90,
-            consecutive_required=3,
-            scales=None
-    ):
+    def find_image_in_image(cls, big_image_path, small_image_path, threshold=0.6, use_multiscale=True, scale_range=(0.7, 1.3), scale_steps=10, visualize=True, enable_subpixel=True, preprocess='histogram'):
+        # 读取大图和小图
+        large_image = cv2.imread(big_image_path)
+        small_image = cv2.imread(small_image_path)

-        if scales is None:
-            scales = [0.5, 0.75, 1.0, 1.25, 1.5]
+        if large_image is None or small_image is None:
+            print(f"无法加载图像，请检查路径是否正确！\n大图路径: {big_image_path}\n小图路径: {small_image_path}")
+            return -1, -1

-        template = cv2.imread(smallImageUrl, cv2.IMREAD_COLOR)
-        # if template is None:
-        #     raise Exception(f"❌ 无法读取模板 '{smallImageUrl}'")
+        # 打印图像尺寸信息
+        print(f"大图尺寸: {large_image.shape[1]}x{large_image.shape[0]}")
+        print(f"小图尺寸: {small_image.shape[1]}x{small_image.shape[0]}")

-        template_gray = cv2.cvtColor(template, cv2.COLOR_BGR2GRAY)
+        # 图像预处理函数
+        def preprocess_image(image, method='histogram'):
+            if method == 'histogram':
+                # 直方图均衡化
+                gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
+                equalized = cv2.equalizeHist(gray)
+                return equalized
+            elif method == 'blur':
+                # 高斯模糊
+                blurred = cv2.GaussianBlur(image, (5, 5), 0)
+                gray = cv2.cvtColor(blurred, cv2.COLOR_BGR2GRAY)
+                return gray
+            elif method == 'edge':
+                # 边缘检测
+                gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
+                edges = cv2.Canny(gray, 100, 200)
+                return edges
+            elif method == 'sharp':
+                # 锐化
+                gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
+                kernel = np.array([[-1, -1, -1], [-1, 9, -1], [-1, -1, -1]])
+                sharpened = cv2.filter2D(gray, -1, kernel=kernel)
+                return sharpened
+            else:
+                # 默认转为灰度图
+                return cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)

-        cap = cv2.imread(bigImageUrl, cv2.IMREAD_COLOR)
-        # if not cap.isOpened():
-        #     print(f"❌ 无法打开视频流: {bigImageUrl}")
-        #     return None
+        # 预处理图像
+        large_image_gray = preprocess_image(large_image, preprocess)
+        small_image_gray = preprocess_image(small_image, preprocess)

-        detected_consecutive_frames = 0
+        best_match_val = -1
+        best_match_loc = (-1, -1)
+        best_scale = 1.0
+        best_method = None
+        best_method_enum = None
+        
+        # 定义要尝试的匹配方法
+        match_methods = [
+            (cv2.TM_CCOEFF, 'TM_CCOEFF'),
+            (cv2.TM_CCOEFF_NORMED, 'TM_CCOEFF_NORMED'),
+            (cv2.TM_CCORR, 'TM_CCORR'),  # 添加这个方法
+            (cv2.TM_CCORR_NORMED, 'TM_CCORR_NORMED'),
+            (cv2.TM_SQDIFF, 'TM_SQDIFF'),
+            (cv2.TM_SQDIFF_NORMED, 'TM_SQDIFF_NORMED')
+        ]

-        print("🚀 正在检测爱心图标...")
-        while True:
-            print("死了")
-            ret, frame = cap.read()
-            if not ret or frame is None:
-                time.sleep(0.01)
-                continue
-            print("哈哈哈")
-            frame_gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
+        if use_multiscale:
+            # 多尺度匹配
+            small_height, small_width = small_image_gray.shape
+            scale_step = (scale_range[1] - scale_range[0]) / scale_steps
+            scales = [scale_range[0] + i * scale_step for i in range(scale_steps + 1)]
+            print(f"多尺度匹配范围: {scales}")

-            current_frame_has_match = False
-            best_match_val = 0
-            best_match_loc = None
-            best_match_w_h = None
-            print("aaaaaaaaaaaa")
            for scale in scales:
-                resized_template = cv2.resize(template_gray, (0, 0), fx=scale, fy=scale)
-                th, tw = resized_template.shape[:2]
-
-                if th > frame_gray.shape[0] or tw > frame_gray.shape[1]:
+                # 调整小图大小
+                new_width = int(small_width * scale)
+                new_height = int(small_height * scale)
+                if new_width < 10 or new_height < 10:  # 防止图像太小
                    continue
+                # 使用INTER_AREA插值方法提高缩放精度
+                resized_small = cv2.resize(small_image_gray, (new_width, new_height), interpolation=cv2.INTER_AREA)
+                print(f"尝试尺度: {scale}, 调整后小图尺寸: {new_width}x{new_height}")

-                result = cv2.matchTemplate(frame_gray, resized_template, cv2.TM_CCOEFF_NORMED)
-                _, max_val, _, max_loc = cv2.minMaxLoc(result)
+                # 尝试多种匹配方法
+                for method in [cv2.TM_CCOEFF_NORMED, cv2.TM_CCORR_NORMED, cv2.TM_SQDIFF_NORMED]:
+                    method_name = 'TM_CCOEFF_NORMED' if method == cv2.TM_CCOEFF_NORMED else 'TM_CCORR_NORMED' if method == cv2.TM_CCORR_NORMED else 'TM_SQDIFF_NORMED'
+                    result = cv2.matchTemplate(large_image_gray, resized_small, method)
+                    if method == cv2.TM_SQDIFF_NORMED:
+                        min_val, max_val, min_loc, max_loc = cv2.minMaxLoc(result)
+                        current_val = 1 - min_val  # 转换为类似其他方法的值
+                        current_loc = min_loc
+                    else:
+                        min_val, max_val, min_loc, max_loc = cv2.minMaxLoc(result)
+                        current_val = max_val
+                        current_loc = max_loc

-                if max_val > best_match_val:
-                    best_match_val = max_val
-                    best_match_loc = max_loc
-                    best_match_w_h = (tw, th)
-                if max_val >= match_threshold:
-                    current_frame_has_match = True
-                    print("break 了")
-                    break
-            print("bbbbbbbbbbbbbbbbbbbbbb")
-            if current_frame_has_match:
-                print("111111")
-                detected_consecutive_frames += 1
-                last_detection_info = (best_match_loc, best_match_w_h, best_match_val)
-            else:
-                print("2222222")
-                detected_consecutive_frames = 0
-                last_detection_info = None
+                    print(f"  方法: {method_name}, 匹配值: {current_val:.6f}")
+                    if current_val > best_match_val:
+                        best_match_val = current_val
+                        best_match_loc = current_loc
+                        best_scale = scale
+                        best_method = method_name
+                        best_method_enum = method
+        else:
+            # 单一尺度匹配，但尝试多种方法
+            for method in [cv2.TM_CCOEFF_NORMED, cv2.TM_CCORR_NORMED, cv2.TM_SQDIFF_NORMED]:
+                method_name = 'TM_CCOEFF_NORMED' if method == cv2.TM_CCOEFF_NORMED else 'TM_CCORR_NORMED' if method == cv2.TM_CCORR_NORMED else 'TM_SQDIFF_NORMED'
+                result = cv2.matchTemplate(large_image_gray, small_image_gray, method)
+                if method == cv2.TM_SQDIFF_NORMED:
+                    min_val, max_val, min_loc, max_loc = cv2.minMaxLoc(result)
+                    current_val = 1 - min_val  # 转换为类似其他方法的值
+                    current_loc = min_loc
+                else:
+                    min_val, max_val, min_loc, max_loc = cv2.minMaxLoc(result)
+                    current_val = max_val
+                    current_loc = max_loc

-            if detected_consecutive_frames >= consecutive_required and last_detection_info:
-                print("333333333")
-                top_left, (w, h), match_val = last_detection_info
-                center_x = top_left[0] + w // 2
-                center_y = top_left[1] + h // 2
+                print(f"方法: {method_name}, 匹配值: {current_val:.6f}")
+                if current_val > best_match_val:
+                    best_match_val = current_val
+                    best_match_loc = current_loc
+                    best_method = method_name
+                    best_method_enum = method

-                print(f"🎯 成功识别爱心图标: 中心坐标=({center_x}, {center_y}), 匹配度={match_val:.4f}")
-                return center_y, center_y
-            else:
-                return -1, -1
-        cap.release()
-        print("释放了")
-        return -1, -1
+        print(f"最佳匹配值: {best_match_val:.6f}")  # 打印最佳匹配值，用于调试
+        print(f"最佳匹配方法: {best_method}")
+        print(f"使用尺度: {best_scale}")  # 打印使用的尺度
+        print(f"匹配位置(左上角): {best_match_loc}")

+        # 设置一个阈值，只有当匹配度高于这个阈值时才认为找到
+        if best_match_val >= threshold:
+            # 计算小图在大图中的中心坐标
+            top_left = best_match_loc  # 左上角坐标
+            # 根据最佳尺度调整小图尺寸
+            small_height, small_width = small_image_gray.shape
+            adjusted_width = small_width * best_scale
+            adjusted_height = small_height * best_scale

+            # 亚像素级精确匹配
+            if enable_subpixel and best_method_enum is not None:
+                # 调整小图到最佳尺度
+                resized_small = cv2.resize(small_image_gray, (int(adjusted_width), int(adjusted_height)), interpolation=cv2.INTER_AREA)
+                # 重新执行模板匹配以获取更精确的结果
+                result = cv2.matchTemplate(large_image_gray, resized_small, best_method_enum)
+                
+                # 在最佳匹配点周围定义一个小区域进行亚像素精确化
+                x, y = top_left
+                window_size = 5
+                x1, x2 = max(0, x - window_size), min(result.shape[1], x + window_size + 1)
+                y1, y2 = max(0, y - window_size), min(result.shape[0], y + window_size + 1)
+                
+                # 提取局部区域
+                local_result = result[y1:y2, x1:x2]
+                
+                # 拟合二次曲线找到亚像素级最大值
+                if best_method_enum == cv2.TM_SQDIFF_NORMED:
+                    min_val, _, min_loc, _ = cv2.minMaxLoc(local_result)
+                    subpixel_offset = (min_loc[0] - window_size, min_loc[1] - window_size)
+                else:
+                    _, max_val, _, max_loc = cv2.minMaxLoc(local_result)
+                    subpixel_offset = (max_loc[0] - window_size, max_loc[1] - window_size)
+                
+                # 计算亚像素级精确位置
+                subpixel_x = x + subpixel_offset[0]
+                subpixel_y = y + subpixel_offset[1]
+                
+                print(f"亚像素级精确位置: ({subpixel_x:.2f}, {subpixel_y:.2f})")
+                top_left = (subpixel_x, subpixel_y)
+            
+            # 使用浮点运算计算中心坐标
+            center_x = top_left[0] + adjusted_width / 2
+            center_y = top_left[1] + adjusted_height / 2
+            print(f"计算得到的中心坐标: ({center_x:.2f}, {center_y:.2f})")

+            # 可视化匹配结果
+            if visualize:
+                # 在彩色大图上绘制矩形和中心点
+                large_image_copy = large_image.copy()
+                # 绘制矩形
+                if enable_subpixel:
+                    top_left_int = (int(round(top_left[0])), int(round(top_left[1])))
+                    adjusted_width_int = int(round(adjusted_width))
+                    adjusted_height_int = int(round(adjusted_height))
+                    bottom_right = (top_left_int[0] + adjusted_width_int, top_left_int[1] + adjusted_height_int)
+                    center_int = (int(round(center_x)), int(round(center_y)))
+                else:
+                    bottom_right = (top_left[0] + int(adjusted_width), top_left[1] + int(adjusted_height))
+                    center_int = (int(center_x), int(center_y))
+                    top_left_int = top_left
+                
+                cv2.rectangle(large_image_copy, top_left_int, bottom_right, (0, 255, 0), 2)
+                cv2.circle(large_image_copy, center_int, 5, (0, 0, 255), -1)
+                # 显示图像
+                cv2.imshow('匹配结果', large_image_copy)
+                cv2.waitKey(0)
+                cv2.destroyAllWindows()
+
+            return center_x, center_y
+        else:
+            print(f"匹配值 {best_match_val:.6f} 低于阈值 {threshold}，未找到匹配")
+            return -1, -1
+
+    # 根据名称获取图片地址
    @classmethod
-    def imagePath(cls, name):
+    def pathWithName(cls, name):
        current_file_path = os.path.abspath(__file__)
        # 获取当前文件所在的目录（即script目录）
        current_dir = os.path.dirname(current_file_path)
        # 由于script目录位于项目根目录下一级，因此需要向上一级目录移动两次
        project_root = os.path.abspath(os.path.join(current_dir, '..'))
        # 构建资源文件的完整路径，向上两级目录，然后进入 resources 目录
-        resource_path = os.path.abspath(os.path.join(project_root, 'resources', name + ".png")).replace('/', '\\\\')
+        resource_path = os.path.abspath(os.path.join(project_root, 'resources', name + ".jpg")).replace('/', '\\\\')
        return resource_path

-
-
-
--- a/script/ScriptManager.py
+++ b/script/ScriptManager.py
@@ -18,19 +18,19 @@ class ScriptManager():
        session = client.session()
        session.appium_settings({"snapshotMaxDepth": 0})

-        deviceWidth = client.window_size().width
-        deviceHeight = client.window_size().height
+        # deviceWidth = client.window_size().width
+        # deviceHeight = client.window_size().height

        img = client.screenshot()
-        tempPath = "resources/bgv.png"
+        tempPath = "resources/bgv.jpg"
        img.save(tempPath)

-        bgvPath = AiTools.imagePath("bgv")
-        likePath = AiTools.imagePath("like")
+        smallImage = AiTools.pathWithName("like")
+        bigImage = AiTools.pathWithName("bgv")

-        x, y = AiTools.find_image_in_image(bgvPath, likePath)
+        x, y = AiTools.find_image_in_image(bigImage, smallImage)
        print(x, y)
-        # client.tap(end[0] / 3 - 2, end[1] / 3 - 2)
+        # client.tap(x, y)


        # xml = session.source()
--- a/script/screenshot.png
+++ b/script/screenshot.png