726 lines
27 KiB
Python
726 lines
27 KiB
Python
# coding=utf-8
|
||
import uiautomator2 as u2
|
||
import time
|
||
import logging
|
||
import sys
|
||
import os
|
||
import cv2
|
||
import numpy as np
|
||
import re
|
||
|
||
# 添加项目根目录到 sys.path 以便导入 Util
|
||
project_root = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
|
||
if project_root not in sys.path:
|
||
sys.path.append(project_root)
|
||
|
||
from Util.EasyOcrKit import get_easyocr_reader
|
||
|
||
# 配置日志
|
||
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(name)s - %(levelname)s - %(message)s')
|
||
logger = logging.getLogger("TestWeChat")
|
||
|
||
def find_input_box_center(image_path):
|
||
"""
|
||
识别底部输入框的中心坐标,返回 (center_x, center_y, rect_box)
|
||
rect_box 用于可视化: (x, y, w, h) (相对于原图)
|
||
"""
|
||
try:
|
||
img_data = np.fromfile(image_path, dtype=np.uint8)
|
||
img = cv2.imdecode(img_data, cv2.IMREAD_COLOR)
|
||
if img is None:
|
||
return None, None
|
||
|
||
height, width = img.shape[:2]
|
||
|
||
# 截取底部 12% 区域 (缩小范围以精准定位)
|
||
bottom_h = int(height * 0.12)
|
||
crop_y_start = height - bottom_h
|
||
crop = img[crop_y_start:height, 0:width]
|
||
|
||
# 预处理
|
||
gray = cv2.cvtColor(crop, cv2.COLOR_BGR2GRAY)
|
||
|
||
# 策略1: Canny 边缘检测 (对低对比度 UI 更有效)
|
||
edges = cv2.Canny(gray, 50, 150)
|
||
# 膨胀连接断裂的边缘
|
||
kernel = np.ones((3,3), np.uint8)
|
||
dilated = cv2.dilate(edges, kernel, iterations=1)
|
||
|
||
contours, _ = cv2.findContours(dilated, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
|
||
|
||
best_cnt = None
|
||
max_area = 0
|
||
|
||
for cnt in contours:
|
||
x, y, w, h = cv2.boundingRect(cnt)
|
||
# 筛选条件优化:
|
||
# 1. 宽度: 屏幕宽度的 50% - 98% (通常输入框很长)
|
||
# 2. 高度: 30px - 底部区域的 90%
|
||
if width * 0.5 < w < width * 0.98 and 30 < h < bottom_h * 0.9:
|
||
# 计算中心点 Y 坐标相对于全图
|
||
global_y = crop_y_start + y + h // 2
|
||
|
||
# 排除过于靠下的区域 (导航栏/手势条),通常在最后 2%
|
||
if global_y > height * 0.98:
|
||
continue
|
||
|
||
if w * h > max_area:
|
||
max_area = w * h
|
||
best_cnt = (x, y, w, h)
|
||
|
||
if best_cnt:
|
||
x, y, w, h = best_cnt
|
||
center_x = x + w // 2
|
||
center_y = crop_y_start + y + h // 2
|
||
logger.info(f"找到输入框(CV-Canny): ({center_x}, {center_y}), 尺寸: {w}x{h}")
|
||
return (center_x, center_y), (x, crop_y_start + y, w, h)
|
||
|
||
# 策略2: 自适应阈值 (原有逻辑作为备份)
|
||
thresh = cv2.adaptiveThreshold(gray, 255, cv2.ADAPTIVE_THRESH_GAUSSIAN_C,
|
||
cv2.THRESH_BINARY_INV, 11, 2)
|
||
contours_thresh, _ = cv2.findContours(thresh, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
|
||
|
||
for cnt in contours_thresh:
|
||
x, y, w, h = cv2.boundingRect(cnt)
|
||
if width * 0.4 < w < width * 0.95 and 20 < h < bottom_h * 0.8:
|
||
global_y = crop_y_start + y + h // 2
|
||
if global_y > height * 0.98:
|
||
continue
|
||
if w * h > max_area:
|
||
max_area = w * h
|
||
best_cnt = (x, y, w, h)
|
||
|
||
if best_cnt:
|
||
x, y, w, h = best_cnt
|
||
center_x = x + w // 2
|
||
center_y = crop_y_start + y + h // 2
|
||
logger.info(f"找到输入框(CV-Adaptive): ({center_x}, {center_y}), 尺寸: {w}x{h}")
|
||
return (center_x, center_y), (x, crop_y_start + y, w, h)
|
||
|
||
# 兜底策略:使用更靠下的默认坐标 (94%)
|
||
# 之前的 90.5% 用户反馈偏上
|
||
logger.warning("未找到明显输入框轮廓,使用更靠下的默认坐标 (94%)")
|
||
default_y = int(height * 0.94)
|
||
center_x = width // 2
|
||
|
||
# 构造假想框
|
||
fake_w = int(width * 0.7)
|
||
fake_h = int(height * 0.08) # 稍微加高一点,视觉上更像
|
||
fake_x = (width - fake_w) // 2
|
||
fake_y = default_y - fake_h // 2
|
||
|
||
return (center_x, default_y), (fake_x, fake_y, fake_w, fake_h)
|
||
|
||
|
||
except Exception as e:
|
||
logger.error(f"查找输入框失败: {e}")
|
||
return None, None
|
||
|
||
def find_send_button(d):
|
||
"""
|
||
截图并寻找发送按钮 (绿色按钮)
|
||
扩大搜索范围以适应键盘弹出的情况
|
||
"""
|
||
try:
|
||
# 截图到 Screenshots 目录方便调试
|
||
screenshot_dir = os.path.join(os.path.dirname(os.path.abspath(__file__)), "Screenshots")
|
||
if not os.path.exists(screenshot_dir):
|
||
os.makedirs(screenshot_dir)
|
||
timestamp = time.strftime("%Y%m%d_%H%M%S")
|
||
debug_shot_path = os.path.join(screenshot_dir, f"debug_send_check_{timestamp}.jpg")
|
||
|
||
d.screenshot(debug_shot_path)
|
||
logger.info(f"发送按钮查找调试截图已保存: {debug_shot_path}")
|
||
|
||
img = cv2.imread(debug_shot_path)
|
||
if img is None:
|
||
return None
|
||
|
||
h, w = img.shape[:2]
|
||
|
||
# ROI: 底部 60% (考虑到键盘弹出,按钮可能被顶上去)
|
||
# 且只关注右侧 30%
|
||
roi_h = int(h * 0.6)
|
||
roi_w = int(w * 0.3)
|
||
y_start = h - roi_h
|
||
x_start = w - roi_w
|
||
|
||
roi = img[y_start:h, x_start:w]
|
||
|
||
# 转换 HSV
|
||
hsv = cv2.cvtColor(roi, cv2.COLOR_BGR2HSV)
|
||
|
||
# 绿色范围 (WeChat Green)
|
||
lower_green = np.array([35, 80, 80])
|
||
upper_green = np.array([90, 255, 255])
|
||
|
||
mask = cv2.inRange(hsv, lower_green, upper_green)
|
||
|
||
# 查找轮廓
|
||
contours, _ = cv2.findContours(mask, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
|
||
|
||
if contours:
|
||
# 找符合条件的轮廓
|
||
valid_candidates = []
|
||
for cnt in contours:
|
||
area = cv2.contourArea(cnt)
|
||
x, y, cw, ch = cv2.boundingRect(cnt)
|
||
|
||
# 过滤太小的噪点和太大的区域(例如全屏背景)
|
||
# 发送按钮通常面积在 2000-15000 之间 (视分辨率而定)
|
||
if 500 < area < 30000:
|
||
# 宽高比检查:发送按钮通常接近正方形或微扁 (ratio < 2.5)
|
||
ratio = float(cw) / ch
|
||
if 0.5 < ratio < 3.0:
|
||
# 坐标还原到原图
|
||
global_y = y_start + y
|
||
valid_candidates.append({
|
||
'cnt': cnt,
|
||
'area': area,
|
||
'y': global_y,
|
||
'rect': (x, y, cw, ch)
|
||
})
|
||
|
||
if valid_candidates:
|
||
# 核心逻辑:发送按钮一定是所有绿色元素中最靠下的 (Y坐标最大)
|
||
# 且在最右侧
|
||
# 先按 Y 坐标降序排序
|
||
valid_candidates.sort(key=lambda c: c['y'], reverse=True)
|
||
|
||
# 取最靠下的一个 (可能是发送按钮)
|
||
best = valid_candidates[0]
|
||
|
||
# 获取中心点
|
||
bx, by, bw, bh = best['rect']
|
||
cx = x_start + bx + bw // 2
|
||
cy = y_start + by + bh // 2
|
||
|
||
logger.info(f"通过图像识别找到发送按钮 (Bottom-Most): ({cx}, {cy}), 面积: {best['area']}")
|
||
return cx, cy
|
||
|
||
logger.warning("未通过图像识别找到绿色发送按钮")
|
||
return None
|
||
|
||
except Exception as e:
|
||
logger.error(f"查找发送按钮出错: {e}")
|
||
return None
|
||
|
||
def take_debug_screenshot(d, step_name):
|
||
"""
|
||
调试专用截图函数
|
||
"""
|
||
try:
|
||
screenshot_dir = os.path.join(os.path.dirname(os.path.abspath(__file__)), "Screenshots")
|
||
if not os.path.exists(screenshot_dir):
|
||
os.makedirs(screenshot_dir)
|
||
timestamp = time.strftime("%Y%m%d_%H%M%S")
|
||
filename = f"debug_{timestamp}_{step_name}.jpg"
|
||
save_path = os.path.join(screenshot_dir, filename)
|
||
d.screenshot(save_path)
|
||
logger.info(f"📸 [调试截图] {step_name} 已保存: {filename}")
|
||
return save_path
|
||
except Exception as e:
|
||
logger.error(f"截图失败 ({step_name}): {e}")
|
||
return None
|
||
|
||
def perform_input_action(coords, text):
|
||
"""
|
||
点击坐标并输入文本
|
||
"""
|
||
# 优先尝试使用 uiautomator2 的原生控件查找 (更稳健)
|
||
native_success = False
|
||
try:
|
||
d = u2.connect()
|
||
# 查找 EditText 控件
|
||
input_elem = d(className="android.widget.EditText")
|
||
|
||
if input_elem.exists:
|
||
logger.info("发现原生输入框控件,尝试点击...")
|
||
|
||
# 1. 截图:点击前
|
||
take_debug_screenshot(d, "native_01_before_click")
|
||
|
||
# 双击策略
|
||
input_elem.click()
|
||
time.sleep(0.5)
|
||
input_elem.click()
|
||
time.sleep(1)
|
||
|
||
# 2. 截图:点击后 (预期键盘弹出)
|
||
take_debug_screenshot(d, "native_02_after_click_keyboard")
|
||
|
||
logger.info(f"输入文本: {text}")
|
||
|
||
# 尝试 set_text + send_keys 组合
|
||
try:
|
||
input_elem.set_text(text)
|
||
except:
|
||
pass
|
||
|
||
time.sleep(0.5)
|
||
|
||
# 检查文本是否输入成功,如果没有,尝试 send_keys
|
||
try:
|
||
current_text = input_elem.get_text()
|
||
if not current_text or current_text != text:
|
||
logger.warning(f"set_text 似乎未生效 (当前: {current_text}),尝试 send_keys...")
|
||
d.send_keys(text)
|
||
except:
|
||
d.send_keys(text)
|
||
|
||
# 3. 截图:输入文本后
|
||
take_debug_screenshot(d, "native_03_after_text_input")
|
||
|
||
# 尝试发送回车键
|
||
time.sleep(0.5)
|
||
d.press("enter")
|
||
|
||
# 尝试点击发送按钮
|
||
try:
|
||
if d(text="发送").exists:
|
||
d(text="发送").click()
|
||
logger.info("已点击 '发送' 按钮 (Native Text)")
|
||
take_debug_screenshot(d, "native_04_after_send_click_text")
|
||
else:
|
||
logger.info("未找到 '发送' 文本控件,尝试图像识别...")
|
||
send_btn_coords = find_send_button(d)
|
||
if send_btn_coords:
|
||
sx, sy = send_btn_coords
|
||
d.click(sx, sy)
|
||
logger.info(f"已点击 '发送' 按钮 (Image Rec): {sx}, {sy}")
|
||
take_debug_screenshot(d, "native_04_after_send_click_image")
|
||
else:
|
||
width, height = d.window_size()
|
||
fallback_x = int(width * 0.9)
|
||
fallback_y = int(height * 0.965)
|
||
logger.info(f"未识别到发送按钮,尝试盲点右下角: {fallback_x}, {fallback_y}")
|
||
d.click(fallback_x, fallback_y)
|
||
take_debug_screenshot(d, "native_04_after_send_click_fallback")
|
||
except Exception as e:
|
||
logger.error(f"点击发送按钮失败: {e}")
|
||
|
||
logger.info("输入完成 (Native)")
|
||
native_success = True
|
||
return
|
||
|
||
else:
|
||
logger.warning("未找到输入框元素 (Native),转入坐标点击模式...")
|
||
|
||
except Exception as e:
|
||
logger.warning(f"原生控件操作失败,降级为坐标点击: {e}")
|
||
|
||
if native_success:
|
||
return
|
||
|
||
# 降级方案:使用坐标点击
|
||
if not coords:
|
||
logger.error("坐标无效,无法执行点击输入")
|
||
return
|
||
|
||
x, y = coords
|
||
|
||
# 坐标安全检查
|
||
if 'd' not in locals():
|
||
d = u2.connect()
|
||
|
||
try:
|
||
width, height = d.window_size()
|
||
# 移除过于激进的坐标修正 (95% -> 93% 会导致点到输入框上方)
|
||
# 输入框中心通常在 96%-97% 左右
|
||
if y > height * 0.99:
|
||
logger.warning(f"检测到的输入框坐标 y={y} 过于靠底,修正为 {height * 0.97}")
|
||
y = int(height * 0.97)
|
||
except:
|
||
pass
|
||
|
||
try:
|
||
logger.info(f"设备连接成功: {d.info.get('serial')}")
|
||
|
||
# 1. 截图:点击输入框前
|
||
take_debug_screenshot(d, "coord_01_before_click_input")
|
||
|
||
# 点击输入框
|
||
logger.info(f"点击坐标: ({x}, {y})")
|
||
d.click(x, y)
|
||
time.sleep(0.5)
|
||
d.click(x, y) # Double click
|
||
|
||
# 等待键盘弹出
|
||
time.sleep(1.5)
|
||
|
||
# 2. 截图:点击输入框后
|
||
take_debug_screenshot(d, "coord_02_after_click_input_keyboard")
|
||
|
||
# 输入文本
|
||
logger.info(f"输入文本 (SendKeys): {text}")
|
||
try:
|
||
d.send_keys(text)
|
||
except Exception as sk_e:
|
||
logger.error(f"send_keys 失败: {sk_e}")
|
||
|
||
# 3. 截图:输入文本后
|
||
take_debug_screenshot(d, "coord_03_after_input_text")
|
||
|
||
time.sleep(0.5)
|
||
d.press("enter")
|
||
|
||
# 尝试查找发送按钮并点击
|
||
try:
|
||
if d(text="发送").exists:
|
||
d(text="发送").click()
|
||
logger.info("已点击 '发送' 按钮 (Native Text)")
|
||
take_debug_screenshot(d, "coord_04_after_click_send_native")
|
||
else:
|
||
logger.info("未找到 '发送' 文本控件,尝试图像识别...")
|
||
send_btn_coords = find_send_button(d)
|
||
if send_btn_coords:
|
||
sx, sy = send_btn_coords
|
||
d.click(sx, sy)
|
||
logger.info(f"已点击 '发送' 按钮 (Image Rec): {sx}, {sy}")
|
||
take_debug_screenshot(d, "coord_04_after_click_send_image")
|
||
else:
|
||
width, height = d.window_size()
|
||
fallback_x = int(width * 0.9)
|
||
fallback_y = int(height * 0.965)
|
||
logger.info(f"未识别到发送按钮,尝试盲点右下角: {fallback_x}, {fallback_y}")
|
||
d.click(fallback_x, fallback_y)
|
||
take_debug_screenshot(d, "coord_04_after_click_send_fallback")
|
||
except Exception as e:
|
||
logger.error(f"点击发送按钮失败: {e}")
|
||
|
||
logger.info("输入完成 (Coordinate)")
|
||
|
||
except Exception as e:
|
||
logger.error(f"自动化操作失败: {e}")
|
||
|
||
def analyze_chat_image(image_path, output_path, target_name="对方"):
|
||
"""
|
||
识别微信聊天截图中的头像并画框,识别对话内容
|
||
"""
|
||
logger.info(f"正在分析图片: {image_path}")
|
||
|
||
# 读取图片(支持中文路径)
|
||
try:
|
||
img_data = np.fromfile(image_path, dtype=np.uint8)
|
||
img = cv2.imdecode(img_data, cv2.IMREAD_COLOR)
|
||
except Exception as e:
|
||
logger.error(f"读取图片失败: {e}")
|
||
return
|
||
|
||
if img is None:
|
||
logger.error("图片读取为空")
|
||
return
|
||
|
||
# 备份一份干净的图片用于 OCR (避免识别到画上去的框)
|
||
img_clean = img.copy()
|
||
|
||
height, width = img.shape[:2]
|
||
logger.info(f"图片尺寸: {width}x{height}")
|
||
|
||
# 调用输入框识别,获取坐标和可视化框
|
||
input_center, input_rect = find_input_box_center(image_path)
|
||
|
||
# 1. 预处理
|
||
# 转为灰度图
|
||
gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
|
||
|
||
# 使用自适应阈值二值化
|
||
thresh = cv2.adaptiveThreshold(gray, 255, cv2.ADAPTIVE_THRESH_GAUSSIAN_C,
|
||
cv2.THRESH_BINARY_INV, 11, 2)
|
||
|
||
# 形态学操作:闭运算,填充内部空洞
|
||
kernel = cv2.getStructuringElement(cv2.MORPH_RECT, (3, 3))
|
||
closed = cv2.morphologyEx(thresh, cv2.MORPH_CLOSE, kernel)
|
||
|
||
# 2. 轮廓查找
|
||
contours, _ = cv2.findContours(closed, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
|
||
logger.info(f"检测到轮廓数量: {len(contours)}")
|
||
|
||
# 收集所有符合条件的头像
|
||
avatars = []
|
||
|
||
# 3. 筛选轮廓
|
||
for contour in contours:
|
||
# 获取外接矩形
|
||
x, y, w, h = cv2.boundingRect(contour)
|
||
|
||
# 筛选条件优化:
|
||
# 1. 形状接近正方形 (放宽宽高比限制: 0.8 ~ 1.2)
|
||
aspect_ratio = float(w) / h
|
||
|
||
# 2. 尺寸适中
|
||
# 假设头像宽度在屏幕宽度的 6% 到 15% 之间
|
||
min_w = width * 0.06
|
||
max_w = width * 0.15
|
||
|
||
# 3. 位置筛选
|
||
# 排除底部输入框区域 (假设底部 10% 为输入区域)
|
||
if y > height * 0.9:
|
||
continue
|
||
|
||
# 左侧头像:靠左边 (x < width * 0.18)
|
||
# 右侧头像:靠右边 (x > width * 0.82)
|
||
is_left = x < width * 0.18
|
||
is_right = x > width * 0.82
|
||
|
||
if 0.8 <= aspect_ratio <= 1.2 and min_w < w < max_w:
|
||
if is_left or is_right:
|
||
side = "Left" if is_left else "Right"
|
||
avatars.append({
|
||
'x': x, 'y': y, 'w': w, 'h': h,
|
||
'side': side
|
||
})
|
||
|
||
# 按 y 坐标排序
|
||
avatars.sort(key=lambda a: a['y'])
|
||
|
||
logger.info(f"找到有效头像数量: {len(avatars)}")
|
||
|
||
# 初始化 OCR
|
||
try:
|
||
reader = get_easyocr_reader(gpu=True)
|
||
logger.info("OCR 初始化成功")
|
||
except Exception as e:
|
||
logger.error(f"OCR 初始化失败: {e}")
|
||
reader = None
|
||
|
||
dialogue_log = []
|
||
|
||
# 4. 绘制对话内容框 (Green/Red Boxes)
|
||
if avatars:
|
||
i = 0
|
||
while i < len(avatars):
|
||
current_group_start = i
|
||
current_side = avatars[i]['side']
|
||
|
||
# 找到当前组的结束位置 (即下一个不同侧头像的索引)
|
||
j = i + 1
|
||
while j < len(avatars) and avatars[j]['side'] == current_side:
|
||
j += 1
|
||
|
||
# Start Y: 当前组第一个头像的上方 (例如 -10px)
|
||
start_y = max(0, avatars[i]['y'] - 10)
|
||
|
||
# End Y
|
||
if j < len(avatars):
|
||
end_y = max(start_y + 10, avatars[j]['y'] - 30)
|
||
else:
|
||
# 最后一个框的底边,使用输入框的上沿
|
||
if input_rect:
|
||
_, input_y, _, _ = input_rect
|
||
end_y = max(start_y + 10, input_y - 10)
|
||
else:
|
||
end_y = int(height * 0.9) # 默认
|
||
|
||
# 绘制大框
|
||
# 左侧 (Left) -> 对方 -> 绿色 (0, 255, 0)
|
||
# 右侧 (Right) -> 我 -> 红色 (0, 0, 255)
|
||
box_color = (0, 255, 0) if current_side == "Left" else (0, 0, 255)
|
||
|
||
cv2.rectangle(img, (0, start_y), (width, end_y), box_color, 5)
|
||
|
||
logger.info(f"绘制内容框: 侧别={current_side}, 范围 Y={start_y} to {end_y}")
|
||
|
||
# OCR 识别区域文本
|
||
if reader:
|
||
try:
|
||
safe_start_y = max(0, start_y)
|
||
safe_end_y = min(height, end_y)
|
||
|
||
if safe_end_y > safe_start_y:
|
||
roi_img = img_clean[safe_start_y:safe_end_y, 0:width]
|
||
|
||
# 识别
|
||
results = reader.read_text(roi_img)
|
||
|
||
# 过滤关键词
|
||
ignore_keywords = ["点击查看对话内容", "以上是打招呼的消息", "和 Kimi 的对话", "Kim智能助手"]
|
||
|
||
texts = []
|
||
for res in results:
|
||
text = res[1]
|
||
prob = res[2]
|
||
if prob > 0.3:
|
||
# 1. 检查是否包含屏蔽词
|
||
if any(kw in text for kw in ignore_keywords):
|
||
continue
|
||
|
||
# 2. 检查是否为单行时间
|
||
if re.match(r'^\s*\d{1,2}:\d{2}\s*$', text):
|
||
continue
|
||
|
||
texts.append(text)
|
||
|
||
combined_text = " ".join(texts)
|
||
|
||
if combined_text.strip():
|
||
role = target_name if current_side == "Left" else "我"
|
||
dialogue_log.append(f"{role}: {combined_text}")
|
||
logger.info(f" -> OCR结果: {combined_text}")
|
||
except Exception as e:
|
||
logger.error(f" -> OCR出错: {e}")
|
||
|
||
# 移动到下一组
|
||
i = j
|
||
|
||
# 5. 绘制头像框 (Blue/Yellow Boxes) - 画在内容框之上
|
||
for av in avatars:
|
||
x, y, w, h = av['x'], av['y'], av['w'], av['h']
|
||
color = (255, 0, 0) if av['side'] == "Left" else (0, 255, 255)
|
||
|
||
cv2.rectangle(img, (x, y), (x + w, y + h), color, 10)
|
||
logger.info(f"绘制头像: 位置=({x},{y}), 侧别={av['side']}")
|
||
|
||
# 6. 保存结果
|
||
try:
|
||
# 如果有识别到输入框,画出来 (紫色)
|
||
if input_rect:
|
||
rx, ry, rw, rh = input_rect
|
||
cv2.rectangle(img, (rx, ry), (rx + rw, ry + rh), (255, 0, 255), 5)
|
||
# 画中心点
|
||
if input_center:
|
||
cx, cy = input_center
|
||
cv2.circle(img, (cx, cy), 10, (255, 0, 255), -1)
|
||
logger.info(f"已绘制输入框标记: {input_rect}")
|
||
|
||
# cv2.imwrite 不支持中文路径,使用 imencode + tofile
|
||
ext = os.path.splitext(output_path)[1]
|
||
cv2.imencode(ext, img)[1].tofile(output_path)
|
||
logger.info(f"✅ 分析结果已保存至: {output_path}")
|
||
except Exception as e:
|
||
logger.error(f"保存分析图片失败: {e}")
|
||
|
||
logger.info("\n" + "="*30)
|
||
logger.info("对话内容汇总:")
|
||
for line in dialogue_log:
|
||
logger.info(line)
|
||
logger.info("="*30 + "\n")
|
||
|
||
def main():
|
||
logger.info("开始执行微信搜索测试...")
|
||
|
||
# 连接设备
|
||
try:
|
||
d = u2.connect()
|
||
logger.info(f"设备连接成功: {d.info.get('serial')}")
|
||
except Exception as e:
|
||
logger.error(f"设备连接失败: {e}")
|
||
return
|
||
|
||
# 1. 启动微信
|
||
logger.info("步骤 1: 启动微信...")
|
||
d.app_start("com.tencent.mm", stop=True)
|
||
# 等待微信启动完成
|
||
time.sleep(5)
|
||
|
||
# 获取屏幕尺寸
|
||
w, h = d.window_size()
|
||
logger.info(f"屏幕尺寸: {w}x{h}")
|
||
|
||
# 2. 点击搜索按钮 (参考 Opener.py 的坐标比例: w * 0.84, h * 0.08)
|
||
search_x = int(w * 0.84)
|
||
search_y = int(h * 0.08)
|
||
logger.info(f"步骤 2: 点击搜索按钮 (坐标: {search_x}, {search_y})...")
|
||
d.click(search_x, search_y)
|
||
time.sleep(2)
|
||
|
||
# 3. 输入 "糖豆爸爸"
|
||
target_name = "糖豆爸爸"
|
||
logger.info(f"步骤 3: 输入搜索内容 '{target_name}'...")
|
||
|
||
try:
|
||
# 启用 FastInputIME 以支持中文输入
|
||
d.set_input_ime(True)
|
||
|
||
# 点击搜索框获取焦点 (参考 Opener.py: w * 0.4, h * 0.08)
|
||
d.click(int(w * 0.4), int(h * 0.08))
|
||
time.sleep(1)
|
||
|
||
# 输入文字
|
||
d.send_keys(target_name)
|
||
time.sleep(2)
|
||
|
||
# 恢复输入法
|
||
d.set_input_ime(False)
|
||
except Exception as e:
|
||
logger.error(f"输入文字失败: {e}")
|
||
try:
|
||
d(focused=True).set_text(target_name)
|
||
except:
|
||
pass
|
||
|
||
# 4. 点击搜索结果
|
||
logger.info("步骤 4: 查找并点击搜索结果...")
|
||
time.sleep(2)
|
||
|
||
found = False
|
||
|
||
# 策略 A: 精确匹配文本
|
||
if d(text=target_name).exists:
|
||
logger.info(f"找到文本为 '{target_name}' 的元素,点击...")
|
||
d(text=target_name).click()
|
||
found = True
|
||
else:
|
||
logger.warning(f"未找到文本为 '{target_name}' 的元素,尝试模糊匹配或坐标点击...")
|
||
|
||
# 策略 B: 坐标点击 (参考 Opener.py 点击第一个结果: w * 0.5, h * 0.18)
|
||
result_x = int(w * 0.5)
|
||
result_y = int(h * 0.18)
|
||
logger.info(f"尝试点击第一个搜索结果位置 ({result_x}, {result_y})...")
|
||
d.click(result_x, result_y)
|
||
found = True
|
||
|
||
if found:
|
||
logger.info("✅ 已执行点击操作,应该已进入对话框。")
|
||
|
||
# 5. 截图保存结果
|
||
logger.info("步骤 5: 截图并分析...")
|
||
# 等待界面加载稳定
|
||
time.sleep(3)
|
||
|
||
# 创建截图目录
|
||
screenshot_dir = os.path.join(os.path.dirname(os.path.abspath(__file__)), "Screenshots")
|
||
if not os.path.exists(screenshot_dir):
|
||
os.makedirs(screenshot_dir)
|
||
|
||
# 生成文件名
|
||
timestamp = time.strftime("%Y%m%d_%H%M%S")
|
||
filename = f"chat_result_{timestamp}.jpg"
|
||
save_path = os.path.join(screenshot_dir, filename)
|
||
|
||
try:
|
||
d.screenshot(save_path)
|
||
logger.info(f"✅ 原始截图已保存: {save_path}")
|
||
|
||
# 6. 分析截图并标记头像
|
||
logger.info("步骤 6: 自动标记头像和识别内容...")
|
||
analyzed_filename = f"chat_result_{timestamp}_analyzed.jpg"
|
||
analyzed_path = os.path.join(screenshot_dir, analyzed_filename)
|
||
|
||
analyze_chat_image(save_path, analyzed_path, target_name=target_name)
|
||
|
||
# 7. 查找输入框并执行自动化操作
|
||
logger.info("步骤 7: 自动回复...")
|
||
# 注意:analyze_chat_image 内部已经调用了 find_input_box_center 并且画在图上了
|
||
# 但我们需要返回值来执行操作。analyze_chat_image 并没有返回坐标。
|
||
# 为了简单,再次调用一次 (或者修改 analyze_chat_image 返回坐标,但改动较大)
|
||
# 这里直接再次调用 find_input_box_center 获取坐标
|
||
coords, _ = find_input_box_center(save_path)
|
||
|
||
if coords:
|
||
logger.info(f"输入框坐标: {coords}")
|
||
perform_input_action(coords, "AI助手我现在可以开始和你聊天了!")
|
||
else:
|
||
logger.warning("未找到输入框坐标,跳过回复")
|
||
|
||
except Exception as e:
|
||
logger.error(f"❌ 截图或分析失败: {e}")
|
||
|
||
else:
|
||
logger.error("❌ 未能定位到搜索结果,跳过截图。")
|
||
|
||
logger.info("测试结束。")
|
||
|
||
if __name__ == "__main__":
|
||
main()
|