优化首帧功能，如果没传入首帧，则提取首帧。

2025-05-29 16:36:51 +08:00
parent a01b9e444e
commit 31c062fa70
2 changed files with 56 additions and 3 deletions
--- a/utils/video_utils.py
+++ b/utils/video_utils.py
@@ -0,0 +1,48 @@
+import os
+
+import cv2
+
+from loguru import logger
+
+
+def _get_first_frame(video_path, output_path):
+    """
+    提取视频的第一帧并保存为图片
+    :param video_path: 视频文件路径
+    :param output_path: 输出图片路径
+    :return: 输出图片的绝对路径，如果失败则返回None
+    """
+    cap = None
+    try:
+        logger.info(f"开始提取视频首帧: {video_path}")
+        # 打开视频文件
+        cap = cv2.VideoCapture(video_path)
+        if not cap.isOpened():
+            logger.error(f"无法打开视频: {video_path}")
+            return None
+
+        # 读取首帧
+        ret, frame = cap.read()
+        if not ret:
+            logger.error("无法读取视频帧")
+            cap.release()
+            return None
+
+        # 保存首帧为图片
+        try:
+            cv2.imwrite(output_path, frame)
+            logger.info(f"首帧已保存为: {output_path}")
+        except Exception as e:
+            logger.error(f"保存首帧图片失败: {e}")
+            cap.release()
+            return None
+
+        # 释放资源
+        cap.release()
+        return os.path.abspath(output_path)
+
+    except Exception as e:
+        logger.error(f"提取视频首帧时出错: {e}")
+        return None
+    finally:
+        cap.release()
--- a/wechat_ipad/client/message.py
+++ b/wechat_ipad/client/message.py
@@ -1,6 +1,7 @@
 import asyncio
 import base64
 import os
+import time
 from asyncio import Future
 from asyncio import Queue, sleep
 from io import BytesIO
@@ -14,6 +15,7 @@ from pymediainfo import MediaInfo
 import pysilk
 from pydub import AudioSegment

+from utils.video_utils import _get_first_frame
 from wechat_ipad import UserLoggedOut
 from wechat_ipad.client.base import WechatAPIClientBase

@@ -214,8 +216,7 @@ class MessageMixin(WechatAPIClientBase):
                    ValueError: 视频或图片参数都为空或都不为空时
                    根据error_handler处理错误
                """
-        if not image:
-            image = Path(os.path.join(Path(__file__).resolve().parent, "fallback.png"))
+
        # get video base64 and duration
        if isinstance(video, str):
            vid_base64 = video
@@ -235,6 +236,9 @@ class MessageMixin(WechatAPIClientBase):
            file_len = len(video_bytes)
            vid_base64 = base64.b64encode(video_bytes).decode()
            media_info = MediaInfo.parse(video_path)
+            first_frame = _get_first_frame(video_path, f"dify_frame_{int(time.time())}.jpg")
+            if first_frame:
+                image = first_frame
        else:
            raise ValueError("video should be str, bytes, or path")
            # 获取视频时长
@@ -246,7 +250,8 @@ class MessageMixin(WechatAPIClientBase):
        if duration is None:
            duration = 1
            self.logging.error(f"无法从视频文件获取时长: {video}")
-
+        if not image:
+            image = Path(os.path.join(Path(__file__).resolve().parent, "fallback.png"))
        # get image base64
        if isinstance(image, str):
            image_base64 = image