添加视频切片功能

2026-01-09 21:40:03 +08:00
parent 408fcd3f1b
commit cad3a033a3
7 changed files with 156248 additions and 22 deletions
--- a/video_frame_utils.py
+++ b/video_frame_utils.py
@@ -0,0 +1,394 @@
+import os
+import sys
+import uuid
+import subprocess
+import tempfile
+import threading
+import time
+from datetime import datetime, timedelta
+import json
+import glob
+import requests
+import logging
+from shared_utils import task_registry, file_registry, file_lock, task_lock, add_task_log
+
+# ======================
+# 配置
+# ======================
+BASE_DIR = os.path.dirname(os.path.abspath(__file__))
+FRAMES_ROOT = os.path.abspath("./frames")
+TASK_TIMEOUT_HOURS = 1  # 任务过期时间（小时）
+
+# 确保frames目录存在
+os.makedirs(FRAMES_ROOT, exist_ok=True)
+
+if sys.platform.startswith('win'):
+    FFMPEG_PATH = os.path.join(BASE_DIR, 'lib', 'ffmpeg', 'bin', 'ffmpeg.exe')
+    FFPROBE_PATH = os.path.join(BASE_DIR, 'lib', 'ffmpeg', 'bin', 'ffprobe.exe')
+else:
+    FFMPEG_PATH = os.path.join(BASE_DIR, 'lib', 'ffmpeg', 'bin', 'ffmpeg')
+    FFPROBE_PATH = os.path.join(BASE_DIR, 'lib', 'ffmpeg', 'bin', 'ffprobe')
+
+def log_subprocess_output(pipe, task_id, task_registry, task_lock, prefix=""):
+    """从管道实时读取并记录日志"""
+    if not pipe:
+        return
+    try:
+        for line in iter(pipe.readline, ''):
+            if line:
+                clean_line = line.strip()
+                if clean_line and task_id and task_registry and task_lock:
+                    add_task_log(task_id, f"{prefix}{clean_line}", task_registry, task_lock)
+    except Exception as e:
+        if task_id and task_registry and task_lock:
+            add_task_log(task_id, f"[日志读取错误] {e}", task_registry, task_lock)
+    finally:
+        pipe.close()
+    
+# ======================
+# 任务处理函数
+# ======================
+
+def process_video_frame_extraction(data, file_registry, file_lock, task_id=None, task_registry=None, task_lock=None):
+    """处理视频帧提取任务"""
+    try:
+        if task_id and task_registry and task_lock:
+            add_task_log(task_id, "开始处理视频帧提取任务", task_registry, task_lock)
+
+        logging.info(f"开始处理视频帧提取任务: {task_id}")
+
+        # 提取参数
+        video_url = data.get('video_url')
+        video_bv = data.get('video_bv')  # 支持BV号
+        w = data.get('w')
+        h = data.get('h')
+        fps = data.get('fps', 30)
+        force_resolution = data.get('force_resolution', False)
+        pad_to_target = data.get('pad_to_target', False)
+
+        # 验证参数
+        if not video_url and not video_bv:
+            raise Exception("缺少必要参数: video_url 或 video_bv")
+        if w is None or h is None:
+            raise Exception("缺少必要参数: w, h")
+
+        try:
+            w = int(w)
+            h = int(h)
+            fps = float(fps)
+            if w <= 0 or h <= 0 or fps <= 0:
+                raise ValueError("参数必须为正数")
+        except (ValueError, TypeError) as e:
+            raise Exception(f"参数无效: {str(e)}")
+
+        # 如果提供了BV号，自动生成Bilibili URL
+        if not video_url and video_bv:
+            video_bv = str(video_bv).strip()
+            if not video_bv.startswith(('BV', 'bv')):
+                raise Exception("video_bv 必须以 BV 或 bv 开头")
+            video_url = f"https://www.bilibili.com/video/{video_bv.upper()}"
+
+        # 准备目录
+        job_dir = os.path.join(FRAMES_ROOT, task_id)
+        os.makedirs(job_dir, exist_ok=True)
+
+        if task_id and task_registry and task_lock:
+            add_task_log(task_id, f"创建任务目录: {job_dir}", task_registry, task_lock)
+            with task_lock:
+                if task_id in task_registry:
+                    task_registry[task_id]['progress'] = 10
+
+        # 下载视频
+        temp_base = os.path.join(tempfile.gettempdir(), task_id)
+
+        # === 替换 yt-dlp 下载部分 ===
+        if task_id and task_registry and task_lock:
+            add_task_log(task_id, f"开始下载视频: {video_url}", task_registry, task_lock)
+
+        yt_dlp_cmd = [
+            sys.executable, '-m', 'yt_dlp',
+            video_url,
+            '-o', temp_base,
+            '-f', 'bv*[height<=720]+ba/b',
+            '--no-warnings',
+            '--progress',  # 显式启用进度（可选）
+        ]
+
+        # 使用 Popen 实时捕获 stderr
+        proc = subprocess.Popen(
+            yt_dlp_cmd,
+            stdout=subprocess.PIPE,
+            stderr=subprocess.PIPE,
+            text=True,
+            bufsize=1,
+            universal_newlines=True
+        )
+
+        # 启动日志线程（只读 stderr，因为 yt-dlp 进度在 stderr）
+        stderr_thread = threading.Thread(
+            target=log_subprocess_output,
+            args=(proc.stderr, task_id, task_registry, task_lock, "[yt-dlp] "),
+            daemon=True
+        )
+        stderr_thread.start()
+
+        try:
+            proc.wait(timeout=600)
+            if proc.returncode != 0:
+                raise subprocess.CalledProcessError(proc.returncode, yt_dlp_cmd)
+        except subprocess.TimeoutExpired:
+            proc.kill()
+            raise Exception("yt-dlp 下载超时（超过10分钟）")
+        finally:
+            stderr_thread.join(timeout=5)  # 等待日志线程结束
+
+        # 查找实际生成的文件
+        candidates = glob.glob(temp_base + ".*")
+        if not candidates:
+            raise Exception("yt-dlp 执行成功但未生成任何视频文件")
+
+        # 按修改时间取最新
+        temp_video = max(candidates, key=os.path.getmtime)
+
+        if task_id and task_registry and task_lock:
+            add_task_log(task_id, "下载完成，开始获取视频信息", task_registry, task_lock)
+            with task_lock:
+                if task_id in task_registry:
+                    task_registry[task_id]['progress'] = 40
+
+        # 获取视频信息
+        duration = get_video_duration(temp_video)
+
+        # 构建滤镜
+        vf = build_video_filter(w, h, fps, force_resolution, pad_to_target)
+
+        # 提取帧
+        if task_id and task_registry and task_lock:
+            add_task_log(task_id, "开始提取视频帧", task_registry, task_lock)
+            with task_lock:
+                if task_id in task_registry:
+                    task_registry[task_id]['progress'] = 50
+
+        frame_pattern = os.path.join(job_dir, "frame_%06d.png")
+
+        ffmpeg_cmd = [
+            FFMPEG_PATH, '-y',
+            '-i', temp_video,
+            '-vf', vf,
+            '-pix_fmt', 'rgb24',
+            '-stats',          # 关键：启用进度统计
+            '-v', 'info',      # 确保输出级别足够
+            frame_pattern
+        ]
+
+        proc = subprocess.Popen(
+            ffmpeg_cmd,
+            stdout=subprocess.PIPE,
+            stderr=subprocess.PIPE,
+            text=True,
+            bufsize=1,
+            universal_newlines=True
+        )
+
+        # FFmpeg 的进度在 stderr
+        stderr_thread = threading.Thread(
+            target=log_subprocess_output,
+            args=(proc.stderr, task_id, task_registry, task_lock, "[FFmpeg] "),
+            daemon=True
+        )
+        stderr_thread.start()
+
+        try:
+            proc.wait()
+            if proc.returncode != 0:
+                raise subprocess.CalledProcessError(proc.returncode, ffmpeg_cmd)
+        finally:
+            stderr_thread.join(timeout=5)
+
+        # 获取输出分辨率
+        if task_id and task_registry and task_lock:
+            add_task_log(task_id, "分析输出结果", task_registry, task_lock)
+            with task_lock:
+                if task_id in task_registry:
+                    task_registry[task_id]['progress'] = 80
+
+        out_w, out_h = get_output_resolution(job_dir)
+        total_frames = len([f for f in os.listdir(job_dir) if f.endswith('.png')])
+
+        # 检查音频
+        audio_exists = has_audio(temp_video)
+
+        if audio_exists:
+            if task_id and task_registry and task_lock:
+                add_task_log(task_id, "提取音频（左/右/混合声道）", task_registry, task_lock)
+                with task_lock:
+                    if task_id in task_registry:
+                        task_registry[task_id]['progress'] = 90
+
+            # 公共参数
+            dfpwm_args = [
+                FFMPEG_PATH, '-y',
+                '-i', temp_video,
+                '-vn',
+                '-ar', '48000',
+                '-ac', '1',
+                '-f', 'dfpwm'
+            ]
+
+            # 混合声道
+            dfpwm_path_mix = os.path.join(job_dir, "audio.dfpwm")
+            subprocess.run(
+                dfpwm_args + [dfpwm_path_mix],
+                check=True, capture_output=True
+            )
+
+            # 左声道
+            dfpwm_path_left = os.path.join(job_dir, "audio_left.dfpwm")
+            subprocess.run(
+                dfpwm_args + ['-af', 'pan=mono|c0=c0'] + [dfpwm_path_left],
+                check=True, capture_output=True
+            )
+
+            # 右声道
+            dfpwm_path_right = os.path.join(job_dir, "audio_right.dfpwm")
+            subprocess.run(
+                dfpwm_args + ['-af', 'pan=mono|c0=c1'] + [dfpwm_path_right],
+                check=True, capture_output=True
+            )
+
+        # 生成结果
+        result_data = {
+            "duration_seconds": round(duration, 3),
+            "total_frames": total_frames,
+            "fps": fps,
+            "output_resolution": {"w": out_w, "h": out_h},
+            "frame_urls": [f"/frames/{task_id}/frame_{i:06d}.png" for i in range(1, total_frames + 1)],
+            "audio_dfpwm_url": f"/frames/{task_id}/audio.dfpwm" if has_audio else None,
+            "audio_dfpwm_left_url": f"/frames/{task_id}/audio_left.dfpwm" if has_audio else None,
+            "audio_dfpwm_right_url": f"/frames/{task_id}/audio_right.dfpwm" if has_audio else None
+        }
+
+        # 注册文件到文件注册表
+        with file_lock:
+            for frame_file in glob.glob(os.path.join(job_dir, "frame_*.png")):
+                filename = os.path.basename(frame_file)
+                file_id = f"frame_{task_id}_{filename}"
+                file_registry[file_id] = {
+                    'path': os.path.abspath(frame_file),
+                    'filename': filename,
+                    'last_access': time.time(),
+                    'download_count': 0
+                }
+
+            if audio_exists:
+                for audio_file in ["audio.dfpwm", "audio_left.dfpwm", "audio_right.dfpwm"]:
+                    audio_path = os.path.join(job_dir, audio_file)
+                    if os.path.exists(audio_path):
+                        file_id = f"audio_{task_id}_{audio_file}"
+                        file_registry[file_id] = {
+                            'path': os.path.abspath(audio_path),
+                            'filename': audio_file,
+                            'last_access': time.time(),
+                            'download_count': 0
+                        }
+
+        if task_id and task_registry and task_lock:
+            add_task_log(task_id, "视频帧提取任务完成", task_registry, task_lock)
+            with task_lock:
+                if task_id in task_registry:
+                    task_registry[task_id]['progress'] = 100
+
+        return {
+            'status': 'success',
+            'result': result_data,
+            'task_id': task_id,
+            'temp_dir': job_dir
+        }
+
+    except subprocess.CalledProcessError as e:
+        stderr_str = e.stderr.strip() if e.stderr else ""
+        stdout_str = e.stdout.strip() if e.stdout else ""
+        error_output = stderr_str or stdout_str or str(e)
+        error_msg = error_output[-500:] if len(error_output) > 500 else error_output
+
+        if task_id and task_registry and task_lock:
+            add_task_log(task_id, f"FFmpeg处理失败: {error_msg}", task_registry, task_lock)
+
+        return {'error': f'FFmpeg处理失败: {error_msg}'}
+    except requests.RequestException as e:
+        error_msg = f'视频下载失败: {str(e)}'
+        if task_id and task_registry and task_lock:
+            add_task_log(task_id, error_msg, task_registry, task_lock)
+        return {'error': error_msg}
+    except Exception as e:
+        error_msg = f'处理失败: {str(e)}'
+        if task_id and task_registry and task_lock:
+            add_task_log(task_id, error_msg, task_registry, task_lock)
+        return {'error': error_msg}
+    finally:
+        # 清理临时视频文件
+        for f in glob.glob(os.path.join(tempfile.gettempdir(), f"{task_id}.*")):
+            try:
+                os.remove(f)
+            except:
+                pass
+
+# ======================
+# 辅助函数
+# ======================
+
+def get_video_duration(video_path):
+    """获取视频时长"""
+    result = subprocess.run([
+        FFPROBE_PATH, '-v', 'error',
+        '-show_entries', 'format=duration',
+        '-of', 'csv=p=0',
+        video_path
+    ], capture_output=True, text=True, check=True)
+
+    duration_str = result.stdout.strip()
+    return float(duration_str) if duration_str and duration_str != 'N/A' else 0.0
+
+def build_video_filter(w, h, fps, force_resolution, pad_to_target):
+    """构建视频滤镜"""
+    if force_resolution:
+        return f"scale={w}:{h},fps={fps}"
+    else:
+        scale_expr = f"scale='min({w},iw*min(1,{h}/ih))':'min({h},ih*min(1,{w}/iw))'"
+        if pad_to_target:
+            return f"{scale_expr},pad={w}:{h}:(ow-iw)/2:(oh-ih)/2,fps={fps}"
+        else:
+            return f"{scale_expr},fps={fps}"
+
+def get_output_resolution(job_dir):
+    """获取输出分辨率"""
+    first_frame = None
+    for f in sorted(os.listdir(job_dir)):
+        if f.endswith('.png'):
+            first_frame = os.path.join(job_dir, f)
+            break
+
+    if first_frame:
+        probe_res = subprocess.run([
+            FFPROBE_PATH, '-v', 'error',
+            '-select_streams', 'v:0',
+            '-show_entries', 'stream=width,height',
+            '-of', 'csv=p=0',
+            first_frame
+        ], capture_output=True, text=True, check=True)
+
+        out_w, out_h = map(int, probe_res.stdout.strip().split(','))
+        return out_w, out_h
+
+    return 0, 0
+
+def has_audio(video_path):
+    """检查视频是否有音频"""
+    probe_streams = subprocess.run([
+        FFPROBE_PATH, '-v', 'error',
+        '-show_entries', 'stream=codec_type',
+        '-of', 'csv=p=0',
+        video_path
+    ], capture_output=True, text=True)
+
+    return 'audio' in probe_streams.stdout.lower()