feat(video): 集成可灵AI多图参考生视频生成服务
- 替换视频生成服务为可灵AI多图参考生视频API,支持1-4张多视角图片输入 - 调整图片拼接逻辑,生成横向长图传入即梦API备用 - 实现基于JWT认证的可灵API请求和轮询机制,支持高品质1:1正方形视频生成 - 在设计详情页新增视频展示区域及生成、重新生成和下载视频操作 - 更新后台系统配置,支持配置可灵AI Access Key和Secret Key - 删除即梦视频相关配置及逻辑,所有视频生成功能切换到可灵AI实现 - 优化视频生成提示词,提升视频质感和展示效果 - 增加视频文件本地存储和路径管理,保证视频可访问和下载 - 前端增加视频生成状态管理和用户界面交互提示 - 后端添加PyJWT依赖,支持JWT认证流程
This commit is contained in:
276
backend/app/services/ai_video_generator_kling.py
Normal file
276
backend/app/services/ai_video_generator_kling.py
Normal file
@@ -0,0 +1,276 @@
|
||||
"""
|
||||
AI 视频生成服务 - 可灵(Kling)多图参考生视频
|
||||
使用可灵 AI 的多图参考生视频 API,原生支持传入 1-4 张参考图片
|
||||
AI 会理解为同一物体的多角度参考,生成单品旋转展示视频
|
||||
|
||||
API 文档: https://app.klingai.com/cn/dev/document-api/apiReference/model/multiImageToVideo
|
||||
认证方式: JWT (Access Key + Secret Key)
|
||||
API 端点: https://api.klingai.com
|
||||
"""
|
||||
import asyncio
|
||||
import json
|
||||
import logging
|
||||
import time
|
||||
import uuid
|
||||
from pathlib import Path
|
||||
from typing import Optional, List
|
||||
|
||||
import httpx
|
||||
import jwt
|
||||
|
||||
from .config_service import get_config_value
|
||||
|
||||
# 视频本地存储目录
|
||||
VIDEO_UPLOAD_DIR = Path(__file__).resolve().parent.parent.parent / "uploads" / "videos"
|
||||
VIDEO_UPLOAD_DIR.mkdir(parents=True, exist_ok=True)
|
||||
|
||||
logger = logging.getLogger(__name__)
|
||||
|
||||
# 可灵 API 配置(中国区域名)
|
||||
KLING_API_BASE = "https://api-beijing.klingai.com"
|
||||
|
||||
# 超时与轮询配置
|
||||
SUBMIT_TIMEOUT = 30
|
||||
POLL_TIMEOUT = 15
|
||||
MAX_POLL_ATTEMPTS = 120 # 约 10 分钟
|
||||
POLL_INTERVAL = 5
|
||||
|
||||
|
||||
# ============================================================
|
||||
# JWT 认证
|
||||
# ============================================================
|
||||
|
||||
def _generate_jwt_token(access_key: str, secret_key: str) -> str:
|
||||
"""
|
||||
使用 Access Key 和 Secret Key 生成 JWT Token
|
||||
可灵 API 使用 JWT 认证,token 有效期 30 分钟
|
||||
"""
|
||||
now = int(time.time())
|
||||
headers = {
|
||||
"alg": "HS256",
|
||||
"typ": "JWT"
|
||||
}
|
||||
payload = {
|
||||
"iss": access_key,
|
||||
"exp": now + 1800, # 30 分钟过期
|
||||
"nbf": now - 5, # 允许 5 秒时钟偏差
|
||||
"iat": now, # 签发时间
|
||||
}
|
||||
token = jwt.encode(payload, secret_key, algorithm="HS256", headers=headers)
|
||||
return token
|
||||
|
||||
|
||||
def _get_kling_keys() -> tuple:
|
||||
"""获取可灵 Access Key 和 Secret Key"""
|
||||
access_key = get_config_value("KLING_ACCESS_KEY", "")
|
||||
secret_key = get_config_value("KLING_SECRET_KEY", "")
|
||||
if not access_key or not secret_key:
|
||||
raise RuntimeError(
|
||||
"未配置 KLING_ACCESS_KEY 或 KLING_SECRET_KEY,无法使用可灵视频生成。"
|
||||
"请在管理后台 系统配置 中添加可灵 AI 的 Access Key 和 Secret Key。"
|
||||
)
|
||||
return access_key, secret_key
|
||||
|
||||
|
||||
def _build_headers(access_key: str, secret_key: str) -> dict:
|
||||
"""构建带 JWT 认证的请求头"""
|
||||
token = _generate_jwt_token(access_key, secret_key)
|
||||
return {
|
||||
"Content-Type": "application/json",
|
||||
"Authorization": f"Bearer {token}",
|
||||
}
|
||||
|
||||
|
||||
# ============================================================
|
||||
# 视频生成核心逻辑
|
||||
# ============================================================
|
||||
|
||||
async def generate_video(
|
||||
image_urls: List[str],
|
||||
prompt: str = "",
|
||||
duration_seconds: int = 5,
|
||||
) -> str:
|
||||
"""
|
||||
调用可灵多图参考生视频 API,生成 360 度旋转展示视频
|
||||
|
||||
核心优势:原生支持传入多张参考图(1-4张),
|
||||
AI 理解为同一物体的多角度参考,生成单品视频。
|
||||
|
||||
Args:
|
||||
image_urls: 多视角图片 URL 列表(最多4张)
|
||||
prompt: 视频生成提示词
|
||||
duration_seconds: 视频时长(5 或 10 秒)
|
||||
|
||||
Returns:
|
||||
生成的视频本地 URL
|
||||
"""
|
||||
access_key, secret_key = _get_kling_keys()
|
||||
|
||||
logger.info(f"可灵视频生成,传入图片数量: {len(image_urls)}")
|
||||
|
||||
# 可灵最多支持 4 张参考图
|
||||
if len(image_urls) > 4:
|
||||
image_urls = image_urls[:4]
|
||||
logger.info("图片数量超过4张,截取前4张")
|
||||
|
||||
# 构建提示词
|
||||
if not prompt:
|
||||
prompt = get_config_value("VIDEO_PROMPT", "")
|
||||
if not prompt:
|
||||
prompt = (
|
||||
"精美玉雕工艺品在专业珠宝摄影棚内展示,"
|
||||
"纯白色背景,柔和的珠宝摄影灯光,"
|
||||
"玉石作品放在旋转展台上缓慢平稳地旋转360度,"
|
||||
"展示正面、侧面、背面全貌,"
|
||||
"展现玉石温润的质感、细腻的雕刻纹理和通透的光泽,"
|
||||
"电影级画质,微距细节感,平稳流畅的转台旋转"
|
||||
)
|
||||
|
||||
# 视频时长,仅支持 5 或 10
|
||||
duration = str(duration_seconds) if duration_seconds in (5, 10) else "5"
|
||||
|
||||
# Step 1: 提交任务
|
||||
task_id = await _submit_video_task(
|
||||
access_key, secret_key, image_urls, prompt, duration
|
||||
)
|
||||
logger.info(f"可灵视频生成任务已提交: task_id={task_id}")
|
||||
|
||||
# Step 2: 轮询等待结果
|
||||
remote_video_url = await _poll_video_result(access_key, secret_key, task_id)
|
||||
logger.info(f"可灵视频生成完成: {remote_video_url[:80]}...")
|
||||
|
||||
# Step 3: 下载视频到本地存储
|
||||
local_path = await _download_video_to_local(remote_video_url)
|
||||
logger.info(f"视频已保存到本地: {local_path}")
|
||||
|
||||
return local_path
|
||||
|
||||
|
||||
async def _submit_video_task(
|
||||
access_key: str,
|
||||
secret_key: str,
|
||||
image_urls: List[str],
|
||||
prompt: str,
|
||||
duration: str = "5",
|
||||
) -> str:
|
||||
"""提交多图参考生视频任务到可灵 API"""
|
||||
url = f"{KLING_API_BASE}/v1/videos/multi-image2video"
|
||||
|
||||
# 构建 image_list(每个元素是 {"image": "url"})
|
||||
image_list = [{"image": img_url} for img_url in image_urls]
|
||||
|
||||
payload = {
|
||||
"model_name": "kling-v1-6",
|
||||
"image_list": image_list,
|
||||
"prompt": prompt,
|
||||
"mode": "pro", # 高品质模式
|
||||
"duration": duration, # 视频时长
|
||||
"aspect_ratio": "1:1", # 1:1 正方形
|
||||
}
|
||||
|
||||
headers = _build_headers(access_key, secret_key)
|
||||
body = json.dumps(payload, ensure_ascii=False)
|
||||
|
||||
logger.info(f"提交可灵视频任务: {len(image_urls)}张参考图, 时长={duration}s, 模式=pro")
|
||||
|
||||
async with httpx.AsyncClient(timeout=SUBMIT_TIMEOUT) as client:
|
||||
resp = await client.post(url, content=body, headers=headers)
|
||||
if resp.status_code not in (200, 201):
|
||||
error_body = resp.text[:1000]
|
||||
logger.error(f"可灵视频任务提交失败: status={resp.status_code}, body={error_body}")
|
||||
resp.raise_for_status()
|
||||
data = resp.json()
|
||||
|
||||
# 检查响应
|
||||
code = data.get("code", -1)
|
||||
if code != 0:
|
||||
msg = data.get("message", "未知错误")
|
||||
raise RuntimeError(f"可灵视频任务提交失败 (code={code}): {msg}")
|
||||
|
||||
task_id = data.get("data", {}).get("task_id")
|
||||
if not task_id:
|
||||
raise RuntimeError(f"可灵响应中未找到 task_id: {data}")
|
||||
|
||||
return task_id
|
||||
|
||||
|
||||
async def _poll_video_result(
|
||||
access_key: str,
|
||||
secret_key: str,
|
||||
task_id: str,
|
||||
) -> str:
|
||||
"""轮询可灵视频生成结果"""
|
||||
url = f"{KLING_API_BASE}/v1/videos/multi-image2video/{task_id}"
|
||||
|
||||
for attempt in range(1, MAX_POLL_ATTEMPTS + 1):
|
||||
await asyncio.sleep(POLL_INTERVAL)
|
||||
|
||||
# 每次轮询重新生成 JWT(避免过期)
|
||||
headers = _build_headers(access_key, secret_key)
|
||||
|
||||
try:
|
||||
async with httpx.AsyncClient(timeout=POLL_TIMEOUT) as client:
|
||||
resp = await client.get(url, headers=headers)
|
||||
if resp.status_code != 200:
|
||||
logger.warning(
|
||||
f"轮询可灵视频结果失败 (attempt={attempt}): "
|
||||
f"status={resp.status_code}, body={resp.text[:300]}"
|
||||
)
|
||||
continue
|
||||
data = resp.json()
|
||||
except Exception as e:
|
||||
logger.warning(f"轮询可灵视频异常 (attempt={attempt}): {e}")
|
||||
continue
|
||||
|
||||
code = data.get("code", -1)
|
||||
if code != 0:
|
||||
msg = data.get("message", "未知错误")
|
||||
logger.warning(f"轮询可灵视频返回错误 (attempt={attempt}): code={code}, msg={msg}")
|
||||
continue
|
||||
|
||||
task_data = data.get("data", {})
|
||||
task_status = task_data.get("task_status", "")
|
||||
|
||||
if task_status == "succeed":
|
||||
# 从 task_result.videos 中提取视频 URL
|
||||
task_result = task_data.get("task_result", {})
|
||||
videos = task_result.get("videos", [])
|
||||
if videos and videos[0].get("url"):
|
||||
return videos[0]["url"]
|
||||
raise RuntimeError(f"可灵视频生成完成但未找到视频URL: {data}")
|
||||
|
||||
elif task_status == "failed":
|
||||
fail_msg = task_data.get("task_status_msg", "未知原因")
|
||||
raise RuntimeError(f"可灵视频生成失败: {fail_msg}")
|
||||
|
||||
else:
|
||||
# submitted / processing
|
||||
if attempt % 6 == 0:
|
||||
logger.info(
|
||||
f"可灵视频生成中... (attempt={attempt}, status={task_status})"
|
||||
)
|
||||
|
||||
raise RuntimeError(f"可灵视频生成超时: 轮询 {MAX_POLL_ATTEMPTS} 次后仍未完成")
|
||||
|
||||
|
||||
async def _download_video_to_local(remote_url: str) -> str:
|
||||
"""
|
||||
下载远程视频到本地 uploads/videos/ 目录
|
||||
|
||||
Returns:
|
||||
本地视频的 URL 路径,如 /uploads/videos/xxx.mp4
|
||||
"""
|
||||
filename = f"{uuid.uuid4().hex}.mp4"
|
||||
local_file = VIDEO_UPLOAD_DIR / filename
|
||||
|
||||
try:
|
||||
async with httpx.AsyncClient(timeout=120, follow_redirects=True) as client:
|
||||
resp = await client.get(remote_url)
|
||||
resp.raise_for_status()
|
||||
local_file.write_bytes(resp.content)
|
||||
logger.info(f"视频下载完成: {len(resp.content)} 字节 -> {local_file}")
|
||||
except Exception as e:
|
||||
logger.error(f"视频下载失败: {e}")
|
||||
raise RuntimeError(f"视频下载失败: {e}")
|
||||
|
||||
return f"/uploads/videos/{filename}"
|
||||
Reference in New Issue
Block a user