feat(api): enhance task file management and download endpoints

- Update `/tasks/{task_id}/outputs` to include inference configuration details
- Replace `/tasks/{task_id}/outputs/{filename}` with `/tasks/{task_id}/outputs/{file_type}/{filename}` for flexible file downloads
- Support downloading inference outputs, reference audio, and model files
- Add `FileType` validation on the download endpoint and path resolution/existence checks in `TaskService`
- Implement `download_file` method to handle various file types securely

Files changed (2) hide show

api_server/app/api/v1/endpoints/tasks.py +43 -18
api_server/app/services/task_service.py +62 -0

api_server/app/api/v1/endpoints/tasks.py CHANGED Viewed

@@ -10,13 +10,13 @@ API 列表:
 - DELETE /tasks/{task_id}    取消任务
 - GET    /tasks/{task_id}/progress  SSE 进度订阅
 - GET    /tasks/{task_id}/outputs   获取推理输出列表
-- GET    /tasks/{task_id}/outputs/{filename}  下载推理输出文件
 """
 import json
-from typing import Optional
-from fastapi import APIRouter, Depends, HTTPException, Query
 from fastapi.responses import StreamingResponse, Response
 from ....models.schemas.task import (
@@ -238,18 +238,28 @@ async def subscribe_progress(
     response_model=InferenceOutputsResponse,
     summary="获取推理输出列表",
     description="""
-获取任务的推理输出文件列表。
 训练任务完成后，推理阶段会生成测试音频文件。此端点返回所有生成的音频文件元信息，
-包括文件名、使用的模型、文件大小等。
-**返回信息**:
 - `filename`: 文件名
 - `gpt_model`: 使用的 GPT 模型名称
 - `sovits_model`: 使用的 SoVITS 模型名称
-- `file_path`: 文件相对路径
 - `size_bytes`: 文件大小（字节）
 - `created_at`: 创建时间
 """,
     responses={
         200: {"model": InferenceOutputsResponse, "description": "推理输出列表"},
@@ -269,32 +279,47 @@ async def get_task_outputs(
     return result
 @router.get(
-    "/{task_id}/outputs/{filename}",
-    summary="下载推理输出文件",
     description="""
-下载指定的推理输出音频文件。
-文件名可从 `/tasks/{task_id}/outputs` 端点获取。
 **返回**:
-- Content-Type: audio/wav
-- 音频文件二进制数据
 """,
     responses={
-        200: {"description": "音频文件", "content": {"audio/wav": {}}},
         404: {"model": ErrorResponse, "description": "任务或文件不存在"},
     },
 )
-async def download_task_output(
     task_id: str,
-    filename: str,
     service: TaskService = Depends(get_task_service),
 ) -> Response:
     """
-    下载指定的推理输出文件
     """
-    result = await service.download_inference_output(task_id, filename)
     if result is None:
         raise HTTPException(status_code=404, detail="任务或文件不存在")

 - DELETE /tasks/{task_id}    取消任务
 - GET    /tasks/{task_id}/progress  SSE 进度订阅
 - GET    /tasks/{task_id}/outputs   获取推理输出列表
+- GET    /tasks/{task_id}/outputs/{file_type}/{filename}  下载任务相关文件
 """
 import json
+from typing import Literal, Optional
+from fastapi import APIRouter, Depends, HTTPException, Path, Query
 from fastapi.responses import StreamingResponse, Response
 from ....models.schemas.task import (
     response_model=InferenceOutputsResponse,
     summary="获取推理输出列表",
     description="""
+获取任务的推理输出文件列表及推理配置信息。
 训练任务完成后，推理阶段会生成测试音频文件。此端点返回所有生成的音频文件元信息，
+包括文件名、使用的模型路径、文件大小等，以及推理使用的参考音频和文本信息。
+**推理配置**:
+- `ref_text`: 参考音频的文本内容
+- `ref_audio_path`: 参考音频文件路径
+- `target_text`: 合成的目标文本
+**输出文件信息**:
 - `filename`: 文件名
 - `gpt_model`: 使用的 GPT 模型名称
 - `sovits_model`: 使用的 SoVITS 模型名称
+- `gpt_path`: GPT 模型完整路径
+- `sovits_path`: SoVITS 模型完整路径
+- `file_path`: 输出文件相对路径
 - `size_bytes`: 文件大小（字节）
 - `created_at`: 创建时间
+**下载文件**:
+使用 `/tasks/{task_id}/outputs/{file_type}/{filename}` 端点下载相关文件。
 """,
     responses={
         200: {"model": InferenceOutputsResponse, "description": "推理输出列表"},
     return result
+# Allowed values for the `file_type` path parameter of the file download endpoint
+FileType = Literal["output", "ref_audio", "gpt_model", "sovits_model"]
 @router.get(
+    "/{task_id}/outputs/{file_type}/{filename:path}",
+    summary="下载任务相关文件",
     description="""
+下载任务相关的各类文件。
+**文件类型 (file_type)**:
+- `output` - 推理输出音频文件 (.wav)
+- `ref_audio` - 参考音频文件 (.wav)
+- `gpt_model` - GPT 模型文件 (.ckpt)
+- `sovits_model` - SoVITS 模型文件 (.pth)
+**文件名来源**:
+- `output`: 从 `/tasks/{task_id}/outputs` 端点的 `outputs[].filename` 获取
+- `ref_audio`: 从 `/tasks/{task_id}/outputs` 端点的 `ref_audio_path` 获取
+- `gpt_model`: 从 `/tasks/{task_id}/outputs` 端点的 `outputs[].gpt_path` 获取文件名部分
+- `sovits_model`: 从 `/tasks/{task_id}/outputs` 端点的 `outputs[].sovits_path` 获取文件名部分
 **返回**:
+- 音频文件: Content-Type: audio/wav
+- 模型文件: Content-Type: application/octet-stream
 """,
     responses={
+        200: {"description": "文件内容"},
         404: {"model": ErrorResponse, "description": "任务或文件不存在"},
     },
 )
+async def download_task_file(
     task_id: str,
+    file_type: FileType = Path(..., description="文件类型: output/ref_audio/gpt_model/sovits_model"),
+    filename: str = Path(..., description="文件名或路径"),
     service: TaskService = Depends(get_task_service),
 ) -> Response:
     """
+    下载任务相关文件（推理输出、参考音频、模型文件）
     """
+    result = await service.download_file(task_id, file_type, filename)
     if result is None:
         raise HTTPException(status_code=404, detail="任务或文件不存在")

api_server/app/services/task_service.py CHANGED Viewed

@@ -447,6 +447,68 @@ class TaskService:
         return file_data, filename, "audio/wav"
     def _parse_inference_filename(self, filename: str, exp_name: str) -> Tuple[str, str]:
         """
         解析推理输出文件名，提取 GPT 和 SoVITS 模型名称

         return file_data, filename, "audio/wav"
+    async def download_file(
+        self,
+        task_id: str,
+        file_type: str,
+        filename: str
+    ) -> Optional[Tuple[bytes, str, str]]:
+        """
+        下载指定类型的文件
+        Args:
+            task_id: 任务 ID
+            file_type: 文件类型 (output/ref_audio/gpt_model/sovits_model)
+            filename: 文件名
+        Returns:
+            (文件内容, 文件名, content_type) 或 None（不存在时）
+        """
+        # 获取任务
+        task = await self.db.get_task(task_id)
+        if not task:
+            return None
+        exp_name = task.exp_name
+        version = task.config.get("version", "v2")
+        # 根据文件类型确定路径和 content_type
+        if file_type == "output":
+            file_path = Path(settings.EXP_ROOT) / exp_name / "inference" / filename
+            content_type = "audio/wav"
+        elif file_type == "ref_audio":
+            # ref_audio 使用完整路径（filename 参数实际上是完整路径）
+            file_path = Path(filename)
+            content_type = "audio/wav"
+        elif file_type == "gpt_model":
+            gpt_dir = self._get_gpt_weight_dir(version)
+            file_path = Path(settings.EXP_ROOT) / exp_name / gpt_dir / filename
+            content_type = "application/octet-stream"
+        elif file_type == "sovits_model":
+            sovits_dir = self._get_sovits_weight_dir(version)
+            file_path = Path(settings.EXP_ROOT) / exp_name / sovits_dir / filename
+            content_type = "application/octet-stream"
+        else:
+            return None
+        # 安全检查：确保文件路径有效
+        try:
+            file_path = file_path.resolve()
+        except (ValueError, OSError):
+            return None
+        if not file_path.exists() or not file_path.is_file():
+            return None
+        # 读取文件内容
+        with open(file_path, "rb") as f:
+            file_data = f.read()
+        # 使用文件名（不含路径）作为下载文件名
+        download_filename = file_path.name
+        return file_data, download_filename, content_type
     def _parse_inference_filename(self, filename: str, exp_name: str) -> Tuple[str, str]:
         """
         解析推理输出文件名，提取 GPT 和 SoVITS 模型名称