{"id":204,"date":"2025-04-18T11:08:38","date_gmt":"2025-04-18T03:08:38","guid":{"rendered":"https:\/\/knoka.vip\/?p=204"},"modified":"2025-05-22T12:58:42","modified_gmt":"2025-05-22T04:58:42","slug":"%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b","status":"publish","type":"post","link":"https:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/","title":{"rendered":"\u4e00\u6587\u5feb\u901f\u5b66\u4f1aFastAPI\u90e8\u7f72Step-Audio-TTS-3B\u6a21\u578b"},"content":{"rendered":"\n<h2 class=\"wp-block-heading\">\u73af\u5883\u51c6\u5907<\/h2>\n\n\n\n<p>\u9996\u5148\u51c6\u5907\u4e00\u53f0\u663e\u5b58\uff1e=12G\u7684\u670d\u52a1\u5668\uff0c\u6211\u8fd9\u91cc\u9009\u7528\u7684\u662f4090 24G\u4e91\u670d\u52a1\u5668<\/p>\n\n\n\n<p>\u63a5\u7740\u5148\u62c9\u53d6\u5b98\u65b9\u4ee3\u7801\uff0c\u7136\u540e\u521b\u5efa\u4e00\u4e2a\u865a\u62df\u73af\u5883\uff0c\u518d\u5b89\u88c5\u5176\u5bf9\u5e94\u7684\u4f9d\u8d56\u5e93<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>git clone https:\/\/github.com\/stepfun-ai\/Step-Audio.git\nconda create -n stepaudio python=3.10\nconda activate stepaudio\ncd Step-Audio\npip install -r requirements.txt\npip install fastapi\npip install loguru\npip install aiohttp<\/code><\/pre>\n\n\n\n<p>\u63a5\u7740\u4e0b\u8f7d\u90e8\u7f72\u6240\u9700\u7684\u6a21\u578b\uff0c\u7531\u4e8e\u6211\u4eec\u4ec5\u4e3a\u90e8\u7f72Step-Audio-TTS-3B\u6a21\u578b\uff0c\u6240\u4ee5\u5e76\u4e0d\u9700\u8981\u5168\u90e8\u4e0b\u8f7d\u6240\u6709\u6a21\u578b\uff0c\u4ec5\u9700\u4e0b\u8f7dStep-Audio-Tokenizer\u548cStep-Audio-TTS-3B\u6a21\u578b\u5373\u53ef\u3002<\/p>\n\n\n\n<p>\u6a21\u578b\u4e0b\u8f7d\u4e0a\uff0c\u6211\u4eec\u53ef\u4ee5\u4eceModelScope\u4e0a\u4ec5\u9700\u4e0b\u8f7d\uff0c\u9996\u5148\u9700\u8981\u5b89\u88c5\u4e00\u4e0b\u5176\u4e0b\u8f7d\u5668\uff0c\u7136\u540e\u524d\u5f80\u5bf9\u5e94\u6a21\u578b\u9875\uff0c\u5373\u53ef\u590d\u5236\u5e76\u4e0b\u8f7d\u3002<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>pip install modelscope\nmodelscope download --model stepfun-ai\/Step-Audio-TTS-3B --local_dir .\/model\/Step-Audio-TTS-3B\nmodelscope download --model stepfun-ai\/Step-Audio-Tokenizer --local_dir .\/model\/Step-Audio-Tokenizer<\/code><\/pre>\n\n\n\n<h2 class=\"wp-block-heading\">\u811a\u672c\u90e8\u7f72<\/h2>\n\n\n\n<p>\u8fd9\u91cc\u5df2\u7ecf\u51c6\u5907\u597d\u4e86\u90e8\u7f72\u811a\u672c\uff0c\u4ec5\u9700\u8981\u6539\u53d8\u81ea\u5df1\u7684\u5bc6\u94a5\u548cip\u3001\u7aef\u53e3\uff0c\u5373\u53ef\u76f4\u63a5\u90e8\u7f72\uff0c\u5feb\u901f\u4f7f\u7528\u3002<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>import os\nimport uuid\nimport time\nimport asyncio\nfrom enum import Enum\nfrom contextlib import asynccontextmanager\nfrom fastapi import FastAPI, HTTPException, status, Depends, Request\nfrom fastapi.security import HTTPBearer, HTTPAuthorizationCredentials\nfrom fastapi.staticfiles import StaticFiles\nfrom pydantic import BaseModel, Field, validator, ValidationError, field_validator\nfrom typing import Optional, Dict, List\nfrom loguru import logger\nimport torchaudio\nimport aiohttp\nimport base64\nfrom tts import StepAudioTTS\nfrom tokenizer import StepAudioTokenizer\nfrom datetime import datetime\nfrom concurrent.futures import ThreadPoolExecutor\nfrom fastapi.responses import JSONResponse\nfrom fastapi.exceptions import RequestValidationError\n\nimport os\nos.makedirs(\"static\", exist_ok=True)\n\n# \u521d\u59cb\u5316\u8ba4\u8bc1\u5bc6\u94a5\nsecurity = HTTPBearer(auto_error=False)\nvalid_api_keys = {\"\u4f60\u7684\u5bc6\u94a5\"}  # \u4ece\u73af\u5883\u53d8\u91cf\u8bfb\u53d6\u66f4\u5b89\u5168\n\n# \u4efb\u52a1\u72b6\u6001\u679a\u4e3e\nclass TaskStatus(str, Enum):\n    IN_QUEUE = \"InQueue\"\n    IN_PROGRESS = \"InProgress\"\n    SUCCEEDED = \"Succeed\"\n    FAILED = \"Failed\"\n    CANCELLED = \"Cancelled\"\n\n# \u4efb\u52a1\u5b58\u50a8\u7ed3\u6784\nclass TaskData(BaseModel):\n    status: TaskStatus = TaskStatus.IN_QUEUE\n    audio_type: str  # \"common\", \"music\", \"clone\"\n    params: dict\n    created_at: int = Field(default_factory=lambda: int(time.time()))\n    started_at: Optional&#91;int] = None\n    completed_at: Optional&#91;int] = None\n    download_url: Optional&#91;str] = None\n    reason: Optional&#91;str] = None\n\n# \u751f\u547d\u5468\u671f\u7ba1\u7406\n@asynccontextmanager\nasync def lifespan(app: FastAPI):\n    try:\n        # \u521d\u59cb\u5316\u6a21\u578b\n        model_path = os.getenv(\"MODEL_PATH\", \"\/data\/coding\/model\")\n        app.state.encoder = StepAudioTokenizer(os.path.join(model_path, \"Step-Audio-Tokenizer\"))\n        app.state.tts_engine = StepAudioTTS(os.path.join(model_path, \"Step-Audio-TTS-3B\"), app.state.encoder)\n\n        # \u521d\u59cb\u5316\u4efb\u52a1\u7cfb\u7edf\n        app.state.tasks: Dict&#91;str, TaskData] = {}\n        app.state.pending_queue: List&#91;str] = &#91;]\n        app.state.task_lock = asyncio.Lock()\n        app.state.semaphore = asyncio.Semaphore(5)  # \u5e76\u53d1\u6570\u9650\u5236\uff08\u589e\u52a0\u52305\uff09\n        app.state.base_url = \"ip+\u7aef\u53e3\"\n\n        # \u542f\u52a8\u540e\u53f0\u5904\u7406\u5668\n        asyncio.create_task(task_processor())\n        print(\"\u2705 \u5e94\u7528\u521d\u59cb\u5316\u5b8c\u6210\")\n        yield\n    finally:\n        # \u6e05\u7406\u8d44\u6e90\n        app.state.encoder = None\n        app.state.tts_engine = None\n        torch.cuda.empty_cache()\n\napp = FastAPI(lifespan=lifespan)\napp.mount(\"\/static\", StaticFiles(directory=\"static\"), name=\"static\")\n\n# \u8bf7\u6c42\u6a21\u578b\nclass CommonTTSRequest(BaseModel):\n    text:str = Field(..., min_length=1, description=\"\u9700\u8981\u5408\u6210\u7684\u6587\u672c\u5185\u5bb9\")\n    speaker: str = Field(default=\"Tingting\", description=\"\u4ec5\u652f\u6301 Tingting\")\n    emotion: Optional&#91;str] = Field(None, description=\"\u53ef\u9009\u503c: \u9ad8\u51741, \u9ad8\u51742, \u751f\u6c141, \u751f\u6c142, \u60b2\u4f241, \u6492\u5a071\")\n    language: Optional&#91;str] = Field(None, description=\"\u53ef\u9009\u503c: \u4e2d\u6587, \u82f1\u6587, \u97e9\u8bed, \u65e5\u8bed, \u56db\u5ddd\u8bdd, \u7ca4\u8bed, \u5e7f\u4e1c\u8bdd\")\n    speed: Optional&#91;str] = Field(None, description=\"\u53ef\u9009\u503c: \u6162\u901f1, \u6162\u901f2, \u5feb\u901f1, \u5feb\u901f2\")\n\n    @field_validator(\"speaker\")\n    def validate_speaker(cls, v):\n        if v not in &#91;\"Tingting\"]:\n            raise ValueError(f\"\u4e0d\u652f\u6301\u7684 speaker: {v}\")\n        return v\n\n    @field_validator(\"emotion\")\n    def validate_emotion(cls, v):\n        emotion_options = &#91;\"\u9ad8\u51741\", \"\u9ad8\u51742\", \"\u751f\u6c141\", \"\u751f\u6c142\", \"\u60b2\u4f241\", \"\u6492\u5a071\"]\n        if v and v not in emotion_options:\n            raise ValueError(f\"\u4e0d\u652f\u6301\u7684 emotion: {v}\")\n        return v\n\n    @field_validator(\"language\")\n    def validate_language(cls, v):\n        language_options = &#91;\"\u4e2d\u6587\", \"\u82f1\u6587\", \"\u97e9\u8bed\", \"\u65e5\u8bed\", \"\u56db\u5ddd\u8bdd\", \"\u7ca4\u8bed\", \"\u5e7f\u4e1c\u8bdd\"]\n        if v and v not in language_options:\n            raise ValueError(f\"\u4e0d\u652f\u6301\u7684 language: {v}\")\n        return v\n\n    @field_validator(\"speed\")\n    def validate_speed(cls, v):\n        speed_options = &#91;\"\u6162\u901f1\", \"\u6162\u901f2\", \"\u5feb\u901f1\", \"\u5feb\u901f2\"]\n        if v and v not in speed_options:\n            raise ValueError(f\"\u4e0d\u652f\u6301\u7684 speed: {v}\")\n        return v\n    \n    # \u53ef\u6dfb\u52a0\u66f4\u53cb\u597d\u7684\u9519\u8bef\u63d0\u793a\n    # \u53ef\u6dfb\u52a0\u66f4\u53cb\u597d\u7684\u9519\u8bef\u63d0\u793a\n    @field_validator('text')\n    def check_text_not_empty(cls, v):\n        if not v.strip():\n            raise ValueError('\u6587\u672c\u5185\u5bb9\u4e0d\u80fd\u4e3a\u7a7a')\n        return v\n\n\nclass MusicTTSRequest(BaseModel):\n    text:str = Field(..., min_length=1, description=\"\u9700\u8981\u5408\u6210\u7684\u6587\u672c\u5185\u5bb9\")\n    speaker: str = Field(default=\"Tingting\", description=\"\u4ec5\u652f\u6301 Tingting\")\n    mode: str = Field(default=\"Humming (\u54fc\u5531)\", description=\"\u53ef\u9009\u503c: RAP, Humming (\u54fc\u5531)\")\n\n    @field_validator(\"speaker\")\n    def validate_speaker(cls, v):\n        if v not in &#91;\"Tingting\"]:\n            raise ValueError(f\"\u4e0d\u652f\u6301\u7684 speaker: {v}\")\n        return v\n\n    @field_validator(\"mode\")\n    def validate_mode(cls, v):\n        mode_options = &#91;\"RAP\", \"Humming (\u54fc\u5531)\"]\n        if v not in mode_options:\n            raise ValueError(f\"\u4e0d\u652f\u6301\u7684 mode: {v}\")\n        return v\n        # \u53ef\u6dfb\u52a0\u66f4\u53cb\u597d\u7684\u9519\u8bef\u63d0\u793a\n    @field_validator('text')\n    def check_text_not_empty(cls, v):\n        if not v.strip():\n            raise ValueError('\u6587\u672c\u5185\u5bb9\u4e0d\u80fd\u4e3a\u7a7a')\n        return v\n\n\nclass CloneTTSRequest(BaseModel):\n    text:str = Field(..., min_length=1, description=\"\u9700\u8981\u5408\u6210\u7684\u6587\u672c\u5185\u5bb9\")\n    speaker_prompt: str\n    emotion: Optional&#91;str] = Field(None, description=\"\u53ef\u9009\u503c: \u9ad8\u51741, \u9ad8\u51742, \u751f\u6c141, \u751f\u6c142, \u60b2\u4f241, \u6492\u5a071\")\n    language: Optional&#91;str] = Field(None, description=\"\u53ef\u9009\u503c: \u4e2d\u6587, \u82f1\u6587, \u97e9\u8bed, \u65e5\u8bed, \u56db\u5ddd\u8bdd, \u7ca4\u8bed, \u5e7f\u4e1c\u8bdd\")\n    speed: Optional&#91;str] = Field(None, description=\"\u53ef\u9009\u503c: \u6162\u901f1, \u6162\u901f2, \u5feb\u901f1, \u5feb\u901f2\")\n    audio_source: str\n\n    @field_validator(\"emotion\")\n    def validate_emotion(cls, v):\n        emotion_options = &#91;\"\u9ad8\u51741\", \"\u9ad8\u51742\", \"\u751f\u6c141\", \"\u751f\u6c142\", \"\u60b2\u4f241\", \"\u6492\u5a071\"]\n        if v and v not in emotion_options:\n            raise ValueError(f\"\u4e0d\u652f\u6301\u7684 emotion: {v}\")\n        return v\n\n    @field_validator(\"language\")\n    def validate_language(cls, v):\n        language_options = &#91;\"\u4e2d\u6587\", \"\u82f1\u6587\", \"\u97e9\u8bed\", \"\u65e5\u8bed\", \"\u56db\u5ddd\u8bdd\", \"\u7ca4\u8bed\", \"\u5e7f\u4e1c\u8bdd\"]\n        if v and v not in language_options:\n            raise ValueError(f\"\u4e0d\u652f\u6301\u7684 language: {v}\")\n        return v\n\n    @field_validator(\"speed\")\n    def validate_speed(cls, v):\n        speed_options = &#91;\"\u6162\u901f1\", \"\u6162\u901f2\", \"\u5feb\u901f1\", \"\u5feb\u901f2\"]\n        if v and v not in speed_options:\n            raise ValueError(f\"\u4e0d\u652f\u6301\u7684 speed: {v}\")\n        return v\n    # \u53ef\u6dfb\u52a0\u66f4\u53cb\u597d\u7684\u9519\u8bef\u63d0\u793a\n    @field_validator('text')\n    def check_text_not_empty(cls, v):\n        if not v.strip():\n            raise ValueError('\u6587\u672c\u5185\u5bb9\u4e0d\u80fd\u4e3a\u7a7a')\n        return v\n\n\nclass TaskStatusRequest(BaseModel):\n    request_id: str\n\nclass TaskCancelRequest(BaseModel):\n    request_id: str\n\n# \u54cd\u5e94\u6a21\u578b\nclass TaskSubmitResponse(BaseModel):\n    request_id: str\n\nclass TaskStatusResponse(BaseModel):\n    status: TaskStatus\n    reason: Optional&#91;str] = None\n    results: Optional&#91;dict] = None\n    queue_position: Optional&#91;int] = None\n\n# \u8ba4\u8bc1\u9a8c\u8bc1\nasync def verify_auth(credentials: HTTPAuthorizationCredentials = Depends(security)):\n    if not credentials or credentials.scheme != \"Bearer\":\n        raise HTTPException(401, {\"status\": \"Failed\", \"reason\": \"\u65e0\u6548\u7684\u8ba4\u8bc1\u51ed\u8bc1\"})\n    if credentials.credentials not in valid_api_keys:\n        raise HTTPException(401, {\"status\": \"Failed\", \"reason\": \"\u65e0\u6548\u7684API\u5bc6\u94a5\"})\n    return True\n\n@app.exception_handler(HTTPException)\nasync def http_exception_handler(request, exc: HTTPException):\n    return JSONResponse(\n        content=exc.detail\n    )\n\n@app.exception_handler(RequestValidationError)\nasync def validation_exception_handler(request: Request, exc: RequestValidationError):\n    error_msg = exc.errors()&#91;0]&#91;'msg']\n    return JSONResponse(\n        status_code=status.HTTP_422_UNPROCESSABLE_ENTITY,\n        content={\"status\": \"Failed\", \"reason\": f\"\u53c2\u6570\u6821\u9a8c\u5931\u8d25: {error_msg}\"}\n    )\n\n\n# \u63d0\u4ea4\u4efb\u52a1\u63a5\u53e3\n@app.post(\"\/tts\/submit\/common\", response_model=TaskSubmitResponse)\nasync def submit_common(request: CommonTTSRequest, auth: bool = Depends(verify_auth)):\n    request_id = str(uuid.uuid4())\n    async with app.state.task_lock:\n        app.state.tasks&#91;request_id] = TaskData(\n            audio_type=\"common\",\n            params=request.model_dump()\n        )\n        app.state.pending_queue.append(request_id)\n    return {\"request_id\": request_id}\n\n@app.post(\"\/tts\/submit\/music\", response_model=TaskSubmitResponse)\nasync def submit_music(request: MusicTTSRequest, auth: bool = Depends(verify_auth)):\n    request_id = str(uuid.uuid4())\n    async with app.state.task_lock:\n        app.state.tasks&#91;request_id] = TaskData(\n            audio_type=\"music\",\n            params=request.model_dump()\n        )\n        app.state.pending_queue.append(request_id)\n    return {\"request_id\": request_id}\n\n@app.post(\"\/tts\/submit\/clone\", response_model=TaskSubmitResponse)\nasync def submit_clone(request: CloneTTSRequest, auth: bool = Depends(verify_auth)):\n    request_id = str(uuid.uuid4())\n    async with app.state.task_lock:\n        app.state.tasks&#91;request_id] = TaskData(\n            audio_type=\"clone\",\n            params=request.model_dump()\n        )\n        app.state.pending_queue.append(request_id)\n    return {\"request_id\": request_id}\n\n# \u67e5\u8be2\u72b6\u6001\u63a5\u53e3\n@app.post(\"\/tts\/status\", response_model=TaskStatusResponse)\nasync def get_status(request: TaskStatusRequest, auth: bool = Depends(verify_auth)):\n    task = app.state.tasks.get(request.request_id)\n    if not task:\n        raise HTTPException(\n            status_code=404,\n            detail={\"status\": \"Failed\", \"reason\": \"\u65e0\u6548\u7684\u4efb\u52a1ID\"}\n        )\n\n    # \u8ba1\u7b97\u961f\u5217\u4f4d\u7f6e\uff08\u4ec5\u5f53\u5728\u961f\u5217\u4e2d\u65f6\uff09\n    queue_pos = 0\n    if task.status == TaskStatus.IN_QUEUE and request.request_id in app.state.pending_queue:\n        try:\n            queue_pos = app.state.pending_queue.index(request.request_id) + 1\n        except ValueError:\n            queue_pos = 0\n\n    response = {\n        \"status\": task.status.value,  # \u786e\u4fdd\u8fd4\u56de\u7684\u662f\u5b57\u7b26\u4e32\u5f62\u5f0f\n        \"reason\": task.reason,\n        \"queue_position\": queue_pos if task.status == TaskStatus.IN_QUEUE else None  # \u975e\u6392\u961f\u72b6\u6001\u8fd4\u56denull\n    }\n\n    # \u6210\u529f\u72b6\u6001\u7684\u7279\u6b8a\u5904\u7406\n    if task.status == TaskStatus.SUCCEEDED:\n        response&#91;\"results\"] = {\n            \"audio\": &#91;{\"url\": task.download_url}],  # \u8c03\u6574\u4e3a\u6570\u7ec4\u5f62\u5f0f\n            \"timings\": {\n                \"inference\": task.completed_at - task.started_at\n            },\n            # \"seed\": None\n        }\n    elif task.status == TaskStatus.CANCELLED:\n        response&#91;\"reason\"] = task.reason or \"\u7528\u6237\u4e3b\u52a8\u53d6\u6d88\"  # \u786e\u4fdd\u539f\u56e0\u5b57\u6bb5\u5b58\u5728\n\n    return response\n\n# \u53d6\u6d88\u4efb\u52a1\u63a5\u53e3\n@app.post(\"\/tts\/cancel\", response_model=dict)\nasync def cancel_task(request: TaskCancelRequest, auth: bool = Depends(verify_auth)):\n    request_id = request.request_id\n    async with app.state.task_lock:\n        task = app.state.tasks.get(request_id)\n        if not task:\n            raise HTTPException(404, {\"status\": \"Failed\", \"reason\": \"\u65e0\u6548\u7684\u4efb\u52a1ID\"})\n        current_status = task.status\n        if current_status != TaskStatus.IN_QUEUE:\n            raise HTTPException(400, {\"status\": \"Failed\", \"reason\": f\"\u4ec5\u5141\u8bb8\u53d6\u6d88\u6392\u961f\u4efb\u52a1\uff0c\u5f53\u524d\u72b6\u6001: {current_status}\"})\n        # \u4ece\u961f\u5217\u4e2d\u79fb\u9664\u4efb\u52a1\n        try:\n            app.state.pending_queue.remove(request_id)\n        except ValueError:\n            pass  # \u53ef\u80fd\u5df2\u88ab\u5904\u7406\n        # \u66f4\u65b0\u4efb\u52a1\u72b6\u6001\n        task.status = TaskStatus.CANCELLED\n        task.reason = \"\u7528\u6237\u4e3b\u52a8\u53d6\u6d88\"\n    return {\"status\": \"Succeed\", \"reason\": \"\u53d6\u6d88\u6392\u961f\u4efb\u52a1\u6210\u529f\"}\n\n# \u540e\u53f0\u4efb\u52a1\u5904\u7406\u5668\nasync def task_processor():\n    executor = ThreadPoolExecutor(max_workers=5)  # \u4f7f\u7528\u7ebf\u7a0b\u6c60\u907f\u514d\u963b\u585e\u4e8b\u4ef6\u5faa\u73af\n\n    while True:\n        async with app.state.semaphore:\n            request_id = await get_next_task()\n            if request_id:\n                loop = asyncio.get_event_loop()\n                await loop.run_in_executor(executor, lambda: process_task_sync(request_id))\n            else:\n                await asyncio.sleep(0.5)\n\nasync def get_next_task():\n    async with app.state.task_lock:\n        if app.state.pending_queue:\n            return app.state.pending_queue.pop(0)\n    return None\n\ndef process_task_sync(request_id: str):\n    \"\"\"\u540c\u6b65\u5904\u7406\u5355\u4e2a\u4efb\u52a1\"\"\"\n    task = app.state.tasks.get(request_id)\n    if not task:\n        return\n\n    try:\n        task.status = TaskStatus.IN_PROGRESS\n        task.started_at = int(time.time())\n\n        if task.audio_type == \"common\":\n            audio_data = process_common_sync(task.params)\n        elif task.audio_type == \"music\":\n            audio_data = process_music_sync(task.params)\n        elif task.audio_type == \"clone\":\n            audio_data = process_clone_sync(task.params)\n\n        audio_name = save_audio(task.audio_type, audio_data&#91;0], audio_data&#91;1])\n        task.download_url = f\"{app.state.base_url}\/static\/audio\/{task.audio_type}\/{audio_name}\"\n        task.status = TaskStatus.SUCCEEDED\n        task.completed_at = int(time.time())\n\n    except Exception as e:\n        task.status = TaskStatus.FAILED\n        task.reason = str(e)\n        task.completed_at = int(time.time())\n        logger.error(f\"Task {request_id} failed: {str(e)}\")\n\n# \u97f3\u9891\u5904\u7406\u51fd\u6570\uff08\u540c\u6b65\u7248\u672c\uff09\ndef process_common_sync(params: dict):\n    control_tags = &#91;]\n    for attr in &#91;\"emotion\", \"language\", \"speed\"]:\n        if params.get(attr):\n            control_tags.append(f\"({params&#91;attr]})\")\n    formatted_text = \"\".join(control_tags) + params&#91;\"text\"]\n    return app.state.tts_engine(formatted_text, params&#91;\"speaker\"])\n\ndef process_music_sync(params: dict):\n    formatted_text = f\"({params&#91;'mode']}){params&#91;'text']}\"\n    return app.state.tts_engine(formatted_text, params&#91;\"speaker\"])\n\ndef process_clone_sync(params: dict):\n    temp_audio_path = None\n    try:\n        # \u5904\u7406\u97f3\u9891\u8f93\u5165\n        if params&#91;\"audio_source\"].startswith(('http', 'https')):\n            with aiohttp.ClientSession() as session:\n                resp = session.get(params&#91;\"audio_source\"])\n                audio_contents = resp.read()\n        else:\n            audio_contents = base64.b64decode(params&#91;\"audio_source\"].split(',')&#91;1])\n\n        # \u4fdd\u5b58\u4e34\u65f6\u6587\u4ef6\n        os.makedirs(\"tmp\", exist_ok=True)\n        temp_audio_path = f\"tmp\/clone_{uuid.uuid4()}.wav\"\n        with open(temp_audio_path, \"wb\") as f:\n            f.write(audio_contents)\n\n        # \u6784\u5efa\u514b\u9686\u53c2\u6570\n        clone_speaker = {\n            \"wav_path\": temp_audio_path,\n            \"speaker\": \"custom_voice\",\n            \"prompt_text\": params&#91;\"speaker_prompt\"],\n        }\n\n        # \u5904\u7406\u63a7\u5236\u6807\u8bb0\n        control_tags = &#91;]\n        for param in &#91;\"emotion\", \"language\", \"speed\"]:\n            if params.get(param):\n                control_tags.append(f\"({params&#91;param]})\")\n        formatted_text = \"\".join(control_tags) + params&#91;\"text\"]\n\n        # \u751f\u6210\u97f3\u9891\n        return app.state.tts_engine(formatted_text, \"\", clone_speaker)\n\n    finally:\n        if temp_audio_path and os.path.exists(temp_audio_path):\n            os.remove(temp_audio_path)\n\n# \u4fdd\u5b58\u97f3\u9891\u51fd\u6570\ndef save_audio(audio_type: str, audio_data, sr: int) -> str:\n    current_time = datetime.now().strftime(\"%Y-%m-%d_%H-%M-%S\")\n    save_dir = os.path.join(os.getenv(\"TMP_DIR\", \"\/data\/coding\/Step-Audio\/static\/audio\"), audio_type)\n    os.makedirs(save_dir, exist_ok=True)\n    save_path = os.path.join(save_dir, f\"{current_time}.wav\")\n    torchaudio.save(save_path, audio_data, sr)\n    return f\"{current_time}.wav\"\n\n# \u81ea\u52a8\u6e05\u7406\u4efb\u52a1\nasync def auto_cleanup(file_path: str, delay: int = 3600):\n    await asyncio.sleep(delay)\n    try:\n        if os.path.exists(file_path):\n            os.remove(file_path)\n            logger.info(f\"\u5df2\u6e05\u7406\u6587\u4ef6: {file_path}\")\n    except Exception as e:\n        logger.error(f\"\u6587\u4ef6\u6e05\u7406\u5931\u8d25: {str(e)}\")\n\nif __name__ == \"__main__\":\n    import uvicorn\n    uvicorn.run(app, host=\"0.0.0.0\", port=10341)<\/code><\/pre>\n\n\n\n<h2 class=\"wp-block-heading\">\u811a\u672c\u8bf4\u660e<\/h2>\n\n\n\n<h3 class=\"wp-block-heading\">\u5168\u5c40\u914d\u7f6e<\/h3>\n\n\n\n<pre class=\"wp-block-code\"><code>{\n  \"Authorization\": \"Bearer \u4f60\u7684\u5bc6\u94a5\",\n  \"Content-Type\": \"application\/json\"\n}<\/code><\/pre>\n\n\n\n<h3 class=\"wp-block-heading\">\u63a5\u53e3\u5217\u8868<\/h3>\n\n\n\n<h4 class=\"wp-block-heading\">1\u3001\u63d0\u4ea4\u666e\u901aTTS\u4efb\u52a1<\/h4>\n\n\n\n<ul class=\"wp-block-list\">\n<li><strong>URL<\/strong>: <code>\/tts\/submit\/common<\/code><\/li>\n\n\n\n<li><strong>Method<\/strong>: POST<\/li>\n\n\n\n<li><strong>Body<\/strong>:{<br>&nbsp;&#8220;text&#8221;: &#8220;\u4f60\u597d\u4e16\u754c&#8221;,<br>&nbsp;&#8220;speaker&#8221;: &#8220;Tingting&#8221;,<br>&nbsp;&#8220;emotion&#8221;: &#8220;\u9ad8\u51741&#8221;,<br>&nbsp;&#8220;language&#8221;: &#8220;\u4e2d\u6587&#8221;,<br>&nbsp;&#8220;speed&#8221;: &#8220;\u6162\u901f1&#8221;<br>}<\/li>\n<\/ul>\n\n\n\n<p>\u6210\u529f\u5219\u4e3a\u5982\u4e0b\u54cd\u5e94<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>{\n&nbsp;\"request_id\": \"550e8400-e29b-41d4-a716-446655440000\"\n}<\/code><\/pre>\n\n\n\n<h4 class=\"wp-block-heading\">2\u3001\u63d0\u4ea4\u97f3\u4e50TTS\u4efb\u52a1<\/h4>\n\n\n\n<ul class=\"wp-block-list\">\n<li><strong>URL<\/strong>: <code>\/tts\/submit\/music<\/code><\/li>\n\n\n\n<li><strong>Method<\/strong>: POST<\/li>\n\n\n\n<li><strong>Body<\/strong>:{<br>&nbsp;&#8220;text&#8221;: &#8220;\u97f3\u4e50\u5408\u6210\u6d4b\u8bd5&#8221;,<br>&nbsp;&#8220;speaker&#8221;: &#8220;Tingting&#8221;,<br>&nbsp;&#8220;mode&#8221;: &#8220;Humming (\u54fc\u5531)&#8221;<br>}<\/li>\n<\/ul>\n\n\n\n<p>\u6210\u529f\u5219\u4e3a\u5982\u4e0b\u54cd\u5e94<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>{\n&nbsp;\"request_id\": \"550e8400-e29b-41d4-a716-446655440001\"\n}<\/code><\/pre>\n\n\n\n<h4 class=\"wp-block-heading\">3\u3001\u63d0\u4ea4\u514b\u9686TTS\u4efb\u52a1<\/h4>\n\n\n\n<ul class=\"wp-block-list\">\n<li><strong>URL<\/strong>: <code>\/tts\/submit\/clone<\/code><\/li>\n\n\n\n<li><strong>Method<\/strong>: POST<\/li>\n\n\n\n<li><strong>Body<\/strong>:{<br>&nbsp;&#8220;text&#8221;: &#8220;\u8bed\u97f3\u514b\u9686\u6d4b\u8bd5&#8221;,<br>&nbsp;&#8220;speaker_prompt&#8221;: &#8220;\u793a\u4f8b\u8bf4\u8bdd\u4eba&#8221;,<br>&nbsp;&#8220;audio_source&#8221;: &#8220;base64\u7f16\u7801\u97f3\u9891\u6570\u636e\u6216URL&#8221;,<br>&nbsp;&#8220;language&#8221;: &#8220;\u7ca4\u8bed&#8221;<br>}<\/li>\n<\/ul>\n\n\n\n<p>\u6210\u529f\u5219\u4e3a\u5982\u4e0b\u54cd\u5e94<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>{\n&nbsp;\"request_id\": \"550e8400-e29b-41d4-a716-446655440002\"\n}<\/code><\/pre>\n\n\n\n<h4 class=\"wp-block-heading\">4\u3001\u67e5\u8be2\u4efb\u52a1\u72b6\u6001<\/h4>\n\n\n\n<ul class=\"wp-block-list\">\n<li><strong>URL<\/strong>: <code>\/tts\/status<\/code><\/li>\n\n\n\n<li><strong>Method<\/strong>: POST<\/li>\n\n\n\n<li><strong>Body<\/strong>:{<br>&nbsp;&#8220;request_id&#8221;: &#8220;550e8400-e29b-41d4-a716-446655440000&#8221;<br>}<\/li>\n<\/ul>\n\n\n\n<p>\u6210\u529f\u5219\u4e3a\u5982\u4e0b\u54cd\u5e94<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>{\n&nbsp; &nbsp;\"status\": \"Succeed\",\n&nbsp; &nbsp;\"reason\": null,\n&nbsp; &nbsp;\"results\": {\n&nbsp; &nbsp; &nbsp; &nbsp;\"audio\": &#91;\n&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; {\n&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;\"url\": \"https:\/\/585os96gouen3i3talk4090.funhpc.com:30499\/static\/audio\/clone\/2025-04-18_10-43-55.wav\"\n&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; }\n&nbsp; &nbsp; &nbsp; ],\n&nbsp; &nbsp; &nbsp; &nbsp;\"timings\": {\n&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;\"inference\": 7\n&nbsp; &nbsp; &nbsp; }\n&nbsp; },\n&nbsp; &nbsp;\"queue_position\": null\n}<\/code><\/pre>\n\n\n\n<h4 class=\"wp-block-heading\">5\u3001\u53d6\u6d88\u4efb\u52a1<\/h4>\n\n\n\n<ul class=\"wp-block-list\">\n<li><strong>URL<\/strong>: <code>\/tts\/cancel<\/code><\/li>\n\n\n\n<li><strong>Method<\/strong>: POST<\/li>\n\n\n\n<li><strong>Body<\/strong>:{<br>&nbsp;&#8220;request_id&#8221;: &#8220;550e8400-e29b-41d4-a716-446655440000&#8221;<br>}<\/li>\n<\/ul>\n\n\n\n<p>\u6210\u529f\u5219\u4e3a\u5982\u4e0b\u54cd\u5e94<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>{\n&nbsp;\"status\": \"Succeed\",\n&nbsp;\"reason\": \"\u53d6\u6d88\u6392\u961f\u4efb\u52a1\u6210\u529f\"\n}<\/code><\/pre>\n\n\n\n<h2 class=\"wp-block-heading\">\u53c2\u6570\u8bf4\u660e<\/h2>\n\n\n\n<h3 class=\"wp-block-heading\">\u901a\u7528\u53c2\u6570<\/h3>\n\n\n\n<figure class=\"wp-block-table\"><table class=\"has-fixed-layout\"><thead><tr><th>\u53c2\u6570\u540d<\/th><th>\u5141\u8bb8\u503c<\/th><th>\u8bf4\u660e<\/th><\/tr><\/thead><tbody><tr><td>speaker<\/td><td>Tingting<\/td><td>\u56fa\u5b9a\u503c<\/td><\/tr><tr><td>emotion<\/td><td>\u9ad8\u51741\/2, \u751f\u6c141\/2, \u60b2\u4f241, \u6492\u5a071<\/td><td>\u60c5\u611f\u53c2\u6570<\/td><\/tr><tr><td>language<\/td><td>\u4e2d\u6587\/\u82f1\u6587\/\u97e9\u8bed\/\u65e5\u8bed\/\u56db\u5ddd\u8bdd\/\u7ca4\u8bed\/\u5e7f\u4e1c\u8bdd<\/td><td>\u8bed\u8a00\u9009\u62e9<\/td><\/tr><tr><td>speed<\/td><td>\u6162\u901f1\/2, \u5feb\u901f1\/2<\/td><td>\u8bed\u901f\u63a7\u5236<\/td><\/tr><\/tbody><\/table><\/figure>\n\n\n\n<h3 class=\"wp-block-heading\">\u7279\u6b8a\u53c2\u6570<\/h3>\n\n\n\n<figure class=\"wp-block-table\"><table class=\"has-fixed-layout\"><thead><tr><th>\u63a5\u53e3\u7c7b\u578b<\/th><th>\u7279\u6b8a\u53c2\u6570<\/th><th>\u5141\u8bb8\u503c<\/th><\/tr><\/thead><tbody><tr><td>\u97f3\u4e50\u5408\u6210<\/td><td>mode<\/td><td>RAP, Humming (\u54fc\u5531)<\/td><\/tr><tr><td>\u8bed\u97f3\u514b\u9686<\/td><td>audio_source<\/td><td>\u97f3\u9891URL\u6216Base64\u7f16\u7801\u6570\u636e<\/td><\/tr><\/tbody><\/table><\/figure>\n\n\n\n<h2 class=\"wp-block-heading\">\u9519\u8bef\u7801\u8bf4\u660e<\/h2>\n\n\n\n<figure class=\"wp-block-table\"><table class=\"has-fixed-layout\"><thead><tr><th>HTTP\u72b6\u6001\u7801<\/th><th>\u539f\u56e0<\/th><\/tr><\/thead><tbody><tr><td>401<\/td><td>\u65e0\u6548\u7684API\u5bc6\u94a5<\/td><\/tr><tr><td>404<\/td><td>\u65e0\u6548\u7684\u4efb\u52a1ID<\/td><\/tr><tr><td>422<\/td><td>\u53c2\u6570\u6821\u9a8c\u5931\u8d25<\/td><\/tr><\/tbody><\/table><\/figure>\n\n\n\n<p><\/p>\n","protected":false},"excerpt":{"rendered":"<p>\u73af\u5883\u51c6\u5907 \u9996\u5148\u51c6\u5907\u4e00\u53f0\u663e\u5b58\uff1e=12G\u7684\u670d\u52a1\u5668\uff0c\u6211\u8fd9\u91cc\u9009\u7528\u7684\u662f4090 24G\u4e91\u670d\u52a1\u5668 \u63a5\u7740\u5148\u62c9\u53d6\u5b98\u65b9\u4ee3\u7801\uff0c\u7136\u540e [&hellip;]<\/p>\n","protected":false},"author":1,"featured_media":211,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":[],"categories":[1],"tags":[],"class_list":["post-204","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-model-serve"],"yoast_head":"<!-- This site is optimized with the Yoast SEO plugin v24.8.1 - https:\/\/yoast.com\/wordpress\/plugins\/seo\/ -->\n<title>\u4e00\u6587\u5feb\u901f\u5b66\u4f1aFastAPI\u90e8\u7f72Step-Audio-TTS-3B\u6a21\u578b - \u4eca\u5929\u5f00\u59cb\u5b66AI<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/\u4e00\u6587\u5feb\u901f\u5b66\u4f1afastapi\u90e8\u7f72step-audio-tts-3b\u6a21\u578b\/\" \/>\n<meta property=\"og:locale\" content=\"zh_CN\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"\u4e00\u6587\u5feb\u901f\u5b66\u4f1aFastAPI\u90e8\u7f72Step-Audio-TTS-3B\u6a21\u578b - \u4eca\u5929\u5f00\u59cb\u5b66AI\" \/>\n<meta property=\"og:description\" content=\"\u73af\u5883\u51c6\u5907 \u9996\u5148\u51c6\u5907\u4e00\u53f0\u663e\u5b58\uff1e=12G\u7684\u670d\u52a1\u5668\uff0c\u6211\u8fd9\u91cc\u9009\u7528\u7684\u662f4090 24G\u4e91\u670d\u52a1\u5668 \u63a5\u7740\u5148\u62c9\u53d6\u5b98\u65b9\u4ee3\u7801\uff0c\u7136\u540e [&hellip;]\" \/>\n<meta property=\"og:url\" content=\"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/\u4e00\u6587\u5feb\u901f\u5b66\u4f1afastapi\u90e8\u7f72step-audio-tts-3b\u6a21\u578b\/\" \/>\n<meta property=\"og:site_name\" content=\"\u4eca\u5929\u5f00\u59cb\u5b66AI\" \/>\n<meta property=\"article:published_time\" content=\"2025-04-18T03:08:38+00:00\" \/>\n<meta property=\"article:modified_time\" content=\"2025-05-22T04:58:42+00:00\" \/>\n<meta property=\"og:image\" content=\"http:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/111222.png\" \/>\n\t<meta property=\"og:image:width\" content=\"667\" \/>\n\t<meta property=\"og:image:height\" content=\"342\" \/>\n\t<meta property=\"og:image:type\" content=\"image\/png\" \/>\n<meta name=\"author\" content=\"Knoka\" \/>\n<meta name=\"twitter:card\" content=\"summary_large_image\" \/>\n<meta name=\"twitter:label1\" content=\"\u4f5c\u8005\" \/>\n\t<meta name=\"twitter:data1\" content=\"Knoka\" \/>\n\t<meta name=\"twitter:label2\" content=\"\u9884\u8ba1\u9605\u8bfb\u65f6\u95f4\" \/>\n\t<meta name=\"twitter:data2\" content=\"1 \u5206\" \/>\n<script type=\"application\/ld+json\" class=\"yoast-schema-graph\">{\"@context\":\"https:\/\/schema.org\",\"@graph\":[{\"@type\":\"Article\",\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/#article\",\"isPartOf\":{\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/\"},\"author\":{\"name\":\"Knoka\",\"@id\":\"https:\/\/knoka.vip\/#\/schema\/person\/59bf442e4e4c21f6969b984b8c5bfc84\"},\"headline\":\"\u4e00\u6587\u5feb\u901f\u5b66\u4f1aFastAPI\u90e8\u7f72Step-Audio-TTS-3B\u6a21\u578b\",\"datePublished\":\"2025-04-18T03:08:38+00:00\",\"dateModified\":\"2025-05-22T04:58:42+00:00\",\"mainEntityOfPage\":{\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/\"},\"wordCount\":99,\"commentCount\":0,\"publisher\":{\"@id\":\"https:\/\/knoka.vip\/#\/schema\/person\/59bf442e4e4c21f6969b984b8c5bfc84\"},\"image\":{\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/#primaryimage\"},\"thumbnailUrl\":\"https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/111222.png\",\"articleSection\":[\"\u6a21\u578b\u90e8\u7f72\"],\"inLanguage\":\"zh-Hans\",\"potentialAction\":[{\"@type\":\"CommentAction\",\"name\":\"Comment\",\"target\":[\"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/#respond\"]}]},{\"@type\":\"WebPage\",\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/\",\"url\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/\",\"name\":\"\u4e00\u6587\u5feb\u901f\u5b66\u4f1aFastAPI\u90e8\u7f72Step-Audio-TTS-3B\u6a21\u578b - \u4eca\u5929\u5f00\u59cb\u5b66AI\",\"isPartOf\":{\"@id\":\"https:\/\/knoka.vip\/#website\"},\"primaryImageOfPage\":{\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/#primaryimage\"},\"image\":{\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/#primaryimage\"},\"thumbnailUrl\":\"https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/111222.png\",\"datePublished\":\"2025-04-18T03:08:38+00:00\",\"dateModified\":\"2025-05-22T04:58:42+00:00\",\"breadcrumb\":{\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/#breadcrumb\"},\"inLanguage\":\"zh-Hans\",\"potentialAction\":[{\"@type\":\"ReadAction\",\"target\":[\"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/\"]}]},{\"@type\":\"ImageObject\",\"inLanguage\":\"zh-Hans\",\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/#primaryimage\",\"url\":\"https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/111222.png\",\"contentUrl\":\"https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/111222.png\",\"width\":667,\"height\":342},{\"@type\":\"BreadcrumbList\",\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/#breadcrumb\",\"itemListElement\":[{\"@type\":\"ListItem\",\"position\":1,\"name\":\"\u9996\u9875\",\"item\":\"https:\/\/knoka.vip\/\"},{\"@type\":\"ListItem\",\"position\":2,\"name\":\"\u4e00\u6587\u5feb\u901f\u5b66\u4f1aFastAPI\u90e8\u7f72Step-Audio-TTS-3B\u6a21\u578b\"}]},{\"@type\":\"WebSite\",\"@id\":\"https:\/\/knoka.vip\/#website\",\"url\":\"https:\/\/knoka.vip\/\",\"name\":\"\u4eca\u5929\u5f00\u59cb\u5b66AI\",\"description\":\"\u77e5\u8bc6\u5206\u4eab\",\"publisher\":{\"@id\":\"https:\/\/knoka.vip\/#\/schema\/person\/59bf442e4e4c21f6969b984b8c5bfc84\"},\"potentialAction\":[{\"@type\":\"SearchAction\",\"target\":{\"@type\":\"EntryPoint\",\"urlTemplate\":\"https:\/\/knoka.vip\/?s={search_term_string}\"},\"query-input\":{\"@type\":\"PropertyValueSpecification\",\"valueRequired\":true,\"valueName\":\"search_term_string\"}}],\"inLanguage\":\"zh-Hans\"},{\"@type\":[\"Person\",\"Organization\"],\"@id\":\"https:\/\/knoka.vip\/#\/schema\/person\/59bf442e4e4c21f6969b984b8c5bfc84\",\"name\":\"Knoka\",\"image\":{\"@type\":\"ImageObject\",\"inLanguage\":\"zh-Hans\",\"@id\":\"https:\/\/knoka.vip\/#\/schema\/person\/image\/\",\"url\":\"https:\/\/gravatar.pho.ink\/avatar\/a81dd1238e551ec6c470995487946913852d59837b557d5166ae60169466da05?s=96&r=g&d=404\",\"contentUrl\":\"https:\/\/gravatar.pho.ink\/avatar\/a81dd1238e551ec6c470995487946913852d59837b557d5166ae60169466da05?s=96&r=g&d=404\",\"caption\":\"Knoka\"},\"logo\":{\"@id\":\"https:\/\/knoka.vip\/#\/schema\/person\/image\/\"},\"sameAs\":[\"http:\/\/118.178.172.39\"],\"url\":\"https:\/\/knoka.vip\/index.php\/author\/admin\/\"}]}<\/script>\n<!-- \/ Yoast SEO plugin. -->","yoast_head_json":{"title":"\u4e00\u6587\u5feb\u901f\u5b66\u4f1aFastAPI\u90e8\u7f72Step-Audio-TTS-3B\u6a21\u578b - \u4eca\u5929\u5f00\u59cb\u5b66AI","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/\u4e00\u6587\u5feb\u901f\u5b66\u4f1afastapi\u90e8\u7f72step-audio-tts-3b\u6a21\u578b\/","og_locale":"zh_CN","og_type":"article","og_title":"\u4e00\u6587\u5feb\u901f\u5b66\u4f1aFastAPI\u90e8\u7f72Step-Audio-TTS-3B\u6a21\u578b - \u4eca\u5929\u5f00\u59cb\u5b66AI","og_description":"\u73af\u5883\u51c6\u5907 \u9996\u5148\u51c6\u5907\u4e00\u53f0\u663e\u5b58\uff1e=12G\u7684\u670d\u52a1\u5668\uff0c\u6211\u8fd9\u91cc\u9009\u7528\u7684\u662f4090 24G\u4e91\u670d\u52a1\u5668 \u63a5\u7740\u5148\u62c9\u53d6\u5b98\u65b9\u4ee3\u7801\uff0c\u7136\u540e [&hellip;]","og_url":"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/\u4e00\u6587\u5feb\u901f\u5b66\u4f1afastapi\u90e8\u7f72step-audio-tts-3b\u6a21\u578b\/","og_site_name":"\u4eca\u5929\u5f00\u59cb\u5b66AI","article_published_time":"2025-04-18T03:08:38+00:00","article_modified_time":"2025-05-22T04:58:42+00:00","og_image":[{"width":667,"height":342,"url":"http:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/111222.png","type":"image\/png"}],"author":"Knoka","twitter_card":"summary_large_image","twitter_misc":{"\u4f5c\u8005":"Knoka","\u9884\u8ba1\u9605\u8bfb\u65f6\u95f4":"1 \u5206"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"Article","@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/#article","isPartOf":{"@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/"},"author":{"name":"Knoka","@id":"https:\/\/knoka.vip\/#\/schema\/person\/59bf442e4e4c21f6969b984b8c5bfc84"},"headline":"\u4e00\u6587\u5feb\u901f\u5b66\u4f1aFastAPI\u90e8\u7f72Step-Audio-TTS-3B\u6a21\u578b","datePublished":"2025-04-18T03:08:38+00:00","dateModified":"2025-05-22T04:58:42+00:00","mainEntityOfPage":{"@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/"},"wordCount":99,"commentCount":0,"publisher":{"@id":"https:\/\/knoka.vip\/#\/schema\/person\/59bf442e4e4c21f6969b984b8c5bfc84"},"image":{"@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/#primaryimage"},"thumbnailUrl":"https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/111222.png","articleSection":["\u6a21\u578b\u90e8\u7f72"],"inLanguage":"zh-Hans","potentialAction":[{"@type":"CommentAction","name":"Comment","target":["http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/#respond"]}]},{"@type":"WebPage","@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/","url":"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/","name":"\u4e00\u6587\u5feb\u901f\u5b66\u4f1aFastAPI\u90e8\u7f72Step-Audio-TTS-3B\u6a21\u578b - \u4eca\u5929\u5f00\u59cb\u5b66AI","isPartOf":{"@id":"https:\/\/knoka.vip\/#website"},"primaryImageOfPage":{"@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/#primaryimage"},"image":{"@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/#primaryimage"},"thumbnailUrl":"https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/111222.png","datePublished":"2025-04-18T03:08:38+00:00","dateModified":"2025-05-22T04:58:42+00:00","breadcrumb":{"@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/#breadcrumb"},"inLanguage":"zh-Hans","potentialAction":[{"@type":"ReadAction","target":["http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/"]}]},{"@type":"ImageObject","inLanguage":"zh-Hans","@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/#primaryimage","url":"https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/111222.png","contentUrl":"https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/111222.png","width":667,"height":342},{"@type":"BreadcrumbList","@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/18\/%e4%b8%80%e6%96%87%e5%bf%ab%e9%80%9f%e5%ad%a6%e4%bc%9afastapi%e9%83%a8%e7%bd%b2step-audio-tts-3b%e6%a8%a1%e5%9e%8b\/#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"\u9996\u9875","item":"https:\/\/knoka.vip\/"},{"@type":"ListItem","position":2,"name":"\u4e00\u6587\u5feb\u901f\u5b66\u4f1aFastAPI\u90e8\u7f72Step-Audio-TTS-3B\u6a21\u578b"}]},{"@type":"WebSite","@id":"https:\/\/knoka.vip\/#website","url":"https:\/\/knoka.vip\/","name":"\u4eca\u5929\u5f00\u59cb\u5b66AI","description":"\u77e5\u8bc6\u5206\u4eab","publisher":{"@id":"https:\/\/knoka.vip\/#\/schema\/person\/59bf442e4e4c21f6969b984b8c5bfc84"},"potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https:\/\/knoka.vip\/?s={search_term_string}"},"query-input":{"@type":"PropertyValueSpecification","valueRequired":true,"valueName":"search_term_string"}}],"inLanguage":"zh-Hans"},{"@type":["Person","Organization"],"@id":"https:\/\/knoka.vip\/#\/schema\/person\/59bf442e4e4c21f6969b984b8c5bfc84","name":"Knoka","image":{"@type":"ImageObject","inLanguage":"zh-Hans","@id":"https:\/\/knoka.vip\/#\/schema\/person\/image\/","url":"https:\/\/gravatar.pho.ink\/avatar\/a81dd1238e551ec6c470995487946913852d59837b557d5166ae60169466da05?s=96&r=g&d=404","contentUrl":"https:\/\/gravatar.pho.ink\/avatar\/a81dd1238e551ec6c470995487946913852d59837b557d5166ae60169466da05?s=96&r=g&d=404","caption":"Knoka"},"logo":{"@id":"https:\/\/knoka.vip\/#\/schema\/person\/image\/"},"sameAs":["http:\/\/118.178.172.39"],"url":"https:\/\/knoka.vip\/index.php\/author\/admin\/"}]}},"_links":{"self":[{"href":"https:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/posts\/204","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/comments?post=204"}],"version-history":[{"count":0,"href":"https:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/posts\/204\/revisions"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/media\/211"}],"wp:attachment":[{"href":"https:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/media?parent=204"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/categories?post=204"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/tags?post=204"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}