{
  "schemaVersion": "1.0",
  "item": {
    "slug": "zhipu-tts",
    "name": "Zhipu AI TTS",
    "source": "tencent",
    "type": "skill",
    "category": "AI 智能",
    "sourceUrl": "https://clawhub.ai/franklu0819-lang/zhipu-tts",
    "canonicalUrl": "https://clawhub.ai/franklu0819-lang/zhipu-tts",
    "targetPlatform": "OpenClaw"
  },
  "install": {
    "downloadMode": "redirect",
    "downloadUrl": "/downloads/zhipu-tts",
    "sourceDownloadUrl": "https://wry-manatee-359.convex.site/api/v1/download?slug=zhipu-tts",
    "sourcePlatform": "tencent",
    "targetPlatform": "OpenClaw",
    "installMethod": "Manual import",
    "extraction": "Extract archive",
    "prerequisites": [
      "OpenClaw"
    ],
    "packageFormat": "ZIP package",
    "includedAssets": [
      "README.md",
      "SKILL.md",
      "package.json",
      "scripts/text_to_speech.sh"
    ],
    "primaryDoc": "SKILL.md",
    "quickSetup": [
      "Download the package from Yavira.",
      "Extract the archive and review SKILL.md first.",
      "Import or place the package into your OpenClaw setup."
    ],
    "agentAssist": {
      "summary": "Hand the extracted package to your coding agent with a concrete install brief instead of figuring it out manually.",
      "steps": [
        "Download the package from Yavira.",
        "Extract it into a folder your agent can access.",
        "Paste one of the prompts below and point your agent at the extracted folder."
      ],
      "prompts": [
        {
          "label": "New install",
          "body": "I downloaded a skill package from Yavira. Read SKILL.md from the extracted folder and install it by following the included instructions. Then review README.md for any prerequisites, environment setup, or post-install checks. Tell me what you changed and call out any manual steps you could not complete."
        },
        {
          "label": "Upgrade existing",
          "body": "I downloaded an updated skill package from Yavira. Read SKILL.md from the extracted folder, compare it with my current installation, and upgrade it while preserving any custom configuration unless the package docs explicitly say otherwise. Then review README.md for any prerequisites, environment setup, or post-install checks. Summarize what changed and any follow-up checks I should run."
        }
      ]
    },
    "sourceHealth": {
      "source": "tencent",
      "status": "healthy",
      "reason": "direct_download_ok",
      "recommendedAction": "download",
      "checkedAt": "2026-04-30T16:55:25.780Z",
      "expiresAt": "2026-05-07T16:55:25.780Z",
      "httpStatus": 200,
      "finalUrl": "https://wry-manatee-359.convex.site/api/v1/download?slug=network",
      "contentType": "application/zip",
      "probeMethod": "head",
      "details": {
        "probeUrl": "https://wry-manatee-359.convex.site/api/v1/download?slug=network",
        "contentDisposition": "attachment; filename=\"network-1.0.0.zip\"",
        "redirectLocation": null,
        "bodySnippet": null
      },
      "scope": "source",
      "summary": "Source download looks usable.",
      "detail": "Yavira can redirect you to the upstream package for this source.",
      "primaryActionLabel": "Download for OpenClaw",
      "primaryActionHref": "/downloads/zhipu-tts"
    },
    "validation": {
      "installChecklist": [
        "Use the Yavira download entry.",
        "Review SKILL.md after the package is downloaded.",
        "Confirm the extracted package contains the expected setup assets."
      ],
      "postInstallChecks": [
        "Confirm the extracted package includes the expected docs or setup files.",
        "Validate the skill or prompts are available in your target agent workspace.",
        "Capture any manual follow-up steps the agent could not complete."
      ]
    },
    "downloadPageUrl": "https://openagent3.xyz/downloads/zhipu-tts",
    "agentPageUrl": "https://openagent3.xyz/skills/zhipu-tts/agent",
    "manifestUrl": "https://openagent3.xyz/skills/zhipu-tts/agent.json",
    "briefUrl": "https://openagent3.xyz/skills/zhipu-tts/agent.md"
  },
  "agentAssist": {
    "summary": "Hand the extracted package to your coding agent with a concrete install brief instead of figuring it out manually.",
    "steps": [
      "Download the package from Yavira.",
      "Extract it into a folder your agent can access.",
      "Paste one of the prompts below and point your agent at the extracted folder."
    ],
    "prompts": [
      {
        "label": "New install",
        "body": "I downloaded a skill package from Yavira. Read SKILL.md from the extracted folder and install it by following the included instructions. Then review README.md for any prerequisites, environment setup, or post-install checks. Tell me what you changed and call out any manual steps you could not complete."
      },
      {
        "label": "Upgrade existing",
        "body": "I downloaded an updated skill package from Yavira. Read SKILL.md from the extracted folder, compare it with my current installation, and upgrade it while preserving any custom configuration unless the package docs explicitly say otherwise. Then review README.md for any prerequisites, environment setup, or post-install checks. Summarize what changed and any follow-up checks I should run."
      }
    ]
  },
  "documentation": {
    "source": "clawhub",
    "primaryDoc": "SKILL.md",
    "sections": [
      {
        "title": "Zhipu AI Text-to-Speech",
        "body": "Convert Chinese text to natural-sounding speech using Zhipu AI's GLM-TTS model."
      },
      {
        "title": "Setup",
        "body": "1. Get your API Key:\nGet a key from Zhipu AI Console\n\n2. Set it in your environment:\n\nexport ZHIPU_API_KEY=\"your-key-here\""
      },
      {
        "title": "System Voices (Pre-built)",
        "body": "tongtong (彤彤) - Default voice, balanced tone\nchuichui (锤锤) - Male voice, deeper tone\nxiaochen (小陈) - Young professional voice\njam - 动动动物圈 Jam voice\nkazi - 动动动物圈 Kazi voice\ndouji - 动动动物圈 Douji voice\nluodo - 动动动物圈 Luodo voice"
      },
      {
        "title": "Basic Text-to-Speech",
        "body": "Convert text to speech with default settings (tongtong voice, normal speed, WAV format):\n\nbash scripts/text_to_speech.sh \"你好，今天天气怎么样\""
      },
      {
        "title": "Advanced Options",
        "body": "Specify voice, speed, format, and output filename:\n\nbash scripts/text_to_speech.sh \"欢迎使用智能语音服务\" xiaochen 1.2 wav greeting.wav\n\nParameters:\n\ntext (required): Chinese text to convert (max 1024 characters)\nvoice (optional): tongtong (default), chuichui, xiaochen, jam, kazi, douji, luodo\nspeed (optional): Speech speed from 0.5 to 2.0 (default: 1.0)\noutput_format (optional): wav (default), pcm\noutput_file (optional): Output filename (default: output.{format})"
      },
      {
        "title": "Voice Selection Guide",
        "body": "Choose tongtong (default) for:\n\nGeneral purpose narration\nProfessional presentations\nBalanced tone requirements\n\nChoose chuichui for:\n\nMale voice needed\nDeeper, authoritative tone\nDocumentary or formal content\n\nChoose xiaochen for:\n\nYoung, energetic tone\nModern, casual content\nFriendly assistant vibe\n\nChoose jam/kazi/douji/luodo for:\n\nEntertainment content\nCharacter voices\nCreative projects"
      },
      {
        "title": "Speed Control",
        "body": "Recommended speeds:\n\n0.8-1.0: Clear, professional narration\n1.0-1.2: Natural conversational pace (default: 1.0)\n1.2-1.5: Energetic, upbeat delivery\n1.5-2.0: Fast-paced summaries (may reduce clarity)"
      },
      {
        "title": "Output Formats",
        "body": "WAV (recommended):\n\nStandard audio format\nWidely compatible\nBetter quality preservation\n\nPCM:\n\nRaw audio format\nSmaller file size\nRequires additional processing for playback"
      },
      {
        "title": "Examples",
        "body": "Create a professional greeting:\n\nbash scripts/text_to_speech.sh \"您好，感谢致电智能客服，请按1选择中文服务\" tongtong 1.0 wav greeting.wav\n\nGenerate an energetic announcement:\n\nbash scripts/text_to_speech.sh \"热烈欢迎各位嘉宾参加今天的活动！\" xiaochen 1.3 wav announcement.wav\n\nCreate a calm narration:\n\nbash scripts/text_to_speech.sh \"在这个宁静的夜晚，让我们一起欣赏美丽的星空\" chuichui 0.9 wav narration.wav"
      },
      {
        "title": "Character Limits",
        "body": "Maximum input: 1024 characters per request\nFor longer texts, split into multiple segments\nCombine audio files post-generation"
      },
      {
        "title": "Audio Quality Tips",
        "body": "Best practices:\n\nUse punctuation for natural pauses (commas, periods)\nBreak long sentences into shorter segments\nUse appropriate line breaks for paragraph pauses\nTest speed settings for your specific content\n\nSample rate: Generated audio uses 24000 Hz sampling rate for optimal quality."
      },
      {
        "title": "Troubleshooting",
        "body": "Text Length Issues:\n\nSplit texts longer than 1024 characters\nProcess segments separately\nCombine using audio editing tools\n\nAudio Quality Issues:\n\nCheck text encoding (use UTF-8)\nVerify punctuation placement\nAdjust speed settings\nTry different voices\n\nFile Playback Issues:\n\nEnsure format compatibility with your player\nWAV format works on most systems\nPCM may require conversion"
      },
      {
        "title": "API Notes",
        "body": "Responses are returned as audio files\nWatermarking enabled by default (can be disabled in account settings)\nNo strict rate limiting documented\nAudio generation typically completes in 1-3 seconds"
      }
    ],
    "body": "Zhipu AI Text-to-Speech\n\nConvert Chinese text to natural-sounding speech using Zhipu AI's GLM-TTS model.\n\nSetup\n\n1. Get your API Key: Get a key from Zhipu AI Console\n\n2. Set it in your environment:\n\nexport ZHIPU_API_KEY=\"your-key-here\"\n\nAvailable Voices\nSystem Voices (Pre-built)\ntongtong (彤彤) - Default voice, balanced tone\nchuichui (锤锤) - Male voice, deeper tone\nxiaochen (小陈) - Young professional voice\njam - 动动动物圈 Jam voice\nkazi - 动动动物圈 Kazi voice\ndouji - 动动动物圈 Douji voice\nluodo - 动动动物圈 Luodo voice\nUsage\nBasic Text-to-Speech\n\nConvert text to speech with default settings (tongtong voice, normal speed, WAV format):\n\nbash scripts/text_to_speech.sh \"你好，今天天气怎么样\"\n\nAdvanced Options\n\nSpecify voice, speed, format, and output filename:\n\nbash scripts/text_to_speech.sh \"欢迎使用智能语音服务\" xiaochen 1.2 wav greeting.wav\n\n\nParameters:\n\ntext (required): Chinese text to convert (max 1024 characters)\nvoice (optional): tongtong (default), chuichui, xiaochen, jam, kazi, douji, luodo\nspeed (optional): Speech speed from 0.5 to 2.0 (default: 1.0)\noutput_format (optional): wav (default), pcm\noutput_file (optional): Output filename (default: output.{format})\nVoice Selection Guide\n\nChoose tongtong (default) for:\n\nGeneral purpose narration\nProfessional presentations\nBalanced tone requirements\n\nChoose chuichui for:\n\nMale voice needed\nDeeper, authoritative tone\nDocumentary or formal content\n\nChoose xiaochen for:\n\nYoung, energetic tone\nModern, casual content\nFriendly assistant vibe\n\nChoose jam/kazi/douji/luodo for:\n\nEntertainment content\nCharacter voices\nCreative projects\nSpeed Control\n\nRecommended speeds:\n\n0.8-1.0: Clear, professional narration\n1.0-1.2: Natural conversational pace (default: 1.0)\n1.2-1.5: Energetic, upbeat delivery\n1.5-2.0: Fast-paced summaries (may reduce clarity)\nOutput Formats\n\nWAV (recommended):\n\nStandard audio format\nWidely compatible\nBetter quality preservation\n\nPCM:\n\nRaw audio format\nSmaller file size\nRequires additional processing for playback\nExamples\n\nCreate a professional greeting:\n\nbash scripts/text_to_speech.sh \"您好，感谢致电智能客服，请按1选择中文服务\" tongtong 1.0 wav greeting.wav\n\n\nGenerate an energetic announcement:\n\nbash scripts/text_to_speech.sh \"热烈欢迎各位嘉宾参加今天的活动！\" xiaochen 1.3 wav announcement.wav\n\n\nCreate a calm narration:\n\nbash scripts/text_to_speech.sh \"在这个宁静的夜晚，让我们一起欣赏美丽的星空\" chuichui 0.9 wav narration.wav\n\nCharacter Limits\nMaximum input: 1024 characters per request\nFor longer texts, split into multiple segments\nCombine audio files post-generation\nAudio Quality Tips\n\nBest practices:\n\nUse punctuation for natural pauses (commas, periods)\nBreak long sentences into shorter segments\nUse appropriate line breaks for paragraph pauses\nTest speed settings for your specific content\n\nSample rate: Generated audio uses 24000 Hz sampling rate for optimal quality.\n\nTroubleshooting\n\nText Length Issues:\n\nSplit texts longer than 1024 characters\nProcess segments separately\nCombine using audio editing tools\n\nAudio Quality Issues:\n\nCheck text encoding (use UTF-8)\nVerify punctuation placement\nAdjust speed settings\nTry different voices\n\nFile Playback Issues:\n\nEnsure format compatibility with your player\nWAV format works on most systems\nPCM may require conversion\nAPI Notes\nResponses are returned as audio files\nWatermarking enabled by default (can be disabled in account settings)\nNo strict rate limiting documented\nAudio generation typically completes in 1-3 seconds"
  },
  "trust": {
    "sourceLabel": "tencent",
    "provenanceUrl": "https://clawhub.ai/franklu0819-lang/zhipu-tts",
    "publisherUrl": "https://clawhub.ai/franklu0819-lang/zhipu-tts",
    "owner": "franklu0819-lang",
    "version": "1.0.0",
    "license": null,
    "verificationStatus": "Indexed source record"
  },
  "links": {
    "detailUrl": "https://openagent3.xyz/skills/zhipu-tts",
    "downloadUrl": "https://openagent3.xyz/downloads/zhipu-tts",
    "agentUrl": "https://openagent3.xyz/skills/zhipu-tts/agent",
    "manifestUrl": "https://openagent3.xyz/skills/zhipu-tts/agent.json",
    "briefUrl": "https://openagent3.xyz/skills/zhipu-tts/agent.md"
  }
}