Loading...
Loading...
Vox single-entry voice orchestration skill. It handles environment guarding, CLI installation, on-demand model download, ASR transcription, voice cloning, pipeline execution, and task troubleshooting through natural language. Use it when users describe only their goal without providing specific commands.
npx skill4agent add catoncat/vox-cli vox
SKILL.md
# Side-effect-free pre-check (recommended to run first)
bash scripts/bootstrap.sh --check
# Actual installation and repair
bash scripts/bootstrap.sh
references/intents.md
bash scripts/ensure_model.sh <model_id|asr-auto|tts-default>
vox
bash scripts/self_check.sh [--require-model <...>] [--require-file <...>]
bash scripts/log_failure.sh --stage "<stage>" --command "<cmd>" --error "<msg>" [--retry "<retry-cmd>"]
Darwin + arm64
vox doctor --json
ok=true
verified=true
0
--json
--format ndjson
log_failure.sh
# Environment check
scripts/vox_cmd.sh doctor --json
# Check model status
scripts/vox_cmd.sh model status --json
# Offline transcription
scripts/vox_cmd.sh asr transcribe --audio ./speech.wav --lang zh --model auto --json
# Voice cloning
scripts/vox_cmd.sh tts clone --profile narrator --text "你好" --out ./out.wav --model qwen-tts-1.7b --json
# Integrated workflow
scripts/vox_cmd.sh pipeline run --profile narrator --audio ./input.wav --clone-text "把这段内容读出来" --lang zh --json
uv
ffmpeg
portaudio
VOX_CLI_PACKAGE_SPEC
VOX_CLI_GIT_URL
git+<url>
git+https://github.com/catoncat/vox-cli.git