Loading...
Loading...
Transcribe non-realtime speech with Alibaba Cloud Model Studio Qwen ASR models (`qwen3-asr-flash`, `qwen-audio-asr`, `qwen3-asr-flash-filetrans`). Use when converting recorded audio files to text, generating transcripts with timestamps, or documenting DashScope/OpenAI-compatible ASR request and response fields.
npx skill4agent add cinience/alicloud-skills alicloud-ai-audio-asr

Model names: `qwen3-asr-flash`, `qwen-audio-asr`, `qwen3-asr-flash-filetrans`

`qwen3-asr-flash`, `qwen-audio-asr`, `qwen3-asr-flash-filetrans`

python3 -m venv .venv
. .venv/bin/activate

`DASHSCOPE_API_KEY`, `dashscope_api_key`, `~/.alibabacloud/credentials`

`audio`, `model`, `qwen3-asr-flash`, `language_hints`, `zh`, `en`, `sample_rate`, `vocabulary_id`, `disfluency_removal_enabled`, `timestamp_granularities`, `sentence`, `async`, `qwen3-asr-flash-filetrans`

`text`, `task_id`, `status`, `SUCCEEDED`, `raw`

curl -sS --location 'https://dashscope.aliyuncs.com/compatible-mode/v1/chat/completions' \
--header "Authorization: Bearer $DASHSCOPE_API_KEY" \
--header 'Content-Type: application/json' \
--data '{
"model": "qwen3-asr-flash",
"messages": [
{
"role": "user",
"content": [
{
"type": "input_audio",
"input_audio": {
"data": "https://dashscope.oss-cn-beijing.aliyuncs.com/audios/welcome.mp3"
}
}
]
}
],
"stream": false,
"asr_options": {
"enable_itn": false
}
}'

curl -sS --location 'https://dashscope.aliyuncs.com/api/v1/services/audio/asr/transcription' \
--header "Authorization: Bearer $DASHSCOPE_API_KEY" \
--header 'X-DashScope-Async: enable' \
--header 'Content-Type: application/json' \
--data '{
"model": "qwen3-asr-flash-filetrans",
"input": {
"file_url": "https://dashscope.oss-cn-beijing.aliyuncs.com/audios/welcome.mp3"
}
}'

curl -sS --location "https://dashscope.aliyuncs.com/api/v1/tasks/<task_id>" \
--header "Authorization: Bearer $DASHSCOPE_API_KEY"

python skills/ai/audio/alicloud-ai-audio-asr/scripts/transcribe_audio.py \
--audio "https://dashscope.oss-cn-beijing.aliyuncs.com/audios/welcome.mp3" \
--model qwen3-asr-flash \
--language-hints zh,en \
--print-response

python skills/ai/audio/alicloud-ai-audio-asr/scripts/transcribe_audio.py \
--audio "https://dashscope.oss-cn-beijing.aliyuncs.com/audios/welcome.mp3" \
--model qwen3-asr-flash-filetrans \
--async \
--wait

`input_audio.data`, `language_hints`

`output/ai-audio-asr/transcripts/`, `output/ai-audio-asr/transcripts/`, `OUTPUT_DIR`

`references/api_reference.md`, `references/sources.md`

`skills/ai/audio/alicloud-ai-audio-tts-realtime/`