Loading...
Loading...
Use when tasks require all-in-one multimodal understanding or generation with Alibaba Cloud Model Studio Qwen Omni models, including image-plus-audio interaction, voice assistants, and realtime multimodal agents.
npx skill4agent add cinience/alicloud-skills alicloud-ai-multimodal-qwen-omni
mkdir -p output/alicloud-ai-multimodal-qwen-omni
python -m py_compile skills/ai/multimodal/alicloud-ai-multimodal-qwen-omni/scripts/prepare_omni_request.py && echo "py_compile_ok" > output/alicloud-ai-multimodal-qwen-omni/validate.txt
output/alicloud-ai-multimodal-qwen-omni/validate.txt
qwen3-omni-flash
qwen3-omni-flash-realtime
qwen-omni-turbo
qwen-omni-turbo-realtime
model
qwen3-omni-flash
text
image
audio
response_modalities
["text"]
["text","audio"]
text
audio_url
audio_chunk
usage
python skills/ai/multimodal/alicloud-ai-multimodal-qwen-omni/scripts/prepare_omni_request.py \
  --output output/alicloud-ai-multimodal-qwen-omni/request.json
references/sources.md