Loading...
Loading...
Analyze video content using visual/video large models. Trigger this tool when the user says things like "analyze video", "video understanding", or "look at this video".
npx skill4agent add zrong/skills video-analyzer
# VolcEngine (Doubao)
export ARK_API_KEY="your-api-key"
# OpenAI
export OPENAI_API_KEY="your-api-key"
scripts/models.json, base_url, api_key_env, model, api_type, responses, chat_completions, supports_video
$ARGUMENTS, default_model, models.json, scripts/
uv run analyze.py --video <video path or URL> --prompt "<analysis prompt>"
--model <name>
--frames <number>
--max-size <pixels>
# Local video
uv run analyze.py --video /path/to/video.mp4 --prompt "Describe the video content"
# Direct online video URL
uv run analyze.py --video https://example.com/video.mp4 --prompt "Analyze the video"
# Video website URL (YouTube, Bilibili, etc.)
uv run analyze.py --video https://www.youtube.com/watch?v=xxxxx --prompt "Summarize the video"
# Specify model and number of frames
uv run analyze.py --video video.mp4 --model doubao-vision --frames 20 --prompt "Analyze"
yt-dlp