Loading...
Loading...
Transcribe audio files to text with optional diarization and known-speaker hints. Use when a user asks to transcribe speech from audio/video, extract text from recordings, or label speakers in interviews or meetings.
npx skill4agent add openai/skills transcribe
OPENAI_API_KEY
transcribe_diarize.py
output/transcribe/
gpt-4o-mini-transcribe
--response-format text
--model gpt-4o-transcribe-diarize --response-format diarized_json
--chunking-strategy auto
gpt-4o-transcribe-diarize
output/transcribe/<job-id>/
--out-dir
uv
uv pip install openai
uv
python3 -m pip install openai
OPENAI_API_KEY

export CODEX_HOME="${CODEX_HOME:-$HOME/.codex}"
export TRANSCRIBE_CLI="$CODEX_HOME/skills/transcribe/scripts/transcribe_diarize.py"

$CODEX_HOME/skills
~/.codex/skills

python3 "$TRANSCRIBE_CLI" \
path/to/audio.wav \
--out transcript.txt

python3 "$TRANSCRIBE_CLI" \
meeting.m4a \
--model gpt-4o-transcribe-diarize \
--known-speaker "Alice=refs/alice.wav" \
--known-speaker "Bob=refs/bob.wav" \
--response-format diarized_json \
--out-dir output/transcribe/meeting

python3 "$TRANSCRIBE_CLI" \
interview.mp3 \
--response-format text \
--out interview.txt

references/api.md