# label-studio.git

# Template definition for a speaker segmentation / diarization labeling task.
# The scalar keys below are descriptive metadata; `details` carries an HTML
# description and `config` carries the labeling interface markup.
title: Speaker Segmentation
type: community
group: Audio/Speech Processing
# NOTE(review): path looks like a preview image served from the app's static
# assets -- confirm the file exists under that location.
image: /static/templates/speaker-segmentation.png
# HTML description kept as a literal block scalar (`|`), so line breaks and
# indentation inside it are preserved verbatim. It holds a heading plus a
# definition list with three entries: industry applications, associated
# models, and domain terminology.
details: |
  <h1>Perform speaker segmentation / diarization task</h1>
  <dl>
    <dt>Industry Applications</dt>
    <dd>meeting transcription, podcast production, call center analytics, courtroom transcription, broadcast news, conference calls, interview processing, lecture recordings, multi-speaker recordings, radio show analysis, parliamentary proceedings, teleconferencing</dd>
    <dt>Associated Models</dt>
    <dd>x-vectors, PLDA, VBx, pyannote.audio, speaker embedding</dd>
    <dt>Domain Terminology</dt>
    <dd>speaker diarization, voice activity detection, speaker identification, speaker change detection</dd>
  </dl>
# Labeling interface markup, also a literal block scalar. A single <View>
# contains:
#   - a <Labels> control named "label" whose toName points at "audio", offering
#     two choices ("Speaker one", "Speaker two");
#   - an <Audio> object named "audio" whose value is the "$audio" placeholder
#     (presumably resolved from the task's `audio` field -- confirm).
# NOTE(review): `zoom` and `hotkey` are set on <Labels>; they read like audio
# player options and may have been intended for the <Audio> tag. Verify against
# the tag reference before moving them -- "ctrl+enter" could collide with an
# application-level shortcut if it becomes active.
# NOTE(review): both label backgrounds (#00FF00, #12ad59) are shades of green,
# which may make the two speakers hard to tell apart on the waveform.
config: |
  <View>
    <Labels name="label" toName="audio" zoom="true" hotkey="ctrl+enter">
      <Label value="Speaker one" background="#00FF00"/>
      <Label value="Speaker two" background="#12ad59"/>
    </Labels>
    <Audio name="audio" value="$audio" />
  </View>