# Template metadata: title, type, group, and thumbnail image path.
title: Speech Transcription
type: community
group: Audio/Speech Processing
image: /static/templates/thumbnail-audio-sentiment.png

# HTML description of the template: a heading followed by a definition list
# of industry applications, associated models, and domain terminology.
# Kept as a literal block scalar so the markup's line breaks are preserved.
details: |
  <h1>Transcribe audio recordings with chunks</h1>
  <dl>
    <dt>Industry Applications</dt>
    <dd>medical dictation, legal transcription, podcast transcription, interview transcription, meeting minutes, lecture notes, courtroom reporting, journalism, accessibility services, broadcast media, customer service calls, research interviews</dd>
    <dt>Associated Models</dt>
    <dd>Whisper, Wav2Vec2, DeepSpeech, Google Speech-to-Text, Azure Speech Services</dd>
    <dt>Domain Terminology</dt>
    <dd>speech-to-text, audio transcription, voice recognition, dictation, transcription with sentiment</dd>
  </dl>

# Labeling interface markup (the tag set matches Label Studio's XML config;
# NOTE(review): confirm against the consuming tool):
#   - Audio "audio" takes its source from the task field $audio.
#   - Labels "label" offers the values Speech and Noise (Noise drawn in grey).
#   - TextArea "transcription" and Choices "sentiment" are both declared
#     perRegion and conditioned on whenTagName="label" /
#     whenLabelValue="Speech".
# The html attributes carry span markup for the emoji choices. Their angle
# brackets are written as &lt; / &gt; because a raw "<" inside an XML
# attribute value is not well-formed.
config: |
  <View>
    <Audio name="audio" value="$audio" />
    <Labels name="label" toName="audio">
      <Label value="Speech"/>
      <Label value="Noise" background="grey"/>
    </Labels>
    <TextArea name="transcription" toName="audio"
              perRegion="true" whenTagName="label" whenLabelValue="Speech"
              displayMode="region-list"/>
    <Choices name="sentiment" toName="audio" showInline="true"
             perRegion="true" whenTagName="label" whenLabelValue="Speech">
      <Choice value="Positive" html="&lt;span style='font-size: 45px; vertical-align: middle;'&gt; 😀 &lt;/span&gt;"/>
      <Choice value="Neutral" html="&lt;span style='font-size: 45px; vertical-align: middle;'&gt; 😐 &lt;/span&gt;"/>
      <Choice value="Negative" html="&lt;span style='font-size: 45px; vertical-align: middle;'&gt; 🙁 &lt;/span&gt;"/>
    </Choices>
  </View>