sanchit-gandhi committed on
Commit
d515eda
·
1 Parent(s): 941081c

update description

Browse files
Files changed (1) hide show
  1. app.py +12 -5
app.py CHANGED
@@ -176,11 +176,18 @@ if __name__ == "__main__":
176
  """
177
  )
178
  gr.Markdown(
179
- "Analyse the transcriptions generated by the Whisper and Distil-Whisper models on the TEDLIUM dev set. "
180
- "Analysis is performed on the overall level, where statistics are computed over the entire dev set, and also a per-sample level. "
181
- "The transcriptions for both models are shown at the bottom of the demo. The text diff for each is computed "
182
- "relative to the target transcriptions, where insertions are displayed in <span style='background-color:Lightgreen'>green</span>, and "
183
- "deletions in <span style='background-color:#FFCCCB'><s>red</s></span>."
 
 
 
 
 
 
 
184
  )
185
  gr.Markdown("**Overall statistics:**")
186
  table = gr.Dataframe(
 
176
  """
177
  )
178
  gr.Markdown(
179
+ """
180
+ Analyse the transcriptions generated by the Whisper and Distil-Whisper models on the TED-LIUM dev set.
181
+ Analysis is performed on the overall level, where statistics are computed over the entire dev set, and also a per-sample level.
182
+ The transcriptions for both models are shown at the bottom of the demo. The text diff for each is computed
183
+ relative to the target transcriptions, where insertions are displayed in <span style='background-color:Lightgreen'>green</span>, and
184
+ deletions in <span style='background-color:#FFCCCB'><s>red</s></span>.
185
+
186
+ To quantify the amount of repetition and hallucination in the predicted transcriptions, we measure the number
187
+ of repeated 5-gram word duplicates (5-Dup.) and the insertion error rate (IER). Overall, Distil-Whisper has
188
+ roughly half the number of 5-Dup. and IER. This indicates that it has a lower propensity to hallucinate
189
+ compared to the Whisper model.
190
+ """
191
  )
192
  gr.Markdown("**Overall statistics:**")
193
  table = gr.Dataframe(