Commit
·
d515eda
1
Parent(s):
941081c
update description
Browse files
app.py
CHANGED
@@ -176,11 +176,18 @@ if __name__ == "__main__":
|
|
176 |
"""
|
177 |
)
|
178 |
gr.Markdown(
|
179 |
-
"
|
180 |
-
|
181 |
-
|
182 |
-
|
183 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
184 |
)
|
185 |
gr.Markdown("**Overall statistics:**")
|
186 |
table = gr.Dataframe(
|
|
|
176 |
"""
|
177 |
)
|
178 |
gr.Markdown(
|
179 |
+
"""
|
180 |
+
Analyse the transcriptions generated by the Whisper and Distil-Whisper models on the TED-LIUM dev set.
|
181 |
+
Analysis is performed on the overall level, where statistics are computed over the entire dev set, and also a per-sample level.
|
182 |
+
The transcriptions for both models are shown at the bottom of the demo. The text diff for each is computed
|
183 |
+
relative to the target transcriptions, where insertions are displayed in <span style='background-color:Lightgreen'>green</span>, and
|
184 |
+
deletions in <span style='background-color:#FFCCCB'><s>red</s></span>.
|
185 |
+
|
186 |
+
To quantify the amount of repetition and hallucination in the predicted transcriptions, we measure the number
|
187 |
+
of repeated 5-gram word duplicates (5-Dup.) and the insertion error rate (IER). Overall, Distil-Whisper has
|
188 |
+
roughly half the number of 5-Dup. and IER. This indicates that it has a lower propensity to hallucinate
|
189 |
+
compared to the Whisper model.
|
190 |
+
"""
|
191 |
)
|
192 |
gr.Markdown("**Overall statistics:**")
|
193 |
table = gr.Dataframe(
|