Spaces:

distil-whisper
/

hallucination-analysis

Running

sanchit-gandhi committed on Oct 6, 2023

Commit

65f6dc4

1 Parent(s): eed20cf

make style

Files changed (1) hide show

app.py CHANGED Viewed

@@ -74,9 +74,11 @@ def get_visualisation(idx, model="large-v2", round_dp=2, ngram_degree=5):
     if model == "large-v2":
         text2 = norm_pred_v2[idx]
     elif model == "large-32-2":
-        text2 =  norm_pred_32_2[idx]
     else:
-        raise ValueError(f"Got unknown model {model}, should be one of `'large-v2'` or `'large-32-2'`.")
     wer_output = process_words(text1, text2, wer_default, wer_default)
     wer_percentage = round(100 * wer_output.wer, round_dp)
@@ -96,7 +98,13 @@ def get_visualisation(idx, model="large-v2", round_dp=2, ngram_degree=5):
     diff = compare_string(text1, text2)
     full_text = style_text(diff)
-    return (sampling_rate, array), wer_percentage, ier_percentage, repeated_ngrams, full_text
 def get_side_by_side_visualisation(idx):
@@ -128,7 +136,7 @@ if __name__ == "__main__":
             """
         )
         gr.Markdown(
-            "Analyse the transcriptions generated by the Whisper large-v2 and large-32-2 models on the TEDLIUM dev set."
             "The transcriptions for both models are shown at the bottom of the demo. The text diff for each is computed "
             "relative to the target transcriptions. Insertions are displayed in <span style='background-color:Lightgreen'>green</span>, and "
             "deletions in <span style='background-color:#FFCCCB'><s>red</s></span>."

     if model == "large-v2":
         text2 = norm_pred_v2[idx]
     elif model == "large-32-2":
+        text2 = norm_pred_32_2[idx]
     else:
+        raise ValueError(
+            f"Got unknown model {model}, should be one of `'large-v2'` or `'large-32-2'`."
+        )
     wer_output = process_words(text1, text2, wer_default, wer_default)
     wer_percentage = round(100 * wer_output.wer, round_dp)
     diff = compare_string(text1, text2)
     full_text = style_text(diff)
+    return (
+        (sampling_rate, array),
+        wer_percentage,
+        ier_percentage,
+        repeated_ngrams,
+        full_text,
+    )
 def get_side_by_side_visualisation(idx):
             """
         )
         gr.Markdown(
+            "Analyse the transcriptions generated by the Whisper large-v2 and large-32-2 models on the TEDLIUM dev set. "
             "The transcriptions for both models are shown at the bottom of the demo. The text diff for each is computed "
             "relative to the target transcriptions. Insertions are displayed in <span style='background-color:Lightgreen'>green</span>, and "
             "deletions in <span style='background-color:#FFCCCB'><s>red</s></span>."