import html
import typing as T

import gradio as gr
from jiwer import process_words, RemovePunctuation, ToLowerCase, Compose

# Inline CSS used for each kind of alignment error. The legend below is built
# from the same constants so the legend and the transcript cannot drift apart.
_INSERT_STYLE = "color: green;"
_SUBSTITUTE_STYLE = "color: purple;"
_SUBSTITUTE_REF_STYLE = "color: purple; text-decoration: line-through;"
_DELETE_STYLE = "color: red; text-decoration: line-through;"

# Colour legend shown above the highlighted transcript.
_LEGEND_HTML = f"""
<div style="margin-bottom: 10px;">
<strong>Legend</strong><br>
<span style="{_INSERT_STYLE}">Insertion</span>: Green<br>
<span style="{_SUBSTITUTE_STYLE}">Substitution</span>: Purple<br>
<span style="{_DELETE_STYLE}">Deletion</span>: Red<br>
</div>
"""


def make_string(words: T.List[str]) -> str:
    """Join a list of words into a single space-separated string."""
    return " ".join(words)


def _styled_span(words: T.List[str], style: str) -> str:
    """Return *words* joined, HTML-escaped and wrapped in a styled ``<span>``."""
    # The words come straight from user input, so escape them before they are
    # embedded in markup that the browser will render.
    return f'<span style="{style}">{html.escape(make_string(words))}</span>'


def highlight_errors(
    ground_truth: str,
    hypothesis: str,
    remove_punctuation: bool,
    to_lower_case: bool,
) -> T.Tuple[str, float, int, int, int]:
    """Build an HTML visualisation of the word errors between two transcripts.

    The optional transformations are applied to both strings, the strings are
    aligned with ``jiwer.process_words``, and every alignment chunk is rendered
    into an HTML fragment:

    * equal words are emitted unchanged,
    * inserted words (hypothesis only) are green,
    * substituted words are purple, hypothesis first, followed by the
      struck-through ground truth,
    * deleted words (ground truth only) are red and struck through.

    Args:
        ground_truth: Reference transcript.
        hypothesis: Transcript to compare against the reference.
        remove_punctuation: Apply ``RemovePunctuation`` to both inputs first.
        to_lower_case: Apply ``ToLowerCase`` to both inputs first.

    Returns:
        A tuple ``(html, wer, substitutions, insertions, deletions)`` where
        ``html`` is the legend followed by the highlighted transcript and the
        remaining values are taken from the ``process_words`` result.
    """
    # Only the transformations that were requested take part in the pipeline.
    transforms = []
    if remove_punctuation:
        transforms.append(RemovePunctuation())
    if to_lower_case:
        transforms.append(ToLowerCase())
    transform = Compose(transforms)

    processed = process_words(
        reference=transform(ground_truth),
        hypothesis=transform(hypothesis),
    )

    highlighted_text: T.List[str] = []

    # Walk the alignment chunks of every reference/hypothesis sentence pair.
    for alignment, ref, hyp in zip(
        processed.alignments, processed.references, processed.hypotheses
    ):
        for chunk in alignment:
            ref_words = ref[chunk.ref_start_idx : chunk.ref_end_idx]
            hyp_words = hyp[chunk.hyp_start_idx : chunk.hyp_end_idx]

            if chunk.type == "equal":
                # Matching words are shown without highlighting (still escaped).
                highlighted_text.extend(html.escape(word) for word in ref_words)
            elif chunk.type == "insert":
                highlighted_text.append(_styled_span(hyp_words, _INSERT_STYLE))
            elif chunk.type == "substitute":
                # Hypothesis word(s) first, then the struck-through ground truth.
                highlighted_text.append(
                    _styled_span(hyp_words, _SUBSTITUTE_STYLE)
                )
                highlighted_text.append(
                    _styled_span(ref_words, _SUBSTITUTE_REF_STYLE)
                )
            elif chunk.type == "delete":
                highlighted_text.append(_styled_span(ref_words, _DELETE_STYLE))

    highlighted_text_str = make_string(highlighted_text)

    # Combine legend and highlighted output.
    combined_output = f"{_LEGEND_HTML}<br>{highlighted_text_str}"

    return (
        combined_output,
        processed.wer,
        processed.substitutions,
        processed.insertions,
        processed.deletions,
    )


# Gradio Interface
interface = gr.Interface(
    fn=highlight_errors,
    inputs=[
        gr.Textbox(label="Ground Truth"),
        gr.Textbox(label="Hypothesis"),
        gr.Checkbox(label="Ignore Punctuation"),
        gr.Checkbox(label="Ignore Case"),
    ],
    outputs=[
        gr.HTML(label="Highlighted Transcript"),
        gr.Number(label="Word Error Rate"),
        gr.Number(label="Substitutions"),
        gr.Number(label="Insertions"),
        gr.Number(label="Deletions"),
    ],
    title="WER Analysis",
)

# Launched at import time, exactly as in the original script.
interface.launch()