From 3226a277c608ab0f809816e60d28690f25160b99 Mon Sep 17 00:00:00 2001 From: fayejf Date: Mon, 8 May 2023 16:30:51 -0700 Subject: [PATCH] reflect som and vahid comment Signed-off-by: fayejf --- .../ctc/speech_to_text_buffered_infer_ctc.py | 4 +++- nemo/collections/asr/parts/utils/eval_utils.py | 2 +- 2 files changed, 4 insertions(+), 2 deletions(-) diff --git a/examples/asr/asr_chunked_inference/ctc/speech_to_text_buffered_infer_ctc.py b/examples/asr/asr_chunked_inference/ctc/speech_to_text_buffered_infer_ctc.py index 65ae73f15212..41ec4de5c62b 100644 --- a/examples/asr/asr_chunked_inference/ctc/speech_to_text_buffered_infer_ctc.py +++ b/examples/asr/asr_chunked_inference/ctc/speech_to_text_buffered_infer_ctc.py @@ -27,7 +27,9 @@ total_buffer_in_secs=4.0 \ chunk_len_in_secs=1.6 \ model_stride=4 \ - batch_size=32 + batch_size=32 \ + clean_groundtruth_text=True \ + langid='en' # NOTE: You can use `DEBUG=1 python speech_to_text_buffered_infer_ctc.py ...` to print out the diff --git a/nemo/collections/asr/parts/utils/eval_utils.py b/nemo/collections/asr/parts/utils/eval_utils.py index 5d0459978be2..eab975671a15 100644 --- a/nemo/collections/asr/parts/utils/eval_utils.py +++ b/nemo/collections/asr/parts/utils/eval_utils.py @@ -104,7 +104,7 @@ def cal_write_wer( if 'text' not in sample: raise ValueError( - "ground-truth text does not present in manifest! Cannot calculate Word Error Rate. Exiting!" + "ground-truth text is not present in manifest! Cannot calculate Word Error Rate. Exiting!" ) hyp = sample[pred_text_attr_name]