Skip to content

Commit

Permalink
Merge pull request espnet#4114 from ftshijt/master
Browse files Browse the repository at this point in the history
Fix fisher_callhome_spanish update (compatibility to eg1)
  • Loading branch information
ftshijt authored Feb 27, 2022
2 parents 812ab14 + 15edb39 commit 637d8c3
Show file tree
Hide file tree
Showing 7 changed files with 89 additions and 22 deletions.
71 changes: 67 additions & 4 deletions egs2/fisher_callhome_spanish/asr1/RESULTS.md
Original file line number Diff line number Diff line change
@@ -1,12 +1,75 @@
<!-- Generated by scripts/utils/show_asr_result.sh -->
# RESULTS
## Environments
- date: `Sat Nov 27 12:21:09 EST 2021`
- date: `Fri Feb 25 11:45:29 EST 2022`
- python version: `3.9.7 (default, Sep 16 2021, 13:09:58) [GCC 7.5.0]`
- espnet version: `espnet 0.10.3a3`
- espnet version: `espnet 0.10.7a1`
- pytorch version: `pytorch 1.9.0`
- Git hash: `9d06e80ac454bfbc4b95575d7f2f48da0cc880f9`
- Commit date: `Mon Nov 22 01:34:44 2021 -0500`
- Git hash: `54799d2fa7beb702ab909a7e57cc70288e3ce96c`
- Commit date: `Tue Feb 22 10:31:31 2022 -0500`

## asr_8k_conformer (no callhome training)
### WER

|dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
|---|---|---|---|---|---|---|---|---|
|decode_asr_asr_model_valid.acc.ave/callhome_devtest|3956|37982|64.9|24.8|10.3|6.4|41.5|79.8|
|decode_asr_asr_model_valid.acc.ave/callhome_evltest|1825|19035|63.1|25.6|11.3|6.4|43.3|82.2|
|decode_asr_asr_model_valid.acc.ave/fisher_dev|3977|40961|78.5|13.4|8.1|4.8|26.3|65.6|
|decode_asr_asr_model_valid.acc.ave/fisher_dev2|3958|39871|78.2|14.0|7.8|5.8|27.7|68.1|
|decode_asr_asr_model_valid.acc.ave/fisher_test|3641|40011|80.0|12.8|7.2|5.8|25.8|64.2|

### CER

|dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
|---|---|---|---|---|---|---|---|---|
|decode_asr_asr_model_valid.acc.ave/callhome_devtest|3956|180997|80.8|7.1|12.1|6.2|25.4|79.8|
|decode_asr_asr_model_valid.acc.ave/callhome_evltest|1825|91266|79.2|7.6|13.2|5.9|26.8|82.2|
|decode_asr_asr_model_valid.acc.ave/fisher_dev|3977|194297|88.6|3.4|8.0|5.3|16.7|65.6|
|decode_asr_asr_model_valid.acc.ave/fisher_dev2|3958|189893|88.4|3.8|7.7|7.0|18.6|68.1|
|decode_asr_asr_model_valid.acc.ave/fisher_test|3641|194507|89.6|3.2|7.3|5.9|16.3|64.2|

### TER

|dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
|---|---|---|---|---|---|---|---|---|
|decode_asr_asr_model_valid.acc.ave/callhome_devtest|3956|56665|64.3|20.7|15.0|5.6|41.3|79.8|
|decode_asr_asr_model_valid.acc.ave/callhome_evltest|1825|28386|62.2|21.4|16.3|6.1|43.9|82.2|
|decode_asr_asr_model_valid.acc.ave/fisher_dev|3977|55856|79.0|11.6|9.4|6.5|27.5|65.6|
|decode_asr_asr_model_valid.acc.ave/fisher_dev2|3958|53962|79.1|12.5|8.4|8.9|29.8|68.1|
|decode_asr_asr_model_valid.acc.ave/fisher_test|3641|54138|81.4|10.7|7.9|7.7|26.3|64.2|

## asr_8k_transformer (no callhome training)
### WER

|dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
|---|---|---|---|---|---|---|---|---|
|decode_asr_asr_model_valid.acc.ave/callhome_devtest|3956|37982|53.1|33.3|13.7|6.0|52.9|85.1|
|decode_asr_asr_model_valid.acc.ave/callhome_evltest|1825|19035|52.3|34.0|13.7|6.0|53.7|86.7|
|decode_asr_asr_model_valid.acc.ave/fisher_dev|3977|40961|76.8|16.5|6.7|5.1|28.3|70.0|
|decode_asr_asr_model_valid.acc.ave/fisher_dev2|3958|39871|77.8|16.3|5.9|6.0|28.2|70.8|
|decode_asr_asr_model_valid.acc.ave/fisher_test|3641|40011|79.9|14.5|5.5|5.8|25.9|69.2|

### CER

|dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
|---|---|---|---|---|---|---|---|---|
|decode_asr_asr_model_valid.acc.ave/callhome_devtest|3956|180997|74.3|10.0|15.7|6.2|31.9|85.1|
|decode_asr_asr_model_valid.acc.ave/callhome_evltest|1825|91266|73.3|10.2|16.5|6.1|32.8|86.7|
|decode_asr_asr_model_valid.acc.ave/fisher_dev|3977|194297|89.7|4.0|6.3|5.6|15.9|70.0|
|decode_asr_asr_model_valid.acc.ave/fisher_dev2|3958|189893|90.4|4.1|5.5|7.0|16.6|70.8|
|decode_asr_asr_model_valid.acc.ave/fisher_test|3641|194507|91.6|3.4|5.0|5.9|14.3|69.2|

### TER

|dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
|---|---|---|---|---|---|---|---|---|
|decode_asr_asr_model_valid.acc.ave/callhome_devtest|3956|56665|52.2|28.0|19.8|5.0|52.8|85.1|
|decode_asr_asr_model_valid.acc.ave/callhome_evltest|1825|28386|50.8|28.9|20.2|5.2|54.3|86.7|
|decode_asr_asr_model_valid.acc.ave/fisher_dev|3977|55856|76.2|14.3|9.5|5.8|29.6|70.0|
|decode_asr_asr_model_valid.acc.ave/fisher_dev2|3958|53962|77.5|14.3|8.2|7.9|30.4|70.8|
|decode_asr_asr_model_valid.acc.ave/fisher_test|3641|54138|80.1|12.3|7.5|6.6|26.5|69.2|


## asr_train_asr_raw_bpe1000_sp
### WER
Expand Down
2 changes: 1 addition & 1 deletion egs2/fisher_callhome_spanish/asr1/conf/pitch.conf
Original file line number Diff line number Diff line change
@@ -1 +1 @@
--sample-frequency=16000
--sample-frequency=8000
11 changes: 6 additions & 5 deletions egs2/fisher_callhome_spanish/asr1/local/data.sh
Original file line number Diff line number Diff line change
Expand Up @@ -65,13 +65,14 @@ if [ ${stage} -le 1 ] && [ ${stop_stage} -ge 1 ]; then
# concatenate multiple utterances
local/normalize_trans.sh ${sfisher_transcripts} ${callhome_transcripts}

utils/combine_data.sh \
--extra-files "text.lc.es text.lc.rm.es text.tc.es" \
data/train \
data/fisher_train data/callhome_train/
# Skip the combination to keep the same conditions as the previous result
# utils/combine_data.sh \
# --extra-files "text.lc.es text.lc.rm.es text.tc.es" \
# data/train \
# data/fisher_train data/callhome_train/

cp -r data/fisher_train data/train
cp -r data/fisher_dev data/dev

fi


Expand Down
3 changes: 1 addition & 2 deletions egs2/fisher_callhome_spanish/asr1/run.sh
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,7 @@ nbpe=1000

./asr.sh \
--ngpu 1 \
--fs 8k \
--audio_format "flac.ark" \
--local_data_opts "--stage 0" \
--use_lm false \
Expand All @@ -30,7 +31,5 @@ nbpe=1000
--train_set "${train_set}" \
--valid_set "${train_dev}" \
--test_sets "${test_set}" \
--gpu_inference true \
--inference_nj 10 \
--bpe_train_text "data/${train_set}/text" \
--lm_train_text "data/${train_set}/text" "$@"
2 changes: 1 addition & 1 deletion egs2/fisher_callhome_spanish/st1/conf/pitch.conf
Original file line number Diff line number Diff line change
@@ -1 +1 @@
--sample-frequency=16000
--sample-frequency=8000
20 changes: 12 additions & 8 deletions egs2/fisher_callhome_spanish/st1/local/data.sh
Original file line number Diff line number Diff line change
Expand Up @@ -68,16 +68,20 @@ if [ ${stage} -le 1 ] && [ ${stop_stage} -ge 1 ]; then
local/normalize_trans.sh ${sfisher_transcripts} ${callhome_transcripts}
fi

if [ ${stage} -le 1 ] && [ ${stop_stage} -ge 1 ]; then
if [ ${stage} -le 2 ] && [ ${stop_stage} -ge 2 ]; then
log "stage 2: Combine train and dev set"
utils/combine_data.sh \
--extra-files "text.lc.en text.lc.es text.lc.rm.en text.lc.rm.es text.tc.en text.tc.es" \
data/train \
data/fisher_train data/callhome_train/

# Skip the combination to keep the same conditions as the previous result
# utils/combine_data.sh \
# --extra-files "text.lc.en text.lc.es text.lc.rm.en text.lc.rm.es text.tc.en text.tc.es" \
# data/train \
# data/fisher_train data/callhome_train/

cp -r data/fisher_train data/train
cp -r data/fisher_dev data/dev
rm data/dev/text.*.en
# Use a single English reference (the ".0" files) for the dev set
ln -sf text.lc.en.0 data/dev/text.lc.en
ln -sf text.tc.en.0 data/dev/text.tc.en
ln -sf text.lc.rm.en.0 data/dev/text.lc.rm.en
cp data/fisher_dev/text.lc.en.0 data/dev/text.lc.en
cp data/fisher_dev/text.tc.en.0 data/dev/text.tc.en
cp data/fisher_dev/text.lc.rm.en.0 data/dev/text.lc.rm.en
fi
2 changes: 1 addition & 1 deletion egs2/fisher_callhome_spanish/st1/run.sh
Original file line number Diff line number Diff line change
Expand Up @@ -27,7 +27,7 @@ tgt_case=lc.rm
--use_lm false \
--token_joint false \
--nj 40 \
--inference_nj 8 \
--fs 8k \
--src_lang ${src_lang} \
--tgt_lang ${tgt_lang} \
--src_token_type "bpe" \
Expand Down

0 comments on commit 637d8c3

Please sign in to comment.