Skip to content

Commit 1d86248

Browse files
authored
Merge pull request #1742 from zh794390558/wfst
[speechx] update wfst graph
2 parents 85b50c4 + 4d8aee0 commit 1d86248

File tree

2 files changed

+16
-6
lines changed

2 files changed

+16
-6
lines changed

speechx/examples/ds2_ol/aishell/README.md

Lines changed: 11 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -8,7 +8,7 @@ Mandarin -> 16.14 % N=104612 C=88190 S=16110 D=312 I=465
88
Other -> 0.00 % N=0 C=0 S=0 D=0 I=0
99
```
1010

11-
## CTC Prefix Beam Search w LM
11+
## CTC Prefix Beam Search w/ LM
1212

1313
LM: zh_giga.no_cna_cmn.prune01244.klm
1414
```
@@ -19,9 +19,18 @@ Other -> 0.00 % N=0 C=0 S=0 D=0 I=0
1919

2020
## CTC WFST
2121

22-
LM: aishell train
22+
LM: [aishell train](http://paddlespeech.bj.bcebos.com/speechx/examples/ds2_ol/aishell/aishell_graph.zip)
23+
--acoustic_scale=1.2
2324
```
2425
Overall -> 11.14 % N=103017 C=93363 S=9583 D=71 I=1819
2526
Mandarin -> 11.14 % N=103017 C=93363 S=9583 D=71 I=1818
2627
Other -> 0.00 % N=0 C=0 S=0 D=0 I=1
2728
```
29+
30+
LM: [wenetspeech](http://paddlespeech.bj.bcebos.com/speechx/examples/ds2_ol/aishell/wenetspeech_graph.zip)
31+
--acoustic_scale=1.5
32+
```
33+
Overall -> 10.93 % N=104765 C=93410 S=9780 D=1575 I=95
34+
Mandarin -> 10.93 % N=104762 C=93410 S=9779 D=1573 I=95
35+
Other -> 100.00 % N=3 C=0 S=1 D=2 I=0
36+
```

speechx/examples/ds2_ol/aishell/run.sh

Lines changed: 5 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -87,7 +87,7 @@ if [ ${stage} -le 2 ] && [ ${stop_stage} -ge 2 ]; then
8787
ctc-prefix-beam-search-decoder-ol \
8888
--feature_rspecifier=scp:$data/split${nj}/JOB/feat.scp \
8989
--model_path=$model_dir/avg_1.jit.pdmodel \
90-
--params_path=$model_dir/avg_1.jit.pdiparams \
90+
--param_path=$model_dir/avg_1.jit.pdiparams \
9191
--model_output_names=softmax_0.tmp_0,tmp_5,concat_0.tmp_0,concat_1.tmp_0 \
9292
--dict_file=$vocb_dir/vocab.txt \
9393
--result_wspecifier=ark,t:$data/split${nj}/JOB/result
@@ -102,7 +102,7 @@ if [ ${stage} -le 3 ] && [ ${stop_stage} -ge 3 ]; then
102102
ctc-prefix-beam-search-decoder-ol \
103103
--feature_rspecifier=scp:$data/split${nj}/JOB/feat.scp \
104104
--model_path=$model_dir/avg_1.jit.pdmodel \
105-
--params_path=$model_dir/avg_1.jit.pdiparams \
105+
--param_path=$model_dir/avg_1.jit.pdiparams \
106106
--model_output_names=softmax_0.tmp_0,tmp_5,concat_0.tmp_0,concat_1.tmp_0 \
107107
--dict_file=$vocb_dir/vocab.txt \
108108
--lm_path=$lm \
@@ -119,17 +119,18 @@ if [ ${stage} -le 4 ] && [ ${stop_stage} -ge 4 ]; then
119119
pushd $wfst
120120
wget -c https://paddlespeech.bj.bcebos.com/s2t/paddle_asr_online/aishell_graph.zip
121121
unzip aishell_graph.zip
122+
mv aishell_graph/*
122123
popd
123124
fi
124125

125-
graph_dir=$wfst/aishell_graph
126+
graph_dir=$wfst/
126127

127128
# TLG decoder
128129
utils/run.pl JOB=1:$nj $data/split${nj}/JOB/recog.wfst.log \
129130
wfst-decoder-ol \
130131
--feature_rspecifier=scp:$data/split${nj}/JOB/feat.scp \
131132
--model_path=$model_dir/avg_1.jit.pdmodel \
132-
--params_path=$model_dir/avg_1.jit.pdiparams \
133+
--param_path=$model_dir/avg_1.jit.pdiparams \
133134
--word_symbol_table=$graph_dir/words.txt \
134135
--model_output_names=softmax_0.tmp_0,tmp_5,concat_0.tmp_0,concat_1.tmp_0 \
135136
--graph_path=$graph_dir/TLG.fst --max_active=7500 \

0 commit comments

Comments
 (0)