Merge pull request #1752 from yt605155624/fix_wavernn

yt605155624 · web-flow · commit 9121dfc04676 · 2022-04-22T13:55:54.000+08:00
[TTS] Fix WaveRNN white-noise bug on Paddle develop (2.3)
diff --git a/examples/csmsc/tts3/local/synthesize_e2e.sh b/examples/csmsc/tts3/local/synthesize_e2e.sh
@@ -109,6 +109,6 @@ if [ ${stage} -le 4 ] && [ ${stop_stage} -ge 4 ]; then
         --lang=zh \
         --text=${BIN_DIR}/../sentences.txt \
         --output_dir=${train_output_path}/test_e2e \
-        --phones_dict=dump/phone_id_map.txt #\
-        # --inference_dir=${train_output_path}/inference
+        --phones_dict=dump/phone_id_map.txt \
+        --inference_dir=${train_output_path}/inference
 fi
diff --git a/examples/csmsc/voc6/README.md b/examples/csmsc/voc6/README.md
@@ -114,6 +114,7 @@ The pretrained model can be downloaded here:
 
 The static model can be downloaded here:
 - [wavernn_csmsc_static_0.2.0.zip](https://paddlespeech.bj.bcebos.com/Parakeet/released_models/wavernn/wavernn_csmsc_static_0.2.0.zip)
+- [wavernn_csmsc_static_1.0.0.zip](https://paddlespeech.bj.bcebos.com/Parakeet/released_models/wavernn/wavernn_csmsc_static_1.0.0.zip) (fixes a bug with Paddle 2.3)
 
 Model | Step | eval/loss
 :-------------:|:------------:| :------------:
diff --git a/paddlespeech/t2s/models/wavernn/wavernn.py b/paddlespeech/t2s/models/wavernn/wavernn.py
@@ -360,7 +360,9 @@ def generate(self,
                 x = sample.transpose([1, 0, 2])
 
             elif self.mode == 'RAW':
-                posterior = F.softmax(logits, axis=1)
+                # Workaround for a bug with Paddle 2.3: pass the logits to Categorical directly instead of the softmax output, see https://github.com/PaddlePaddle/Paddle/commit/01f606b4f1ca3e184a59111084ed460ee0798a5a
+                # posterior = F.softmax(logits, axis=1)
+                posterior = logits
                 distrib = paddle.distribution.Categorical(posterior)
                 # corresponding operate [np.floor((fx + 1) / 2 * mu + 0.5)] in enocde_mu_law
                 # distrib.sample([1])[0].cast('float32'): [0, 2**bits-1]