|
21 | 21 | from numpy import float32
|
22 | 22 | from yacs.config import CfgNode
|
23 | 23 |
|
| 24 | +from paddlespeech.audio.transform.transformation import Transformation |
24 | 25 | from paddlespeech.cli.asr.infer import ASRExecutor
|
25 | 26 | from paddlespeech.cli.log import logger
|
26 | 27 | from paddlespeech.resource import CommonTaskResource
|
27 |
| -from paddlespeech.audio.transform.transformation import Transformation |
28 | 28 | from paddlespeech.s2t.frontend.featurizer.text_featurizer import TextFeaturizer
|
29 | 29 | from paddlespeech.s2t.modules.ctc import CTCDecoder
|
30 | 30 | from paddlespeech.s2t.utils.tensor_utils import add_sos_eos
|
@@ -130,8 +130,8 @@ def model_reset(self):
|
130 | 130 |
|
131 | 131 | ## conformer
|
132 | 132 | # cache for conformer online
|
133 |
| - self.att_cache = paddle.zeros([0,0,0,0]) |
134 |
| - self.cnn_cache = paddle.zeros([0,0,0,0]) |
| 133 | + self.att_cache = paddle.zeros([0, 0, 0, 0]) |
| 134 | + self.cnn_cache = paddle.zeros([0, 0, 0, 0]) |
135 | 135 |
|
136 | 136 | self.encoder_out = None
|
137 | 137 | # conformer decoding state
|
@@ -474,9 +474,10 @@ def advance_decoding(self, is_finished=False):
|
474 | 474 | # cur chunk
|
475 | 475 | chunk_xs = self.cached_feat[:, cur:end, :]
|
476 | 476 | # forward chunk
|
477 |
| - (y, self.att_cache, self.cnn_cache) = self.model.encoder.forward_chunk( |
478 |
| - chunk_xs, self.offset, required_cache_size, |
479 |
| - self.att_cache, self.cnn_cache) |
| 477 | + (y, self.att_cache, |
| 478 | + self.cnn_cache) = self.model.encoder.forward_chunk( |
| 479 | + chunk_xs, self.offset, required_cache_size, self.att_cache, |
| 480 | + self.cnn_cache, paddle.ones([0, 0, 0], dtype=paddle.bool)) |
480 | 481 | outputs.append(y)
|
481 | 482 |
|
482 | 483 | # update the global offset, in decoding frame unit
|
|
0 commit comments