Merge pull request #335 from alibaba-damo-academy/dev_lhn2

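Update cmvn_file loading: load the CMVN statistics once when WavFrontend is constructed and pass the loaded array to apply_cmvn, instead of re-reading cmvn_file on every apply_cmvn call.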
This commit is contained in:
zhifu gao 2023-04-12 18:29:06 +08:00 committed by GitHub
commit fe5f58e188
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@ -38,7 +38,7 @@ def load_cmvn(cmvn_file):
return cmvn
def apply_cmvn(inputs, cmvn_file): # noqa
def apply_cmvn(inputs, cmvn): # noqa
"""
Apply CMVN with mvn data
"""
@ -47,7 +47,6 @@ def apply_cmvn(inputs, cmvn_file): # noqa
dtype = inputs.dtype
frame, dim = inputs.shape
cmvn = load_cmvn(cmvn_file)
means = np.tile(cmvn[0:1, :dim], (frame, 1))
vars = np.tile(cmvn[1:2, :dim], (frame, 1))
inputs += torch.from_numpy(means).type(dtype).to(device)
@ -111,6 +110,7 @@ class WavFrontend(AbsFrontend):
self.dither = dither
self.snip_edges = snip_edges
self.upsacle_samples = upsacle_samples
self.cmvn = None if self.cmvn_file is None else load_cmvn(self.cmvn_file)
def output_size(self) -> int:
return self.n_mels * self.lfr_m
@ -140,8 +140,8 @@ class WavFrontend(AbsFrontend):
if self.lfr_m != 1 or self.lfr_n != 1:
mat = apply_lfr(mat, self.lfr_m, self.lfr_n)
if self.cmvn_file is not None:
mat = apply_cmvn(mat, self.cmvn_file)
if self.cmvn is not None:
mat = apply_cmvn(mat, self.cmvn)
feat_length = mat.size(0)
feats.append(mat)
feats_lens.append(feat_length)
@ -194,8 +194,8 @@ class WavFrontend(AbsFrontend):
mat = input[i, :input_lengths[i], :]
if self.lfr_m != 1 or self.lfr_n != 1:
mat = apply_lfr(mat, self.lfr_m, self.lfr_n)
if self.cmvn_file is not None:
mat = apply_cmvn(mat, self.cmvn_file)
if self.cmvn is not None:
mat = apply_cmvn(mat, self.cmvn)
feat_length = mat.size(0)
feats.append(mat)
feats_lens.append(feat_length)