Skip to content

Commit f140577

Browse files
authored
Fix nemo feature normalization in test code (#2361)
1 parent 831aff1 commit f140577

File tree

4 files changed, with 9 additions and 14 deletions.

scripts/nemo/canary/test_180m_flash.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -228,8 +228,8 @@ def main():
     features = compute_features(audio, fbank)
     if model.normalize_type != "":
         assert model.normalize_type == "per_feature", model.normalize_type
-        mean = features.mean(axis=1, keepdims=True)
-        stddev = features.std(axis=1, keepdims=True) + 1e-5
+        mean = features.mean(axis=0, keepdims=True)
+        stddev = features.std(axis=0, keepdims=True) + 1e-5
         features = (features - mean) / stddev

     features = np.expand_dims(features, axis=0)

scripts/nemo/fast-conformer-hybrid-transducer-ctc/test-onnx-ctc-non-streaming.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -140,8 +140,8 @@ def main():
     if model.normalize_type != "":
         assert model.normalize_type == "per_feature", model.normalize_type
         features = torch.from_numpy(features)
-        mean = features.mean(dim=1, keepdims=True)
-        stddev = features.std(dim=1, keepdims=True) + 1e-5
+        mean = features.mean(dim=0, keepdims=True)
+        stddev = features.std(dim=0, keepdims=True) + 1e-5
         features = (features - mean) / stddev
         features = features.numpy()


scripts/nemo/fast-conformer-hybrid-transducer-ctc/test-onnx-transducer-non-streaming.py

Lines changed: 3 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -184,12 +184,7 @@ def run_decoder(
         target = torch.tensor([[token]], dtype=torch.int32).numpy()
         target_len = torch.tensor([1], dtype=torch.int32).numpy()

-        (
-            decoder_out,
-            decoder_out_length,
-            state0_next,
-            state1_next,
-        ) = self.decoder.run(
+        (decoder_out, decoder_out_length, state0_next, state1_next,) = self.decoder.run(
             [
                 self.decoder.get_outputs()[0].name,
                 self.decoder.get_outputs()[1].name,
@@ -267,8 +262,8 @@ def main():
     if model.normalize_type != "":
         assert model.normalize_type == "per_feature", model.normalize_type
         features = torch.from_numpy(features)
-        mean = features.mean(dim=1, keepdims=True)
-        stddev = features.std(dim=1, keepdims=True) + 1e-5
+        mean = features.mean(dim=0, keepdims=True)
+        stddev = features.std(dim=0, keepdims=True) + 1e-5
         features = (features - mean) / stddev
         features = features.numpy()
     print(audio.shape)

scripts/nemo/parakeet-tdt-0.6b-v2/test_onnx.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -233,8 +233,8 @@ def main():
     if model.normalize_type != "":
         assert model.normalize_type == "per_feature", model.normalize_type
         features = torch.from_numpy(features)
-        mean = features.mean(dim=1, keepdims=True)
-        stddev = features.std(dim=1, keepdims=True) + 1e-5
+        mean = features.mean(dim=0, keepdims=True)
+        stddev = features.std(dim=0, keepdims=True) + 1e-5
         features = (features - mean) / stddev
         features = features.numpy()
     print(audio.shape)

0 commit comments

Comments
 (0)