Skip to content

Commit 8136ad7

Browse files
authored
Use high_freq -400 in computing fbank features. (#1447)
See also k2-fsa/sherpa-onnx#514
1 parent f42258c commit 8136ad7

File tree

127 files changed

+127
-0
lines changed

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

127 files changed

+127
-0
lines changed

egs/aidatatang_200zh/ASR/pruned_transducer_stateless2/pretrained.py

+1
Original file line number | Diff line number | Diff line change
@@ -242,6 +242,7 @@ def main():
242 | 242 |   opts.frame_opts.snip_edges = False
243 | 243 |   opts.frame_opts.samp_freq = params.sample_rate
244 | 244 |   opts.mel_opts.num_bins = params.feature_dim
    | 245 | + opts.mel_opts.high_freq = -400
245 | 246 |
246 | 247 |   fbank = kaldifeat.Fbank(opts)
247 | 248 |

egs/aishell/ASR/conformer_ctc/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -261,6 +261,7 @@ def main():
261261
opts.frame_opts.snip_edges = False
262262
opts.frame_opts.samp_freq = params.sample_rate
263263
opts.mel_opts.num_bins = params.feature_dim
264+
opts.mel_opts.high_freq = -400
264265

265266
fbank = kaldifeat.Fbank(opts)
266267

egs/aishell/ASR/pruned_transducer_stateless2/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -240,6 +240,7 @@ def main():
240240
opts.frame_opts.snip_edges = False
241241
opts.frame_opts.samp_freq = params.sample_rate
242242
opts.mel_opts.num_bins = params.feature_dim
243+
opts.mel_opts.high_freq = -400
243244

244245
fbank = kaldifeat.Fbank(opts)
245246

egs/aishell/ASR/pruned_transducer_stateless3/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -241,6 +241,7 @@ def main():
241241
opts.frame_opts.snip_edges = False
242242
opts.frame_opts.samp_freq = params.sample_rate
243243
opts.mel_opts.num_bins = params.feature_dim
244+
opts.mel_opts.high_freq = -400
244245

245246
fbank = kaldifeat.Fbank(opts)
246247

egs/aishell/ASR/pruned_transducer_stateless7/jit_pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -230,6 +230,7 @@ def main():
230230
opts.frame_opts.snip_edges = False
231231
opts.frame_opts.samp_freq = 16000
232232
opts.mel_opts.num_bins = 80
233+
opts.mel_opts.high_freq = -400
233234

234235
fbank = kaldifeat.Fbank(opts)
235236

egs/aishell/ASR/pruned_transducer_stateless7/onnx_pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -369,6 +369,7 @@ def main():
369369
opts.frame_opts.snip_edges = False
370370
opts.frame_opts.samp_freq = args.sample_rate
371371
opts.mel_opts.num_bins = 80
372+
opts.mel_opts.high_freq = -400
372373

373374
fbank = kaldifeat.Fbank(opts)
374375

egs/aishell/ASR/pruned_transducer_stateless7_bbpe/jit_pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -227,6 +227,7 @@ def main():
227227
opts.frame_opts.snip_edges = False
228228
opts.frame_opts.samp_freq = 16000
229229
opts.mel_opts.num_bins = 80
230+
opts.mel_opts.high_freq = -400
230231

231232
fbank = kaldifeat.Fbank(opts)
232233

egs/aishell/ASR/pruned_transducer_stateless7_bbpe/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -250,6 +250,7 @@ def main():
250250
opts.frame_opts.snip_edges = False
251251
opts.frame_opts.samp_freq = params.sample_rate
252252
opts.mel_opts.num_bins = params.feature_dim
253+
opts.mel_opts.high_freq = -400
253254

254255
fbank = kaldifeat.Fbank(opts)
255256

egs/aishell/ASR/pruned_transducer_stateless7_streaming/streaming_decode.py

+1
Original file line numberDiff line numberDiff line change
@@ -317,6 +317,7 @@ def decode_dataset(
317317
opts.frame_opts.snip_edges = False
318318
opts.frame_opts.samp_freq = 16000
319319
opts.mel_opts.num_bins = 80
320+
opts.mel_opts.high_freq = -400
320321

321322
log_interval = 50
322323

egs/aishell/ASR/tdnn_lstm_ctc/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -158,6 +158,7 @@ def main():
158158
opts.frame_opts.snip_edges = False
159159
opts.frame_opts.samp_freq = params.sample_rate
160160
opts.mel_opts.num_bins = params.feature_dim
161+
opts.mel_opts.high_freq = -400
161162

162163
fbank = kaldifeat.Fbank(opts)
163164

egs/aishell/ASR/transducer_stateless/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -258,6 +258,7 @@ def main():
258258
opts.frame_opts.snip_edges = False
259259
opts.frame_opts.samp_freq = params.sample_rate
260260
opts.mel_opts.num_bins = params.feature_dim
261+
opts.mel_opts.high_freq = -400
261262

262263
fbank = kaldifeat.Fbank(opts)
263264

egs/aishell/ASR/transducer_stateless_modified-2/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -238,6 +238,7 @@ def main():
238238
opts.frame_opts.snip_edges = False
239239
opts.frame_opts.samp_freq = params.sample_rate
240240
opts.mel_opts.num_bins = params.feature_dim
241+
opts.mel_opts.high_freq = -400
241242

242243
fbank = kaldifeat.Fbank(opts)
243244

egs/aishell/ASR/transducer_stateless_modified/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -238,6 +238,7 @@ def main():
238238
opts.frame_opts.snip_edges = False
239239
opts.frame_opts.samp_freq = params.sample_rate
240240
opts.mel_opts.num_bins = params.feature_dim
241+
opts.mel_opts.high_freq = -400
241242

242243
fbank = kaldifeat.Fbank(opts)
243244

egs/aishell/ASR/zipformer/streaming_decode.py

+1
Original file line numberDiff line numberDiff line change
@@ -572,6 +572,7 @@ def decode_dataset(
572572
opts.frame_opts.snip_edges = False
573573
opts.frame_opts.samp_freq = 16000
574574
opts.mel_opts.num_bins = 80
575+
opts.mel_opts.high_freq = -400
575576

576577
log_interval = 100
577578

egs/aishell2/ASR/pruned_transducer_stateless5/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -239,6 +239,7 @@ def main():
239239
opts.frame_opts.snip_edges = False
240240
opts.frame_opts.samp_freq = params.sample_rate
241241
opts.mel_opts.num_bins = params.feature_dim
242+
opts.mel_opts.high_freq = -400
242243

243244
fbank = kaldifeat.Fbank(opts)
244245

egs/aishell4/ASR/pruned_transducer_stateless5/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -251,6 +251,7 @@ def main():
251251
opts.frame_opts.snip_edges = False
252252
opts.frame_opts.samp_freq = params.sample_rate
253253
opts.mel_opts.num_bins = params.feature_dim
254+
opts.mel_opts.high_freq = -400
254255

255256
fbank = kaldifeat.Fbank(opts)
256257

egs/alimeeting/ASR/pruned_transducer_stateless2/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -242,6 +242,7 @@ def main():
242242
opts.frame_opts.snip_edges = False
243243
opts.frame_opts.samp_freq = params.sample_rate
244244
opts.mel_opts.num_bins = params.feature_dim
245+
opts.mel_opts.high_freq = -400
245246

246247
fbank = kaldifeat.Fbank(opts)
247248

egs/commonvoice/ASR/pruned_transducer_stateless7/onnx_pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -370,6 +370,7 @@ def main():
370370
opts.frame_opts.snip_edges = False
371371
opts.frame_opts.samp_freq = args.sample_rate
372372
opts.mel_opts.num_bins = 80
373+
opts.mel_opts.high_freq = -400
373374

374375
fbank = kaldifeat.Fbank(opts)
375376

egs/commonvoice/ASR/pruned_transducer_stateless7/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -260,6 +260,7 @@ def main():
260260
opts.frame_opts.snip_edges = False
261261
opts.frame_opts.samp_freq = params.sample_rate
262262
opts.mel_opts.num_bins = params.feature_dim
263+
opts.mel_opts.high_freq = -400
263264

264265
fbank = kaldifeat.Fbank(opts)
265266

egs/commonvoice/ASR/pruned_transducer_stateless7_streaming/streaming_decode.py

+1
Original file line numberDiff line numberDiff line change
@@ -320,6 +320,7 @@ def decode_dataset(
320320
opts.frame_opts.snip_edges = False
321321
opts.frame_opts.samp_freq = 16000
322322
opts.mel_opts.num_bins = 80
323+
opts.mel_opts.high_freq = -400
323324

324325
log_interval = 50
325326

egs/csj/ASR/pruned_transducer_stateless7_streaming/jit_trace_pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -177,6 +177,7 @@ def create_streaming_feature_extractor(sample_rate) -> OnlineFeature:
177177
opts.frame_opts.snip_edges = False
178178
opts.frame_opts.samp_freq = sample_rate
179179
opts.mel_opts.num_bins = 80
180+
opts.mel_opts.high_freq = -400
180181
return OnlineFbank(opts)
181182

182183

egs/csj/ASR/pruned_transducer_stateless7_streaming/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -252,6 +252,7 @@ def main():
252252
opts.frame_opts.snip_edges = False
253253
opts.frame_opts.samp_freq = params.sample_rate
254254
opts.mel_opts.num_bins = params.feature_dim
255+
opts.mel_opts.high_freq = -400
255256

256257
fbank = kaldifeat.Fbank(opts)
257258

egs/csj/ASR/pruned_transducer_stateless7_streaming/streaming_decode.py

+1
Original file line numberDiff line numberDiff line change
@@ -337,6 +337,7 @@ def decode_dataset(
337337
opts.frame_opts.snip_edges = False
338338
opts.frame_opts.samp_freq = 16000
339339
opts.mel_opts.num_bins = 80
340+
opts.mel_opts.high_freq = -400
340341

341342
log_interval = 50
342343

egs/gigaspeech/ASR/zipformer/streaming_decode.py

+1
Original file line numberDiff line numberDiff line change
@@ -553,6 +553,7 @@ def decode_dataset(
553553
opts.frame_opts.snip_edges = False
554554
opts.frame_opts.samp_freq = 16000
555555
opts.mel_opts.num_bins = 80
556+
opts.mel_opts.high_freq = -400
556557

557558
log_interval = 100
558559

egs/libriheavy/ASR/zipformer_prompt_asr/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -264,6 +264,7 @@ def main():
264264
opts.frame_opts.snip_edges = False
265265
opts.frame_opts.samp_freq = params.sample_rate
266266
opts.mel_opts.num_bins = params.feature_dim
267+
opts.mel_opts.high_freq = -400
267268

268269
fbank = kaldifeat.Fbank(opts)
269270

egs/librispeech/ASR/conformer_ctc/jit_pretrained_decode_with_H.py

+1
Original file line numberDiff line numberDiff line change
@@ -195,6 +195,7 @@ def main():
195195
opts.frame_opts.snip_edges = False
196196
opts.frame_opts.samp_freq = sample_rate
197197
opts.mel_opts.num_bins = 80
198+
opts.mel_opts.high_freq = -400
198199

199200
fbank = kaldifeat.Fbank(opts)
200201

egs/librispeech/ASR/conformer_ctc/jit_pretrained_decode_with_HL.py

+1
Original file line numberDiff line numberDiff line change
@@ -192,6 +192,7 @@ def main():
192192
opts.frame_opts.snip_edges = False
193193
opts.frame_opts.samp_freq = sample_rate
194194
opts.mel_opts.num_bins = 80
195+
opts.mel_opts.high_freq = -400
195196

196197
fbank = kaldifeat.Fbank(opts)
197198

egs/librispeech/ASR/conformer_ctc/jit_pretrained_decode_with_HLG.py

+1
Original file line numberDiff line numberDiff line change
@@ -191,6 +191,7 @@ def main():
191191
opts.frame_opts.snip_edges = False
192192
opts.frame_opts.samp_freq = sample_rate
193193
opts.mel_opts.num_bins = 80
194+
opts.mel_opts.high_freq = -400
194195

195196
fbank = kaldifeat.Fbank(opts)
196197

egs/librispeech/ASR/conformer_ctc/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -283,6 +283,7 @@ def main():
283283
opts.frame_opts.snip_edges = False
284284
opts.frame_opts.samp_freq = params.sample_rate
285285
opts.mel_opts.num_bins = params.feature_dim
286+
opts.mel_opts.high_freq = -400
286287

287288
fbank = kaldifeat.Fbank(opts)
288289

egs/librispeech/ASR/conformer_ctc3/jit_pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -271,6 +271,7 @@ def main():
271271
opts.frame_opts.snip_edges = False
272272
opts.frame_opts.samp_freq = params.sample_rate
273273
opts.mel_opts.num_bins = params.feature_dim
274+
opts.mel_opts.high_freq = -400
274275

275276
fbank = kaldifeat.Fbank(opts)
276277

egs/librispeech/ASR/conformer_ctc3/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -302,6 +302,7 @@ def main():
302302
opts.frame_opts.snip_edges = False
303303
opts.frame_opts.samp_freq = params.sample_rate
304304
opts.mel_opts.num_bins = params.feature_dim
305+
opts.mel_opts.high_freq = -400
305306

306307
fbank = kaldifeat.Fbank(opts)
307308

egs/librispeech/ASR/conv_emformer_transducer_stateless/streaming_decode.py

+1
Original file line numberDiff line numberDiff line change
@@ -623,6 +623,7 @@ def create_streaming_feature_extractor() -> Fbank:
623623
opts.frame_opts.snip_edges = False
624624
opts.frame_opts.samp_freq = 16000
625625
opts.mel_opts.num_bins = 80
626+
opts.mel_opts.high_freq = -400
626627
return Fbank(opts)
627628

628629

egs/librispeech/ASR/conv_emformer_transducer_stateless2/jit_pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -184,6 +184,7 @@ def create_streaming_feature_extractor(sample_rate) -> OnlineFeature:
184184
opts.frame_opts.snip_edges = False
185185
opts.frame_opts.samp_freq = sample_rate
186186
opts.mel_opts.num_bins = 80
187+
opts.mel_opts.high_freq = -400
187188
return OnlineFbank(opts)
188189

189190

egs/librispeech/ASR/conv_emformer_transducer_stateless2/onnx_pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -326,6 +326,7 @@ def create_streaming_feature_extractor() -> OnlineFeature:
326326
opts.frame_opts.snip_edges = False
327327
opts.frame_opts.samp_freq = 16000
328328
opts.mel_opts.num_bins = 80
329+
opts.mel_opts.high_freq = -400
329330
return OnlineFbank(opts)
330331

331332

egs/librispeech/ASR/conv_emformer_transducer_stateless2/streaming-ncnn-decode.py

+1
Original file line numberDiff line numberDiff line change
@@ -276,6 +276,7 @@ def create_streaming_feature_extractor() -> OnlineFeature:
276276
opts.frame_opts.snip_edges = False
277277
opts.frame_opts.samp_freq = 16000
278278
opts.mel_opts.num_bins = 80
279+
opts.mel_opts.high_freq = -400
279280
return OnlineFbank(opts)
280281

281282

egs/librispeech/ASR/conv_emformer_transducer_stateless2/streaming_decode.py

+1
Original file line numberDiff line numberDiff line change
@@ -623,6 +623,7 @@ def create_streaming_feature_extractor() -> Fbank:
623623
opts.frame_opts.snip_edges = False
624624
opts.frame_opts.samp_freq = 16000
625625
opts.mel_opts.num_bins = 80
626+
opts.mel_opts.high_freq = -400
626627
return Fbank(opts)
627628

628629

egs/librispeech/ASR/lstm_transducer_stateless/jit_pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -266,6 +266,7 @@ def main():
266266
opts.frame_opts.snip_edges = False
267267
opts.frame_opts.samp_freq = args.sample_rate
268268
opts.mel_opts.num_bins = 80
269+
opts.mel_opts.high_freq = -400
269270

270271
fbank = kaldifeat.Fbank(opts)
271272

egs/librispeech/ASR/lstm_transducer_stateless/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -251,6 +251,7 @@ def main():
251251
opts.frame_opts.snip_edges = False
252252
opts.frame_opts.samp_freq = params.sample_rate
253253
opts.mel_opts.num_bins = params.feature_dim
254+
opts.mel_opts.high_freq = -400
254255

255256
fbank = kaldifeat.Fbank(opts)
256257

egs/librispeech/ASR/lstm_transducer_stateless/streaming_decode.py

+1
Original file line numberDiff line numberDiff line change
@@ -615,6 +615,7 @@ def create_streaming_feature_extractor() -> Fbank:
615615
opts.frame_opts.snip_edges = False
616616
opts.frame_opts.samp_freq = 16000
617617
opts.mel_opts.num_bins = 80
618+
opts.mel_opts.high_freq = -400
618619
return Fbank(opts)
619620

620621

egs/librispeech/ASR/lstm_transducer_stateless2/jit_pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -267,6 +267,7 @@ def main():
267267
opts.frame_opts.snip_edges = False
268268
opts.frame_opts.samp_freq = args.sample_rate
269269
opts.mel_opts.num_bins = 80
270+
opts.mel_opts.high_freq = -400
270271

271272
fbank = kaldifeat.Fbank(opts)
272273

egs/librispeech/ASR/lstm_transducer_stateless2/ncnn-decode.py

+1
Original file line numberDiff line numberDiff line change
@@ -255,6 +255,7 @@ def main():
255255
opts.frame_opts.snip_edges = False
256256
opts.frame_opts.samp_freq = sample_rate
257257
opts.mel_opts.num_bins = 80
258+
opts.mel_opts.high_freq = -400
258259

259260
fbank = kaldifeat.Fbank(opts)
260261

egs/librispeech/ASR/lstm_transducer_stateless2/onnx_pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -298,6 +298,7 @@ def create_streaming_feature_extractor() -> OnlineFeature:
298298
opts.frame_opts.snip_edges = False
299299
opts.frame_opts.samp_freq = 16000
300300
opts.mel_opts.num_bins = 80
301+
opts.mel_opts.high_freq = -400
301302
return OnlineFbank(opts)
302303

303304

egs/librispeech/ASR/lstm_transducer_stateless2/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -254,6 +254,7 @@ def main():
254254
opts.frame_opts.snip_edges = False
255255
opts.frame_opts.samp_freq = params.sample_rate
256256
opts.mel_opts.num_bins = params.feature_dim
257+
opts.mel_opts.high_freq = -400
257258

258259
fbank = kaldifeat.Fbank(opts)
259260

egs/librispeech/ASR/lstm_transducer_stateless2/streaming-ncnn-decode.py

+1
Original file line numberDiff line numberDiff line change
@@ -217,6 +217,7 @@ def create_streaming_feature_extractor() -> OnlineFeature:
217217
opts.frame_opts.snip_edges = False
218218
opts.frame_opts.samp_freq = 16000
219219
opts.mel_opts.num_bins = 80
220+
opts.mel_opts.high_freq = -400
220221
return OnlineFbank(opts)
221222

222223

egs/librispeech/ASR/lstm_transducer_stateless2/streaming-onnx-decode.py

+1
Original file line numberDiff line numberDiff line change
@@ -344,6 +344,7 @@ def create_streaming_feature_extractor() -> OnlineFeature:
344344
opts.frame_opts.snip_edges = False
345345
opts.frame_opts.samp_freq = 16000
346346
opts.mel_opts.num_bins = 80
347+
opts.mel_opts.high_freq = -400
347348
return OnlineFbank(opts)
348349

349350

egs/librispeech/ASR/lstm_transducer_stateless3/jit_pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -266,6 +266,7 @@ def main():
266266
opts.frame_opts.snip_edges = False
267267
opts.frame_opts.samp_freq = args.sample_rate
268268
opts.mel_opts.num_bins = 80
269+
opts.mel_opts.high_freq = -400
269270

270271
fbank = kaldifeat.Fbank(opts)
271272

egs/librispeech/ASR/lstm_transducer_stateless3/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -252,6 +252,7 @@ def main():
252252
opts.frame_opts.snip_edges = False
253253
opts.frame_opts.samp_freq = params.sample_rate
254254
opts.mel_opts.num_bins = params.feature_dim
255+
opts.mel_opts.high_freq = -400
255256

256257
fbank = kaldifeat.Fbank(opts)
257258

egs/librispeech/ASR/lstm_transducer_stateless3/streaming_decode.py

+1
Original file line numberDiff line numberDiff line change
@@ -615,6 +615,7 @@ def create_streaming_feature_extractor() -> Fbank:
615615
opts.frame_opts.snip_edges = False
616616
opts.frame_opts.samp_freq = 16000
617617
opts.mel_opts.num_bins = 80
618+
opts.mel_opts.high_freq = -400
618619
return Fbank(opts)
619620

620621

egs/librispeech/ASR/pruned_transducer_stateless/pretrained.py

+1
Original file line numberDiff line numberDiff line change
@@ -277,6 +277,7 @@ def main():
277277
opts.frame_opts.snip_edges = False
278278
opts.frame_opts.samp_freq = params.sample_rate
279279
opts.mel_opts.num_bins = params.feature_dim
280+
opts.mel_opts.high_freq = -400
280281

281282
fbank = kaldifeat.Fbank(opts)
282283

egs/librispeech/ASR/pruned_transducer_stateless/streaming_decode.py

+1
Original file line numberDiff line numberDiff line change
@@ -334,6 +334,7 @@ def decode_dataset(
334334
opts.frame_opts.snip_edges = False
335335
opts.frame_opts.samp_freq = 16000
336336
opts.mel_opts.num_bins = 80
337+
opts.mel_opts.high_freq = -400
337338

338339
log_interval = 100
339340

0 commit comments

Comments
 (0)