mirror of
https://github.com/mozilla/DeepSpeech.git
synced 2025-10-26 11:19:39 +00:00
Fix #284; BiRNN with stride 2
This commit is contained in:
parent
7cc75f252f
commit
8e99eeffdd
@ -10,6 +10,9 @@ def audiofile_to_input_vector(audio_filename, numcep, numcontext):
|
||||
# Get mfcc coefficients
|
||||
orig_inputs = mfcc(audio, samplerate=fs, numcep=numcep)
|
||||
|
||||
# We only keep every second feature (BiRNN stride = 2)
|
||||
orig_inputs = orig_inputs[::2]
|
||||
|
||||
# For each time slice of the training set, we need to copy the context; this makes
|
||||
# the numcep-dimensional vector into a (numcep + 2*numcep*numcontext)-dimensional one
|
||||
# because of:
|
||||
|
||||
Loading…
Reference in New Issue
Block a user