-
Notifications
You must be signed in to change notification settings - Fork 43
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
vrenkens
committed
Jul 28, 2017
1 parent
a32302d
commit e926522
Showing
89 changed files
with
2,624 additions
and
633 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,3 @@ | ||
[processor] | ||
#type of processor | ||
processor = alignment_processor |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,24 @@ | ||
[processor] | ||
#type of processor | ||
processor = audio_processor | ||
#feature type | ||
feature = fbank | ||
#the dynamic information that is added to the features, options are nodelta, | ||
#delta and ddelta | ||
dynamic = ddelta | ||
#length of the sliding window (seconds) | ||
winlen = 0.025 | ||
#step of the sliding window (seconds) | ||
winstep = 0.01 | ||
#number of fbank filters | ||
nfilt = 40 | ||
#number of fft bins | ||
nfft = 512 | ||
#low cutoff frequency | ||
lowfreq = 0 | ||
#high cutoff frequency, if -1 set to None | ||
highfreq = -1 | ||
#preemphasis | ||
preemph = 0.97 | ||
#include energy in features | ||
include_energy = True |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,35 @@ | ||
[io] | ||
#a space separated list of input names | ||
inputs = features | ||
#a space separated list of output names | ||
outputs = alignments | ||
|
||
[encoder] | ||
#type of encoder | ||
encoder = dnn | ||
#number of neurons in the hidden layers | ||
num_units = 2048 | ||
#number of hidden layers | ||
num_layers = 5 | ||
#input noise standard deviation | ||
input_noise = 0 | ||
#dropout rate | ||
dropout = 0.5 | ||
#number of left and right context windows to take into account | ||
context = 5 | ||
#whether layer normalization should be applied | ||
layer_norm = True | ||
|
||
[decoder] | ||
#type of decoder | ||
decoder = dnn_decoder | ||
#the output dimensions | ||
output_dims = 3100 | ||
#the number of layers in each detector | ||
num_layers = 0 | ||
#the number of units in each detector | ||
num_units = 2024 | ||
#whether layer normalization should be applied | ||
layer_norm = True | ||
#dropout rate | ||
dropout = 1 |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,11 @@ | ||
[recognizer] | ||
#the number of utterances that are processed simultaneously | ||
batch_size = 8 | ||
#link the input names defined in the classifier config to sections defined in | ||
#the database config | ||
features = test93fbank | ||
|
||
[decoder] | ||
#name of the decoder that should be used | ||
decoder = alignment_decoder | ||
prior = /users/spraak/vrenkens/spchtemp/Nabu/data/wsj/kaldi_alignments/train_si284/prior.npy |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,17 @@ | ||
[evaluator] | ||
#name of the evaluator that should be used | ||
evaluator = decoder_evaluator | ||
#the number of utterances that are processed simultaneously | ||
batch_size = 8 | ||
#link the input names defined in the classifier config to sections defined in | ||
#the database config | ||
features = test93fbank | ||
#a space separated list of target names used by the evaluator | ||
targets = event | ||
#a mapping between the target names and database sections | ||
event = test93Dental | ||
|
||
[decoder] | ||
#name of the decoder that should be used | ||
decoder = max_decoder | ||
event_alphabet = 0 1 |
Oops, something went wrong.