Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Adding FusionRNN + QLSTM cfg + small QLSTM change #226

Merged
merged 3 commits into from
May 18, 2020
Merged
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Next Next commit
Adding FusionRNN + QLSTM cfg + small QLSTM change
  • Loading branch information
TParcollet committed May 18, 2020
commit d0bf7a08f95433b8ab6a1da8c1e758c0dd103a37
221 changes: 221 additions & 0 deletions cfg/DIRHA_baselines/DIRHA_QLSTM_MFCC.cfg
Original file line number Diff line number Diff line change
@@ -0,0 +1,221 @@
[cfg_proto]
cfg_proto=proto/global.proto
cfg_proto_chunk=proto/global_chunk.proto

[exp]
cmd=
run_nn_script=run_nn.py
out_folder=exp/dirha_QLSTM_mfcc
pretrain_file=none
seed=1234
use_cuda=True
multi_gpu=False
save_gpumem=False
N_epochs_tr=20

[dataset1]
data_name=tr05_cont
fea:fea_name=mfccLA1
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA1/data/tr05_cont/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA1/data/tr05_cont/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA1/mfcc/cmvn_tr05_cont.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

fea_name=mfccLA2
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA2/data/tr05_cont/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA2/data/tr05_cont/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA2/mfcc/cmvn_tr05_cont.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

fea_name=mfccLA3
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA3/data/tr05_cont/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA3/data/tr05_cont/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA3/mfcc/cmvn_tr05_cont.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

fea_name=mfccLA4
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA4/data/tr05_cont/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA4/data/tr05_cont/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA4/mfcc/cmvn_tr05_cont.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

lab:lab_name=lab_cd
lab_folder=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_beam/exp/tri4_ali
lab_opts=ali-to-pdf
lab_count_file=auto
lab_data_folder=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_beam/data/tr05_cont/
lab_graph=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_beam/exp/tri4/graph_tgpr_5k/

N_chunks=10

[dataset2]
data_name=dirha_sim
fea:fea_name=mfccLA1
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA1/data/dirha_sim/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA1/data/dirha_sim/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA1/mfcc/cmvn_dirha_sim.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

fea_name=mfccLA2
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA2/data/dirha_sim/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA2/data/dirha_sim/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA2/mfcc/cmvn_dirha_sim.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

fea_name=mfccLA3
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA3/data/dirha_sim/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA3/data/dirha_sim/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA3/mfcc/cmvn_dirha_sim.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

fea_name=mfccLA4
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA4/data/dirha_sim/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA4/data/dirha_sim/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA4/mfcc/cmvn_dirha_sim.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0


lab:lab_name=lab_cd
lab_folder=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_beam/exp/tri4_ali_sim
lab_opts=ali-to-pdf
lab_count_file=auto
lab_data_folder=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_beam/data/dirha_sim/
lab_graph=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_beam/exp/tri4/graph_tgpr_5k/

N_chunks=4



[dataset3]
data_name=dirha_real
fea:fea_name=mfccLA1
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA1/data/dirha_real/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA1/data/dirha_real/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA1/mfcc/cmvn_dirha_real.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

fea_name=mfccLA2
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA2/data/dirha_real/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA2/data/dirha_real/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA2/mfcc/cmvn_dirha_real.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

fea_name=mfccLA3
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA3/data/dirha_real/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA3/data/dirha_real/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA3/mfcc/cmvn_dirha_real.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

fea_name=mfccLA4
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA4/data/dirha_real/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA4/data/dirha_real/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA4/mfcc/cmvn_dirha_real.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0


lab:lab_name=lab_cd
lab_folder=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_beam/exp/tri4_ali_real
lab_opts=ali-to-pdf
lab_count_file=auto
lab_data_folder=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_beam/data/dirha_real/
lab_graph=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_beam/exp/tri4/graph_tgpr_5k/

N_chunks=4


[data_use]
train_with=tr05_cont
valid_with=dirha_sim
forward_with=dirha_real

[batches]
batch_size_train=16
max_seq_length_train=500
increase_seq_length_train=True
start_seq_len_train=100
multply_factor_seq_len_train=2
batch_size_valid=16
max_seq_length_valid=500


[architecture1]
arch_name = QLSTM
arch_proto = proto/QLSTM.proto
arch_library = quaternion_neural_networks
arch_class = QLSTM
arch_pretrain_file = none
arch_freeze = False
arch_seq_model = True
lstm_lay = 512,512,512,512
lstm_drop = 0.2,0.2,0.2,0.2
lstm_bidir = True
lstm_act = tanh,tanh,tanh,tanh
quaternion_init=quaternion
autograd=False
arch_lr = 0.0016
arch_halving_factor = 0.5
arch_improvement_threshold = 0.001
arch_opt = rmsprop
opt_momentum = 0.0
opt_alpha = 0.95
opt_eps = 1e-8
opt_centered = False
opt_weight_decay = 0.0

[architecture2]
arch_name=MLP_layers
arch_proto=proto/MLP.proto
arch_library=neural_networks
arch_class=MLP
arch_pretrain_file=none
arch_freeze=False
arch_seq_model=False
dnn_lay=N_out_lab_cd
dnn_drop=0.0
dnn_use_laynorm_inp=False
dnn_use_batchnorm_inp=False
dnn_use_batchnorm=False
dnn_use_laynorm=False
dnn_act=softmax
arch_lr=0.0004
arch_halving_factor=0.5
arch_improvement_threshold=0.001
arch_opt=rmsprop
opt_momentum=0.0
opt_alpha=0.95
opt_eps=1e-8
opt_centered=False
opt_weight_decay=0.0

[model]
model_proto=proto/model.proto
model:conc1=concatenate(mfccLA1,mfccLA2)
conc2=concatenate(conc1,mfccLA3)
conc3=concatenate(conc2,mfccLA4)
out_dnn1=compute(QLSTM,conc3)
out_dnn2=compute(MLP_layers,out_dnn1)
loss_final=cost_nll(out_dnn2,lab_cd)
err_final=cost_err(out_dnn2,lab_cd)

[forward]
forward_out=out_dnn2
normalize_posteriors=True
normalize_with_counts_from=lab_cd
save_out_file=True
require_decoding=True

[decoding]
decoding_script_folder=kaldi_decoding_scripts/
decoding_script=decode_dnn.sh
decoding_proto=proto/decoding.proto
min_active=200
max_active=7000
max_mem=50000000
beam=20.0
latbeam=12.0
acwt=0.10
max_arcs=-1
skip_scoring=false
scoring_script=local/score.sh
scoring_opts="--min-lmwt 4 --max-lmwt 20"
norm_vars=False
Loading