Skip to content

Commit

Permalink
Adding FusionRNN + QLSTM cfg + small QLSTM change
Browse files Browse the repository at this point in the history
  • Loading branch information
TParcollet committed May 18, 2020
1 parent bab2eeb commit d0bf7a0
Show file tree
Hide file tree
Showing 4 changed files with 1,038 additions and 7 deletions.
221 changes: 221 additions & 0 deletions cfg/DIRHA_baselines/DIRHA_QLSTM_MFCC.cfg
Original file line number Diff line number Diff line change
@@ -0,0 +1,221 @@
[cfg_proto]
cfg_proto=proto/global.proto
cfg_proto_chunk=proto/global_chunk.proto

[exp]
cmd=
run_nn_script=run_nn.py
out_folder=exp/dirha_QLSTM_mfcc
pretrain_file=none
seed=1234
use_cuda=True
multi_gpu=False
save_gpumem=False
N_epochs_tr=20

[dataset1]
data_name=tr05_cont
fea:fea_name=mfccLA1
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA1/data/tr05_cont/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA1/data/tr05_cont/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA1/mfcc/cmvn_tr05_cont.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

fea_name=mfccLA2
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA2/data/tr05_cont/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA2/data/tr05_cont/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA2/mfcc/cmvn_tr05_cont.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

fea_name=mfccLA3
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA3/data/tr05_cont/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA3/data/tr05_cont/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA3/mfcc/cmvn_tr05_cont.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

fea_name=mfccLA4
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA4/data/tr05_cont/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA4/data/tr05_cont/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA4/mfcc/cmvn_tr05_cont.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

lab:lab_name=lab_cd
lab_folder=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_beam/exp/tri4_ali
lab_opts=ali-to-pdf
lab_count_file=auto
lab_data_folder=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_beam/data/tr05_cont/
lab_graph=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_beam/exp/tri4/graph_tgpr_5k/

N_chunks=10

[dataset2]
data_name=dirha_sim
fea:fea_name=mfccLA1
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA1/data/dirha_sim/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA1/data/dirha_sim/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA1/mfcc/cmvn_dirha_sim.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

fea_name=mfccLA2
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA2/data/dirha_sim/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA2/data/dirha_sim/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA2/mfcc/cmvn_dirha_sim.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

fea_name=mfccLA3
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA3/data/dirha_sim/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA3/data/dirha_sim/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA3/mfcc/cmvn_dirha_sim.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

fea_name=mfccLA4
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA4/data/dirha_sim/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA4/data/dirha_sim/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA4/mfcc/cmvn_dirha_sim.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0


lab:lab_name=lab_cd
lab_folder=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_beam/exp/tri4_ali_sim
lab_opts=ali-to-pdf
lab_count_file=auto
lab_data_folder=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_beam/data/dirha_sim/
lab_graph=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_beam/exp/tri4/graph_tgpr_5k/

N_chunks=4



[dataset3]
data_name=dirha_real
fea:fea_name=mfccLA1
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA1/data/dirha_real/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA1/data/dirha_real/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA1/mfcc/cmvn_dirha_real.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

fea_name=mfccLA2
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA2/data/dirha_real/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA2/data/dirha_real/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA2/mfcc/cmvn_dirha_real.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

fea_name=mfccLA3
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA3/data/dirha_real/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA3/data/dirha_real/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA3/mfcc/cmvn_dirha_real.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0

fea_name=mfccLA4
fea_lst=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA4/data/dirha_real/feats_mfcc.scp
fea_opts=apply-cmvn --utt2spk=ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA4/data/dirha_real/utt2spk ark:/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_LA4/mfcc/cmvn_dirha_real.ark ark:- ark:- | add-deltas --delta-order=0 ark:- ark:- |
cw_left=0
cw_right=0


lab:lab_name=lab_cd
lab_folder=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_beam/exp/tri4_ali_real
lab_opts=ali-to-pdf
lab_count_file=auto
lab_data_folder=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_beam/data/dirha_real/
lab_graph=/nfs-share/titouan/workspace/kaldi/egs/dirha/s5_beam/exp/tri4/graph_tgpr_5k/

N_chunks=4


[data_use]
train_with=tr05_cont
valid_with=dirha_sim
forward_with=dirha_real

[batches]
batch_size_train=16
max_seq_length_train=500
increase_seq_length_train=True
start_seq_len_train=100
multply_factor_seq_len_train=2
batch_size_valid=16
max_seq_length_valid=500


[architecture1]
arch_name = QLSTM
arch_proto = proto/QLSTM.proto
arch_library = quaternion_neural_networks
arch_class = QLSTM
arch_pretrain_file = none
arch_freeze = False
arch_seq_model = True
lstm_lay = 512,512,512,512
lstm_drop = 0.2,0.2,0.2,0.2
lstm_bidir = True
lstm_act = tanh,tanh,tanh,tanh
quaternion_init=quaternion
autograd=False
arch_lr = 0.0016
arch_halving_factor = 0.5
arch_improvement_threshold = 0.001
arch_opt = rmsprop
opt_momentum = 0.0
opt_alpha = 0.95
opt_eps = 1e-8
opt_centered = False
opt_weight_decay = 0.0

[architecture2]
arch_name=MLP_layers
arch_proto=proto/MLP.proto
arch_library=neural_networks
arch_class=MLP
arch_pretrain_file=none
arch_freeze=False
arch_seq_model=False
dnn_lay=N_out_lab_cd
dnn_drop=0.0
dnn_use_laynorm_inp=False
dnn_use_batchnorm_inp=False
dnn_use_batchnorm=False
dnn_use_laynorm=False
dnn_act=softmax
arch_lr=0.0004
arch_halving_factor=0.5
arch_improvement_threshold=0.001
arch_opt=rmsprop
opt_momentum=0.0
opt_alpha=0.95
opt_eps=1e-8
opt_centered=False
opt_weight_decay=0.0

[model]
model_proto=proto/model.proto
model:conc1=concatenate(mfccLA1,mfccLA2)
conc2=concatenate(conc1,mfccLA3)
conc3=concatenate(conc2,mfccLA4)
out_dnn1=compute(QLSTM,conc3)
out_dnn2=compute(MLP_layers,out_dnn1)
loss_final=cost_nll(out_dnn2,lab_cd)
err_final=cost_err(out_dnn2,lab_cd)

[forward]
forward_out=out_dnn2
normalize_posteriors=True
normalize_with_counts_from=lab_cd
save_out_file=True
require_decoding=True

[decoding]
decoding_script_folder=kaldi_decoding_scripts/
decoding_script=decode_dnn.sh
decoding_proto=proto/decoding.proto
min_active=200
max_active=7000
max_mem=50000000
beam=20.0
latbeam=12.0
acwt=0.10
max_arcs=-1
skip_scoring=false
scoring_script=local/score.sh
scoring_opts="--min-lmwt 4 --max-lmwt 20"
norm_vars=False
Loading

0 comments on commit d0bf7a0

Please sign in to comment.