Commit 037b95fd authored by Ho Yin Chan's avatar Ho Yin Chan
Browse files

trunk:egs/hkust some run time performances & tidy up

git-svn-id: https://svn.code.sf.net/p/kaldi/code/trunk@3097 5e6a8d80-dfce-4ca6-a32a-6e07a63d50c8
parent 53676ecb
##
## wide beam decoding run time (source code version before 12th Oct 2013)
## Intel(R) Xeon(R) CPU X5690 @ 3.47GHz
### for n in `cat decode_dir `; do sh local/cal_runtime.sh $n; done
# grep real exp/*/decode*wide*/log/*.log | awk '{print $1 "\t" $NF}' | grep closelm | grep xeon > RUNTIMES
# grep real exp/*/decode*wide*/log/*.log | awk '{print $1 "\t" $NF}' | grep -v closelm | grep xeon >> RUNTIMES
## wide beam decoding run time factor (source code version before 12th Oct 2013)
## Intel(R) Xeon(R) CPU X5690 @ 3.47GHz, > 64G RAM
# 1.8M size L.fst, 76M size HCLG.fst
nnet_4m_3l/decode_wide_eval_closelm_xeon3.5/log/decode.1.log:LOG 0.559821
nnet_4m_3l/decode_wide_eval_closelm_xeon3.5/log/decode.2.log:LOG 0.491236
nnet_8m_6l/decode_wide_eval_closelm_xeon3.5/log/decode.1.log:LOG 0.592642
nnet_8m_6l/decode_wide_eval_closelm_xeon3.5/log/decode.2.log:LOG 0.609593
nnet_tanh_3l/decode_wide_eval_closelm_xeon3.5/log/decode.1.log:LOG 0.616046
nnet_tanh_3l/decode_wide_eval_closelm_xeon3.5/log/decode.2.log:LOG 0.572899
nnet_tanh_6l/decode_wide_eval_closelm_xeon3.5/log/decode.1.log:LOG 0.604186
nnet_tanh_6l/decode_wide_eval_closelm_xeon3.5/log/decode.2.log:LOG 0.607741
sgmm_5a/decode_wide_eval_closelm_xeon3.5/log/decode_pass1.1.log:LOG 0.869817
sgmm_5a/decode_wide_eval_closelm_xeon3.5/log/decode_pass1.2.log:LOG 0.803909
tri5a/decode_wide_eval_closelm_xeon3.5/log/decode.1.log:LOG 1.04819
tri5a/decode_wide_eval_closelm_xeon3.5/log/decode.2.log:LOG 0.965748
tri5a_fmmi_b0.1/decode_wide_eval_closelm_iter8_xeon3.5/log/decode.1.log:LOG 1.19066
tri5a_fmmi_b0.1/decode_wide_eval_closelm_iter8_xeon3.5/log/decode.2.log:LOG 1.05439
tri5a_mmi_b0.1/decode_wide_eval_closelm_xeon3.5/log/decode.1.log:LOG 1.11189
tri5a_mmi_b0.1/decode_wide_eval_closelm_xeon3.5/log/decode.2.log:LOG 1.05755
tri5a_pretrain-dbn_dnn_smbr/decode_closelm_it2_dnnwide_xeon3.5/log/decode.1.log:LOG 0.71778
tri5a_pretrain-dbn_dnn_smbr/decode_closelm_it2_dnnwide_xeon3.5/log/decode.2.log:LOG 0.713862
exp/nnet_4m_3l/decode_wide_eval_closelm_xeon3.5/log 0.50984
exp/nnet_8m_6l/decode_wide_eval_closelm_xeon3.5/log 0.604995
exp/nnet_tanh_3l/decode_wide_eval_closelm_xeon3.5/log 0.584603
exp/nnet_tanh_6l/decode_wide_eval_closelm_xeon3.5/log 0.606776
exp/sgmm_5a/decode_wide_eval_closelm_xeon3.5/log 0.821786
exp/tri5a/decode_wide_eval_closelm_xeon3.5/log 0.988112
exp/tri5a_fmmi_b0.1/decode_wide_eval_closelm_iter8_xeon3.5/log 1.09135
exp/tri5a_mmi_b0.1/decode_wide_eval_closelm_xeon3.5/log 1.07229
exp/tri5a_pretrain-dbn_dnn_smbr/decode_closelm_it2_dnnwide_xeon3.5/log 0.714925
#
# 28M size L.fst, 76M size HCLG.fst
exp/nnet_4m_3l/decode_wide_eval_xeon3.5/log 0.924118
exp/nnet_8m_6l/decode_wide_eval_xeon3.5/log 1.00894
exp/nnet_tanh_3l/decode_wide_eval_xeon3.5/log 1.00994
exp/nnet_tanh_6l/decode_wide_eval_xeon3.5/log 0.940629
exp/sgmm_5a/decode_wide_eval_xeon3.5/log 1.14046
exp/tri5a/decode_wide_eval_xeon3.5/log 1.34804
exp/tri5a_fmmi_b0.1/decode_wide_eval_iter8_xeon3.5/log 1.87827
exp/tri5a_mmi_b0.1/decode_wide_eval_xeon3.5/log 1.77104
exp/tri5a_pretrain-dbn_dnn_smbr/decode_it2_dnnwide_xeon3.5/log 1.0829
## Intel(R) Xeon(R) CPU L5420 @ 2.50GHz, 6G RAM
# 1.8M size L.fst, 76M size HCLG.fst
exp/nnet_4m_3l/decode_wide_eval_closelm/log 1.18866
exp/nnet_8m_6l/decode_wide_eval_closelm_rerun/log 1.35657
exp/nnet_tanh_3l/decode_wide_eval_closelm/log 1.34746
exp/nnet_tanh_6l/decode_wide_eval_closelm/log 1.39452
exp/sgmm_5a/decode_wide_eval_closelm/log 1.71265
exp/tri5a/decode_wide_eval_closelm/log 2.29062
exp/tri5a_fmmi_b0.1/decode_wide_eval_closelm_iter8/log 2.66123
exp/tri5a_mmi_b0.1/decode_wide_eval_closelm/log 2.61595
exp/tri5a_pretrain-dbn_dnn_smbr/decode_closelm_it2_dnnwide/log 2.18625
#
# 28M size L.fst, 76M size HCLG.fst
exp/nnet_4m_3l/decode_wide_eval/log 2.01065
exp/nnet_8m_6l/decode_wide_eval_rerun/log 2.16128
exp/nnet_tanh_3l/decode_wide_eval/log 2.16153
exp/nnet_tanh_6l/decode_wide_eval/log 2.09993
exp/sgmm_5a/decode_wide_eval/log 2.28183
exp/tri5a/decode_wide_eval/log 3.09584
exp/tri5a_fmmi_b0.1/decode_wide_eval_iter8/log 4.32505
exp/tri5a_mmi_b0.1/decode_wide_eval/log 4.14296
exp/tri5a_pretrain-dbn_dnn_smbr/decode_it2_dnnwide/log 3.08541
## 28M size L.fst, 76M size HCLG.fst
nnet_4m_3l/decode_wide_eval_xeon3.5/log/decode.1.log:LOG 0.964501
nnet_4m_3l/decode_wide_eval_xeon3.5/log/decode.2.log:LOG 0.909089
nnet_8m_6l/decode_wide_eval_xeon3.5/log/decode.1.log:LOG 1.05101
nnet_8m_6l/decode_wide_eval_xeon3.5/log/decode.2.log:LOG 0.993278
nnet_tanh_3l/decode_wide_eval_xeon3.5/log/decode.1.log:LOG 0.97988
nnet_tanh_3l/decode_wide_eval_xeon3.5/log/decode.2.log:LOG 1.02113
nnet_tanh_6l/decode_wide_eval_xeon3.5/log/decode.1.log:LOG 0.983241
nnet_tanh_6l/decode_wide_eval_xeon3.5/log/decode.2.log:LOG 0.924768
sgmm_5a/decode_wide_eval_xeon3.5/log/decode_pass1.1.log:LOG 1.138
sgmm_5a/decode_wide_eval_xeon3.5/log/decode_pass1.2.log:LOG 1.14137
tri5a/decode_wide_eval_xeon3.5/log/decode.1.log:LOG 1.34334
tri5a/decode_wide_eval_xeon3.5/log/decode.2.log:LOG 1.34979
tri5a_fmmi_b0.1/decode_wide_eval_iter8_xeon3.5/log/decode.1.log:LOG 1.7576
tri5a_fmmi_b0.1/decode_wide_eval_iter8_xeon3.5/log/decode.2.log:LOG 1.92319
tri5a_mmi_b0.1/decode_wide_eval_xeon3.5/log/decode.1.log:LOG 1.67702
tri5a_mmi_b0.1/decode_wide_eval_xeon3.5/log/decode.2.log:LOG 1.80603
tri5a_pretrain-dbn_dnn_smbr/decode_it2_dnnwide_xeon3.5/log/decode.1.log:LOG 1.20916
tri5a_pretrain-dbn_dnn_smbr/decode_it2_dnnwide_xeon3.5/log/decode.2.log:LOG 1.0359
#!/bin/bash
# Apache 2.0. Copyright 2013, Hong Kong University of Science and Technology (author: Ricky Chan Ho Yin)
#
# Calculates the average decoding real-time factor of a decoding directory by
# using the run time information inside its logs.
#
# Usage: cal_runtime.sh decode_directory [framePerSecond]
#   decode_directory  directory that contains log/decode*.log
#   framePerSecond    frame rate of the input features; defaults to 100.0
#                     (i.e. 10ms sliding) when omitted or empty
#
# Output (stdout): "<decode_directory>/log<TAB><real-time factor>", where
#   real-time factor = summed "Time taken" seconds / (summed frames / framePerSecond)
# Diagnostics go to stderr.
# Exit status: 0 on success; 1 on usage error, missing log directory, missing
# log files, or when no usable timing/frame information is found.
#
# NOTE: only POSIX sh constructs are used on purpose, so the script also works
# when it is launched through "sh" instead of bash.

if [ $# -ne 1 ] && [ $# -ne 2 ]; then
  {
    echo "Usage: $0 decode_directory [framePerSecond]"
    echo ""
    echo "## The default framerate framePerSecond = 100 i.e. 10ms sliding for input features during decoding"
  } >&2
  exit 1
fi

decodeDIR=$1
framePerSecond=${2:-100.0}
logDIR=$decodeDIR/log

if [ ! -d "$logDIR" ]; then
  echo "decoding directory $logDIR not exist" >&2
  exit 1
fi

# Expand the glob into the positional parameters (the arguments were saved
# above) so that an unmatched pattern can be detected instead of being handed
# to tail as a literal file name.
set -- "$logDIR"/decode*.log
if [ ! -e "$1" ]; then
  echo "no decode*.log files found in $logDIR" >&2
  exit 1
fi

# Only the tail of each log is scanned. The result is computed before anything
# is printed so that a failure never leaves a half-written output line behind.
# The status of the pipeline is the status of awk, its last command.
rtf=$(
  tail -- "$@" \
    | grep -E -e 'Time taken .* real-time|Overall log-likelihood per frame' \
    | awk -v fps="$framePerSecond" '
        BEGIN { sumTime = 0; sumFrame = 0 }
        / Time taken / {
          # Line shape: "... Time taken <seconds>s: real-time factor ..."
          # pos is the blank before <seconds>, pos2 is the "s" that follows it.
          pos = match($0, " [0-9.]+s:")
          pos2 = match($0, "s: real-time factor")
          sumTime += substr($0, pos + 1, pos2 - pos - 1)
          next
        }
        {
          # "Overall log-likelihood per frame" line: the second-to-last field
          # is accumulated as the frame count.
          sumFrame += $(NF - 1)
        }
        END {
          # Refuse to divide by zero (no frames found, or a bad frame rate).
          if (sumFrame <= 0 || fps + 0 <= 0) exit 1
          print sumTime / (sumFrame / fps)
        }
      '
) || {
  echo "could not compute real-time factor from logs in $logDIR (framePerSecond=$framePerSecond)" >&2
  exit 1
}

# The path is passed as data, never as the printf format string.
printf '%s\t%s\n' "$logDIR" "$rtf"
......@@ -115,10 +115,10 @@ local/ext/score.sh data/eval exp/tri5a/graph_closelm exp/sgmm_5a_mmi_b0.1/decode
local/ext/score.sh data/eval exp/tri5a/graph_closelm exp/sgmm_5a_mmi_b0.1/decode_wide_eval_closelm_2
local/ext/score.sh data/eval exp/tri5a/graph_closelm exp/sgmm_5a_mmi_b0.1/decode_wide_eval_closelm_3
local/ext/score.sh data/eval exp/tri5a/graph_closelm exp/sgmm_5a_mmi_b0.1/decode_wide_eval_closelm_4 # sgmm+bMMI
local/ext/score.sh data/eval exp/tri5a/graph_closelm exp/nnet_8m_6l/decode_nnwide_eval_closelm # nnet 6 layers (983 neurons)
local/ext/score.sh data/eval exp/tri5a/graph_closelm exp/nnet_tanh_6l/decode_wide_eval_closelm # nnet2 6 layers (1024 neurons)
local/ext/score.sh data/eval exp/tri5a/graph_closelm exp/nnet_4m_3l/decode_wide_eval_closelm # nnet 4 layers (823 neurons)
local/ext/score.sh data/eval exp/tri5a/graph_closelm exp/tri5a_pretrain-dbn_dnn/decode_closelm_dnnwide # pretrained 6 layers RBM DNN
local/ext/score.sh data/eval exp/tri5a/graph_closelm exp/nnet_8m_6l/decode_nnwide_eval_closelm # nnet 6 hidden layers (983 neurons)
local/ext/score.sh data/eval exp/tri5a/graph_closelm exp/nnet_tanh_6l/decode_wide_eval_closelm # nnet2 6 hidden layers (1024 neurons)
local/ext/score.sh data/eval exp/tri5a/graph_closelm exp/nnet_4m_3l/decode_wide_eval_closelm # nnet 3 hidden layers (823 neurons)
local/ext/score.sh data/eval exp/tri5a/graph_closelm exp/tri5a_pretrain-dbn_dnn/decode_closelm_dnnwide # pretrained 6 hidden layers RBM DNN
local/ext/score.sh data/eval exp/tri5a/graph_closelm exp/tri5a_pretrain-dbn_dnn_smbr/decode_closelm_it1_dnnwide
local/ext/score.sh data/eval exp/tri5a/graph_closelm exp/tri5a_pretrain-dbn_dnn_smbr/decode_closelm_it2_dnnwide # state level minimum bayes risk DNN
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment