Skip to content
GitLab
Projects
Groups
Snippets
Help
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Open sidebar
LINAGORA
L
LGS
Labs
kaldi-modelgen
Commits
5f9e8281
Commit
5f9e8281
authored
Dec 04, 2017
by
Abdelwahab HEBA
Browse files
add new modif
parent
0fbad8fa
Changes
5
Expand all
Hide whitespace changes
Inline
Side-by-side
Showing
5 changed files
with
105376 additions
and
1314 deletions
+105376
-1314
Run_ESTER1_2.ipynb
Run_ESTER1_2.ipynb
+319
-1311
cmu_dict/lexicon_new.dict
cmu_dict/lexicon_new.dict
+105052
-0
local/format_lms.sh
local/format_lms.sh
+2
-1
local/lm/train_lm.sh
local/lm/train_lm.sh
+1
-1
local/parseESTERSyncV2.py
local/parseESTERSyncV2.py
+2
-1
No files found.
Run_ESTER1_2.ipynb
View file @
5f9e8281
This diff is collapsed.
Click to expand it.
cmu_dict/lexicon_new.dict
0 → 100644
View file @
5f9e8281
This diff is collapsed.
Click to expand it.
local/format_lms.sh
View file @
5f9e8281
...
...
@@ -43,7 +43,8 @@ trap "rm -r $tmpdir" EXIT
mkdir
-p
$tmpdir
#for lm_suffix in tgsmall tgmed tglarge fglarge; do
for
lm_suffix
in
fglarge tglarge tgsphinx french-small mixed
;
do
#for lm_suffix in fglarge tglarge tgsphinx french-small mixed; do
for
lm_suffix
in
sg
;
do
#for lm_suffix in fglarge; do
#for lm_suffix in mixed; do
#for lm_suffix in linto1; do
...
...
local/lm/train_lm.sh
View file @
5f9e8281
...
...
@@ -39,7 +39,7 @@ lm_dir=$4
[[
-d
"
$corpus_dir
"
]]
||
{
echo
"No such directory '
$corpus_dir
'"
;
exit
1
;
}
# Normalize data
normjobs
=
2
normjobs
=
3
2
split_prefix
=
$tmp_dir
/split
if
[
"
$stage
"
-le
1
]
;
then
...
...
local/parseESTERSyncV2.py
View file @
5f9e8281
...
...
@@ -371,7 +371,8 @@ if __name__=="__main__":
if
spk
[
0
]
in
Spk_that_contribute_to_meeting
:
spk_id
=
str
(
basename
)
+
'_%s-%03d'
%
(
str
(
re
.
sub
(
'\d+'
,
''
,
spk
[
0
])),
int
(
re
.
sub
(
'[a-zA-Z]'
,
''
,
spk
[
0
])))
spk2gender
.
write
(
spk_id
+
" "
+
spk
[
1
]
+
"
\n
"
)
wav_scp
.
write
(
basename
+
" sox "
+
os
.
path
.
dirname
(
file_trs
)
+
'/'
+
basename
+
'.wav'
+
" -t wav -r 16000 -c 1 - |
\n
"
)
wav_scp
.
write
(
basename
+
" ffmpeg-normalize "
+
os
.
path
.
dirname
(
file_trs
)
+
'/'
+
basename
+
'.wav'
+
" && sox "
+
os
.
path
.
dirname
(
file_trs
)
+
'/normalized-'
+
basename
+
'.wav'
+
" -t wav -r 16000 -c 1 - |
\n
"
)
# wav_scp.write(basename+" sox --norm "+os.path.dirname(file_trs) + '/normalized-' + basename + '.wav'+" -t wav -r 16000 -c 1 - |\n")
segments_file
.
close
()
utt2spk_file
.
close
()
text_file
.
close
()
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment