Movatterモバイル変換


[0]ホーム

URL:


Skip to content

Navigation Menu

Sign in
Appearance settings

Search code, repositories, users, issues, pull requests...

Provide feedback

We read every piece of feedback, and take your input very seriously.

Saved searches

Use saved searches to filter your results more quickly

Sign up
Appearance settings
This repository was archived by the owner on Aug 23, 2023. It is now read-only.
/zeroth (Public archive)

Commit 43183c9

Browse files
committed
update: included train_data_03 in data sets. now 95.7 hours of audio data is available. run.sh will be updated and verified soon
1 parent 47ecfce, commit 43183c9

File tree

1 file changed

+8
-7
lines changed

1 file changed

+8
-7
lines changed

‎s5/run.sh‎

Lines changed: 8 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -34,21 +34,21 @@ startTime=$(date +'%F-%H-%M')
3434
echo "started at" $startTime
3535

3636
# download the data.
37-
for part in train_data_01 train_data_02 test_data_01; do
37+
for part in train_data_01 train_data_02 train_data_03 test_data_01; do
3838
local/download_and_untar.sh $data $part
3939
done
4040

4141
# download the LM resources
4242
local/download_lm.sh data/local/lm
4343

4444
# format the data as Kaldi data directories
45-
for part in train_data_01 train_data_02 test_data_01; do
45+
for part in train_data_01 train_data_02 train_data_03 test_data_01; do
4646
# use underscore-separated names in data directories.
4747
local/data_prep.sh $data/$part data/$(echo $part | sed s/-/_/g)
4848
done
4949

5050
# update segmentation of transcripts
51-
for part in train_data_01 train_data_02 test_data_01; do
51+
for part in train_data_01 train_data_02 train_data_03 test_data_01; do
5252
local/updateSegmentation.sh data/$part data/local/lm
5353
done
5454

@@ -74,10 +74,10 @@ mfccdir=mfcc
7474
hostInAtlas="ares hephaestus jupiter neptune"
7575
if [[ ! -z $(echo $hostInAtlas | grep -o $(hostname -f)) ]]; then
7676
mfcc=$(basename mfccdir) # in case was absolute pathname (unlikely), get basename.
77-
utils/create_split_dir.pl /mnt/{ares,hephaestus,jupiter,neptune}/$USER/kaldi-data/zeroth-kaldi/s5/$mfcc/storage \
77+
utils/create_split_dir.pl /mnt/{ares,hephaestus,jupiter,neptune}/$USER/kaldi-data/zeroth/s5/$mfcc/storage \
7878
$mfccdir/storage
7979
fi
80-
for part in train_data_01 train_data_02 test_data_01; do
80+
for part in train_data_01 train_data_02 train_data_03 test_data_01; do
8181
steps/make_mfcc.sh --cmd "$train_cmd" --nj $nCPU data/$part exp/make_mfcc/$part $mfccdir
8282
steps/compute_cmvn_stats.sh data/$part exp/make_mfcc/$part $mfccdir
8383
done
@@ -86,10 +86,11 @@ done
8686
utils/combine_data.sh data/merged data/train_data_01 data/test_data_01
8787
local/split_dataset.sh --ratio 20 data/merged data/trainset_01 data/testset_01
8888
local/split_dataset.sh --ratio 20 data/train_data_02 data/trainset_02 data/testset_02
89+
local/split_dataset.sh --ratio 20 data/train_data_03 data/trainset_03 data/testset_03
8990

9091
# Merge trainsets and testsets
91-
utils/combine_data.sh data/train_clean data/trainset_01 data/trainset_02
92-
utils/combine_data.sh data/test_clean data/testset_01 data/testset_02
92+
utils/combine_data.sh data/train_clean data/trainset_01 data/trainset_02 data/trainset_03
93+
utils/combine_data.sh data/test_clean data/testset_01 data/testset_02 data/testset_03
9394

9495
# Make some small data subsets for early system-build stages.
9596
utils/subset_data_dir.sh --shortest data/train_clean 2000 data/train_2kshort

0 commit comments

Comments
 (0)

[8]ページ先頭

©2009-2025 Movatter.jp