Skip to content

Commit 98d5f82

Browse files
authored
Merge pull request espnet#3324 from pengchengguo/swbd_fix
Fix a typo in the swbd data preparation.
2 parents 3a49b02 + b89f2e3 commit 98d5f82

File tree

5 files changed

+7
-6
lines changed

5 files changed

+7
-6
lines changed

egs/swbd/asr1/local/eval2000_data_prep.sh

+1-1
Original file line numberDiff line numberDiff line change
@@ -40,7 +40,7 @@ tdir=$2
4040
dir=data/local/eval2000
4141
mkdir -p $dir
4242

43-
find $sdir/english -iname '*.sph' | sort > $dir/sph.flist
43+
find -L $sdir/english -iname '*.sph' | sort > $dir/sph.flist
4444
sed -e 's?.*/??' -e 's?.sph??' $dir/sph.flist | paste - $dir/sph.flist \
4545
> $dir/sph.scp
4646

egs/swbd/asr1/local/fisher_data_prep.sh

+2-2
Original file line numberDiff line numberDiff line change
@@ -69,10 +69,10 @@ fi
6969

7070
if [ $stage -le 0 ]; then
7171

72-
find $links/fe_03_p1_tran/data $links/fe_03_p2_tran/data -iname '*.txt' > $tmpdir/transcripts.flist
72+
find -L $links/fe_03_p1_tran/data $links/fe_03_p2_tran/data -iname '*.txt' > $tmpdir/transcripts.flist
7373

7474
for dir in fe_03_p{1,2}_sph{1,2,3,4,5,6,7}; do
75-
find $links/$dir/ -iname '*.sph'
75+
find -L $links/$dir/ -iname '*.sph'
7676
done > $tmpdir/sph.flist
7777

7878
n=`cat $tmpdir/transcripts.flist | wc -l`

egs/swbd/asr1/local/rt03_data_prep.sh

+1-1
Original file line numberDiff line numberDiff line change
@@ -29,7 +29,7 @@ rtroot=$sdir
2929
tdir=$sdir/data/references/eval03/english/cts
3030
sdir=$sdir/data/audio/eval03/english/cts
3131

32-
find $sdir -iname '*.sph' | sort > $dir/sph.flist
32+
find -L $sdir -iname '*.sph' | sort > $dir/sph.flist
3333
sed -e 's?.*/??' -e 's?.sph??' $dir/sph.flist | paste - $dir/sph.flist \
3434
> $dir/sph.scp
3535

egs/swbd/asr1/local/swbd1_data_prep.sh

+1-1
Original file line numberDiff line numberDiff line change
@@ -46,7 +46,7 @@ sph2pipe=sph2pipe
4646
echo "SWBD dictionary file does not exist" && exit 1;
4747

4848
# find sph audio files
49-
find $SWBD_DIR -iname '*.sph' | sort > $dir/sph.flist
49+
find -L $SWBD_DIR -iname '*.sph' | sort > $dir/sph.flist
5050

5151
n=`cat $dir/sph.flist | wc -l`
5252
[ $n -ne 2435 ] && [ $n -ne 2438 ] && \

egs2/swbd/asr1/local/data.sh

+2-1
Original file line numberDiff line numberDiff line change
@@ -78,10 +78,11 @@ if [ ${stage} -le 1 ] && [ ${stop_stage} -ge 1 ]; then
7878
fi
7979

8080
if [ ${stage} -le 2 ] && [ ${stop_stage} -ge 2 ]; then
81+
log " Data Formatting"
8182
# remove ._ . _1 symbols from text
8283
cp data/train_nodup/text data/train_nodup/text.backup
8384
cp data/train_dev/text data/train_dev/text.backup
84-
sed -i 's/\._/ /g; s/\.//g; s/them_1/them/g' data/trian_nodup/text
85+
sed -i 's/\._/ /g; s/\.//g; s/them_1/them/g' data/train_nodup/text
8586
sed -i 's/\._/ /g; s/\.//g; s/them_1/them/g' data/train_dev/text
8687
fi
8788

0 commit comments

Comments
 (0)