From 3f6befcc02850e8097acfb4aa9ed77347c1e7d50 Mon Sep 17 00:00:00 2001 From: dohe0342 Date: Tue, 14 Mar 2023 17:03:23 +0900 Subject: [PATCH] from local --- egs/librispeech/ASR/.prepare_vox.sh.swp | Bin 4096 -> 16384 bytes egs/librispeech/ASR/prepare_vox.sh | 61 ++++++++++++++++++++++++ 2 files changed, 61 insertions(+) diff --git a/egs/librispeech/ASR/.prepare_vox.sh.swp b/egs/librispeech/ASR/.prepare_vox.sh.swp index 7fd48707a35f042914c8ad108140d189a6b344f3..36108be5a8014d01da2e6a31a84d4643a511a284 100644 GIT binary patch literal 16384 zcmeI3du$v>9mj{#CUrg4X+I8Ju=&UWm^sS9=xms?kOMN-Og_w`<%|~x0jZDPZUTLxM2mVeo?x23mF{9iK(7WZKdyd_mLaU zo){(yBnl)7Bnl)7Bnl)7Bnl)7BntfhE8sh~kdNawZV7LNf99{Z1#j{D+r#fHe1Ett zJ^Y%yB?=@8Bnl)7Bnl)7Bnl)7Bnl)7Bnl)7Bnl)7ya^RhbwYa4t}z|}!0-Rj`TsBP zB;+c19O&Rf;C`?Z>;S#s{a_2&41RS7Ay0rapbiS)F7Vqeg!~3P2R;cN1V=#@Yyp4W zOvokhEcgmo0S!gOI<2E8r4%9$W-ZfzNYy|(|3^#rDh0P3@t&O(->r^f=v0B}R4CSCwKxwU!il>Lc^wkq=q7 zEk+mjP-L-SU0Ko%mr72PF|L|+iKga#wZ!P)DBWvUoT|^LC`z>Ds9jGHQBlSdR+0%z zx=8Q22bJTR?c~D*UPN3UDHgk20!yUbVuYpz70x zU8QBU2C?mB%d}OU>0H{dp_=VFRS)@^1RWTqhl59MLZhh0^@xnfX93cON*sQXwqyB z(Q0uoaXEy&;#Zt}W?8Kj4b13fwSwd*DJqdt&#qIcMziwnYnW5XrMcm3Hp|_TXOt|a zONQmM5_3D`YHkDRNrwW4jf!gKV=ZbYA8)+DdDHOx&xu)C+4-E|sulKmkf^{0F!l6V)kxM3MM4FzJBwAs<%DtJadA0Z=A8_1- zz=Tp^#utE=3pxwUBLi180&m4jg-SvGbrthMkHLXijC(CR_OemSsH(w(>3lSWjxdk= z_wn6R`i0oCU-zkLEHPSOroAj$b%P! z&mNiE%Z<|MemGCw6$@pd|6zFNL;rP5WUCcd;x%?&#Uq&(GrU_qZGLJ?HIxRF> zvf(LF)KbG(;WI!~AQQs-Ygaalzd1~BybT0zxRxa~EG>n+XPjZ)SRZQPnG{pCO8J7r z@{LA=FV=j$R9#nXP|db{3|)`b>-C)!$;dM4(`5sVi<;F|2DgNjs0gm*47MqJ6=Lu% zmWGXk!SJ_Y>&*1fSebfd+=i~;kynr9ZHG(k;kj3O_AF&}!>2jy#KrDnOxZV~O!0?h zgPl{}S6u~u0hRHWgq4mzLmPj!Y{O&mH*8G|jikfxl$L$p8C8_!nm>|Rku2M- z@X0He&O{C1xz|h}26}^=bW9g|x2FzCC0DJ;s_UrDnVK%QRW}%9a4rq-*3T+pB|o@U6|cFJC&a}a^S%Jx%vFzV+#joXY!NNho|;W@1I#1UznVo84L2^E{aAS z-l9~2!+wax)@MZ8AI0G6$1tZ{n;BPq7{{nmqd;v({GS2QVg71Ng;3;q( z6u}RlaF+iG_yM>8&V$c^$G{0N1pbLL{T1*6coHmu17IB755~YI@Ozx+p9lQB z?}Aw{2wp>9Tn4XzAA;`#-ak)+^MIfG9|3dVUa$jf0s5v1%cdR+}Zsi7~b~t#;#HNKonUD zT2D)uC>;iiDP1O^bU)ASZOcL98hVc?GSF_9S_&>U;Uj3IbXFs(jkBEtAJY z_-cz+FyaQ|Jy=aO4Q#krK3d`UPZ%cxYrd1>rSPa;P@Z@E!;7n79392+M6booMU7B+ zY+2z^beIWkjs_KpP!*5$iAIafT9hZntvh!_WFke))mwL7$k}}?blLR2DR!g(0hM33 A!vFvP delta 16 XcmZo@U~Ev>@RE7r0oKj$n1y%%Ik^T_ diff --git a/egs/librispeech/ASR/prepare_vox.sh b/egs/librispeech/ASR/prepare_vox.sh index 49fdf831f..619e4d37a 100755 --- a/egs/librispeech/ASR/prepare_vox.sh +++ b/egs/librispeech/ASR/prepare_vox.sh @@ -165,3 +165,64 @@ if [ $stage -le 5 ] && [ $stop_stage -ge 5 ]; then done fi +if [ $stage -le 6 ] && [ $stop_stage -ge 6 ]; then + log "Stage 1: Prepare LJSpeech manifest" + # We assume that you have downloaded the LJSpeech corpus (ver 1.1) + # You need to prepare LJSpeech according to data_settings/*_list.txt like below + # $dl_dir/LJSpeech + # |-- wavs + # | |-- train + # | |-- dev + # | |-- test + # |-- texts + # |-- metadata.csv + + # to $dl_dir/LJSpeech + if [ ! -e $dl_dir/vox/.vox.done ]; then + #for dset in "4446"; do + # log "Resampling vox/$dset set" + # file_list=`ls $dl_dir/vox/$dset/` + # for wavfile in $file_list; do + # echo $wavfile + # sox -v 0.9 $dl_dir/vox/$dset/$wavfile -r 16000 -e signed-integer $dl_dir/vox/$dset/tmp_$wavfile + # mv $dl_dir/vox/$dset/tmp_$wavfile $dl_dir/vox/$dset/$wavfile + # done + # log "Resampling $dset done" + #done + + mkdir -p data/manifests + if [ ! -e data/manifests/.vox.done ]; then + for dest in "test-clean" "test-other"; do + for spk in $dl_dir/$dest/*; do + spk_id=${spk#*$dest\/} + python local/prepare_vox.py $dl_dir/$dest "$spk_id" + done + done + #touch data/manifests/.vox.done + fi +fi + +if [ $stage -le 7 ] && [ $stop_stage -ge 7 ]; then + log "Stage 7: Prepare musan manifest" + # We assume that you have downloaded the musan corpus + # to data/musan + mkdir -p data/manifests + if [ ! -e data/manifests/.musan.done ]; then + lhotse prepare musan $dl_dir/musan data/manifests + touch data/manifests/.musan.done + fi +fi + +if [ $stage -le 3 ] && [ $stop_stage -ge 3 ]; then + log "Stage 3: Compute fbank for Vox" + mkdir -p data/fbank + if [ ! -e data/fbank/.LJSpeech.done ]; then + for dest in "test-clean" "test-other"; do + for spk in $dl_dir/$dest/*; do + spk_id=${spk#*$dest\/} + ./local/compute_fbank_vox.py --data-dir $spk --spk-id $spk_id + done + done + #touch data/fbank/.vox.done + fi +