Make test transcript:
...
Copy preexisting test transcript:
cp /disk/scratch/oliver//data/nick_hurricaine/test_transcript.csv /disk/scratch/oliver//data/LJSpeech-1.1/
./util/submit_tf.sh ./synthesize.py -c ./config/lj_01.cfg -N 10
./util/submit_tf.sh synthesise_validation_waveforms.py -c ./config/lj_01.cfg
===
cd /disk/scratch/oliver/data/nick
cp -rs /afs/inf.ed.ac.uk/group/cstr/projects/corpus_1/Nick48kHz/wav ./wav/
rm -rf /disk/scratch/oliver/data/nick/transcript_1.csv
# Build the Nick transcript: append one "<utterance id>||<text>" line to
# transcript_1.csv for every herald* prompt file in the corpus txt directory.
for TXT in /afs/inf.ed.ac.uk/group/cstr/projects/corpus_1/Nick48kHz/txt/herald* ; do
  # If the glob matches nothing it stays literal; skip it instead of cat-ing a bogus path.
  [ -e "$TXT" ] || continue
  # Utterance id = file name without directory and without the .txt suffix.
  BASE=$(basename "$TXT" .txt)
  TEXT=$(cat "$TXT")
  # The fields are passed quoted to printf so that "||" is written literally
  # (unquoted it is the shell OR operator and nothing reaches the CSV) and the
  # prompt text is not word-split or glob-expanded.
  printf '%s||%s\n' "$BASE" "$TEXT" >> /disk/scratch/oliver/data/nick/transcript_1.csv
done
./util/submit_tf_cpu.sh ./prepo.py -c ./config/nick_01.cfg -ncores 25
VCTK data:
(waffler) [stardale]owatts: ./util/submit_tf_cpu.sh ./script/split_speech.py -w $DATADIR/wav_norm/ -o $DATADIR/wav_trim/ -dB 15 -ncores 25 -trimonly
It will probably be most convenient to have a central copy of the repository in AFS space, and to synchronise this with local copies on the GPU machines you are using. The script sync_code_from_afs.sh can be used to keep various versions in sync without pushing to git. E.g., if you are working in scratch space on a GPU machine:
mkdir /disk/scratch/oliver/dc_tts_osw
cd /disk/scratch/oliver/dc_tts_osw
mkdir util
cp ~/repos/dc_tts_osw/util/sync_code_from_afs.sh ./util/
./util/sync_code_from_afs.sh
get data
mkdir /disk/scratch/oliver/data/roger/
cp -rs /afs/inf.ed.ac.uk/group/cstr/projects/corpus_1/CSTR-Private/Roger/peter-release/48kHz/ /disk/scratch/oliver/data/roger/wav/
python ./script/normalise_level.py -i /disk/scratch/oliver/data/roger/wav/ -o /disk/scratch/oliver/data/roger/wav_norm/ -ncores 30
./util/submit_tf_cpu.sh ./script/split_speech.py -w /disk/scratch/oliver/data/roger/wav_norm/ -o /disk/scratch/oliver/data/roger/wav_trim/ -dB 30 -ncores 30 -trimonly
cp /afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/roger/transcript.csv /disk/scratch/oliver/data/roger/transcript.csv
cp /afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/nick_hurricaine/test/test_transcript.csv /disk/scratch/oliver/data/roger/
python ./script/check_transcript.py -i /disk/scratch/oliver/data/roger/transcript.csv -phone
./util/submit_tf_cpu.sh ./prepo.py -c ./config/roger_01.cfg -ncores 20
python ./script/check_transcript.py -i /disk/scratch/oliver/data/roger/transcript.csv -phone -cmp ./work/roger_mags
./util/submit_tf.sh ./train.py -c ./config/roger_01.cfg -m 1
./util/submit_tf.sh ./synth_sweep_devset.py -c ./config/roger_02.cfg -m 2
(waffler) [stardale]owatts: ./util/submit_tf.sh synth_sweep_devset.py -c ./config/roger_02.cfg -m 1
/disk/scratch/oliver/dc_tts_osw/work//roger_02/train-2/archive/model_gs_380k
./util/submit_tf.sh synth_sweep_devset.py -c ./config/roger_02.cfg -m 1 -ssrn /disk/scratch/oliver/dc_tts_osw/work//roger_02/train-2/archive/model_gs_380k
Data here: /group/project/cstr2/owatts/vctk_voices_ossian/VCTK-Corpus/
Make VCTK transcripts:-
mkdir /disk/scratch/oliver/data/vctk
python ./script/datasets/gather_vctk_transcript.py -i /group/project/cstr2/owatts/vctk_voices_ossian/VCTK-Corpus/txt/ -o /disk/scratch/oliver/data/vctk/utts.data
cd /disk/scratch/oliver/data/vctk/
FEST=/afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/tool/festival/festival/bin/festival
SCRIPT=/afs/inf.ed.ac.uk/user/o/owatts/repos/dc_tts_osw/script/festival/make_rich_phones_combirpx_noplex.scm
$FEST -b $SCRIPT | grep KEEP | sed 's/KEEP//' | tee ./transcript1.csv
cd /disk/scratch/oliver/dc_tts_osw/
python script/check_transcript.py -i /disk/scratch/oliver/data/vctk/transcript1.csv -phone
python script/festival/fix_transcript.py /disk/scratch/oliver/data/vctk/transcript1.csv B C I It K M N P R She V age dot imposition position there wide > /disk/scratch/oliver/data/vctk/transcript.csv
[stardale]owatts: awk -F_ '{print $1}' /disk/scratch/oliver/data/vctk/transcript.csv > /tmp/spkr.txt
[stardale]owatts: mv /disk/scratch/oliver/data/vctk/transcript.csv /disk/scratch/oliver/data/vctk/transcript.csv
transcript1.csv transcript.csv
[stardale]owatts: mv /disk/scratch/oliver/data/vctk/transcript.csv /disk/scratch/oliver/data/vctk/transcript2.csv
[stardale]owatts: paste -d | /disk/scratch/oliver/data/vctk/transcript2.csv /tmp/spkr.txt > /disk/scratch/oliver/data/vctk/transcript.csv
-bash: /disk/scratch/oliver/data/vctk/transcript2.csv: Permission denied
paste: option requires an argument -- 'd'
Try 'paste --help' for more information.
[stardale]owatts: paste -d'|' /disk/scratch/oliver/data/vctk/transcript2.csv /tmp/spkr.txt > /disk/scratch/oliver/data/vctk/transcript.csv
python ./script/normalise_level.py -i /group/project/cstr2/owatts/vctk_voices_ossian/wav/ -o /disk/scratch/oliver/data/vctk/wav_norm/ -ncores 25
./util/submit_tf_cpu.sh ./script/split_speech.py -w /disk/scratch/oliver/data/vctk/wav_norm/ -o /disk/scratch/oliver/data/vctk/wav_trim/ -dB 30 -ncores 25 -trimonly
./util/submit_tf_cpu.sh ./prepo.py -c ./config/vctk_01.cfg -ncores 25
python script/check_transcript.py -i /disk/scratch/oliver/data/vctk/transcript.csv -phone -cmp ./work/vctk_mags/
python script/check_transcript.py -i /disk/scratch/oliver/data/vctk/transcript.csv -phone -cmp ./work/vctk_mags/ -maxframes 400 -maxletters 80 -speaker
HERE!!!!!!!!!!!!
./util/submit_tf.sh ./train.py -c ./config/vctk_01.cfg -m 1
./util/submit_tf.sh ./train.py -c ./config/vctk_01.cfg -m 2
cp /disk/scratch/oliver/data/roger/test_transcript.csv /disk/scratch/oliver/data/vctk
./util/submit_tf.sh ./synthesize.py -c ./config/vctk_01.cfg -speaker p225
===== nancy phones =====
(waffler) [starleader]owatts: pwd
/disk/scratch/oliver/data/nancy
cp prompts.data utts.data
emacs /afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/tool/festival/festival/lib/combilex_phones.scm
FEST=/afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/tool/festival/festival/bin/festival
SCRIPT=/afs/inf.ed.ac.uk/user/o/owatts/repos/dc_tts_osw/script/festival/make_rich_phones_combirpx_noplex.scm
$FEST -b $SCRIPT | grep KEEP | sed 's/KEEP//' | tee ./transcript1.csv
cd /disk/scratch/oliver/dc_tts_osw/
python script/check_transcript.py -i /disk/scratch/oliver/data/nancy/transcript1.csv -phone
python script/festival/fix_transcript.py /disk/scratch/oliver/data/nancy/transcript1.csv A African B Bradley COLUMN Constitution D Dyson E Gore Herald I Israel Joyner Kettering L Ledger Lewinsky M Marting Marts Mifflin Minimalism Moraine N O Packard ROM S Saturdays Speech T Time To Torricelli Two U V Walker War Weaver West Wolf World a access actualized adolescents adult adulthood after age alone along always american americanism and arranger atlantic author authored awaited away axis bang banging barr based bats be bearing bed bedroom being benefit berries birds black blended blood bodied born borne bottomed bound boxing boy brained breaking breathers bred broadway brow building built burner busting calorie cancer candid card care carpenter carpet case catch cell cells center centeredness central cents century chalk changing charge chief child chin class clearing clock closing club cock colored colour company comte concrete cone conserving consistently constitution constructing control counseling counter couture d dance daughter day death deceiving decorated deeper degradation demand democratic destruction detecting diamonds diet digit dimensional disabled diversity do doctoral dog doing dollar dollars door dormant dramatic drenched dried driven drug dumping duty dwelling ear eating ed edge edged effects efficient eight elite emphasize encrusted engage englishman enter enterprises epilepsy eroding ever evolved evolving examination executivedom expressing eye eyed fabric face facing falling farm fascist fat fault feast feathered fed feeder feeling fetus fever fictional field fifth file filled finance fire fired first fishing five-hour flying focused food foot footed for forbidden foreman founder four fourth free friendly front frontal fruit funded game gas generated generation generational ghali girlfriend go gold government grader grandchildren grandparents grass green ground growing guard guidance h haired hand handed hating head headed health heavy heels hero 
high hill hit home hop hoped hops hormonal host hours human hundred in inch income indicative induced indulgent industries industry infant infective intelligence investment iron it january jewish job jobs july justice key kinesthetic knacks knife laden largest lashed lasting law leading led leg legged less lettered level life like liked limbed limited line liners list lit lived long looking loving low m making man management managers manufactured marketed married mathematical may mellon menopausal miller million minded minute miracles mob moded modified month morning motivation mouthed mover naked native neighbors nested neutral news nineteenth nonsense nosed nursing obsessed of off offered offs old on only opener opening ops optic or ordered organization organized ourselves out outside over owned paid painted pan par part party paying pearl peer per pitched placement planned plate policy polluted poor pots poverty president pressure price print producing production profile profit profits prone protector publicized racer radio rail raiser raisers ramps ranch range ranking rare rate ray raying read real received red referred reflective rejection rejuvenating related reliant replacement report reproducing resident restricted review reviewed rex righteous road rock rocketing rotating rubbing run running salted satisfied saturated savoy scan school scoring sealed seated secondary seizure september sergeant service sessions setting settled seventies sex shaped share sharing sharp shattering shaven shell shelled shot shouldered show sided sit sitting size sized smart smelling sniffing society soil soldier sour specific speech spend spirit spoken spouse spouses square stage staid star started stealing steer step sticky still stitched stocked stomach stop striped strong studded studies style suk sulphur supervisory support swept tag tailed talk tea tech temps ten tension tent than the therapy thick thieves thin thinking thousand threatening thrill through throw thrust 
thumping tiled timbered time tipped to tolerant tome top tough town trade training transmitting tricarico tries tse tuned twentieth two typical unit up upmanship ups using veto view voiced wage watch wave way wear web weird western whaling white wide wife willed win wink wise with won worker workers worthy ya year years your zionist zip zone > /disk/scratch/oliver/data/nancy/transcript_combilex2.csv
cp -rs /disk/scratch/oliver/dc_tts/work/nancy_mels ./work/nancy_GL_lett
(waffler) [starleader]owatts: cp -rs /disk/scratch/oliver/dc_tts/work/nancy_mags ./work/nancy_mags
python script/check_transcript.py -i /disk/scratch/oliver/data/nancy/transcript_combilex2.csv -phone -cmp ./work/nancy_mels
python script/check_transcript.py -i /disk/scratch/oliver/data/nancy/transcript_combilex2.csv -phone -cmp ./work/nancy_mels -o /disk/scratch/oliver/data/nancy/transcript_combilex.csv
....
./util/submit_tf.sh ./synth_sweep_devset.py -c ./config/nancy_phones_01.cfg -t2m ./work/nancy_phones_01/train-1/archive/model_gs_340k -ssrn ./work/nancy_phones_01/train-2/archive/model_gs_110k -mode synthesis -n 5
./util/submit_tf.sh ./synth_sweep_devset.py -c ./config/nancy_phones_01.cfg -t2m ./work/nancy_phones_01/train-1/archive/model_gs_340k -ssrn ./work/nancy_phones_01/train-2/archive/model_gs_110k -mode synthesis -n 5
fine tune on nick starting at nancy T2M : model_gs_050k (early model) and SSRN model_gs_110k (later model)
./util/submit_tf.sh ./train.py -c ./config/nick_phones_01.cfg -m 1
./util/submit_tf.sh ./train.py -c ./config/nick_phones_01.cfg -m 1
./util/submit_tf.sh ./train.py -c ./config/nick_phones_01.cfg -m 2
./util/submit_tf.sh ./synth_sweep_devset.py -c ./config/nick_phones_01.cfg -t2m ./work/nick_phones_01/train-1/archive/model_gs_018k -ssrn ./work/nick_phones_01/train-2/archive/model_gs_007k -mode synthesis -n 5
./util/submit_tf.sh ./train.py -c ./config/nick_phones_02.cfg -m 1
./util/submit_tf.sh ./train.py -c ./config/nick_phones_02.cfg -m 2
./util/submit_tf.sh ./synth_sweep_devset.py -c ./config/nick_phones_02.cfg -t2m ./work/nick_phones_02/train-1/archive/model_gs_001k -ssrn ./work/nick_phones_02/train-2/archive/model_gs_111k -mode synthesis -n 5
./util/submit_tf.sh ./synth_sweep_devset.py -c ./config/nick_phones_02.cfg -t2m ./work/nick_phones_02/train-1/archive/model_gs_030k -ssrn ./work/nick_phones_02/train-2/archive/model_gs_112k -mode synthesis -n 5
./util/submit_tf.sh ./synth_sweep_devset.py -c ./config/nick_phones_02.cfg -t2m ./work/nick_phones_02/train-1/archive/model_gs_050k -ssrn ./work/nick_phones_02/train-2/archive/model_gs_115k -mode synthesis -n 5
./util/submit_tf.sh ./synth_sweep_devset.py -c ./config/nick_phones_02.cfg -t2m ./work/nick_phones_02/train-1/archive/model_gs_040k -ssrn ./work/nick_phones_02/train-2/archive/model_gs_115k -mode synthesis -n 5
./util/submit_tf.sh ./synth_sweep_devset.py -c ./config/nick_phones_02.cfg -t2m ./work/nick_phones_02/train-1/archive/model_gs_150k -ssrn ./work/nick_phones_02/train-2/archive/model_gs_138k -mode synthesis
./util/submit_tf.sh ./synth_sweep_devset.py -c ./config/nick_phones_02.cfg -t2m ./work/nick_phones_02/train-1/archive/model_gs_150k -ssrn ./work/nick_phones_02/train-2/archive/model_gs_138k -mode synthesis
./util/submit_tf_cpu.sh ./copy_synth_GL.py -c ./config/nick_phones_testset_features.cfg -o ./work/nick_resynth_GL_hvd_16bit
cd /afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/nick_hurricaine/
mv transcript.csv transcript.csv.unilex
mv transcript2.csv transcript2.csv.unilex
FEST=/afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/tool/festival/festival/bin/festival
SCRIPT=/afs/inf.ed.ac.uk/user/o/owatts/repos/dc_tts_osw/script/festival/make_rich_phones_combirpx_noplex.scm
$FEST -b $SCRIPT | grep KEEP | sed 's/KEEP//' | tee ./transcript1.csv
cd /disk/scratch/oliver/dc_tts_osw/
python script/check_transcript.py -i /afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/nick_hurricaine/transcript1.csv -phone
python script/festival/fix_transcript.py /afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/nick_hurricaine/transcript1.csv B C K P V imposition wide > /afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/nick_hurricaine/transcript_combilex2.csv
mv test_transcript.csv test_transcript.csv.unilex
mv test_transcript1.csv test_transcript1.csv.unilex
FEST=/afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/tool/festival/festival/bin/festival
SCRIPT=/afs/inf.ed.ac.uk/user/o/owatts/repos/dc_tts_osw/script/festival/make_rich_phones_combirpx_noplex.scm
$FEST -b $SCRIPT | grep KEEP | sed 's/KEEP//' | tee ./transcript1.csv
python script/check_transcript.py -i /afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/nick_hurricaine/test/transcript1.csv -phone
cd /disk/scratch/oliver/dc_tts_osw/
python script/check_transcript.py -i /afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/nick_hurricaine/test/transcript1.csv -phone
python script/festival/fix_transcript.py /afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/nick_hurricaine/test/transcript1.csv cross > /afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/nick_hurricaine/test/transcript_combilex2.csv
python script/check_transcript.py -i /afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/nick_hurricaine/test/transcript_combilex2.csv -phone
wget https://datashare.is.ed.ac.uk/bitstream/handle/10283/347/quiet_mrt.zip?sequence=3&isAllowed=y
wget https://datashare.is.ed.ac.uk/bitstream/handle/10283/347/quiet_harvard.zip?sequence=17&isAllowed=y
unzip quiet_mrt.zip?sequence=3
unzip quiet_harvard.zip?sequence=17
mkdir wav
mv mrt_*wav wav/
mv hvd_*wav wav/
mkdir /afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/nick_hurricaine/test/wav_renamed
# Symlink every test-set wav into test/wav_renamed/ under a shortened name made
# of only the first two underscore-separated fields of its basename.
# The files are enumerated with a glob rather than by parsing `ls` output, and
# every expansion is quoted, so paths containing whitespace or backslashes
# are passed through intact.
for WAV in /afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/nick_hurricaine/test/wav/*wav ; do
  # An unmatched glob stays literal; skip it (but keep dangling symlinks, as ls would list them).
  [ -e "$WAV" ] || [ -L "$WAV" ] || continue
  BASE=$(basename "$WAV" .wav)
  printf '%s\n' "$BASE"
  PART1=$(printf '%s\n' "$BASE" | awk -F_ '{print $1}')
  PART2=$(printf '%s\n' "$BASE" | awk -F_ '{print $2}')
  BASE3="${PART1}_${PART2}"
  printf '%s\n' "$BASE3"
  ln -s "$WAV" "/afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/nick_hurricaine/test/wav_renamed/${BASE3}.wav"
done
mkdir /afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/nick_hurricaine/wav_renamed
# Symlink every training wav into wav_renamed/ under a shortened name: the
# first underscore-separated field of its basename with leading zeros removed.
# The files are enumerated with a glob rather than by parsing `ls` output, and
# every expansion is quoted, so paths containing whitespace or backslashes
# are passed through intact.
for WAV in /afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/nick_hurricaine/wav/*wav ; do
  # An unmatched glob stays literal; skip it (but keep dangling symlinks, as ls would list them).
  [ -e "$WAV" ] || [ -L "$WAV" ] || continue
  BASE=$(basename "$WAV" .wav)
  printf '%s\n' "$BASE"
  BASE2=$(printf '%s\n' "$BASE" | awk -F_ '{print $1}')
  printf '%s\n' "$BASE2"
  # Strip zero padding from the front of the id.
  BASE3=$(printf '%s\n' "$BASE2" | sed 's/^0*//')
  printf '%s\n' "$BASE3"
  ln -s "$WAV" "/afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/nick_hurricaine/wav_renamed/${BASE3}.wav"
done
cp /afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/nick_hurricaine/transcript_combilex2.csv /disk/scratch/oliver/data/nick_hurricaine/transcript.csv
cp /afs/inf.ed.ac.uk/user/o/owatts/sim2/oliver/data/dctts/nick_hurricaine/test/transcript_combilex2.csv /disk/scratch/oliver/data/nick_hurricaine/test_transcript.csv
./util/submit_tf_cpu.sh ./prepo.py -c ./config/nick_phones_01.cfg -ncores 25