InformationQuantizer/run.sh at main · lwang114/InformationQuantizer

149 lines (130 loc) · 5.02 KB
#!/bin/bash/
source ~/anaconda3/etc/profile.d/conda.sh
conda activate zerospeech2021_baseline
stop_stage=4
iq_root=/ws/ifp-53_2/hasegawa/lwang114/spring2022/InformationQuantizer ###-------> Change this 
data_root=${iq_root}/resources
timit_root=${data_root}/TIMIT
cpc_root=${iq_root}/zerospeech2021_baseline
unsup_seg_root=${iq_root}/UnsupSeg
kaldi_root=/ws/ifp-53_1/hasegawa/tools/kaldi
eval_root=/ws/ifp-53_2/hasegawa/lwang114/spring2021/DiscoPhoneInfoBottleneck/beer/recipes/aud ###-------> Change this
model_root=${iq_root}/checkpoints/debug ###-------> Change this
word_dataset=librispeech_word
k=10 ###-------> Change this to between 30-70 for the actual dataset
setting=unsup_seg_${k}clusters
# Convert TIMIT to be ready for unsupervised segmentation
if [ $stage -le -1 ] && [ $stop_stage -ge -1 ]; then
    cd ${unsup_seg_root}
    conda activate unsup_seg
    python scripts/make_timit.py \
        --inpath ${timit_root}/TEST_subset \
        --outpath ${timit_root}/test_subset \
        --sph2wav ${kaldi_root}/tools/sph2pipe_v2.5/sph2pipe 
    conda deactivate
    cd $iq_root
# Extract CPC features for the spoken word dataset extracted from LibriSpeech
if [ $stage -le 0 ] && [ $stop_stage -ge 0 ]; then
  cwd=$(pwd)
  cd ${cpc_root}
  for split in train-clean-100 dev-clean; do
    CUDA_VISIBLE_DEVICES=0 python scripts/build_CPC_features.py \
        ${cpc_root}/checkpoints/CPC-small-kmeans50/cpc_ls100/checkpoint_170.pt \
        ${data_root}/${word_dataset}/${split} \
        ${data_root}/${word_dataset}_cpc_txt
# Extract CPC features for TIMIT
if [ $stage -le 1 ] && [ $stop_stage -ge 1 ]; then
  cwd=$(pwd)
  cd ${cpc_root}
  for split in test_subset; do
    CUDA_VISIBLE_DEVICES=0 python scripts/build_CPC_features.py \
        ${cpc_root}/checkpoints/CPC-small-kmeans50/cpc_ls100/checkpoint_170.pt \
        ${timit_root}/${split} \
        ${timit_root}/${split}_cpc_txt
# VAD on the spoken word dataset
#if [ $stage -le 2 ] && [ $stop_stage -ge 2 ]; then
#  for split in train-clean-100 dev-clean; do
#    python vad.py --out_extension .wav \
#                  --audio_path resources/librispeech_word/${split}  
# Extract predicted segmentation for the spoken word dataset
if [ $stage -le 2 ] && [ $stop_stage -ge 2 ]; then
  # Extract unsupervised phone-level segmentations
  cd ${unsup_seg_root}
  conda activate unsup_seg
  for seg_conf in conf/librispeech_word_boundary_detection.json; do 
    CUDA_VISIBLE_DEVICES=$gpu_num python predict_whole_dataset.py --config $seg_conf
  conda deactivate
  # Include predicted boundaries as part of the meta data
  cd $iq_root
  for seg_conf in ${unsup_seg_root}/conf/librispeech_word_boundary_detection.json; do
    python utils/extract_pred_boundaries.py --conf $seg_conf 
# Extract predicted segmentation for the TIMIT dataset
if [ $stage -le 3 ] && [ $stop_stage -ge 3 ]; then
  # Extract unsupervised phone-level segmentations
  cd ${unsup_seg_root}
  conda activate unsup_seg
  for seg_conf in conf/timit_boundary_detection.json; do
    CUDA_VISIBLE_DEVICES=$gpu_num python predict_whole_dataset.py --config $seg_conf
  conda deactivate
  # Include predicted boundaries as part of the meta data
  cd $iq_root
  for seg_conf in ${unsup_seg_root}/conf/timit_boundary_detection.json; do
    python utils/extract_pred_boundaries.py --conf $seg_conf 
  mv resources/TIMIT/test_subset/test_subset_with_predicted_segments.json resources/TIMIT/test_subset/test_subset.json 
if [ $stage -le 4 ] && [ $stop_stage -ge 4 ]; then
  config_file=$iq_root/configs/librispeech_word.conf
  CUDA_VISIBLE_DEVICES=$gpu_num python solver.py $config_file --setting ${setting}
# Evaluate in-domain phoneme discovery performance of IQ with gold segmentation
if [ $stage -le 5 ] && [ $stop_stage -ge 5 ]; then
  ref_ali=$data_root/${word_dataset}/test.ali
  in_dirs=""
  for seed in 1234; do      
      hyp_ali=$model_root/pred_test_$seed.ali
      python utils/convert_item_to_beer_format.py \
        --item_file $data_root/${word_dataset}/dev-clean/dev-clean_nonoverlap.item \
        --gold_beer_file $ref_ali \
        --pred_file $model_root/outputs_quantized_$seed.txt
      python utils/convert_output_to_beer_format.py \
        --output_file $model_root/outputs_quantized_$seed.txt \
        --beer_file $hyp_ali 
  for seed in 1234; do
      score_root=$model_root/score_aud_$seed
      if [ -d $score_root ]; then
        rm -r $score_root
      hyp_ali=$model_root/pred_test_$seed.ali
      cwd=$(pwd)
      cd $eval_root
      conda activate beer
      bash $eval_root/steps/score_aud.sh $ref_ali $hyp_ali $model_root/score_aud_$seed
      conda deactivate
      cd $cwd
      # Token F1 score
      python ${iq_root}/utils/evaluate.py 1 $ref_ali $hyp_ali $score_root
      in_dirs="${score_root},${in_dirs}"
  in_dirs=${in_dirs%%,}
  # Compute average and standard deviation
  python ${iq_root}/utils/average_performance.py --in_dirs ${in_dirs} --out_path $model_root/average_performance
Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

run.sh

Latest commit

History

run.sh

File metadata and controls