# train_subset_lgbeam.sh -- last committed by Nikhilesh Bhatnagar
#!/usr/bin/env bash
#
# Trains a chain of acoustic models, one per stage (monophone -> tri1 ->
# tri2b -> tri3b), and decodes the validation set with each of them.
#
# Usage: <this-script> [options] <data-dir> <lang-dir> <lang-test-dir>
#   <data-dir>       parent directory of the $train and $valid data dirs
#   <lang-dir>       lang directory passed to the training/alignment steps
#   <lang-test-dir>  lang directory passed to utils/mkgraph.sh
#
# NOTE(review): parse_options.sh is not part of this file; it is presumably the
# Kaldi helper that lets "--name value" flags override the defaults below.

# Everything this script produces is written under $out_root/$out_name.
out_root=/tmp
out_name=train_${RANDOM}
# Forwarded as --num_nonsil_states to the steps_gan/ training scripts.
num_nonsil_states=1

# Names of the validation and training data directories inside <data-dir>.
valid="dev_other"
train="train"
# Number of utterances each model is trained on; -1 means "do not subset,
# use all of $train".
mono_size="-1"  # 2000
tri1_size="-1"  # 5000
tri2b_size="-1"  # 10000
tri3b_size="-1"  # 10000

# Acoustic model parameters
numLeavesTri1=2000
numGaussTri1=10000
numLeavesMLLT=2500
numGaussMLLT=15000
numLeavesSAT=2500
numGaussSAT=15000

# Only stages s with stage <= s <= max_stage are executed; with these
# defaults that is stage 1 alone.
stage=1
max_stage=1

. ./cmd.sh
. ./path.sh
. parse_options.sh

# Fail early with a usage message instead of handing empty paths such as
# "/train" to the training tools when a positional argument is missing.
if [ $# -lt 3 ]; then
  echo "Usage: $0 [options] <data-dir> <lang-dir> <lang-test-dir>" >&2
  exit 1
fi

data=$1
lang=$2
lang_test=$3

exp_root=$out_root/$out_name

# you might not want to do this for interactive shells.
set -e


# Stage 1: monophone system.
if [ 1 -ge $stage ] && [ 1 -le $max_stage ]; then
  # Default to the full training set; switch to a freshly created subset
  # only when mono_size is something other than -1.
  mono_train=${train}
  if [ $mono_size -ne -1 ]; then
    utils/subset_data_dir.sh \
      ${data}/${train} ${mono_size} ${data}/${train}_${mono_size}
    mono_train=${train}_${mono_size}
  fi

  mono_dir=${exp_root}/mono

  steps/train_mono.sh \
    --boost-silence 1.25 \
    --nj 20 \
    --cmd "$train_cmd" \
    --initial-beam 40 \
    --regular-beam 60 \
    --retry-beam 120 \
    ${data}/${mono_train} ${lang} ${mono_dir}

  # Build the decoding graph, then launch the validation decode as a
  # background job (trailing &) so the script keeps going meanwhile.
  utils/mkgraph.sh ${lang_test} ${mono_dir} ${mono_dir}/graph
  steps/decode.sh --nj 20 --cmd "$decode_cmd" \
    ${mono_dir}/graph ${data}/${valid} ${mono_dir}/decode_${valid} &
fi


# Stage 2: first triphone system (delta + delta-delta features).
if [ 2 -ge $stage ] && [ 2 -le $max_stage ]; then
  # Default to the full training set; switch to a freshly created subset
  # only when tri1_size is something other than -1.
  tri1_train=${train}
  if [ $tri1_size -ne -1 ]; then
    utils/subset_data_dir.sh \
      ${data}/${train} ${tri1_size} ${data}/${train}_${tri1_size}
    tri1_train=${train}_${tri1_size}
  fi

  mono_dir=${exp_root}/mono
  mono_ali_dir=${exp_root}/mono_ali_${tri1_train}
  tri1_dir=${exp_root}/tri1

  # Align the chosen training data with the monophone model ...
  steps/align_si.sh \
    --boost-silence 1.25 \
    --nj 10 \
    --cmd "$train_cmd" \
    ${data}/${tri1_train} ${lang} ${mono_dir} ${mono_ali_dir}

  # ... and train tri1 from those alignments.
  steps_gan/train_deltas.sh \
    --boost-silence 1.25 \
    --cmd "$train_cmd" \
    --num_nonsil_states ${num_nonsil_states} \
    ${numLeavesTri1} ${numGaussTri1} \
    ${data}/${tri1_train} ${lang} ${mono_ali_dir} ${tri1_dir}

  # Build the decoding graph, then launch the validation decode as a
  # background job (trailing &) so the script keeps going meanwhile.
  utils/mkgraph.sh ${lang_test} ${tri1_dir} ${tri1_dir}/graph
  steps/decode.sh --nj 20 --cmd "$decode_cmd" \
    ${tri1_dir}/graph ${data}/${valid} ${tri1_dir}/decode_${valid} &
fi

# Stage 3: LDA+MLLT system (tri2b).
if [ 3 -ge $stage ] && [ 3 -le $max_stage ]; then
  # Default to the full training set; switch to a freshly created subset
  # only when tri2b_size is something other than -1.
  tri2b_train=${train}
  if [ $tri2b_size -ne -1 ]; then
    utils/subset_data_dir.sh \
      ${data}/${train} ${tri2b_size} ${data}/${train}_${tri2b_size}
    tri2b_train=${train}_${tri2b_size}
  fi

  tri1_dir=${exp_root}/tri1
  tri1_ali_dir=${exp_root}/tri1_ali_${tri2b_train}
  tri2b_dir=${exp_root}/tri2b

  # Align the chosen training data with tri1 ...
  steps/align_si.sh \
    --nj 10 \
    --cmd "$train_cmd" \
    ${data}/${tri2b_train} ${lang} ${tri1_dir} ${tri1_ali_dir}

  # ... and train tri2b from those alignments.
  steps_gan/train_lda_mllt.sh \
    --cmd "$train_cmd" \
    --num_nonsil_states ${num_nonsil_states} \
    --splice-opts "--left-context=3 --right-context=3" \
    ${numLeavesMLLT} ${numGaussMLLT} \
    ${data}/${tri2b_train} ${lang} ${tri1_ali_dir} ${tri2b_dir}

  # Build the decoding graph, then launch the validation decode as a
  # background job (trailing &) so the script keeps going meanwhile.
  utils/mkgraph.sh ${lang_test} ${tri2b_dir} ${tri2b_dir}/graph
  steps/decode.sh --nj 20 --cmd "$decode_cmd" \
    ${tri2b_dir}/graph ${data}/${valid} ${tri2b_dir}/decode_${valid} &
fi


# Stage 4: tri3b, an LDA+MLLT+SAT system trained from tri2b alignments.
if [ "$stage" -le 4 ] && [ "$max_stage" -ge 4 ]; then
  # Train on all of $train unless tri3b_size requests a subset (-1 = all).
  if [ "$tri3b_size" -ne -1 ]; then
    utils/subset_data_dir.sh \
      "$data/$train" "$tri3b_size" "$data/${train}_${tri3b_size}"
    tri3b_train=${train}_${tri3b_size}
  else
    tri3b_train=${train}
  fi

  # The alignment directory is named after the data that is aligned
  # (tri3b_train), the same way the earlier stages name theirs.  It used to
  # be built from tri2b_train, which is only set when stage 3 has run in this
  # invocation, so starting at stage 4 produced a directory called
  # "tri2b_ali_".
  tri2b_ali_dir=$exp_root/tri2b_ali_${tri3b_train}

  # NOTE(review): --use-graphs true presumably reuses the training graphs
  # stored in tri2b, which would require tri3b_train to be the same data
  # tri2b was trained on -- confirm before making tri3b_size differ from
  # tri2b_size.
  steps/align_si.sh --nj 10 --cmd "$train_cmd" --use-graphs true \
    "$data/$tri3b_train" "$lang" \
    "$exp_root/tri2b" "$tri2b_ali_dir"

  steps_gan/train_sat.sh --cmd "$train_cmd" \
    --num_nonsil_states "$num_nonsil_states" "$numLeavesSAT" "$numGaussSAT" \
    "$data/$tri3b_train" "$lang" \
    "$tri2b_ali_dir" "$exp_root/tri3b"

  # Build the decoding graph, then launch the validation decode as a
  # background job (trailing &).
  utils/mkgraph.sh "$lang_test" "$exp_root/tri3b" "$exp_root/tri3b/graph"
  steps/decode_fmllr.sh --nj 20 --cmd "$decode_cmd" \
    "$exp_root/tri3b/graph" "$data/$valid" "$exp_root/tri3b/decode_$valid" &
fi

# Block until every background decode job launched by the stages above (if
# any ran) has finished.  Called without arguments, `wait` returns zero
# regardless of how those jobs exited, so a failed decode does not change
# this script's exit status.
wait