#!/usr/bin/env bash
#####################################
# Hubert ED model #
#####################################
#
# Runs fairseq's generate_mt_label.py (task "translation_from_jst") on one
# data subset and stores everything it produces under
#   <outdir>/pseudo_<subset>_<rank>/
# together with:
#   decode.log    - copy of the generation command's stdout (via tee)
#   model.record  - the model path that was used for this run
#
# Usage:
#   <script> <model_path> [gen_set] [tgt] [max_tokens] [word_size] [rank] [outdir]
#
# Arguments:
#   $1 model_path  value passed to --path (required)
#   $2 gen_set     "<data_dir>/<subset>"; the part after the last '/' is the
#                  subset name, the part before it is the data directory
#                  (default: dev_clean)
#   $3 tgt         value passed to -t (default: kmu)
#   $4 max_tokens  value passed to --max-tokens (default: 2000)
#   $5 word_size   value passed to --distributed-world-size (default: 1)
#   $6 rank        value passed to --distributed-rank; also used as the
#                  suffix of the results directory (default: 0)
#   $7 outdir      parent of the results directory (default: the data dir)
#
# Exit status: 0 when called without arguments (usage only), 1 if the
# results directory cannot be created, otherwise the status of the final
# sleep. The status of the python command is NOT propagated.

FAIRSEQ_ROOT=/mnt/output/users/v-kunwei/code/fairseq_mlst

# Prints the command-line synopsis to stdout.
usage() {
  echo "Usage: $0 <model_path> [gen_set] [tgt] [max_tokens] [word_size] [rank] [outdir]"
}

# Entry point: parses positional arguments, applies defaults and launches
# the generation command.
main() {
  if [ $# -lt 1 ]; then
    usage
    # Status 0 is kept on purpose: existing callers see the same exit code.
    return 0
  fi

  #source /mnt/default/v-ziqzhang/.bashrc_sing

  local model_path=$1
  local gen_set=${2:-dev_clean}
  local tgt=${3:-kmu}
  local src="ltr"
  local max_tokens=${4:-2000}
  local word_size=${5:-1}
  local rank=${6:-0}
  local outdir=${7:-}

  # Split "<data_dir>/<subset>" into its two halves.
  # NOTE(review): when gen_set contains no '/', "${gen_set%/*}" leaves the
  # string untouched, so the data dir equals the subset name (e.g. the
  # default yields data dir "dev_clean"). Kept as-is; confirm this is intended.
  local data_dir=${gen_set%/*}
  gen_set=${gen_set##*/}

  # The "test" subset always reads from a fixed data directory.
  if [ "$gen_set" = "test" ]; then
    data_dir=/mnt/output/users/v-kunwei/data/s2s_data/en_asr_data
  fi

  if [ -z "$outdir" ]; then
    outdir=$data_dir
  fi

  local results_path=$outdir/pseudo_${gen_set}_${rank}
  if ! mkdir -p "$results_path"; then
    echo "cannot create results directory: $results_path" >&2
    return 1
  fi

  # Everything printed inside the group is mirrored into decode.log.
  {
    python "$FAIRSEQ_ROOT/fairseq_cli/generate_mt_label.py" "$data_dir" \
      --path "$model_path" \
      --task "translation_from_jst" \
      --max-target-positions 3000 \
      --gen-subset "$gen_set" \
      -t "$tgt" -s "$src" \
      --max-tokens "$max_tokens" \
      --dataset-impl "raw" \
      --max-len-a 2 --max-len-b 100 \
      --results-path "$results_path" \
      --skip-invalid-size-inputs-valid-test \
      --distributed-world-size "$word_size" --distributed-rank "$rank"

    # Record which model produced these results. The original wrote the
    # never-assigned "$model" here, which left the file blank.
    echo "$model_path" > "$results_path/model.record"
    sleep 1s
  } | tee "$results_path/decode.log"

  sleep 2s
}

main "$@"