amupd's picture
SpeechT5 upload
62e9ca6
raw
history blame
1.15 kB
#####################################
# Fast Text2Unit Model #
#####################################
# Runs speechlm/generate_unit.py (task: fast_text_to_unit) on one subset,
# split across ${nj} background worker processes. Worker <rank> writes to
#   <outdir>/pseudo_<gen_set>/<rank>
# and the checkpoint path used is recorded there in model.record.
#
# Usage: <script> <model_path> <gen_set> [outdir={gen_set%/*}]
#   model_path  checkpoint passed to --path
#   gen_set     <data_dir>/<subset>; the directory part becomes the data dir,
#               the last path component becomes --gen-subset
#   outdir      root for results (defaults to the directory part of gen_set)
#
# Must be run from a directory whose basename is "SpeechLM".
# Exit status: 0 on success (and on the usage message), 1 if the directory
# check fails, an output directory cannot be prepared, or any worker fails.

if [ "$#" -lt 2 ]; then
  echo "Usage: $0 <model_path> <gen_set> [outdir={gen_set%/*}]"
  # Exit status 0 is kept as-is so existing callers see no change.
  exit 0
fi

# Quoted so that an empty basename (cwd is /) or a name containing spaces is
# compared as a string instead of breaking the test expression.
if [ "${PWD##*/}" != "SpeechLM" ]; then
  echo "Error: dir not match! Switch to SpeechLM/ and run it again!" >&2
  exit 1
fi

model_path=$1
DATA_DIR=${2%/*}   # directory part of <gen_set>
gen_set=${2##*/}   # subset name (last path component)
outdir=${3:-$DATA_DIR}

CODE_ROOT=${PWD}
nj=4

# Prepare every output directory before launching anything, so a failure here
# aborts the run without leaving background workers behind.
for rank in $(seq 0 $((nj - 1))); do
  results_path=$outdir/pseudo_${gen_set}/${rank}
  mkdir -p "$results_path" || exit 1
  echo "$model_path" > "$results_path/model.record" || exit 1
done

# Launch one worker per rank and remember its PID.
pids=""
for rank in $(seq 0 $((nj - 1))); do
  results_path=$outdir/pseudo_${gen_set}/${rank}
  python "$CODE_ROOT/speechlm/generate_unit.py" "$DATA_DIR" \
    --user-dir "$CODE_ROOT/speechlm" \
    --config-yaml config_generate.yaml \
    --path "$model_path" \
    --task fast_text_to_unit \
    --gen-subset "$gen_set" \
    --beam 1 \
    --max-tokens 10000 \
    --results-path "$results_path" \
    --scoring sacrebleu \
    --skip-invalid-size-inputs-valid-test \
    --distributed-world-size "$nj" --distributed-rank "$rank" &
  pids="$pids $!"
done

# A bare `wait` always returns 0; wait on each PID so a failed worker is
# reflected in the script's exit status.
status=0
for pid in $pids; do
  wait "$pid" || status=1
done
exit "$status"