0bc48c11创建于 2025年7月30日历史提交
wav_dir=$1
wav_files=$(ls $wav_dir/*.wav)
# if wav_files is empty, then exit
if [ -z "$wav_files" ]; then
    exit 1
fi
split_name=$2
model_path=models/sherpa-onnx-paraformer-zh-2023-09-14

if [ ! -d $model_path ]; then
    pip install sherpa-onnx
    wget -nc https://github.com/k2-fsa/sherpa-onnx/releases/download/asr-models/sherpa-onnx-paraformer-zh-2023-09-14.tar.bz2
    mkdir models
    tar xvf sherpa-onnx-paraformer-zh-2023-09-14.tar.bz2 -C models
fi

python3 scripts/offline-decode-files.py  \
    --tokens=$model_path/tokens.txt \
    --paraformer=$model_path/model.int8.onnx \
    --num-threads=2 \
    --decoding-method=greedy_search \
    --debug=false \
    --sample-rate=24000 \
    --log-dir $wav_dir \
    --feature-dim=80 \
    --split-name $split_name \
    --name sherpa_onnx \
    $wav_files

# python3 scripts/paraformer-pytriton-client.py  \
#     --log-dir $wav_dir \
#     --split-name $split_name \
#     $wav_files