mirror of
https://github.com/ggerganov/whisper.cpp.git
synced 2025-01-24 23:09:05 +01:00
71 lines
2.1 KiB
Bash
Executable File
71 lines
2.1 KiB
Bash
Executable File
# Benchmark word-level timestamps for different models
|
|
#
|
|
# This script takes two arguments
|
|
# - an audio file
|
|
# - [optional] path to a font file
|
|
|
|
# I'm using "/usr/share/fonts/truetype/freefont/FreeMono.ttf" on Ubuntu
|
|
|
|
if [ -z "$1" ]; then
|
|
echo "Usage: $0 <audio file> [font file]"
|
|
exit 1
|
|
fi
|
|
|
|
#TODO: Make this a command line parameter
|
|
#models="base small large"
|
|
#models="tiny.en tiny base.en base small.en small medium.en medium large-v1 large"
|
|
models="tiny.en base.en small.en medium.en large"
|
|
|
|
DURATION=$(ffprobe -i $1 -show_entries format=duration -v quiet -of csv="p=0")
|
|
DURATION=$(printf "%.2f" $DURATION)
|
|
echo "Input file duration: ${DURATION}s"
|
|
|
|
for model in $models; do
|
|
echo "Running $model"
|
|
COMMAND="./main -m models/ggml-$model.bin -owts -f $1 -of $1.$model"
|
|
|
|
if [ ! -z "$2" ]; then
|
|
COMMAND="$COMMAND -fp $2"
|
|
fi
|
|
#TODO: Surface errors better
|
|
# TIMEFMT is for zsh, TIMEFORMAT is for bash
|
|
EXECTIME=$({ TIMEFMT="%E";TIMEFORMAT=%E; time $COMMAND >/dev/null 2>&1; } 2>&1)
|
|
|
|
# Slightly different formats between zsh and bash
|
|
if [ "${EXECTIME: -1}" == "s" ]; then
|
|
EXECTIME=${EXECTIME::-1}
|
|
fi
|
|
|
|
RATIO=$(echo "$DURATION / $EXECTIME" | bc -l)
|
|
RATIO=$(printf "%.2f" $RATIO)
|
|
|
|
echo "Execution time: ${EXECTIME}s (${RATIO}x realtime)"
|
|
|
|
# If the file already exists, delete it
|
|
if [ -f $1.mp4 ]; then
|
|
rm $1.mp4
|
|
fi
|
|
|
|
bash $1.$model.wts >/dev/null 2>&1
|
|
mv $1.mp4 $1.$model.mp4
|
|
|
|
ffmpeg -y -f lavfi -i color=c=black:s=1200x50:d=$DURATION -vf "drawtext=fontfile=$2:fontsize=36:x=10:y=(h-text_h)/2:text='ggml-$model - ${EXECTIME}s (${RATIO}x realtime)':fontcolor=lightgrey" $1.$model.info.mp4 >/dev/null 2>&1
|
|
done
|
|
|
|
COMMAND="ffmpeg -y"
|
|
for model in $models; do
|
|
COMMAND="$COMMAND -i $1.$model.info.mp4 -i $1.$model.mp4"
|
|
done
|
|
COMMAND="$COMMAND -filter_complex \""
|
|
COUNT=0
|
|
for model in $models; do
|
|
COMMAND="$COMMAND[${COUNT}:v][$(($COUNT+1)):v]"
|
|
COUNT=$((COUNT+2))
|
|
done
|
|
COMMAND="$COMMAND vstack=inputs=${COUNT}[v]\" -map \"[v]\" -map 1:a $1.all.mp4 >/dev/null 2>&1"
|
|
|
|
echo $COMMAND
|
|
|
|
# Run the command
|
|
eval $COMMAND
|