File size: 2,113 Bytes
613af8d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
# Benchmark word-level timestamps for different models
#
# This script takes two arguments
# - an audio file
# - [optional] path to a font file

# I'm using "/usr/share/fonts/truetype/freefont/FreeMono.ttf" on Ubuntu

if [ -z "$1" ]; then
    echo "Usage: $0 <audio file> [font file]"
    exit 1
fi

#TODO: Make this a command line parameter
#models="base small large"
#models="tiny.en tiny base.en base small.en small medium.en medium large-v1 large"
models="tiny.en base.en small.en medium.en large"

DURATION=$(ffprobe -i $1 -show_entries format=duration -v quiet -of csv="p=0")
DURATION=$(printf "%.2f" $DURATION)
echo "Input file duration: ${DURATION}s"

for model in $models; do
    echo "Running $model"
    COMMAND="./main -m models/ggml-$model.bin -owts -f $1 -of $1.$model"

    if [ ! -z "$2" ]; then
        COMMAND="$COMMAND -fp $2"
    fi
    #TODO: Surface errors better
    # TIMEFMT is for zsh, TIMEFORMAT is for bash
    EXECTIME=$({ TIMEFMT="%E";TIMEFORMAT=%E; time $COMMAND >/dev/null 2>&1; } 2>&1)

    # Slightly different formats between zsh and bash
    if [ "${EXECTIME: -1}" == "s" ]; then
        EXECTIME=${EXECTIME::-1}
    fi

    RATIO=$(echo "$DURATION / $EXECTIME" | bc -l)
    RATIO=$(printf "%.2f" $RATIO)

    echo "Execution time: ${EXECTIME}s (${RATIO}x realtime)"

    # If the file already exists, delete it
    if [ -f $1.mp4 ]; then
        rm $1.mp4
    fi

    bash $1.$model.wts >/dev/null 2>&1
    mv $1.mp4 $1.$model.mp4

    ffmpeg -y -f lavfi -i color=c=black:s=1200x50:d=$DURATION -vf "drawtext=fontfile=$2:fontsize=36:x=10:y=(h-text_h)/2:text='ggml-$model - ${EXECTIME}s (${RATIO}x realtime)':fontcolor=lightgrey" $1.$model.info.mp4 >/dev/null 2>&1
done

COMMAND="ffmpeg -y"
for model in $models; do
    COMMAND="$COMMAND -i $1.$model.info.mp4 -i $1.$model.mp4"
done
COMMAND="$COMMAND -filter_complex \""
COUNT=0
for model in $models; do
    COMMAND="$COMMAND[${COUNT}:v][$(($COUNT+1)):v]"
    COUNT=$((COUNT+2))
done
COMMAND="$COMMAND vstack=inputs=${COUNT}[v]\" -map \"[v]\" -map 1:a $1.all.mp4 >/dev/null 2>&1"

echo $COMMAND

# Run the command
eval $COMMAND