#!/bin/bash
#
# transcribe-audio.sh - run one audio file through the
# kaldinnet2onlinedecoder GStreamer element and write the decoder's output
# to stdout.
#
# Usage: transcribe-audio.sh <audio>
# e.g.:  transcribe-audio.sh dr_strangelove.mp3
#
# The plugin directory (../src), the model files (final.mdl, HCLG.fst,
# words.txt) and the conf/ directory are all referenced by relative path, so
# the script has to be started from the directory that contains them.
#
# Exit status: 1 on a usage error, a missing plugin or missing models;
# otherwise the exit status of gst-launch-1.0.
#
# All diagnostics go to stderr so that stdout carries nothing but the
# decoder output.

set -euo pipefail

if [[ $# -ne 1 ]]; then
  echo "Usage: transcribe-audio.sh <audio>" >&2
  echo "e.g.: transcribe-audio.sh dr_strangelove.mp3" >&2
  exit 1
fi

# gst-inspect-1.0 fails when the element cannot be found on the plugin path.
if ! GST_PLUGIN_PATH=../src gst-inspect-1.0 kaldinnet2onlinedecoder \
  > /dev/null 2>&1; then
  echo "Compile the plugin in ../src first" >&2
  exit 1
fi

if [[ ! -f HCLG.fst ]]; then
  echo "Run ./prepare-models.sh first to download models" >&2
  exit 1
fi

audio=$1

# "$audio" is quoted so that a path containing whitespace or glob characters
# reaches gst-launch-1.0 as a single argument instead of being split into
# several pipeline tokens.
# buffer-mode=2 selects unbuffered writes in filesink (per the GStreamer
# filesink documentation).
GST_PLUGIN_PATH=../src gst-launch-1.0 --gst-debug="" -q \
  filesrc location="$audio" ! decodebin ! audioconvert ! audioresample ! \
  kaldinnet2onlinedecoder \
    model=final.mdl \
    fst=HCLG.fst \
    word-syms=words.txt \
    feature-type=mfcc \
    mfcc-config=conf/mfcc.conf \
    ivector-extraction-config=conf/ivector_extractor.fixed.conf \
    max-active=7000 \
    beam=11.0 \
    lattice-beam=5.0 \
    do-endpointing=true \
    endpoint-silence-phones="1:2:3:4:5:6:7:8:9:10" \
  ! filesink location=/dev/stdout buffer-mode=2