diff --git a/speak-mp3.sh b/speak-mp3.sh
new file mode 100755
index 0000000..851adf2
--- /dev/null
+++ b/speak-mp3.sh
@@ -0,0 +1,11 @@
+#!/bin/bash
+#
+# Convert ffmpeg_output.wav (the tempo-adjusted file written by speak.sh)
+# to MP3 and play the result.
+
+FILE="ffmpeg_output.wav"
+MP3="ffmpeg_output.mp3"
+
+# Play only when the conversion succeeded, so a stale MP3 is never played.
+ffmpeg -i "$FILE" -acodec mp3 "$MP3" -y && \
+ffplay "$MP3" -nodisp -autoexit
diff --git a/speak.sh b/speak.sh
new file mode 100755
index 0000000..6474174
--- /dev/null
+++ b/speak.sh
@@ -0,0 +1,25 @@
+#!/bin/bash
+#
+# Synthesize speech from text with tts, adjust its tempo with ffmpeg, and
+# play the result.
+#
+# Usage: speak.sh "text" [tempo] [model]
+#   text   text to speak (required)
+#   tempo  value for ffmpeg's atempo filter (default: 1.0)
+#   model  tts model name (default: tts_models/en/jenny/jenny)
+
+if [ -z "$1" ]; then
+  # Quoted so that [tempo] and [model] are not expanded as glob patterns.
+  echo "usage: $0 \"text\" [tempo] [model]" >&2
+  exit 1
+fi
+
+STR=$1
+# An empty or missing argument falls back to its default.
+TEMPO=${2:-1.0}
+MODEL=${3:-tts_models/en/jenny/jenny}
+
+# Each step runs only if the previous one succeeded.
+tts --text "$STR" --model_name "$MODEL" --out_path tts_output.wav && \
+ffmpeg -i tts_output.wav -filter:a "atempo=$TEMPO" -vn ffmpeg_output.wav -y && \
+ffplay ffmpeg_output.wav -nodisp -autoexit