Praxis_Bot/tts.py
dtookey 68674de54e removed pyglet because playsound appears to work just fine
added documentation to several functions in tty.py
2020-09-20 13:52:29 -04:00

115 lines
3.7 KiB
Python

import datetime
import hashlib
import os
import requests
from gtts import gTTS
from playsound import playsound
import config
streamLabsUrl = "https://streamlabs.com/polly/speak"
def tts(inputText: str, *args):
outpath = create_speech_file(inputText)
playsound(outpath)
def create_speech_gtts(input_text: str):
"""
Will create a sound file for the provided text by using gTTS
:param input_text: any reasonable english text
:return: returns the path of the file for the sound
"""
path = os.path.join(get_tts_dir(), create_file_name(input_text, "mp3"))
if not os.path.exists(path):
sound_digest = gTTS(text=input_text, lang='en')
sound_digest.save(path)
return path
def create_speech_streamlabs(text: str):
"""
Will create a sound file for the provided text by querying and downloading a file from streamlabs
:param text: any reasonable english text
:return: returns the path of the file for the sound
"""
path = os.path.join(get_tts_dir(), create_file_name(text, "ogg"))
if not os.path.exists(path):
body = {"voice": config.streamlabsVoice.value, "text": text}
resp = requests.post(streamLabsUrl, data=body).json()
sound_file_url = resp["speak_url"]
if sound_file_url is not None:
sound_bytes = requests.get(sound_file_url, stream=True)
f = open(path, "+wb")
f.write(sound_bytes.content)
f.close()
return path
speechCreationFunctions = { # this is a mapping of the Speaker enum to function pointers
config.Speaker.STREAMLABS_API: create_speech_streamlabs,
config.Speaker.GOOGLE_TEXT_TO_SPEECH: create_speech_gtts
}
def create_speech_file(text: str):
"""
Helper function that will create a sound file for the provided text. This will use the configuration in config.py
to use TTS engines and name the file
:param text: the text you would like to turn into a sound file
:return: returns the path of the sound file
"""
text_creation_function = speechCreationFunctions.get(config.currentSpeaker)
output_path = text_creation_function(text)
return output_path
def create_file_name(text: str, ext: str):
"""
:param text: the content of the message. using the CONTENT_BASED FileNameStrategy, this will (ostensibly) produce a
unique file name based on the content of the message. Two messages of equal content will produce the same name
:param ext: the desired file extension i.e. mp3, ogg, wav, etc...
:return: returns the formatted filename i.e. 01-01-20_01-01-01_tts.mp3
"""
if config.fileNameStrategy == config.FileNameStrategy.CONTENT_BASED:
unique_id = hashlib.md5(bytes(text, 'utf-8')).hexdigest()
return "%s_tts.%s" % (unique_id, ext)
elif config.fileNameStrategy == config.FileNameStrategy.TIME_BASED:
time = datetime.datetime.now()
return "%s_tts.%s" % (time.strftime("%m-%d-%Y_%H-%M-%S"), ext)
else:
return "unconfigured_tts.%s" % ext
def play_speech(fileName):
destPath = get_tts_dir()
playsound(destPath + fileName)
def get_tts_dir():
"""
Checks for the tts directory, and will create it if it does not exist
:return: the relative file path of the tts dir
"""
dir = os.path.join(os.getcwd(), "tts") # this is platform-agnostic
if not os.path.exists(dir):
os.mkdir(dir)
return dir
if __name__ == "__main__":
print("Enter Text: ")
textInput = str(input())
print("Custom FileName? y/n: ")
bool_string = str(input())
if bool_string == "y":
print("Enter FileName: ")
fileName = str(input())
tts(textInput, fileName)
else:
tts(textInput)