bisoye's picture
Upload 7 files
d64d27f verified
raw
history blame contribute delete
819 Bytes
import functools
import os
import tempfile

import whisper
from gtts import gTTS
from pydub import AudioSegment
# Text-to-speech function
def text_to_speech(text):
    """Synthesize *text* to a sped-up MP3 file and return its filename.

    The text is rendered with gTTS (English, ``tld='us'``), loaded into
    pydub, sped up by a factor of 1.20, and exported to
    ``text_to_speech.mp3`` in the current working directory.

    Args:
        text: The text to speak; passed unchanged to ``gTTS``.

    Returns:
        The filename of the exported audio, ``'text_to_speech.mp3'``.
    """
    # Convert text to speech with a US accent using gTTS
    tts = gTTS(text=text, lang='en', tld='us', slow=False)

    # Write the intermediate audio into a private temporary directory rather
    # than a fixed 'temp.mp3' in the working directory: nothing is left
    # behind afterwards, and concurrent calls cannot overwrite each other's
    # intermediate file.
    with tempfile.TemporaryDirectory() as tmp_dir:
        raw_path = os.path.join(tmp_dir, 'temp.mp3')
        tts.save(raw_path)
        # Load the audio file while the temporary file still exists
        audio = AudioSegment.from_file(raw_path)

    # Adjust the speed to approximately 170 wpm (original author's target)
    playback_speed = 1.20
    audio = audio.speedup(playback_speed=playback_speed)

    # Save and return the adjusted audio file
    final_filename = 'text_to_speech.mp3'
    audio.export(final_filename, format='mp3')
    return final_filename
# Speech-to-text function
@functools.lru_cache(maxsize=1)
def _load_whisper_model():
    """Load the Whisper "base.en" model once and reuse it on later calls."""
    return whisper.load_model("base.en")


def audio_to_text(audio):
    """Transcribe *audio* with the Whisper "base.en" model.

    The model is loaded on first use and cached, so repeated calls do not
    reload it for every transcription.

    Args:
        audio: Passed unchanged to ``model.transcribe``; presumably a path
            to an audio file -- confirm against callers.

    Returns:
        The value stored under the ``"text"`` key of the transcription
        result.
    """
    model = _load_whisper_model()
    result = model.transcribe(audio)
    return result["text"]