30 lines
1.1 KiB
Python
30 lines
1.1 KiB
Python
# Theoretical Upgrade Test
|
|
from piper.voice import PiperVoice # Backbone of text to speech
|
|
import pyaudio
|
|
# import os
|
|
# print(os.popen('xsel').read()) # In Theory grab selected text and print ot to terminal
|
|
|
|
texttospeak = "Welcome to the world of speech synthesis! This is an example of text-to-speech using Piper TTS." #os.popen('xsel').read() # In Theory grab selected text into Varible cakked TextToSpeak
|
|
|
|
voice = PiperVoice.load("~/en_US-amy-medium.onnx") # Load the model
|
|
|
|
chunks = voice.synthesize(texttospeak) # Set up Piper to stream audio from TextToSpeak
|
|
first_chunk = next(chunks) # Get the first chunk to set up audio stream configuration
|
|
|
|
p = pyaudio.PyAudio()
|
|
stream = p.open( # Open audio stream with correct settings
|
|
format=p.get_format_from_width(first_chunk.sample_width),
|
|
channels=first_chunk.sample_channels,
|
|
rate=first_chunk.sample_rate,
|
|
output=True,
|
|
)
|
|
|
|
stream.write(first_chunk.audio_int16_bytes) # Play the first chunk
|
|
|
|
for chunk in chunks: # Play subsequent chunks of audio
|
|
stream.write(chunk.audio_int16_bytes)
|
|
|
|
# Cleanup
|
|
stream.stop_stream()
|
|
stream.close()
|
|
p.terminate() |