Add gong to the output sound
This commit is contained in:
parent
a07f85f653
commit
0e5bf750ac
1 changed file with 23 additions and 16 deletions
39
ansage.py
39
ansage.py
|
|
@@ -5,29 +5,36 @@ from TTS.api import TTS
|
||||||
device = "cuda" if torch.cuda.is_available() else "cpu"
|
device = "cuda" if torch.cuda.is_available() else "cpu"
|
||||||
|
|
||||||
# List available 🐸TTS models
|
# List available 🐸TTS models
|
||||||
print(TTS().list_models())
|
#print(TTS().list_models())
|
||||||
|
|
||||||
# Initialize TTS
|
# Initialize TTS
|
||||||
tts = TTS("tts_models/multilingual/multi-dataset/xtts_v2").to(device)
|
tts = TTS("tts_models/multilingual/multi-dataset/xtts_v2").to(device)
|
||||||
|
|
||||||
# List speakers
|
# List speakers
|
||||||
print(tts.speakers)
|
|
||||||
|
|
||||||
# Run TTS
|
# Configure output path
|
||||||
# ❗ XTTS supports both, but many models allow only one of the `speaker` and
|
output_path = "output.wav"
|
||||||
# `speaker_wav` arguments
|
|
||||||
|
|
||||||
# TTS with list of amplitude values as output, clone the voice from `speaker_wav`
|
|
||||||
#wav = tts.tts(
|
|
||||||
# text="Hello world!",
|
|
||||||
# speaker_wav="my/cloning/audio.wav",
|
|
||||||
# language="en"
|
|
||||||
#)
|
|
||||||
|
|
||||||
# TTS to a file, use a preset speaker
|
# TTS to a file, use a preset speaker
|
||||||
tts.tts_to_file(
|
tts.tts_to_file(
|
||||||
text="Hallo Oliver, herzlichen Glückwunsch zur erfolgreichen Entlastung",
|
text="Verehrte Fahrgäste, das heutige Besäufnis wird Ihnen gesponsert von, Rheinmetall",
|
||||||
speaker_wav="./0248.wav",
|
speaker_wav=["./0248.wav"],
|
||||||
language="en",
|
language="de",
|
||||||
file_path="output2.wav"
|
file_path=output_path
|
||||||
)
|
)
|
||||||
|
|
||||||
|
# Process Audio (geklaut von meinem guten Freund flon)
|
||||||
|
|
||||||
|
from pydub import AudioSegment
|
||||||
|
from pydub.utils import make_chunks
|
||||||
|
|
||||||
|
audio = AudioSegment.from_wav(output_path)
|
||||||
|
audio = audio.set_channels(1)
|
||||||
|
audio = audio.set_sample_width(2)
|
||||||
|
audio = audio.set_frame_rate(16000)
|
||||||
|
|
||||||
|
silence = AudioSegment.silent(duration=1000)
|
||||||
|
gong = AudioSegment.from_wav("./513_1.wav")
|
||||||
|
|
||||||
|
audio = silence + gong + audio
|
||||||
|
audio.export(output_path, format="wav")
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue