mars5_space

Paused

App Files Files Community

arnavmehta7 committed on Jun 17, 2024

Commit

9f8a599

verified ·

1 Parent(s): 779952a

Update app.py

Browse files

Files changed (1) hide show

app.py +5 -14

app.py CHANGED Viewed

@@ -5,7 +5,6 @@ import librosa
 from pathlib import Path
 import tempfile, torchaudio
 from transformers import pipeline
-from uuid import uuid4
 # Load the MARS5 model
 mars5, config_class = torch.hub.load('Camb-ai/mars5-tts', 'mars5_english', trust_repo=True)
@@ -24,16 +23,6 @@ def transcribe_file(f: str) -> str:
 # Function to process the text and audio input and generate the synthesized output
 def synthesize(text, audio_file, transcript, kwargs_dict):
     print(f">>>>>>> Kwargs dict: {kwargs_dict}")
-    # audio_file = Path(audio_file)
-    # temp_file = f"{uuid4()}.{audio_file.suffix}"
-    # # copying the audio_file
-    # with open(audio_file, 'rb') as src, open(temp_file, 'wb') as dst:
-    #     dst.write(src.read())
-    # audio_file = temp_file
-    print(f">>>>> synthesizing! audio_file: {audio_file}")
     if not transcript:
         transcript = transcribe_file(audio_file)
@@ -67,7 +56,9 @@ defaults = {
 with gr.Blocks() as demo:
-    gr.Markdown("## MARS5 TTS Demo\nEnter text and upload an audio file to clone the voice and generate synthesized speech using MARS5 TTS.")
     text = gr.Textbox(label="Text to synthesize")
     audio_file = gr.Audio(label="Audio file to clone from", type="filepath")
@@ -143,8 +134,8 @@ with gr.Blocks() as demo:
     # Add examples
     defaults = [0.8, -1, 0.2, 1.0, 2.6, 0.4, 100, 3, True]
     examples = [
-        ["Today is a wonderful day!", "female_speaker_1.flac", "People look, but no one ever finds it.", *defaults],
-        ["You guys need to figure this out.", "male_speaker_1.flac", "Ask her to bring these things with her from the store.", *defaults]
     ]
     gr.Examples(

 from pathlib import Path
 import tempfile, torchaudio
 from transformers import pipeline
 # Load the MARS5 model
 mars5, config_class = torch.hub.load('Camb-ai/mars5-tts', 'mars5_english', trust_repo=True)
 # Function to process the text and audio input and generate the synthesized output
 def synthesize(text, audio_file, transcript, kwargs_dict):
     print(f">>>>>>> Kwargs dict: {kwargs_dict}")
     if not transcript:
         transcript = transcribe_file(audio_file)
 with gr.Blocks() as demo:
+    link = "https://github.com/Camb-ai/MARS5-TTS"
+    gr.Markdown("## MARS5 TTS Demo\nEnter text and upload an audio file to clone the voice and generate synthesized speech using **[MARS5-TTS]({link})**")
     text = gr.Textbox(label="Text to synthesize")
     audio_file = gr.Audio(label="Audio file to clone from", type="filepath")
     # Add examples
     defaults = [0.8, -1, 0.2, 1.0, 2.6, 0.4, 100, 3, True]
     examples = [
+        ["Can you please go there and figure it out?", "female_speaker_1.flac", "People look, but no one ever finds it.", *defaults],
+        ["Hey, do you need my help?", "male_speaker_1.flac", "Ask her to bring these things with her from the store.", *defaults]
     ]
     gr.Examples(