neutts-air

Running

StorageDater committed 19 days ago

Commit

d2078f6

verified ·

1 Parent(s): a8f789a

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -7,18 +7,18 @@ import numpy as np
 import gradio as gr
 SAMPLES_PATH = os.path.join(os.getcwd(), "neutts-air", "samples")
-DEFAULT_REF_TEXT = "So I'm live on radio. And I say, well, my dear friend James here clearly, and the whole room just froze. Turns out I'd completely misspoken and mentioned our other friend."
 DEFAULT_REF_PATH = os.path.join(SAMPLES_PATH, "dave.wav")
 DEFAULT_GEN_TEXT = "My name is Dave, and um, I'm from London."
 tts = NeuTTSAir(
     backbone_repo="neuphonic/neutts-air",
-    backbone_device="cuda",
     codec_repo="neuphonic/neucodec",
-    codec_device="cuda"
 )
-@spaces.GPU()
 def infer(
     ref_text: str,
     ref_audio_path: str,
@@ -35,7 +35,7 @@ def infer(
         tuple [int, np.ndarray]: A tuple containing the sample rate (24000) and the generated audio waveform as a numpy array.
     """
-    gr.Info("Starting inference request!")
     gr.Info("Encoding reference...")
     ref_codes = tts.encode_reference(ref_audio_path)
@@ -52,9 +52,9 @@ demo = gr.Interface(
         gr.Textbox(label="Text to Generate", value=DEFAULT_GEN_TEXT),
     ],
     outputs=gr.Audio(type="numpy", label="Generated Speech"),
-    title="NeuTTS-Air☁️",
-    description="Upload a reference audio sample, provide the reference text, and enter new text to synthesize."
 )
 if __name__ == "__main__":
-    demo.launch(allowed_paths=[SAMPLES_PATH], mcp_server=True, inbrowser=True)

 import gradio as gr
 SAMPLES_PATH = os.path.join(os.getcwd(), "neutts-air", "samples")
+DEFAULT_REF_TEXT = "So I'm live on radio. And I say, well, my dear friend James here clearly, and the whole room just froze. Turns out I'd completely misspoken and mentioned our other friend."
 DEFAULT_REF_PATH = os.path.join(SAMPLES_PATH, "dave.wav")
 DEFAULT_GEN_TEXT = "My name is Dave, and um, I'm from London."
+# --- Force CPU usage ---
 tts = NeuTTSAir(
     backbone_repo="neuphonic/neutts-air",
+    backbone_device="cpu",
     codec_repo="neuphonic/neucodec",
+    codec_device="cpu"
 )
 def infer(
     ref_text: str,
     ref_audio_path: str,
         tuple [int, np.ndarray]: A tuple containing the sample rate (24000) and the generated audio waveform as a numpy array.
     """
+    gr.Info("Starting inference request (CPU mode)!")
     gr.Info("Encoding reference...")
     ref_codes = tts.encode_reference(ref_audio_path)
         gr.Textbox(label="Text to Generate", value=DEFAULT_GEN_TEXT),
     ],
     outputs=gr.Audio(type="numpy", label="Generated Speech"),
+    title="NeuTTS-Air☁️ (CPU Mode)",
+    description="Upload a reference audio sample, provide the reference text, and enter new text to synthesize (running on CPU)."
 )
 if __name__ == "__main__":
+    demo.launch(allowed_paths=[SAMPLES_PATH], mcp_server=True, inbrowser=True)