Spaces:

suprimedev
/

speh32

Sleeping

App Files Community

suprimedev committed 25 days ago

Commit

4742671

verified ·

1 Parent(s): 145d58c

Update app.py

Browse files

Files changed (1) hide show

app.py +24 -24

app.py CHANGED Viewed

@@ -113,7 +113,7 @@ def process_audio_chunk(audio_tuple):
         text = ""
         try:
             text = recognizer.recognize_google(audio, language='fa-IR')  # Persian first
-            # اگر key داری: recognize_google(audio, language='fa-IR', key="YOUR_GOOGLE_API_KEY")
         except sr.UnknownValueError:
             try:
                 text = recognizer.recognize_google(audio, language='en-US')
@@ -153,10 +153,13 @@ def clear_transcript():
         current_transcript = ""
     # Clear queue
     while not audio_queue.empty():
-        audio_queue.get_nowait()
     return ""
-# File transcription (unchanged, works fine)
 def transcribe_file(audio_file, chunk_duration=30):
     if audio_file is None:
         yield "لطفاً فایل آپلود کنید", ""
@@ -210,7 +213,7 @@ def save_text(text):
     temp_file.close()
     return temp_file.name
-# Gradio UI with Timer for live updates
 with gr.Blocks(
     title="تبدیل گفتار به متن - Real-time Fixed",
     theme=gr.themes.Soft(),
@@ -229,7 +232,7 @@ with gr.Blocks(
     """)
     with gr.Tabs():
-        with gr.TabItem("🎙️ ضبط مستقیم"):
             gr.Markdown("### فعال کنید و 5+ ثانیه واضح صحبت کنید (متن هر 3s آپدیت می‌شه)", elem_classes="rtl")
             with gr.Row():
@@ -239,9 +242,6 @@ with gr.Blocks(
                     label="میکروفون (ضبط رو شروع کن)",
                     elem_classes="rtl"
                 )
-                start_btn = gr.Button("▶️ شروع real-time", variant="primary")
-                stop_btn = gr.Button("⏹️ توقف", variant="secondary")
             realtime_output = gr.Textbox(
                 label="متن live",
@@ -255,23 +255,23 @@ with gr.Blocks(
             clear_btn = gr.Button("🗑️ پاک کردن", variant="secondary")
-            # Events
-            audio_input.change(handle_realtime_audio, inputs=[audio_input], outputs=[audio_input])  # Handle chunks
-            # Timer for live update (هر 2s transcript رو pull کن)
-            timer = gr.Timer(2.0)  # Start after tab open
             timer.tick(get_current_transcript, outputs=[realtime_output])
             clear_btn.click(clear_transcript, outputs=[realtime_output])
-            # Start/stop recording (toggle microphone)
-            def toggle_recording(active):
-                return gr.update(value=active)  # Simple toggle, but Gradio handles start/stop
-            start_btn.click(lambda: gr.update(visible=True), outputs=[stop_btn]).click(
-                toggle_recording, inputs=[audio_input], outputs=[audio_input]
-            )
-            stop_btn.click(lambda: gr.update(visible=False), outputs=[start_btn])
         with gr.TabItem("📁 فایل صوتی"):
             gr.Markdown("### فایل آپلود کن و تبدیل کن", elem_classes="rtl")
@@ -290,13 +290,13 @@ with gr.Blocks(
                 download_file = gr.File(label="دانلود TXT", visible=False, elem_classes="rtl")
             process_btn.click(transcribe_file, [file_input, chunk_slider], [file_output, progress_label])
-            save_btn.click(save_text, file_output, download_file).then(lambda: gr.update(visible=True), download_file)
             clear_file_btn.click(lambda: ("", ""), [file_output, progress_label])
     with gr.Accordion("📖 راهنما", open=False, elem_classes="rtl"):
         gr.Markdown("""
         ### استفاده:
-        - **Real-time**: میکروفون رو فعال کن، 5s+ صحبت کن. هر 3s متن آپدیت می‌شه (background).
         - **فایل**: آپلود و دکمه بزن.
         ### نکات:
         - 🗣️ واضح صحبت کن، نویز کم.
@@ -306,7 +306,7 @@ with gr.Blocks(
         - توزیع: share لینک رو share کن، همه browserها ساپورت.
         """, elem_classes="rtl")
-    gr.HTML('<div style="text-align: center; margin-top: 2em; padding: 1em; background: #f8f9fa;"><p style="color: #666;">نسخه 2.2 - Fixed Real-time با Timer | Google Backend</p></div>')
 if __name__ == "__main__":
     demo.queue().launch(share=True, show_error=True, server_name="0.0.0.0", server_port=7860)

         text = ""
         try:
             text = recognizer.recognize_google(audio, language='fa-IR')  # Persian first
+            # اگر key داری: text = recognizer.recognize_google(audio, language='fa-IR', key="YOUR_GOOGLE_API_KEY")
         except sr.UnknownValueError:
             try:
                 text = recognizer.recognize_google(audio, language='en-US')
         current_transcript = ""
     # Clear queue
     while not audio_queue.empty():
+        try:
+            audio_queue.get_nowait()
+        except queue.Empty:
+            break
     return ""
+# File transcription (unchanged)
 def transcribe_file(audio_file, chunk_duration=30):
     if audio_file is None:
         yield "لطفاً فایل آپلود کنید", ""
     temp_file.close()
     return temp_file.name
+# Gradio UI (Fixed: Separate clicks, Timer with load event)
 with gr.Blocks(
     title="تبدیل گفتار به متن - Real-time Fixed",
     theme=gr.themes.Soft(),
     """)
     with gr.Tabs():
+        with gr.TabItem("🎙️ ضبط مستقیم", id="realtime_tab") as realtime_tab:
             gr.Markdown("### فعال کنید و 5+ ثانیه واضح صحبت کنید (متن هر 3s آپدیت می‌شه)", elem_classes="rtl")
             with gr.Row():
                     label="میکروفون (ضبط رو شروع کن)",
                     elem_classes="rtl"
                 )
             realtime_output = gr.Textbox(
                 label="متن live",
             clear_btn = gr.Button("🗑️ پاک کردن", variant="secondary")
+            # Events (Fixed: Separate clicks)
+            audio_input.change(
+                handle_realtime_audio,
+                inputs=[audio_input],
+                outputs=[realtime_output]  # Update output on change
+            )
+            # Timer for live update: Start when tab loads
+            timer = gr.Timer(value=2.0, active=False)
+            def start_timer():
+                timer.change(active=True)
+                return get_current_transcript()
+            realtime_tab.select(start_timer, outputs=[realtime_output])
             timer.tick(get_current_transcript, outputs=[realtime_output])
             clear_btn.click(clear_transcript, outputs=[realtime_output])
         with gr.TabItem("📁 فایل صوتی"):
             gr.Markdown("### فایل آپلود کن و تبدیل کن", elem_classes="rtl")
                 download_file = gr.File(label="دانلود TXT", visible=False, elem_classes="rtl")
             process_btn.click(transcribe_file, [file_input, chunk_slider], [file_output, progress_label])
+            save_btn.click(save_text, file_output, download_file).then(lambda: gr.update(visible=True), outputs=[download_file])
             clear_file_btn.click(lambda: ("", ""), [file_output, progress_label])
     with gr.Accordion("📖 راهنما", open=False, elem_classes="rtl"):
         gr.Markdown("""
         ### استفاده:
+        - **Real-time**: تب رو باز کن، میکروفون فعال کن، 5s+ صحبت کن. هر 3s متن آپدیت می‌شه (background).
         - **فایل**: آپلود و دکمه بزن.
         ### نکات:
         - 🗣️ واضح صحبت کن، نویز کم.
         - توزیع: share لینک رو share کن، همه browserها ساپورت.
         """, elem_classes="rtl")
+    gr.HTML('<div style="text-align: center; margin-top: 2em; padding: 1em; background: #f8f9fa;"><p style="color: #666;">نسخه 2.3 - Fixed Timer & Clicks | Google Backend</p></div>')
 if __name__ == "__main__":
     demo.queue().launch(share=True, show_error=True, server_name="0.0.0.0", server_port=7860)