Update app.py
app.py CHANGED
@@ -3,11 +3,11 @@ import time
 import gradio as gr
 import librosa
 import numpy as np
-import soundfile as sf
+# import soundfile as sf
 from transformers import pipeline

 TARGET_SAMPLE_RATE = 16_000
-AUDIO_SECONDS_THRESHOLD =
+AUDIO_SECONDS_THRESHOLD = 2
 pipe = pipeline("audio-classification", model="MIT/ast-finetuned-audioset-10-10-0.4593")
 prediction = [{"score": 1, "label": "recording..."}]

@@ -27,7 +27,7 @@ def streaming_recording_fn(stream, new_chunk):
     if (stream.shape[-1] / TARGET_SAMPLE_RATE) >= AUDIO_SECONDS_THRESHOLD:
         prediction = pipe(stream)
         file_name = f'./audio/{time.strftime("%Y%m%d_%H%M%S", time.localtime())}.wav'
-        sf.write(file_name, stream, TARGET_SAMPLE_RATE)
+        # # sf.write(file_name, stream, TARGET_SAMPLE_RATE)
         print(f"SAVE AUDIO: {file_name}")
         print(f">>>>>>1\t{y.shape=}, {stream.shape=}\n\t{prediction[0]=}")
         stream = None
@@ -49,7 +49,7 @@ def microphone_fn(waveform):
     y = librosa.resample(y, orig_sr=sr, target_sr=TARGET_SAMPLE_RATE)
     result = pipe(y)
     file_name = f'./audio/{time.strftime("%Y%m%d_%H%M%S", time.localtime())}.wav'
-    sf.write(file_name, y, TARGET_SAMPLE_RATE)
+    # sf.write(file_name, y, TARGET_SAMPLE_RATE)
     return {i['label']: i['score'] for i in result}


@@ -61,7 +61,7 @@ def file_fn(waveform):
     y = librosa.resample(y, orig_sr=sr, target_sr=TARGET_SAMPLE_RATE)
     result = pipe(y)
     file_name = f'./audio/{time.strftime("%Y%m%d_%H%M%S", time.localtime())}.wav'
-    sf.write(file_name, y, TARGET_SAMPLE_RATE)
+    # sf.write(file_name, y, TARGET_SAMPLE_RATE)
    return {i['label']: i['score'] for i in result}


@@ -98,7 +98,7 @@ with gr.Blocks() as example:

 with gr.Blocks() as demo:
     gr.TabbedInterface([file_demo, streaming_demo, microphone_demo, example],
-                       ["Audio file", "Streaming", "Microphone", "
+                       ["Audio file", "Streaming", "Microphone", "Example"])

 if __name__ == "__main__":

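
For context, a minimal sketch of the streaming handler these diffed lines sit in, assuming the usual Gradio streaming-audio callback signature (state plus a (sample_rate, samples) chunk). Only the lines visible in the diff are taken from the Space; the chunk normalisation, accumulation, and return value are assumptions, not the Space's actual code.

# Hypothetical reconstruction of streaming_recording_fn around the diffed lines;
# follows the common Gradio streaming-audio pattern, not necessarily this Space.
import time

import librosa
import numpy as np
from transformers import pipeline

TARGET_SAMPLE_RATE = 16_000
AUDIO_SECONDS_THRESHOLD = 2
pipe = pipeline("audio-classification", model="MIT/ast-finetuned-audioset-10-10-0.4593")
prediction = [{"score": 1, "label": "recording..."}]


def streaming_recording_fn(stream, new_chunk):
    global prediction
    sr, y = new_chunk                      # Gradio delivers (sample_rate, int16 array)
    y = y.astype(np.float32)
    peak = np.max(np.abs(y))
    if peak > 0:
        y /= peak                          # normalise to [-1, 1]
    y = librosa.resample(y, orig_sr=sr, target_sr=TARGET_SAMPLE_RATE)
    stream = y if stream is None else np.concatenate([stream, y])

    if (stream.shape[-1] / TARGET_SAMPLE_RATE) >= AUDIO_SECONDS_THRESHOLD:
        prediction = pipe(stream)
        file_name = f'./audio/{time.strftime("%Y%m%d_%H%M%S", time.localtime())}.wav'
        # sf.write(file_name, stream, TARGET_SAMPLE_RATE)  # disabled by this commit
        print(f"SAVE AUDIO: {file_name}")
        stream = None                      # reset the buffer after each classification

    return stream, {p["label"]: p["score"] for p in prediction}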
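
The microphone and file handlers share the same resample-then-classify path. A quick way to sanity-check that path outside Gradio, with an illustrative local file name:

import librosa
from transformers import pipeline

pipe = pipeline("audio-classification", model="MIT/ast-finetuned-audioset-10-10-0.4593")

y, sr = librosa.load("example.wav", sr=None, mono=True)   # any local clip
y = librosa.resample(y, orig_sr=sr, target_sr=16_000)     # the AST checkpoint expects 16 kHz input
print({i["label"]: i["score"] for i in pipe(y)})          # top AudioSet labels with scores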