Spaces:
Runtime error
Runtime error
| import gradio as gr | |
| import tensorflow as tf | |
| from wav2vec2 import Wav2Vec2Processor, Wav2Vec2ForCTC | |
if __name__ == "__main__":
    # Two instances of the same helper class: the first is applied to the raw
    # audio before it reaches the model, the second (tokenizer mode) is used
    # to decode the predicted ids back into text.
    processor = Wav2Vec2Processor(is_tokenizer=False)
    tokenizer = Wav2Vec2Processor(is_tokenizer=True)

    # Load the pretrained CTC model by its published name.
    model = Wav2Vec2ForCTC.from_pretrained("vasudevgupta/gsoc-wav2vec2-960h")
def _forward(speech: tf.Tensor):
    """Run the model on a single utterance and return the predicted ids.

    Args:
        speech: Audio tensor for one utterance. It is passed through the
            module-level ``processor`` and given a leading batch axis before
            being handed to the module-level ``model``.

    Returns:
        The arg-max over the last axis of the model output, with all
        size-1 dimensions squeezed away.
    """
    # ``[None]`` prepends a batch axis of size 1.
    batch = processor(speech)[None]
    model_out = model(batch, training=False)
    predicted_ids = tf.argmax(model_out, axis=-1)
    return tf.squeeze(predicted_ids)
def transcribe_text(inputs):
    """Transcribe one Gradio audio submission to text.

    Args:
        inputs: Value delivered by the Gradio ``"audio"`` input: a
            two-element ``(sample_rate, samples)`` pair, or ``None`` when the
            form is submitted without any audio.

    Returns:
        The decoded transcription string, or an empty string when no audio
        was supplied.
    """
    # Gradio passes ``None`` for an empty audio widget; unpacking it would
    # raise ``TypeError``, so answer with an empty transcription instead.
    if inputs is None:
        return ""

    # NOTE(review): the sample rate is discarded and nothing is resampled --
    # presumably the model expects a fixed rate (16 kHz?); confirm.
    _sample_rate, samples = inputs
    speech = tf.constant(samples, dtype=tf.float32)
    # Reverses the axis order: presumably turns a (samples, channels) array
    # into (channels, samples). A 1-D array is left unchanged.
    speech = tf.transpose(speech)
    predicted_ids = _forward(speech)
    return tokenizer.decode(predicted_ids.numpy().tolist())
# The objects the callback relies on (processor, tokenizer, model) are only
# created when the file is run as a script, so the web UI must only be started
# in that case too; importing the module must not spin up a server.
if __name__ == "__main__":
    # Audio-in / text-out demo backed by ``transcribe_text``.
    gr.Interface(
        fn=transcribe_text,
        inputs="audio",
        outputs="text",
    ).launch()