Spaces:
Runtime error
Runtime error
| from youtube_transcript_api import YouTubeTranscriptApi | |
| import re | |
def get_youtube_video_id(query):
    """Extract the 11-character YouTube video id from a URL inside *query*.

    Recognised URL shapes are ``youtu.be/<id>`` and ``youtube.com/`` followed
    by ``watch?v=``, ``embed/``, ``v/`` or ``shorts/``.

    Args:
        query: Text that may contain a YouTube URL.

    Returns:
        The video id string, or ``None`` when no supported URL is present or
        *query* is not a string.
    """
    try:
        match = re.search(
            r'(?:youtu\.be/|youtube\.com/(?:watch\?v=|embed/|v/|shorts/))([\w-]{11})',
            query,
        )
    except TypeError:
        # re.search rejects non-string input (e.g. None); treat it as
        # "nothing found" instead of crashing the caller.
        match = None

    if match is None:
        # re.search reports "no match" by returning None, not by raising,
        # so the not-found message has to be emitted here.
        print("Did not find youtube video id from query ", query)
        return None

    video_id = match.group(1)
    print(video_id)
    return video_id
def fetch_transcript_english(video_id):
    """Fetch the English transcript for a YouTube video (best effort).

    Args:
        video_id: YouTube video id passed to ``YouTubeTranscriptApi.fetch``.

    Returns:
        Whatever ``fetch`` returns for ``languages=['en']``, or ``None`` when
        the fetch raised an exception.
    """
    try:
        return YouTubeTranscriptApi().fetch(video_id, languages=['en'])
    except Exception as exc:
        # Deliberately best-effort: report why the fetch failed and hand
        # back None. Catching Exception (not a bare except) lets
        # KeyboardInterrupt / SystemExit propagate.
        print("Error fetching English transcript for", video_id, "-", exc)
        return None
def post_process_transcript(transcript_snippets):
    """Join the text of every transcript snippet into one string.

    Args:
        transcript_snippets: Iterable of objects exposing a ``text``
            attribute, or ``None`` (e.g. when no transcript was obtained).

    Returns:
        The snippet texts separated by single spaces; ``""`` when the input
        is ``None`` or contains no snippets.
    """
    if transcript_snippets is None:
        # A missing transcript yields an empty string rather than a
        # TypeError from iterating None.
        return ""
    return " ".join(snippet.text for snippet in transcript_snippets)