Spaces:
Runtime error
Runtime error
| import gradio as gr | |
| from dataset import TranscriptDataset | |
| from downloader import WhisperPP, YoutubeDownloader | |
| from interpreter import WhisperInterpreter | |
# Module-level settings for the transcription pipeline.

# Forwarded to TranscriptDataset.generate_dataset via the params dict;
# presumably selects the Whisper checkpoint size -- confirm in dataset.py.
model_size = "base"

# Only referenced by the legacy WhisperPP code path in this file;
# kept because other modules may import it.
mode = "transcribe"

# Forwarded via the params dict; presumably toggles writing transcripts
# to disk -- confirm in dataset.py.
write = False

# Passed as the second positional argument to generate_dataset.
download_path = "tmp/"
def dataset(url, name, token):
    """Generate a transcript dataset for a YouTube link and upload it.

    Args:
        url: YouTube link handed to ``TranscriptDataset.generate_dataset``.
        name: Name used to construct the ``TranscriptDataset``; also echoed
            back in the returned message.
        token: Access token forwarded to ``TranscriptDataset.upload``.

    Returns:
        A confirmation string of the form ``"Playlist Name: <name>!!"``.
    """
    ds = TranscriptDataset(name)

    # Options forwarded as-is to generate_dataset; their exact semantics are
    # defined by TranscriptDataset (not visible here).
    params = dict(model_size=model_size, write=write, number_videos=500)
    overwrite = True

    ds.generate_dataset(url, download_path, overwrite, params)
    ds.upload(token)
    return f"Playlist Name: {name}!!"
# Input/output widgets for the Gradio interface.
yt_input = gr.Textbox(label="Youtube Link")
name_input = gr.Textbox(label="Dataset Name")
# The write token is a secret: mask it so it is not shown in clear text.
token_input = gr.Textbox(placeholder="Write access token", type="password")
repo_output = gr.Textbox(label="Outcome")

# Wire the three inputs to dataset() and show its return string as the outcome.
iface = gr.Interface(
    fn=dataset,
    inputs=[yt_input, name_input, token_input],
    outputs=repo_output,
    title="Create Transcription Dataset for Youtube using OpenAI Whisper !",
    description=(
        "Create a HuggingFace repository for Youtube Transcripts! "
        "You need to specify a write token obtained in "
        "https://hf.co/settings/token. "
        "This Space is an experimental demo."
    ),
    article=(
        "<p>Find your write token at "
        "<a href='https://huggingface.co/settings/token' target='_blank'>"
        "token settings</a></p>"
    ),
)

# Launched at import time on purpose: the hosting environment runs this
# file directly as the app entry point.
iface.launch()