smakamali committed on
Commit
b313c5d
1 Parent(s): aa0044b

update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -2
app.py CHANGED
@@ -18,8 +18,10 @@ def transcribe_youtube_video(url, force_transcribe=False):
18
  if text == '' or force_transcribe:
19
  from pytube import YouTube
20
  import torch
 
21
 
22
  save_dir="./docs/youtube/"
 
23
  yt = YouTube(str(url))
24
  audio = yt.streams.filter(only_audio = True).first()
25
  out_file = audio.download(filename="audio.mp3",output_path = save_dir)
@@ -172,9 +174,9 @@ def summarize_text(title,text):
172
  from langchain.document_loaders import TextLoader
173
  from langchain.text_splitter import TokenTextSplitter
174
 
175
- with open('./transcript.txt','w') as f:
176
  f.write(text)
177
- loader = TextLoader("./transcript.txt")
178
  doc = loader.load()
179
  text_splitter = TokenTextSplitter(chunk_size=500, chunk_overlap=0)
180
  docs = text_splitter.split_documents(doc)
 
18
  if text == '' or force_transcribe:
19
  from pytube import YouTube
20
  import torch
21
+ import os
22
 
23
  save_dir="./docs/youtube/"
24
+ os.mkdir(save_dir)
25
  yt = YouTube(str(url))
26
  audio = yt.streams.filter(only_audio = True).first()
27
  out_file = audio.download(filename="audio.mp3",output_path = save_dir)
 
174
  from langchain.document_loaders import TextLoader
175
  from langchain.text_splitter import TokenTextSplitter
176
 
177
+ with open('./docs/transcript.txt','w') as f:
178
  f.write(text)
179
+ loader = TextLoader("./docs/transcript.txt")
180
  doc = loader.load()
181
  text_splitter = TokenTextSplitter(chunk_size=500, chunk_overlap=0)
182
  docs = text_splitter.split_documents(doc)