Spaces:

siddhartharya
/

My_NotebookLM_Podcast_Generator

Running

App Files Community

siddhartharya committed 18 days ago

Commit

f0db570

•

1 Parent(s): 652d9d0

Update app.py

Browse files

Files changed (1) hide show

app.py +34 -74

app.py CHANGED Viewed

@@ -1,89 +1,49 @@
 import gradio as gr
-import PyPDF2
-import docx
-import requests
-from bs4 import BeautifulSoup
-from groq import Groq
-from gtts import gTTS
 from pydub import AudioSegment
 import os
-import io
-# Initialize Groq client
-groq_client = Groq()
-def extract_text(file_or_url):
-    if isinstance(file_or_url, str):  # URL
-        response = requests.get(file_or_url)
-        soup = BeautifulSoup(response.text, 'html.parser')
-        return soup.get_text()
-    elif file_or_url is not None:
-        if file_or_url.name.endswith('.pdf'):
-            reader = PyPDF2.PdfReader(file_or_url.file)
-            return ' '.join([page.extract_text() for page in reader.pages])
-        elif file_or_url.name.endswith('.docx'):
-            doc = docx.Document(file_or_url.file)
-            return ' '.join([para.text for para in doc.paragraphs])
-    return ""
-def generate_podcast_script(text):
-    prompt = f"""Generate a podcast script between a man and a woman discussing the following text:
-    {text}
-    The podcast should be informative and engaging, with a natural conversation flow.
-    Limit the script to approximately 750 words to fit within a 5-minute podcast."""
-    response = groq_client.chat.completions.create(
-        messages=[
-            {"role": "system", "content": "You are an AI assistant that generates podcast scripts based on given text."},
-            {"role": "user", "content": prompt}
-        ],
-        model="llama-3.1-70b-versatile",  # Using LLaMa 3.1 70B model
-        max_tokens=1000,
-        temperature=0.7
-    )
-    return response.choices[0].message.content
-def text_to_speech(script):
-    lines = script.split('\n')
-    audio_segments = []
-    for line in lines:
-        if line.startswith("Man:"):
-            tts = gTTS(line[4:], lang='en', tld='co.uk')
-        elif line.startswith("Woman:"):
-            tts = gTTS(line[6:], lang='en', tld='com.au')
-        else:
-            continue
-        buffer = io.BytesIO()
-        tts.write_to_fp(buffer)
-        buffer.seek(0)
-        audio_segments.append(AudioSegment.from_mp3(buffer))
-    final_audio = sum(audio_segments)
-    final_audio = final_audio[:300000]  # Trim to 5 minutes (300,000 ms)
-    buffer = io.BytesIO()
-    final_audio.export(buffer, format="mp3")
-    buffer.seek(0)
-    return buffer
-def generate_podcast(file_or_url):
-    text = extract_text(file_or_url)
-    if not text:
-        return None, "Failed to extract text. Please check your input."
-    script = generate_podcast_script(text)
-    audio_file = text_to_speech(script)
-    return audio_file, script
 iface = gr.Interface(
     fn=generate_podcast,
     inputs=[
-        gr.File(label="Upload PDF/DOC file"),
-        gr.Textbox(label="Or enter URL")
     ],
     outputs=[
         gr.Audio(label="Generated Podcast"),
-        gr.Textbox(label="Podcast Script")
     ],
-    title="Custom NotebookLM-type Podcast Generator (LLaMa 3.1 70B)"
 )
 iface.launch()

 import gradio as gr
+from utils import generate_script, generate_audio
+from prompts import SYSTEM_PROMPT
 from pydub import AudioSegment
 import os
+def generate_podcast(file, tone, length):
+    # Extract text from PDF
+    # Generate script using generate_script function
+    # Generate audio for each dialogue item
+    # Combine audio segments
+    # Return audio file and transcript
+# Gradio interface
+instructions = """
+# Podcast Generator
+Welcome to the Podcast Generator project! This tool allows you to create custom podcast episodes using AI-generated content.
+## Features
+* Generate podcast scripts on any topic
+* Convert text to speech for a natural listening experience
+* Choose the tone of your podcast
+* Export episodes as MP3 files
+## How to Use
+1. Upload a PDF file (max 2048 tokens)
+2. Select the desired tone (humorous, casual, formal)
+3. Choose the podcast length
+4. Click "Generate" to create your podcast
+5. Listen to the generated audio and review the transcript
+"""
 iface = gr.Interface(
     fn=generate_podcast,
     inputs=[
+        gr.File(label="Upload PDF file"),
+        gr.Radio(["humorous", "casual", "formal"], label="Select podcast tone", value="casual"),
+        gr.Radio(["Short (1-2 min)", "Medium (3-5 min)"], label="Podcast length", value="Medium (3-5 min)")
     ],
     outputs=[
         gr.Audio(label="Generated Podcast"),
+        gr.Markdown(label="Transcript")
     ],
+    title="Custom NotebookLM-type Podcast Generator",
+    description=instructions
 )
 iface.launch()