import streamlit as st import tempfile import os import google.generativeai as genai from dotenv import load_dotenv load_dotenv() GOOGLE_API_KEY = os.getenv("GOOGLE_API_KEY") genai.configure(api_key=GOOGLE_API_KEY) def summarize_audio(audio_file_path): """Summarize the audio using Google's Generative API.""" model = genai.GenerativeModel("models/gemini-1.5-pro-latest") audio_file = genai.upload_file(path=audio_file_path) response = model.generate_content( [ "Please summarize the following audio.", audio_file ] ) return response.text def save_uploaded_file(uploaded_file): """Save uploaded file to a temporary file and return the path.""" try: with tempfile.NamedTemporaryFile(delete=False, suffix='.' + uploaded_file.name.split('.')[-1]) as tmp_file: tmp_file.write(uploaded_file.getvalue()) return tmp_file.name except Exception as e: st.error(f"Error handling uploaded file: {e}") return None st.title('Audio Summarization App') with st.expander("About this app"): st.write(""" This app uses Google's Gemini Pro Multimodel to summarize audio files. Upload your audio file in WAV or MP3 form and get a concise summary of its content. """) audio_file = st.file_uploader("Upload Audio File", type=['wav', 'mp3']) if audio_file is not None: audio_path = save_uploaded_file(audio_file) # Save the uploaded file and get the path st.audio(audio_path) if st.button('Summarize Audio'): with st.spinner('Summarizing...'): summary_text = summarize_audio(audio_path) st.success(summary_text)