Fix some edge cases (e.g., an existing transcription) and refactor some code
app.py CHANGED
@@ -6,13 +6,21 @@ from pixeltable.functions.video import extract_audio
 from pixeltable.functions import openai as pxop
 import openai
 
+# pixeltable setup
+db_directory = 'video_db'
+table_name = 'video_table'
+
+# constants
+
+MAX_VIDEO_SIZE_MB = 35
+GPT_MODEL = "gpt-4o-mini-2024-07-18"
+MAX_TOKENS = 500
+WHISPER_MODEL = 'whisper-1'
+
 # Set your OpenAI API key
 if 'OPENAI_API_KEY' not in os.environ:
     os.environ['OPENAI_API_KEY'] = getpass.getpass('OpenAI API Key:')
 
-# PixelTable setup
-db_directory = 'video_db'
-table_name = 'video_table'
 
 pxt.drop_dir('video_db', force=True)
 if table_name in pxt.list_tables():
@@ -42,12 +50,12 @@ else:
 # Function to generate social media post using OpenAI GPT-4 API
 def generate_social_media_post(transcript_text, social_media_type):
     response = openai.chat.completions.create(
-        model=
+        model= GPT_MODEL,
         messages=[
             {"role": "system", "content": f"You are an expert in creating social media content for {social_media_type}."},
             {"role": "user", "content": f"Generate an effective and casual social media post based on this video transcript below. Make it a viral and suitable post for {social_media_type}. Transcript:\n{transcript_text}."}
         ],
-        max_tokens=
+        max_tokens=MAX_TOKENS
     )
     return response.choices[0].message.content
 
@@ -58,34 +66,56 @@ def process_and_generate_post(video_file, social_media_type):
     try:
         video_size = os.path.getsize(video_file) / (1024 * 1024)  # Convert to MB
 
-        if video_size >
-            return "The video file is larger than
+        if video_size > MAX_VIDEO_SIZE_MB:
+            return f"The video file is larger than {MAX_VIDEO_SIZE_MB} MB. Please upload a smaller file."
 
         video_filename = os.path.basename(video_file)
-
+        tr_audio_gen_flag = True
         sm_gen_flag = True
+        print("##################\nthe video file and social media are..."+video_file+"....."+social_media_type)
+        video_df = t.where(t.video_filename == video_filename).tail(1)
+
+        if t.select().where(t.video_filename == video_filename).count() >=1:
+            #print('Video Exists')
+            tr_audio_gen_flag = False
 
         # Check if video and sm type exists
         video_type_df = t.where((t.video_filename == video_filename) & (t.sm_type == social_media_type)).tail(1)
+
         if video_type_df:
-            print('Video & Type Exists')
+            #print('Video & Type Exists')
            sm_gen_flag = False
 
-
+        #print(video_df)
+
+        #print('both the cases....')
+
+        #print(video_df and not video_type_df)
+
+        #print(t.select().where(t.video_filename == video_filename).count() >=1 )
+
+        #print(t.select().where((t.video_filename == video_filename) & (t.sm_type == social_media_type)).count() >=1 )
+
+        if (t.count() < 1) or not (t.select().where(t.video_filename == video_filename).count() >=1) or (video_df and not video_type_df) :
         # Insert video into PixelTable
         t.insert([{'video': video_file, 'video_filename': video_filename, 'sm_type': social_media_type, 'sm_post': ''}])
+
+        if tr_audio_gen_flag:
+            # Extract audio from video
+
+            if not t.get_column(name='audio'):
+                t['audio'] = extract_audio(t.video, format='mp3')
+            else:
+                t.audio = extract_audio(t.video, format='mp3')
 
-        # Extract audio from video
-        if not t.get_column(name='audio'):
-            t['audio'] = extract_audio(t.video, format='mp3')
-        else:
-            t.audio = extract_audio(t.video, format='mp3')
 
-
-
-
-
-
+        print("########### processing transcription #############")
+
+        # Transcribe audio using OpenAI Whisper API
+        if not t.get_column(name='transcription'):
+            t['transcription'] = pxop.transcriptions(t.audio, model= WHISPER_MODEL)
+        else:
+            t.transcription = pxop.transcriptions(t.audio, model= WHISPER_MODEL)
 
         #cur_video_df = t.where((t.video_filename == video_filename) & (t.sm_type == social_media_type)).tail(1)[0]
 
@@ -100,10 +130,23 @@ def process_and_generate_post(video_file, social_media_type):
 
         #plain_text = cur_video_df['transcription']['text']
 
-        #
-
-
-
+        #print(t.show())
+        #print('status of social media type')
+        #print(t.select().where((t.video_filename == video_filename) & (t.sm_type == social_media_type)).count() >=1)
+        if t.select().where((t.video_filename == video_filename) & (t.sm_type == social_media_type) & (t.sm_post != '')).count() >=1:
+
+            print("retrieving existing social media post")
+            social_media_post = t.select(t.sm_post).where((t.sm_type ==social_media_type) & (t.video_filename == video_filename)).collect()['sm_post']
+            return(social_media_post)
+
+        else:
+
+            print("generating new social media post")
+            social_media_post = generate_social_media_post(plain_text, social_media_type)
+            if sm_gen_flag:
+                cur_video_df.update({'sm_post': social_media_post})
+
+            # print(t.show())
 
         return cur_video_df['sm_post']
 
@@ -122,7 +165,6 @@ def gradio_interface():
         """)
         gr.Markdown("""<center><font size=6>Data Ops powered by <a href="https://github.com/pixeltable/pixeltable">Pixeltable</a></center>""")
         gr.Markdown("""<center>Pixeltable is a Python library providing a declarative interface for multimodal data (text, images, audio, video). It features built-in versioning, lineage tracking, and incremental updates, enabling users to store, transform, index, and iterate on data for their ML workflows. Data transformations, model inference, and custom logic are embedded as computed columns.
-
         </center>""")
         video_input = gr.Video(label="Upload Video File (max 25 MB):")
         social_media_type = gr.Dropdown(choices=["X (Twitter)", "Facebook", "LinkedIn"], label="Select Social Media Platform:", value='X (Twitter)')
@@ -137,4 +179,4 @@ def gradio_interface():
     return demo
 
 
-gradio_interface().launch(show_api=False)
+gradio_interface().launch(show_api=False)
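
For orientation, the edge cases this commit handles reduce to a two-level cache: transcription is keyed on the video file alone, while post generation is keyed on the (video, platform) pair. Below is a minimal sketch of that pattern, with plain dicts and hypothetical transcribe/generate_post callables standing in for the app's single Pixeltable table; it is not code from the commit.

# Sketch of the commit's caching logic (assumption: dicts stand in for
# the Pixeltable table; transcribe/generate_post are hypothetical).
transcripts = {}   # video_filename -> transcript text
posts = {}         # (video_filename, sm_type) -> generated post

def get_post(video_filename, sm_type, transcribe, generate_post):
    # Level 1: reuse an existing transcription of this video
    # (the commit's tr_audio_gen_flag).
    if video_filename not in transcripts:
        transcripts[video_filename] = transcribe(video_filename)
    # Level 2: reuse an existing post for this (video, platform) pair
    # (the commit's sm_gen_flag); generate one only when it is missing.
    key = (video_filename, sm_type)
    if key not in posts:
        posts[key] = generate_post(transcripts[video_filename], sm_type)
    return posts[key]

In the app itself both levels live in one table, so the two flags are derived from where(...).count() queries rather than dict lookups.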