Spaces:

akthangdz
/

TEXT_TO_VIDEO

Running

App Files Community

akthangdz committed 26 days ago

Commit

a2495b3

1 Parent(s): e226cbd

main

Browse files

Files changed (3) hide show

app.py +78 -13
input.jpg +3 -0
ttv.py +10 -2

app.py CHANGED Viewed

@@ -1,18 +1,53 @@
 import gradio as gr
 import subprocess
 import os
-def run_ttv():
     try:
-        result = subprocess.run(['python', 'ttv.py'], capture_output=True, text=True)
-        # Lấy danh sách file video trong thư mục temp
-        video_files = [f for f in os.listdir('temp') if f.endswith(('.mp4', '.avi', '.mov'))]
         if video_files:
-            # Trả về đường dẫn đến file video mới nhất
-            latest_video = os.path.join('temp', video_files[-1])
-            return result.stdout, latest_video
-        return result.stdout, None
     except Exception as e:
         return f"Có lỗi xảy ra: {str(e)}", None
@@ -21,13 +56,43 @@ with gr.Blocks() as demo:
     gr.Markdown("# Ứng dụng Text-to-Video")
     with gr.Row():
-        run_button = gr.Button("Chạy Text-to-Video")
-        output = gr.Textbox(label="Kết quả")
-    # Thay đổi từ Audio sang Video
-    video_output = gr.Video(label="File video đã tạo")
-    run_button.click(fn=run_ttv, outputs=[output, video_output])
 # Chạy ứng dụng
 if __name__ == "__main__":

 import gradio as gr
 import subprocess
 import os
+import time
+def run_ttv(prompt, progress=gr.Progress()):
     try:
+        # Kiểm tra file input.jpg
+        if not os.path.exists("input.jpg"):
+            return "Lỗi: Không tìm thấy file input.jpg", None
+        progress(0, desc="Đang khởi động mô hình...")
+        # Chạy file ttv.py với prompt được truyền vào
+        env = os.environ.copy()
+        env["PROMPT_TEXT"] = prompt  # Truyền prompt qua biến môi trường
+        process = subprocess.Popen(
+            ['python', 'ttv.py'],
+            env=env,
+            stdout=subprocess.PIPE,
+            stderr=subprocess.PIPE,
+            universal_newlines=True
+        )
+        # Theo dõi output và cập nhật progress
+        output_lines = []
+        while True:
+            line = process.stdout.readline()
+            if not line and process.poll() is not None:
+                break
+            if line:
+                output_lines.append(line.strip())
+                if "Starting..." in line:
+                    progress(0.2, desc="Đang xử lý...")
+                elif "Loading model..." in line:
+                    progress(0.4, desc="Đang tải mô hình...")
+                elif "Generating..." in line:
+                    progress(0.6, desc="Đang tạo video...")
+        progress(0.8, desc="Đang hoàn thiện...")
+        # Kiểm tra và trả về video mới nhất
+        video_files = [f for f in os.listdir('.') if f.endswith(('.mp4', '.avi', '.mov'))]
         if video_files:
+            latest_video = video_files[-1]
+            progress(1.0, desc="Hoàn thành!")
+            return "\n".join(output_lines), latest_video
+        return "\n".join(output_lines), None
     except Exception as e:
         return f"Có lỗi xảy ra: {str(e)}", None
     gr.Markdown("# Ứng dụng Text-to-Video")
     with gr.Row():
+        # Thêm input cho prompt
+        text_input = gr.Textbox(
+            label="Nhập mô tả cho video",
+            placeholder="Ví dụ: A little girl is riding a bicycle at high speed...",
+            lines=3
+        )
+    with gr.Row():
+        # Thêm preview cho input image
+        input_image = gr.Image(
+            label="Ảnh input.jpg",
+            value="input.jpg" if os.path.exists("input.jpg") else None,
+            interactive=False
+        )
+        video_output = gr.Video(label="Video đã tạo")
+    with gr.Row():
+        run_button = gr.Button("Tạo Video", variant="primary")
+        output = gr.Textbox(label="Trạng thái")
+    # Thêm các thông tin hướng dẫn
+    gr.Markdown("""
+    ### Hướng dẫn sử dụng:
+    1. Đặt ảnh nguồn với tên `input.jpg` vào thư mục chứa code
+    2. Nhập mô tả chi tiết cho video bạn muốn tạo
+    3. Nhấn "Tạo Video" và đợi quá trình xử lý hoàn tất
+    ### Lưu ý:
+    - Quá trình tạo video có thể mất vài phút
+    - Đảm bảo máy tính có đủ RAM và GPU để xử lý
+    """)
+    run_button.click(
+        fn=run_ttv,
+        inputs=text_input,
+        outputs=[output, video_output]
+    )
 # Chạy ứng dụng
 if __name__ == "__main__":

input.jpg ADDED Viewed

Git LFS Details

SHA256: c86f52bddce88afb46a6218203d32f1948554183a2dad4dac3e364cde516c827
Pointer size: 130 Bytes
Size of remote file: 64.3 kB

ttv.py CHANGED Viewed

@@ -1,9 +1,14 @@
 import torch
 from diffusers import CogVideoXImageToVideoPipeline
 from diffusers.utils import export_to_video, load_image
 print("Starting...")
-prompt = "A little girl is riding a bicycle at high speed. Focused, detailed, realistic."
 image = load_image(image="input.jpg")
 pipe = CogVideoXImageToVideoPipeline.from_pretrained(
     "THUDM/CogVideoX-5b-I2V",
@@ -14,6 +19,7 @@ pipe.enable_sequential_cpu_offload()
 pipe.vae.enable_tiling()
 pipe.vae.enable_slicing()
 video = pipe(
     prompt=prompt,
     image=image,
@@ -24,4 +30,6 @@ video = pipe(
     generator=torch.Generator(device="cuda").manual_seed(42),
 ).frames[0]
-export_to_video(video, "temp/output.mp4", fps=8)

 import torch
 from diffusers import CogVideoXImageToVideoPipeline
 from diffusers.utils import export_to_video, load_image
+import os
 print("Starting...")
+# Lấy prompt từ biến môi trường hoặc sử dụng giá trị mặc định
+prompt = os.getenv('PROMPT_TEXT', "A little girl is riding a bicycle at high speed. Focused, detailed, realistic.")
+print("Loading model...")
 image = load_image(image="input.jpg")
 pipe = CogVideoXImageToVideoPipeline.from_pretrained(
     "THUDM/CogVideoX-5b-I2V",
 pipe.vae.enable_tiling()
 pipe.vae.enable_slicing()
+print("Generating...")
 video = pipe(
     prompt=prompt,
     image=image,
     generator=torch.Generator(device="cuda").manual_seed(42),
 ).frames[0]
+print("Saving video...")
+export_to_video(video, "output.mp4", fps=8)
+print("Done!")