File size: 2,013 Bytes
cc8d245
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
e65e6e5
cc8d245
 
64fa793
cc8d245
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
07ecc9d
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
import streamlit as st  
import numpy as np  
import cv2  
import tempfile  
from gradio_client import Client  
from PIL import Image  

# Проверка доступности API  
api_url = "https://pragnakalp-ocr-image-to-text.hf.space/--replicas/lhzf3/"  
try:  
    client = Client(api_url)  
except Exception as e:  
    st.error(f"Failed to initialize client: {str(e)}")  
    st.stop()  

# Заголовок приложения  
st.title("Video Frame to Image Description")  

# Загрузка видеофайла  
uploaded_file = st.file_uploader("Upload a video file", type=["mp4", "avi", "mov"])  

cap = None  # Инициализируем объект cap как None  

if uploaded_file is not None:  
    tfile = tempfile.NamedTemporaryFile(delete=False)  
    tfile.write(uploaded_file.read())  
    
    cap = cv2.VideoCapture(tfile.name)  
    length = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))  
    
    if length > 0:  
        random_frame = np.random.randint(length)  
        cap.set(cv2.CAP_PROP_POS_FRAMES, random_frame)  
        ret, frame = cap.read()  

        if ret:  
            frame_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)  
            pil_image = Image.fromarray(frame_rgb)  
            st.image(pil_image, caption=f"Random Frame {random_frame}")  

            buf = tempfile.NamedTemporaryFile(suffix='.jpg', delete=False)  
            pil_image.save(buf, format='JPEG')  
            buf.close()  

            try:  
                result = client.predict("PaddleOCR", buf.name, api_name="/predict")  
                description = result['data']  
                st.success(f"Generated Description: {description}")  
            except Exception as e:  
                st.error(f"Error: Could not get a response from the model. {str(e)}")  
        else:  
            st.error("Error: Could not read a frame from the video.")  
    else:  
        st.error("Error: Video file does not contain any frames.")  

if cap is not None:  
    cap.release()