hprasath's picture
Upload 9 files
bbcc5b2 verified
raw
history blame
1.55 kB
import cv2
import numpy as np
from utils.imageEmbedding.index import get_image_embedding
from utils.imageToText.index import extract_text
def get_video_embedding(video_url):
try:
cap = cv2.VideoCapture(video_url)
fps = cap.get(cv2.CAP_PROP_FPS)
interval = int(fps) # Capture a frame every second
frame_count = 0
video_embeddings = []
while(cap.isOpened()):
ret, frame = cap.read()
if ret:
if frame_count % interval == 0:
# Convert frame to binary format
ret, buffer = cv2.imencode('.jpg', frame)
if not ret:
continue
# Convert frame binary data to bytes
frame_bytes = buffer.tobytes()
# Get image embedding for the frame
extracted_text = extract_text(frame_bytes)
image_embedding = get_image_embedding(frame_bytes)
image_embedding_list = image_embedding.tolist()
video_embeddings.append({"image_embedding": image_embedding_list ,"extracted_text":extracted_text})
frame_count += 1
else:
break
cap.release()
return video_embeddings
except Exception as e:
print(e)
# Example usage:
# video_url = "https://utfs.io/f/ef6c037f-fa61-471a-8956-562bc2d62531-fzxs1i.mp4"
# video_embeddings = get_video_embedding(video_url)
# print("Video Embeddings:", video_embeddings)