AI-based_security_risk_identification_and_prevention_applications

Paused

App Files Files Community

qsitj committed 9 days ago

Commit

fd08bcf

verified ·

1 Parent(s): aae3e7a

Update app.py

Browse files

Files changed (1) hide show

app.py +39 -10

app.py CHANGED Viewed

@@ -1,7 +1,7 @@
 import gradio as gr
 import cv2
 import numpy as np
-from PIL import Image,ImageDraw
 from transformers import pipeline
 import torch
 from random import choice
@@ -28,9 +28,27 @@ label_color_dict = {}
 def query_data(in_pil_img: Image.Image):
     results = detector(in_pil_img)
-    # print(f"检测结果：{results}")
     return results
 def get_annotated_image(in_pil_img):
     draw = ImageDraw.Draw(in_pil_img)
     in_results = query_data(in_pil_img)
@@ -40,23 +58,34 @@ def get_annotated_image(in_pil_img):
         label = prediction['label']
         score = round(prediction['score'] * 100, 1)
         if score < 50:
-            continue # 过滤掉低置信度的预测结果
-        if label not in label_color_dict: # 为每个类别随机分配颜色, 后续维持一致
             color = choice(COLORS)
             label_color_dict[label] = color
         else:
             color = label_color_dict[label]
         # 绘制矩形
         draw.rectangle([box['xmin'], box['ymin'], box['xmax'], box['ymax']], outline=color, width=3)
         # 添加文本
-        draw.text((box['xmin'], box['ymin']), f"{label}: {score}%", fill=color, fontdict=fdic)
     # 返回的是原始图像对象，它已经被修改了
     return np.array(in_pil_img.convert('RGB'))
 def process_video(input_video_path):
     cap = cv2.VideoCapture(input_video_path)
     if not cap.isOpened():
@@ -74,7 +103,7 @@ def process_video(input_video_path):
     timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
     output_video_filename = f"output_{timestamp}.mp4"
     output_video_path = os.path.join(output_dir, output_video_filename)
-    # print(f"输出视频信息：{output_video_path}, {width}x{height}, {fps}fps")
     out = cv2.VideoWriter(output_video_path, fourcc, fps, (width, height))
     while True:
@@ -84,15 +113,15 @@ def process_video(input_video_path):
         rgb_frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
         pil_image = Image.fromarray(rgb_frame)
-        # print(f"Input frame of shape {rgb_frame.shape} and type {rgb_frame.dtype}")  # 调试信息
         annotated_frame = get_annotated_image(pil_image)
         bgr_frame = cv2.cvtColor(annotated_frame, cv2.COLOR_RGB2BGR)
-        # print(f"Annotated frame of shape {bgr_frame.shape} and type {bgr_frame.dtype}")  # 调试信息
         # 确保帧的尺寸与视频输出一致
         if bgr_frame.shape[:2] != (height, width):
             bgr_frame = cv2.resize(bgr_frame, (width, height))
-        # print(f"Writing frame of shape {bgr_frame.shape} and type {bgr_frame.dtype}")  # 调试信息
         out.write(bgr_frame)
     cap.release()

 import gradio as gr
 import cv2
 import numpy as np
+from PIL import Image,ImageDraw, ImageFont
 from transformers import pipeline
 import torch
 from random import choice
 def query_data(in_pil_img: Image.Image):
     """Run the detector on a single PIL image and return its predictions.

     The image is handed unchanged to the ``detector`` callable defined
     elsewhere in this file; whatever it returns is printed for debugging
     and then passed straight back to the caller.
     """
     detections = detector(in_pil_img)
     # Debug output: dump the detector's raw predictions to stdout.
     print(f"检测结果：{detections}")
     return detections
def get_font_size(box_width, min_size=10, max_size=48, *, floor_size=24):
    """Pick a label font size proportional to a bounding box's width.

    The raw size is one tenth of ``box_width`` (truncated to an int), raised
    to at least ``floor_size``, and finally clamped to
    ``[min_size, max_size]``.

    Args:
        box_width: Width of the bounding box.
        min_size: Lower clamp, applied last (so it wins over ``max_size``
            if the two conflict).
        max_size: Upper clamp on the font size.
        floor_size: Smallest size considered before clamping. This used to
            be a hard-coded 24, which silently made any ``min_size`` below
            24 ineffective; the default keeps that behaviour, and callers
            may pass a smaller value to allow smaller text on narrow boxes.

    Returns:
        The chosen font size.
    """
    # Scale with the box width, but never start below the configured floor.
    scaled = max(floor_size, int(box_width / 10))
    return max(min(scaled, max_size), min_size)
def get_text_position(box, text_bbox):
    """Return the (x, y) position at which to draw a bounding box's label.

    The label is placed directly above the box when it fits inside the
    image (its top would not go above y = 0); otherwise it is placed at the
    box's top-left corner, i.e. inside the box.

    Args:
        box: Mapping that provides at least the 'xmin' and 'ymin' keys.
        text_bbox: Sequence ``(left, top, right, bottom)`` describing the
            rendered text's bounding box; only its height is used.

    Returns:
        A tuple ``(x, y)`` for the text's top-left corner.
    """
    xmin, ymin = box['xmin'], box['ymin']
    text_height = text_bbox[3] - text_bbox[1]
    above_y = ymin - text_height
    if above_y >= 0:
        return (xmin, above_y)  # enough room: draw above the box
    return (xmin, ymin)  # not enough room: draw inside the box
 def get_annotated_image(in_pil_img):
     draw = ImageDraw.Draw(in_pil_img)
     in_results = query_data(in_pil_img)
         label = prediction['label']
         score = round(prediction['score'] * 100, 1)
         if score < 50:
+            continue  # 过滤掉低置信度的预测结果
+        if label not in label_color_dict:  # 为每个类别随机分配颜色, 后续维持一致
             color = choice(COLORS)
             label_color_dict[label] = color
         else:
             color = label_color_dict[label]
+        # 计算字体大小
+        box_width = box['xmax'] - box['xmin']
+        font_size = get_font_size(box_width)
+        font = ImageFont.truetype("arial.ttf", size=font_size)  # 确保你有可用的字体文件
+        # 获取文本边界框
+        text = f"{label}: {score}%"
+        text_bbox = draw.textbbox((0, 0), text, font=font)
         # 绘制矩形
         draw.rectangle([box['xmin'], box['ymin'], box['xmax'], box['ymax']], outline=color, width=3)
         # 添加文本
+        text_pos = get_text_position(box, text_bbox)
+        draw.text(text_pos, text, fill=color, font=font)
     # 返回的是原始图像对象，它已经被修改了
     return np.array(in_pil_img.convert('RGB'))
 def process_video(input_video_path):
     cap = cv2.VideoCapture(input_video_path)
     if not cap.isOpened():
     timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
     output_video_filename = f"output_{timestamp}.mp4"
     output_video_path = os.path.join(output_dir, output_video_filename)
+    print(f"输出视频信息：{output_video_path}, {width}x{height}, {fps}fps")
     out = cv2.VideoWriter(output_video_path, fourcc, fps, (width, height))
     while True:
         rgb_frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
         pil_image = Image.fromarray(rgb_frame)
+        print(f"Input frame of shape {rgb_frame.shape} and type {rgb_frame.dtype}")  # 调试信息
         annotated_frame = get_annotated_image(pil_image)
         bgr_frame = cv2.cvtColor(annotated_frame, cv2.COLOR_RGB2BGR)
+        print(f"Annotated frame of shape {bgr_frame.shape} and type {bgr_frame.dtype}")  # 调试信息
         # 确保帧的尺寸与视频输出一致
         if bgr_frame.shape[:2] != (height, width):
             bgr_frame = cv2.resize(bgr_frame, (width, height))
+        print(f"Writing frame of shape {bgr_frame.shape} and type {bgr_frame.dtype}")  # 调试信息
         out.write(bgr_frame)
     cap.release()