Spaces:
Sleeping
Sleeping
import PIL #version 1.2.0 | |
import torch | |
import os | |
import torchvision.transforms.functional as F | |
import numpy as np | |
import random | |
def intersect(boxes1, boxes2): | |
''' | |
Find intersection of every box combination between two sets of box | |
boxes1: bounding boxes 1, a tensor of dimensions (n1, 4) | |
boxes2: bounding boxes 2, a tensor of dimensions (n2, 4) | |
Out: Intersection each of boxes1 with respect to each of boxes2, | |
a tensor of dimensions (n1, n2) | |
''' | |
n1 = boxes1.size(0) | |
n2 = boxes2.size(0) | |
max_xy = torch.min(boxes1[:, 2:].unsqueeze(1).expand(n1, n2, 2), | |
boxes2[:, 2:].unsqueeze(0).expand(n1, n2, 2)) | |
min_xy = torch.max(boxes1[:, :2].unsqueeze(1).expand(n1, n2, 2), | |
boxes2[:, :2].unsqueeze(0).expand(n1, n2, 2)) | |
inter = torch.clamp(max_xy - min_xy , min=0) # (n1, n2, 2) | |
return inter[:, :, 0] * inter[:, :, 1] #(n1, n2) | |
def find_IoU(boxes1, boxes2): | |
''' | |
Find IoU between every boxes set of boxes | |
boxes1: a tensor of dimensions (n1, 4) (left, top, right , bottom) | |
boxes2: a tensor of dimensions (n2, 4) | |
Out: IoU each of boxes1 with respect to each of boxes2, a tensor of | |
dimensions (n1, n2) | |
Formula: | |
(box1 ∩ box2) / (box1 u box2) = (box1 ∩ box2) / (area(box1) + area(box2) - (box1 ∩ box2 )) | |
''' | |
inter = intersect(boxes1, boxes2) | |
area_boxes1 = (boxes1[:, 2] - boxes1[:, 0]) * (boxes1[:, 3] - boxes1[:, 1]) | |
area_boxes2 = (boxes2[:, 2] - boxes2[:, 0]) * (boxes2[:, 3] - boxes2[:, 1]) | |
area_boxes1 = area_boxes1.unsqueeze(1).expand_as(inter) #(n1, n2) | |
area_boxes2 = area_boxes2.unsqueeze(0).expand_as(inter) #(n1, n2) | |
union = (area_boxes1 + area_boxes2 - inter) | |
return inter / union | |
def random_crop(image, boxes, labels, difficulties=None): | |
''' | |
image: A PIL image | |
boxes: Bounding boxes, a tensor of dimensions (#objects, 4) | |
labels: labels of object, a tensor of dimensions (#objects) | |
difficulties: difficulties of detect object, a tensor of dimensions (#objects) | |
Out: cropped image , new boxes, new labels, new difficulties | |
''' | |
if type(image) == PIL.Image.Image: | |
image = F.to_tensor(image) | |
original_h = image.size(1) | |
original_w = image.size(2) | |
while True: | |
mode = random.choice([0.1, 0.3, 0.5, 0.9, None]) | |
if mode is None: | |
return F.to_pil_image(image), boxes, labels, difficulties | |
new_image = image | |
new_boxes = boxes | |
new_difficulties = difficulties | |
new_labels = labels | |
for _ in range(50): | |
# Crop dimensions: [0.3, 1] of original dimensions | |
new_h = random.uniform(0.3*original_h, original_h) | |
new_w = random.uniform(0.3*original_w, original_w) | |
# Aspect ratio constraint b/t .5 & 2 | |
if new_h/new_w < 0.5 or new_h/new_w > 2: | |
continue | |
#Crop coordinate | |
left = random.uniform(0, original_w - new_w) | |
right = left + new_w | |
top = random.uniform(0, original_h - new_h) | |
bottom = top + new_h | |
crop = torch.FloatTensor([int(left), int(top), int(right), int(bottom)]) | |
# Calculate IoU between the crop and the bounding boxes | |
overlap = find_IoU(crop.unsqueeze(0), boxes) #(1, #objects) | |
overlap = overlap.squeeze(0) | |
# If not a single bounding box has a IoU of greater than the minimum, try again | |
if overlap.shape[0] == 0: | |
continue | |
if overlap.max().item() < mode: | |
continue | |
#Crop | |
new_image = image[:, int(top):int(bottom), int(left):int(right)] #(3, new_h, new_w) | |
#Center of bounding boxes | |
center_bb = (boxes[:, :2] + boxes[:, 2:])/2.0 | |
#Find bounding box has been had center in crop | |
center_in_crop = (center_bb[:, 0] >left) * (center_bb[:, 0] < right | |
) *(center_bb[:, 1] > top) * (center_bb[:, 1] < bottom) #( #objects) | |
if not center_in_crop.any(): | |
continue | |
#take matching bounding box | |
new_boxes = boxes[center_in_crop, :] | |
#take matching labels | |
new_labels = labels[center_in_crop] | |
#take matching difficulities | |
if difficulties is not None: | |
new_difficulties = difficulties[center_in_crop] | |
else: | |
new_difficulties = None | |
#Use the box left and top corner or the crop's | |
new_boxes[:, :2] = torch.max(new_boxes[:, :2], crop[:2]) | |
#adjust to crop | |
new_boxes[:, :2] -= crop[:2] | |
new_boxes[:, 2:] = torch.min(new_boxes[:, 2:],crop[2:]) | |
#adjust to crop | |
new_boxes[:, 2:] -= crop[:2] | |
return F.to_pil_image(new_image), new_boxes, new_labels, new_difficulties |