Spaces:
Sleeping
Sleeping
| from random import sample, shuffle | |
| import cv2 | |
| import numpy as np | |
| import torch | |
| from PIL import Image | |
| from torch.utils.data.dataset import Dataset | |
| from utils.utils import cvtColor, preprocess_input | |
| class YoloDataset(Dataset): | |
| def __init__(self, annotation_lines, clean_lines, input_shape, num_classes, anchors, anchors_mask, epoch_length, train): | |
| super(YoloDataset, self).__init__() | |
| self.annotation_lines = annotation_lines | |
| self.clean_lines = clean_lines | |
| self.input_shape = input_shape | |
| self.num_classes = num_classes | |
| self.anchors = anchors | |
| self.anchors_mask = anchors_mask | |
| self.epoch_length = epoch_length | |
| self.train = train | |
| self.epoch_now = -1 | |
| self.length = len(self.annotation_lines) | |
| self.bbox_attrs = 5 + num_classes | |
| def __len__(self): | |
| return self.length | |
| def __getitem__(self, index): | |
| index = index % self.length | |
| image, box, clearimg= self.get_random_data(self.annotation_lines[index],self.clean_lines[index], self.input_shape, random = self.train) | |
| image = np.transpose(preprocess_input(np.array(image, dtype=np.float32)), (2, 0, 1)) | |
| box = np.array(box, dtype=np.float32) | |
| clearimg = np.transpose(preprocess_input(np.array(clearimg, dtype=np.float32)), (2, 0, 1)) | |
| nL = len(box) | |
| labels_out = np.zeros((nL, 6)) | |
| if nL: | |
| box[:, [0, 2]] = box[:, [0, 2]] / self.input_shape[1] | |
| box[:, [1, 3]] = box[:, [1, 3]] / self.input_shape[0] | |
| box[:, 2:4] = box[:, 2:4] - box[:, 0:2] | |
| box[:, 0:2] = box[:, 0:2] + box[:, 2:4] / 2 | |
| labels_out[:, 1] = box[:, -1] | |
| labels_out[:, 2:] = box[:, :4] | |
| return image, labels_out, clearimg | |
| def rand(self, a=0, b=1): | |
| return np.random.rand()*(b-a) + a | |
| def get_random_data(self, annotation_line,clean_line, input_shape, jitter=.3, hue=.1, sat=0.7, val=0.4, random=True): | |
| line = annotation_line.split() | |
| clearline = clean_line.split() | |
| image = Image.open(line[0]) | |
| image = cvtColor(image) | |
| clearimg = Image.open(clearline[0]) | |
| clearimg = cvtColor(clearimg) | |
| iw, ih = image.size | |
| h, w = input_shape | |
| box = np.array([np.array(list(map(int,box.split(',')))) for box in line[1:]]) | |
| if not random: | |
| scale = min(w/iw, h/ih) | |
| nw = int(iw*scale) | |
| nh = int(ih*scale) | |
| dx = (w-nw)//2 | |
| dy = (h-nh)//2 | |
| image = image.resize((nw,nh), Image.BICUBIC) | |
| new_image = Image.new('RGB', (w,h), (128,128,128)) | |
| new_image.paste(image, (dx, dy)) | |
| image_data = np.array(new_image, np.float32) | |
| clearimg = clearimg.resize((nw, nh), Image.BICUBIC) | |
| new_clearimg = Image.new('RGB', (w, h), (128, 128, 128)) | |
| new_clearimg.paste(clearimg, (dx, dy)) | |
| clear_image_data = np.array(new_clearimg, np.float32) | |
| if len(box)>0: | |
| np.random.shuffle(box) | |
| box[:, [0,2]] = box[:, [0,2]]*nw/iw + dx | |
| box[:, [1,3]] = box[:, [1,3]]*nh/ih + dy | |
| box[:, 0:2][box[:, 0:2]<0] = 0 | |
| box[:, 2][box[:, 2]>w] = w | |
| box[:, 3][box[:, 3]>h] = h | |
| box_w = box[:, 2] - box[:, 0] | |
| box_h = box[:, 3] - box[:, 1] | |
| box = box[np.logical_and(box_w>1, box_h>1)] | |
| return image_data, box, clear_image_data | |
| new_ar = iw/ih * self.rand(1-jitter,1+jitter) / self.rand(1-jitter,1+jitter) | |
| scale = self.rand(.25, 2) | |
| if new_ar < 1: | |
| nh = int(scale*h) | |
| nw = int(nh*new_ar) | |
| else: | |
| nw = int(scale*w) | |
| nh = int(nw/new_ar) | |
| image = image.resize((nw,nh), Image.BICUBIC) | |
| clearimg = clearimg.resize((nw, nh), Image.BICUBIC) | |
| dx = int(self.rand(0, w-nw)) | |
| dy = int(self.rand(0, h-nh)) | |
| new_image = Image.new('RGB', (w,h), (128,128,128)) | |
| new_image.paste(image, (dx, dy)) | |
| image = new_image | |
| new_clearimg = Image.new('RGB', (w, h), (128, 128, 128)) | |
| new_clearimg.paste(clearimg, (dx, dy)) | |
| clearimg = new_clearimg | |
| flip = self.rand()<.5 | |
| if flip: | |
| image = image.transpose(Image.FLIP_LEFT_RIGHT) | |
| clearimg = clearimg.transpose(Image.FLIP_LEFT_RIGHT) | |
| image_data = np.array(image, np.uint8) | |
| clear_image_data = np.array(clearimg, np.uint8) | |
| r = np.random.uniform(-1, 1, 3) * [hue, sat, val] + 1 | |
| hue, sat, val = cv2.split(cv2.cvtColor(image_data, cv2.COLOR_RGB2HSV)) | |
| dtype = image_data.dtype | |
| hue1, sat1, val1 = cv2.split(cv2.cvtColor(clear_image_data, cv2.COLOR_RGB2HSV)) | |
| dtype1 = clear_image_data.dtype | |
| x = np.arange(0, 256, dtype=r.dtype) | |
| lut_hue = ((x * r[0]) % 180).astype(dtype) | |
| lut_sat = np.clip(x * r[1], 0, 255).astype(dtype) | |
| lut_val = np.clip(x * r[2], 0, 255).astype(dtype) | |
| x1 = np.arange(0, 256, dtype=r.dtype) | |
| lut_hue1 = ((x1 * r[0]) % 180).astype(dtype) | |
| lut_sat1 = np.clip(x1 * r[1], 0, 255).astype(dtype) | |
| lut_val1 = np.clip(x1 * r[2], 0, 255).astype(dtype) | |
| image_data = cv2.merge((cv2.LUT(hue, lut_hue), cv2.LUT(sat, lut_sat), cv2.LUT(val, lut_val))) | |
| image_data = cv2.cvtColor(image_data, cv2.COLOR_HSV2RGB) | |
| clear_image_data = cv2.merge((cv2.LUT(hue1, lut_hue1), cv2.LUT(sat1, lut_sat1), cv2.LUT(val1, lut_val1))) | |
| clear_image_data = cv2.cvtColor(clear_image_data, cv2.COLOR_HSV2RGB) | |
| if len(box)>0: | |
| np.random.shuffle(box) | |
| box[:, [0,2]] = box[:, [0,2]]*nw/iw + dx | |
| box[:, [1,3]] = box[:, [1,3]]*nh/ih + dy | |
| if flip: box[:, [0,2]] = w - box[:, [2,0]] | |
| box[:, 0:2][box[:, 0:2]<0] = 0 | |
| box[:, 2][box[:, 2]>w] = w | |
| box[:, 3][box[:, 3]>h] = h | |
| box_w = box[:, 2] - box[:, 0] | |
| box_h = box[:, 3] - box[:, 1] | |
| box = box[np.logical_and(box_w>1, box_h>1)] | |
| return image_data, box, clear_image_data | |
| def merge_bboxes(self, bboxes, cutx, cuty): | |
| merge_bbox = [] | |
| for i in range(len(bboxes)): | |
| for box in bboxes[i]: | |
| tmp_box = [] | |
| x1, y1, x2, y2 = box[0], box[1], box[2], box[3] | |
| if i == 0: | |
| if y1 > cuty or x1 > cutx: | |
| continue | |
| if y2 >= cuty and y1 <= cuty: | |
| y2 = cuty | |
| if x2 >= cutx and x1 <= cutx: | |
| x2 = cutx | |
| if i == 1: | |
| if y2 < cuty or x1 > cutx: | |
| continue | |
| if y2 >= cuty and y1 <= cuty: | |
| y1 = cuty | |
| if x2 >= cutx and x1 <= cutx: | |
| x2 = cutx | |
| if i == 2: | |
| if y2 < cuty or x2 < cutx: | |
| continue | |
| if y2 >= cuty and y1 <= cuty: | |
| y1 = cuty | |
| if x2 >= cutx and x1 <= cutx: | |
| x1 = cutx | |
| if i == 3: | |
| if y1 > cuty or x2 < cutx: | |
| continue | |
| if y2 >= cuty and y1 <= cuty: | |
| y2 = cuty | |
| if x2 >= cutx and x1 <= cutx: | |
| x1 = cutx | |
| tmp_box.append(x1) | |
| tmp_box.append(y1) | |
| tmp_box.append(x2) | |
| tmp_box.append(y2) | |
| tmp_box.append(box[-1]) | |
| merge_bbox.append(tmp_box) | |
| return merge_bbox | |
| def yolo_dataset_collate(batch): | |
| images = [] | |
| bboxes = [] | |
| clearimg = [] | |
| for i, (img, box, clear) in enumerate(batch): | |
| images.append(img) | |
| box[:, 0] = i | |
| bboxes.append(box) | |
| clearimg.append(clear) | |
| images = torch.from_numpy(np.array(images)).type(torch.FloatTensor) | |
| bboxes = torch.from_numpy(np.concatenate(bboxes, 0)).type(torch.FloatTensor) | |
| clearimg = torch.from_numpy(np.array(clearimg)).type(torch.FloatTensor) | |
| return images, bboxes, clearimg | |