# PICS / datasets / cityscapes.py
# Hang Zhou
# Upload folder using huggingface_hub
# 0103f17 verified
import cv2
import numpy as np
import os
from PIL import Image
from .data_utils import *
from .base import BaseDataset
import PIL.ImageDraw as ImageDraw
from util.box_ops import mask_to_bbox_xywh, compute_iou_matrix, draw_bboxes
from util.cityscapes_ops import Annotation, name2label
from pathlib import Path
import shutil
# Debug switch: when True, `CityscapesDataset._intersect_2_obj` additionally
# writes "bboxes_image.png" and "highlighted_image.png" visualisations into
# each sample directory.
IS_VERIFY = False
class CityscapesDataset(BaseDataset):
    """Two-object samples built from Cityscapes vehicle polygons.

    `_intersect_2_obj` converts one Cityscapes frame into a sample directory
    (scene image plus masks/patches of the two most-overlapping vehicles);
    `_get_sample` reads such a directory back and builds a collage from it.

    NOTE(review): `get_patch` and `_construct_collage` are not defined in this
    class; presumably they are inherited from `BaseDataset` — confirm.
    """

    # Label ids kept as candidate objects (car / truck / bus).
    _VEHICLE_IDS = (26, 27, 28)
    # File-name suffix of the polygon annotation files.
    _JSON_SUFFIX = '_gtFine_polygons.json'

    def __init__(self, construct_dataset_dir, obj_thr=20, area_ratio=0.02):
        """Create the output directory if needed and snapshot its entries.

        Args:
            construct_dataset_dir: Directory holding one sub-directory per
                constructed sample.
            obj_thr: Stored on the instance; not used by this class itself.
            area_ratio: Minimum object area, as a fraction of the image area,
                for an object to be considered by `_intersect_2_obj`.
        """
        self.obj_thr = obj_thr
        self.construct_dataset_dir = construct_dataset_dir
        os.makedirs(Path(self.construct_dataset_dir), exist_ok=True)
        self.area_ratio = area_ratio
        # Sorted so that a sample index refers to the same directory on every
        # run; os.listdir() returns entries in arbitrary order.
        self.sample_list = sorted(os.listdir(self.construct_dataset_dir))

    def _vehicle_polygons(self, annotation):
        """Return the polygons of all car/truck/bus objects, in annotation order."""
        polygons = []
        for obj in annotation.objects:
            label = obj.label
            # "<class>group" annotations are folded into their base class.
            if label not in name2label and label.endswith('group'):
                label = label[:-len('group')]
            # Labels that are still unknown cannot be vehicles; skip them
            # instead of failing on the lookup below.
            if label not in name2label:
                continue
            if name2label[label].id in self._VEHICLE_IDS:
                polygons.append(obj.polygon)
        return polygons

    @staticmethod
    def _polygon_mask(polygon, size, background):
        """Rasterise `polygon` onto a `size` canvas; return its first channel.

        Pixels inside the polygon are 255; all others carry the first
        component of `background`.
        """
        canvas = Image.new("RGBA", size, background)
        ImageDraw.Draw(canvas).polygon(polygon, fill=(255, 255, 255))
        return np.ascontiguousarray(np.array(canvas)[:, :, 0])

    def _intersect_2_obj(self, image_dir, json_dir, idx):
        """Build one two-object sample from the `idx`-th annotation file.

        Among the vehicles whose mask area exceeds
        `area_ratio * image_area`, the pair of bounding boxes with the
        highest IoU is selected. If that IoU is positive, the following files
        are written to `<construct_dataset_dir>/<image_name>/`:
        `image.jpg`, `object_0_mask.png`, `object_0.png`,
        `object_1_mask.png` and `object_1.png`. When `IS_VERIFY` is true,
        `bboxes_image.png` and `highlighted_image.png` are written as well.

        The frame is skipped (with an info message) when the index is out of
        range, the image cannot be read, fewer than two vehicles are large
        enough, or no two bounding boxes overlap.

        Args:
            image_dir: Directory containing `<name>_leftImg8bit.png` images.
            json_dir: Directory containing `<name>_gtFine_polygons.json` files.
            idx: Position in the sorted list of annotation files.
        """
        json_list = sorted(
            name for name in os.listdir(json_dir)
            if name.endswith(self._JSON_SUFFIX)
        )
        try:
            json_name = json_list[idx]
        except IndexError:
            print(f"[Info] Skip index {idx}: only {len(json_list)} annotation files found.")
            return
        image_name = json_name[:-len(self._JSON_SUFFIX)]

        image_path = os.path.join(image_dir, image_name + '_leftImg8bit.png')
        image = cv2.imread(image_path)
        if image is None:
            print(f"[Info] Skip image index {image_name} due to unreadable image.")
            return
        image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)

        annotation = Annotation()
        annotation.fromJsonFile(os.path.join(json_dir, json_name))
        size = (annotation.imgWidth, annotation.imgHeight)
        min_area = size[0] * size[1] * self.area_ratio

        # the background
        background = name2label['unlabeled'].color

        # (polygon, bbox_xywh) of every vehicle that is large enough.
        candidates = []
        for polygon in self._vehicle_polygons(annotation):
            mask = self._polygon_mask(polygon, size, background)
            if np.sum(mask / 255) > min_area:
                candidates.append((polygon, mask_to_bbox_xywh(mask)))

        if len(candidates) < 2:
            print(f"[Info] Skip image index {image_name} due to insufficient bbox.")
            return

        # filter by IOU
        bbox_xyxy = np.array(
            [[x, y, x + w, y + h] for _, (x, y, w, h) in candidates]
        )  # shape: [N, 4]

        sample_dir = Path(self.construct_dataset_dir) / image_name

        if IS_VERIFY:
            sample_dir.mkdir(parents=True, exist_ok=True)
            image_with_boxes = draw_bboxes(image, bbox_xyxy)
            cv2.imwrite(str(sample_dir / "bboxes_image.png"),
                        cv2.cvtColor(image_with_boxes, cv2.COLOR_RGB2BGR))

        iou_matrix = compute_iou_matrix(bbox_xyxy)
        # Exclude self-comparisons (i.e., each box with itself)
        np.fill_diagonal(iou_matrix, -1)
        index0, index1 = np.unravel_index(np.argmax(iou_matrix), iou_matrix.shape)
        if iou_matrix[index0, index1] <= 0:
            print(f"[Info] Skip image index {image_name} due to no overlapping bboxes.")
            return

        sample_dir.mkdir(parents=True, exist_ok=True)
        # Byte-for-byte copy of the source PNG; only the file name says ".jpg".
        shutil.copy(image_path, sample_dir / "image.jpg")

        # `image` is RGB here, so channel 0 is red and channel 2 is blue.
        selected = ((0, index0, 0), (1, index1, 2))
        for slot, cand_idx, highlight_channel in selected:
            mask_u8 = self._polygon_mask(candidates[cand_idx][0], size, background)
            # Written as uint8 explicitly rather than as a float array.
            cv2.imwrite(str(sample_dir / f"object_{slot}_mask.png"), mask_u8)

            patch = self.get_patch(image, mask_u8 / 255)
            patch = cv2.cvtColor(patch, cv2.COLOR_RGB2BGR)
            cv2.imwrite(str(sample_dir / f"object_{slot}.png"), patch)

            if IS_VERIFY:
                # Tint the object's pixels: red for object 0, blue for object 1.
                mask_color = np.stack([mask_u8] * 3, axis=-1)
                highlight = np.zeros_like(image)
                highlight[:, :, highlight_channel] = 255
                alpha = 0.5
                blended = cv2.addWeighted(image_with_boxes, 1 - alpha, highlight, alpha, 0)
                image_with_boxes = np.where(mask_color == 255, blended, image_with_boxes)

        if IS_VERIFY:
            cv2.imwrite(str(sample_dir / "highlighted_image.png"),
                        cv2.cvtColor(image_with_boxes, cv2.COLOR_RGB2BGR))

    def _get_sample(self, idx):
        """Load the `idx`-th constructed sample and return its collage.

        Reads `image.jpg`, `object_0.png` and `object_1.png` (converted from
        BGR to RGB) and the two `object_*_mask.png` files (as grayscale), then
        returns the result of `self._construct_collage` on them.
        """
        sample_path = os.path.join(self.construct_dataset_dir, self.sample_list[idx])

        def read_rgb(file_name):
            bgr = cv2.imread(os.path.join(sample_path, file_name))
            return cv2.cvtColor(bgr, cv2.COLOR_BGR2RGB)

        def read_gray(file_name):
            return cv2.imread(os.path.join(sample_path, file_name), cv2.IMREAD_GRAYSCALE)

        image = read_rgb("image.jpg")
        object_0 = read_rgb("object_0.png")
        object_1 = read_rgb("object_1.png")
        mask_0 = read_gray("object_0_mask.png")
        mask_1 = read_gray("object_1_mask.png")
        collage = self._construct_collage(image, object_0, object_1, mask_0, mask_1)
        return collage

    def __len__(self):
        """Return the current number of entries in `construct_dataset_dir`.

        This is a live directory listing, whereas `_get_sample` indexes the
        snapshot taken in `__init__`.
        """
        return len(os.listdir(self.construct_dataset_dir))
if __name__ == "__main__":
    # two-object case: train/test: 536/78
    import argparse

    cli = argparse.ArgumentParser(description="CityscapesDataset Analysis")
    cli.add_argument("--dataset_dir", type=str, required=True, help="Path to the dataset directory.")
    cli.add_argument("--construct_dataset_dir", type=str, default='bin', help="Path to the debug bin directory.")
    cli.add_argument("--dataset_name", type=str, default='Cityscapes', help="Dataset name.")
    cli.add_argument('--is_train', action='store_true', help="Train/Test")
    cli.add_argument('--is_build_data', action='store_true', help="Build data")
    cli.add_argument('--is_multiple', action='store_true', help="Multiple/Two objects")
    cli.add_argument("--area_ratio", type=float, default=0.01171, help="Area ratio for filtering out small objects.")
    cli.add_argument("--obj_thr", type=int, default=20, help="Object threshold for filtering.")
    cli.add_argument("--index", type=int, default=0, help="Index of the sample to test.")
    args = cli.parse_args()

    # Pick the split directory and the number of frames to walk through.
    split_name, max_num = ("train", 2975) if args.is_train else ("val", 500)
    split_root = Path(args.dataset_dir) / args.dataset_name / split_name
    image_dir = split_root / "images"
    json_dir = split_root / "jsons"

    dataset = CityscapesDataset(
        construct_dataset_dir=args.construct_dataset_dir,
        obj_thr=args.obj_thr,
        area_ratio=args.area_ratio,
    )

    # NOTE(review): the source's indentation was lost; the final `else` is
    # taken to pair with `if args.is_build_data` (build vs. load) — confirm.
    if not args.is_build_data:
        # Load mode: read every constructed sample back once.
        for index in range(len(os.listdir(args.construct_dataset_dir))):
            collage = dataset._get_sample(index)
    elif not args.is_multiple:
        # Build mode, two-object case.
        for index in range(max_num):
            dataset._intersect_2_obj(image_dir, json_dir, index)