Added functionality to use SSD with COCO data set

Signed-off-by: Jim Martens <github@2martens.de>
2019-07-23 11:21:06 +02:00
parent e20167182f
commit d6047665ef
3 changed files with 177 additions and 14 deletions

View File

@@ -227,6 +227,7 @@ def _ssd_test(args: argparse.Namespace) -> None:
batch_size, image_size, learning_rate, \
forward_passes_per_image, nr_classes, iou_threshold, dropout_rate, \
use_entropy_threshold, entropy_threshold_min, entropy_threshold_max, \
use_coco, \
top_k, nr_trajectories, test_pretrained, \
coco_path, output_path, weights_path, ground_truth_path = _ssd_test_get_config_values(args, conf.get_property)
@@ -252,6 +253,8 @@ def _ssd_test(args: argparse.Namespace) -> None:
ssd.compile_model(ssd_model, learning_rate, loss_func)
test_generator, length_dataset, test_debug_generator = _ssd_test_get_generators(args,
use_coco,
data.load_coco_val_ssd,
data.load_scenenet_data,
file_names,
instances,
@@ -531,6 +534,7 @@ def _ssd_test_get_config_values(args: argparse.Namespace,
config_get: Callable[[str], Union[str, float, int, bool]]
) -> Tuple[int, int, float, int, int, float, float,
bool, float, float,
bool,
int, int, bool,
str, str, str, str]:
@@ -544,6 +548,7 @@ def _ssd_test_get_config_values(args: argparse.Namespace,
use_entropy_threshold = config_get("Parameters.ssd_use_entropy_threshold")
entropy_threshold_min = config_get("Parameters.ssd_entropy_threshold_min")
entropy_threshold_max = config_get("Parameters.ssd_entropy_threshold_max")
use_coco = config_get("Parameters.ssd_use_coco")
top_k = config_get("Parameters.ssd_top_k")
nr_trajectories = config_get("Parameters.nr_trajectories")
test_pretrained = config_get("Parameters.ssd_test_pretrained")
@@ -569,6 +574,8 @@ def _ssd_test_get_config_values(args: argparse.Namespace,
entropy_threshold_min,
entropy_threshold_max,
#
use_coco,
#
top_k,
nr_trajectories,
test_pretrained,
@@ -798,7 +805,9 @@ def _ssd_train_get_generators(args: argparse.Namespace,
def _ssd_test_get_generators(args: argparse.Namespace,
load_data: callable,
use_coco: bool,
load_data_coco: callable,
load_data_scenenet: callable,
file_names: Sequence[Sequence[str]],
instances: Sequence[Sequence[Sequence[dict]]],
coco_path: str,
@@ -807,10 +816,21 @@ def _ssd_test_get_generators(args: argparse.Namespace,
nr_trajectories: int,
predictor_sizes: Sequence[Sequence[int]]) -> Tuple[Generator, int, Generator]:
from twomartens.masterthesis import data
if nr_trajectories == -1:
nr_trajectories = None
generator, length, debug_generator = load_data(file_names, instances, coco_path,
if use_coco:
generator, length, debug_generator = load_data_coco(data.clean_dataset,
data.group_bboxes_to_images,
coco_path,
batch_size,
image_size,
training=False, evaluation=True, augment=False,
debug=args.debug)
else:
generator, length, debug_generator = load_data_scenenet(file_names, instances, coco_path,
predictor_sizes=predictor_sizes,
batch_size=batch_size,
image_size=image_size,

View File

@@ -63,6 +63,7 @@ _CONFIG_PROPS = {
"ssd_entropy_threshold_min": (float, "0.1"),
"ssd_entropy_threshold_max": (float, "2.5"),
"ssd_test_pretrained": (bool, "False"),
"ssd_use_coco": (bool, "False"),
"nr_trajectories": (int, "-1")
}
}
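
For context, a minimal self-contained sketch of the type coercion that _CONFIG_PROPS implies, with a hypothetical stand-in accessor (the real accessor, conf.get_property, is not part of this diff):

# Sketch only: each property maps to (type, default-as-string), so bool
# defaults need explicit parsing because bool("False") evaluates to True.
_CONFIG_PROPS = {"Parameters": {"ssd_use_coco": (bool, "False")}}

def config_get(prop: str):  # hypothetical stand-in for conf.get_property
    section, key = prop.split(".")
    prop_type, default = _CONFIG_PROPS[section][key]
    if prop_type is bool:
        return default == "True"
    return prop_type(default)

assert config_get("Parameters.ssd_use_coco") is False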

View File

@@ -78,7 +78,7 @@ def load_coco_train(data_path: str, category: int,
file_names.update(file_names_val)
ids_to_images = {image['id']: image for image in images}
checked_file_names, checked_bboxes = _clean_dataset(annotations, file_names, ids_to_images)
checked_file_names, checked_bboxes = clean_dataset(annotations, file_names, ids_to_images)
length_dataset = len(checked_file_names)
# build image data set
@@ -119,7 +119,7 @@ def load_coco_val(data_path: str, category: int,
file_names = {image['id']: f"{data_path}/val2014/{image['file_name']}" for image in images}
ids_to_images = {image['id']: image for image in images}
checked_file_names, checked_bboxes = _clean_dataset(annotations, file_names, ids_to_images)
checked_file_names, checked_bboxes = clean_dataset(annotations, file_names, ids_to_images)
length_dataset = len(checked_file_names)
# build image data set
@@ -133,7 +133,7 @@ def load_coco_val(data_path: str, category: int,
return dataset
def _clean_dataset(annotations: Sequence[dict], file_names: Mapping[str, str],
def clean_dataset(annotations: Sequence[dict], file_names: Mapping[str, str],
ids_to_images: Mapping[str, dict]) -> Tuple[List[str], List[List[float]]]:
"""
Removes problematic cases from a given data set and returns the cleaned version.
@@ -152,7 +152,7 @@ def _clean_dataset(annotations: Sequence[dict], file_names: Mapping[str, str],
img_id = annotation['image_id']
image = ids_to_images[img_id]
file_name = file_names[img_id]
bbox = annotation['bbox']
bbox = annotation['bbox'] # type: List[float]
target_height = round(bbox[3])
target_width = round(bbox[2])
image_width, image_height = image['width'], image['height']
@@ -178,9 +178,16 @@ def _clean_dataset(annotations: Sequence[dict], file_names: Mapping[str, str],
continue
bbox[2] = target_width
bbox[3] = target_height
new_bbox = [
annotation['category_id'],
x1,
y1,
round(bbox[0] + bbox[2]),
round(bbox[1] + bbox[3])
]
checked_file_names.append(file_name)
checked_bboxes.append(bbox)
checked_bboxes.append(new_bbox)
return checked_file_names, checked_bboxes
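
A worked example of the new corner conversion (values are made up; x1 and y1 are the rounded top-left coordinates computed in context lines not shown in this hunk):

# COCO stores a bbox as [x, y, width, height]; the new code emits
# [category_id, x1, y1, x2, y2] with rounded corner coordinates.
bbox = [10.2, 20.7, 30.0, 40.0]   # x, y, w, h from a hypothetical annotation
category_id = 18                   # hypothetical COCO category
x1, y1 = round(bbox[0]), round(bbox[1])                      # 10, 21
x2, y2 = round(bbox[0] + bbox[2]), round(bbox[1] + bbox[3])  # 40, 61
new_bbox = [category_id, x1, y1, x2, y2]
assert new_bbox == [18, 10, 21, 40, 61]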
@@ -232,6 +239,141 @@ def _load_images_callback(resized_shape: Sequence[int]) -> Callable[
return _load_images
def group_bboxes_to_images(file_names: Sequence[str], bboxes: Sequence[Sequence[int]]) -> Tuple[List[str],
List[List[List[int]]]]:
return_labels = {}
for file_name, bbox in zip(file_names, bboxes):
if file_name not in return_labels:
return_labels[file_name] = []
return_labels[file_name].append(bbox)
return list(return_labels.keys()), list(return_labels.values())
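
A small illustration of the grouping helper with made-up values; dict insertion order is preserved in Python 3.7+, so the output order follows the first occurrence of each file name:

file_names = ["img1.jpg", "img1.jpg", "img2.jpg"]
bboxes = [[1, 0, 0, 10, 10], [2, 5, 5, 20, 20], [1, 3, 3, 8, 8]]
names, labels = group_bboxes_to_images(file_names, bboxes)
# names  == ["img1.jpg", "img2.jpg"]
# labels == [[[1, 0, 0, 10, 10], [2, 5, 5, 20, 20]], [[1, 3, 3, 8, 8]]]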
def load_coco_val_ssd(clean_dataset: callable,
group_bboxes_to_images: callable,
coco_path: str,
batch_size: int,
image_size: int,
training: bool,
evaluation: bool,
augment: bool,
debug: bool,
predictor_sizes: Optional[np.ndarray] = None) -> Tuple[Generator, int, Optional[Generator]]:
"""
Loads the COCO minival2014/val2017 data and returns a data set.
Args:
clean_dataset: function that cleans the data set
group_bboxes_to_images: function that groups bounding boxes to corresponding file name
coco_path: path to the COCO data set
batch_size: batch size
image_size: size of images after resizing them
training: True if training data is desired
evaluation: True if evaluation-ready data is desired
augment: True if training data should be augmented
debug: True if a more extensive generator should be added to output
predictor_sizes: sizes of the predictor layers, can be None for evaluation
Returns:
coco data set generator
length of dataset
generator which offers processed_labels as well (only if debug is True)
"""
from pycocotools import coco
from twomartens.masterthesis.ssd_keras.eval_utils import coco_utils
annotation_file_minival = f"{coco_path}/annotations/instances_minival2014.json"
resized_shape = (image_size, image_size)
coco_val = coco.COCO(annotation_file_minival)
img_ids = coco_val.getImgIds()  # return all image IDs in the validation set
images = coco_val.loadImgs(img_ids) # load all images
annotation_ids = coco_val.getAnnIds(img_ids)
annotations = coco_val.loadAnns(annotation_ids) # load all image annotations
file_names = {image['id']: f"{coco_path}/val2014/{image['file_name']}" for image in images}
ids_to_images = {image['id']: image for image in images}
annotation_file_train = f"{coco_path}/annotations/instances_train2014.json"
cats_to_classes, _, _, _ = coco_utils.get_coco_category_maps(annotation_file_train)
checked_image_paths, checked_bboxes = clean_dataset(annotations, file_names, ids_to_images)
final_image_paths, final_labels = group_bboxes_to_images(checked_image_paths, checked_bboxes)
data_generator = object_detection_2d_data_generator.DataGenerator(
filenames=final_image_paths,
labels=final_labels
)
shuffle = training
if training and augment:
transformations = [data_augmentation_chain_original_ssd.SSDDataAugmentation(
img_width=resized_shape[0],
img_height=resized_shape[1]
)]
else:
transformations = [
object_detection_2d_photometric_ops.ConvertTo3Channels(),
object_detection_2d_geometric_ops.Resize(height=resized_shape[0],
width=resized_shape[1])
]
returns = {'processed_images', 'encoded_labels'}
returns_debug = {'processed_images', 'encoded_labels', 'processed_labels'}
if not training and evaluation:
returns = {
'processed_images',
'filenames',
'inverse_transform',
'original_labels'}
label_encoder = None
else:
if predictor_sizes is None:
raise ValueError("predictor_sizes cannot be None for training/validation")
label_encoder = ssd_input_encoder.SSDInputEncoder(
img_height=resized_shape[0],
img_width=resized_shape[1],
n_classes=len(cats_to_classes), # 80
predictor_sizes=predictor_sizes,
steps=[8, 16, 32, 64, 100, 300],
coords="corners",
aspect_ratios_per_layer=[[1.0, 2.0, 0.5],
[1.0, 2.0, 0.5, 3.0, 1.0 / 3.0],
[1.0, 2.0, 0.5, 3.0, 1.0 / 3.0],
[1.0, 2.0, 0.5, 3.0, 1.0 / 3.0],
[1.0, 2.0, 0.5],
[1.0, 2.0, 0.5]]
)
if debug:
debug_generator = data_generator.generate(
batch_size=batch_size,
shuffle=shuffle,
transformations=transformations,
label_encoder=label_encoder,
returns=returns_debug,
keep_images_without_gt=False
)
else:
debug_generator = None
length_dataset = data_generator.dataset_size
generator = data_generator.generate(
batch_size=batch_size,
shuffle=shuffle,
transformations=transformations,
label_encoder=label_encoder,
returns=returns,
keep_images_without_gt=False
)
return generator, length_dataset, debug_generator
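
A hedged usage sketch of the new loader in evaluation mode (the COCO path is a placeholder; predictor_sizes may stay None because the evaluation branch skips the SSD input encoder):

from twomartens.masterthesis import data

generator, length, debug_gen = data.load_coco_val_ssd(
    data.clean_dataset,
    data.group_bboxes_to_images,
    coco_path="/path/to/coco",   # placeholder
    batch_size=32,
    image_size=300,
    training=False,
    evaluation=True,
    augment=False,
    debug=False,                 # debug_gen will be None
    predictor_sizes=None,        # only needed for training/validation
)
batch = next(generator)  # processed images, filenames, inverse transforms, original labels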
def load_scenenet_data(photo_paths: Sequence[Sequence[str]],
instances: Sequence[Sequence[Sequence[dict]]],
coco_path: str,