Source code for tests.test_yolo_inference

"""
Inference tests using weights of pretrained YOLOv5
"""

import matplotlib.pyplot as plt
import numpy as np

from inet.data.load_dataset import directory_to_two_in_one_dataset
from inet.losses.giou_loss import GIoULoss
from inet.models.data_structures import BoundingBox
from inet.models.tf_lite.tflite_methods import evaluate_interpreted_model
from tests.helper import Timer, build_tf_model_from_file


def filter_classes(classes_in):
    """
    Transforms one-hot-encoded predictions into class indices.

    Every entry along the first axis is treated as one sample and is reduced
    to the index of its largest value.

    :param classes_in: one-hot-encoded predictions, one row per sample
    :return: list holding one class index per sample
    """
    # The argmax must be taken per row: calling it on the whole array returns
    # a single index into the flattened array, repeated for every sample.
    return [row.argmax() for row in np.asarray(classes_in)]


def process_best_prediction(prediction, conf_threshold=0.25):
    """
    Select best prediction for each sample

    Each element of `prediction` is indexed with `[0]` to obtain a 2D array of
    candidates. Rows are read as `[x_mid, y_mid, w, h, confidence, class scores...]`,
    which matches how the evaluation script in this module slices the model
    output (column 4 is the confidence, columns 5 and up are the classes).

    :param prediction: iterable holding performed predictions
    :param conf_threshold: minimum confidence a candidate needs to be considered
    :return: The best prediction for each input sample as
        `[yxhw, class_scores, confidence]`, with `yxhw` being
        `[y_min, x_min, height, width]` multiplied by 100
    :raises ValueError: if no candidate of a sample exceeds `conf_threshold`
    """
    processed_predictions = []
    for sample_index, pred in enumerate(prediction):
        candidates = pred[0]
        # Column 4 carries the confidence; column 5 is already the first class score.
        candidates = candidates[candidates[..., 4] > conf_threshold]
        if candidates.shape[0] == 0:
            # argmax on an empty array raises an opaque ValueError; keep the
            # exception type but say which sample caused it.
            raise ValueError(
                f'no prediction with confidence > {conf_threshold} for sample {sample_index}'
            )
        best = candidates[candidates[..., 4].argmax()]
        x_mid, y_mid, width, height = best[:4]
        score = best[4]
        class_scores = best[5:]
        # Centre format -> top-left corner plus size, scaled by 100.
        yxhw = np.array([y_mid - height / 2, x_mid - width / 2, height, width]) * 100.
        processed_predictions.append([yxhw, class_scores, score])
    return processed_predictions


def yolo2voc(bboxes):
    """
    Converts yolo output to VOC format

    yolo => [xmid, ymid, w, h] (normalized)
    voc  => [x1, y1, x2, y2]

    The values are not rescaled: normalized input yields normalized corners.

    :param bboxes: bounding boxes to convert, box values on the last axis
    :return: converted bboxes as a new float array; the input is left untouched
    """
    # Work on a float copy so integer inputs are not truncated when halving
    # the box size, and so the caller's array is never modified.
    bboxes = np.array(bboxes, dtype=float)

    centers = bboxes[..., 0:2].copy()
    half_sizes = bboxes[..., 2:4] / 2
    bboxes[..., 0:2] = centers - half_sizes  # top-left corner (x1, y1)
    bboxes[..., 2:4] = centers + half_sizes  # bottom-right corner (x2, y2)
    return bboxes


def scale_bb(bb, h, w):
    """
    Scales a percentage based BB into a real sized BB.

    The values are divided by 100; afterwards every value at an even position
    is multiplied by `w` and every value at an odd position by `h`.

    :param bb: the bb to scale, given in percent
    :param h: image height
    :param w: image width
    :return: scaled BBox values as numpy array
    """
    scaled = np.divide(np.array(bb), 100.)
    # Even positions are scaled by the width, odd positions by the height.
    for offset, factor in ((0, w), (1, h)):
        scaled[offset::2] *= factor
    return scaled


if __name__ == '__main__':
    # Script entry point: runs the TFLite YOLO model on the test split, draws
    # the surviving boxes of every sample and reports the average GIoU against
    # the ground truth boxes.
    mytimer = Timer()

    tfmodel = build_tf_model_from_file('weights/yolo-best-fp16.tflite')

    test_set, train_set, validation_set = directory_to_two_in_one_dataset('data/iNat/data', img_width=640,
                                                                          img_height=640)
    test_images, test_labels = tuple(zip(*test_set.unbatch()))
    test_images = np.array(test_images)
    # Separate copy used for plotting; presumably guards against the model
    # evaluation modifying its input - TODO confirm.
    o_test_images = test_images.copy()
    test_labels = np.array(test_labels)
    with mytimer:
        predictions = evaluate_interpreted_model(tfmodel, test_images)

    # `.microseconds` is only the sub-second component of a timedelta and was
    # divided by the wrong factor; `total_seconds()` gives the full duration.
    # Assumes `Timer.results` holds `datetime.timedelta` objects - TODO confirm.
    print(f'Inference time: {mytimer.results[0].total_seconds()} seconds')

    index = 0  # running sample index across all batches
    gloss_fn = GIoULoss()
    gious = []
    for batch in predictions:
        for sample in batch:
            img = o_test_images[index]
            # NOTE(review): only candidates whose column 4 value is >= 1.0 are
            # kept - confirm that this threshold is intended.
            sample = sample[sample[:, 4] >= 1.]  # [-1:, :]
            bbs = yolo2voc(sample[:, :4])
            plt.figure()
            axes = plt.gca()
            axes.imshow(img/255.)
            current_gious = []
            for bb in bbs:
                x, y, x2, y2 = bb
                bb_obj = BoundingBox(x*100., y*100., (x2 - x)*100., (y2 - y)*100.)
                scaled_bb = BoundingBox(*scale_bb(bb_obj.values, img.shape[0], img.shape[1]))
                scaled_bb.draw(axes)
                # The ground truth has to be looked up with the running sample
                # index; the batch index only matches for batches of size one.
                current_gious.append(bb_obj.GIoU(BoundingBox(*test_labels[index][1])))

            if current_gious:
                gious.append(sum(current_gious)/len(current_gious))

            index += 1
            plt.show()
    if gious:
        print('AVG GIoU:', sum(gious)/len(gious))
    else:
        # Avoid a ZeroDivisionError when no box survived the confidence filter.
        print('AVG GIoU: n/a (no predicted boxes passed the confidence filter)')