CS766Projects_Medical_Ima / Git / Diff of /SSD/predict

Models:
DavidFeaster/
CS766Projects_Medical_Ima
Downloads: 1
Diff of /SSD/predict_top2.py [000000] .. [54586b]
Switch to side-by-side view

--- a
+++ b/SSD/predict_top2.py
@@ -0,0 +1,194 @@
+from keras.optimizers import Adam, SGD
+from keras.callbacks import ModelCheckpoint, LearningRateScheduler, TerminateOnNaN, CSVLogger
+from keras import backend as K
+from keras.models import load_model
+from math import ceil
+import numpy as np
+from matplotlib import pyplot as plt
+import csv
+from models.keras_ssd300 import ssd_300
+from keras_loss_function.keras_ssd_loss import SSDLoss
+from keras_layers.keras_layer_AnchorBoxes import AnchorBoxes
+from keras_layers.keras_layer_DecodeDetections import DecodeDetections
+from keras_layers.keras_layer_DecodeDetectionsFast import DecodeDetectionsFast
+from keras_layers.keras_layer_L2Normalization import L2Normalization
+
+from ssd_encoder_decoder.ssd_input_encoder import SSDInputEncoder
+from ssd_encoder_decoder.ssd_output_decoder import decode_detections, decode_detections_fast
+
+from data_generator.object_detection_2d_data_generator import DataGenerator
+from data_generator.object_detection_2d_geometric_ops import Resize
+from data_generator.object_detection_2d_photometric_ops import ConvertTo3Channels
+from data_generator.data_augmentation_chain_original_ssd import SSDDataAugmentation
+from data_generator.object_detection_2d_misc_utils import apply_inverse_transforms
+
+def bbox_iou(a, b):
+    """Calculate the Intersection of Unions (IoUs) between bounding boxes.
+    IoU is calculated as a ratio of area of the intersection
+    and area of the union.
+
+    Args:
+        a: (list of 4 numbers) [y1,x1,y2,x2]
+        b: (list of 4 numbers) [y1,x1,y2,x2]
+    Returns:
+        iou: the value of the IoU of two bboxes
+
+    """
+    # (float) Small value to prevent division by zero
+    epsilon = 1e-5
+    # COORDINATES OF THE INTERSECTION BOX
+    # print(a)
+    # print(b)
+    y1 = max(a[0], b[0])
+    x1 = max(a[1], b[1])
+    y2 = min(a[2], b[2])
+    x2 = min(a[3], b[3])
+
+    # AREA OF OVERLAP - Area where the boxes intersect
+    width = (x2 - x1)
+    height = (y2 - y1)
+    # handle case where there is NO overlap
+    if (width < 0) or (height < 0):
+        return 0.0
+    area_overlap = width * height
+
+    # COMBINED AREA
+    area_a = (a[2] - a[0]) * (a[3] - a[1])
+    area_b = (b[2] - b[0]) * (b[3] - b[1])
+    area_combined = area_a + area_b - area_overlap
+
+    # RATIO OF AREA OF OVERLAP OVER COMBINED AREA
+    iou = area_overlap / (area_combined+epsilon)
+    return iou
+
+img_height = 512 # Height of the model input images
+img_width = 512 # Width of the model input images
+img_channels = 3 # Number of color channels of the model input images
+mean_color = [123, 117, 104] # The per-channel mean of the images in the dataset. Do not change this value if you're using any of the pre-trained weights.
+swap_channels = [2, 1, 0] # The color channel order in the original SSD is BGR, so we'll have the model reverse the color channel order of the input images.
+n_classes = 1 # Number of positive classes, e.g. 20 for Pascal VOC, 80 for MS COCO
+scales_pascal = [0.1, 0.2, 0.37, 0.54, 0.71, 0.88, 1.05] # The anchor box scaling factors used in the original SSD300 for the Pascal VOC datasets
+scales_coco = [0.07, 0.15, 0.33, 0.51, 0.69, 0.87, 1.05] # The anchor box scaling factors used in the original SSD300 for the MS COCO datasets
+scales = scales_coco
+aspect_ratios = [[1.0, 2.0, 0.5],
+                 [1.0, 2.0, 0.5, 3.0, 1.0/3.0],
+                 [1.0, 2.0, 0.5, 3.0, 1.0/3.0],
+                 [1.0, 2.0, 0.5, 3.0, 1.0/3.0],
+                 [1.0, 2.0, 0.5],
+                 [1.0, 2.0, 0.5]] # The anchor box aspect ratios used in the original SSD300; the order matters
+two_boxes_for_ar1 = True
+steps = [8, 16, 32, 64, 100, 300] # The space between two adjacent anchor box center points for each predictor layer.
+offsets = [0.5, 0.5, 0.5, 0.5, 0.5, 0.5] # The offsets of the first anchor box center points from the top and left borders of the image as a fraction of the step size for each predictor layer.
+clip_boxes = False # Whether or not to clip the anchor boxes to lie entirely within the image boundaries
+variances = [0.1, 0.1, 0.2, 0.2] # The variances by which the encoded target coordinates are divided as in the original implementation
+normalize_coords = True
+
+# 1: Build the Keras model.
+
+K.clear_session() # Clear previous models from memory.
+
+#model = ssd_300(image_size=(img_height, img_width, img_channels),
+#                n_classes=n_classes,
+#                mode='training',
+#                l2_regularization=0.0005,
+#                scales=scales,
+#                aspect_ratios_per_layer=aspect_ratios,
+#                two_boxes_for_ar1=two_boxes_for_ar1,
+#                steps=steps,
+#                offsets=offsets,
+#                clip_boxes=clip_boxes,
+#                variances=variances,
+#                normalize_coords=normalize_coords,
+#                subtract_mean=mean_color,
+#                swap_channels=swap_channels)
+
+model_path = './ssd512_mine.h5'
+
+ssd_loss = SSDLoss(neg_pos_ratio=3, alpha=1.0)
+
+model = load_model(model_path, custom_objects={'AnchorBoxes': AnchorBoxes,
+                                               'L2Normalization': L2Normalization,
+                                               'compute_loss': ssd_loss.compute_loss})
+testimages_dir = './data/testImages'
+testlabels = './data/testlabels.csv'
+
+convert_to_3_channels = ConvertTo3Channels()
+resize = Resize(height=img_height, width=img_width)
+
+input_format = ['image_name', 'class_id', 'ymin', 'xmin', 'ymax', 'xmax']
+
+val_dataset = DataGenerator(load_images_into_memory=False, hdf5_dataset_path=None)
+
+val_dataset.parse_csv(images_dir=testimages_dir,
+                  labels_filename=testlabels,
+                  input_format=input_format,
+                  include_classes='all',
+                  random_sample=False,
+                  ret=False,
+                  verbose=True)
+
+val_dataset.create_hdf5_dataset(file_path='dataset_pascal_voc_07_test.h5',
+                                resize=False,
+                                variable_image_size=True,
+                                verbose=True)
+
+predict_generator = val_dataset.generate(batch_size=1,
+                                         shuffle=False,
+                                         transformations=[convert_to_3_channels,
+                                                          resize],
+                                         label_encoder=None,
+                                         returns={'processed_images',
+                                                  'filenames',
+                                                  'inverse_transform',
+                                                  'original_images',
+                                                  'original_labels'},
+                                         keep_images_without_gt=False)
+
+np.set_printoptions(precision = 2, suppress = True, linewidth = 90)
+
+hits = 0
+total = 33
+
+rescsv1 = open('result1.csv', 'w', newline = '')
+writer1 = csv.writer(rescsv1, delimiter=',', quotechar='|', quoting=csv.QUOTE_MINIMAL)
+rescsv2 = open('result2.csv', 'w', newline = '')
+writer2 = csv.writer(rescsv2, delimiter=',', quotechar='|', quoting=csv.QUOTE_MINIMAL)
+
+labcsv = open('label.csv', 'w', newline = '')
+writer3 = csv.writer(labcsv, delimiter=',', quotechar='|', quoting=csv.QUOTE_MINIMAL)
+
+for i in range(33):
+	batch_images, batch_filenames, batch_inverse_transforms, batch_original_images, batch_original_labels = next(predict_generator)
+
+	y_pred = model.predict(batch_images)
+
+	y_pred_decoded = decode_detections(y_pred,
+                                   	confidence_thresh=0.0005,
+                                   	iou_threshold=0.0001,
+                                   	top_k=2,
+                                   	normalize_coords=normalize_coords,
+                                   	img_height=img_height,
+                                   	img_width=img_width)
+
+	y_pred_decoded_inv = apply_inverse_transforms(y_pred_decoded, batch_inverse_transforms)
+
+	writer1.writerow([batch_filenames[0], y_pred_decoded_inv[0][0][2], y_pred_decoded_inv[0][0][3], y_pred_decoded_inv[0][0][4],y_pred_decoded_inv[0][0][5], y_pred_decoded_inv[0][0][1]])
+	
+	if(len(y_pred_decoded_inv[0]) >= 2):
+		writer2.writerow([batch_filenames[0], y_pred_decoded_inv[0][1][2], y_pred_decoded_inv[0][1][3], y_pred_decoded_inv[0][1][4],y_pred_decoded_inv[0][1][5], y_pred_decoded_inv[0][1][1]])
+	else:
+		writer2.writerow([batch_filenames[0], 0, 0, 0, 0, 0])
+		
+	result_bbox = [y_pred_decoded_inv[0][0][2], y_pred_decoded_inv[0][0][3], y_pred_decoded_inv[0][0][4],y_pred_decoded_inv[0][0][5]]
+	print (result_bbox)
+        
+	writer3.writerow([batch_original_labels[0][0][0], batch_original_labels[0][0][1], batch_original_labels[0][0][2], batch_original_labels[0][0][3], batch_original_labels[0][0][4]])
+
+	label_bbox = [batch_original_labels[0][0][1], batch_original_labels[0][0][2], batch_original_labels[0][0][3], batch_original_labels[0][0][4]]
+	print (label_bbox)
+
+	if(bbox_iou(result_bbox, label_bbox) > 0) :
+		hits = hits + 1
+
+precision = hits / total
+print(precision)