Skip to content

Commit a644350

Browse files
committed
Updating models and adding BERT/PyT
Tacotron2+Waveglow/PyT * AMP support * Data preprocessing for Tacotron 2 training * Fixed dropouts on LSTMCells SSD/PyT * script and notebook for inference * AMP support * README update * updates to examples/* BERT/PyT * initial release GNMT/PyT * Default container updated to NGC PyTorch 19.05-py3 * Mixed precision training implemented using APEX AMP * Added inference throughput and latency results on NVIDIA Tesla V100 16G * Added option to run inference on user-provided raw input text from command line NCF/PyT * Updated performance tables. * Default container changed to PyTorch 19.06-py3. * Caching validation negatives between runs Transformer/PyT * new README * jit support added UNet Medical/TF * inference example scripts added * inference benchmark measuring latency added * TRT/TF-TRT support added * README updated GNMT/TF * Performance improvements Small updates (mostly README) for other models.
1 parent 3b3d0f6 commit a644350

File tree

109 files changed

+6441
-2413
lines changed

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

109 files changed

+6441
-2413
lines changed

PyTorch/Classification/RN50v1.5/main.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -40,7 +40,7 @@ def add_parser_arguments(parser):
4040

4141
parser.add_argument('data', metavar='DIR',
4242
help='path to dataset')
43-
parser.add_argument('--data-backend', metavar='BACKEND', default='pytorch',
43+
parser.add_argument('--data-backend', metavar='BACKEND', default='dali-cpu',
4444
choices=DATA_BACKEND_CHOICES)
4545

4646
parser.add_argument('--arch', '-a', metavar='ARCH', default='resnet50',

PyTorch/Detection/SSD/Dockerfile

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,9 @@
11
FROM nvcr.io/nvidia/pytorch:19.05-py3
22

33
# Set working directory
4-
WORKDIR /mlperf
4+
WORKDIR /workspace
5+
6+
ENV PYTHONPATH "${PYTHONPATH}:/workspace"
57

68
RUN apt-get update && apt-get install -y python3-tk python-pip git tmux htop tree
79

PyTorch/Detection/SSD/README.md

Lines changed: 459 additions & 160 deletions
Large diffs are not rendered by default.
Lines changed: 44 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,44 @@
1+
import numpy as np
2+
import skimage
3+
4+
def load_image(image_path):
    """Load the image at *image_path* as a float HWC array in [0, 1].

    Code adapted from Loading_Pretrained_Models.ipynb - a Caffe2 tutorial.
    Grayscale (2-D) images are replicated into three identical channels so
    the result always has shape (H, W, 3).
    """
    # Removed unused locals (mean/std were never read; normalization is
    # handled separately by normalize()).
    img = skimage.img_as_float(skimage.io.imread(image_path))
    if len(img.shape) == 2:
        # Replicate the single channel into R, G, B. The original
        # np.array([img]*3).swapaxes(0, 2) produced (W, H, 3), silently
        # transposing the spatial axes of non-square grayscale images;
        # stacking on the last axis keeps (H, W, 3).
        img = np.stack([img, img, img], axis=-1)
    return img
11+
12+
def rescale(img, input_height, input_width):
    """Resize *img* preserving its aspect ratio.

    Code from Loading_Pretrained_Models.ipynb - a Caffe2 tutorial.
    The shorter spatial side is scaled to the target size; the longer side
    grows proportionally (and is trimmed later by crop_center).
    """
    aspect = img.shape[1] / float(img.shape[0])
    if aspect > 1:
        # Landscape orientation - wide image.
        scaled_long = int(aspect * input_height)
        return skimage.transform.resize(img, (input_width, scaled_long))
    elif aspect < 1:
        # Portrait orientation - tall image.
        scaled_long = int(input_width / aspect)
        return skimage.transform.resize(img, (scaled_long, input_height))
    else:
        # Already square.
        return skimage.transform.resize(img, (input_width, input_height))
26+
27+
def crop_center(img, cropx, cropy):
    """Return the central cropx-by-cropy window of an HWC image.

    Code from Loading_Pretrained_Models.ipynb - a Caffe2 tutorial.
    """
    height, width, _ = img.shape
    left = width // 2 - cropx // 2
    top = height // 2 - cropy // 2
    return img[top:top + cropy, left:left + cropx]
33+
34+
def normalize(img, mean=128, std=128):
    """Map a [0, 1] float image into roughly [-1, 1] via (img*256 - mean)/std."""
    scaled = img * 256
    return (scaled - mean) / std
37+
38+
def prepare_input(img_uri):
    """Load *img_uri* and return a normalized 300x300 HWC image for SSD300."""
    image = load_image(img_uri)
    resized = rescale(image, 300, 300)
    cropped = crop_center(resized, 300, 300)
    return normalize(cropped)
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
11
# This script launches SSD300 training in FP16 on 1 GPUs using 64 batch size
22
# Usage bash SSD300_FP16_1GPU.sh <path to this repository> <path to dataset> <additional flags>
33

4-
python $1/main.py --backbone resnet50 --warmup 300 --bs 64 --fp16 --data $2 ${@:3}
4+
python $1/main.py --backbone resnet50 --warmup 300 --bs 64 --amp --data $2 ${@:3}
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
11
# This script launches SSD300 training in FP16 on 4 GPUs using 256 batch size (64 per GPU)
22
# Usage ./SSD300_FP16_4GPU.sh <path to this repository> <path to dataset> <additional flags>
33

4-
python -m torch.distributed.launch --nproc_per_node=4 $1/main.py --backbone resnet50 --warmup 300 --bs 64 --fp16 --data $2 ${@:3}
4+
python -m torch.distributed.launch --nproc_per_node=4 $1/main.py --backbone resnet50 --warmup 300 --bs 64 --amp --data $2 ${@:3}
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
11
# This script launches SSD300 training in FP16 on 8 GPUs using 512 batch size (64 per GPU)
22
# Usage ./SSD300_FP16_8GPU.sh <path to this repository> <path to dataset> <additional flags>
33

4-
python -m torch.distributed.launch --nproc_per_node=8 $1/main.py --backbone resnet50 --warmup 300 --bs 64 --fp16 --data $2 ${@:3}
4+
python -m torch.distributed.launch --nproc_per_node=8 $1/main.py --backbone resnet50 --warmup 300 --bs 64 --amp --data $2 ${@:3}
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
11
# This script evaluates SSD300 model in FP16 using 32 batch size on 1 GPU
22
# Usage: ./SSD300_FP16_EVAL.sh <path to this repository> <path to dataset> <path to checkpoint> <additional flags>
33

4-
python $1/main.py --backbone resnet50 --fp16 --ebs 32 --data $2 --mode evaluation --checkpoint $3 ${@:4}
4+
python $1/main.py --backbone resnet50 --amp --ebs 32 --data $2 --mode evaluation --checkpoint $3 ${@:4}
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
11
# This script launches SSD300 inference benchmark in FP16 on 1 GPU with 64 batch size
22
# Usage bash SSD300_FP16_INFERENCE_BENCHMARK.sh <path to this repository> <path to dataset> <additional flags>
33

4-
python $1/main.py --backbone resnet50 --mode benchmark-inference --bs 64 --fp16 --data $2 ${@:3}
4+
python $1/main.py --backbone resnet50 --mode benchmark-inference --bs 64 --amp --data $2 ${@:3}
Lines changed: 82 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,82 @@
1+
import torch
2+
import numpy as np
3+
4+
from apex.fp16_utils import network_to_half
5+
6+
from dle.inference import prepare_input
7+
from src.model import SSD300, ResNet
8+
from src.utils import dboxes300_coco, Encoder
9+
10+
11+
def load_checkpoint(model, model_file):
    """Populate *model* in place from the checkpoint at *model_file*.

    The checkpoint stores the weights under the 'model' key with each key
    prefixed by 'module.1.' (a wrapper module from training); the prefix is
    stripped so the state dict matches the bare model.
    """
    state = torch.load(model_file)['model']
    stripped = {}
    for key, value in state.items():
        stripped[key.replace('module.1.', '')] = value
    model.load_state_dict(stripped)
15+
16+
17+
def build_predictor(model_file, backbone='resnet50'):
    """Construct an SSD300 with the given backbone and load checkpoint weights."""
    model = SSD300(backbone=ResNet(backbone))
    load_checkpoint(model, model_file)
    return model
22+
23+
24+
def prepare_model(checkpoint_path):
    """Build SSD300 from *checkpoint_path*, move it to the GPU in half
    precision, and switch it to eval mode."""
    model = build_predictor(checkpoint_path)
    # network_to_half comes from apex.fp16_utils (NOTE(review): deprecated
    # in favor of torch.cuda.amp in later stacks — confirm before porting).
    model = network_to_half(model.cuda())
    return model.eval()
31+
32+
33+
def prepare_tensor(inputs):
    """Stack a list of HWC images into an NCHW half-precision CUDA tensor."""
    batch_nhwc = np.array(inputs)
    # NHWC -> NCHW in a single axis permutation (equivalent to the two
    # successive swapaxes calls).
    batch_nchw = batch_nhwc.transpose(0, 3, 1, 2)
    return torch.from_numpy(batch_nchw).cuda().half()
41+
42+
43+
def decode_results(predictions):
    """Decode raw SSD300 (loc, label) outputs into per-image numpy detections.

    Returns one [bboxes, classes, confidences] list per image, with each
    element moved to the CPU as a numpy array.
    """
    encoder = Encoder(dboxes300_coco())
    locs, labels = (tensor.float() for tensor in predictions)
    batch = encoder.decode_batch(locs, labels, criteria=0.5, max_output=20)
    decoded = []
    for detections in batch:
        decoded.append([d.detach().cpu().numpy() for d in detections])
    return decoded
54+
55+
56+
def pick_best(detections, treshold):
    """Keep only the detections whose confidence exceeds *treshold*.

    Args:
        detections: (bboxes, classes, confidences) arrays for one image.
        treshold: exclusive confidence cutoff. (Parameter name kept as-is
            for backward compatibility with existing keyword-argument
            callers, typo included.)

    Returns:
        [bboxes, classes, confidences] restricted to the selected rows.
    """
    bboxes, classes, confidences = detections
    # Bug fix: the cutoff was hard-coded to 0.3 and the treshold parameter
    # was silently ignored; use the parameter.
    best = np.argwhere(confidences > treshold).squeeze(axis=1)

    return [pred[best] for pred in detections]
61+
62+
63+
def main(checkpoint_path, imgs):
    """Run SSD300 inference on the images in *imgs*.

    Returns, for each image, the detections with confidence above 0.3 as
    [bboxes, classes, confidences] numpy arrays.
    """
    batch = prepare_tensor([prepare_input(uri) for uri in imgs])
    model = prepare_model(checkpoint_path)

    raw_predictions = model(batch)

    decoded = decode_results(raw_predictions)
    return [pick_best(detections, treshold=0.3) for detections in decoded]
73+
74+
if __name__ == '__main__':
    # Demo: detect objects in a few COCO val2017 images (fetched by URI)
    # using a pre-trained checkpoint.
    detections = main(
        checkpoint_path='/checkpoints/SSD300v1.1.pt',
        imgs=['http://images.cocodataset.org/val2017/000000397133.jpg',
              'http://images.cocodataset.org/val2017/000000037777.jpg',
              'http://images.cocodataset.org/val2017/000000252219.jpg',
              ],
    )
    print(detections)

0 commit comments

Comments
 (0)