diff --git a/mask_rcnn/.gitignore b/mask_rcnn/.gitignore
new file mode 100644
index 00000000..fbb17b59
--- /dev/null
+++ b/mask_rcnn/.gitignore
@@ -0,0 +1,8 @@
+__pycache__/
+.vscode/
+.idea/
+*.h5
+*.pb
+**/dataset/train/
+**/dataset/val/
+**/mask_rcnn/logs/
diff --git a/mask_rcnn/README.md b/mask_rcnn/README.md
new file mode 100644
index 00000000..68e87b0b
--- /dev/null
+++ b/mask_rcnn/README.md
@@ -0,0 +1,73 @@
+# Pointless Packaging W/ Mask R-CNN
+
+MASK R-CNN: https://github.com/matterport/Mask_RCNN
+
+```
+DIRECTORY STRUCTURE
+.
+|____.gitignore
+|____dataset
+| |____train - contains all training images (in Google Drive)
+| |____TRAIN-MINI.json - VIA annotations for training images
+| |____val - contains all validation images (in Google Drive)
+| |____VAL-MINI.json - VIA annotations for validation images
+| |____val_img_results - contains results of validation images after inference
+| |____via.html - VIA annotator program
+|____eval_on_val_set.py - performs inference on the validation set, results in
+ `val_img_results`
+|____logs - training logs from the mask r-cnn library
+|____models - contains trained models
+| |____mask_rcnn_final.h5 (256MB) - DOWNLOAD LINK BELOW
+| |____.gitkeep - Dummy file. Just ignore it.
+|____mrcnn - matterport/Mask_RCNN library
+|____README.md
+|____requirements.txt
+|____test_images - sample images that can be scored by running `score.py`
+|____trainer.py - train a dataset using the Mask R-CNN library
+|____trainer_voc.py - train a dataset in PASCAL-VOC format using the Mask R-CNN library
+|
+|____score.py - RUN THIS script to obtain scores of images
+ containing pointless packaging.
+```
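+
+The VIA files (`TRAIN-MINI.json`, `VAL-MINI.json`) describe every region as a
+named polygon (`outerbox`, `innerbox` and the various `item_*` shapes) with
+`all_points_x`/`all_points_y` lists. Below is a minimal sketch of rasterizing
+those polygons into per-instance masks. It is only illustrative, not the loader
+used by `trainer.py`; the helper name and paths are made up, and it assumes
+`numpy` and `scikit-image` are installed.
+
+```python
+import json
+
+import numpy as np
+import skimage.draw
+import skimage.io
+
+
+def load_via_masks(annotation_path, image_dir, key):
+    """Rasterize the VIA polygons of one image into boolean masks.
+
+    Returns (masks, class_names) where masks has shape [H, W, N].
+    `key` is a key of `_via_img_metadata`, e.g. "IMG_0.jpg52157".
+    """
+    with open(annotation_path) as f:
+        via = json.load(f)
+
+    meta = via["_via_img_metadata"][key]
+    image = skimage.io.imread(f"{image_dir}/{meta['filename']}")
+    height, width = image.shape[:2]
+
+    masks = np.zeros((height, width, len(meta["regions"])), dtype=bool)
+    class_names = []
+    for i, region in enumerate(meta["regions"]):
+        shape = region["shape_attributes"]
+        # VIA stores x as image columns and y as image rows.
+        rr, cc = skimage.draw.polygon(shape["all_points_y"],
+                                      shape["all_points_x"],
+                                      (height, width))
+        masks[rr, cc, i] = True
+        class_names.append(region["region_attributes"]["name"])
+    return masks, class_names
+
+
+# Hypothetical usage:
+# masks, names = load_via_masks("dataset/TRAIN-MINI.json", "dataset/train",
+#                               "IMG_0.jpg52157")
+# names                   -> ['item_rect', 'innerbox', 'outerbox']
+# masks.sum(axis=(0, 1))  -> pixel area of each region
+```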
+
+- Download the latest trained model and place it in the `models/` directory.
+ - ### CLICK HERE TO DOWNLOAD TRAINED MODEL
+  - The model was trained for only 50 epochs on 150 training images and 32 test images.
+
+
+## score.py
+```
+usage: score.py [-h] -m MODEL_SRC [-i IMG_SRC | -d DIR_SRC] [-v]
+
+Simple script that takes a trained MASK R-CNN model (.h5), pointless
+packaging image/images and then generates score of the packaging purely based on
+the area of the package relative to the item inside; using the provided model.
+
+optional arguments:
+ -h, --help show this help message and exit
+ -m MODEL_SRC, --model MODEL_SRC
+ Absolute/Relative path to the MASK R-CNN Model
+ -i IMG_SRC, --img IMG_SRC
+ Absolute/Relative path of the image. Cannot include
+ --dir argument.
+ -d DIR_SRC, --dir DIR_SRC
+ Absolute/Relative path of the directory containing the
+ images. Cannot include --img argument.
+ -v, --visualize Visualize the image.
+
+```
+### Example:
+- Get score of a single image WITH visualization.
+ - `python3 score.py -v -m models/mask_rcnn_final.h5 -i test_images/IMG_0.jpg`
+- Get score for every single image in a directory WITH visualization.
+ - `python3 score.py -v -m models/mask_rcnn_final.h5 -d test_images/`
+- Get score for every single image in a directory WITHOUT visualization.
+ - `python3 score.py -m models/mask_rcnn_final.h5 -d test_images/`
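+
+The same measurement can also be reproduced programmatically with the
+matterport/Mask_RCNN library: build an inference config, load
+`models/mask_rcnn_final.h5`, call `detect()` and sum each instance mask.
+The sketch below is not `score.py` itself; in particular the class count is an
+assumption and must match whatever the model was trained with.
+
+```python
+import skimage.io
+
+from mrcnn import model as modellib
+from mrcnn.config import Config
+
+
+class InferenceConfig(Config):
+    NAME = "packaging"
+    GPU_COUNT = 1
+    IMAGES_PER_GPU = 1
+    # Background + the annotated classes (outerbox, innerbox, item_*).
+    # 1 + 6 is an assumption; it must match the trained model.
+    NUM_CLASSES = 1 + 6
+    DETECTION_MIN_CONFIDENCE = 0.7
+
+
+config = InferenceConfig()
+model = modellib.MaskRCNN(mode="inference", config=config, model_dir="logs")
+model.load_weights("models/mask_rcnn_final.h5", by_name=True)
+
+image = skimage.io.imread("test_images/IMG_0.jpg")
+result = model.detect([image], verbose=0)[0]
+
+# result["masks"] has shape [H, W, N]; each channel is one detected instance.
+areas = result["masks"].sum(axis=(0, 1))
+for class_id, score, area in zip(result["class_ids"], result["scores"], areas):
+    print(f"class {class_id}: score={score:.2f}, area={area} px")
+```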
+
+## TODO:
+- Need to come up with a proper scoring function.
+  Currently, `score.py` gives only the area of the
+  box and items in pixels. One possible area-ratio
+  score is sketched below.
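+
+The following is a pure area-ratio score built on the pixel areas that
+`score.py` already reports. The function name, range and rounding are
+placeholders, not a decided metric, and it only compares 2-D projected areas,
+not volumes.
+
+```python
+def packaging_score(item_area_px, outerbox_area_px):
+    """Toy score in [0, 100]: 100 means the item fills the outer box,
+    values near 0 mean the packaging is mostly empty space."""
+    if outerbox_area_px <= 0:
+        raise ValueError("outer box area must be positive")
+    ratio = min(item_area_px / outerbox_area_px, 1.0)
+    return round(100 * ratio, 1)
+
+
+# e.g. an item covering 900 px inside a 15000 px outer box:
+# packaging_score(900, 15000) -> 6.0  (heavily "pointless" packaging)
+```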
+
+## RESULTS:
+
\ No newline at end of file
diff --git a/mask_rcnn/dataset/TRAIN-MINI.json b/mask_rcnn/dataset/TRAIN-MINI.json
new file mode 100644
index 00000000..9df8f179
--- /dev/null
+++ b/mask_rcnn/dataset/TRAIN-MINI.json
@@ -0,0 +1 @@
+{"_via_settings":{"ui":{"annotation_editor_height":25,"annotation_editor_fontsize":0.8,"leftsidebar_width":18,"image_grid":{"img_height":80,"rshape_fill":"none","rshape_fill_opacity":0.3,"rshape_stroke":"yellow","rshape_stroke_width":2,"show_region_shape":true,"show_image_policy":"all"},"image":{"region_label":"name","region_color":"__via_default_region_color__","region_label_font":"10px Sans","on_image_annotation_editor_placement":"NEAR_REGION"}},"core":{"buffer_size":"18","filepath":{},"default_filepath":"train/"},"project":{"name":"TRAIN"}},"_via_img_metadata":{"IMG_0.jpg52157":{"filename":"IMG_0.jpg","size":52157,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[263,278,266,251],"all_points_y":[137,139,196,192]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[197,414,414,192],"all_points_y":[92,86,248,238]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[134,194,199,415,414,497,501,411,412,188,192,129],"all_points_y":[94,92,24,13,86,86,247,246,298,298,232,227]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_1.jpg13491":{"filename":"IMG_1.jpg","size":13491,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[70,87,86,70],"all_points_y":[145,145,172,171]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[41,114,122,41],"all_points_y":[98,96,206,211]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[43,110,113,142,143,121,121,41,40,2,7,40],"all_points_y":[65,63,94,97,207,207,251,254,210,212,98,98]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_2.jpg14457":{"filename":"IMG_2.jpg","size":14457,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[50,73,87,64],"all_points_y":[141,118,134,156]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[39,110,112,44],"all_points_y":[81,83,189,196]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[38,106,109,136,138,112,110,45,44,5,2,38],"all_points_y":[43,48,83,86,183,187,220,233,196,199,79,80]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_3.jpg28329":{"filename":"IMG_3.jpg","size":28329,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[100,144,120,73],"all_points_y":[109,130,195,174]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[86,184,140,17],"all_points_y":[46,92,253,223]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[101,222,183,224,197,140,168,8,17,1,78,85],"all_points_y":[5,67,90,110,267,251,282,250,224,231,1,44]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_4.jpg18069":{"filename":"IMG_4.jpg","size":18069,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[109,154,150,107],"all_points_y":[101,106,151,150]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[61,168,168,68],"all_points_y":[72,66,221,225]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[58,165,168,216,214,169,172,67,67,16,4,61],"all_points_y":[15,8,67,56,241,221,281,279,223,228,74,72]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_5.jpg30039":{"filename":"IMG_5.jpg","size":30039,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[
106,120,91,75],"all_points_y":[128,134,202,197]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[69,63,127,133],"all_points_y":[128,146,166,151]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[90,188,114,3],"all_points_y":[70,186,265,129]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[97,99,91,128,225,189,223,141,117,115,2,1,1,98],"all_points_y":[36,33,70,43,152,186,185,287,267,285,152,131,86,33]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_6.jpg18991":{"filename":"IMG_6.jpg","size":18991,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[108,141,128,95],"all_points_y":[136,145,192,182]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[131,185,98,43,131],"all_points_y":[109,182,247,172,109]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[100,130,160,212,183,218,127,99,56,2,43,12],"all_points_y":[68,108,91,156,180,223,292,250,277,203,174,134]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_7.jpg22888":{"filename":"IMG_7.jpg","size":22888,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[65,153,154,55],"all_points_y":[110,113,245,242]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[65,156,152,195,203,151,165,45,55,37,50,64],"all_points_y":[64,69,114,106,248,243,267,267,243,247,94,110]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[122,118,146,145],"all_points_y":[133,235,237,133]},"region_attributes":{"name":"item_rect_slim"}}],"file_attributes":{}},"IMG_8.jpg19591":{"filename":"IMG_8.jpg","size":19591,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[71,143,138,95,83,74,70,72],"all_points_y":[120,124,209,204,202,202,203,121]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[57,159,170,61],"all_points_y":[89,87,230,233]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[50,167,158,211,225,225,168,182,56,62,4,2,58],"all_points_y":[50,48,87,80,193,230,228,286,293,233,237,90,88]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_9.jpg26999":{"filename":"IMG_9.jpg","size":26999,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[72,168,154,41],"all_points_y":[68,92,235,224]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[84,190,164,200,185,156,174,43,2,1,31,72],"all_points_y":[28,58,92,72,254,235,238,230,229,159,31,68]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[84,88,144,146],"all_points_y":[106,134,134,107]},"region_attributes":{"name":"item_rect"}}],"file_attributes":{}},"IMG_10.jpg33625":{"filename":"IMG_10.jpg","size":33625,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[227,239,247,252,255,254,250,242,231,224,222,224],"all_points_y":[171,168,170,175,182,191,197,200,199,190,182,175]},"region_attributes":{"name":"item_circ"}},{"shape_attributes":{"name":"polygon","all_points_x":[117,120,280,286,124],"all_points_y":[123,123,115,231,237]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[107,280,281,306,317,285,295,105,127,68,63,118],"all_points_y":[72,61,117,108,243,230,257,262,233,243,123,123]
},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_11.jpg27698":{"filename":"IMG_11.jpg","size":27698,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[24,118,163,69],"all_points_y":[100,81,215,257]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[21,57,90,129,136,117,162,208,162,192,159,147,135,82,68,68,31,2,25],"all_points_y":[71,62,57,56,55,80,71,200,216,225,247,256,262,282,257,283,185,75,102]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[57,109,124,76],"all_points_y":[143,192,174,127]},"region_attributes":{"name":"item_rect_slim"}}],"file_attributes":{}},"IMG_12.jpg15001":{"filename":"IMG_12.jpg","size":15001,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[54,101,101,54],"all_points_y":[101,101,152,153]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[38,108,109,36],"all_points_y":[97,97,204,204]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[38,106,107,141,144,109,108,37,36,2,4,37],"all_points_y":[61,62,97,98,202,201,240,243,204,204,95,96]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_13.jpg18832":{"filename":"IMG_13.jpg","size":18832,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[110,191,130,49],"all_points_y":[66,119,214,157]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[71,109,140,220,191,224,224,174,129,105,32,50,4],"all_points_y":[35,65,23,72,118,135,168,244,211,243,190,158,128]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[85,88,150,146],"all_points_y":[156,176,162,146]},"region_attributes":{"name":"item_rect_slim"}}],"file_attributes":{}},"IMG_14.jpg25014":{"filename":"IMG_14.jpg","size":25014,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[78,151,154,75],"all_points_y":[103,103,213,213]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[76,156,151,189,197,152,157,75,76,32,37,76],"all_points_y":[64,65,103,97,214,212,251,255,212,216,94,102]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[88,89,137,136],"all_points_y":[118,187,188,118]},"region_attributes":{"name":"item_rect"}}],"file_attributes":{}},"IMG_15.jpg26787":{"filename":"IMG_15.jpg","size":26787,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[80,104,140,118],"all_points_y":[151,174,132,112]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[60,163,182,66],"all_points_y":[37,60,205,227]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[203,225,225,184,218,87,67,11,17,29,64,76,149,192,159,165],"all_points_y":[28,153,208,206,203,213,232,234,1,1,39,1,0,15,60,61]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_16.jpg14129":{"filename":"IMG_16.jpg","size":14129,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[48,117,120,53],"all_points_y":[89,88,189,193]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[49,115,117,144,143,120,116,118,54,54,17,14,48],"all_points_y":[52,53,90,88,187,187,189,223,227,192,195,88,89]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[56,56,100,100],"all_points_y":[111,144,143,107
]},"region_attributes":{"name":"item_rect"}}],"file_attributes":{}},"IMG_17.jpg24868":{"filename":"IMG_17.jpg","size":24868,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[105,151,147,98],"all_points_y":[167,161,112,117]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[76,164,169,76],"all_points_y":[187,189,59,58]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[30,77,68,179,167,190,181,164,168,76,77,35],"all_points_y":[55,60,36,34,61,48,201,187,230,231,184,194]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_18.jpg12729":{"filename":"IMG_18.jpg","size":12729,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[48,60,71,80,85,85,81,72,60,49,46,49],"all_points_y":[121,130,131,125,114,104,100,94,94,100,108,122]},"region_attributes":{"name":"item_circ"}},{"shape_attributes":{"name":"polygon","all_points_x":[30,104,111,28],"all_points_y":[71,72,186,188]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[30,100,103,140,144,145,110,113,26,28,1,1,28],"all_points_y":[41,40,70,63,94,182,184,229,232,189,189,74,72]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_19.jpg12969":{"filename":"IMG_19.jpg","size":12969,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[39,93,94,38],"all_points_y":[97,99,134,135]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[34,100,105,39],"all_points_y":[81,81,182,191]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[34,99,100,135,138,103,107,43,40,2,1,1,35],"all_points_y":[45,50,84,81,182,182,216,226,191,193,114,78,80]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_20.jpg41369":{"filename":"IMG_20.jpg","size":41369,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[133,193,181,122],"all_points_y":[90,117,147,124]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[109,385,309,79],"all_points_y":[12,99,241,190]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[65,80,39,34,35,29,42,58,91,103,110,92,135,144,204,398,399,384,399,399,354,348,340,308,281],"all_points_y":[263,186,248,246,169,166,69,13,8,13,7,2,1,1,14,77,99,98,109,232,294,300,299,241,300]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_21.jpg44654":{"filename":"IMG_21.jpg","size":44654,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[109,161,165,114,110],"all_points_y":[145,132,150,163,156]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[35,288,304,102],"all_points_y":[115,44,188,250]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[35,101,98,148,342,303,304,356,362,286,307,178,2,2,31],"all_points_y":[151,282,300,299,231,185,183,215,54,42,2,1,45,84,113]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_22.jpg46718":{"filename":"IMG_22.jpg","size":46718,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[103,301,305,33],"all_points_y":[66,157,292,213]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[130,302,296,355,387,314,344,11,34,25,120,104],"all_points_y":[16,101,157,121,284,293,299,209,212,169,1,65]},"region_attributes":{"name":"outerbox"}},{"shape_attrib
utes":{"name":"polygon","all_points_x":[119,199,208,129],"all_points_y":[170,206,185,149]},"region_attributes":{"name":"item_rect_slim"}}],"file_attributes":{}},"IMG_23.jpg14528":{"filename":"IMG_23.jpg","size":14528,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[55,67,68,57],"all_points_y":[127,126,160,160]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[35,106,109,113,43],"all_points_y":[112,108,111,215,219]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[32,106,108,143,144,114,109,109,45,43,11,2,36],"all_points_y":[79,71,108,109,213,215,217,246,249,217,218,117,116]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_24.jpg27556":{"filename":"IMG_24.jpg","size":27556,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[202,245,253,212],"all_points_y":[93,113,92,71]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[124,265,262,123],"all_points_y":[166,161,58,64]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[116,270,260,314,313,264,270,267,111,121,121,73,78,127],"all_points_y":[204,205,160,160,62,66,21,19,25,64,68,62,167,163]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_25.jpg31143":{"filename":"IMG_25.jpg","size":31143,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[74,125,121,316,313,377,377,375,377,345,307,307,116,122,69],"all_points_y":[76,88,16,8,88,75,151,199,239,234,225,298,286,215,227]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[172,171,290,290],"all_points_y":[114,202,208,113]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[120,308,313,124],"all_points_y":[218,226,82,84]},"region_attributes":{"name":"innerbox"}}],"file_attributes":{}},"IMG_26.jpg39280":{"filename":"IMG_26.jpg","size":39280,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[175,181,246,239],"all_points_y":[118,202,197,115]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[148,265,273,152],"all_points_y":[71,61,237,238]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[131,270,267,268,286,294,272,280,146,151,92,89,150],"all_points_y":[35,21,60,64,40,250,235,296,299,236,245,63,70]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_27.jpg29843":{"filename":"IMG_27.jpg","size":29843,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[71,166,143,38],"all_points_y":[80,100,244,229]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[27,73,74,184,164,194,165,145,154,35,43,1,1],"all_points_y":[53,79,45,69,99,81,265,243,249,230,227,227,156]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[99,134,139,108],"all_points_y":[160,182,170,150]},"region_attributes":{"name":"item_rect_slim"}}],"file_attributes":{}},"IMG_28.jpg13869":{"filename":"IMG_28.jpg","size":13869,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[40,111,116,36],"all_points_y":[93,94,205,205]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[45,110,111,144,144,115,115,38,39,0,5,41],"all_points_y":[61,61,95,95,205,203,244,245,203,202,94,93]},"region_attributes":{"name":"outerbox"}},{"shape_attributes
":{"name":"polygon","all_points_x":[72,72,83,79],"all_points_y":[134,170,169,133]},"region_attributes":{"name":"item_rect_slim"}}],"file_attributes":{}},"IMG_29.jpg39275":{"filename":"IMG_29.jpg","size":39275,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[210,252,250,207],"all_points_y":[168,167,101,102]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[155,155,295,297,153],"all_points_y":[88,88,83,187,188]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[149,298,295,351,351,292,296,144,153,106,107,155],"all_points_y":[38,27,88,83,189,187,239,235,185,186,83,90]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_30.jpg21750":{"filename":"IMG_30.jpg","size":21750,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[108,134,131,115],"all_points_y":[184,184,115,115]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[72,153,158,76],"all_points_y":[99,95,209,213]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[69,154,153,193,198,156,162,75,77,39,33,72],"all_points_y":[57,53,96,93,212,207,248,253,213,219,97,101]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_31.jpg33187":{"filename":"IMG_31.jpg","size":33187,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[123,243,303,183],"all_points_y":[155,83,190,259]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[91,214,245,288,341,301,335,245,205,183,125,66,125],"all_points_y":[99,28,85,65,159,191,247,299,300,257,289,185,155]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[170,174,247,242],"all_points_y":[152,183,172,138]},"region_attributes":{"name":"item_rect"}}],"file_attributes":{}},"IMG_32.jpg26592":{"filename":"IMG_32.jpg","size":26592,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[104,281,357,193,168],"all_points_y":[148,63,221,299,299]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[64,195,253,281,340,397,399,357,398,195,165,65,14,104],"all_points_y":[66,1,1,64,47,165,189,221,299,299,298,299,187,149]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[163,177,259,242],"all_points_y":[140,176,135,104]},"region_attributes":{"name":"item_rect"}}],"file_attributes":{}},"IMG_33.jpg13396":{"filename":"IMG_33.jpg","size":13396,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[37,101,113,41],"all_points_y":[115,110,209,215]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[45,117,113,144,144,134,101,97,35,38,5,5,42],"all_points_y":[256,249,210,207,165,99,110,81,85,113,116,218,215]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[66,65,79,78],"all_points_y":[145,194,195,144]},"region_attributes":{"name":"item_rect_slim"}}],"file_attributes":{}},"IMG_34.jpg52750":{"filename":"IMG_34.jpg","size":52750,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[247,323,326,325,243,243],"all_points_y":[177,176,172,142,141,176]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[174,399,393,179],"all_points_y":[221,220,75,75]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[473,461,390,389,
182,180,106,96,175,170,403,397],"all_points_y":[215,79,77,15,13,75,75,217,215,296,295,217]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_35.jpg14549":{"filename":"IMG_35.jpg","size":14549,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[58,85,98,69],"all_points_y":[158,166,122,112]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[45,119,112,43],"all_points_y":[197,193,89,90]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[45,119,115,145,143,111,108,42,43,8,7,45],"all_points_y":[235,232,193,193,89,89,56,58,90,91,197,195]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_36.jpg17102":{"filename":"IMG_36.jpg","size":17102,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[62,157,149,55],"all_points_y":[227,223,92,95]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[59,165,156,171,163,149,154,46,59,56,27,33,62],"all_points_y":[279,271,223,233,76,90,58,61,95,96,81,244,224]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[70,73,136,137],"all_points_y":[116,191,191,112]},"region_attributes":{"name":"item_rect"}}],"file_attributes":{}},"IMG_37.jpg25967":{"filename":"IMG_37.jpg","size":25967,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[133,301,297,126],"all_points_y":[245,231,87,90]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[45,127,118,313,295,341,350,300,308,130,134,47],"all_points_y":[91,90,5,10,89,90,219,227,298,299,242,249]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[190,197,279,265],"all_points_y":[108,173,152,98]},"region_attributes":{"name":"item_rect"}}],"file_attributes":{}},"IMG_38.jpg13127":{"filename":"IMG_38.jpg","size":13127,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[74,79,83,85,84,80,73,71],"all_points_y":[173,175,172,167,165,163,163,169]},"region_attributes":{"name":"item_circ"}},{"shape_attributes":{"name":"polygon","all_points_x":[44,118,108,41],"all_points_y":[224,219,115,118]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[46,119,117,145,144,140,109,105,39,40,7,6,43],"all_points_y":[265,259,220,217,155,113,115,83,85,117,117,227,223]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_39.jpg51999":{"filename":"IMG_39.jpg","size":51999,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[211,349,342,210],"all_points_y":[201,195,111,115]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[164,389,375,163],"all_points_y":[227,213,78,80]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[156,224,405,387,388,461,440,374,369,167,165,94,87,165],"all_points_y":[297,295,286,214,212,209,77,79,15,20,82,87,226,223]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_40.jpg22486":{"filename":"IMG_40.jpg","size":22486,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[75,124,137,87],"all_points_y":[190,197,116,109]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[63,170,163,62],"all_points_y":[223,221,102,105]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[69,167,170,224,224,217,162,160,61,63,7,3,63]
,"all_points_y":[270,267,222,222,155,93,101,51,53,105,103,225,224]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_41.jpg32999":{"filename":"IMG_41.jpg","size":32999,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[173,263,260,170],"all_points_y":[199,197,131,135]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[112,309,311,114],"all_points_y":[213,228,90,88]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[82,315,306,386,385,308,311,113,114,50,45,43,39,111],"all_points_y":[268,292,226,229,89,89,14,21,90,82,85,91,214,211]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_42.jpg25634":{"filename":"IMG_42.jpg","size":25634,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[71,147,147,65],"all_points_y":[194,194,82,84]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[68,147,145,186,189,147,149,62,69,21,31,71],"all_points_y":[233,235,195,205,83,88,44,45,85,85,201,193]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[82,84,130,128],"all_points_y":[131,168,166,130]},"region_attributes":{"name":"item_rect"}}],"file_attributes":{}},"IMG_43.jpg42950":{"filename":"IMG_43.jpg","size":42950,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[201,220,247,229],"all_points_y":[108,160,148,95]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[123,322,277,272,37,120],"all_points_y":[285,185,46,45,149,287]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[346,387,318,379,243,112,33,35,39,-1,1,199,284,274,278],"all_points_y":[35,203,183,225,299,299,169,157,150,115,74,0,1,45,49]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_44.jpg31593":{"filename":"IMG_44.jpg","size":31593,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[107,272,260,97],"all_points_y":[238,222,82,93]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[57,107,110,279,269,339,329,262,255,91,98,95,46],"all_points_y":[233,235,297,299,221,215,81,85,8,21,94,100,106]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[115,115,252,255],"all_points_y":[119,198,212,127]},"region_attributes":{"name":"item_rect"}}],"file_attributes":{}},"IMG_45.jpg27066":{"filename":"IMG_45.jpg","size":27066,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[84,110,119,91],"all_points_y":[169,180,152,143]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[24,127,198,78],"all_points_y":[80,63,205,258]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[93,197,199,224,225,199,224,224,173,127,145,91,14,26,0,1,68,77],"all_points_y":[271,233,227,212,203,206,194,137,51,64,17,17,29,79,41,55,269,257]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_46.jpg13433":{"filename":"IMG_46.jpg","size":13433,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[53,99,93,47],"all_points_y":[199,193,155,161]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[38,109,102,36],"all_points_y":[217,213,113,114]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[39,113,109,144,140,133,100,99,3
7,36,4,1,37],"all_points_y":[256,252,214,211,153,109,113,79,82,114,110,218,217]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_47.jpg25203":{"filename":"IMG_47.jpg","size":25203,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[28,40,47,35],"all_points_y":[144,168,165,140]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[14,149,149,30],"all_points_y":[243,234,65,49]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[183,145,208,197,148,176,96,34,35,13,9,0,1,15,7,47,83,123,123],"all_points_y":[253,233,235,73,69,35,11,1,49,1,1,81,251,242,267,272,270,267,263]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_48.jpg34931":{"filename":"IMG_48.jpg","size":34931,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[120,279,276,119],"all_points_y":[201,199,79,91]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[111,279,272,335,331,271,276,107,120,64,64,123],"all_points_y":[255,257,197,202,80,88,21,36,91,86,203,199]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[171,170,233,233],"all_points_y":[148,182,185,147]},"region_attributes":{"name":"item_rect"}}],"file_attributes":{}},"IMG_49.jpg19284":{"filename":"IMG_49.jpg","size":19284,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[126,144,145,125],"all_points_y":[192,194,141,140]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[65,148,151,66],"all_points_y":[227,225,109,105]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[61,150,147,188,191,149,153,66,68,27,25,67],"all_points_y":[269,270,221,235,107,109,67,64,107,103,231,224]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_50.jpg19178":{"filename":"IMG_50.jpg","size":19178,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[77,63,117,130],"all_points_y":[97,185,199,99]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[57,61,169,153],"all_points_y":[81,235,225,76]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[13,12,60,64,176,170,224,205,156,153,49,56],"all_points_y":[59,246,237,296,284,227,220,71,75,20,22,79]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_51.jpg12578":{"filename":"IMG_51.jpg","size":12578,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[55,62,77,70],"all_points_y":[119,145,135,117]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[36,39,107,107],"all_points_y":[76,187,180,79]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[38,106,106,141,142,108,105,39,38,1,0,35],"all_points_y":[37,44,78,77,182,181,216,222,187,190,71,74]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_52.jpg20139":{"filename":"IMG_52.jpg","size":20139,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[75,75,110,110],"all_points_y":[104,169,170,104]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[67,58,130,139],"all_points_y":[86,184,192,92]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[39,30,56,50,126,129,160,170,140,142,66,70],"all_points_y":[75,186,184,216
,225,193,199,87,93,66,60,83]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_53.jpg17290":{"filename":"IMG_53.jpg","size":17290,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[85,87,116,118],"all_points_y":[129,168,173,131]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[123,119,151,156],"all_points_y":[126,168,172,129]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[59,68,164,162],"all_points_y":[85,230,231,79]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[57,160,162,211,208,164,168,68,66,67,18,6,59],"all_points_y":[30,24,79,71,250,229,286,289,282,230,235,87,85]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_54.jpg21501":{"filename":"IMG_54.jpg","size":21501,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[87,96,124,114],"all_points_y":[112,151,144,105]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[61,61,146,150],"all_points_y":[60,181,183,60]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[56,151,147,189,187,147,154,52,62,60,41,42,61],"all_points_y":[13,11,58,50,184,183,201,202,183,181,189,46,62]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_55.jpg17905":{"filename":"IMG_55.jpg","size":17905,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[123,126,160,158],"all_points_y":[147,202,200,147]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[60,68,166,159],"all_points_y":[154,236,228,142]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[53,156,160,204,214,167,174,72,69,36,27,60],"all_points_y":[109,96,140,137,226,228,275,284,238,234,156,154]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_56.jpg14750":{"filename":"IMG_56.jpg","size":14750,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[61,73,87,74],"all_points_y":[128,153,148,122]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[56,54,145,144],"all_points_y":[98,200,202,101]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[59,146,145,190,195,147,143,54,54,1,8,57],"all_points_y":[52,56,100,94,202,201,241,240,200,199,90,97]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_57.jpg32976":{"filename":"IMG_57.jpg","size":32976,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[167,177,236,226],"all_points_y":[152,177,144,124]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[125,177,304,249],"all_points_y":[163,272,209,100]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[95,221,250,296,343,305,335,275,190,176,124,67,126],"all_points_y":[105,42,100,80,180,207,272,299,300,274,300,191,163]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_58.jpg32868":{"filename":"IMG_58.jpg","size":32868,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[213,272,236,177],"all_points_y":[197,166,107,136]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[107,110,308,306],"all_points_y":[87,213,218,76]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"po
lygon","all_points_x":[104,304,304,382,387,310,316,80,111,37,36,106],"all_points_y":[19,2,74,74,217,218,283,269,213,218,85,88]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_59.jpg30456":{"filename":"IMG_59.jpg","size":30456,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[155,154,286,288],"all_points_y":[100,123,133,109]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[118,134,319,308],"all_points_y":[71,205,194,60]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[103,230,314,309,377,389,316,334,124,134,63,52,117],"all_points_y":[10,1,0,58,45,199,193,259,269,202,216,72,73]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_60.jpg18946":{"filename":"IMG_60.jpg","size":18946,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[116,104,118,132],"all_points_y":[134,184,188,140]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[41,102,181,119],"all_points_y":[181,246,176,109]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[4,84,116,146,203,182,212,132,101,65,4,40],"all_points_y":[146,73,107,86,148,175,212,286,247,282,215,182]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_61.jpg24194":{"filename":"IMG_61.jpg","size":24194,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[109,109,131,131],"all_points_y":[134,157,157,134]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[76,76,150,154],"all_points_y":[85,191,195,86]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[33,38,75,72,149,150,187,195,155,158,74,78],"all_points_y":[81,200,190,225,231,196,202,86,87,46,46,84]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_62.jpg20584":{"filename":"IMG_62.jpg","size":20584,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[105,140,124,89],"all_points_y":[178,170,100,110]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[75,158,156,77],"all_points_y":[80,80,194,191]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[76,158,157,199,197,154,156,73,78,38,34,78],"all_points_y":[38,37,80,78,198,192,231,226,190,196,76,80]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_63.jpg12702":{"filename":"IMG_63.jpg","size":12702,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[66,66,90,89],"all_points_y":[144,184,184,145]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[40,38,112,107],"all_points_y":[108,211,209,106]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[40,105,105,139,144,144,113,113,40,40,1,6,42],"all_points_y":[73,73,105,104,156,210,209,247,250,211,215,100,107]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_64.jpg27386":{"filename":"IMG_64.jpg","size":27386,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[84,89,136,132],"all_points_y":[92,120,110,85]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[53,161,145,41],"all_points_y":[63,75,226,227]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[28,21,42,38,164,145,193,211,160,185,51,55],"all_po
ints_y":[35,258,228,261,257,224,228,80,76,62,40,63]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_65.jpg14005":{"filename":"IMG_65.jpg","size":14005,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[67,61,80,85],"all_points_y":[153,188,193,157]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[38,41,113,98],"all_points_y":[110,202,196,106]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[39,95,99,126,144,144,114,119,45,43,5,7,39],"all_points_y":[85,84,107,106,184,192,194,233,241,201,206,111,110]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_66.jpg16631":{"filename":"IMG_66.jpg","size":16631,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[119,129,166,156],"all_points_y":[177,197,180,162]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[59,64,182,178],"all_points_y":[123,223,219,114]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[54,175,178,215,222,180,187,66,64,10,6,58],"all_points_y":[67,58,114,115,207,214,272,278,222,226,126,122]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_67.jpg20229":{"filename":"IMG_67.jpg","size":20229,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[108,108,142,143],"all_points_y":[113,200,201,116]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[64,163,168,63],"all_points_y":[79,79,230,232]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[62,168,164,216,224,168,170,62,63,12,23,65],"all_points_y":[22,23,79,76,231,228,285,287,232,241,59,80]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_68.jpg33373":{"filename":"IMG_68.jpg","size":33373,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[165,154,210,222],"all_points_y":[145,188,205,163]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[109,117,285,280],"all_points_y":[101,220,213,92]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[96,282,280,344,349,286,294,109,118,56,48,108],"all_points_y":[41,35,92,88,212,212,275,279,218,229,97,99]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_69.jpg18623":{"filename":"IMG_69.jpg","size":18623,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[76,127,147,92],"all_points_y":[125,167,148,100]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[40,133,192,100],"all_points_y":[137,204,124,56]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[16,67,96,128,224,224,193,225,224,179,135,109,2,41],"all_points_y":[115,44,58,12,74,84,124,146,171,235,206,252,172,136]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_70.jpg19499":{"filename":"IMG_70.jpg","size":19499,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[78,88,118,110],"all_points_y":[116,191,186,114]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[70,70,162,165],"all_points_y":[66,197,204,68]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[72,168,166,218,212,162,164,64,70,19,20,70],"all_points_y":[16,18,69,68,209,202,247,242,196,201,61,68]},"region_a
ttributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_71.jpg45811":{"filename":"IMG_71.jpg","size":45811,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[187,237,252,200],"all_points_y":[157,214,200,145]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[130,198,299,234],"all_points_y":[221,72,118,270]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[157,76,127,124,238,243,247,328,302,298,324,210,200],"all_points_y":[42,211,222,225,278,292,293,107,117,115,94,41,75]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_72.jpg15553":{"filename":"IMG_72.jpg","size":15553,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[41,41,94,93],"all_points_y":[109,175,174,110]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[35,36,104,103],"all_points_y":[94,200,195,95]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[36,104,104,133,133,103,102,38,38,0,1,35],"all_points_y":[57,61,96,97,194,196,228,234,200,202,93,94]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_73.jpg19455":{"filename":"IMG_73.jpg","size":19455,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[109,104,131,136],"all_points_y":[140,176,179,142]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[68,70,168,164],"all_points_y":[102,237,232,96]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[66,165,162,208,214,164,173,67,70,23,23,69],"all_points_y":[54,48,102,93,241,230,283,286,234,245,97,103]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_74.jpg13680":{"filename":"IMG_74.jpg","size":13680,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[49,49,70,70],"all_points_y":[100,131,131,101]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[38,41,112,112],"all_points_y":[76,186,182,77]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[36,108,110,142,143,110,111,43,42,3,0,1,37],"all_points_y":[37,42,80,78,181,182,218,224,186,190,108,74,76]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_75.jpg20669":{"filename":"IMG_75.jpg","size":20669,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[111,112,133,131],"all_points_y":[109,167,166,110]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[72,107,182,148],"all_points_y":[108,193,164,76]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[108,123,197,180,222,189,147,129,60,73,29,67],"all_points_y":[194,232,202,164,149,62,77,48,72,106,123,210]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_76.jpg27147":{"filename":"IMG_76.jpg","size":27147,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[174,178,238,234],"all_points_y":[108,130,120,97]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[186,188,247,243],"all_points_y":[139,160,150,128]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[135,138,311,305],"all_points_y":[82,201,199,85]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[135,310,305,362,365,308,33
1,133,140,78,75,87,136],"all_points_y":[24,27,86,86,193,198,243,250,199,207,84,79,87]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_77.jpg45935":{"filename":"IMG_77.jpg","size":45935,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[154,192,239,193],"all_points_y":[164,246,229,147]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[71,92,327,278],"all_points_y":[121,269,220,77]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[62,263,279,304,344,370,327,368,368,112,62,93,50,35,74],"all_points_y":[54,13,77,36,117,209,218,229,234,298,298,265,279,92,119]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_78.jpg18381":{"filename":"IMG_78.jpg","size":18381,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[101,96,98,102,111,124,134,141,144,144,141,136,127,119,112,106],"all_points_y":[127,136,146,155,162,164,161,154,145,136,128,123,118,118,119,121]},"region_attributes":{"name":"item_circ"}},{"shape_attributes":{"name":"polygon","all_points_x":[65,57,157,165],"all_points_y":[79,218,224,80]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[64,168,163,211,208,156,164,44,58,3,20,67],"all_points_y":[26,29,83,72,232,221,271,267,214,222,62,78]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_79.jpg18012":{"filename":"IMG_79.jpg","size":18012,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[103,130,144,116],"all_points_y":[127,172,163,120]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[47,93,188,140],"all_points_y":[116,225,183,76]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[42,93,115,208,184,224,225,188,139,120,36,48,0,2],"all_points_y":[250,226,276,232,183,166,140,58,79,48,79,114,135,156]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_80.jpg19043":{"filename":"IMG_80.jpg","size":19043,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[111,104,132,142],"all_points_y":[102,188,191,105]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[66,73,155,155],"all_points_y":[87,206,204,81]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[59,159,155,198,197,155,162,64,73,56,48,67],"all_points_y":[46,39,82,76,212,203,229,234,203,220,80,89]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_81.jpg18816":{"filename":"IMG_81.jpg","size":18816,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[88,84,124,126],"all_points_y":[121,188,190,123]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[77,68,176,175],"all_points_y":[83,222,228,87]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[73,186,174,224,224,176,189,58,69,10,26,78],"all_points_y":[42,49,90,86,230,227,282,275,219,219,77,84]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_82.jpg55185":{"filename":"IMG_82.jpg","size":55185,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[240,241,310,308],"all_points_y":[137,160,154,131]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[153,154,376,370],"all_points_y":[71,220,218,61]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name"
:"polygon","all_points_x":[155,154,88,89,155,155,380,375,456,450,369,368],"all_points_y":[4,74,81,218,218,292,296,213,215,68,68,1]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_83.jpg34933":{"filename":"IMG_83.jpg","size":34933,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[202,191,251,261],"all_points_y":[120,173,184,131]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[154,151,305,307],"all_points_y":[94,200,204,87]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[100,99,149,140,307,302,361,362,301,312,137,155],"all_points_y":[91,199,197,249,264,201,208,85,93,31,45,93]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_84.jpg19315":{"filename":"IMG_84.jpg","size":19315,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[77,100,149,127],"all_points_y":[131,159,115,90]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[53,59,157,163],"all_points_y":[64,203,208,66]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[41,172,161,221,211,153,162,47,61,7,1,1,54],"all_points_y":[9,10,67,67,213,207,250,243,203,211,124,63,65]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_85.jpg28749":{"filename":"IMG_85.jpg","size":28749,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[54,64,128,125,117,51],"all_points_y":[133,128,153,170,172,148]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[99,1,1,127,187],"all_points_y":[63,127,137,284,196]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[6,130,133,98,138,215,188,224,225,191,149,126,141,133,1,1],"all_points_y":[102,29,35,63,39,163,193,198,229,300,300,284,299,299,147,117]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_86.jpg14521":{"filename":"IMG_86.jpg","size":14521,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[37,46,82,72],"all_points_y":[104,180,174,100]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[22,32,103,97],"all_points_y":[84,195,189,80]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[22,95,96,128,136,101,104,36,33,1,1,26],"all_points_y":[47,45,82,81,183,187,222,230,191,195,85,85]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_87.jpg24135":{"filename":"IMG_87.jpg","size":24135,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[61,62,150,153],"all_points_y":[104,189,189,101]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[56,52,164,168],"all_points_y":[71,226,224,72]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[52,178,165,224,220,159,169,48,53,3,8,57],"all_points_y":[10,15,72,67,237,222,283,288,226,243,49,71]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_88.jpg17219":{"filename":"IMG_88.jpg","size":17219,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[116,94,128,150],"all_points_y":[134,175,194,154]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[66,76,171,160],"all_points_y":[71,202,196,68]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[59,164,159,207,220,1
67,180,77,76,25,16,67],"all_points_y":[22,18,70,64,193,196,247,255,199,209,71,74]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_89.jpg13203":{"filename":"IMG_89.jpg","size":13203,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[46,52,79,71],"all_points_y":[145,156,137,127]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[31,35,106,100],"all_points_y":[84,192,185,85]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[31,101,99,132,138,102,106,38,37,1,0,32],"all_points_y":[44,48,86,85,185,186,222,228,191,198,76,84]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_90.jpg18293":{"filename":"IMG_90.jpg","size":18293,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[82,75,115,123],"all_points_y":[122,162,171,129]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[72,142,144,70],"all_points_y":[180,177,78,77]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[36,39,73,71,146,141,175,178,144,147,66,70],"all_points_y":[73,182,179,212,211,174,180,71,78,43,42,76]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_91.jpg18187":{"filename":"IMG_91.jpg","size":18187,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[65,67,96,93],"all_points_y":[158,225,223,158]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[58,61,152,146],"all_points_y":[111,238,233,106]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[48,147,145,186,194,149,158,59,62,17,15,59],"all_points_y":[74,68,110,100,240,231,281,286,235,248,108,112]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_92.jpg48632":{"filename":"IMG_92.jpg","size":48632,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[193,203,214,219,221,217,209,203,198,194,193],"all_points_y":[191,200,199,191,182,175,172,171,174,179,185]},"region_attributes":{"name":"item_circ"}},{"shape_attributes":{"name":"polygon","all_points_x":[111,204,326,216],"all_points_y":[124,284,204,53]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[80,198,214,212,361,357,333,337,196,206,200,131,47,112,113],"all_points_y":[84,7,52,7,206,211,211,200,295,295,299,300,132,123,115]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_93.jpg30568":{"filename":"IMG_93.jpg","size":30568,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[165,236,215,141],"all_points_y":[116,141,201,175]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[132,141,295,285],"all_points_y":[87,224,205,76]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[120,297,283,324,336,290,306,148,141,65,54,131],"all_points_y":[10,7,77,77,195,203,277,300,222,233,89,86]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_94.jpg38226":{"filename":"IMG_94.jpg","size":38226,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[181,170,264,276],"all_points_y":[114,178,195,125]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[141,131,293,304],"all_points_y":[86,196,218,97]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[88,79,132,116,289,291,349,36
3,301,313,131,144],"all_points_y":[76,194,195,244,272,214,226,97,99,49,32,84]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_95.jpg18135":{"filename":"IMG_95.jpg","size":18135,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[93,112,131,112],"all_points_y":[171,180,132,125]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[67,73,161,156],"all_points_y":[110,235,229,104]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[63,155,156,199,203,158,168,72,73,31,24,68],"all_points_y":[67,61,108,101,239,226,275,285,235,246,109,109]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_96.jpg30610":{"filename":"IMG_96.jpg","size":30610,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[199,206,249,242],"all_points_y":[153,170,150,136]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[123,179,295,238],"all_points_y":[152,253,184,83]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[89,207,238,279,332,295,328,225,203,178,127,70,122],"all_points_y":[100,30,84,63,155,184,239,300,299,252,280,184,153]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_97.jpg59317":{"filename":"IMG_97.jpg","size":59317,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[247,244,323,327],"all_points_y":[97,181,183,95]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[180,184,394,387],"all_points_y":[76,218,212,57]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[180,180,120,123,184,185,402,395,477,467,385,384,294],"all_points_y":[11,78,85,217,216,287,292,209,211,55,64,3,3]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_98.jpg44280":{"filename":"IMG_98.jpg","size":44280,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[146,164,197,177],"all_points_y":[153,223,213,145]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[23,113,333,295],"all_points_y":[189,62,121,297]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[143,351,334,375,380,340,300,271,2,1,24,1,1,82,110],"all_points_y":[11,53,120,53,148,287,299,298,195,186,189,171,82,2,62]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_99.jpg12953":{"filename":"IMG_99.jpg","size":12953,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[38,38,80,80],"all_points_y":[100,118,119,100]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[32,35,104,103],"all_points_y":[88,195,191,89]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[32,101,102,138,139,103,102,36,35,1,1,33],"all_points_y":[51,57,91,88,191,190,225,231,194,197,84,88]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_100.jpg44961":{"filename":"IMG_100.jpg","size":44961,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[169,184,242,224],"all_points_y":[113,100,174,187]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[101,330,288,66],"all_points_y":[44,83,260,193]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[80,367,341,291,296,291,109,9,65,3,2,36,99,59],"all_points_y":[
1,43,81,282,275,299,299,261,192,186,160,11,45,1]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_101.jpg19203":{"filename":"IMG_101.jpg","size":19203,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[98,142,144,99],"all_points_y":[106,105,181,181]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[165,167,68,62],"all_points_y":[85,227,230,84]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[223,224,219,166,171,60,64,7,14,67,62,176,167,225],"all_points_y":[201,202,77,85,27,28,82,80,240,231,280,283,226,237]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_102.jpg44827":{"filename":"IMG_102.jpg","size":44827,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[181,270,264,176],"all_points_y":[117,129,182,167]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[272,277,146,142],"all_points_y":[201,100,99,190]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[267,271,321,325,278,281,139,145,98,96,141,130],"all_points_y":[248,198,206,105,106,51,53,97,97,187,189,236]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_103.jpg43859":{"filename":"IMG_103.jpg","size":43859,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[148,183,177,141],"all_points_y":[100,105,146,138]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[97,266,230,99],"all_points_y":[44,58,235,239]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[272,357,293,230,243,92,99,97,79,72,100,94,297,96,103,272,276],"all_points_y":[28,49,269,232,293,299,239,239,299,13,11,41,60,41,10,28,36]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_104.jpg20819":{"filename":"IMG_104.jpg","size":20819,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[100,131,123,94],"all_points_y":[92,93,169,166]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[139,139,65,62],"all_points_y":[74,179,181,71]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[63,141,138,174,173,139,138,56,63,34,29,60],"all_points_y":[28,29,72,70,188,180,217,216,181,188,61,70]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_105.jpg23594":{"filename":"IMG_105.jpg","size":23594,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[123,140,99,82],"all_points_y":[124,182,189,132]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[154,162,80,73],"all_points_y":[92,205,210,95]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[207,159,165,80,80,35,33,75,69,154,152,194],"all_points_y":[203,205,248,251,210,215,91,94,56,52,91,83]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_106.jpg18173":{"filename":"IMG_106.jpg","size":18173,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[81,130,129,84],"all_points_y":[120,119,190,192]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[165,173,63,63],"all_points_y":[78,222,224,79]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[175,166,221,225,225,173,184,56,65,6,9,64,57],"all_points_y":[39,77,72,119,220,222,278,
282,223,226,76,80,38]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_107.jpg24766":{"filename":"IMG_107.jpg","size":24766,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[77,129,151,100],"all_points_y":[143,129,206,223]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[154,163,65,64],"all_points_y":[102,238,242,107]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[155,155,199,212,163,175,56,64,46,45,61,59],"all_points_y":[56,104,93,238,237,264,273,241,254,90,107,57]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_108.jpg27807":{"filename":"IMG_108.jpg","size":27807,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[103,113,117,118,118,115,109,103,99,97,95,94,94,95,98,99,100],"all_points_y":[127,128,131,136,144,149,152,152,152,150,147,145,142,138,131,131,129]},"region_attributes":{"name":"item_circ"}},{"shape_attributes":{"name":"polygon","all_points_x":[120,181,72,22],"all_points_y":[73,212,261,103]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[122,169,225,224,182,208,168,163,153,97,90,82,76,73,73,57,1,1,22,6,78,106,126,130],"all_points_y":[72,57,176,194,214,223,247,251,257,279,281,283,286,283,264,285,115,86,100,70,49,46,41,41]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_109.jpg22710":{"filename":"IMG_109.jpg","size":22710,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[77,126,125,81],"all_points_y":[145,145,208,206]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[153,157,64,68],"all_points_y":[96,222,223,96]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[202,157,166,54,66,48,50,67,65,157,153,195],"all_points_y":[225,223,244,246,221,231,79,91,50,50,97,86]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_110.jpg17364":{"filename":"IMG_110.jpg","size":17364,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[77,104,153,125],"all_points_y":[110,94,180,196]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[168,163,65,70],"all_points_y":[74,208,204,66]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[176,167,218,216,164,167,62,67,11,16,70,70],"all_points_y":[20,73,74,210,207,261,258,203,205,61,68,14]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_111.jpg15269":{"filename":"IMG_111.jpg","size":15269,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[48,95,106,57],"all_points_y":[116,109,175,184]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[40,107,110,41],"all_points_y":[98,100,198,199]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[43,105,107,137,141,105,109,41,41,3,8,41],"all_points_y":[70,70,98,100,195,197,237,236,198,200,97,98]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_112.jpg21597":{"filename":"IMG_112.jpg","size":21597,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[83,140,141,83],"all_points_y":[123,123,196,196]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[159,161,66,71],"all_points_y":[93,221,223,92]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polyg
on","all_points_x":[166,160,201,204,160,165,65,66,21,27,71,68],"all_points_y":[49,95,84,225,221,268,266,217,226,83,92,46]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_113.jpg19243":{"filename":"IMG_113.jpg","size":19243,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[137,112,137,157],"all_points_y":[117,138,163,132]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[170,170,77,83],"all_points_y":[112,242,240,110]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[81,175,168,214,217,169,178,69,79,36,44,83],"all_points_y":[66,65,113,104,251,240,290,287,236,247,102,111]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_114.jpg17093":{"filename":"IMG_114.jpg","size":17093,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[88,97,134,123],"all_points_y":[103,157,151,97]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[151,151,159,80,74],"all_points_y":[59,58,174,180,61]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[66,153,151,192,202,159,162,85,79,47,40,73],"all_points_y":[13,13,59,54,172,174,216,224,178,188,48,62]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_115.jpg29392":{"filename":"IMG_115.jpg","size":29392,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[116,117,166,166,117],"all_points_y":[128,128,128,148,149]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[205,77,11,143],"all_points_y":[148,243,143,64]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[174,224,224,207,206,224,224,72,76,2,10,0,1,131,143,145],"all_points_y":[32,99,136,145,148,146,154,267,247,133,142,129,78,8,63,66]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_116.jpg18564":{"filename":"IMG_116.jpg","size":18564,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[102,148,133,92],"all_points_y":[94,98,203,199]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[159,163,62,57],"all_points_y":[72,226,226,77]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[160,160,162,210,206,159,170,62,65,13,0,55,54],"all_points_y":[15,16,73,65,247,223,283,278,226,228,79,77,21]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_117.jpg17005":{"filename":"IMG_117.jpg","size":17005,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[102,113,110,98],"all_points_y":[131,132,173,170]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[143,151,59,56],"all_points_y":[98,198,202,100]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[55,140,142,186,198,151,151,64,61,3,8,56],"all_points_y":[56,55,96,88,194,198,237,244,203,203,101,101]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_118.jpg20674":{"filename":"IMG_118.jpg","size":20674,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[93,142,142,91],"all_points_y":[131,133,209,208]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[70,163,171,66],"all_points_y":[92,91,240,242]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[67,166,163
,213,225,224,170,171,69,66,19,27,68],"all_points_y":[40,39,92,89,218,237,239,298,300,242,252,74,93]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_119.jpg23138":{"filename":"IMG_119.jpg","size":23138,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[114,134,118,99],"all_points_y":[129,132,204,198]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[150,153,70,70],"all_points_y":[105,219,217,104]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[71,153,150,186,193,152,156,67,71,42,38,68,73],"all_points_y":[76,76,105,98,224,217,258,258,216,227,94,103,102]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_120.jpg33838":{"filename":"IMG_120.jpg","size":33838,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[158,227,222,153],"all_points_y":[97,103,183,185]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[127,233,226,117],"all_points_y":[88,94,244,240]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[240,235,283,277,225,231,109,119,57,75,128,128],"all_points_y":[43,92,90,253,240,292,295,241,245,77,86,36]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_121.jpg50287":{"filename":"IMG_121.jpg","size":50287,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[254,278,280,254],"all_points_y":[139,139,203,206]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[162,367,382,165],"all_points_y":[102,89,227,246]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[161,360,369,434,450,378,389,340,169,165,90,90,162],"all_points_y":[40,30,91,87,221,228,299,299,300,244,246,105,104]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_122.jpg55699":{"filename":"IMG_122.jpg","size":55699,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[209,360,363,213],"all_points_y":[101,98,212,223]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[172,407,403,173],"all_points_y":[82,86,235,240]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[173,401,404,474,474,403,400,175,175,93,89,172],"all_points_y":[5,12,86,90,235,235,299,299,240,242,85,83]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_123.jpg43650":{"filename":"IMG_123.jpg","size":43650,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[152,173,202,178],"all_points_y":[111,196,189,104]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[98,226,283,118],"all_points_y":[81,53,214,258]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[74,156,219,221,225,233,238,324,293,298,96,122,68,24,24,96,101],"all_points_y":[21,4,4,50,50,3,3,228,246,217,267,291,300,298,58,82,80]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_124.jpg13800":{"filename":"IMG_124.jpg","size":13800,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[58,58,86,86],"all_points_y":[132,165,164,132]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[109,110,45,43],"all_points_y":[88,185,189,83]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[43,10
7,108,138,139,110,110,44,45,9,8,43],"all_points_y":[50,55,87,88,182,184,218,223,188,191,82,86]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_125.jpg21059":{"filename":"IMG_125.jpg","size":21059,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[80,136,137,83],"all_points_y":[127,127,190,191]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[60,156,168,63],"all_points_y":[78,77,224,235]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[204,224,167,173,66,65,17,15,57,53,154,156],"all_points_y":[73,220,222,280,291,231,246,59,82,23,21,75]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_126.jpg28377":{"filename":"IMG_126.jpg","size":28377,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[116,145,130,99],"all_points_y":[114,123,194,187]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[36,139,190,89],"all_points_y":[73,50,193,237]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[44,91,101,214,224,224,167,140,152,30,38,1,1],"all_points_y":[269,237,240,192,190,182,14,48,4,24,72,65,144]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_127.jpg25215":{"filename":"IMG_127.jpg","size":25215,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[158,192,217,182],"all_points_y":[156,145,206,222]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[229,269,131,104],"all_points_y":[90,234,265,114]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[104,210,228,293,342,270,288,289,137,133,56,33,105],"all_points_y":[73,49,90,71,219,236,296,299,298,267,291,111,113]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_128.jpg19327":{"filename":"IMG_128.jpg","size":19327,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[91,164,162,96],"all_points_y":[80,78,189,191]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[73,168,166,80],"all_points_y":[73,73,201,201]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[67,173,169,189,186,169,175,72,78,67,60,73],"all_points_y":[25,21,72,63,220,202,237,233,201,217,66,70]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_129.jpg15895":{"filename":"IMG_129.jpg","size":15895,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[100,125,137,111],"all_points_y":[164,151,173,184]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[162,170,64,55],"all_points_y":[97,218,221,101]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[47,160,163,224,225,169,167,73,67,8,2,1,55],"all_points_y":[40,35,98,87,228,217,250,257,224,225,157,104,101]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_130.jpg24806":{"filename":"IMG_130.jpg","size":24806,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[96,106,121,112],"all_points_y":[123,144,135,117]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[34,167,219,58],"all_points_y":[38,28,225,265]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[25,61,52,107,210,208,224,224,164,179,26,35,8,1,2],"all_points_y":[298,264
,300,298,277,272,264,19,28,1,0,36,1,0,169]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_131.jpg31491":{"filename":"IMG_131.jpg","size":31491,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[154,238,239,155],"all_points_y":[139,140,201,198]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[147,320,323,145],"all_points_y":[85,80,208,204]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[89,90,147,138,330,320,388,387,319,333,133,148],"all_points_y":[74,208,202,260,267,204,214,74,82,23,28,83]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_132.jpg33547":{"filename":"IMG_132.jpg","size":33547,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[236,234,261,265],"all_points_y":[108,188,190,109]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[188,325,326,186],"all_points_y":[100,98,197,196]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[182,335,324,378,377,326,334,181,187,147,147,187],"all_points_y":[59,57,99,94,200,197,243,238,194,198,93,97]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_133.jpg17878":{"filename":"IMG_133.jpg","size":17878,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[95,160,142,81],"all_points_y":[102,119,184,170]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[58,170,160,63],"all_points_y":[65,69,209,206]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[45,178,172,223,214,160,165,52,65,11,1,57],"all_points_y":[17,15,69,67,215,210,254,247,206,210,66,66]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_134.jpg18332":{"filename":"IMG_134.jpg","size":18332,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[72,137,138,69],"all_points_y":[89,91,195,196]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[63,149,153,65],"all_points_y":[75,76,197,199]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[56,155,150,162,167,153,161,57,64,45,46,63],"all_points_y":[38,40,75,56,200,197,241,245,199,204,56,75]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_135.jpg54041":{"filename":"IMG_135.jpg","size":54041,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[233,270,287,250],"all_points_y":[149,116,137,169]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[154,364,378,152],"all_points_y":[64,59,199,212]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[360,367,435,452,373,385,152,150,74,82,154,157],"all_points_y":[0,60,61,192,201,276,289,210,213,70,67,4]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_136.jpg13267":{"filename":"IMG_136.jpg","size":13267,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[71,53,71,91],"all_points_y":[149,178,189,160]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[33,95,103,36],"all_points_y":[115,112,206,211]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[94,96,125,136,103,106,37,35,1,3,32,35],"all_points_y":[83,111,111,204,206,242,250,211,214,108,113,83]},"region_attributes":{"nam
e":"outerbox"}}],"file_attributes":{}},"IMG_137.jpg21402":{"filename":"IMG_137.jpg","size":21402,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[70,71,115,115,71],"all_points_y":[108,108,106,169,170]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[58,131,127,164,161,126,124,51,55,30,29,57],"all_points_y":[60,66,100,102,206,201,232,228,196,205,90,96]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[129,128,126,55,55,125],"all_points_y":[108,102,201,196,94,99]},"region_attributes":{"name":"innerbox"}}],"file_attributes":{}},"IMG_138.jpg26859":{"filename":"IMG_138.jpg","size":26859,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[128,134,157,150],"all_points_y":[198,221,217,194]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[22,142,224,224,106],"all_points_y":[100,56,202,227,300]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[148,138,187,192,223,223,225,224,199,69,2,2,18,21,2,2,37],"all_points_y":[1,54,35,35,80,196,228,286,300,300,139,87,100,99,59,51,36]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_139.jpg13632":{"filename":"IMG_139.jpg","size":13632,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[41,74,77,43],"all_points_y":[99,99,143,146]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[37,37,101,99,39],"all_points_y":[78,77,81,175,180]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[34,101,99,132,131,99,103,40,39,1,1,34],"all_points_y":[42,48,79,79,178,176,206,214,182,185,74,77]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_140.jpg24619":{"filename":"IMG_140.jpg","size":24619,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[61,132,141,68],"all_points_y":[116,111,201,207]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[48,142,149,51],"all_points_y":[99,96,231,236]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[42,143,142,186,198,147,156,36,50,27,26,47],"all_points_y":[52,50,95,86,234,229,257,266,235,250,84,100]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_141.jpg35744":{"filename":"IMG_141.jpg","size":35744,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[193,125,138,207],"all_points_y":[141,216,227,148]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[245,245,297,83,42],"all_points_y":[75,76,210,282,133]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[12,34,73,65,101,333,294,295,343,294,284,252,247,240],"all_points_y":[69,117,284,300,297,222,212,208,203,67,49,76,74,3]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_142.jpg14503":{"filename":"IMG_142.jpg","size":14503,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[61,91,91,63],"all_points_y":[129,129,184,182]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[43,112,118,43],"all_points_y":[103,100,201,205]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[42,107,108,144,143,145,119,117,45,45,8,9,41],"all_points_y":[70,66,98,100,132,201,200,238,243,205,208,102,102]},"region_attribu
tes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_143.jpg52315":{"filename":"IMG_143.jpg","size":52315,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[318,343,352,356,359,354,351,347,336,324,309,304,291,288,288,287,287,293,300,304],"all_points_y":[85,93,101,112,121,137,143,153,156,158,156,154,141,137,127,120,108,98,93,89]},"region_attributes":{"name":"item_circ"}},{"shape_attributes":{"name":"polygon","all_points_x":[377,377,394,172,164],"all_points_y":[41,40,179,198,53]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[446,468,392,403,173,175,98,91,165,164,370,377],"all_points_y":[35,171,176,254,278,198,207,63,53,1,1,37]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_144.jpg26901":{"filename":"IMG_144.jpg","size":26901,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[194,174,195,216],"all_points_y":[134,198,205,142]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[283,183,106,210],"all_points_y":[171,260,169,84]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[250,314,285,328,236,216,186,143,65,107,63,172,210,210],"all_points_y":[57,134,170,217,299,299,259,297,204,171,125,34,83,79]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_145.jpg26898":{"filename":"IMG_145.jpg","size":26898,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[106,127,134,107],"all_points_y":[111,111,187,190]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[155,151,59,67],"all_points_y":[90,215,210,83]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[67,161,157,190,194,152,157,52,61,17,28,67],"all_points_y":[38,47,90,78,224,212,245,241,208,213,66,84]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_146.jpg19663":{"filename":"IMG_146.jpg","size":19663,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[82,137,158,101],"all_points_y":[148,131,198,216]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[68,167,168,65],"all_points_y":[94,92,231,237]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[65,170,167,219,219,168,175,60,65,17,19,69],"all_points_y":[41,43,95,85,242,230,289,290,235,244,87,93]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_147.jpg20190":{"filename":"IMG_147.jpg","size":20190,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[88,151,148,87],"all_points_y":[82,85,160,158]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[58,165,156,62],"all_points_y":[70,69,221,216]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[59,167,166,212,195,155,158,58,63,14,5,57],"all_points_y":[13,12,72,66,241,218,273,268,214,218,68,69]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_148.jpg28133":{"filename":"IMG_148.jpg","size":28133,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[278,303,295,271],"all_points_y":[74,80,109,102]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[160,314,312,162],"all_points_y":[72,64,199,201]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[111,160,156,317,315,387,387,315,319,16
4,165,113],"all_points_y":[76,72,1,1,66,63,198,198,271,269,198,196]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_149.jpg19729":{"filename":"IMG_149.jpg","size":19729,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[100,123,111,89],"all_points_y":[108,113,188,185]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[68,69,165,162,69],"all_points_y":[70,71,69,201,202]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[56,170,165,166,182,179,162,166,65,71,26,21,66],"all_points_y":[45,41,67,69,55,217,199,252,250,201,211,65,69]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}}},"_via_attributes":{"region":{"name":{"type":"dropdown","description":"","options":{"outerbox":"","innerbox":"","item_sq":"","item_rect":"","item_rect_slim":"","item_circ":""},"default_options":{}}},"file":{}}}
\ No newline at end of file
diff --git a/mask_rcnn/dataset/VAL-MINI.json b/mask_rcnn/dataset/VAL-MINI.json
new file mode 100644
index 00000000..e6284959
--- /dev/null
+++ b/mask_rcnn/dataset/VAL-MINI.json
@@ -0,0 +1 @@
+{"_via_settings":{"ui":{"annotation_editor_height":25,"annotation_editor_fontsize":0.8,"leftsidebar_width":18,"image_grid":{"img_height":80,"rshape_fill":"none","rshape_fill_opacity":0.3,"rshape_stroke":"yellow","rshape_stroke_width":2,"show_region_shape":true,"show_image_policy":"all"},"image":{"region_label":"name","region_color":"__via_default_region_color__","region_label_font":"10px Sans","on_image_annotation_editor_placement":"NEAR_REGION"}},"core":{"buffer_size":"18","filepath":{},"default_filepath":"val/"},"project":{"name":"VAL"}},"_via_img_metadata":{"IMG_150.jpg31278":{"filename":"IMG_150.jpg","size":31278,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[138,139,226,226],"all_points_y":[125,185,187,124]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[127,129,310,304],"all_points_y":[66,192,193,62]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[70,70,130,121,316,305,373,368,301,315,116,128],"all_points_y":[58,195,188,248,249,189,195,53,65,3,10,68]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_151.jpg16222":{"filename":"IMG_151.jpg","size":16222,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[86,87,122,120],"all_points_y":[114,161,161,113]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[56,56,169,166],"all_points_y":[72,196,196,71]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[3,1,59,54,169,166,223,224,159,156,62,58],"all_points_y":[58,200,196,254,254,193,195,67,72,38,40,74]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_152.jpg13817":{"filename":"IMG_152.jpg","size":13817,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[71,73,93,90],"all_points_y":[92,119,116,91]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[42,43,114,113],"all_points_y":[75,188,183,77]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[5,7,46,45,111,112,140,138,110,109,41,42],"all_points_y":[74,191,187,223,216,180,180,82,81,46,40,78]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_153.jpg14604":{"filename":"IMG_153.jpg","size":14604,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[48,50,90,86],"all_points_y":[98,150,150,98]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[41,42,122,112],"all_points_y":[77,180,179,74]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[9,6,44,44,119,116,144,142,110,105,43,41],"all_points_y":[78,182,180,220,216,177,176,76,76,45,46,77]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_154.jpg13797":{"filename":"IMG_154.jpg","size":13797,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[28,32,105,104],"all_points_y":[114,216,217,112]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[36,101,100,134,139,102,104,31,30,1,4,35],"all_points_y":[244,247,214,218,114,115,75,77,115,115,213,214]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[60,74,83,84,79,62,55,52,52],"all_points_y":[146,148,154,165,170,169,165,155,149]},"region_attributes":{"name":"item_circ"}}],"file_attributes":{}},"IMG_155.jpg29096":{"filename":"IMG_155.jpg","size":29096,"regions":[{"s
hape_attributes":{"name":"polygon","all_points_x":[170,153,250,266],"all_points_y":[98,188,203,114]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[115,129,304,285],"all_points_y":[84,237,215,64]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[44,54,132,135,268,315,300,354,335,285,277,106,114],"all_points_y":[96,239,231,298,300,296,206,200,69,68,1,9,86]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_156.jpg40095":{"filename":"IMG_156.jpg","size":40095,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[160,203,224,174],"all_points_y":[123,186,170,112]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[112,105,312,306],"all_points_y":[90,227,238,97]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[91,78,108,74,211,337,306,344,348,340,303,308,118,112],"all_points_y":[70,233,221,256,263,264,230,246,138,81,104,33,28,92]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_157.jpg29987":{"filename":"IMG_157.jpg","size":29987,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[250,261,284,278],"all_points_y":[114,176,175,109]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[170,172,319,317],"all_points_y":[79,207,203,75]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[120,126,175,176,322,318,384,382,316,320,169,170],"all_points_y":[88,200,206,273,268,199,202,77,77,8,10,84]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_158.jpg20022":{"filename":"IMG_158.jpg","size":20022,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[79,91,144,130],"all_points_y":[84,170,163,78]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[65,66,160,155],"all_points_y":[66,198,196,62]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[19,19,69,66,163,158,203,199,155,158,60,66],"all_points_y":[60,202,194,242,242,192,195,53,63,15,21,71]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_159.jpg23088":{"filename":"IMG_159.jpg","size":23088,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[101,93,126,133],"all_points_y":[133,192,197,136]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[79,77,158,152],"all_points_y":[124,231,230,124]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[48,41,81,76,160,155,187,174,148,152,80,80],"all_points_y":[116,232,228,252,252,226,231,117,126,92,92,126]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_160.jpg14487":{"filename":"IMG_160.jpg","size":14487,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[46,48,92,88],"all_points_y":[118,165,163,113]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[37,41,114,113],"all_points_y":[81,199,191,81]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[42,111,112,143,144,112,112,44,42,3,1,40],"all_points_y":[45,48,85,86,188,190,225,233,194,197,81,82]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_161.jpg35869":{"filename":"IMG_161.jpg","size":35869,"regions":[{"shape_attributes":{"name":"polygon","al
l_points_x":[168,167,282,280],"all_points_y":[112,192,192,108]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[132,131,292,292],"all_points_y":[90,203,205,87]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[79,76,132,122,292,289,349,347,288,293,121,135],"all_points_y":[93,201,200,258,265,201,210,84,91,26,42,95]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_162.jpg42329":{"filename":"IMG_162.jpg","size":42329,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[157,161,280,276],"all_points_y":[115,199,193,105]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[126,131,311,303],"all_points_y":[99,222,221,90]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[63,69,132,113,320,305,341,334,299,303,112,127],"all_points_y":[100,232,219,246,245,216,229,79,94,30,44,103]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_163.jpg24084":{"filename":"IMG_163.jpg","size":24084,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[89,90,134,132],"all_points_y":[110,170,168,108]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[71,73,144,146],"all_points_y":[93,193,196,93]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[73,146,146,185,176,140,142,70,74,38,35,74],"all_points_y":[58,60,97,96,203,195,229,226,190,197,92,94]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_164.jpg46002":{"filename":"IMG_164.jpg","size":46002,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[104,114,242,241],"all_points_y":[79,190,182,74]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[73,101,315,302],"all_points_y":[68,231,198,50]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[37,47,56,72,100,107,161,321,312,355,357,348,299,346,195,43,73],"all_points_y":[62,192,192,264,226,300,297,268,197,220,118,40,54,15,20,38,70]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_165.jpg23943":{"filename":"IMG_165.jpg","size":23943,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[78,80,144,136],"all_points_y":[119,205,200,114]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[74,73,168,160],"all_points_y":[105,233,227,102]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[36,31,75,73,177,164,188,180,158,170,71,74],"all_points_y":[98,237,231,277,270,223,232,90,105,76,78,106]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_166.jpg27222":{"filename":"IMG_166.jpg","size":27222,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[75,142,146,128,72,67],"all_points_y":[124,132,160,165,162,142]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[49,72,196,157],"all_points_y":[69,248,221,62]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[24,41,51,74,70,144,176,177,218,224,224,191,224,223,204,155,175,43,50],"all_points_y":[32,218,263,243,267,257,252,247,234,232,225,216,214,113,54,62,23,27,72]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_167.jpg17439":{"filename":"IMG_167.jpg","size":17439,"regions":[{"
shape_attributes":{"name":"polygon","all_points_x":[123,117,145,151],"all_points_y":[160,183,188,166]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[40,67,187,157],"all_points_y":[151,252,219,116]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[21,139,156,195,220,183,202,106,80,69,14,1,1,38],"all_points_y":[99,62,118,107,197,218,271,298,298,248,265,216,163,152]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_168.jpg17812":{"filename":"IMG_168.jpg","size":17812,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[108,105,136,134],"all_points_y":[89,157,156,92]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[66,70,167,161],"all_points_y":[67,178,176,63]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[16,20,72,76,162,162,215,211,161,160,65,68],"all_points_y":[67,181,176,210,211,173,176,52,67,13,19,70]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_169.jpg24933":{"filename":"IMG_169.jpg","size":24933,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[116,108,130,137],"all_points_y":[126,188,192,130]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[66,64,162,159],"all_points_y":[92,222,224,96]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[66,160,155,202,208,160,156,156,62,68,64,17,21,70],"all_points_y":[48,50,98,88,226,222,223,271,268,218,218,222,84,95]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_170.jpg40002":{"filename":"IMG_170.jpg","size":40002,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[180,236,255,195],"all_points_y":[208,162,185,230]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[86,77,306,303],"all_points_y":[96,248,262,107]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[58,40,40,79,44,180,334,301,347,354,344,300,306,90,89],"all_points_y":[75,204,265,248,290,299,299,258,281,162,92,112,36,23,96]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_171.jpg17521":{"filename":"IMG_171.jpg","size":17521,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[93,98,133,128],"all_points_y":[106,158,155,103]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[30,38,163,160],"all_points_y":[92,203,199,86]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[25,163,159,216,216,162,164,41,39,5,1,32],"all_points_y":[32,27,89,90,193,198,251,256,199,194,100,94]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_172.jpg30798":{"filename":"IMG_172.jpg","size":30798,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[202,178,207,255],"all_points_y":[96,157,180,140]},"region_attributes":{"name":"item_sq"}},{"shape_attributes":{"name":"polygon","all_points_x":[144,154,290,278],"all_points_y":[87,208,196,76]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[82,95,155,160,294,284,329,314,275,284,136,144],"all_points_y":[92,209,207,270,254,192,182,82,81,19,29,90]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_173.jpg23233":{"filename":"IMG_173.jpg","size":23233,"regions":[{"shape_attributes
":{"name":"polygon","all_points_x":[88,91,127,124],"all_points_y":[103,160,159,101]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[66,72,165,164],"all_points_y":[70,204,201,69]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[20,30,74,68,168,162,181,184,162,174,57,70],"all_points_y":[68,214,203,251,249,200,218,61,72,44,51,73]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_174.jpg28656":{"filename":"IMG_174.jpg","size":28656,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[76,108,107,74],"all_points_y":[130,130,145,143]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[12,94,205,109],"all_points_y":[109,269,194,65]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[112,109,150,224,224,202,223,224,181,105,95,81,35,8,0,1,16,0,1],"all_points_y":[26,70,48,132,178,194,188,198,236,282,270,284,207,154,132,99,112,82,64]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_175.jpg18443":{"filename":"IMG_175.jpg","size":18443,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[68,61,175,166],"all_points_y":[88,233,236,90]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[14,2,63,51,184,172,222,224,218,164,175,63,71],"all_points_y":[85,232,231,286,290,235,236,146,89,94,52,50,89]},"region_attributes":{"name":"outerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[92,89,87,91,99,108,116,129,139,142,144,143,138,132,124,108,97],"all_points_y":[145,161,175,183,198,207,209,208,201,189,178,162,150,142,136,134,138]},"region_attributes":{"name":"item_circ"}}],"file_attributes":{}},"IMG_176.jpg24093":{"filename":"IMG_176.jpg","size":24093,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[95,92,112,109],"all_points_y":[118,195,193,118]},"region_attributes":{"name":"item_rect_slim"}},{"shape_attributes":{"name":"polygon","all_points_x":[73,76,162,159],"all_points_y":[98,219,217,95]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[36,35,78,72,164,159,174,171,155,163,68,74],"all_points_y":[99,223,217,259,256,213,225,86,99,73,78,101]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_177.jpg17580":{"filename":"IMG_177.jpg","size":17580,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[113,116,159,156],"all_points_y":[110,163,162,110]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[81,86,163,157],"all_points_y":[109,219,214,105]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[48,50,88,84,166,160,197,193,155,157,79,82],"all_points_y":[109,225,217,255,252,213,217,104,107,70,73,111]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_178.jpg22572":{"filename":"IMG_178.jpg","size":22572,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[89,88,128,127],"all_points_y":[133,189,189,134]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[72,70,160,162],"all_points_y":[101,234,232,103]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[29,26,70,65,166,159,204,204,160,168,69,73],"all_points_y":[100,240,231,280,275,229,241,102,106,64,65,105]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}}
,"IMG_179.jpg14341":{"filename":"IMG_179.jpg","size":14341,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[52,54,91,88],"all_points_y":[126,154,152,125]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[43,45,118,117],"all_points_y":[81,197,194,82]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[4,43,44,113,116,144,144,116,115,47,45,6],"all_points_y":[78,80,42,48,86,88,188,191,227,234,195,199]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_180.jpg23144":{"filename":"IMG_180.jpg","size":23144,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[104,104,134,133],"all_points_y":[132,173,174,134]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[81,79,156,161],"all_points_y":[95,208,210,99]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[47,44,83,73,157,152,156,187,190,159,165,79,82],"all_points_y":[92,214,204,234,238,207,205,221,97,102,63,60,98]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}},"IMG_181.jpg14152":{"filename":"IMG_181.jpg","size":14152,"regions":[{"shape_attributes":{"name":"polygon","all_points_x":[64,66,97,95],"all_points_y":[149,188,185,144]},"region_attributes":{"name":"item_rect"}},{"shape_attributes":{"name":"polygon","all_points_x":[35,38,109,106],"all_points_y":[90,202,193,90]},"region_attributes":{"name":"innerbox"}},{"shape_attributes":{"name":"polygon","all_points_x":[38,107,105,136,140,105,108,43,41,38,5,2,38],"all_points_y":[49,55,92,91,193,192,228,236,201,199,209,82,90]},"region_attributes":{"name":"outerbox"}}],"file_attributes":{}}},"_via_attributes":{"region":{"name":{"type":"dropdown","description":"","options":{"outerbox":"","innerbox":"","item_sq":"","item_rect":"","item_rect_slim":"","item_circ":""},"default_options":{}}},"file":{}}}
\ No newline at end of file
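(Editor's note, not part of the patch: the two VIA project files added above, TRAIN-MINI.json and VAL-MINI.json, store each image's annotations under `_via_img_metadata` as named polygon regions — `outerbox`, `innerbox`, and `item_*` classes — with `all_points_x`/`all_points_y` vertex lists. As a rough illustration of that data structure only, and not code from this repository, the sketch below loads a VIA project file and rasterises one polygon into a boolean mask. The file path, image size, and the use of scikit-image for rasterisation are assumptions.)

```
# Minimal sketch (illustrative, not repository code): parse VIA polygon
# annotations and turn one region into a boolean mask.
import json
import numpy as np
from skimage.draw import polygon  # assumed helper for rasterising polygons


def load_via_regions(annotation_path):
    """Return {filename: [(class_name, xs, ys), ...]} from a VIA project file."""
    with open(annotation_path) as f:
        project = json.load(f)
    regions_by_image = {}
    for entry in project["_via_img_metadata"].values():
        regions = []
        for region in entry["regions"]:
            shape = region["shape_attributes"]            # polygon vertices
            label = region["region_attributes"]["name"]   # outerbox / innerbox / item_*
            regions.append((label, shape["all_points_x"], shape["all_points_y"]))
        regions_by_image[entry["filename"]] = regions
    return regions_by_image


def polygon_mask(xs, ys, height, width):
    """Rasterise one polygon into a boolean mask of the given image size."""
    mask = np.zeros((height, width), dtype=bool)
    rr, cc = polygon(ys, xs, shape=(height, width))  # rows = y, cols = x
    mask[rr, cc] = True
    return mask


# Example usage (path and image dimensions are assumptions):
# regions = load_via_regions("dataset/VAL-MINI.json")
# label, xs, ys = regions["IMG_150.jpg"][0]
# mask = polygon_mask(xs, ys, height=300, width=400)
```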
diff --git a/mask_rcnn/dataset/val_img_results/Figure_1.png b/mask_rcnn/dataset/val_img_results/Figure_1.png
new file mode 100644
index 00000000..ec7ae97f
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_1.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_10.png b/mask_rcnn/dataset/val_img_results/Figure_10.png
new file mode 100644
index 00000000..eac33a4d
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_10.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_11.png b/mask_rcnn/dataset/val_img_results/Figure_11.png
new file mode 100644
index 00000000..dd77bdae
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_11.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_12.png b/mask_rcnn/dataset/val_img_results/Figure_12.png
new file mode 100644
index 00000000..02e8d818
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_12.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_13.png b/mask_rcnn/dataset/val_img_results/Figure_13.png
new file mode 100644
index 00000000..f073487a
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_13.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_14.png b/mask_rcnn/dataset/val_img_results/Figure_14.png
new file mode 100644
index 00000000..934d874a
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_14.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_15.png b/mask_rcnn/dataset/val_img_results/Figure_15.png
new file mode 100644
index 00000000..733dc30f
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_15.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_16.png b/mask_rcnn/dataset/val_img_results/Figure_16.png
new file mode 100644
index 00000000..6e9b4961
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_16.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_17.png b/mask_rcnn/dataset/val_img_results/Figure_17.png
new file mode 100644
index 00000000..88f1028b
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_17.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_18.png b/mask_rcnn/dataset/val_img_results/Figure_18.png
new file mode 100644
index 00000000..e24b821c
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_18.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_19.png b/mask_rcnn/dataset/val_img_results/Figure_19.png
new file mode 100644
index 00000000..34adaec8
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_19.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_2.png b/mask_rcnn/dataset/val_img_results/Figure_2.png
new file mode 100644
index 00000000..995faede
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_2.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_20.png b/mask_rcnn/dataset/val_img_results/Figure_20.png
new file mode 100644
index 00000000..76946653
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_20.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_21.png b/mask_rcnn/dataset/val_img_results/Figure_21.png
new file mode 100644
index 00000000..90b8dd19
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_21.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_22.png b/mask_rcnn/dataset/val_img_results/Figure_22.png
new file mode 100644
index 00000000..3d48ba55
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_22.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_23.png b/mask_rcnn/dataset/val_img_results/Figure_23.png
new file mode 100644
index 00000000..0b175fdb
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_23.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_24.png b/mask_rcnn/dataset/val_img_results/Figure_24.png
new file mode 100644
index 00000000..25070069
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_24.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_25.png b/mask_rcnn/dataset/val_img_results/Figure_25.png
new file mode 100644
index 00000000..a05a9aae
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_25.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_26.png b/mask_rcnn/dataset/val_img_results/Figure_26.png
new file mode 100644
index 00000000..ac1ab512
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_26.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_27.png b/mask_rcnn/dataset/val_img_results/Figure_27.png
new file mode 100644
index 00000000..721770fb
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_27.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_28.png b/mask_rcnn/dataset/val_img_results/Figure_28.png
new file mode 100644
index 00000000..94dfe667
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_28.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_29.png b/mask_rcnn/dataset/val_img_results/Figure_29.png
new file mode 100644
index 00000000..109a5cf9
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_29.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_3.png b/mask_rcnn/dataset/val_img_results/Figure_3.png
new file mode 100644
index 00000000..d761ce2e
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_3.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_30.png b/mask_rcnn/dataset/val_img_results/Figure_30.png
new file mode 100644
index 00000000..75186b3c
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_30.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_4.png b/mask_rcnn/dataset/val_img_results/Figure_4.png
new file mode 100644
index 00000000..f2ca7041
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_4.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_5.png b/mask_rcnn/dataset/val_img_results/Figure_5.png
new file mode 100644
index 00000000..dcaad0f6
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_5.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_6.png b/mask_rcnn/dataset/val_img_results/Figure_6.png
new file mode 100644
index 00000000..a0bb395f
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_6.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_7.png b/mask_rcnn/dataset/val_img_results/Figure_7.png
new file mode 100644
index 00000000..feb4ce38
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_7.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_8.png b/mask_rcnn/dataset/val_img_results/Figure_8.png
new file mode 100644
index 00000000..9ff3b2bb
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_8.png differ
diff --git a/mask_rcnn/dataset/val_img_results/Figure_9.png b/mask_rcnn/dataset/val_img_results/Figure_9.png
new file mode 100644
index 00000000..2fc94c9a
Binary files /dev/null and b/mask_rcnn/dataset/val_img_results/Figure_9.png differ
diff --git a/mask_rcnn/dataset/via.html b/mask_rcnn/dataset/via.html
new file mode 100644
index 00000000..8f538b06
--- /dev/null
+++ b/mask_rcnn/dataset/via.html
@@ -0,0 +1,10946 @@
+[via.html body omitted: single-file VGG Image Annotator (VIA) application
+ (HTML, CSS and JavaScript, ~10,946 lines). The stripped text covered the
+ keyboard-shortcut reference, project settings help, the getting-started and
+ annotation guide, and the BSD-2-Clause license notice, Copyright (c)
+ 2016-2019, Abhishek Dutta, Visual Geometry Group, Oxford University and
+ VIA Contributors.]
diff --git a/mask_rcnn/eval_on_val_set.py b/mask_rcnn/eval_on_val_set.py
new file mode 100644
index 00000000..2d4b6141
--- /dev/null
+++ b/mask_rcnn/eval_on_val_set.py
@@ -0,0 +1,266 @@
+from mrcnn.model import log
+import mrcnn.model as modellib
+from mrcnn.visualize import display_images
+import mrcnn.visualize as visualize
+import mrcnn.utils as utils
+from mrcnn.config import Config
+import sys
+import random
+import math
+import re
+import time
+import numpy as np
+import tensorflow as tf
+import matplotlib
+import matplotlib.pyplot as plt
+import matplotlib.patches as patches
+import os
+import json
+import datetime
+import skimage.draw
+import skimage.io
+import cv2
+
+# TODO: update this path
+PP_WEIGHTS_PATH = "models/mask_rcnn_pointless_package_0050.h5"
+
+
+class PPConfig(Config):
+ """Configuration for training on the toy dataset.
+ Derives from the base Config class and overrides some values.
+ """
+ # Give the configuration a recognizable name
+ NAME = "pointless_package"
+
+    # Process one image at a time for inference. A 12GB GPU can typically
+    # fit two 1024x1024 images; adjust to match your GPU memory.
+    IMAGES_PER_GPU = 1
+
+ # Number of classes (including background)
+ # Background + outerbox + innerbox + item_rect + item_rect_slim + item_sq + item_circ
+ NUM_CLASSES = 1 + 6
+
+ # Number of training steps per epoch
+ STEPS_PER_EPOCH = 100
+
+    # Skip detections with < 75% confidence
+    DETECTION_MIN_CONFIDENCE = 0.75
+
+class PPDataset(utils.Dataset):
+
+ def load_dataset(self, dataset_dir, subset):
+ """Load a subset of the Balloon dataset.
+ dataset_dir: Root directory of the dataset.
+ subset: Subset to load: train or val
+ """
+        # Add classes. We have six classes (plus background).
+ self.add_class("pointless_package", 1, "outerbox")
+ self.add_class("pointless_package", 2, "innerbox")
+ self.add_class("pointless_package", 3, "item_sq")
+ self.add_class("pointless_package", 4, "item_rect")
+ self.add_class("pointless_package", 5, "item_rect_slim")
+ self.add_class("pointless_package", 6, "item_circ")
+
+ # Train or validation dataset?
+ assert subset in ["train", "val"]
+ dataset_dir = os.path.join(dataset_dir, subset)
+
+ # Load annotations
+ # VGG Image Annotator (up to version 1.6) saves each image in the form:
+ # { 'filename': '28503151_5b5b7ec140_b.jpg',
+ # 'regions': {
+ # '0': {
+ # 'region_attributes': {},
+ # 'shape_attributes': {
+ # 'all_points_x': [...],
+ # 'all_points_y': [...],
+ # 'name': 'polygon'}},
+ # ... more regions ...
+ # },
+ # 'size': 100202
+ # }
+ # We mostly care about the x and y coordinates of each region
+ # Note: In VIA 2.0, regions was changed from a dict to a list.
+ annotations = json.load(
+ open(os.path.join(dataset_dir, "via_region_data.json")))
+ annotations = list(annotations.values()) # don't need the dict keys
+
+ # The VIA tool saves images in the JSON even if they don't have any
+ # annotations. Skip unannotated images.
+ annotations = [a for a in annotations if a['regions']]
+
+ # Add images
+ for a in annotations:
+            # Get the x, y coordinates of the polygon points that make up
+            # the outline of each object instance. These are stored in the
+            # shape_attributes (see JSON format above).
+ # The if condition is needed to support VIA versions 1.x and 2.x.
+ if type(a['regions']) is dict:
+ polygons = [r['shape_attributes']
+ for r in a['regions'].values()]
+ else:
+ polygons = [r['shape_attributes'] for r in a['regions']]
+
+ # load_mask() needs the image size to convert polygons to masks.
+ # Unfortunately, VIA doesn't include it in JSON, so we must read
+            # the image. This is only manageable since the dataset is tiny.
+ image_path = os.path.join(dataset_dir, a['filename'])
+ image = skimage.io.imread(image_path)
+ height, width = image.shape[:2]
+
+ class_list = [r['region_attributes'] for r in a['regions']]
+
+ self.add_image(
+ "pointless_package",
+ image_id=a['filename'], # use file name as a unique image id
+ path=image_path,
+ width=width, height=height,
+ class_list=class_list,
+ polygons=polygons)
+
+ def load_mask(self, image_id):
+ """Generate instance masks for an image.
+ Returns:
+ masks: A bool array of shape [height, width, instance count] with
+ one mask per instance.
+ class_ids: a 1D array of class IDs of the instance masks.
+ """
+ class_ids = list()
+ # If not a pointless_package dataset image, delegate to parent class.
+ image_info = self.image_info[image_id]
+ # if image_info["source"] != "pointless_package":
+ # return super(self.__class__, self).load_mask(image_id)
+
+ # Convert polygons to a bitmap mask of shape
+ # [height, width, instance_count]
+ info = self.image_info[image_id]
+ # print("\n\n\nIMAGE INFO:", info, "\n\n\n\n")
+
+ for box_type in info['class_list']:
+ # print(box_type['name'])
+ class_ids.append(self.class_names.index(str(box_type['name'])))
+ # print(class_ids)
+ # print(self.class_names)
+
+ mask = np.zeros([info["height"], info["width"], len(info["polygons"])],
+ dtype=np.uint8)
+ for i, p in enumerate(info["polygons"]):
+ # Get indexes of pixels inside the polygon and set them to 1
+ rr, cc = skimage.draw.polygon(p['all_points_y'], p['all_points_x'])
+ mask[rr, cc, i] = 1
+        # Return the mask and an array with the class ID of each instance,
+        # as collected from the region attributes above.
+ return mask.astype(np.bool), np.asarray(class_ids, dtype=np.int32)
+
+ def image_reference(self, image_id):
+ """Return the path of the image."""
+ info = self.image_info[image_id]
+ if info["source"] == "pointless_package":
+ return info["path"]
+ else:
+            return super(self.__class__, self).image_reference(image_id)
+
+
+config = PPConfig()
+ROOT_DIR = os.getcwd()
+PP_DIR = os.path.join(ROOT_DIR, "dataset/")
+
+# Override the training configurations with a few
+# changes for inference.
+class InferenceConfig(config.__class__):
+ # Run detection on one image at a time
+ GPU_COUNT = 1
+ IMAGES_PER_GPU = 1
+
+config = InferenceConfig()
+config.display()
+
+# Device to load the neural network on.
+# Useful if you're training a model on the same
+# machine, in which case use CPU and leave the
+# GPU for training.
+DEVICE = "/cpu:0" # /cpu:0 or /gpu:0
+
+# Inspect the model in training or inference modes
+# values: 'inference' or 'training'
+# TODO: code for 'training' test mode not ready yet
+TEST_MODE = "inference"
+
+
+def get_ax(rows=1, cols=1, size=16):
+ """Return a Matplotlib Axes array to be used in
+ all visualizations in the notebook. Provide a
+ central point to control graph sizes.
+
+ Adjust the size attribute to control how big to render images
+ """
+ _, ax = plt.subplots(rows, cols, figsize=(size*cols, size*rows))
+ return ax
+
+
+MY_ABS_PATH = "./"
+my_model_dir = MY_ABS_PATH + 'models/'
+
+# Load validation dataset
+dataset = PPDataset()
+dataset.load_dataset(PP_DIR, "val")
+
+# Must call before using the dataset
+dataset.prepare()
+
+print("Images: {}\nClasses: {}".format(
+ len(dataset.image_ids), dataset.class_names))
+
+# Create model in inference mode
+with tf.device(DEVICE):
+ model = modellib.MaskRCNN(mode="inference", model_dir=my_model_dir,
+ config=config)
+
+# Set path to the trained pointless-packaging weights file
+
+# Download the trained model (see the README), place it under models/, e.g.
+# weights_path = "models/mask_rcnn_pointless_package_0050.h5"
+
+# Or, load the last model you trained
+# weights_path = model.find_last()[1]
+weights_path = PP_WEIGHTS_PATH
+
+# Load weights
+print("Loading weights ", weights_path)
+model.load_weights(weights_path, by_name=True)
+
+# print(dataset.image_ids)
+# image_id = random.choice(dataset.image_ids)
+for number in range(150, 181):
+ # image_id = number
+ # image, image_meta, gt_class_id, gt_bbox, gt_mask =\
+ # modellib.load_image_gt(dataset, config, image_id, use_mini_mask=False)
+ # info = dataset.image_info[image_id]
+ # print("image ID: {}.{} ({}) {}".format(info["source"], info["id"], image_id,
+ # dataset.image_reference(image_id)))
+
+ image = cv2.imread('./dataset/val/IMG_'+str(number)+'.jpg')
+ image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+
+ # Run object detection
+ results = model.detect([image], verbose=1)
+
+ # Display results
+ r = results[0]
+ visualize.display_instances(image, r['rois'], r['masks'], r['class_ids'],
+ dataset.class_names, r['scores'],
+ title="Predictions")
+
+ N = r['rois'].shape[0]
+ class_ids = r['class_ids']
+ masks = r['masks']
+
+ class_names = np.asarray(dataset.class_names)
+
+ print(class_names[class_ids])
+
+ # score_card = [masks[:, :, i].sum() for i in range(N)]
+ score_card2 = masks.sum(axis=0).sum(axis=0)
+ # print(score_card)
+ print(score_card2)
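
The loop above only prints per-instance mask areas in pixels (`score_card2`), which mirrors the scoring TODO noted in the README. As a possible direction, the sketch below reduces such areas to a single number; the `packaging_score` helper, its item/outerbox ratio, and the example values are illustrative assumptions, not part of this commit.

```
import numpy as np

def packaging_score(class_names, areas):
    """Hypothetical scoring sketch: ratio of item area to outer-box area.

    class_names: predicted class name per instance (e.g. from dataset.class_names).
    areas: mask area in pixels per instance, aligned with class_names.
    Returns a float in [0, 1]; higher means less wasted packaging.
    """
    class_names = np.asarray(class_names)
    areas = np.asarray(areas, dtype=np.float64)
    outer = areas[class_names == "outerbox"].sum()
    item = areas[np.char.startswith(class_names, "item")].sum()
    if outer == 0:
        return 0.0  # no outer box detected; nothing to score
    return float(min(item / outer, 1.0))

# Example with made-up areas (pixels):
print(packaging_score(["outerbox", "innerbox", "item_rect"],
                      [90000, 60000, 9000]))  # -> 0.1
```
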
diff --git a/mask_rcnn/models/.gitkeep b/mask_rcnn/models/.gitkeep
new file mode 100644
index 00000000..74c20143
--- /dev/null
+++ b/mask_rcnn/models/.gitkeep
@@ -0,0 +1 @@
+DUMMY
\ No newline at end of file
diff --git a/mask_rcnn/models/serving_model/.gitkeep b/mask_rcnn/models/serving_model/.gitkeep
new file mode 100644
index 00000000..74c20143
--- /dev/null
+++ b/mask_rcnn/models/serving_model/.gitkeep
@@ -0,0 +1 @@
+DUMMY
\ No newline at end of file
diff --git a/mask_rcnn/mrcnn/__init__.py b/mask_rcnn/mrcnn/__init__.py
new file mode 100644
index 00000000..8b137891
--- /dev/null
+++ b/mask_rcnn/mrcnn/__init__.py
@@ -0,0 +1 @@
+
diff --git a/mask_rcnn/mrcnn/config.py b/mask_rcnn/mrcnn/config.py
new file mode 100644
index 00000000..5bffb33d
--- /dev/null
+++ b/mask_rcnn/mrcnn/config.py
@@ -0,0 +1,236 @@
+"""
+Mask R-CNN
+Base Configurations class.
+
+Copyright (c) 2017 Matterport, Inc.
+Licensed under the MIT License (see LICENSE for details)
+Written by Waleed Abdulla
+"""
+
+import numpy as np
+
+
+# Base Configuration Class
+# Don't use this class directly. Instead, sub-class it and override
+# the configurations you need to change.
+
+class Config(object):
+ """Base configuration class. For custom configurations, create a
+ sub-class that inherits from this one and override properties
+ that need to be changed.
+ """
+ # Name the configurations. For example, 'COCO', 'Experiment 3', ...etc.
+ # Useful if your code needs to do things differently depending on which
+ # experiment is running.
+ NAME = None # Override in sub-classes
+
+ # NUMBER OF GPUs to use. When using only a CPU, this needs to be set to 1.
+ GPU_COUNT = 1
+
+ # Number of images to train with on each GPU. A 12GB GPU can typically
+ # handle 2 images of 1024x1024px.
+ # Adjust based on your GPU memory and image sizes. Use the highest
+ # number that your GPU can handle for best performance.
+ IMAGES_PER_GPU = 2
+
+ # Number of training steps per epoch
+ # This doesn't need to match the size of the training set. Tensorboard
+ # updates are saved at the end of each epoch, so setting this to a
+ # smaller number means getting more frequent TensorBoard updates.
+ # Validation stats are also calculated at each epoch end and they
+ # might take a while, so don't set this too small to avoid spending
+ # a lot of time on validation stats.
+ STEPS_PER_EPOCH = 1000
+
+ # Number of validation steps to run at the end of every training epoch.
+ # A bigger number improves accuracy of validation stats, but slows
+ # down the training.
+ VALIDATION_STEPS = 50
+
+ # Backbone network architecture
+ # Supported values are: resnet50, resnet101.
+ # You can also provide a callable that should have the signature
+ # of model.resnet_graph. If you do so, you need to supply a callable
+ # to COMPUTE_BACKBONE_SHAPE as well
+ BACKBONE = "resnet101"
+
+ # Only useful if you supply a callable to BACKBONE. Should compute
+ # the shape of each layer of the FPN Pyramid.
+ # See model.compute_backbone_shapes
+ COMPUTE_BACKBONE_SHAPE = None
+
+ # The strides of each layer of the FPN Pyramid. These values
+ # are based on a Resnet101 backbone.
+ BACKBONE_STRIDES = [4, 8, 16, 32, 64]
+
+ # Size of the fully-connected layers in the classification graph
+ FPN_CLASSIF_FC_LAYERS_SIZE = 1024
+
+ # Size of the top-down layers used to build the feature pyramid
+ TOP_DOWN_PYRAMID_SIZE = 256
+
+ # Number of classification classes (including background)
+ NUM_CLASSES = 1 # Override in sub-classes
+
+ # Length of square anchor side in pixels
+ RPN_ANCHOR_SCALES = (32, 64, 128, 256, 512)
+
+ # Ratios of anchors at each cell (width/height)
+ # A value of 1 represents a square anchor, and 0.5 is a wide anchor
+ RPN_ANCHOR_RATIOS = [0.5, 1, 2]
+
+ # Anchor stride
+ # If 1 then anchors are created for each cell in the backbone feature map.
+ # If 2, then anchors are created for every other cell, and so on.
+ RPN_ANCHOR_STRIDE = 1
+
+ # Non-max suppression threshold to filter RPN proposals.
+    # You can increase this during training to generate more proposals.
+ RPN_NMS_THRESHOLD = 0.7
+
+ # How many anchors per image to use for RPN training
+ RPN_TRAIN_ANCHORS_PER_IMAGE = 256
+
+ # ROIs kept after tf.nn.top_k and before non-maximum suppression
+ PRE_NMS_LIMIT = 6000
+
+ # ROIs kept after non-maximum suppression (training and inference)
+ POST_NMS_ROIS_TRAINING = 2000
+ POST_NMS_ROIS_INFERENCE = 1000
+
+ # If enabled, resizes instance masks to a smaller size to reduce
+ # memory load. Recommended when using high-resolution images.
+ USE_MINI_MASK = False
+ MINI_MASK_SHAPE = (56, 56) # (height, width) of the mini-mask
+
+ # Input image resizing
+ # Generally, use the "square" resizing mode for training and predicting
+ # and it should work well in most cases. In this mode, images are scaled
+ # up such that the small side is = IMAGE_MIN_DIM, but ensuring that the
+ # scaling doesn't make the long side > IMAGE_MAX_DIM. Then the image is
+ # padded with zeros to make it a square so multiple images can be put
+ # in one batch.
+ # Available resizing modes:
+ # none: No resizing or padding. Return the image unchanged.
+ # square: Resize and pad with zeros to get a square image
+ # of size [max_dim, max_dim].
+ # pad64: Pads width and height with zeros to make them multiples of 64.
+ # If IMAGE_MIN_DIM or IMAGE_MIN_SCALE are not None, then it scales
+ # up before padding. IMAGE_MAX_DIM is ignored in this mode.
+ # The multiple of 64 is needed to ensure smooth scaling of feature
+ # maps up and down the 6 levels of the FPN pyramid (2**6=64).
+ # crop: Picks random crops from the image. First, scales the image based
+ # on IMAGE_MIN_DIM and IMAGE_MIN_SCALE, then picks a random crop of
+ # size IMAGE_MIN_DIM x IMAGE_MIN_DIM. Can be used in training only.
+ # IMAGE_MAX_DIM is not used in this mode.
+ IMAGE_RESIZE_MODE = "square"
+ IMAGE_MIN_DIM = 800
+ IMAGE_MAX_DIM = 1024
+    # Minimum scaling ratio. Checked after IMAGE_MIN_DIM and can force further
+    # up scaling. For example, if set to 2 then images are scaled up to double
+    # the width and height, or more, even if IMAGE_MIN_DIM doesn't require it.
+ # However, in 'square' mode, it can be overruled by IMAGE_MAX_DIM.
+ IMAGE_MIN_SCALE = 0
+ # Number of color channels per image. RGB = 3, grayscale = 1, RGB-D = 4
+ # Changing this requires other changes in the code. See the WIKI for more
+ # details: https://github.com/matterport/Mask_RCNN/wiki
+ IMAGE_CHANNEL_COUNT = 3
+
+ # Image mean (RGB)
+ MEAN_PIXEL = np.array([123.7, 116.8, 103.9])
+
+ # Number of ROIs per image to feed to classifier/mask heads
+ # The Mask RCNN paper uses 512 but often the RPN doesn't generate
+ # enough positive proposals to fill this and keep a positive:negative
+ # ratio of 1:3. You can increase the number of proposals by adjusting
+ # the RPN NMS threshold.
+ TRAIN_ROIS_PER_IMAGE = 200
+
+ # Percent of positive ROIs used to train classifier/mask heads
+ ROI_POSITIVE_RATIO = 0.33
+
+ # Pooled ROIs
+ POOL_SIZE = 7
+ MASK_POOL_SIZE = 14
+
+ # Shape of output mask
+ # To change this you also need to change the neural network mask branch
+ MASK_SHAPE = [28, 28]
+
+ # Maximum number of ground truth instances to use in one image
+ MAX_GT_INSTANCES = 100
+
+ # Bounding box refinement standard deviation for RPN and final detections.
+ RPN_BBOX_STD_DEV = np.array([0.1, 0.1, 0.2, 0.2])
+ BBOX_STD_DEV = np.array([0.1, 0.1, 0.2, 0.2])
+
+ # Max number of final detections
+ DETECTION_MAX_INSTANCES = 100
+
+ # Minimum probability value to accept a detected instance
+ # ROIs below this threshold are skipped
+ DETECTION_MIN_CONFIDENCE = 0.7
+
+ # Non-maximum suppression threshold for detection
+ DETECTION_NMS_THRESHOLD = 0.3
+
+ # Learning rate and momentum
+ # The Mask RCNN paper uses lr=0.02, but on TensorFlow it causes
+ # weights to explode. Likely due to differences in optimizer
+ # implementation.
+ LEARNING_RATE = 0.001
+ LEARNING_MOMENTUM = 0.9
+
+ # Weight decay regularization
+ WEIGHT_DECAY = 0.0001
+
+ # Loss weights for more precise optimization.
+ # Can be used for R-CNN training setup.
+ LOSS_WEIGHTS = {
+ "rpn_class_loss": 1.,
+ "rpn_bbox_loss": 1.,
+ "mrcnn_class_loss": 1.,
+ "mrcnn_bbox_loss": 1.,
+ "mrcnn_mask_loss": 1.
+ }
+
+ # Use RPN ROIs or externally generated ROIs for training
+ # Keep this True for most situations. Set to False if you want to train
+ # the head branches on ROI generated by code rather than the ROIs from
+ # the RPN. For example, to debug the classifier head without having to
+ # train the RPN.
+ USE_RPN_ROIS = True
+
+ # Train or freeze batch normalization layers
+ # None: Train BN layers. This is the normal mode
+ # False: Freeze BN layers. Good when using a small batch size
+ # True: (don't use). Set layer in training mode even when predicting
+ TRAIN_BN = False # Defaulting to False since batch size is often small
+
+ # Gradient norm clipping
+ GRADIENT_CLIP_NORM = 5.0
+
+ def __init__(self):
+ """Set values of computed attributes."""
+ # Effective batch size
+ self.BATCH_SIZE = self.IMAGES_PER_GPU * self.GPU_COUNT
+
+ # Input image size
+ if self.IMAGE_RESIZE_MODE == "crop":
+ self.IMAGE_SHAPE = np.array([self.IMAGE_MIN_DIM, self.IMAGE_MIN_DIM,
+ self.IMAGE_CHANNEL_COUNT])
+ else:
+ self.IMAGE_SHAPE = np.array([self.IMAGE_MAX_DIM, self.IMAGE_MAX_DIM,
+ self.IMAGE_CHANNEL_COUNT])
+
+ # Image meta data length
+ # See compose_image_meta() for details
+ self.IMAGE_META_SIZE = 1 + 3 + 3 + 4 + 1 + self.NUM_CLASSES
+
+ def display(self):
+ """Display Configuration values."""
+ print("\nConfigurations:")
+ for a in dir(self):
+ if not a.startswith("__") and not callable(getattr(self, a)):
+ print("{:30} {}".format(a, getattr(self, a)))
+ print("\n")
diff --git a/mask_rcnn/mrcnn/model.py b/mask_rcnn/mrcnn/model.py
new file mode 100644
index 00000000..f2200881
--- /dev/null
+++ b/mask_rcnn/mrcnn/model.py
@@ -0,0 +1,2871 @@
+"""
+Mask R-CNN
+The main Mask R-CNN model implementation.
+
+Copyright (c) 2017 Matterport, Inc.
+Licensed under the MIT License (see LICENSE for details)
+Written by Waleed Abdulla
+"""
+
+import os
+import random
+import datetime
+import re
+import math
+import logging
+from collections import OrderedDict
+import multiprocessing
+import numpy as np
+import warnings
+warnings.filterwarnings('ignore', category=DeprecationWarning)
+warnings.filterwarnings('ignore', category=FutureWarning)
+import tensorflow as tf
+import keras
+import keras.backend as K
+import keras.layers as KL
+import keras.engine as KE
+import keras.models as KM
+
+from mrcnn import utils
+
+# Requires TensorFlow 1.3+ and Keras 2.0.8+.
+from distutils.version import LooseVersion
+assert LooseVersion(tf.__version__) >= LooseVersion("1.3")
+assert LooseVersion(keras.__version__) >= LooseVersion('2.0.8')
+
+
+############################################################
+# Utility Functions
+############################################################
+
+def log(text, array=None):
+ """Prints a text message. And, optionally, if a Numpy array is provided it
+ prints it's shape, min, and max values.
+ """
+ if array is not None:
+ text = text.ljust(25)
+ text += ("shape: {:20} ".format(str(array.shape)))
+ if array.size:
+ text += ("min: {:10.5f} max: {:10.5f}".format(array.min(),array.max()))
+ else:
+ text += ("min: {:10} max: {:10}".format("",""))
+ text += " {}".format(array.dtype)
+ print(text)
+
+
+class BatchNorm(KL.BatchNormalization):
+ """Extends the Keras BatchNormalization class to allow a central place
+ to make changes if needed.
+
+ Batch normalization has a negative effect on training if batches are small
+    so this layer is often frozen (via a setting in the Config class) and
+    functions as a linear layer.
+ """
+ def call(self, inputs, training=None):
+ """
+ Note about training values:
+ None: Train BN layers. This is the normal mode
+ False: Freeze BN layers. Good when batch size is small
+ True: (don't use). Set layer in training mode even when making inferences
+ """
+ return super(self.__class__, self).call(inputs, training=training)
+
+
+def compute_backbone_shapes(config, image_shape):
+ """Computes the width and height of each stage of the backbone network.
+
+ Returns:
+ [N, (height, width)]. Where N is the number of stages
+ """
+ if callable(config.BACKBONE):
+ return config.COMPUTE_BACKBONE_SHAPE(image_shape)
+
+ # Currently supports ResNet only
+ assert config.BACKBONE in ["resnet50", "resnet101"]
+ return np.array(
+ [[int(math.ceil(image_shape[0] / stride)),
+ int(math.ceil(image_shape[1] / stride))]
+ for stride in config.BACKBONE_STRIDES])
+
+
+############################################################
+# Resnet Graph
+############################################################
+
+# Code adapted from:
+# https://github.com/fchollet/deep-learning-models/blob/master/resnet50.py
+
+def identity_block(input_tensor, kernel_size, filters, stage, block,
+ use_bias=True, train_bn=True):
+ """The identity_block is the block that has no conv layer at shortcut
+ # Arguments
+ input_tensor: input tensor
+ kernel_size: default 3, the kernel size of middle conv layer at main path
+ filters: list of integers, the nb_filters of 3 conv layer at main path
+ stage: integer, current stage label, used for generating layer names
+ block: 'a','b'..., current block label, used for generating layer names
+ use_bias: Boolean. To use or not use a bias in conv layers.
+ train_bn: Boolean. Train or freeze Batch Norm layers
+ """
+ nb_filter1, nb_filter2, nb_filter3 = filters
+ conv_name_base = 'res' + str(stage) + block + '_branch'
+ bn_name_base = 'bn' + str(stage) + block + '_branch'
+
+ x = KL.Conv2D(nb_filter1, (1, 1), name=conv_name_base + '2a',
+ use_bias=use_bias)(input_tensor)
+ x = BatchNorm(name=bn_name_base + '2a')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+
+ x = KL.Conv2D(nb_filter2, (kernel_size, kernel_size), padding='same',
+ name=conv_name_base + '2b', use_bias=use_bias)(x)
+ x = BatchNorm(name=bn_name_base + '2b')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+
+ x = KL.Conv2D(nb_filter3, (1, 1), name=conv_name_base + '2c',
+ use_bias=use_bias)(x)
+ x = BatchNorm(name=bn_name_base + '2c')(x, training=train_bn)
+
+ x = KL.Add()([x, input_tensor])
+ x = KL.Activation('relu', name='res' + str(stage) + block + '_out')(x)
+ return x
+
+
+def conv_block(input_tensor, kernel_size, filters, stage, block,
+ strides=(2, 2), use_bias=True, train_bn=True):
+ """conv_block is the block that has a conv layer at shortcut
+ # Arguments
+ input_tensor: input tensor
+ kernel_size: default 3, the kernel size of middle conv layer at main path
+ filters: list of integers, the nb_filters of 3 conv layer at main path
+ stage: integer, current stage label, used for generating layer names
+ block: 'a','b'..., current block label, used for generating layer names
+ use_bias: Boolean. To use or not use a bias in conv layers.
+ train_bn: Boolean. Train or freeze Batch Norm layers
+    Note that from stage 3 onward, the first conv layer in the main path uses
+    strides=(2, 2), and the shortcut uses strides=(2, 2) as well.
+ """
+ nb_filter1, nb_filter2, nb_filter3 = filters
+ conv_name_base = 'res' + str(stage) + block + '_branch'
+ bn_name_base = 'bn' + str(stage) + block + '_branch'
+
+ x = KL.Conv2D(nb_filter1, (1, 1), strides=strides,
+ name=conv_name_base + '2a', use_bias=use_bias)(input_tensor)
+ x = BatchNorm(name=bn_name_base + '2a')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+
+ x = KL.Conv2D(nb_filter2, (kernel_size, kernel_size), padding='same',
+ name=conv_name_base + '2b', use_bias=use_bias)(x)
+ x = BatchNorm(name=bn_name_base + '2b')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+
+ x = KL.Conv2D(nb_filter3, (1, 1), name=conv_name_base +
+ '2c', use_bias=use_bias)(x)
+ x = BatchNorm(name=bn_name_base + '2c')(x, training=train_bn)
+
+ shortcut = KL.Conv2D(nb_filter3, (1, 1), strides=strides,
+ name=conv_name_base + '1', use_bias=use_bias)(input_tensor)
+ shortcut = BatchNorm(name=bn_name_base + '1')(shortcut, training=train_bn)
+
+ x = KL.Add()([x, shortcut])
+ x = KL.Activation('relu', name='res' + str(stage) + block + '_out')(x)
+ return x
+
+
+def resnet_graph(input_image, architecture, stage5=False, train_bn=True):
+ """Build a ResNet graph.
+ architecture: Can be resnet50 or resnet101
+ stage5: Boolean. If False, stage5 of the network is not created
+ train_bn: Boolean. Train or freeze Batch Norm layers
+ """
+ assert architecture in ["resnet50", "resnet101"]
+ # Stage 1
+ x = KL.ZeroPadding2D((3, 3))(input_image)
+ x = KL.Conv2D(64, (7, 7), strides=(2, 2), name='conv1', use_bias=True)(x)
+ x = BatchNorm(name='bn_conv1')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+ C1 = x = KL.MaxPooling2D((3, 3), strides=(2, 2), padding="same")(x)
+ # Stage 2
+ x = conv_block(x, 3, [64, 64, 256], stage=2, block='a', strides=(1, 1), train_bn=train_bn)
+ x = identity_block(x, 3, [64, 64, 256], stage=2, block='b', train_bn=train_bn)
+ C2 = x = identity_block(x, 3, [64, 64, 256], stage=2, block='c', train_bn=train_bn)
+ # Stage 3
+ x = conv_block(x, 3, [128, 128, 512], stage=3, block='a', train_bn=train_bn)
+ x = identity_block(x, 3, [128, 128, 512], stage=3, block='b', train_bn=train_bn)
+ x = identity_block(x, 3, [128, 128, 512], stage=3, block='c', train_bn=train_bn)
+ C3 = x = identity_block(x, 3, [128, 128, 512], stage=3, block='d', train_bn=train_bn)
+ # Stage 4
+ x = conv_block(x, 3, [256, 256, 1024], stage=4, block='a', train_bn=train_bn)
+ block_count = {"resnet50": 5, "resnet101": 22}[architecture]
+ for i in range(block_count):
+ x = identity_block(x, 3, [256, 256, 1024], stage=4, block=chr(98 + i), train_bn=train_bn)
+ C4 = x
+ # Stage 5
+ if stage5:
+ x = conv_block(x, 3, [512, 512, 2048], stage=5, block='a', train_bn=train_bn)
+ x = identity_block(x, 3, [512, 512, 2048], stage=5, block='b', train_bn=train_bn)
+ C5 = x = identity_block(x, 3, [512, 512, 2048], stage=5, block='c', train_bn=train_bn)
+ else:
+ C5 = None
+ return [C1, C2, C3, C4, C5]
+
+
+############################################################
+# Proposal Layer
+############################################################
+
+def apply_box_deltas_graph(boxes, deltas):
+ """Applies the given deltas to the given boxes.
+ boxes: [N, (y1, x1, y2, x2)] boxes to update
+ deltas: [N, (dy, dx, log(dh), log(dw))] refinements to apply
+ """
+ # Convert to y, x, h, w
+ height = boxes[:, 2] - boxes[:, 0]
+ width = boxes[:, 3] - boxes[:, 1]
+ center_y = boxes[:, 0] + 0.5 * height
+ center_x = boxes[:, 1] + 0.5 * width
+ # Apply deltas
+ center_y += deltas[:, 0] * height
+ center_x += deltas[:, 1] * width
+ height *= tf.exp(deltas[:, 2])
+ width *= tf.exp(deltas[:, 3])
+ # Convert back to y1, x1, y2, x2
+ y1 = center_y - 0.5 * height
+ x1 = center_x - 0.5 * width
+ y2 = y1 + height
+ x2 = x1 + width
+ result = tf.stack([y1, x1, y2, x2], axis=1, name="apply_box_deltas_out")
+ return result
+
+
+def clip_boxes_graph(boxes, window):
+ """
+ boxes: [N, (y1, x1, y2, x2)]
+ window: [4] in the form y1, x1, y2, x2
+ """
+ # Split
+ wy1, wx1, wy2, wx2 = tf.split(window, 4)
+ y1, x1, y2, x2 = tf.split(boxes, 4, axis=1)
+ # Clip
+ y1 = tf.maximum(tf.minimum(y1, wy2), wy1)
+ x1 = tf.maximum(tf.minimum(x1, wx2), wx1)
+ y2 = tf.maximum(tf.minimum(y2, wy2), wy1)
+ x2 = tf.maximum(tf.minimum(x2, wx2), wx1)
+ clipped = tf.concat([y1, x1, y2, x2], axis=1, name="clipped_boxes")
+ clipped.set_shape((clipped.shape[0], 4))
+ return clipped
+
+
+class ProposalLayer(KE.Layer):
+ """Receives anchor scores and selects a subset to pass as proposals
+ to the second stage. Filtering is done based on anchor scores and
+ non-max suppression to remove overlaps. It also applies bounding
+ box refinement deltas to anchors.
+
+ Inputs:
+ rpn_probs: [batch, num_anchors, (bg prob, fg prob)]
+ rpn_bbox: [batch, num_anchors, (dy, dx, log(dh), log(dw))]
+ anchors: [batch, num_anchors, (y1, x1, y2, x2)] anchors in normalized coordinates
+
+ Returns:
+ Proposals in normalized coordinates [batch, rois, (y1, x1, y2, x2)]
+ """
+
+ def __init__(self, proposal_count, nms_threshold, config=None, **kwargs):
+ super(ProposalLayer, self).__init__(**kwargs)
+ self.config = config
+ self.proposal_count = proposal_count
+ self.nms_threshold = nms_threshold
+
+ def call(self, inputs):
+ # Box Scores. Use the foreground class confidence. [Batch, num_rois, 1]
+ scores = inputs[0][:, :, 1]
+ # Box deltas [batch, num_rois, 4]
+ deltas = inputs[1]
+ deltas = deltas * np.reshape(self.config.RPN_BBOX_STD_DEV, [1, 1, 4])
+ # Anchors
+ anchors = inputs[2]
+
+ # Improve performance by trimming to top anchors by score
+ # and doing the rest on the smaller subset.
+ pre_nms_limit = tf.minimum(self.config.PRE_NMS_LIMIT, tf.shape(anchors)[1])
+ ix = tf.nn.top_k(scores, pre_nms_limit, sorted=True,
+ name="top_anchors").indices
+ scores = utils.batch_slice([scores, ix], lambda x, y: tf.gather(x, y),
+ self.config.IMAGES_PER_GPU)
+ deltas = utils.batch_slice([deltas, ix], lambda x, y: tf.gather(x, y),
+ self.config.IMAGES_PER_GPU)
+ pre_nms_anchors = utils.batch_slice([anchors, ix], lambda a, x: tf.gather(a, x),
+ self.config.IMAGES_PER_GPU,
+ names=["pre_nms_anchors"])
+
+ # Apply deltas to anchors to get refined anchors.
+ # [batch, N, (y1, x1, y2, x2)]
+ boxes = utils.batch_slice([pre_nms_anchors, deltas],
+ lambda x, y: apply_box_deltas_graph(x, y),
+ self.config.IMAGES_PER_GPU,
+ names=["refined_anchors"])
+
+ # Clip to image boundaries. Since we're in normalized coordinates,
+ # clip to 0..1 range. [batch, N, (y1, x1, y2, x2)]
+ window = np.array([0, 0, 1, 1], dtype=np.float32)
+ boxes = utils.batch_slice(boxes,
+ lambda x: clip_boxes_graph(x, window),
+ self.config.IMAGES_PER_GPU,
+ names=["refined_anchors_clipped"])
+
+ # Filter out small boxes
+ # According to Xinlei Chen's paper, this reduces detection accuracy
+ # for small objects, so we're skipping it.
+
+ # Non-max suppression
+ def nms(boxes, scores):
+ indices = tf.image.non_max_suppression(
+ boxes, scores, self.proposal_count,
+ self.nms_threshold, name="rpn_non_max_suppression")
+ proposals = tf.gather(boxes, indices)
+ # Pad if needed
+ padding = tf.maximum(self.proposal_count - tf.shape(proposals)[0], 0)
+ proposals = tf.pad(proposals, [(0, padding), (0, 0)])
+ return proposals
+ proposals = utils.batch_slice([boxes, scores], nms,
+ self.config.IMAGES_PER_GPU)
+ return proposals
+
+ def compute_output_shape(self, input_shape):
+ return (None, self.proposal_count, 4)
+
+
+############################################################
+# ROIAlign Layer
+############################################################
+
+def log2_graph(x):
+ """Implementation of Log2. TF doesn't have a native implementation."""
+ return tf.log(x) / tf.log(2.0)
+
+
+class PyramidROIAlign(KE.Layer):
+ """Implements ROI Pooling on multiple levels of the feature pyramid.
+
+ Params:
+ - pool_shape: [pool_height, pool_width] of the output pooled regions. Usually [7, 7]
+
+ Inputs:
+ - boxes: [batch, num_boxes, (y1, x1, y2, x2)] in normalized
+ coordinates. Possibly padded with zeros if not enough
+ boxes to fill the array.
+ - image_meta: [batch, (meta data)] Image details. See compose_image_meta()
+ - feature_maps: List of feature maps from different levels of the pyramid.
+ Each is [batch, height, width, channels]
+
+ Output:
+ Pooled regions in the shape: [batch, num_boxes, pool_height, pool_width, channels].
+    The width and height are those specified in the pool_shape in the layer
+ constructor.
+ """
+
+ def __init__(self, pool_shape, **kwargs):
+ super(PyramidROIAlign, self).__init__(**kwargs)
+ self.pool_shape = tuple(pool_shape)
+
+ def call(self, inputs):
+ # Crop boxes [batch, num_boxes, (y1, x1, y2, x2)] in normalized coords
+ boxes = inputs[0]
+
+ # Image meta
+ # Holds details about the image. See compose_image_meta()
+ image_meta = inputs[1]
+
+ # Feature Maps. List of feature maps from different level of the
+ # feature pyramid. Each is [batch, height, width, channels]
+ feature_maps = inputs[2:]
+
+ # Assign each ROI to a level in the pyramid based on the ROI area.
+ y1, x1, y2, x2 = tf.split(boxes, 4, axis=2)
+ h = y2 - y1
+ w = x2 - x1
+ # Use shape of first image. Images in a batch must have the same size.
+ image_shape = parse_image_meta_graph(image_meta)['image_shape'][0]
+ # Equation 1 in the Feature Pyramid Networks paper. Account for
+ # the fact that our coordinates are normalized here.
+ # e.g. a 224x224 ROI (in pixels) maps to P4
+ image_area = tf.cast(image_shape[0] * image_shape[1], tf.float32)
+ roi_level = log2_graph(tf.sqrt(h * w) / (224.0 / tf.sqrt(image_area)))
+ roi_level = tf.minimum(5, tf.maximum(
+ 2, 4 + tf.cast(tf.round(roi_level), tf.int32)))
+ roi_level = tf.squeeze(roi_level, 2)
+
+ # Loop through levels and apply ROI pooling to each. P2 to P5.
+ pooled = []
+ box_to_level = []
+ for i, level in enumerate(range(2, 6)):
+ ix = tf.where(tf.equal(roi_level, level))
+ level_boxes = tf.gather_nd(boxes, ix)
+
+ # Box indices for crop_and_resize.
+ box_indices = tf.cast(ix[:, 0], tf.int32)
+
+ # Keep track of which box is mapped to which level
+ box_to_level.append(ix)
+
+            # Stop gradient propagation to ROI proposals
+ level_boxes = tf.stop_gradient(level_boxes)
+ box_indices = tf.stop_gradient(box_indices)
+
+ # Crop and Resize
+ # From Mask R-CNN paper: "We sample four regular locations, so
+ # that we can evaluate either max or average pooling. In fact,
+ # interpolating only a single value at each bin center (without
+ # pooling) is nearly as effective."
+ #
+ # Here we use the simplified approach of a single value per bin,
+ # which is how it's done in tf.crop_and_resize()
+ # Result: [batch * num_boxes, pool_height, pool_width, channels]
+ pooled.append(tf.image.crop_and_resize(
+ feature_maps[i], level_boxes, box_indices, self.pool_shape,
+ method="bilinear"))
+
+ # Pack pooled features into one tensor
+ pooled = tf.concat(pooled, axis=0)
+
+ # Pack box_to_level mapping into one array and add another
+ # column representing the order of pooled boxes
+ box_to_level = tf.concat(box_to_level, axis=0)
+ box_range = tf.expand_dims(tf.range(tf.shape(box_to_level)[0]), 1)
+ box_to_level = tf.concat([tf.cast(box_to_level, tf.int32), box_range],
+ axis=1)
+
+ # Rearrange pooled features to match the order of the original boxes
+ # Sort box_to_level by batch then box index
+ # TF doesn't have a way to sort by two columns, so merge them and sort.
+ sorting_tensor = box_to_level[:, 0] * 100000 + box_to_level[:, 1]
+ ix = tf.nn.top_k(sorting_tensor, k=tf.shape(
+ box_to_level)[0]).indices[::-1]
+ ix = tf.gather(box_to_level[:, 2], ix)
+ pooled = tf.gather(pooled, ix)
+
+ # Re-add the batch dimension
+ shape = tf.concat([tf.shape(boxes)[:2], tf.shape(pooled)[1:]], axis=0)
+ pooled = tf.reshape(pooled, shape)
+ return pooled
+
+ def compute_output_shape(self, input_shape):
+ return input_shape[0][:2] + self.pool_shape + (input_shape[2][-1], )
+
+
+############################################################
+# Detection Target Layer
+############################################################
+
+def overlaps_graph(boxes1, boxes2):
+ """Computes IoU overlaps between two sets of boxes.
+ boxes1, boxes2: [N, (y1, x1, y2, x2)].
+ """
+ # 1. Tile boxes2 and repeat boxes1. This allows us to compare
+ # every boxes1 against every boxes2 without loops.
+ # TF doesn't have an equivalent to np.repeat() so simulate it
+ # using tf.tile() and tf.reshape.
+ b1 = tf.reshape(tf.tile(tf.expand_dims(boxes1, 1),
+ [1, 1, tf.shape(boxes2)[0]]), [-1, 4])
+ b2 = tf.tile(boxes2, [tf.shape(boxes1)[0], 1])
+ # 2. Compute intersections
+ b1_y1, b1_x1, b1_y2, b1_x2 = tf.split(b1, 4, axis=1)
+ b2_y1, b2_x1, b2_y2, b2_x2 = tf.split(b2, 4, axis=1)
+ y1 = tf.maximum(b1_y1, b2_y1)
+ x1 = tf.maximum(b1_x1, b2_x1)
+ y2 = tf.minimum(b1_y2, b2_y2)
+ x2 = tf.minimum(b1_x2, b2_x2)
+ intersection = tf.maximum(x2 - x1, 0) * tf.maximum(y2 - y1, 0)
+ # 3. Compute unions
+ b1_area = (b1_y2 - b1_y1) * (b1_x2 - b1_x1)
+ b2_area = (b2_y2 - b2_y1) * (b2_x2 - b2_x1)
+ union = b1_area + b2_area - intersection
+ # 4. Compute IoU and reshape to [boxes1, boxes2]
+ iou = intersection / union
+ overlaps = tf.reshape(iou, [tf.shape(boxes1)[0], tf.shape(boxes2)[0]])
+ return overlaps
+
+
+def detection_targets_graph(proposals, gt_class_ids, gt_boxes, gt_masks, config):
+ """Generates detection targets for one image. Subsamples proposals and
+ generates target class IDs, bounding box deltas, and masks for each.
+
+ Inputs:
+ proposals: [POST_NMS_ROIS_TRAINING, (y1, x1, y2, x2)] in normalized coordinates. Might
+ be zero padded if there are not enough proposals.
+ gt_class_ids: [MAX_GT_INSTANCES] int class IDs
+ gt_boxes: [MAX_GT_INSTANCES, (y1, x1, y2, x2)] in normalized coordinates.
+ gt_masks: [height, width, MAX_GT_INSTANCES] of boolean type.
+
+ Returns: Target ROIs and corresponding class IDs, bounding box shifts,
+ and masks.
+ rois: [TRAIN_ROIS_PER_IMAGE, (y1, x1, y2, x2)] in normalized coordinates
+ class_ids: [TRAIN_ROIS_PER_IMAGE]. Integer class IDs. Zero padded.
+ deltas: [TRAIN_ROIS_PER_IMAGE, (dy, dx, log(dh), log(dw))]
+ masks: [TRAIN_ROIS_PER_IMAGE, height, width]. Masks cropped to bbox
+ boundaries and resized to neural network output size.
+
+ Note: Returned arrays might be zero padded if not enough target ROIs.
+ """
+ # Assertions
+ asserts = [
+ tf.Assert(tf.greater(tf.shape(proposals)[0], 0), [proposals],
+ name="roi_assertion"),
+ ]
+ with tf.control_dependencies(asserts):
+ proposals = tf.identity(proposals)
+
+ # Remove zero padding
+ proposals, _ = trim_zeros_graph(proposals, name="trim_proposals")
+ gt_boxes, non_zeros = trim_zeros_graph(gt_boxes, name="trim_gt_boxes")
+ gt_class_ids = tf.boolean_mask(gt_class_ids, non_zeros,
+ name="trim_gt_class_ids")
+ gt_masks = tf.gather(gt_masks, tf.where(non_zeros)[:, 0], axis=2,
+ name="trim_gt_masks")
+
+ # Handle COCO crowds
+ # A crowd box in COCO is a bounding box around several instances. Exclude
+ # them from training. A crowd box is given a negative class ID.
+ crowd_ix = tf.where(gt_class_ids < 0)[:, 0]
+ non_crowd_ix = tf.where(gt_class_ids > 0)[:, 0]
+ crowd_boxes = tf.gather(gt_boxes, crowd_ix)
+ gt_class_ids = tf.gather(gt_class_ids, non_crowd_ix)
+ gt_boxes = tf.gather(gt_boxes, non_crowd_ix)
+ gt_masks = tf.gather(gt_masks, non_crowd_ix, axis=2)
+
+ # Compute overlaps matrix [proposals, gt_boxes]
+ overlaps = overlaps_graph(proposals, gt_boxes)
+
+ # Compute overlaps with crowd boxes [proposals, crowd_boxes]
+ crowd_overlaps = overlaps_graph(proposals, crowd_boxes)
+ crowd_iou_max = tf.reduce_max(crowd_overlaps, axis=1)
+ no_crowd_bool = (crowd_iou_max < 0.001)
+
+ # Determine positive and negative ROIs
+ roi_iou_max = tf.reduce_max(overlaps, axis=1)
+ # 1. Positive ROIs are those with >= 0.5 IoU with a GT box
+ positive_roi_bool = (roi_iou_max >= 0.5)
+ positive_indices = tf.where(positive_roi_bool)[:, 0]
+ # 2. Negative ROIs are those with < 0.5 with every GT box. Skip crowds.
+ negative_indices = tf.where(tf.logical_and(roi_iou_max < 0.5, no_crowd_bool))[:, 0]
+
+ # Subsample ROIs. Aim for 33% positive
+ # Positive ROIs
+ positive_count = int(config.TRAIN_ROIS_PER_IMAGE *
+ config.ROI_POSITIVE_RATIO)
+ positive_indices = tf.random_shuffle(positive_indices)[:positive_count]
+ positive_count = tf.shape(positive_indices)[0]
+ # Negative ROIs. Add enough to maintain positive:negative ratio.
+ r = 1.0 / config.ROI_POSITIVE_RATIO
+ negative_count = tf.cast(r * tf.cast(positive_count, tf.float32), tf.int32) - positive_count
+ negative_indices = tf.random_shuffle(negative_indices)[:negative_count]
+ # Gather selected ROIs
+ positive_rois = tf.gather(proposals, positive_indices)
+ negative_rois = tf.gather(proposals, negative_indices)
+
+ # Assign positive ROIs to GT boxes.
+ positive_overlaps = tf.gather(overlaps, positive_indices)
+ roi_gt_box_assignment = tf.cond(
+ tf.greater(tf.shape(positive_overlaps)[1], 0),
+ true_fn = lambda: tf.argmax(positive_overlaps, axis=1),
+ false_fn = lambda: tf.cast(tf.constant([]),tf.int64)
+ )
+ roi_gt_boxes = tf.gather(gt_boxes, roi_gt_box_assignment)
+ roi_gt_class_ids = tf.gather(gt_class_ids, roi_gt_box_assignment)
+
+ # Compute bbox refinement for positive ROIs
+ deltas = utils.box_refinement_graph(positive_rois, roi_gt_boxes)
+ deltas /= config.BBOX_STD_DEV
+
+ # Assign positive ROIs to GT masks
+ # Permute masks to [N, height, width, 1]
+ transposed_masks = tf.expand_dims(tf.transpose(gt_masks, [2, 0, 1]), -1)
+ # Pick the right mask for each ROI
+ roi_masks = tf.gather(transposed_masks, roi_gt_box_assignment)
+
+ # Compute mask targets
+ boxes = positive_rois
+ if config.USE_MINI_MASK:
+ # Transform ROI coordinates from normalized image space
+ # to normalized mini-mask space.
+ y1, x1, y2, x2 = tf.split(positive_rois, 4, axis=1)
+ gt_y1, gt_x1, gt_y2, gt_x2 = tf.split(roi_gt_boxes, 4, axis=1)
+ gt_h = gt_y2 - gt_y1
+ gt_w = gt_x2 - gt_x1
+ y1 = (y1 - gt_y1) / gt_h
+ x1 = (x1 - gt_x1) / gt_w
+ y2 = (y2 - gt_y1) / gt_h
+ x2 = (x2 - gt_x1) / gt_w
+ boxes = tf.concat([y1, x1, y2, x2], 1)
+ box_ids = tf.range(0, tf.shape(roi_masks)[0])
+ masks = tf.image.crop_and_resize(tf.cast(roi_masks, tf.float32), boxes,
+ box_ids,
+ config.MASK_SHAPE)
+ # Remove the extra dimension from masks.
+ masks = tf.squeeze(masks, axis=3)
+
+ # Threshold mask pixels at 0.5 to have GT masks be 0 or 1 to use with
+ # binary cross entropy loss.
+ masks = tf.round(masks)
+
+ # Append negative ROIs and pad bbox deltas and masks that
+ # are not used for negative ROIs with zeros.
+ rois = tf.concat([positive_rois, negative_rois], axis=0)
+ N = tf.shape(negative_rois)[0]
+ P = tf.maximum(config.TRAIN_ROIS_PER_IMAGE - tf.shape(rois)[0], 0)
+ rois = tf.pad(rois, [(0, P), (0, 0)])
+ roi_gt_boxes = tf.pad(roi_gt_boxes, [(0, N + P), (0, 0)])
+ roi_gt_class_ids = tf.pad(roi_gt_class_ids, [(0, N + P)])
+ deltas = tf.pad(deltas, [(0, N + P), (0, 0)])
+ masks = tf.pad(masks, [[0, N + P], (0, 0), (0, 0)])
+
+ return rois, roi_gt_class_ids, deltas, masks
+
+
+class DetectionTargetLayer(KE.Layer):
+ """Subsamples proposals and generates target box refinement, class_ids,
+ and masks for each.
+
+ Inputs:
+ proposals: [batch, N, (y1, x1, y2, x2)] in normalized coordinates. Might
+ be zero padded if there are not enough proposals.
+ gt_class_ids: [batch, MAX_GT_INSTANCES] Integer class IDs.
+ gt_boxes: [batch, MAX_GT_INSTANCES, (y1, x1, y2, x2)] in normalized
+ coordinates.
+ gt_masks: [batch, height, width, MAX_GT_INSTANCES] of boolean type
+
+ Returns: Target ROIs and corresponding class IDs, bounding box shifts,
+ and masks.
+ rois: [batch, TRAIN_ROIS_PER_IMAGE, (y1, x1, y2, x2)] in normalized
+ coordinates
+ target_class_ids: [batch, TRAIN_ROIS_PER_IMAGE]. Integer class IDs.
+        target_deltas: [batch, TRAIN_ROIS_PER_IMAGE, (dy, dx, log(dh), log(dw))]
+ target_mask: [batch, TRAIN_ROIS_PER_IMAGE, height, width]
+ Masks cropped to bbox boundaries and resized to neural
+ network output size.
+
+ Note: Returned arrays might be zero padded if not enough target ROIs.
+ """
+
+ def __init__(self, config, **kwargs):
+ super(DetectionTargetLayer, self).__init__(**kwargs)
+ self.config = config
+
+ def call(self, inputs):
+ proposals = inputs[0]
+ gt_class_ids = inputs[1]
+ gt_boxes = inputs[2]
+ gt_masks = inputs[3]
+
+ # Slice the batch and run a graph for each slice
+ # TODO: Rename target_bbox to target_deltas for clarity
+ names = ["rois", "target_class_ids", "target_bbox", "target_mask"]
+ outputs = utils.batch_slice(
+ [proposals, gt_class_ids, gt_boxes, gt_masks],
+ lambda w, x, y, z: detection_targets_graph(
+ w, x, y, z, self.config),
+ self.config.IMAGES_PER_GPU, names=names)
+ return outputs
+
+ def compute_output_shape(self, input_shape):
+ return [
+ (None, self.config.TRAIN_ROIS_PER_IMAGE, 4), # rois
+ (None, self.config.TRAIN_ROIS_PER_IMAGE), # class_ids
+ (None, self.config.TRAIN_ROIS_PER_IMAGE, 4), # deltas
+ (None, self.config.TRAIN_ROIS_PER_IMAGE, self.config.MASK_SHAPE[0],
+ self.config.MASK_SHAPE[1]) # masks
+ ]
+
+ def compute_mask(self, inputs, mask=None):
+ return [None, None, None, None]
+
+
+############################################################
+# Detection Layer
+############################################################
+
+def refine_detections_graph(rois, probs, deltas, window, config):
+ """Refine classified proposals and filter overlaps and return final
+ detections.
+
+ Inputs:
+ rois: [N, (y1, x1, y2, x2)] in normalized coordinates
+ probs: [N, num_classes]. Class probabilities.
+ deltas: [N, num_classes, (dy, dx, log(dh), log(dw))]. Class-specific
+ bounding box deltas.
+ window: (y1, x1, y2, x2) in normalized coordinates. The part of the image
+ that contains the image excluding the padding.
+
+ Returns detections shaped: [num_detections, (y1, x1, y2, x2, class_id, score)] where
+ coordinates are normalized.
+ """
+ # Class IDs per ROI
+ class_ids = tf.argmax(probs, axis=1, output_type=tf.int32)
+ # Class probability of the top class of each ROI
+ indices = tf.stack([tf.range(probs.shape[0]), class_ids], axis=1)
+ class_scores = tf.gather_nd(probs, indices)
+ # Class-specific bounding box deltas
+ deltas_specific = tf.gather_nd(deltas, indices)
+ # Apply bounding box deltas
+ # Shape: [boxes, (y1, x1, y2, x2)] in normalized coordinates
+ refined_rois = apply_box_deltas_graph(
+ rois, deltas_specific * config.BBOX_STD_DEV)
+ # Clip boxes to image window
+ refined_rois = clip_boxes_graph(refined_rois, window)
+
+ # TODO: Filter out boxes with zero area
+
+ # Filter out background boxes
+ keep = tf.where(class_ids > 0)[:, 0]
+ # Filter out low confidence boxes
+ if config.DETECTION_MIN_CONFIDENCE:
+ conf_keep = tf.where(class_scores >= config.DETECTION_MIN_CONFIDENCE)[:, 0]
+ keep = tf.sets.set_intersection(tf.expand_dims(keep, 0),
+ tf.expand_dims(conf_keep, 0))
+ keep = tf.sparse_tensor_to_dense(keep)[0]
+
+ # Apply per-class NMS
+ # 1. Prepare variables
+ pre_nms_class_ids = tf.gather(class_ids, keep)
+ pre_nms_scores = tf.gather(class_scores, keep)
+ pre_nms_rois = tf.gather(refined_rois, keep)
+ unique_pre_nms_class_ids = tf.unique(pre_nms_class_ids)[0]
+
+ def nms_keep_map(class_id):
+ """Apply Non-Maximum Suppression on ROIs of the given class."""
+ # Indices of ROIs of the given class
+ ixs = tf.where(tf.equal(pre_nms_class_ids, class_id))[:, 0]
+ # Apply NMS
+ class_keep = tf.image.non_max_suppression(
+ tf.gather(pre_nms_rois, ixs),
+ tf.gather(pre_nms_scores, ixs),
+ max_output_size=config.DETECTION_MAX_INSTANCES,
+ iou_threshold=config.DETECTION_NMS_THRESHOLD)
+ # Map indices
+ class_keep = tf.gather(keep, tf.gather(ixs, class_keep))
+ # Pad with -1 so returned tensors have the same shape
+ gap = config.DETECTION_MAX_INSTANCES - tf.shape(class_keep)[0]
+ class_keep = tf.pad(class_keep, [(0, gap)],
+ mode='CONSTANT', constant_values=-1)
+ # Set shape so map_fn() can infer result shape
+ class_keep.set_shape([config.DETECTION_MAX_INSTANCES])
+ return class_keep
+
+ # 2. Map over class IDs
+ nms_keep = tf.map_fn(nms_keep_map, unique_pre_nms_class_ids,
+ dtype=tf.int64)
+ # 3. Merge results into one list, and remove -1 padding
+ nms_keep = tf.reshape(nms_keep, [-1])
+ nms_keep = tf.gather(nms_keep, tf.where(nms_keep > -1)[:, 0])
+ # 4. Compute intersection between keep and nms_keep
+ keep = tf.sets.set_intersection(tf.expand_dims(keep, 0),
+ tf.expand_dims(nms_keep, 0))
+ keep = tf.sparse_tensor_to_dense(keep)[0]
+ # Keep top detections
+ roi_count = config.DETECTION_MAX_INSTANCES
+ class_scores_keep = tf.gather(class_scores, keep)
+ num_keep = tf.minimum(tf.shape(class_scores_keep)[0], roi_count)
+ top_ids = tf.nn.top_k(class_scores_keep, k=num_keep, sorted=True)[1]
+ keep = tf.gather(keep, top_ids)
+
+ # Arrange output as [N, (y1, x1, y2, x2, class_id, score)]
+ # Coordinates are normalized.
+ detections = tf.concat([
+ tf.gather(refined_rois, keep),
+ tf.to_float(tf.gather(class_ids, keep))[..., tf.newaxis],
+ tf.gather(class_scores, keep)[..., tf.newaxis]
+ ], axis=1)
+
+ # Pad with zeros if detections < DETECTION_MAX_INSTANCES
+ gap = config.DETECTION_MAX_INSTANCES - tf.shape(detections)[0]
+ detections = tf.pad(detections, [(0, gap), (0, 0)], "CONSTANT")
+ return detections
+
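+# Note on the padding above: with the library's default config value of
+# DETECTION_MAX_INSTANCES (100), the returned tensor is always [100, 6];
+# rows past the actual detections are zero padded.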
+
+class DetectionLayer(KE.Layer):
+ """Takes classified proposal boxes and their bounding box deltas and
+ returns the final detection boxes.
+
+ Returns:
+ [batch, num_detections, (y1, x1, y2, x2, class_id, class_score)] where
+ coordinates are normalized.
+ """
+
+ def __init__(self, config=None, **kwargs):
+ super(DetectionLayer, self).__init__(**kwargs)
+ self.config = config
+
+ def call(self, inputs):
+ rois = inputs[0]
+ mrcnn_class = inputs[1]
+ mrcnn_bbox = inputs[2]
+ image_meta = inputs[3]
+
+ # Get windows of images in normalized coordinates. Windows are the area
+ # in the image that excludes the padding.
+ # Use the shape of the first image in the batch to normalize the window
+ # because we know that all images get resized to the same size.
+ m = parse_image_meta_graph(image_meta)
+ image_shape = m['image_shape'][0]
+ window = norm_boxes_graph(m['window'], image_shape[:2])
+
+ # Run detection refinement graph on each item in the batch
+ detections_batch = utils.batch_slice(
+ [rois, mrcnn_class, mrcnn_bbox, window],
+ lambda x, y, w, z: refine_detections_graph(x, y, w, z, self.config),
+ self.config.IMAGES_PER_GPU)
+
+ # Reshape output
+ # [batch, num_detections, (y1, x1, y2, x2, class_id, class_score)] in
+ # normalized coordinates
+ return tf.reshape(
+ detections_batch,
+ [self.config.BATCH_SIZE, self.config.DETECTION_MAX_INSTANCES, 6])
+
+ def compute_output_shape(self, input_shape):
+ return (None, self.config.DETECTION_MAX_INSTANCES, 6)
+
+
+############################################################
+# Region Proposal Network (RPN)
+############################################################
+
+def rpn_graph(feature_map, anchors_per_location, anchor_stride):
+ """Builds the computation graph of Region Proposal Network.
+
+ feature_map: backbone features [batch, height, width, depth]
+ anchors_per_location: number of anchors per pixel in the feature map
+ anchor_stride: Controls the density of anchors. Typically 1 (anchors for
+ every pixel in the feature map), or 2 (every other pixel).
+
+ Returns:
+ rpn_class_logits: [batch, H * W * anchors_per_location, 2] Anchor classifier logits (before softmax)
+ rpn_probs: [batch, H * W * anchors_per_location, 2] Anchor classifier probabilities.
+ rpn_bbox: [batch, H * W * anchors_per_location, (dy, dx, log(dh), log(dw))] Deltas to be
+ applied to anchors.
+ """
+ # TODO: check if stride of 2 causes alignment issues if the feature map
+ # is not even.
+ # Shared convolutional base of the RPN
+ shared = KL.Conv2D(512, (3, 3), padding='same', activation='relu',
+ strides=anchor_stride,
+ name='rpn_conv_shared')(feature_map)
+
+ # Anchor Score. [batch, height, width, anchors per location * 2].
+ x = KL.Conv2D(2 * anchors_per_location, (1, 1), padding='valid',
+ activation='linear', name='rpn_class_raw')(shared)
+
+ # Reshape to [batch, anchors, 2]
+ rpn_class_logits = KL.Lambda(
+ lambda t: tf.reshape(t, [tf.shape(t)[0], -1, 2]))(x)
+
+ # Softmax on last dimension of BG/FG.
+ rpn_probs = KL.Activation(
+ "softmax", name="rpn_class_xxx")(rpn_class_logits)
+
+ # Bounding box refinement. [batch, H, W, anchors per location * depth]
+ # where depth is [x, y, log(w), log(h)]
+ x = KL.Conv2D(anchors_per_location * 4, (1, 1), padding="valid",
+ activation='linear', name='rpn_bbox_pred')(shared)
+
+ # Reshape to [batch, anchors, 4]
+ rpn_bbox = KL.Lambda(lambda t: tf.reshape(t, [tf.shape(t)[0], -1, 4]))(x)
+
+ return [rpn_class_logits, rpn_probs, rpn_bbox]
+
+
+def build_rpn_model(anchor_stride, anchors_per_location, depth):
+ """Builds a Keras model of the Region Proposal Network.
+ It wraps the RPN graph so it can be used multiple times with shared
+ weights.
+
+ anchors_per_location: number of anchors per pixel in the feature map
+ anchor_stride: Controls the density of anchors. Typically 1 (anchors for
+ every pixel in the feature map), or 2 (every other pixel).
+ depth: Depth of the backbone feature map.
+
+ Returns a Keras Model object. The model outputs, when called, are:
+ rpn_class_logits: [batch, H * W * anchors_per_location, 2] Anchor classifier logits (before softmax)
+ rpn_probs: [batch, H * W * anchors_per_location, 2] Anchor classifier probabilities.
+ rpn_bbox: [batch, H * W * anchors_per_location, (dy, dx, log(dh), log(dw))] Deltas to be
+ applied to anchors.
+ """
+ input_feature_map = KL.Input(shape=[None, None, depth],
+ name="input_rpn_feature_map")
+ outputs = rpn_graph(input_feature_map, anchors_per_location, anchor_stride)
+ return KM.Model([input_feature_map], outputs, name="rpn_model")
+
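+# Usage sketch (mirrors MaskRCNN.build() below): a single RPN model is built
+# once and then called on every FPN level so the weights are shared, e.g.
+#
+#   rpn = build_rpn_model(config.RPN_ANCHOR_STRIDE,
+#                         len(config.RPN_ANCHOR_RATIOS),
+#                         config.TOP_DOWN_PYRAMID_SIZE)
+#   rpn_class_logits, rpn_probs, rpn_bbox = rpn([feature_map])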
+
+############################################################
+# Feature Pyramid Network Heads
+############################################################
+
+def fpn_classifier_graph(rois, feature_maps, image_meta,
+ pool_size, num_classes, train_bn=True,
+ fc_layers_size=1024):
+ """Builds the computation graph of the feature pyramid network classifier
+ and regressor heads.
+
+ rois: [batch, num_rois, (y1, x1, y2, x2)] Proposal boxes in normalized
+ coordinates.
+ feature_maps: List of feature maps from different layers of the pyramid,
+ [P2, P3, P4, P5]. Each has a different resolution.
+ image_meta: [batch, (meta data)] Image details. See compose_image_meta()
+ pool_size: The width of the square feature map generated from ROI Pooling.
+ num_classes: number of classes, which determines the depth of the results
+ train_bn: Boolean. Train or freeze Batch Norm layers
+ fc_layers_size: Size of the 2 FC layers
+
+ Returns:
+ logits: [batch, num_rois, NUM_CLASSES] classifier logits (before softmax)
+ probs: [batch, num_rois, NUM_CLASSES] classifier probabilities
+ bbox_deltas: [batch, num_rois, NUM_CLASSES, (dy, dx, log(dh), log(dw))] Deltas to apply to
+ proposal boxes
+ """
+ # ROI Pooling
+ # Shape: [batch, num_rois, POOL_SIZE, POOL_SIZE, channels]
+ x = PyramidROIAlign([pool_size, pool_size],
+ name="roi_align_classifier")([rois, image_meta] + feature_maps)
+ # Two 1024 FC layers (implemented with Conv2D for consistency)
+ x = KL.TimeDistributed(KL.Conv2D(fc_layers_size, (pool_size, pool_size), padding="valid"),
+ name="mrcnn_class_conv1")(x)
+ x = KL.TimeDistributed(BatchNorm(), name='mrcnn_class_bn1')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+ x = KL.TimeDistributed(KL.Conv2D(fc_layers_size, (1, 1)),
+ name="mrcnn_class_conv2")(x)
+ x = KL.TimeDistributed(BatchNorm(), name='mrcnn_class_bn2')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+
+ shared = KL.Lambda(lambda x: K.squeeze(K.squeeze(x, 3), 2),
+ name="pool_squeeze")(x)
+
+ # Classifier head
+ mrcnn_class_logits = KL.TimeDistributed(KL.Dense(num_classes),
+ name='mrcnn_class_logits')(shared)
+ mrcnn_probs = KL.TimeDistributed(KL.Activation("softmax"),
+ name="mrcnn_class")(mrcnn_class_logits)
+
+ # BBox head
+ # [batch, num_rois, NUM_CLASSES * (dy, dx, log(dh), log(dw))]
+ x = KL.TimeDistributed(KL.Dense(num_classes * 4, activation='linear'),
+ name='mrcnn_bbox_fc')(shared)
+ # Reshape to [batch, num_rois, NUM_CLASSES, (dy, dx, log(dh), log(dw))]
+ s = K.int_shape(x)
+ mrcnn_bbox = KL.Reshape((s[1], num_classes, 4), name="mrcnn_bbox")(x)
+
+ return mrcnn_class_logits, mrcnn_probs, mrcnn_bbox
+
+
+def build_fpn_mask_graph(rois, feature_maps, image_meta,
+ pool_size, num_classes, train_bn=True):
+ """Builds the computation graph of the mask head of Feature Pyramid Network.
+
+ rois: [batch, num_rois, (y1, x1, y2, x2)] Proposal boxes in normalized
+ coordinates.
+ feature_maps: List of feature maps from different layers of the pyramid,
+ [P2, P3, P4, P5]. Each has a different resolution.
+ image_meta: [batch, (meta data)] Image details. See compose_image_meta()
+ pool_size: The width of the square feature map generated from ROI Pooling.
+ num_classes: number of classes, which determines the depth of the results
+ train_bn: Boolean. Train or freeze Batch Norm layers
+
+ Returns: Masks [batch, num_rois, MASK_POOL_SIZE, MASK_POOL_SIZE, NUM_CLASSES]
+ """
+ # ROI Pooling
+ # Shape: [batch, num_rois, MASK_POOL_SIZE, MASK_POOL_SIZE, channels]
+ x = PyramidROIAlign([pool_size, pool_size],
+ name="roi_align_mask")([rois, image_meta] + feature_maps)
+
+ # Conv layers
+ x = KL.TimeDistributed(KL.Conv2D(256, (3, 3), padding="same"),
+ name="mrcnn_mask_conv1")(x)
+ x = KL.TimeDistributed(BatchNorm(),
+ name='mrcnn_mask_bn1')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+
+ x = KL.TimeDistributed(KL.Conv2D(256, (3, 3), padding="same"),
+ name="mrcnn_mask_conv2")(x)
+ x = KL.TimeDistributed(BatchNorm(),
+ name='mrcnn_mask_bn2')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+
+ x = KL.TimeDistributed(KL.Conv2D(256, (3, 3), padding="same"),
+ name="mrcnn_mask_conv3")(x)
+ x = KL.TimeDistributed(BatchNorm(),
+ name='mrcnn_mask_bn3')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+
+ x = KL.TimeDistributed(KL.Conv2D(256, (3, 3), padding="same"),
+ name="mrcnn_mask_conv4")(x)
+ x = KL.TimeDistributed(BatchNorm(),
+ name='mrcnn_mask_bn4')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+
+ x = KL.TimeDistributed(KL.Conv2DTranspose(256, (2, 2), strides=2, activation="relu"),
+ name="mrcnn_mask_deconv")(x)
+ x = KL.TimeDistributed(KL.Conv2D(num_classes, (1, 1), strides=1, activation="sigmoid"),
+ name="mrcnn_mask")(x)
+ return x
+
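+# Shape note (assuming the stock config defaults): MASK_POOL_SIZE = 14 gives a
+# 14x14 ROIAlign output above, and the Conv2DTranspose doubles it to a 28x28
+# mask per class, matching MASK_SHAPE = [28, 28].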
+
+############################################################
+# Loss Functions
+############################################################
+
+def smooth_l1_loss(y_true, y_pred):
+ """Implements Smooth-L1 loss.
+ y_true and y_pred are typically: [N, 4], but could be any shape.
+ """
+ diff = K.abs(y_true - y_pred)
+ less_than_one = K.cast(K.less(diff, 1.0), "float32")
+ loss = (less_than_one * 0.5 * diff**2) + (1 - less_than_one) * (diff - 0.5)
+ return loss
+
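+# Worked example: for an element-wise difference d = |y_true - y_pred|,
+#   d = 0.5  ->  loss = 0.5 * 0.5**2 = 0.125   (quadratic branch, d < 1)
+#   d = 2.0  ->  loss = 2.0 - 0.5    = 1.5     (linear branch, d >= 1)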
+
+def rpn_class_loss_graph(rpn_match, rpn_class_logits):
+ """RPN anchor classifier loss.
+
+ rpn_match: [batch, anchors, 1]. Anchor match type. 1=positive,
+ -1=negative, 0=neutral anchor.
+ rpn_class_logits: [batch, anchors, 2]. RPN classifier logits for BG/FG.
+ """
+ # Squeeze last dim to simplify
+ rpn_match = tf.squeeze(rpn_match, -1)
+ # Get anchor classes. Convert the -1/+1 match to 0/1 values.
+ anchor_class = K.cast(K.equal(rpn_match, 1), tf.int32)
+ # Positive and Negative anchors contribute to the loss,
+ # but neutral anchors (match value = 0) don't.
+ indices = tf.where(K.not_equal(rpn_match, 0))
+ # Pick rows that contribute to the loss and filter out the rest.
+ rpn_class_logits = tf.gather_nd(rpn_class_logits, indices)
+ anchor_class = tf.gather_nd(anchor_class, indices)
+ # Cross entropy loss
+ loss = K.sparse_categorical_crossentropy(target=anchor_class,
+ output=rpn_class_logits,
+ from_logits=True)
+ loss = K.switch(tf.size(loss) > 0, K.mean(loss), tf.constant(0.0))
+ return loss
+
+
+def rpn_bbox_loss_graph(config, target_bbox, rpn_match, rpn_bbox):
+ """Return the RPN bounding box loss graph.
+
+ config: the model config object.
+ target_bbox: [batch, max positive anchors, (dy, dx, log(dh), log(dw))].
+        Uses 0 padding to fill in unused bbox deltas.
+ rpn_match: [batch, anchors, 1]. Anchor match type. 1=positive,
+ -1=negative, 0=neutral anchor.
+ rpn_bbox: [batch, anchors, (dy, dx, log(dh), log(dw))]
+ """
+ # Positive anchors contribute to the loss, but negative and
+ # neutral anchors (match value of 0 or -1) don't.
+ rpn_match = K.squeeze(rpn_match, -1)
+ indices = tf.where(K.equal(rpn_match, 1))
+
+ # Pick bbox deltas that contribute to the loss
+ rpn_bbox = tf.gather_nd(rpn_bbox, indices)
+
+ # Trim target bounding box deltas to the same length as rpn_bbox.
+ batch_counts = K.sum(K.cast(K.equal(rpn_match, 1), tf.int32), axis=1)
+ target_bbox = batch_pack_graph(target_bbox, batch_counts,
+ config.IMAGES_PER_GPU)
+
+ loss = smooth_l1_loss(target_bbox, rpn_bbox)
+
+ loss = K.switch(tf.size(loss) > 0, K.mean(loss), tf.constant(0.0))
+ return loss
+
+
+def mrcnn_class_loss_graph(target_class_ids, pred_class_logits,
+ active_class_ids):
+ """Loss for the classifier head of Mask RCNN.
+
+ target_class_ids: [batch, num_rois]. Integer class IDs. Uses zero
+ padding to fill in the array.
+ pred_class_logits: [batch, num_rois, num_classes]
+ active_class_ids: [batch, num_classes]. Has a value of 1 for
+ classes that are in the dataset of the image, and 0
+ for classes that are not in the dataset.
+ """
+ # During model building, Keras calls this function with
+ # target_class_ids of type float32. Unclear why. Cast it
+ # to int to get around it.
+ target_class_ids = tf.cast(target_class_ids, 'int64')
+
+ # Find predictions of classes that are not in the dataset.
+ pred_class_ids = tf.argmax(pred_class_logits, axis=2)
+ # TODO: Update this line to work with batch > 1. Right now it assumes all
+ # images in a batch have the same active_class_ids
+ pred_active = tf.gather(active_class_ids[0], pred_class_ids)
+
+ # Loss
+ loss = tf.nn.sparse_softmax_cross_entropy_with_logits(
+ labels=target_class_ids, logits=pred_class_logits)
+
+ # Erase losses of predictions of classes that are not in the active
+ # classes of the image.
+ loss = loss * pred_active
+
+    # Compute loss mean. Use only predictions that contribute
+ # to the loss to get a correct mean.
+ loss = tf.reduce_sum(loss) / tf.reduce_sum(pred_active)
+ return loss
+
+
+def mrcnn_bbox_loss_graph(target_bbox, target_class_ids, pred_bbox):
+ """Loss for Mask R-CNN bounding box refinement.
+
+ target_bbox: [batch, num_rois, (dy, dx, log(dh), log(dw))]
+ target_class_ids: [batch, num_rois]. Integer class IDs.
+ pred_bbox: [batch, num_rois, num_classes, (dy, dx, log(dh), log(dw))]
+ """
+ # Reshape to merge batch and roi dimensions for simplicity.
+ target_class_ids = K.reshape(target_class_ids, (-1,))
+ target_bbox = K.reshape(target_bbox, (-1, 4))
+ pred_bbox = K.reshape(pred_bbox, (-1, K.int_shape(pred_bbox)[2], 4))
+
+ # Only positive ROIs contribute to the loss. And only
+ # the right class_id of each ROI. Get their indices.
+ positive_roi_ix = tf.where(target_class_ids > 0)[:, 0]
+ positive_roi_class_ids = tf.cast(
+ tf.gather(target_class_ids, positive_roi_ix), tf.int64)
+ indices = tf.stack([positive_roi_ix, positive_roi_class_ids], axis=1)
+
+ # Gather the deltas (predicted and true) that contribute to loss
+ target_bbox = tf.gather(target_bbox, positive_roi_ix)
+ pred_bbox = tf.gather_nd(pred_bbox, indices)
+
+ # Smooth-L1 Loss
+ loss = K.switch(tf.size(target_bbox) > 0,
+ smooth_l1_loss(y_true=target_bbox, y_pred=pred_bbox),
+ tf.constant(0.0))
+ loss = K.mean(loss)
+ return loss
+
+
+def mrcnn_mask_loss_graph(target_masks, target_class_ids, pred_masks):
+ """Mask binary cross-entropy loss for the masks head.
+
+ target_masks: [batch, num_rois, height, width].
+ A float32 tensor of values 0 or 1. Uses zero padding to fill array.
+ target_class_ids: [batch, num_rois]. Integer class IDs. Zero padded.
+ pred_masks: [batch, proposals, height, width, num_classes] float32 tensor
+ with values from 0 to 1.
+ """
+ # Reshape for simplicity. Merge first two dimensions into one.
+ target_class_ids = K.reshape(target_class_ids, (-1,))
+ mask_shape = tf.shape(target_masks)
+ target_masks = K.reshape(target_masks, (-1, mask_shape[2], mask_shape[3]))
+ pred_shape = tf.shape(pred_masks)
+ pred_masks = K.reshape(pred_masks,
+ (-1, pred_shape[2], pred_shape[3], pred_shape[4]))
+ # Permute predicted masks to [N, num_classes, height, width]
+ pred_masks = tf.transpose(pred_masks, [0, 3, 1, 2])
+
+ # Only positive ROIs contribute to the loss. And only
+ # the class specific mask of each ROI.
+ positive_ix = tf.where(target_class_ids > 0)[:, 0]
+ positive_class_ids = tf.cast(
+ tf.gather(target_class_ids, positive_ix), tf.int64)
+ indices = tf.stack([positive_ix, positive_class_ids], axis=1)
+
+ # Gather the masks (predicted and true) that contribute to loss
+ y_true = tf.gather(target_masks, positive_ix)
+ y_pred = tf.gather_nd(pred_masks, indices)
+
+ # Compute binary cross entropy. If no positive ROIs, then return 0.
+ # shape: [batch, roi, num_classes]
+ loss = K.switch(tf.size(y_true) > 0,
+ K.binary_crossentropy(target=y_true, output=y_pred),
+ tf.constant(0.0))
+ loss = K.mean(loss)
+ return loss
+
+
+############################################################
+# Data Generator
+############################################################
+
+def load_image_gt(dataset, config, image_id, augment=False, augmentation=None,
+ use_mini_mask=False):
+ """Load and return ground truth data for an image (image, mask, bounding boxes).
+
+ augment: (deprecated. Use augmentation instead). If true, apply random
+ image augmentation. Currently, only horizontal flipping is offered.
+ augmentation: Optional. An imgaug (https://github.com/aleju/imgaug) augmentation.
+ For example, passing imgaug.augmenters.Fliplr(0.5) flips images
+ right/left 50% of the time.
+ use_mini_mask: If False, returns full-size masks that are the same height
+ and width as the original image. These can be big, for example
+ 1024x1024x100 (for 100 instances). Mini masks are smaller, typically,
+ 224x224 and are generated by extracting the bounding box of the
+ object and resizing it to MINI_MASK_SHAPE.
+
+ Returns:
+ image: [height, width, 3]
+ shape: the original shape of the image before resizing and cropping.
+ class_ids: [instance_count] Integer class IDs
+ bbox: [instance_count, (y1, x1, y2, x2)]
+ mask: [height, width, instance_count]. The height and width are those
+ of the image unless use_mini_mask is True, in which case they are
+ defined in MINI_MASK_SHAPE.
+ """
+ # Load image and mask
+ image = dataset.load_image(image_id)
+ mask, class_ids = dataset.load_mask(image_id)
+ original_shape = image.shape
+ image, window, scale, padding, crop = utils.resize_image(
+ image,
+ min_dim=config.IMAGE_MIN_DIM,
+ min_scale=config.IMAGE_MIN_SCALE,
+ max_dim=config.IMAGE_MAX_DIM,
+ mode=config.IMAGE_RESIZE_MODE)
+ mask = utils.resize_mask(mask, scale, padding, crop)
+
+ # Random horizontal flips.
+ # TODO: will be removed in a future update in favor of augmentation
+ if augment:
+ logging.warning("'augment' is deprecated. Use 'augmentation' instead.")
+ if random.randint(0, 1):
+ image = np.fliplr(image)
+ mask = np.fliplr(mask)
+
+ # Augmentation
+ # This requires the imgaug lib (https://github.com/aleju/imgaug)
+ if augmentation:
+ import imgaug
+
+ # Augmenters that are safe to apply to masks
+ # Some, such as Affine, have settings that make them unsafe, so always
+ # test your augmentation on masks
+ MASK_AUGMENTERS = ["Sequential", "SomeOf", "OneOf", "Sometimes",
+ "Fliplr", "Flipud", "CropAndPad",
+ "Affine", "PiecewiseAffine"]
+
+ def hook(images, augmenter, parents, default):
+ """Determines which augmenters to apply to masks."""
+ return augmenter.__class__.__name__ in MASK_AUGMENTERS
+
+ # Store shapes before augmentation to compare
+ image_shape = image.shape
+ mask_shape = mask.shape
+ # Make augmenters deterministic to apply similarly to images and masks
+ det = augmentation.to_deterministic()
+ image = det.augment_image(image)
+ # Change mask to np.uint8 because imgaug doesn't support np.bool
+ mask = det.augment_image(mask.astype(np.uint8),
+ hooks=imgaug.HooksImages(activator=hook))
+ # Verify that shapes didn't change
+ assert image.shape == image_shape, "Augmentation shouldn't change image size"
+ assert mask.shape == mask_shape, "Augmentation shouldn't change mask size"
+ # Change mask back to bool
+        mask = mask.astype(bool)
+
+    # Note that some boxes might be all zeros if the corresponding mask got
+    # cropped out, so filter them out here.
+ _idx = np.sum(mask, axis=(0, 1)) > 0
+ mask = mask[:, :, _idx]
+ class_ids = class_ids[_idx]
+ # Bounding boxes. Note that some boxes might be all zeros
+ # if the corresponding mask got cropped out.
+ # bbox: [num_instances, (y1, x1, y2, x2)]
+ bbox = utils.extract_bboxes(mask)
+
+ # Active classes
+ # Different datasets have different classes, so track the
+ # classes supported in the dataset of this image.
+ active_class_ids = np.zeros([dataset.num_classes], dtype=np.int32)
+ source_class_ids = dataset.source_class_ids[dataset.image_info[image_id]["source"]]
+ active_class_ids[source_class_ids] = 1
+
+ # Resize masks to smaller size to reduce memory usage
+ if use_mini_mask:
+ mask = utils.minimize_mask(bbox, mask, config.MINI_MASK_SHAPE)
+
+ # Image meta data
+ image_meta = compose_image_meta(image_id, original_shape, image.shape,
+ window, scale, active_class_ids)
+
+ return image, image_meta, class_ids, bbox, mask
+
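+# Usage sketch (illustrative, handy when debugging a single sample):
+#
+#   image, image_meta, class_ids, bbox, mask = load_image_gt(
+#       dataset, config, image_id, use_mini_mask=config.USE_MINI_MASK)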
+
+def build_detection_targets(rpn_rois, gt_class_ids, gt_boxes, gt_masks, config):
+ """Generate targets for training Stage 2 classifier and mask heads.
+ This is not used in normal training. It's useful for debugging or to train
+ the Mask RCNN heads without using the RPN head.
+
+ Inputs:
+ rpn_rois: [N, (y1, x1, y2, x2)] proposal boxes.
+ gt_class_ids: [instance count] Integer class IDs
+ gt_boxes: [instance count, (y1, x1, y2, x2)]
+ gt_masks: [height, width, instance count] Ground truth masks. Can be full
+ size or mini-masks.
+
+ Returns:
+ rois: [TRAIN_ROIS_PER_IMAGE, (y1, x1, y2, x2)]
+ class_ids: [TRAIN_ROIS_PER_IMAGE]. Integer class IDs.
+ bboxes: [TRAIN_ROIS_PER_IMAGE, NUM_CLASSES, (y, x, log(h), log(w))]. Class-specific
+ bbox refinements.
+    masks: [TRAIN_ROIS_PER_IMAGE, height, width, NUM_CLASSES]. Class-specific masks cropped
+ to bbox boundaries and resized to neural network output size.
+ """
+ assert rpn_rois.shape[0] > 0
+ assert gt_class_ids.dtype == np.int32, "Expected int but got {}".format(
+ gt_class_ids.dtype)
+ assert gt_boxes.dtype == np.int32, "Expected int but got {}".format(
+ gt_boxes.dtype)
+ assert gt_masks.dtype == np.bool_, "Expected bool but got {}".format(
+ gt_masks.dtype)
+
+ # It's common to add GT Boxes to ROIs but we don't do that here because
+ # according to XinLei Chen's paper, it doesn't help.
+
+ # Trim empty padding in gt_boxes and gt_masks parts
+ instance_ids = np.where(gt_class_ids > 0)[0]
+ assert instance_ids.shape[0] > 0, "Image must contain instances."
+ gt_class_ids = gt_class_ids[instance_ids]
+ gt_boxes = gt_boxes[instance_ids]
+ gt_masks = gt_masks[:, :, instance_ids]
+
+ # Compute areas of ROIs and ground truth boxes.
+ rpn_roi_area = (rpn_rois[:, 2] - rpn_rois[:, 0]) * \
+ (rpn_rois[:, 3] - rpn_rois[:, 1])
+ gt_box_area = (gt_boxes[:, 2] - gt_boxes[:, 0]) * \
+ (gt_boxes[:, 3] - gt_boxes[:, 1])
+
+ # Compute overlaps [rpn_rois, gt_boxes]
+ overlaps = np.zeros((rpn_rois.shape[0], gt_boxes.shape[0]))
+ for i in range(overlaps.shape[1]):
+ gt = gt_boxes[i]
+ overlaps[:, i] = utils.compute_iou(
+ gt, rpn_rois, gt_box_area[i], rpn_roi_area)
+
+ # Assign ROIs to GT boxes
+ rpn_roi_iou_argmax = np.argmax(overlaps, axis=1)
+ rpn_roi_iou_max = overlaps[np.arange(
+ overlaps.shape[0]), rpn_roi_iou_argmax]
+ # GT box assigned to each ROI
+ rpn_roi_gt_boxes = gt_boxes[rpn_roi_iou_argmax]
+ rpn_roi_gt_class_ids = gt_class_ids[rpn_roi_iou_argmax]
+
+ # Positive ROIs are those with >= 0.5 IoU with a GT box.
+ fg_ids = np.where(rpn_roi_iou_max > 0.5)[0]
+
+ # Negative ROIs are those with max IoU 0.1-0.5 (hard example mining)
+ # TODO: To hard example mine or not to hard example mine, that's the question
+ # bg_ids = np.where((rpn_roi_iou_max >= 0.1) & (rpn_roi_iou_max < 0.5))[0]
+ bg_ids = np.where(rpn_roi_iou_max < 0.5)[0]
+
+ # Subsample ROIs. Aim for 33% foreground.
+ # FG
+ fg_roi_count = int(config.TRAIN_ROIS_PER_IMAGE * config.ROI_POSITIVE_RATIO)
+ if fg_ids.shape[0] > fg_roi_count:
+ keep_fg_ids = np.random.choice(fg_ids, fg_roi_count, replace=False)
+ else:
+ keep_fg_ids = fg_ids
+ # BG
+ remaining = config.TRAIN_ROIS_PER_IMAGE - keep_fg_ids.shape[0]
+ if bg_ids.shape[0] > remaining:
+ keep_bg_ids = np.random.choice(bg_ids, remaining, replace=False)
+ else:
+ keep_bg_ids = bg_ids
+ # Combine indices of ROIs to keep
+ keep = np.concatenate([keep_fg_ids, keep_bg_ids])
+ # Need more?
+ remaining = config.TRAIN_ROIS_PER_IMAGE - keep.shape[0]
+ if remaining > 0:
+ # Looks like we don't have enough samples to maintain the desired
+ # balance. Reduce requirements and fill in the rest. This is
+ # likely different from the Mask RCNN paper.
+
+ # There is a small chance we have neither fg nor bg samples.
+ if keep.shape[0] == 0:
+ # Pick bg regions with easier IoU threshold
+ bg_ids = np.where(rpn_roi_iou_max < 0.5)[0]
+ assert bg_ids.shape[0] >= remaining
+ keep_bg_ids = np.random.choice(bg_ids, remaining, replace=False)
+ assert keep_bg_ids.shape[0] == remaining
+ keep = np.concatenate([keep, keep_bg_ids])
+ else:
+ # Fill the rest with repeated bg rois.
+ keep_extra_ids = np.random.choice(
+ keep_bg_ids, remaining, replace=True)
+ keep = np.concatenate([keep, keep_extra_ids])
+ assert keep.shape[0] == config.TRAIN_ROIS_PER_IMAGE, \
+ "keep doesn't match ROI batch size {}, {}".format(
+ keep.shape[0], config.TRAIN_ROIS_PER_IMAGE)
+
+ # Reset the gt boxes assigned to BG ROIs.
+ rpn_roi_gt_boxes[keep_bg_ids, :] = 0
+ rpn_roi_gt_class_ids[keep_bg_ids] = 0
+
+ # For each kept ROI, assign a class_id, and for FG ROIs also add bbox refinement.
+ rois = rpn_rois[keep]
+ roi_gt_boxes = rpn_roi_gt_boxes[keep]
+ roi_gt_class_ids = rpn_roi_gt_class_ids[keep]
+ roi_gt_assignment = rpn_roi_iou_argmax[keep]
+
+ # Class-aware bbox deltas. [y, x, log(h), log(w)]
+ bboxes = np.zeros((config.TRAIN_ROIS_PER_IMAGE,
+ config.NUM_CLASSES, 4), dtype=np.float32)
+ pos_ids = np.where(roi_gt_class_ids > 0)[0]
+ bboxes[pos_ids, roi_gt_class_ids[pos_ids]] = utils.box_refinement(
+ rois[pos_ids], roi_gt_boxes[pos_ids, :4])
+ # Normalize bbox refinements
+ bboxes /= config.BBOX_STD_DEV
+
+ # Generate class-specific target masks
+ masks = np.zeros((config.TRAIN_ROIS_PER_IMAGE, config.MASK_SHAPE[0], config.MASK_SHAPE[1], config.NUM_CLASSES),
+ dtype=np.float32)
+ for i in pos_ids:
+ class_id = roi_gt_class_ids[i]
+ assert class_id > 0, "class id must be greater than 0"
+ gt_id = roi_gt_assignment[i]
+ class_mask = gt_masks[:, :, gt_id]
+
+ if config.USE_MINI_MASK:
+ # Create a mask placeholder, the size of the image
+ placeholder = np.zeros(config.IMAGE_SHAPE[:2], dtype=bool)
+ # GT box
+ gt_y1, gt_x1, gt_y2, gt_x2 = gt_boxes[gt_id]
+ gt_w = gt_x2 - gt_x1
+ gt_h = gt_y2 - gt_y1
+ # Resize mini mask to size of GT box
+ placeholder[gt_y1:gt_y2, gt_x1:gt_x2] = \
+ np.round(utils.resize(class_mask, (gt_h, gt_w))).astype(bool)
+            # Place the mini mask in the placeholder
+ class_mask = placeholder
+
+ # Pick part of the mask and resize it
+ y1, x1, y2, x2 = rois[i].astype(np.int32)
+ m = class_mask[y1:y2, x1:x2]
+ mask = utils.resize(m, config.MASK_SHAPE)
+ masks[i, :, :, class_id] = mask
+
+ return rois, roi_gt_class_ids, bboxes, masks
+
+
+def build_rpn_targets(image_shape, anchors, gt_class_ids, gt_boxes, config):
+ """Given the anchors and GT boxes, compute overlaps and identify positive
+ anchors and deltas to refine them to match their corresponding GT boxes.
+
+ anchors: [num_anchors, (y1, x1, y2, x2)]
+ gt_class_ids: [num_gt_boxes] Integer class IDs.
+ gt_boxes: [num_gt_boxes, (y1, x1, y2, x2)]
+
+ Returns:
+ rpn_match: [N] (int32) matches between anchors and GT boxes.
+ 1 = positive anchor, -1 = negative anchor, 0 = neutral
+ rpn_bbox: [N, (dy, dx, log(dh), log(dw))] Anchor bbox deltas.
+ """
+ # RPN Match: 1 = positive anchor, -1 = negative anchor, 0 = neutral
+ rpn_match = np.zeros([anchors.shape[0]], dtype=np.int32)
+ # RPN bounding boxes: [max anchors per image, (dy, dx, log(dh), log(dw))]
+ rpn_bbox = np.zeros((config.RPN_TRAIN_ANCHORS_PER_IMAGE, 4))
+
+ # Handle COCO crowds
+ # A crowd box in COCO is a bounding box around several instances. Exclude
+ # them from training. A crowd box is given a negative class ID.
+ crowd_ix = np.where(gt_class_ids < 0)[0]
+ if crowd_ix.shape[0] > 0:
+ # Filter out crowds from ground truth class IDs and boxes
+ non_crowd_ix = np.where(gt_class_ids > 0)[0]
+ crowd_boxes = gt_boxes[crowd_ix]
+ gt_class_ids = gt_class_ids[non_crowd_ix]
+ gt_boxes = gt_boxes[non_crowd_ix]
+ # Compute overlaps with crowd boxes [anchors, crowds]
+ crowd_overlaps = utils.compute_overlaps(anchors, crowd_boxes)
+ crowd_iou_max = np.amax(crowd_overlaps, axis=1)
+ no_crowd_bool = (crowd_iou_max < 0.001)
+ else:
+ # All anchors don't intersect a crowd
+ no_crowd_bool = np.ones([anchors.shape[0]], dtype=bool)
+
+ # Compute overlaps [num_anchors, num_gt_boxes]
+ overlaps = utils.compute_overlaps(anchors, gt_boxes)
+
+ # Match anchors to GT Boxes
+ # If an anchor overlaps a GT box with IoU >= 0.7 then it's positive.
+ # If an anchor overlaps a GT box with IoU < 0.3 then it's negative.
+ # Neutral anchors are those that don't match the conditions above,
+ # and they don't influence the loss function.
+ # However, don't keep any GT box unmatched (rare, but happens). Instead,
+ # match it to the closest anchor (even if its max IoU is < 0.3).
+ #
+ # 1. Set negative anchors first. They get overwritten below if a GT box is
+ # matched to them. Skip boxes in crowd areas.
+ anchor_iou_argmax = np.argmax(overlaps, axis=1)
+ anchor_iou_max = overlaps[np.arange(overlaps.shape[0]), anchor_iou_argmax]
+ rpn_match[(anchor_iou_max < 0.3) & (no_crowd_bool)] = -1
+ # 2. Set an anchor for each GT box (regardless of IoU value).
+    # If multiple anchors have the same IoU, match all of them
+    gt_iou_argmax = np.argwhere(overlaps == np.max(overlaps, axis=0))[:, 0]
+ rpn_match[gt_iou_argmax] = 1
+ # 3. Set anchors with high overlap as positive.
+ rpn_match[anchor_iou_max >= 0.7] = 1
+
+ # Subsample to balance positive and negative anchors
+ # Don't let positives be more than half the anchors
+ ids = np.where(rpn_match == 1)[0]
+ extra = len(ids) - (config.RPN_TRAIN_ANCHORS_PER_IMAGE // 2)
+ if extra > 0:
+ # Reset the extra ones to neutral
+ ids = np.random.choice(ids, extra, replace=False)
+ rpn_match[ids] = 0
+ # Same for negative proposals
+ ids = np.where(rpn_match == -1)[0]
+ extra = len(ids) - (config.RPN_TRAIN_ANCHORS_PER_IMAGE -
+ np.sum(rpn_match == 1))
+ if extra > 0:
+        # Reset the extra ones to neutral
+ ids = np.random.choice(ids, extra, replace=False)
+ rpn_match[ids] = 0
+
+ # For positive anchors, compute shift and scale needed to transform them
+ # to match the corresponding GT boxes.
+ ids = np.where(rpn_match == 1)[0]
+ ix = 0 # index into rpn_bbox
+ # TODO: use box_refinement() rather than duplicating the code here
+ for i, a in zip(ids, anchors[ids]):
+ # Closest gt box (it might have IoU < 0.7)
+ gt = gt_boxes[anchor_iou_argmax[i]]
+
+ # Convert coordinates to center plus width/height.
+ # GT Box
+ gt_h = gt[2] - gt[0]
+ gt_w = gt[3] - gt[1]
+ gt_center_y = gt[0] + 0.5 * gt_h
+ gt_center_x = gt[1] + 0.5 * gt_w
+ # Anchor
+ a_h = a[2] - a[0]
+ a_w = a[3] - a[1]
+ a_center_y = a[0] + 0.5 * a_h
+ a_center_x = a[1] + 0.5 * a_w
+
+ # Compute the bbox refinement that the RPN should predict.
+ rpn_bbox[ix] = [
+ (gt_center_y - a_center_y) / a_h,
+ (gt_center_x - a_center_x) / a_w,
+ np.log(gt_h / a_h),
+ np.log(gt_w / a_w),
+ ]
+ # Normalize
+ rpn_bbox[ix] /= config.RPN_BBOX_STD_DEV
+ ix += 1
+
+ return rpn_match, rpn_bbox
+
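+# Worked example of the refinement above (illustrative numbers): an anchor
+# a = (y1, x1, y2, x2) = (0, 0, 10, 10) matched to gt = (2, 2, 12, 12) gives
+#   a_h = a_w = 10, a_center = (5, 5); gt_h = gt_w = 10, gt_center = (7, 7)
+#   dy = (7 - 5) / 10 = 0.2, dx = 0.2, log(dh) = log(10 / 10) = 0, log(dw) = 0
+# before the division by RPN_BBOX_STD_DEV.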
+
+def generate_random_rois(image_shape, count, gt_class_ids, gt_boxes):
+ """Generates ROI proposals similar to what a region proposal network
+ would generate.
+
+ image_shape: [Height, Width, Depth]
+ count: Number of ROIs to generate
+ gt_class_ids: [N] Integer ground truth class IDs
+ gt_boxes: [N, (y1, x1, y2, x2)] Ground truth boxes in pixels.
+
+ Returns: [count, (y1, x1, y2, x2)] ROI boxes in pixels.
+ """
+ # placeholder
+ rois = np.zeros((count, 4), dtype=np.int32)
+
+ # Generate random ROIs around GT boxes (90% of count)
+ rois_per_box = int(0.9 * count / gt_boxes.shape[0])
+ for i in range(gt_boxes.shape[0]):
+ gt_y1, gt_x1, gt_y2, gt_x2 = gt_boxes[i]
+ h = gt_y2 - gt_y1
+ w = gt_x2 - gt_x1
+ # random boundaries
+ r_y1 = max(gt_y1 - h, 0)
+ r_y2 = min(gt_y2 + h, image_shape[0])
+ r_x1 = max(gt_x1 - w, 0)
+ r_x2 = min(gt_x2 + w, image_shape[1])
+
+ # To avoid generating boxes with zero area, we generate double what
+ # we need and filter out the extra. If we get fewer valid boxes
+ # than we need, we loop and try again.
+ while True:
+ y1y2 = np.random.randint(r_y1, r_y2, (rois_per_box * 2, 2))
+ x1x2 = np.random.randint(r_x1, r_x2, (rois_per_box * 2, 2))
+ # Filter out zero area boxes
+ threshold = 1
+ y1y2 = y1y2[np.abs(y1y2[:, 0] - y1y2[:, 1]) >=
+ threshold][:rois_per_box]
+ x1x2 = x1x2[np.abs(x1x2[:, 0] - x1x2[:, 1]) >=
+ threshold][:rois_per_box]
+ if y1y2.shape[0] == rois_per_box and x1x2.shape[0] == rois_per_box:
+ break
+
+ # Sort on axis 1 to ensure x1 <= x2 and y1 <= y2 and then reshape
+ # into x1, y1, x2, y2 order
+ x1, x2 = np.split(np.sort(x1x2, axis=1), 2, axis=1)
+ y1, y2 = np.split(np.sort(y1y2, axis=1), 2, axis=1)
+ box_rois = np.hstack([y1, x1, y2, x2])
+ rois[rois_per_box * i:rois_per_box * (i + 1)] = box_rois
+
+ # Generate random ROIs anywhere in the image (10% of count)
+ remaining_count = count - (rois_per_box * gt_boxes.shape[0])
+ # To avoid generating boxes with zero area, we generate double what
+ # we need and filter out the extra. If we get fewer valid boxes
+ # than we need, we loop and try again.
+ while True:
+ y1y2 = np.random.randint(0, image_shape[0], (remaining_count * 2, 2))
+ x1x2 = np.random.randint(0, image_shape[1], (remaining_count * 2, 2))
+ # Filter out zero area boxes
+ threshold = 1
+ y1y2 = y1y2[np.abs(y1y2[:, 0] - y1y2[:, 1]) >=
+ threshold][:remaining_count]
+ x1x2 = x1x2[np.abs(x1x2[:, 0] - x1x2[:, 1]) >=
+ threshold][:remaining_count]
+ if y1y2.shape[0] == remaining_count and x1x2.shape[0] == remaining_count:
+ break
+
+ # Sort on axis 1 to ensure x1 <= x2 and y1 <= y2 and then reshape
+ # into x1, y1, x2, y2 order
+ x1, x2 = np.split(np.sort(x1x2, axis=1), 2, axis=1)
+ y1, y2 = np.split(np.sort(y1y2, axis=1), 2, axis=1)
+ global_rois = np.hstack([y1, x1, y2, x2])
+ rois[-remaining_count:] = global_rois
+ return rois
+
+
+def data_generator(dataset, config, shuffle=True, augment=False, augmentation=None,
+ random_rois=0, batch_size=1, detection_targets=False,
+ no_augmentation_sources=None):
+ """A generator that returns images and corresponding target class ids,
+ bounding box deltas, and masks.
+
+ dataset: The Dataset object to pick data from
+ config: The model config object
+ shuffle: If True, shuffles the samples before every epoch
+ augment: (deprecated. Use augmentation instead). If true, apply random
+ image augmentation. Currently, only horizontal flipping is offered.
+ augmentation: Optional. An imgaug (https://github.com/aleju/imgaug) augmentation.
+ For example, passing imgaug.augmenters.Fliplr(0.5) flips images
+ right/left 50% of the time.
+ random_rois: If > 0 then generate proposals to be used to train the
+ network classifier and mask heads. Useful if training
+ the Mask RCNN part without the RPN.
+ batch_size: How many images to return in each call
+ detection_targets: If True, generate detection targets (class IDs, bbox
+ deltas, and masks). Typically for debugging or visualizations because
+        in training, detection targets are generated by DetectionTargetLayer.
+ no_augmentation_sources: Optional. List of sources to exclude for
+        augmentation. A source is a string that identifies a dataset and is
+ defined in the Dataset class.
+
+ Returns a Python generator. Upon calling next() on it, the
+ generator returns two lists, inputs and outputs. The contents
+    of the lists differ depending on the received arguments:
+ inputs list:
+ - images: [batch, H, W, C]
+ - image_meta: [batch, (meta data)] Image details. See compose_image_meta()
+ - rpn_match: [batch, N] Integer (1=positive anchor, -1=negative, 0=neutral)
+ - rpn_bbox: [batch, N, (dy, dx, log(dh), log(dw))] Anchor bbox deltas.
+ - gt_class_ids: [batch, MAX_GT_INSTANCES] Integer class IDs
+ - gt_boxes: [batch, MAX_GT_INSTANCES, (y1, x1, y2, x2)]
+ - gt_masks: [batch, height, width, MAX_GT_INSTANCES]. The height and width
+ are those of the image unless use_mini_mask is True, in which
+ case they are defined in MINI_MASK_SHAPE.
+
+ outputs list: Usually empty in regular training. But if detection_targets
+ is True then the outputs list contains target class_ids, bbox deltas,
+ and masks.
+ """
+ b = 0 # batch item index
+ image_index = -1
+ image_ids = np.copy(dataset.image_ids)
+ error_count = 0
+ no_augmentation_sources = no_augmentation_sources or []
+
+ # Anchors
+ # [anchor_count, (y1, x1, y2, x2)]
+ backbone_shapes = compute_backbone_shapes(config, config.IMAGE_SHAPE)
+ anchors = utils.generate_pyramid_anchors(config.RPN_ANCHOR_SCALES,
+ config.RPN_ANCHOR_RATIOS,
+ backbone_shapes,
+ config.BACKBONE_STRIDES,
+ config.RPN_ANCHOR_STRIDE)
+
+ # Keras requires a generator to run indefinitely.
+ while True:
+ try:
+ # Increment index to pick next image. Shuffle if at the start of an epoch.
+ image_index = (image_index + 1) % len(image_ids)
+ if shuffle and image_index == 0:
+ np.random.shuffle(image_ids)
+
+ # Get GT bounding boxes and masks for image.
+ image_id = image_ids[image_index]
+
+ # If the image source is not to be augmented pass None as augmentation
+ if dataset.image_info[image_id]['source'] in no_augmentation_sources:
+ image, image_meta, gt_class_ids, gt_boxes, gt_masks = \
+ load_image_gt(dataset, config, image_id, augment=augment,
+ augmentation=None,
+ use_mini_mask=config.USE_MINI_MASK)
+ else:
+ image, image_meta, gt_class_ids, gt_boxes, gt_masks = \
+ load_image_gt(dataset, config, image_id, augment=augment,
+ augmentation=augmentation,
+ use_mini_mask=config.USE_MINI_MASK)
+
+ # Skip images that have no instances. This can happen in cases
+ # where we train on a subset of classes and the image doesn't
+ # have any of the classes we care about.
+ if not np.any(gt_class_ids > 0):
+ continue
+
+ # RPN Targets
+ rpn_match, rpn_bbox = build_rpn_targets(image.shape, anchors,
+ gt_class_ids, gt_boxes, config)
+
+ # Mask R-CNN Targets
+ if random_rois:
+ rpn_rois = generate_random_rois(
+ image.shape, random_rois, gt_class_ids, gt_boxes)
+ if detection_targets:
+ rois, mrcnn_class_ids, mrcnn_bbox, mrcnn_mask =\
+ build_detection_targets(
+ rpn_rois, gt_class_ids, gt_boxes, gt_masks, config)
+
+ # Init batch arrays
+ if b == 0:
+ batch_image_meta = np.zeros(
+ (batch_size,) + image_meta.shape, dtype=image_meta.dtype)
+ batch_rpn_match = np.zeros(
+ [batch_size, anchors.shape[0], 1], dtype=rpn_match.dtype)
+ batch_rpn_bbox = np.zeros(
+ [batch_size, config.RPN_TRAIN_ANCHORS_PER_IMAGE, 4], dtype=rpn_bbox.dtype)
+ batch_images = np.zeros(
+ (batch_size,) + image.shape, dtype=np.float32)
+ batch_gt_class_ids = np.zeros(
+ (batch_size, config.MAX_GT_INSTANCES), dtype=np.int32)
+ batch_gt_boxes = np.zeros(
+ (batch_size, config.MAX_GT_INSTANCES, 4), dtype=np.int32)
+ batch_gt_masks = np.zeros(
+ (batch_size, gt_masks.shape[0], gt_masks.shape[1],
+ config.MAX_GT_INSTANCES), dtype=gt_masks.dtype)
+ if random_rois:
+ batch_rpn_rois = np.zeros(
+ (batch_size, rpn_rois.shape[0], 4), dtype=rpn_rois.dtype)
+ if detection_targets:
+ batch_rois = np.zeros(
+ (batch_size,) + rois.shape, dtype=rois.dtype)
+ batch_mrcnn_class_ids = np.zeros(
+ (batch_size,) + mrcnn_class_ids.shape, dtype=mrcnn_class_ids.dtype)
+ batch_mrcnn_bbox = np.zeros(
+ (batch_size,) + mrcnn_bbox.shape, dtype=mrcnn_bbox.dtype)
+ batch_mrcnn_mask = np.zeros(
+ (batch_size,) + mrcnn_mask.shape, dtype=mrcnn_mask.dtype)
+
+            # If there are more instances than fit in the array, sub-sample from them.
+ if gt_boxes.shape[0] > config.MAX_GT_INSTANCES:
+ ids = np.random.choice(
+ np.arange(gt_boxes.shape[0]), config.MAX_GT_INSTANCES, replace=False)
+ gt_class_ids = gt_class_ids[ids]
+ gt_boxes = gt_boxes[ids]
+ gt_masks = gt_masks[:, :, ids]
+
+ # Add to batch
+ batch_image_meta[b] = image_meta
+ batch_rpn_match[b] = rpn_match[:, np.newaxis]
+ batch_rpn_bbox[b] = rpn_bbox
+ batch_images[b] = mold_image(image.astype(np.float32), config)
+ batch_gt_class_ids[b, :gt_class_ids.shape[0]] = gt_class_ids
+ batch_gt_boxes[b, :gt_boxes.shape[0]] = gt_boxes
+ batch_gt_masks[b, :, :, :gt_masks.shape[-1]] = gt_masks
+ if random_rois:
+ batch_rpn_rois[b] = rpn_rois
+ if detection_targets:
+ batch_rois[b] = rois
+ batch_mrcnn_class_ids[b] = mrcnn_class_ids
+ batch_mrcnn_bbox[b] = mrcnn_bbox
+ batch_mrcnn_mask[b] = mrcnn_mask
+ b += 1
+
+ # Batch full?
+ if b >= batch_size:
+ inputs = [batch_images, batch_image_meta, batch_rpn_match, batch_rpn_bbox,
+ batch_gt_class_ids, batch_gt_boxes, batch_gt_masks]
+ outputs = []
+
+ if random_rois:
+ inputs.extend([batch_rpn_rois])
+ if detection_targets:
+ inputs.extend([batch_rois])
+ # Keras requires that output and targets have the same number of dimensions
+ batch_mrcnn_class_ids = np.expand_dims(
+ batch_mrcnn_class_ids, -1)
+ outputs.extend(
+ [batch_mrcnn_class_ids, batch_mrcnn_bbox, batch_mrcnn_mask])
+
+ yield inputs, outputs
+
+ # start a new batch
+ b = 0
+ except (GeneratorExit, KeyboardInterrupt):
+ raise
+ except:
+ # Log it and skip the image
+ logging.exception("Error processing image {}".format(
+ dataset.image_info[image_id]))
+ error_count += 1
+ if error_count > 5:
+ raise
+
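+# Usage sketch (illustrative; dataset_train stands for a prepared Dataset and
+# augmentation for an optional imgaug augmenter):
+#
+#   train_generator = data_generator(dataset_train, config, shuffle=True,
+#                                    augmentation=augmentation,
+#                                    batch_size=config.BATCH_SIZE)
+#   inputs, outputs = next(train_generator)  # outputs is [] in normal training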
+
+############################################################
+# MaskRCNN Class
+############################################################
+
+class MaskRCNN():
+ """Encapsulates the Mask RCNN model functionality.
+
+ The actual Keras model is in the keras_model property.
+ """
+
+ def __init__(self, mode, config, model_dir):
+ """
+ mode: Either "training" or "inference"
+ config: A Sub-class of the Config class
+ model_dir: Directory to save training logs and trained weights
+ """
+ assert mode in ['training', 'inference']
+ self.mode = mode
+ self.config = config
+ self.model_dir = model_dir
+ self.set_log_dir()
+ self.keras_model = self.build(mode=mode, config=config)
+
+ def build(self, mode, config):
+ """Build Mask R-CNN architecture.
+ input_shape: The shape of the input image.
+ mode: Either "training" or "inference". The inputs and
+ outputs of the model differ accordingly.
+ """
+ assert mode in ['training', 'inference']
+
+        # Image size must be divisible by 2 multiple times
+ h, w = config.IMAGE_SHAPE[:2]
+ if h / 2**6 != int(h / 2**6) or w / 2**6 != int(w / 2**6):
+            raise Exception("Image size must be divisible by 2 at least 6 times "
+                            "to avoid fractions when downscaling and upscaling. "
+                            "For example, use 256, 320, 384, 448, 512, ... etc. ")
+
+ # Inputs
+ input_image = KL.Input(
+ shape=[None, None, config.IMAGE_SHAPE[2]], name="input_image")
+ input_image_meta = KL.Input(shape=[config.IMAGE_META_SIZE],
+ name="input_image_meta")
+ if mode == "training":
+ # RPN GT
+ input_rpn_match = KL.Input(
+ shape=[None, 1], name="input_rpn_match", dtype=tf.int32)
+ input_rpn_bbox = KL.Input(
+ shape=[None, 4], name="input_rpn_bbox", dtype=tf.float32)
+
+ # Detection GT (class IDs, bounding boxes, and masks)
+ # 1. GT Class IDs (zero padded)
+ input_gt_class_ids = KL.Input(
+ shape=[None], name="input_gt_class_ids", dtype=tf.int32)
+ # 2. GT Boxes in pixels (zero padded)
+ # [batch, MAX_GT_INSTANCES, (y1, x1, y2, x2)] in image coordinates
+ input_gt_boxes = KL.Input(
+ shape=[None, 4], name="input_gt_boxes", dtype=tf.float32)
+ # Normalize coordinates
+ gt_boxes = KL.Lambda(lambda x: norm_boxes_graph(
+ x, K.shape(input_image)[1:3]))(input_gt_boxes)
+ # 3. GT Masks (zero padded)
+ # [batch, height, width, MAX_GT_INSTANCES]
+ if config.USE_MINI_MASK:
+ input_gt_masks = KL.Input(
+ shape=[config.MINI_MASK_SHAPE[0],
+ config.MINI_MASK_SHAPE[1], None],
+ name="input_gt_masks", dtype=bool)
+ else:
+ input_gt_masks = KL.Input(
+ shape=[config.IMAGE_SHAPE[0], config.IMAGE_SHAPE[1], None],
+ name="input_gt_masks", dtype=bool)
+ elif mode == "inference":
+ # Anchors in normalized coordinates
+ input_anchors = KL.Input(shape=[None, 4], name="input_anchors")
+
+ # Build the shared convolutional layers.
+ # Bottom-up Layers
+ # Returns a list of the last layers of each stage, 5 in total.
+        # Stage 5 (C5) is created as well (stage5=True) and feeds the top of the FPN.
+ if callable(config.BACKBONE):
+ _, C2, C3, C4, C5 = config.BACKBONE(input_image, stage5=True,
+ train_bn=config.TRAIN_BN)
+ else:
+ _, C2, C3, C4, C5 = resnet_graph(input_image, config.BACKBONE,
+ stage5=True, train_bn=config.TRAIN_BN)
+ # Top-down Layers
+        # TODO: add assert to verify feature map sizes match what's in config
+ P5 = KL.Conv2D(config.TOP_DOWN_PYRAMID_SIZE, (1, 1), name='fpn_c5p5')(C5)
+ P4 = KL.Add(name="fpn_p4add")([
+ KL.UpSampling2D(size=(2, 2), name="fpn_p5upsampled")(P5),
+ KL.Conv2D(config.TOP_DOWN_PYRAMID_SIZE, (1, 1), name='fpn_c4p4')(C4)])
+ P3 = KL.Add(name="fpn_p3add")([
+ KL.UpSampling2D(size=(2, 2), name="fpn_p4upsampled")(P4),
+ KL.Conv2D(config.TOP_DOWN_PYRAMID_SIZE, (1, 1), name='fpn_c3p3')(C3)])
+ P2 = KL.Add(name="fpn_p2add")([
+ KL.UpSampling2D(size=(2, 2), name="fpn_p3upsampled")(P3),
+ KL.Conv2D(config.TOP_DOWN_PYRAMID_SIZE, (1, 1), name='fpn_c2p2')(C2)])
+ # Attach 3x3 conv to all P layers to get the final feature maps.
+ P2 = KL.Conv2D(config.TOP_DOWN_PYRAMID_SIZE, (3, 3), padding="SAME", name="fpn_p2")(P2)
+ P3 = KL.Conv2D(config.TOP_DOWN_PYRAMID_SIZE, (3, 3), padding="SAME", name="fpn_p3")(P3)
+ P4 = KL.Conv2D(config.TOP_DOWN_PYRAMID_SIZE, (3, 3), padding="SAME", name="fpn_p4")(P4)
+ P5 = KL.Conv2D(config.TOP_DOWN_PYRAMID_SIZE, (3, 3), padding="SAME", name="fpn_p5")(P5)
+ # P6 is used for the 5th anchor scale in RPN. Generated by
+ # subsampling from P5 with stride of 2.
+ P6 = KL.MaxPooling2D(pool_size=(1, 1), strides=2, name="fpn_p6")(P5)
+
+ # Note that P6 is used in RPN, but not in the classifier heads.
+ rpn_feature_maps = [P2, P3, P4, P5, P6]
+ mrcnn_feature_maps = [P2, P3, P4, P5]
+
+ # Anchors
+ if mode == "training":
+ anchors = self.get_anchors(config.IMAGE_SHAPE)
+ # Duplicate across the batch dimension because Keras requires it
+ # TODO: can this be optimized to avoid duplicating the anchors?
+ anchors = np.broadcast_to(anchors, (config.BATCH_SIZE,) + anchors.shape)
+ # A hack to get around Keras's bad support for constants
+ anchors = KL.Lambda(lambda x: tf.Variable(anchors), name="anchors")(input_image)
+ else:
+ anchors = input_anchors
+
+ # RPN Model
+ rpn = build_rpn_model(config.RPN_ANCHOR_STRIDE,
+ len(config.RPN_ANCHOR_RATIOS), config.TOP_DOWN_PYRAMID_SIZE)
+ # Loop through pyramid layers
+ layer_outputs = [] # list of lists
+ for p in rpn_feature_maps:
+ layer_outputs.append(rpn([p]))
+ # Concatenate layer outputs
+ # Convert from list of lists of level outputs to list of lists
+ # of outputs across levels.
+ # e.g. [[a1, b1, c1], [a2, b2, c2]] => [[a1, a2], [b1, b2], [c1, c2]]
+ output_names = ["rpn_class_logits", "rpn_class", "rpn_bbox"]
+ outputs = list(zip(*layer_outputs))
+ outputs = [KL.Concatenate(axis=1, name=n)(list(o))
+ for o, n in zip(outputs, output_names)]
+
+ rpn_class_logits, rpn_class, rpn_bbox = outputs
+
+ # Generate proposals
+ # Proposals are [batch, N, (y1, x1, y2, x2)] in normalized coordinates
+ # and zero padded.
+ proposal_count = config.POST_NMS_ROIS_TRAINING if mode == "training"\
+ else config.POST_NMS_ROIS_INFERENCE
+ rpn_rois = ProposalLayer(
+ proposal_count=proposal_count,
+ nms_threshold=config.RPN_NMS_THRESHOLD,
+ name="ROI",
+ config=config)([rpn_class, rpn_bbox, anchors])
+
+ if mode == "training":
+ # Class ID mask to mark class IDs supported by the dataset the image
+ # came from.
+ active_class_ids = KL.Lambda(
+ lambda x: parse_image_meta_graph(x)["active_class_ids"]
+ )(input_image_meta)
+
+ if not config.USE_RPN_ROIS:
+ # Ignore predicted ROIs and use ROIs provided as an input.
+ input_rois = KL.Input(shape=[config.POST_NMS_ROIS_TRAINING, 4],
+ name="input_roi", dtype=np.int32)
+ # Normalize coordinates
+ target_rois = KL.Lambda(lambda x: norm_boxes_graph(
+ x, K.shape(input_image)[1:3]))(input_rois)
+ else:
+ target_rois = rpn_rois
+
+ # Generate detection targets
+ # Subsamples proposals and generates target outputs for training
+ # Note that proposal class IDs, gt_boxes, and gt_masks are zero
+ # padded. Equally, returned rois and targets are zero padded.
+ rois, target_class_ids, target_bbox, target_mask =\
+ DetectionTargetLayer(config, name="proposal_targets")([
+ target_rois, input_gt_class_ids, gt_boxes, input_gt_masks])
+
+ # Network Heads
+ # TODO: verify that this handles zero padded ROIs
+ mrcnn_class_logits, mrcnn_class, mrcnn_bbox =\
+ fpn_classifier_graph(rois, mrcnn_feature_maps, input_image_meta,
+ config.POOL_SIZE, config.NUM_CLASSES,
+ train_bn=config.TRAIN_BN,
+ fc_layers_size=config.FPN_CLASSIF_FC_LAYERS_SIZE)
+
+ mrcnn_mask = build_fpn_mask_graph(rois, mrcnn_feature_maps,
+ input_image_meta,
+ config.MASK_POOL_SIZE,
+ config.NUM_CLASSES,
+ train_bn=config.TRAIN_BN)
+
+            # TODO: clean up (use tf.identity if necessary)
+ output_rois = KL.Lambda(lambda x: x * 1, name="output_rois")(rois)
+
+ # Losses
+ rpn_class_loss = KL.Lambda(lambda x: rpn_class_loss_graph(*x), name="rpn_class_loss")(
+ [input_rpn_match, rpn_class_logits])
+ rpn_bbox_loss = KL.Lambda(lambda x: rpn_bbox_loss_graph(config, *x), name="rpn_bbox_loss")(
+ [input_rpn_bbox, input_rpn_match, rpn_bbox])
+ class_loss = KL.Lambda(lambda x: mrcnn_class_loss_graph(*x), name="mrcnn_class_loss")(
+ [target_class_ids, mrcnn_class_logits, active_class_ids])
+ bbox_loss = KL.Lambda(lambda x: mrcnn_bbox_loss_graph(*x), name="mrcnn_bbox_loss")(
+ [target_bbox, target_class_ids, mrcnn_bbox])
+ mask_loss = KL.Lambda(lambda x: mrcnn_mask_loss_graph(*x), name="mrcnn_mask_loss")(
+ [target_mask, target_class_ids, mrcnn_mask])
+
+ # Model
+ inputs = [input_image, input_image_meta,
+ input_rpn_match, input_rpn_bbox, input_gt_class_ids, input_gt_boxes, input_gt_masks]
+ if not config.USE_RPN_ROIS:
+ inputs.append(input_rois)
+ outputs = [rpn_class_logits, rpn_class, rpn_bbox,
+ mrcnn_class_logits, mrcnn_class, mrcnn_bbox, mrcnn_mask,
+ rpn_rois, output_rois,
+ rpn_class_loss, rpn_bbox_loss, class_loss, bbox_loss, mask_loss]
+ model = KM.Model(inputs, outputs, name='mask_rcnn')
+ else:
+ # Network Heads
+ # Proposal classifier and BBox regressor heads
+ mrcnn_class_logits, mrcnn_class, mrcnn_bbox =\
+ fpn_classifier_graph(rpn_rois, mrcnn_feature_maps, input_image_meta,
+ config.POOL_SIZE, config.NUM_CLASSES,
+ train_bn=config.TRAIN_BN,
+ fc_layers_size=config.FPN_CLASSIF_FC_LAYERS_SIZE)
+
+ # Detections
+ # output is [batch, num_detections, (y1, x1, y2, x2, class_id, score)] in
+ # normalized coordinates
+ detections = DetectionLayer(config, name="mrcnn_detection")(
+ [rpn_rois, mrcnn_class, mrcnn_bbox, input_image_meta])
+
+ # Create masks for detections
+ detection_boxes = KL.Lambda(lambda x: x[..., :4])(detections)
+ mrcnn_mask = build_fpn_mask_graph(detection_boxes, mrcnn_feature_maps,
+ input_image_meta,
+ config.MASK_POOL_SIZE,
+ config.NUM_CLASSES,
+ train_bn=config.TRAIN_BN)
+
+ model = KM.Model([input_image, input_image_meta, input_anchors],
+ [detections, mrcnn_class, mrcnn_bbox,
+ mrcnn_mask, rpn_rois, rpn_class, rpn_bbox],
+ name='mask_rcnn')
+
+ # Add multi-GPU support.
+ if config.GPU_COUNT > 1:
+ from mrcnn.parallel_model import ParallelModel
+ model = ParallelModel(model, config.GPU_COUNT)
+
+ return model
+
+ def find_last(self):
+ """Finds the last checkpoint file of the last trained model in the
+ model directory.
+ Returns:
+ The path of the last checkpoint file
+ """
+ # Get directory names. Each directory corresponds to a model
+ dir_names = next(os.walk(self.model_dir))[1]
+ key = self.config.NAME.lower()
+ dir_names = filter(lambda f: f.startswith(key), dir_names)
+ dir_names = sorted(dir_names)
+ if not dir_names:
+ import errno
+ raise FileNotFoundError(
+ errno.ENOENT,
+ "Could not find model directory under {}".format(self.model_dir))
+ # Pick last directory
+ dir_name = os.path.join(self.model_dir, dir_names[-1])
+ # Find the last checkpoint
+ checkpoints = next(os.walk(dir_name))[2]
+ checkpoints = filter(lambda f: f.startswith("mask_rcnn"), checkpoints)
+ checkpoints = sorted(checkpoints)
+ if not checkpoints:
+ import errno
+ raise FileNotFoundError(
+ errno.ENOENT, "Could not find weight files in {}".format(dir_name))
+ checkpoint = os.path.join(dir_name, checkpoints[-1])
+ return checkpoint
+
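+    # Usage sketch (illustrative): find_last() above is commonly combined with
+    # load_weights() below to resume from the latest checkpoint, e.g.
+    #   model.load_weights(model.find_last(), by_name=True)
+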
+ def load_weights(self, filepath, by_name=False, exclude=None):
+ """Modified version of the corresponding Keras function with
+ the addition of multi-GPU support and the ability to exclude
+ some layers from loading.
+ exclude: list of layer names to exclude
+ """
+ import h5py
+ # Conditional import to support versions of Keras before 2.2
+ # TODO: remove in about 6 months (end of 2018)
+ try:
+ from keras.engine import saving
+ except ImportError:
+ # Keras before 2.2 used the 'topology' namespace.
+ from keras.engine import topology as saving
+
+ if exclude:
+ by_name = True
+
+ if h5py is None:
+ raise ImportError('`load_weights` requires h5py.')
+ f = h5py.File(filepath, mode='r')
+ if 'layer_names' not in f.attrs and 'model_weights' in f:
+ f = f['model_weights']
+
+ # In multi-GPU training, we wrap the model. Get layers
+ # of the inner model because they have the weights.
+ keras_model = self.keras_model
+ layers = keras_model.inner_model.layers if hasattr(keras_model, "inner_model")\
+ else keras_model.layers
+
+ # Exclude some layers
+ if exclude:
+ layers = filter(lambda l: l.name not in exclude, layers)
+
+ if by_name:
+ saving.load_weights_from_hdf5_group_by_name(f, layers)
+ else:
+ saving.load_weights_from_hdf5_group(f, layers)
+ if hasattr(f, 'close'):
+ f.close()
+
+ # Update the log directory
+ self.set_log_dir(filepath)
+
+ def get_imagenet_weights(self):
+ """Downloads ImageNet trained weights from Keras.
+ Returns path to weights file.
+ """
+ from keras.utils.data_utils import get_file
+ TF_WEIGHTS_PATH_NO_TOP = 'https://github.com/fchollet/deep-learning-models/'\
+ 'releases/download/v0.2/'\
+ 'resnet50_weights_tf_dim_ordering_tf_kernels_notop.h5'
+ weights_path = get_file('resnet50_weights_tf_dim_ordering_tf_kernels_notop.h5',
+ TF_WEIGHTS_PATH_NO_TOP,
+ cache_subdir='models',
+ md5_hash='a268eb855778b3df3c7506639542a6af')
+ return weights_path
+
+ def compile(self, learning_rate, momentum):
+ """Gets the model ready for training. Adds losses, regularization, and
+ metrics. Then calls the Keras compile() function.
+ """
+ # Optimizer object
+ optimizer = keras.optimizers.SGD(
+ lr=learning_rate, momentum=momentum,
+ clipnorm=self.config.GRADIENT_CLIP_NORM)
+ # Add Losses
+ # First, clear previously set losses to avoid duplication
+ self.keras_model._losses = []
+ self.keras_model._per_input_losses = {}
+ loss_names = [
+ "rpn_class_loss", "rpn_bbox_loss",
+ "mrcnn_class_loss", "mrcnn_bbox_loss", "mrcnn_mask_loss"]
+ for name in loss_names:
+ layer = self.keras_model.get_layer(name)
+ if layer.output in self.keras_model.losses:
+ continue
+ loss = (
+ tf.reduce_mean(layer.output, keepdims=True)
+ * self.config.LOSS_WEIGHTS.get(name, 1.))
+ self.keras_model.add_loss(loss)
+
+ # Add L2 Regularization
+ # Skip gamma and beta weights of batch normalization layers.
+ reg_losses = [
+ keras.regularizers.l2(self.config.WEIGHT_DECAY)(w) / tf.cast(tf.size(w), tf.float32)
+ for w in self.keras_model.trainable_weights
+ if 'gamma' not in w.name and 'beta' not in w.name]
+ self.keras_model.add_loss(tf.add_n(reg_losses))
+
+ # Compile
+ self.keras_model.compile(
+ optimizer=optimizer,
+ loss=[None] * len(self.keras_model.outputs))
+
+ # Add metrics for losses
+ for name in loss_names:
+ if name in self.keras_model.metrics_names:
+ continue
+ layer = self.keras_model.get_layer(name)
+ self.keras_model.metrics_names.append(name)
+ loss = (
+ tf.reduce_mean(layer.output, keepdims=True)
+ * self.config.LOSS_WEIGHTS.get(name, 1.))
+ self.keras_model.metrics_tensors.append(loss)
+
+ def set_trainable(self, layer_regex, keras_model=None, indent=0, verbose=1):
+ """Sets model layers as trainable if their names match
+ the given regular expression.
+ """
+ # Print message on the first call (but not on recursive calls)
+ if verbose > 0 and keras_model is None:
+ log("Selecting layers to train")
+
+ keras_model = keras_model or self.keras_model
+
+ # In multi-GPU training, we wrap the model. Get layers
+ # of the inner model because they have the weights.
+ layers = keras_model.inner_model.layers if hasattr(keras_model, "inner_model")\
+ else keras_model.layers
+
+ for layer in layers:
+ # Is the layer a model?
+ if layer.__class__.__name__ == 'Model':
+ print("In model: ", layer.name)
+ self.set_trainable(
+ layer_regex, keras_model=layer, indent=indent + 4)
+ continue
+
+ if not layer.weights:
+ continue
+ # Is it trainable?
+ trainable = bool(re.fullmatch(layer_regex, layer.name))
+ # Update layer. If layer is a container, update inner layer.
+ if layer.__class__.__name__ == 'TimeDistributed':
+ layer.layer.trainable = trainable
+ else:
+ layer.trainable = trainable
+ # Print trainable layer names
+ if trainable and verbose > 0:
+ log("{}{:20} ({})".format(" " * indent, layer.name,
+ layer.__class__.__name__))
+
+ def set_log_dir(self, model_path=None):
+ """Sets the model log directory and epoch counter.
+
+        model_path: If None, or in a format different from what this code uses,
+ then set a new log directory and start epochs from 0. Otherwise,
+ extract the log directory and the epoch counter from the file
+ name.
+ """
+ # Set date and epoch counter as if starting a new model
+ self.epoch = 0
+ now = datetime.datetime.now()
+
+ # If we have a model path with date and epochs use them
+ if model_path:
+            # Continue from where we left off. Get the epoch and date from the file name
+ # A sample model path might look like:
+ # \path\to\logs\coco20171029T2315\mask_rcnn_coco_0001.h5 (Windows)
+ # /path/to/logs/coco20171029T2315/mask_rcnn_coco_0001.h5 (Linux)
+ regex = r".*[/\\][\w-]+(\d{4})(\d{2})(\d{2})T(\d{2})(\d{2})[/\\]mask\_rcnn\_[\w-]+(\d{4})\.h5"
+ m = re.match(regex, model_path)
+ if m:
+ now = datetime.datetime(int(m.group(1)), int(m.group(2)), int(m.group(3)),
+ int(m.group(4)), int(m.group(5)))
+ # Epoch number in file is 1-based, and in Keras code it's 0-based.
+ # So, adjust for that then increment by one to start from the next epoch
+ self.epoch = int(m.group(6)) - 1 + 1
+ print('Re-starting from epoch %d' % self.epoch)
+
+ # Directory for training logs
+ self.log_dir = os.path.join(self.model_dir, "{}{:%Y%m%dT%H%M}".format(
+ self.config.NAME.lower(), now))
+
+ # Path to save after each epoch. Include placeholders that get filled by Keras.
+ self.checkpoint_path = os.path.join(self.log_dir, "mask_rcnn_{}_*epoch*.h5".format(
+ self.config.NAME.lower()))
+ self.checkpoint_path = self.checkpoint_path.replace(
+ "*epoch*", "{epoch:04d}")
+
+ def train(self, train_dataset, val_dataset, learning_rate, epochs, layers,
+ augmentation=None, custom_callbacks=None, no_augmentation_sources=None):
+ """Train the model.
+ train_dataset, val_dataset: Training and validation Dataset objects.
+ learning_rate: The learning rate to train with
+        epochs: Number of training epochs. Note that previous training epochs
+            are considered to be done already, so this actually determines
+            the epochs to train in total rather than in this particular
+            call.
+        layers: Allows selecting which layers to train. It can be:
+ - A regular expression to match layer names to train
+ - One of these predefined values:
+ heads: The RPN, classifier and mask heads of the network
+ all: All the layers
+ 3+: Train Resnet stage 3 and up
+ 4+: Train Resnet stage 4 and up
+ 5+: Train Resnet stage 5 and up
+ augmentation: Optional. An imgaug (https://github.com/aleju/imgaug)
+ augmentation. For example, passing imgaug.augmenters.Fliplr(0.5)
+            flips images right/left 50% of the time. You can pass complex
+            augmentations as well. For example, the augmentation below applies
+            50% of the time, and when it does it flips images right/left half
+            the time and adds a Gaussian blur with a random sigma in the range
+            0 to 5:
+
+ augmentation = imgaug.augmenters.Sometimes(0.5, [
+ imgaug.augmenters.Fliplr(0.5),
+ imgaug.augmenters.GaussianBlur(sigma=(0.0, 5.0))
+ ])
+ custom_callbacks: Optional. Add custom callbacks to be called
+            with the keras fit_generator method. Must be a list of
+            keras.callbacks.Callback instances.
+ no_augmentation_sources: Optional. List of sources to exclude for
+            augmentation. A source is a string that identifies a dataset and is
+ defined in the Dataset class.
+ """
+ assert self.mode == "training", "Create model in training mode."
+
+ # Pre-defined layer regular expressions
+ layer_regex = {
+ # all layers but the backbone
+ "heads": r"(mrcnn\_.*)|(rpn\_.*)|(fpn\_.*)",
+ # From a specific Resnet stage and up
+ "3+": r"(res3.*)|(bn3.*)|(res4.*)|(bn4.*)|(res5.*)|(bn5.*)|(mrcnn\_.*)|(rpn\_.*)|(fpn\_.*)",
+ "4+": r"(res4.*)|(bn4.*)|(res5.*)|(bn5.*)|(mrcnn\_.*)|(rpn\_.*)|(fpn\_.*)",
+ "5+": r"(res5.*)|(bn5.*)|(mrcnn\_.*)|(rpn\_.*)|(fpn\_.*)",
+ # All layers
+ "all": ".*",
+ }
+ if layers in layer_regex.keys():
+ layers = layer_regex[layers]
+
+ # Data generators
+ train_generator = data_generator(train_dataset, self.config, shuffle=True,
+ augmentation=augmentation,
+ batch_size=self.config.BATCH_SIZE,
+ no_augmentation_sources=no_augmentation_sources)
+ val_generator = data_generator(val_dataset, self.config, shuffle=True,
+ batch_size=self.config.BATCH_SIZE)
+
+ # Create log_dir if it does not exist
+ if not os.path.exists(self.log_dir):
+ os.makedirs(self.log_dir)
+
+ # Callbacks
+ callbacks = [
+ keras.callbacks.TensorBoard(log_dir=self.log_dir,
+ histogram_freq=0, write_graph=True, write_images=False),
+ keras.callbacks.ModelCheckpoint(self.checkpoint_path,
+ verbose=0, save_weights_only=True),
+ ]
+
+ # Add custom callbacks to the list
+ if custom_callbacks:
+ callbacks += custom_callbacks
+
+ # Train
+ log("\nStarting at epoch {}. LR={}\n".format(self.epoch, learning_rate))
+ log("Checkpoint Path: {}".format(self.checkpoint_path))
+ self.set_trainable(layers)
+ self.compile(learning_rate, self.config.LEARNING_MOMENTUM)
+
+ # Work-around for Windows: Keras fails on Windows when using
+ # multiprocessing workers. See discussion here:
+ # https://github.com/matterport/Mask_RCNN/issues/13#issuecomment-353124009
+        if os.name == 'nt':
+ workers = 0
+ else:
+ workers = multiprocessing.cpu_count()
+
+ self.keras_model.fit_generator(
+ train_generator,
+ initial_epoch=self.epoch,
+ epochs=epochs,
+ steps_per_epoch=self.config.STEPS_PER_EPOCH,
+ callbacks=callbacks,
+ validation_data=val_generator,
+ validation_steps=self.config.VALIDATION_STEPS,
+ max_queue_size=50,
+ workers=workers,
+ use_multiprocessing=True,
+ )
+ self.epoch = max(self.epoch, epochs)
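+
+    # Illustrative usage sketch (not part of the library; the dataset objects
+    # and config values here are assumptions for the example):
+    #   model.train(dataset_train, dataset_val,
+    #               learning_rate=config.LEARNING_RATE,
+    #               epochs=30, layers='heads')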
+
+ def mold_inputs(self, images):
+ """Takes a list of images and modifies them to the format expected
+ as an input to the neural network.
+ images: List of image matrices [height,width,depth]. Images can have
+ different sizes.
+
+ Returns 3 Numpy matrices:
+ molded_images: [N, h, w, 3]. Images resized and normalized.
+ image_metas: [N, length of meta data]. Details about each image.
+ windows: [N, (y1, x1, y2, x2)]. The portion of the image that has the
+ original image (padding excluded).
+ """
+ molded_images = []
+ image_metas = []
+ windows = []
+ for image in images:
+ # Resize image
+ # TODO: move resizing to mold_image()
+ molded_image, window, scale, padding, crop = utils.resize_image(
+ image,
+ min_dim=self.config.IMAGE_MIN_DIM,
+ min_scale=self.config.IMAGE_MIN_SCALE,
+ max_dim=self.config.IMAGE_MAX_DIM,
+ mode=self.config.IMAGE_RESIZE_MODE)
+ molded_image = mold_image(molded_image, self.config)
+ # Build image_meta
+ image_meta = compose_image_meta(
+ 0, image.shape, molded_image.shape, window, scale,
+ np.zeros([self.config.NUM_CLASSES], dtype=np.int32))
+ # Append
+ molded_images.append(molded_image)
+ windows.append(window)
+ image_metas.append(image_meta)
+ # Pack into arrays
+ molded_images = np.stack(molded_images)
+ image_metas = np.stack(image_metas)
+ windows = np.stack(windows)
+ return molded_images, image_metas, windows
+
+ def unmold_detections(self, detections, mrcnn_mask, original_image_shape,
+ image_shape, window):
+ """Reformats the detections of one image from the format of the neural
+ network output to a format suitable for use in the rest of the
+ application.
+
+ detections: [N, (y1, x1, y2, x2, class_id, score)] in normalized coordinates
+ mrcnn_mask: [N, height, width, num_classes]
+ original_image_shape: [H, W, C] Original image shape before resizing
+ image_shape: [H, W, C] Shape of the image after resizing and padding
+ window: [y1, x1, y2, x2] Pixel coordinates of box in the image where the real
+ image is excluding the padding.
+
+ Returns:
+ boxes: [N, (y1, x1, y2, x2)] Bounding boxes in pixels
+ class_ids: [N] Integer class IDs for each bounding box
+ scores: [N] Float probability scores of the class_id
+ masks: [height, width, num_instances] Instance masks
+ """
+ # How many detections do we have?
+ # Detections array is padded with zeros. Find the first class_id == 0.
+ zero_ix = np.where(detections[:, 4] == 0)[0]
+ N = zero_ix[0] if zero_ix.shape[0] > 0 else detections.shape[0]
+
+ # Extract boxes, class_ids, scores, and class-specific masks
+ boxes = detections[:N, :4]
+ class_ids = detections[:N, 4].astype(np.int32)
+ scores = detections[:N, 5]
+ masks = mrcnn_mask[np.arange(N), :, :, class_ids]
+
+ # Translate normalized coordinates in the resized image to pixel
+ # coordinates in the original image before resizing
+ window = utils.norm_boxes(window, image_shape[:2])
+ wy1, wx1, wy2, wx2 = window
+ shift = np.array([wy1, wx1, wy1, wx1])
+ wh = wy2 - wy1 # window height
+ ww = wx2 - wx1 # window width
+ scale = np.array([wh, ww, wh, ww])
+ # Convert boxes to normalized coordinates on the window
+ boxes = np.divide(boxes - shift, scale)
+ # Convert boxes to pixel coordinates on the original image
+ boxes = utils.denorm_boxes(boxes, original_image_shape[:2])
+
+ # Filter out detections with zero area. Happens in early training when
+ # network weights are still random
+ exclude_ix = np.where(
+ (boxes[:, 2] - boxes[:, 0]) * (boxes[:, 3] - boxes[:, 1]) <= 0)[0]
+ if exclude_ix.shape[0] > 0:
+ boxes = np.delete(boxes, exclude_ix, axis=0)
+ class_ids = np.delete(class_ids, exclude_ix, axis=0)
+ scores = np.delete(scores, exclude_ix, axis=0)
+ masks = np.delete(masks, exclude_ix, axis=0)
+ N = class_ids.shape[0]
+
+ # Resize masks to original image size and set boundary threshold.
+ full_masks = []
+ for i in range(N):
+ # Convert neural network mask to full size mask
+ full_mask = utils.unmold_mask(masks[i], boxes[i], original_image_shape)
+ full_masks.append(full_mask)
+ full_masks = np.stack(full_masks, axis=-1)\
+ if full_masks else np.empty(original_image_shape[:2] + (0,))
+
+ return boxes, class_ids, scores, full_masks
+
+ def detect(self, images, verbose=0):
+ """Runs the detection pipeline.
+
+ images: List of images, potentially of different sizes.
+
+ Returns a list of dicts, one dict per image. The dict contains:
+ rois: [N, (y1, x1, y2, x2)] detection bounding boxes
+ class_ids: [N] int class IDs
+ scores: [N] float probability scores for the class IDs
+ masks: [H, W, N] instance binary masks
+ """
+ assert self.mode == "inference", "Create model in inference mode."
+ assert len(
+ images) == self.config.BATCH_SIZE, "len(images) must be equal to BATCH_SIZE"
+
+ if verbose:
+ log("Processing {} images".format(len(images)))
+ for image in images:
+ log("image", image)
+
+ # Mold inputs to format expected by the neural network
+ molded_images, image_metas, windows = self.mold_inputs(images)
+
+ # Validate image sizes
+ # All images in a batch MUST be of the same size
+ image_shape = molded_images[0].shape
+ for g in molded_images[1:]:
+ assert g.shape == image_shape,\
+ "After resizing, all images must have the same size. Check IMAGE_RESIZE_MODE and image sizes."
+
+ # Anchors
+ anchors = self.get_anchors(image_shape)
+ # Duplicate across the batch dimension because Keras requires it
+ # TODO: can this be optimized to avoid duplicating the anchors?
+ anchors = np.broadcast_to(anchors, (self.config.BATCH_SIZE,) + anchors.shape)
+
+ if verbose:
+ log("molded_images", molded_images)
+ log("image_metas", image_metas)
+ log("anchors", anchors)
+ # Run object detection
+ detections, _, _, mrcnn_mask, _, _, _ =\
+ self.keras_model.predict([molded_images, image_metas, anchors], verbose=0)
+ # Process detections
+ results = []
+ for i, image in enumerate(images):
+ final_rois, final_class_ids, final_scores, final_masks =\
+ self.unmold_detections(detections[i], mrcnn_mask[i],
+ image.shape, molded_images[i].shape,
+ windows[i])
+ results.append({
+ "rois": final_rois,
+ "class_ids": final_class_ids,
+ "scores": final_scores,
+ "masks": final_masks,
+ })
+ return results
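+
+    # Illustrative usage sketch (not part of the library; assumes an
+    # inference-mode model with weights loaded and config.BATCH_SIZE == 1):
+    #   image = skimage.io.imread("path/to/image.jpg")
+    #   r = model.detect([image], verbose=1)[0]
+    #   # r["rois"], r["class_ids"], r["scores"], r["masks"]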
+
+ def detect_molded(self, molded_images, image_metas, verbose=0):
+ """Runs the detection pipeline, but expect inputs that are
+ molded already. Used mostly for debugging and inspecting
+ the model.
+
+ molded_images: List of images loaded using load_image_gt()
+ image_metas: image meta data, also returned by load_image_gt()
+
+ Returns a list of dicts, one dict per image. The dict contains:
+ rois: [N, (y1, x1, y2, x2)] detection bounding boxes
+ class_ids: [N] int class IDs
+ scores: [N] float probability scores for the class IDs
+ masks: [H, W, N] instance binary masks
+ """
+ assert self.mode == "inference", "Create model in inference mode."
+ assert len(molded_images) == self.config.BATCH_SIZE,\
+ "Number of images must be equal to BATCH_SIZE"
+
+ if verbose:
+ log("Processing {} images".format(len(molded_images)))
+ for image in molded_images:
+ log("image", image)
+
+ # Validate image sizes
+ # All images in a batch MUST be of the same size
+ image_shape = molded_images[0].shape
+ for g in molded_images[1:]:
+ assert g.shape == image_shape, "Images must have the same size"
+
+ # Anchors
+ anchors = self.get_anchors(image_shape)
+ # Duplicate across the batch dimension because Keras requires it
+ # TODO: can this be optimized to avoid duplicating the anchors?
+ anchors = np.broadcast_to(anchors, (self.config.BATCH_SIZE,) + anchors.shape)
+
+ if verbose:
+ log("molded_images", molded_images)
+ log("image_metas", image_metas)
+ log("anchors", anchors)
+ # Run object detection
+ detections, _, _, mrcnn_mask, _, _, _ =\
+ self.keras_model.predict([molded_images, image_metas, anchors], verbose=0)
+ # Process detections
+ results = []
+ for i, image in enumerate(molded_images):
+ window = [0, 0, image.shape[0], image.shape[1]]
+ final_rois, final_class_ids, final_scores, final_masks =\
+ self.unmold_detections(detections[i], mrcnn_mask[i],
+ image.shape, molded_images[i].shape,
+ window)
+ results.append({
+ "rois": final_rois,
+ "class_ids": final_class_ids,
+ "scores": final_scores,
+ "masks": final_masks,
+ })
+ return results
+
+ def get_anchors(self, image_shape):
+ """Returns anchor pyramid for the given image size."""
+ backbone_shapes = compute_backbone_shapes(self.config, image_shape)
+ # Cache anchors and reuse if image shape is the same
+ if not hasattr(self, "_anchor_cache"):
+ self._anchor_cache = {}
+ if not tuple(image_shape) in self._anchor_cache:
+ # Generate Anchors
+ a = utils.generate_pyramid_anchors(
+ self.config.RPN_ANCHOR_SCALES,
+ self.config.RPN_ANCHOR_RATIOS,
+ backbone_shapes,
+ self.config.BACKBONE_STRIDES,
+ self.config.RPN_ANCHOR_STRIDE)
+ # Keep a copy of the latest anchors in pixel coordinates because
+ # it's used in inspect_model notebooks.
+ # TODO: Remove this after the notebook are refactored to not use it
+ self.anchors = a
+ # Normalize coordinates
+ self._anchor_cache[tuple(image_shape)] = utils.norm_boxes(a, image_shape[:2])
+ return self._anchor_cache[tuple(image_shape)]
+
+ def ancestor(self, tensor, name, checked=None):
+ """Finds the ancestor of a TF tensor in the computation graph.
+ tensor: TensorFlow symbolic tensor.
+ name: Name of ancestor tensor to find
+ checked: For internal use. A list of tensors that were already
+ searched to avoid loops in traversing the graph.
+ """
+ checked = checked if checked is not None else []
+ # Put a limit on how deep we go to avoid very long loops
+ if len(checked) > 500:
+ return None
+ # Convert name to a regex and allow matching a number prefix
+ # because Keras adds them automatically
+ if isinstance(name, str):
+ name = re.compile(name.replace("/", r"(\_\d+)*/"))
+
+ parents = tensor.op.inputs
+ for p in parents:
+ if p in checked:
+ continue
+ if bool(re.fullmatch(name, p.name)):
+ return p
+ checked.append(p)
+ a = self.ancestor(p, name, checked)
+ if a is not None:
+ return a
+ return None
+
+ def find_trainable_layer(self, layer):
+ """If a layer is encapsulated by another layer, this function
+ digs through the encapsulation and returns the layer that holds
+ the weights.
+ """
+ if layer.__class__.__name__ == 'TimeDistributed':
+ return self.find_trainable_layer(layer.layer)
+ return layer
+
+ def get_trainable_layers(self):
+ """Returns a list of layers that have weights."""
+ layers = []
+ # Loop through all layers
+ for l in self.keras_model.layers:
+ # If layer is a wrapper, find inner trainable layer
+ l = self.find_trainable_layer(l)
+ # Include layer if it has weights
+ if l.get_weights():
+ layers.append(l)
+ return layers
+
+ def run_graph(self, images, outputs, image_metas=None):
+ """Runs a sub-set of the computation graph that computes the given
+ outputs.
+
+ image_metas: If provided, the images are assumed to be already
+ molded (i.e. resized, padded, and normalized)
+
+ outputs: List of tuples (name, tensor) to compute. The tensors are
+ symbolic TensorFlow tensors and the names are for easy tracking.
+
+ Returns an ordered dict of results. Keys are the names received in the
+ input and values are Numpy arrays.
+ """
+ model = self.keras_model
+
+ # Organize desired outputs into an ordered dict
+ outputs = OrderedDict(outputs)
+ for o in outputs.values():
+ assert o is not None
+
+ # Build a Keras function to run parts of the computation graph
+ inputs = model.inputs
+ if model.uses_learning_phase and not isinstance(K.learning_phase(), int):
+ inputs += [K.learning_phase()]
+ kf = K.function(model.inputs, list(outputs.values()))
+
+ # Prepare inputs
+ if image_metas is None:
+ molded_images, image_metas, _ = self.mold_inputs(images)
+ else:
+ molded_images = images
+ image_shape = molded_images[0].shape
+ # Anchors
+ anchors = self.get_anchors(image_shape)
+ # Duplicate across the batch dimension because Keras requires it
+ # TODO: can this be optimized to avoid duplicating the anchors?
+ anchors = np.broadcast_to(anchors, (self.config.BATCH_SIZE,) + anchors.shape)
+ model_in = [molded_images, image_metas, anchors]
+
+ # Run inference
+ if model.uses_learning_phase and not isinstance(K.learning_phase(), int):
+ model_in.append(0.)
+ outputs_np = kf(model_in)
+
+        # Pack the generated Numpy arrays into a dict and log the results.
+ outputs_np = OrderedDict([(k, v)
+ for k, v in zip(outputs.keys(), outputs_np)])
+ for k, v in outputs_np.items():
+ log(k, v)
+ return outputs_np
+
+
+############################################################
+# Data Formatting
+############################################################
+
+def compose_image_meta(image_id, original_image_shape, image_shape,
+ window, scale, active_class_ids):
+ """Takes attributes of an image and puts them in one 1D array.
+
+ image_id: An int ID of the image. Useful for debugging.
+ original_image_shape: [H, W, C] before resizing or padding.
+ image_shape: [H, W, C] after resizing and padding
+ window: (y1, x1, y2, x2) in pixels. The area of the image where the real
+ image is (excluding the padding)
+ scale: The scaling factor applied to the original image (float32)
+ active_class_ids: List of class_ids available in the dataset from which
+ the image came. Useful if training on images from multiple datasets
+ where not all classes are present in all datasets.
+ """
+ meta = np.array(
+ [image_id] + # size=1
+ list(original_image_shape) + # size=3
+ list(image_shape) + # size=3
+        list(window) +                # size=4 (y1, x1, y2, x2) in image coordinates
+ [scale] + # size=1
+ list(active_class_ids) # size=num_classes
+ )
+ return meta
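+
+# Note: with the layout above, the meta vector has length 12 + NUM_CLASSES
+# (1 + 3 + 3 + 4 + 1 + NUM_CLASSES), which is the layout that parse_image_meta()
+# and parse_image_meta_graph() below rely on when slicing.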
+
+
+def parse_image_meta(meta):
+ """Parses an array that contains image attributes to its components.
+ See compose_image_meta() for more details.
+
+ meta: [batch, meta length] where meta length depends on NUM_CLASSES
+
+ Returns a dict of the parsed values.
+ """
+ image_id = meta[:, 0]
+ original_image_shape = meta[:, 1:4]
+ image_shape = meta[:, 4:7]
+    window = meta[:, 7:11]  # (y1, x1, y2, x2) window of the image in pixels
+ scale = meta[:, 11]
+ active_class_ids = meta[:, 12:]
+ return {
+ "image_id": image_id.astype(np.int32),
+ "original_image_shape": original_image_shape.astype(np.int32),
+ "image_shape": image_shape.astype(np.int32),
+ "window": window.astype(np.int32),
+ "scale": scale.astype(np.float32),
+ "active_class_ids": active_class_ids.astype(np.int32),
+ }
+
+
+def parse_image_meta_graph(meta):
+ """Parses a tensor that contains image attributes to its components.
+ See compose_image_meta() for more details.
+
+ meta: [batch, meta length] where meta length depends on NUM_CLASSES
+
+ Returns a dict of the parsed tensors.
+ """
+ image_id = meta[:, 0]
+ original_image_shape = meta[:, 1:4]
+ image_shape = meta[:, 4:7]
+    window = meta[:, 7:11]  # (y1, x1, y2, x2) window of the image in pixels
+ scale = meta[:, 11]
+ active_class_ids = meta[:, 12:]
+ return {
+ "image_id": image_id,
+ "original_image_shape": original_image_shape,
+ "image_shape": image_shape,
+ "window": window,
+ "scale": scale,
+ "active_class_ids": active_class_ids,
+ }
+
+
+def mold_image(images, config):
+ """Expects an RGB image (or array of images) and subtracts
+ the mean pixel and converts it to float. Expects image
+ colors in RGB order.
+ """
+ return images.astype(np.float32) - config.MEAN_PIXEL
+
+
+def unmold_image(normalized_images, config):
+ """Takes a image normalized with mold() and returns the original."""
+ return (normalized_images + config.MEAN_PIXEL).astype(np.uint8)
+
+
+############################################################
+#  Miscellaneous Graph Functions
+############################################################
+
+def trim_zeros_graph(boxes, name='trim_zeros'):
+ """Often boxes are represented with matrices of shape [N, 4] and
+ are padded with zeros. This removes zero boxes.
+
+    boxes: [N, 4] matrix of boxes.
+
+    Returns the trimmed boxes and non_zeros, a [N] 1D boolean mask
+    identifying the rows kept.
+ """
+ non_zeros = tf.cast(tf.reduce_sum(tf.abs(boxes), axis=1), tf.bool)
+ boxes = tf.boolean_mask(boxes, non_zeros, name=name)
+ return boxes, non_zeros
+
+
+def batch_pack_graph(x, counts, num_rows):
+ """Picks different number of values from each row
+ in x depending on the values in counts.
+ """
+ outputs = []
+ for i in range(num_rows):
+ outputs.append(x[i, :counts[i]])
+ return tf.concat(outputs, axis=0)
+
+
+def norm_boxes_graph(boxes, shape):
+ """Converts boxes from pixel coordinates to normalized coordinates.
+ boxes: [..., (y1, x1, y2, x2)] in pixel coordinates
+ shape: [..., (height, width)] in pixels
+
+ Note: In pixel coordinates (y2, x2) is outside the box. But in normalized
+ coordinates it's inside the box.
+
+ Returns:
+ [..., (y1, x1, y2, x2)] in normalized coordinates
+ """
+ h, w = tf.split(tf.cast(shape, tf.float32), 2)
+ scale = tf.concat([h, w, h, w], axis=-1) - tf.constant(1.0)
+ shift = tf.constant([0., 0., 1., 1.])
+ return tf.divide(boxes - shift, scale)
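+
+# Worked example (illustrative): for a 1024x1024 image, the pixel box
+# (0, 0, 1024, 1024) becomes ((0 - 0) / 1023, (0 - 0) / 1023,
+# (1024 - 1) / 1023, (1024 - 1) / 1023) = (0, 0, 1, 1), i.e. the full image
+# in normalized coordinates.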
+
+
+def denorm_boxes_graph(boxes, shape):
+ """Converts boxes from normalized coordinates to pixel coordinates.
+ boxes: [..., (y1, x1, y2, x2)] in normalized coordinates
+ shape: [..., (height, width)] in pixels
+
+ Note: In pixel coordinates (y2, x2) is outside the box. But in normalized
+ coordinates it's inside the box.
+
+ Returns:
+ [..., (y1, x1, y2, x2)] in pixel coordinates
+ """
+ h, w = tf.split(tf.cast(shape, tf.float32), 2)
+ scale = tf.concat([h, w, h, w], axis=-1) - tf.constant(1.0)
+ shift = tf.constant([0., 0., 1., 1.])
+ return tf.cast(tf.round(tf.multiply(boxes, scale) + shift), tf.int32)
diff --git a/mask_rcnn/mrcnn/parallel_model.py b/mask_rcnn/mrcnn/parallel_model.py
new file mode 100644
index 00000000..0a28fdf6
--- /dev/null
+++ b/mask_rcnn/mrcnn/parallel_model.py
@@ -0,0 +1,177 @@
+"""
+Mask R-CNN
+Multi-GPU Support for Keras.
+
+Copyright (c) 2017 Matterport, Inc.
+Licensed under the MIT License (see LICENSE for details)
+Written by Waleed Abdulla
+
+Ideas and small code snippets from these sources:
+https://github.com/fchollet/keras/issues/2436
+https://medium.com/@kuza55/transparent-multi-gpu-training-on-tensorflow-with-keras-8b0016fd9012
+https://github.com/avolkov1/keras_experiments/blob/master/keras_exp/multigpu/
+https://github.com/fchollet/keras/blob/master/keras/utils/training_utils.py
+"""
+import warnings
+warnings.filterwarnings('ignore', category=DeprecationWarning)
+warnings.filterwarnings('ignore', category=FutureWarning)
+import tensorflow as tf
+import keras.backend as K
+import keras.layers as KL
+import keras.models as KM
+
+
+class ParallelModel(KM.Model):
+ """Subclasses the standard Keras Model and adds multi-GPU support.
+ It works by creating a copy of the model on each GPU. Then it slices
+ the inputs and sends a slice to each copy of the model, and then
+ merges the outputs together and applies the loss on the combined
+ outputs.
+ """
+
+ def __init__(self, keras_model, gpu_count):
+ """Class constructor.
+ keras_model: The Keras model to parallelize
+ gpu_count: Number of GPUs. Must be > 1
+ """
+ self.inner_model = keras_model
+ self.gpu_count = gpu_count
+ merged_outputs = self.make_parallel()
+ super(ParallelModel, self).__init__(inputs=self.inner_model.inputs,
+ outputs=merged_outputs)
+
+ def __getattribute__(self, attrname):
+ """Redirect loading and saving methods to the inner model. That's where
+ the weights are stored."""
+ if 'load' in attrname or 'save' in attrname:
+ return getattr(self.inner_model, attrname)
+ return super(ParallelModel, self).__getattribute__(attrname)
+
+ def summary(self, *args, **kwargs):
+ """Override summary() to display summaries of both, the wrapper
+ and inner models."""
+ super(ParallelModel, self).summary(*args, **kwargs)
+ self.inner_model.summary(*args, **kwargs)
+
+ def make_parallel(self):
+ """Creates a new wrapper model that consists of multiple replicas of
+ the original model placed on different GPUs.
+ """
+ # Slice inputs. Slice inputs on the CPU to avoid sending a copy
+ # of the full inputs to all GPUs. Saves on bandwidth and memory.
+ input_slices = {name: tf.split(x, self.gpu_count)
+ for name, x in zip(self.inner_model.input_names,
+ self.inner_model.inputs)}
+
+ output_names = self.inner_model.output_names
+ outputs_all = []
+ for i in range(len(self.inner_model.outputs)):
+ outputs_all.append([])
+
+ # Run the model call() on each GPU to place the ops there
+ for i in range(self.gpu_count):
+ with tf.device('/gpu:%d' % i):
+ with tf.name_scope('tower_%d' % i):
+ # Run a slice of inputs through this replica
+ zipped_inputs = zip(self.inner_model.input_names,
+ self.inner_model.inputs)
+ inputs = [
+ KL.Lambda(lambda s: input_slices[name][i],
+ output_shape=lambda s: (None,) + s[1:])(tensor)
+ for name, tensor in zipped_inputs]
+ # Create the model replica and get the outputs
+ outputs = self.inner_model(inputs)
+ if not isinstance(outputs, list):
+ outputs = [outputs]
+ # Save the outputs for merging back together later
+ for l, o in enumerate(outputs):
+ outputs_all[l].append(o)
+
+ # Merge outputs on CPU
+ with tf.device('/cpu:0'):
+ merged = []
+ for outputs, name in zip(outputs_all, output_names):
+ # Concatenate or average outputs?
+ # Outputs usually have a batch dimension and we concatenate
+ # across it. If they don't, then the output is likely a loss
+ # or a metric value that gets averaged across the batch.
+ # Keras expects losses and metrics to be scalars.
+ if K.int_shape(outputs[0]) == ():
+ # Average
+ m = KL.Lambda(lambda o: tf.add_n(o) / len(outputs), name=name)(outputs)
+ else:
+ # Concatenate
+ m = KL.Concatenate(axis=0, name=name)(outputs)
+ merged.append(m)
+ return merged
+
+
+if __name__ == "__main__":
+ # Testing code below. It creates a simple model to train on MNIST and
+ # tries to run it on 2 GPUs. It saves the graph so it can be viewed
+ # in TensorBoard. Run it as:
+ #
+ # python3 parallel_model.py
+
+ import os
+ import numpy as np
+ import keras.optimizers
+ from keras.datasets import mnist
+ from keras.preprocessing.image import ImageDataGenerator
+
+ GPU_COUNT = 2
+
+ # Root directory of the project
+ ROOT_DIR = os.path.abspath("../")
+
+ # Directory to save logs and trained model
+ MODEL_DIR = os.path.join(ROOT_DIR, "logs")
+
+ def build_model(x_train, num_classes):
+ # Reset default graph. Keras leaves old ops in the graph,
+ # which are ignored for execution but clutter graph
+ # visualization in TensorBoard.
+ tf.reset_default_graph()
+
+ inputs = KL.Input(shape=x_train.shape[1:], name="input_image")
+ x = KL.Conv2D(32, (3, 3), activation='relu', padding="same",
+ name="conv1")(inputs)
+ x = KL.Conv2D(64, (3, 3), activation='relu', padding="same",
+ name="conv2")(x)
+ x = KL.MaxPooling2D(pool_size=(2, 2), name="pool1")(x)
+ x = KL.Flatten(name="flat1")(x)
+ x = KL.Dense(128, activation='relu', name="dense1")(x)
+ x = KL.Dense(num_classes, activation='softmax', name="dense2")(x)
+
+ return KM.Model(inputs, x, "digit_classifier_model")
+
+ # Load MNIST Data
+ (x_train, y_train), (x_test, y_test) = mnist.load_data()
+ x_train = np.expand_dims(x_train, -1).astype('float32') / 255
+ x_test = np.expand_dims(x_test, -1).astype('float32') / 255
+
+ print('x_train shape:', x_train.shape)
+ print('x_test shape:', x_test.shape)
+
+ # Build data generator and model
+ datagen = ImageDataGenerator()
+ model = build_model(x_train, 10)
+
+ # Add multi-GPU support.
+ model = ParallelModel(model, GPU_COUNT)
+
+ optimizer = keras.optimizers.SGD(lr=0.01, momentum=0.9, clipnorm=5.0)
+
+ model.compile(loss='sparse_categorical_crossentropy',
+ optimizer=optimizer, metrics=['accuracy'])
+
+ model.summary()
+
+ # Train
+ model.fit_generator(
+ datagen.flow(x_train, y_train, batch_size=64),
+ steps_per_epoch=50, epochs=10, verbose=1,
+ validation_data=(x_test, y_test),
+ callbacks=[keras.callbacks.TensorBoard(log_dir=MODEL_DIR,
+ write_graph=True)]
+ )
diff --git a/mask_rcnn/mrcnn/utils.py b/mask_rcnn/mrcnn/utils.py
new file mode 100644
index 00000000..e0da612a
--- /dev/null
+++ b/mask_rcnn/mrcnn/utils.py
@@ -0,0 +1,911 @@
+"""
+Mask R-CNN
+Common utility functions and classes.
+
+Copyright (c) 2017 Matterport, Inc.
+Licensed under the MIT License (see LICENSE for details)
+Written by Waleed Abdulla
+"""
+
+import sys
+import os
+import logging
+import math
+import random
+import numpy as np
+import warnings
+warnings.filterwarnings('ignore', category=DeprecationWarning)
+warnings.filterwarnings('ignore', category=FutureWarning)
+import tensorflow as tf
+import scipy
+import skimage.color
+import skimage.io
+import skimage.transform
+import urllib.request
+import shutil
+import warnings
+from distutils.version import LooseVersion
+
+# URL from which to download the latest COCO trained weights
+COCO_MODEL_URL = "https://github.com/matterport/Mask_RCNN/releases/download/v2.0/mask_rcnn_coco.h5"
+
+
+############################################################
+# Bounding Boxes
+############################################################
+
+def extract_bboxes(mask):
+ """Compute bounding boxes from masks.
+ mask: [height, width, num_instances]. Mask pixels are either 1 or 0.
+
+ Returns: bbox array [num_instances, (y1, x1, y2, x2)].
+ """
+ boxes = np.zeros([mask.shape[-1], 4], dtype=np.int32)
+ for i in range(mask.shape[-1]):
+ m = mask[:, :, i]
+ # Bounding box.
+        horizontal_indices = np.where(np.any(m, axis=0))[0]
+        vertical_indices = np.where(np.any(m, axis=1))[0]
+        if horizontal_indices.shape[0]:
+            x1, x2 = horizontal_indices[[0, -1]]
+            y1, y2 = vertical_indices[[0, -1]]
+ # x2 and y2 should not be part of the box. Increment by 1.
+ x2 += 1
+ y2 += 1
+ else:
+ # No mask for this instance. Might happen due to
+ # resizing or cropping. Set bbox to zeros
+ x1, x2, y1, y2 = 0, 0, 0, 0
+ boxes[i] = np.array([y1, x1, y2, x2])
+ return boxes.astype(np.int32)
+
+
+def compute_iou(box, boxes, box_area, boxes_area):
+ """Calculates IoU of the given box with the array of the given boxes.
+ box: 1D vector [y1, x1, y2, x2]
+ boxes: [boxes_count, (y1, x1, y2, x2)]
+ box_area: float. the area of 'box'
+ boxes_area: array of length boxes_count.
+
+ Note: the areas are passed in rather than calculated here for
+ efficiency. Calculate once in the caller to avoid duplicate work.
+ """
+ # Calculate intersection areas
+ y1 = np.maximum(box[0], boxes[:, 0])
+ y2 = np.minimum(box[2], boxes[:, 2])
+ x1 = np.maximum(box[1], boxes[:, 1])
+ x2 = np.minimum(box[3], boxes[:, 3])
+ intersection = np.maximum(x2 - x1, 0) * np.maximum(y2 - y1, 0)
+    union = box_area + boxes_area - intersection
+ iou = intersection / union
+ return iou
+
+
+def compute_overlaps(boxes1, boxes2):
+ """Computes IoU overlaps between two sets of boxes.
+ boxes1, boxes2: [N, (y1, x1, y2, x2)].
+
+ For better performance, pass the largest set first and the smaller second.
+ """
+ # Areas of anchors and GT boxes
+ area1 = (boxes1[:, 2] - boxes1[:, 0]) * (boxes1[:, 3] - boxes1[:, 1])
+ area2 = (boxes2[:, 2] - boxes2[:, 0]) * (boxes2[:, 3] - boxes2[:, 1])
+
+ # Compute overlaps to generate matrix [boxes1 count, boxes2 count]
+ # Each cell contains the IoU value.
+ overlaps = np.zeros((boxes1.shape[0], boxes2.shape[0]))
+ for i in range(overlaps.shape[1]):
+ box2 = boxes2[i]
+ overlaps[:, i] = compute_iou(box2, boxes1, area2[i], area1)
+ return overlaps
+
+
+def compute_overlaps_masks(masks1, masks2):
+ """Computes IoU overlaps between two sets of masks.
+ masks1, masks2: [Height, Width, instances]
+ """
+
+ # If either set of masks is empty return empty result
+ if masks1.shape[-1] == 0 or masks2.shape[-1] == 0:
+ return np.zeros((masks1.shape[-1], masks2.shape[-1]))
+ # flatten masks and compute their areas
+ masks1 = np.reshape(masks1 > .5, (-1, masks1.shape[-1])).astype(np.float32)
+ masks2 = np.reshape(masks2 > .5, (-1, masks2.shape[-1])).astype(np.float32)
+ area1 = np.sum(masks1, axis=0)
+ area2 = np.sum(masks2, axis=0)
+
+ # intersections and union
+ intersections = np.dot(masks1.T, masks2)
+ union = area1[:, None] + area2[None, :] - intersections
+ overlaps = intersections / union
+
+ return overlaps
+
+
+def non_max_suppression(boxes, scores, threshold):
+ """Performs non-maximum suppression and returns indices of kept boxes.
+    boxes: [N, (y1, x1, y2, x2)]. Notice that (y2, x2) lies outside the box.
+ scores: 1-D array of box scores.
+ threshold: Float. IoU threshold to use for filtering.
+ """
+ assert boxes.shape[0] > 0
+ if boxes.dtype.kind != "f":
+ boxes = boxes.astype(np.float32)
+
+ # Compute box areas
+ y1 = boxes[:, 0]
+ x1 = boxes[:, 1]
+ y2 = boxes[:, 2]
+ x2 = boxes[:, 3]
+ area = (y2 - y1) * (x2 - x1)
+
+    # Get indices of boxes sorted by scores (highest first)
+ ixs = scores.argsort()[::-1]
+
+ pick = []
+ while len(ixs) > 0:
+ # Pick top box and add its index to the list
+ i = ixs[0]
+ pick.append(i)
+ # Compute IoU of the picked box with the rest
+ iou = compute_iou(boxes[i], boxes[ixs[1:]], area[i], area[ixs[1:]])
+ # Identify boxes with IoU over the threshold. This
+ # returns indices into ixs[1:], so add 1 to get
+ # indices into ixs.
+ remove_ixs = np.where(iou > threshold)[0] + 1
+ # Remove indices of the picked and overlapped boxes.
+ ixs = np.delete(ixs, remove_ixs)
+ ixs = np.delete(ixs, 0)
+ return np.array(pick, dtype=np.int32)
+
+
+def apply_box_deltas(boxes, deltas):
+ """Applies the given deltas to the given boxes.
+ boxes: [N, (y1, x1, y2, x2)]. Note that (y2, x2) is outside the box.
+ deltas: [N, (dy, dx, log(dh), log(dw))]
+ """
+ boxes = boxes.astype(np.float32)
+ # Convert to y, x, h, w
+ height = boxes[:, 2] - boxes[:, 0]
+ width = boxes[:, 3] - boxes[:, 1]
+ center_y = boxes[:, 0] + 0.5 * height
+ center_x = boxes[:, 1] + 0.5 * width
+ # Apply deltas
+ center_y += deltas[:, 0] * height
+ center_x += deltas[:, 1] * width
+ height *= np.exp(deltas[:, 2])
+ width *= np.exp(deltas[:, 3])
+ # Convert back to y1, x1, y2, x2
+ y1 = center_y - 0.5 * height
+ x1 = center_x - 0.5 * width
+ y2 = y1 + height
+ x2 = x1 + width
+ return np.stack([y1, x1, y2, x2], axis=1)
+
+
+def box_refinement_graph(box, gt_box):
+ """Compute refinement needed to transform box to gt_box.
+ box and gt_box are [N, (y1, x1, y2, x2)]
+ """
+ box = tf.cast(box, tf.float32)
+ gt_box = tf.cast(gt_box, tf.float32)
+
+ height = box[:, 2] - box[:, 0]
+ width = box[:, 3] - box[:, 1]
+ center_y = box[:, 0] + 0.5 * height
+ center_x = box[:, 1] + 0.5 * width
+
+ gt_height = gt_box[:, 2] - gt_box[:, 0]
+ gt_width = gt_box[:, 3] - gt_box[:, 1]
+ gt_center_y = gt_box[:, 0] + 0.5 * gt_height
+ gt_center_x = gt_box[:, 1] + 0.5 * gt_width
+
+ dy = (gt_center_y - center_y) / height
+ dx = (gt_center_x - center_x) / width
+ dh = tf.log(gt_height / height)
+ dw = tf.log(gt_width / width)
+
+ result = tf.stack([dy, dx, dh, dw], axis=1)
+ return result
+
+
+def box_refinement(box, gt_box):
+ """Compute refinement needed to transform box to gt_box.
+ box and gt_box are [N, (y1, x1, y2, x2)]. (y2, x2) is
+ assumed to be outside the box.
+ """
+ box = box.astype(np.float32)
+ gt_box = gt_box.astype(np.float32)
+
+ height = box[:, 2] - box[:, 0]
+ width = box[:, 3] - box[:, 1]
+ center_y = box[:, 0] + 0.5 * height
+ center_x = box[:, 1] + 0.5 * width
+
+ gt_height = gt_box[:, 2] - gt_box[:, 0]
+ gt_width = gt_box[:, 3] - gt_box[:, 1]
+ gt_center_y = gt_box[:, 0] + 0.5 * gt_height
+ gt_center_x = gt_box[:, 1] + 0.5 * gt_width
+
+ dy = (gt_center_y - center_y) / height
+ dx = (gt_center_x - center_x) / width
+ dh = np.log(gt_height / height)
+ dw = np.log(gt_width / width)
+
+ return np.stack([dy, dx, dh, dw], axis=1)
+
+
+############################################################
+# Dataset
+############################################################
+
+class Dataset(object):
+ """The base class for dataset classes.
+ To use it, create a new class that adds functions specific to the dataset
+ you want to use. For example:
+
+ class CatsAndDogsDataset(Dataset):
+ def load_cats_and_dogs(self):
+ ...
+ def load_mask(self, image_id):
+ ...
+ def image_reference(self, image_id):
+ ...
+
+ See COCODataset and ShapesDataset as examples.
+ """
+
+ def __init__(self, class_map=None):
+ self._image_ids = []
+ self.image_info = []
+ # Background is always the first class
+ self.class_info = [{"source": "", "id": 0, "name": "BG"}]
+ self.source_class_ids = {}
+
+ def add_class(self, source, class_id, class_name):
+ assert "." not in source, "Source name cannot contain a dot"
+ # Does the class exist already?
+ for info in self.class_info:
+ if info['source'] == source and info["id"] == class_id:
+ # source.class_id combination already available, skip
+ return
+ # Add the class
+ self.class_info.append({
+ "source": source,
+ "id": class_id,
+ "name": class_name,
+ })
+
+ def add_image(self, source, image_id, path, **kwargs):
+ image_info = {
+ "id": image_id,
+ "source": source,
+ "path": path,
+ }
+ image_info.update(kwargs)
+ self.image_info.append(image_info)
+
+ def image_reference(self, image_id):
+ """Return a link to the image in its source Website or details about
+ the image that help looking it up or debugging it.
+
+ Override for your dataset, but pass to this function
+ if you encounter images not in your dataset.
+ """
+ return ""
+
+ def prepare(self, class_map=None):
+ """Prepares the Dataset class for use.
+
+ TODO: class map is not supported yet. When done, it should handle mapping
+ classes from different datasets to the same class ID.
+ """
+
+ def clean_name(name):
+ """Returns a shorter version of object names for cleaner display."""
+ return ",".join(name.split(",")[:1])
+
+ # Build (or rebuild) everything else from the info dicts.
+ self.num_classes = len(self.class_info)
+ self.class_ids = np.arange(self.num_classes)
+ self.class_names = [clean_name(c["name"]) for c in self.class_info]
+ self.num_images = len(self.image_info)
+ self._image_ids = np.arange(self.num_images)
+
+ # Mapping from source class and image IDs to internal IDs
+ self.class_from_source_map = {"{}.{}".format(info['source'], info['id']): id
+ for info, id in zip(self.class_info, self.class_ids)}
+ self.image_from_source_map = {"{}.{}".format(info['source'], info['id']): id
+ for info, id in zip(self.image_info, self.image_ids)}
+
+ # Map sources to class_ids they support
+ self.sources = list(set([i['source'] for i in self.class_info]))
+ self.source_class_ids = {}
+ # Loop over datasets
+ for source in self.sources:
+ self.source_class_ids[source] = []
+ # Find classes that belong to this dataset
+ for i, info in enumerate(self.class_info):
+ # Include BG class in all datasets
+ if i == 0 or source == info['source']:
+ self.source_class_ids[source].append(i)
+
+ def map_source_class_id(self, source_class_id):
+ """Takes a source class ID and returns the int class ID assigned to it.
+
+ For example:
+ dataset.map_source_class_id("coco.12") -> 23
+ """
+ return self.class_from_source_map[source_class_id]
+
+ def get_source_class_id(self, class_id, source):
+ """Map an internal class ID to the corresponding class ID in the source dataset."""
+ info = self.class_info[class_id]
+ assert info['source'] == source
+ return info['id']
+
+ @property
+ def image_ids(self):
+ return self._image_ids
+
+ def source_image_link(self, image_id):
+ """Returns the path or URL to the image.
+ Override this to return a URL to the image if it's available online for easy
+ debugging.
+ """
+ return self.image_info[image_id]["path"]
+
+ def load_image(self, image_id):
+ """Load the specified image and return a [H,W,3] Numpy array.
+ """
+ # Load image
+ image = skimage.io.imread(self.image_info[image_id]['path'])
+ # If grayscale. Convert to RGB for consistency.
+ if image.ndim != 3:
+ image = skimage.color.gray2rgb(image)
+ # If has an alpha channel, remove it for consistency
+ if image.shape[-1] == 4:
+ image = image[..., :3]
+ return image
+
+ def load_mask(self, image_id):
+ """Load instance masks for the given image.
+
+ Different datasets use different ways to store masks. Override this
+        method to load instance masks and return them in the form of an
+ array of binary masks of shape [height, width, instances].
+
+ Returns:
+ masks: A bool array of shape [height, width, instance count] with
+ a binary mask per instance.
+ class_ids: a 1D array of class IDs of the instance masks.
+ """
+ # Override this function to load a mask from your dataset.
+ # Otherwise, it returns an empty mask.
+ logging.warning("You are using the default load_mask(), maybe you need to define your own one.")
+ mask = np.empty([0, 0, 0])
+ class_ids = np.empty([0], np.int32)
+ return mask, class_ids
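+
+    # Illustrative usage sketch (not part of the library; CatsAndDogsDataset is
+    # the hypothetical subclass from the class docstring above):
+    #   dataset = CatsAndDogsDataset()
+    #   dataset.load_cats_and_dogs(...)
+    #   dataset.prepare()
+    #   image = dataset.load_image(dataset.image_ids[0])
+    #   mask, class_ids = dataset.load_mask(dataset.image_ids[0])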
+
+
+def resize_image(image, min_dim=None, max_dim=None, min_scale=None, mode="square"):
+ """Resizes an image keeping the aspect ratio unchanged.
+
+    min_dim: if provided, resizes the image such that its smaller
+ dimension == min_dim
+ max_dim: if provided, ensures that the image longest side doesn't
+ exceed this value.
+ min_scale: if provided, ensure that the image is scaled up by at least
+ this percent even if min_dim doesn't require it.
+ mode: Resizing mode.
+ none: No resizing. Return the image unchanged.
+ square: Resize and pad with zeros to get a square image
+ of size [max_dim, max_dim].
+ pad64: Pads width and height with zeros to make them multiples of 64.
+ If min_dim or min_scale are provided, it scales the image up
+ before padding. max_dim is ignored in this mode.
+ The multiple of 64 is needed to ensure smooth scaling of feature
+ maps up and down the 6 levels of the FPN pyramid (2**6=64).
+ crop: Picks random crops from the image. First, scales the image based
+ on min_dim and min_scale, then picks a random crop of
+ size min_dim x min_dim. Can be used in training only.
+ max_dim is not used in this mode.
+
+ Returns:
+ image: the resized image
+ window: (y1, x1, y2, x2). If max_dim is provided, padding might
+ be inserted in the returned image. If so, this window is the
+ coordinates of the image part of the full image (excluding
+ the padding). The x2, y2 pixels are not included.
+ scale: The scale factor used to resize the image
+ padding: Padding added to the image [(top, bottom), (left, right), (0, 0)]
+ """
+ # Keep track of image dtype and return results in the same dtype
+ image_dtype = image.dtype
+ # Default window (y1, x1, y2, x2) and default scale == 1.
+ h, w = image.shape[:2]
+ window = (0, 0, h, w)
+ scale = 1
+ padding = [(0, 0), (0, 0), (0, 0)]
+ crop = None
+
+ if mode == "none":
+ return image, window, scale, padding, crop
+
+ # Scale?
+ if min_dim:
+ # Scale up but not down
+ scale = max(1, min_dim / min(h, w))
+ if min_scale and scale < min_scale:
+ scale = min_scale
+
+ # Does it exceed max dim?
+ if max_dim and mode == "square":
+ image_max = max(h, w)
+ if round(image_max * scale) > max_dim:
+ scale = max_dim / image_max
+
+ # Resize image using bilinear interpolation
+ if scale != 1:
+ image = resize(image, (round(h * scale), round(w * scale)),
+ preserve_range=True)
+
+ # Need padding or cropping?
+ if mode == "square":
+ # Get new height and width
+ h, w = image.shape[:2]
+ top_pad = (max_dim - h) // 2
+ bottom_pad = max_dim - h - top_pad
+ left_pad = (max_dim - w) // 2
+ right_pad = max_dim - w - left_pad
+ padding = [(top_pad, bottom_pad), (left_pad, right_pad), (0, 0)]
+ image = np.pad(image, padding, mode='constant', constant_values=0)
+ window = (top_pad, left_pad, h + top_pad, w + left_pad)
+ elif mode == "pad64":
+ h, w = image.shape[:2]
+ # Both sides must be divisible by 64
+ assert min_dim % 64 == 0, "Minimum dimension must be a multiple of 64"
+ # Height
+ if h % 64 > 0:
+ max_h = h - (h % 64) + 64
+ top_pad = (max_h - h) // 2
+ bottom_pad = max_h - h - top_pad
+ else:
+ top_pad = bottom_pad = 0
+ # Width
+ if w % 64 > 0:
+ max_w = w - (w % 64) + 64
+ left_pad = (max_w - w) // 2
+ right_pad = max_w - w - left_pad
+ else:
+ left_pad = right_pad = 0
+ padding = [(top_pad, bottom_pad), (left_pad, right_pad), (0, 0)]
+ image = np.pad(image, padding, mode='constant', constant_values=0)
+ window = (top_pad, left_pad, h + top_pad, w + left_pad)
+ elif mode == "crop":
+ # Pick a random crop
+ h, w = image.shape[:2]
+ y = random.randint(0, (h - min_dim))
+ x = random.randint(0, (w - min_dim))
+ crop = (y, x, min_dim, min_dim)
+ image = image[y:y + min_dim, x:x + min_dim]
+ window = (0, 0, min_dim, min_dim)
+ else:
+ raise Exception("Mode {} not supported".format(mode))
+ return image.astype(image_dtype), window, scale, padding, crop
+
+
+def resize_mask(mask, scale, padding, crop=None):
+ """Resizes a mask using the given scale and padding.
+ Typically, you get the scale and padding from resize_image() to
+    ensure that both the image and the mask are resized consistently.
+
+ scale: mask scaling factor
+ padding: Padding to add to the mask in the form
+ [(top, bottom), (left, right), (0, 0)]
+ """
+ # Suppress warning from scipy 0.13.0, the output shape of zoom() is
+ # calculated with round() instead of int()
+ with warnings.catch_warnings():
+ warnings.simplefilter("ignore")
+ mask = scipy.ndimage.zoom(mask, zoom=[scale, scale, 1], order=0)
+ if crop is not None:
+ y, x, h, w = crop
+ mask = mask[y:y + h, x:x + w]
+ else:
+ mask = np.pad(mask, padding, mode='constant', constant_values=0)
+ return mask
+
+
+def minimize_mask(bbox, mask, mini_shape):
+ """Resize masks to a smaller version to reduce memory load.
+ Mini-masks can be resized back to image scale using expand_masks()
+
+ See inspect_data.ipynb notebook for more details.
+ """
+ mini_mask = np.zeros(mini_shape + (mask.shape[-1],), dtype=bool)
+ for i in range(mask.shape[-1]):
+ # Pick slice and cast to bool in case load_mask() returned wrong dtype
+ m = mask[:, :, i].astype(bool)
+ y1, x1, y2, x2 = bbox[i][:4]
+ m = m[y1:y2, x1:x2]
+ if m.size == 0:
+ raise Exception("Invalid bounding box with area of zero")
+ # Resize with bilinear interpolation
+ m = resize(m, mini_shape)
+        mini_mask[:, :, i] = np.around(m).astype(bool)
+ return mini_mask
+
+
+def expand_mask(bbox, mini_mask, image_shape):
+ """Resizes mini masks back to image size. Reverses the change
+ of minimize_mask().
+
+ See inspect_data.ipynb notebook for more details.
+ """
+ mask = np.zeros(image_shape[:2] + (mini_mask.shape[-1],), dtype=bool)
+ for i in range(mask.shape[-1]):
+ m = mini_mask[:, :, i]
+ y1, x1, y2, x2 = bbox[i][:4]
+ h = y2 - y1
+ w = x2 - x1
+ # Resize with bilinear interpolation
+ m = resize(m, (h, w))
+        mask[y1:y2, x1:x2, i] = np.around(m).astype(bool)
+ return mask
+
+
+# TODO: Build and use this function to reduce code duplication
+def mold_mask(mask, config):
+ pass
+
+
+def unmold_mask(mask, bbox, image_shape):
+ """Converts a mask generated by the neural network to a format similar
+ to its original shape.
+ mask: [height, width] of type float. A small, typically 28x28 mask.
+ bbox: [y1, x1, y2, x2]. The box to fit the mask in.
+
+ Returns a binary mask with the same size as the original image.
+ """
+ threshold = 0.5
+ y1, x1, y2, x2 = bbox
+ mask = resize(mask, (y2 - y1, x2 - x1))
+    mask = np.where(mask >= threshold, 1, 0).astype(bool)
+
+ # Put the mask in the right location.
+    full_mask = np.zeros(image_shape[:2], dtype=bool)
+ full_mask[y1:y2, x1:x2] = mask
+ return full_mask
+
+
+############################################################
+# Anchors
+############################################################
+
+def generate_anchors(scales, ratios, shape, feature_stride, anchor_stride):
+ """
+ scales: 1D array of anchor sizes in pixels. Example: [32, 64, 128]
+ ratios: 1D array of anchor ratios of width/height. Example: [0.5, 1, 2]
+ shape: [height, width] spatial shape of the feature map over which
+ to generate anchors.
+ feature_stride: Stride of the feature map relative to the image in pixels.
+ anchor_stride: Stride of anchors on the feature map. For example, if the
+ value is 2 then generate anchors for every other feature map pixel.
+ """
+ # Get all combinations of scales and ratios
+ scales, ratios = np.meshgrid(np.array(scales), np.array(ratios))
+ scales = scales.flatten()
+ ratios = ratios.flatten()
+
+ # Enumerate heights and widths from scales and ratios
+ heights = scales / np.sqrt(ratios)
+ widths = scales * np.sqrt(ratios)
+
+ # Enumerate shifts in feature space
+ shifts_y = np.arange(0, shape[0], anchor_stride) * feature_stride
+ shifts_x = np.arange(0, shape[1], anchor_stride) * feature_stride
+ shifts_x, shifts_y = np.meshgrid(shifts_x, shifts_y)
+
+ # Enumerate combinations of shifts, widths, and heights
+ box_widths, box_centers_x = np.meshgrid(widths, shifts_x)
+ box_heights, box_centers_y = np.meshgrid(heights, shifts_y)
+
+ # Reshape to get a list of (y, x) and a list of (h, w)
+ box_centers = np.stack(
+ [box_centers_y, box_centers_x], axis=2).reshape([-1, 2])
+ box_sizes = np.stack([box_heights, box_widths], axis=2).reshape([-1, 2])
+
+ # Convert to corner coordinates (y1, x1, y2, x2)
+ boxes = np.concatenate([box_centers - 0.5 * box_sizes,
+ box_centers + 0.5 * box_sizes], axis=1)
+ return boxes
+
+
+def generate_pyramid_anchors(scales, ratios, feature_shapes, feature_strides,
+ anchor_stride):
+ """Generate anchors at different levels of a feature pyramid. Each scale
+ is associated with a level of the pyramid, but each ratio is used in
+ all levels of the pyramid.
+
+ Returns:
+ anchors: [N, (y1, x1, y2, x2)]. All generated anchors in one array. Sorted
+ with the same order of the given scales. So, anchors of scale[0] come
+ first, then anchors of scale[1], and so on.
+ """
+ # Anchors
+ # [anchor_count, (y1, x1, y2, x2)]
+ anchors = []
+ for i in range(len(scales)):
+ anchors.append(generate_anchors(scales[i], ratios, feature_shapes[i],
+ feature_strides[i], anchor_stride))
+ return np.concatenate(anchors, axis=0)
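+
+# Note: each pyramid level contributes roughly
+# ceil(feature_h / anchor_stride) * ceil(feature_w / anchor_stride) * len(ratios)
+# anchors, since every level uses a single scale combined with all ratios.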
+
+
+############################################################
+# Miscellaneous
+############################################################
+
+def trim_zeros(x):
+ """It's common to have tensors larger than the available data and
+ pad with zeros. This function removes rows that are all zeros.
+
+ x: [rows, columns].
+ """
+ assert len(x.shape) == 2
+ return x[~np.all(x == 0, axis=1)]
+
+
+def compute_matches(gt_boxes, gt_class_ids, gt_masks,
+ pred_boxes, pred_class_ids, pred_scores, pred_masks,
+ iou_threshold=0.5, score_threshold=0.0):
+ """Finds matches between prediction and ground truth instances.
+
+ Returns:
+ gt_match: 1-D array. For each GT box it has the index of the matched
+ predicted box.
+ pred_match: 1-D array. For each predicted box, it has the index of
+ the matched ground truth box.
+ overlaps: [pred_boxes, gt_boxes] IoU overlaps.
+ """
+ # Trim zero padding
+ # TODO: cleaner to do zero unpadding upstream
+ gt_boxes = trim_zeros(gt_boxes)
+ gt_masks = gt_masks[..., :gt_boxes.shape[0]]
+ pred_boxes = trim_zeros(pred_boxes)
+ pred_scores = pred_scores[:pred_boxes.shape[0]]
+ # Sort predictions by score from high to low
+ indices = np.argsort(pred_scores)[::-1]
+ pred_boxes = pred_boxes[indices]
+ pred_class_ids = pred_class_ids[indices]
+ pred_scores = pred_scores[indices]
+ pred_masks = pred_masks[..., indices]
+
+ # Compute IoU overlaps [pred_masks, gt_masks]
+ overlaps = compute_overlaps_masks(pred_masks, gt_masks)
+
+ # Loop through predictions and find matching ground truth boxes
+ match_count = 0
+ pred_match = -1 * np.ones([pred_boxes.shape[0]])
+ gt_match = -1 * np.ones([gt_boxes.shape[0]])
+ for i in range(len(pred_boxes)):
+ # Find best matching ground truth box
+ # 1. Sort matches by score
+ sorted_ixs = np.argsort(overlaps[i])[::-1]
+ # 2. Remove low scores
+ low_score_idx = np.where(overlaps[i, sorted_ixs] < score_threshold)[0]
+ if low_score_idx.size > 0:
+ sorted_ixs = sorted_ixs[:low_score_idx[0]]
+ # 3. Find the match
+ for j in sorted_ixs:
+ # If ground truth box is already matched, go to next one
+ if gt_match[j] > -1:
+ continue
+ # If we reach IoU smaller than the threshold, end the loop
+ iou = overlaps[i, j]
+ if iou < iou_threshold:
+ break
+ # Do we have a match?
+ if pred_class_ids[i] == gt_class_ids[j]:
+ match_count += 1
+ gt_match[j] = i
+ pred_match[i] = j
+ break
+
+ return gt_match, pred_match, overlaps
+
+
+def compute_ap(gt_boxes, gt_class_ids, gt_masks,
+ pred_boxes, pred_class_ids, pred_scores, pred_masks,
+ iou_threshold=0.5):
+ """Compute Average Precision at a set IoU threshold (default 0.5).
+
+ Returns:
+ mAP: Mean Average Precision
+ precisions: List of precisions at different class score thresholds.
+ recalls: List of recall values at different class score thresholds.
+ overlaps: [pred_boxes, gt_boxes] IoU overlaps.
+ """
+ # Get matches and overlaps
+ gt_match, pred_match, overlaps = compute_matches(
+ gt_boxes, gt_class_ids, gt_masks,
+ pred_boxes, pred_class_ids, pred_scores, pred_masks,
+ iou_threshold)
+
+ # Compute precision and recall at each prediction box step
+ precisions = np.cumsum(pred_match > -1) / (np.arange(len(pred_match)) + 1)
+ recalls = np.cumsum(pred_match > -1).astype(np.float32) / len(gt_match)
+
+ # Pad with start and end values to simplify the math
+ precisions = np.concatenate([[0], precisions, [0]])
+ recalls = np.concatenate([[0], recalls, [1]])
+
+ # Ensure precision values decrease but don't increase. This way, the
+ # precision value at each recall threshold is the maximum it can be
+ # for all following recall thresholds, as specified by the VOC paper.
+ for i in range(len(precisions) - 2, -1, -1):
+ precisions[i] = np.maximum(precisions[i], precisions[i + 1])
+
+ # Compute mean AP over recall range
+ indices = np.where(recalls[:-1] != recalls[1:])[0] + 1
+ mAP = np.sum((recalls[indices] - recalls[indices - 1]) *
+ precisions[indices])
+
+ return mAP, precisions, recalls, overlaps
+
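+# Worked example (illustrative): with two GT boxes and three predictions whose
+# pred_match is [0, -1, 1], the precision curve is [1.0, 0.5, 0.67] and the
+# recall curve is [0.5, 0.5, 1.0]. After padding and enforcing a monotonically
+# decreasing precision, AP = 0.5 * 1.0 + 0.5 * 0.67 ≈ 0.83.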
+
+def compute_ap_range(gt_box, gt_class_id, gt_mask,
+ pred_box, pred_class_id, pred_score, pred_mask,
+ iou_thresholds=None, verbose=1):
+    """Compute AP over a range of IoU thresholds. Default range is 0.5-0.95."""
+    # Default is 0.5 to 0.95 with increments of 0.05
+    iou_thresholds = iou_thresholds if iou_thresholds is not None \
+        else np.arange(0.5, 1.0, 0.05)
+
+ # Compute AP over range of IoU thresholds
+ AP = []
+ for iou_threshold in iou_thresholds:
+ ap, precisions, recalls, overlaps =\
+ compute_ap(gt_box, gt_class_id, gt_mask,
+ pred_box, pred_class_id, pred_score, pred_mask,
+ iou_threshold=iou_threshold)
+ if verbose:
+ print("AP @{:.2f}:\t {:.3f}".format(iou_threshold, ap))
+ AP.append(ap)
+ AP = np.array(AP).mean()
+ if verbose:
+ print("AP @{:.2f}-{:.2f}:\t {:.3f}".format(
+ iou_thresholds[0], iou_thresholds[-1], AP))
+ return AP
+
+
+def compute_recall(pred_boxes, gt_boxes, iou):
+ """Compute the recall at the given IoU threshold. It's an indication
+ of how many GT boxes were found by the given prediction boxes.
+
+ pred_boxes: [N, (y1, x1, y2, x2)] in image coordinates
+ gt_boxes: [N, (y1, x1, y2, x2)] in image coordinates
+ """
+ # Measure overlaps
+ overlaps = compute_overlaps(pred_boxes, gt_boxes)
+ iou_max = np.max(overlaps, axis=1)
+ iou_argmax = np.argmax(overlaps, axis=1)
+ positive_ids = np.where(iou_max >= iou)[0]
+ matched_gt_boxes = iou_argmax[positive_ids]
+
+ recall = len(set(matched_gt_boxes)) / gt_boxes.shape[0]
+ return recall, positive_ids
+
+
+# ## Batch Slicing
+# Some custom layers support a batch size of 1 only, and require a lot of work
+# to support batches greater than 1. This function slices an input tensor
+# across the batch dimension and feeds batches of size 1. Effectively,
+# an easy way to support batches > 1 quickly with little code modification.
+# In the long run, it's more efficient to modify the code to support large
+# batches and get rid of this function. Consider this a temporary solution.
+def batch_slice(inputs, graph_fn, batch_size, names=None):
+ """Splits inputs into slices and feeds each slice to a copy of the given
+ computation graph and then combines the results. It allows you to run a
+ graph on a batch of inputs even if the graph is written to support one
+ instance only.
+
+ inputs: list of tensors. All must have the same first dimension length
+ graph_fn: A function that returns a TF tensor that's part of a graph.
+ batch_size: number of slices to divide the data into.
+ names: If provided, assigns names to the resulting tensors.
+ """
+ if not isinstance(inputs, list):
+ inputs = [inputs]
+
+ outputs = []
+ for i in range(batch_size):
+ inputs_slice = [x[i] for x in inputs]
+ output_slice = graph_fn(*inputs_slice)
+ if not isinstance(output_slice, (tuple, list)):
+ output_slice = [output_slice]
+ outputs.append(output_slice)
+ # Change outputs from a list of slices where each is
+ # a list of outputs to a list of outputs and each has
+ # a list of slices
+ outputs = list(zip(*outputs))
+
+ if names is None:
+ names = [None] * len(outputs)
+
+ result = [tf.stack(o, axis=0, name=n)
+ for o, n in zip(outputs, names)]
+ if len(result) == 1:
+ result = result[0]
+
+ return result
+
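+# Usage sketch (illustrative): given a [batch, N, 4] tensor of normalized boxes,
+# a graph function written for a single image can be applied per slice, e.g.
+#   clipped = batch_slice(boxes, lambda b: tf.clip_by_value(b, 0.0, 1.0),
+#                         config.IMAGES_PER_GPU)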
+
+def download_trained_weights(coco_model_path, verbose=1):
+ """Download COCO trained weights from Releases.
+
+ coco_model_path: local path of COCO trained weights
+ """
+ if verbose > 0:
+ print("Downloading pretrained model to " + coco_model_path + " ...")
+ with urllib.request.urlopen(COCO_MODEL_URL) as resp, open(coco_model_path, 'wb') as out:
+ shutil.copyfileobj(resp, out)
+ if verbose > 0:
+ print("... done downloading pretrained model!")
+
+
+def norm_boxes(boxes, shape):
+ """Converts boxes from pixel coordinates to normalized coordinates.
+ boxes: [N, (y1, x1, y2, x2)] in pixel coordinates
+ shape: [..., (height, width)] in pixels
+
+ Note: In pixel coordinates (y2, x2) is outside the box. But in normalized
+ coordinates it's inside the box.
+
+ Returns:
+ [N, (y1, x1, y2, x2)] in normalized coordinates
+ """
+ h, w = shape
+ scale = np.array([h - 1, w - 1, h - 1, w - 1])
+ shift = np.array([0, 0, 1, 1])
+ return np.divide((boxes - shift), scale).astype(np.float32)
+
+
+def denorm_boxes(boxes, shape):
+ """Converts boxes from normalized coordinates to pixel coordinates.
+ boxes: [N, (y1, x1, y2, x2)] in normalized coordinates
+ shape: [..., (height, width)] in pixels
+
+ Note: In pixel coordinates (y2, x2) is outside the box. But in normalized
+ coordinates it's inside the box.
+
+ Returns:
+ [N, (y1, x1, y2, x2)] in pixel coordinates
+ """
+ h, w = shape
+ scale = np.array([h - 1, w - 1, h - 1, w - 1])
+ shift = np.array([0, 0, 1, 1])
+ return np.around(np.multiply(boxes, scale) + shift).astype(np.int32)
+
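+# Example: with shape (1024, 1024), the full-image pixel box [0, 0, 1024, 1024]
+# maps to [0, 0, 1, 1] under norm_boxes() and back to [0, 0, 1024, 1024] under
+# denorm_boxes().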
+
+def resize(image, output_shape, order=1, mode='constant', cval=0, clip=True,
+ preserve_range=False, anti_aliasing=False, anti_aliasing_sigma=None):
+ """A wrapper for Scikit-Image resize().
+
+ Scikit-Image generates warnings on every call to resize() if it doesn't
+ receive the right parameters. The right parameters depend on the version
+ of skimage. This solves the problem by using different parameters per
+ version. And it provides a central place to control resizing defaults.
+ """
+ if LooseVersion(skimage.__version__) >= LooseVersion("0.14"):
+ # New in 0.14: anti_aliasing. Default it to False for backward
+ # compatibility with skimage 0.13.
+ return skimage.transform.resize(
+ image, output_shape,
+ order=order, mode=mode, cval=cval, clip=clip,
+ preserve_range=preserve_range, anti_aliasing=anti_aliasing,
+ anti_aliasing_sigma=anti_aliasing_sigma)
+ else:
+ return skimage.transform.resize(
+ image, output_shape,
+ order=order, mode=mode, cval=cval, clip=clip,
+ preserve_range=preserve_range)
diff --git a/mask_rcnn/mrcnn/visualize.py b/mask_rcnn/mrcnn/visualize.py
new file mode 100644
index 00000000..80e5ef58
--- /dev/null
+++ b/mask_rcnn/mrcnn/visualize.py
@@ -0,0 +1,502 @@
+"""
+Mask R-CNN
+Display and Visualization Functions.
+
+Copyright (c) 2017 Matterport, Inc.
+Licensed under the MIT License (see LICENSE for details)
+Written by Waleed Abdulla
+"""
+import warnings
+warnings.filterwarnings('ignore', category=DeprecationWarning)
+warnings.filterwarnings('ignore', category=FutureWarning)
+import os
+import sys
+import random
+import itertools
+import colorsys
+
+import numpy as np
+from skimage.measure import find_contours
+import matplotlib.pyplot as plt
+from matplotlib import patches, lines
+from matplotlib.patches import Polygon
+import IPython.display
+
+# Root directory of the project
+ROOT_DIR = os.path.abspath("../")
+
+# Import Mask RCNN
+sys.path.append(ROOT_DIR) # To find local version of the library
+from mrcnn import utils
+
+
+############################################################
+# Visualization
+############################################################
+
+def display_images(images, titles=None, cols=4, cmap=None, norm=None,
+ interpolation=None):
+ """Display the given set of images, optionally with titles.
+ images: list or array of image tensors in HWC format.
+ titles: optional. A list of titles to display with each image.
+ cols: number of images per row
+ cmap: Optional. Color map to use. For example, "Blues".
+ norm: Optional. A Normalize instance to map values to colors.
+ interpolation: Optional. Image interpolation to use for display.
+ """
+ titles = titles if titles is not None else [""] * len(images)
+ rows = len(images) // cols + 1
+ plt.figure(figsize=(14, 14 * rows // cols))
+ i = 1
+ for image, title in zip(images, titles):
+ plt.subplot(rows, cols, i)
+ plt.title(title, fontsize=9)
+ plt.axis('off')
+ plt.imshow(image.astype(np.uint8), cmap=cmap,
+ norm=norm, interpolation=interpolation)
+ i += 1
+ plt.show()
+
+
+def random_colors(N, bright=True):
+ """
+ Generate random colors.
+ To get visually distinct colors, generate them in HSV space then
+ convert to RGB.
+ """
+ brightness = 1.0 if bright else 0.7
+ hsv = [(i / N, 1, brightness) for i in range(N)]
+ colors = list(map(lambda c: colorsys.hsv_to_rgb(*c), hsv))
+ random.shuffle(colors)
+ return colors
+
+
+def apply_mask(image, mask, color, alpha=0.5):
+ """Apply the given mask to the image.
+ """
+ for c in range(3):
+ image[:, :, c] = np.where(mask == 1,
+ image[:, :, c] *
+ (1 - alpha) + alpha * color[c] * 255,
+ image[:, :, c])
+ return image
+
+
+def display_instances(image, boxes, masks, class_ids, class_names,
+ scores=None, title="",
+ figsize=(16, 16), ax=None,
+ show_mask=True, show_bbox=True,
+ colors=None, captions=None):
+ """
+    boxes: [num_instances, (y1, x1, y2, x2)] in image coordinates.
+ masks: [height, width, num_instances]
+ class_ids: [num_instances]
+ class_names: list of class names of the dataset
+ scores: (optional) confidence scores for each box
+ title: (optional) Figure title
+ show_mask, show_bbox: To show masks and bounding boxes or not
+ figsize: (optional) the size of the image
+    colors: (optional) An array of colors to use with each object
+ captions: (optional) A list of strings to use as captions for each object
+ """
+ # Number of instances
+ N = boxes.shape[0]
+ if not N:
+ print("\n*** No instances to display *** \n")
+ else:
+ assert boxes.shape[0] == masks.shape[-1] == class_ids.shape[0]
+
+ # If no axis is passed, create one and automatically call show()
+ auto_show = False
+ if not ax:
+ _, ax = plt.subplots(1, figsize=figsize)
+ auto_show = True
+
+ # Generate random colors
+ colors = colors or random_colors(N)
+
+ # Show area outside image boundaries.
+ height, width = image.shape[:2]
+ ax.set_ylim(height + 10, -10)
+ ax.set_xlim(-10, width + 10)
+ ax.axis('off')
+ ax.set_title(title)
+
+ masked_image = image.astype(np.uint32).copy()
+ for i in range(N):
+ color = colors[i]
+
+ # Bounding box
+ if not np.any(boxes[i]):
+ # Skip this instance. Has no bbox. Likely lost in image cropping.
+ continue
+ y1, x1, y2, x2 = boxes[i]
+ if show_bbox:
+ p = patches.Rectangle((x1, y1), x2 - x1, y2 - y1, linewidth=2,
+ alpha=0.7, linestyle="dashed",
+ edgecolor=color, facecolor='none')
+ ax.add_patch(p)
+
+ # Label
+ if not captions:
+ class_id = class_ids[i]
+ score = scores[i] if scores is not None else None
+ label = class_names[class_id]
+ caption = "{} {:.3f}".format(label, score) if score else label
+ else:
+ caption = captions[i]
+ ax.text(x1, y1 + 8, caption,
+ color='w', size=11, backgroundcolor="none")
+
+ # Mask
+ mask = masks[:, :, i]
+ if show_mask:
+ masked_image = apply_mask(masked_image, mask, color)
+
+ # Mask Polygon
+ # Pad to ensure proper polygons for masks that touch image edges.
+ padded_mask = np.zeros(
+ (mask.shape[0] + 2, mask.shape[1] + 2), dtype=np.uint8)
+ padded_mask[1:-1, 1:-1] = mask
+ contours = find_contours(padded_mask, 0.5)
+ for verts in contours:
+ # Subtract the padding and flip (y, x) to (x, y)
+ verts = np.fliplr(verts) - 1
+ p = Polygon(verts, facecolor="none", edgecolor=color)
+ ax.add_patch(p)
+ ax.imshow(masked_image.astype(np.uint8))
+ if auto_show:
+ plt.show()
+
+
+def display_differences(image,
+ gt_box, gt_class_id, gt_mask,
+ pred_box, pred_class_id, pred_score, pred_mask,
+ class_names, title="", ax=None,
+ show_mask=True, show_box=True,
+ iou_threshold=0.5, score_threshold=0.5):
+ """Display ground truth and prediction instances on the same image."""
+ # Match predictions to ground truth
+ gt_match, pred_match, overlaps = utils.compute_matches(
+ gt_box, gt_class_id, gt_mask,
+ pred_box, pred_class_id, pred_score, pred_mask,
+ iou_threshold=iou_threshold, score_threshold=score_threshold)
+ # Ground truth = green. Predictions = red
+ colors = [(0, 1, 0, .8)] * len(gt_match)\
+ + [(1, 0, 0, 1)] * len(pred_match)
+ # Concatenate GT and predictions
+ class_ids = np.concatenate([gt_class_id, pred_class_id])
+ scores = np.concatenate([np.zeros([len(gt_match)]), pred_score])
+ boxes = np.concatenate([gt_box, pred_box])
+ masks = np.concatenate([gt_mask, pred_mask], axis=-1)
+ # Captions per instance show score/IoU
+ captions = ["" for m in gt_match] + ["{:.2f} / {:.2f}".format(
+ pred_score[i],
+ (overlaps[i, int(pred_match[i])]
+ if pred_match[i] > -1 else overlaps[i].max()))
+ for i in range(len(pred_match))]
+ # Set title if not provided
+ title = title or "Ground Truth and Detections\n GT=green, pred=red, captions: score/IoU"
+ # Display
+ display_instances(
+ image,
+ boxes, masks, class_ids,
+ class_names, scores, ax=ax,
+ show_bbox=show_box, show_mask=show_mask,
+ colors=colors, captions=captions,
+ title=title)
+
+
+def draw_rois(image, rois, refined_rois, mask, class_ids, class_names, limit=10):
+    """Draw the given ROIs and their refined versions on the image.
+    rois: [n, (y1, x1, y2, x2)] list of anchors/ROIs in image coordinates.
+    refined_rois: [n, 4] the same ROIs refined to better fit the objects.
+    """
+ masked_image = image.copy()
+
+ # Pick random anchors in case there are too many.
+ ids = np.arange(rois.shape[0], dtype=np.int32)
+ ids = np.random.choice(
+ ids, limit, replace=False) if ids.shape[0] > limit else ids
+
+ fig, ax = plt.subplots(1, figsize=(12, 12))
+ if rois.shape[0] > limit:
+ plt.title("Showing {} random ROIs out of {}".format(
+ len(ids), rois.shape[0]))
+ else:
+ plt.title("{} ROIs".format(len(ids)))
+
+ # Show area outside image boundaries.
+ ax.set_ylim(image.shape[0] + 20, -20)
+ ax.set_xlim(-50, image.shape[1] + 20)
+ ax.axis('off')
+
+ for i, id in enumerate(ids):
+ color = np.random.rand(3)
+ class_id = class_ids[id]
+ # ROI
+ y1, x1, y2, x2 = rois[id]
+ p = patches.Rectangle((x1, y1), x2 - x1, y2 - y1, linewidth=2,
+ edgecolor=color if class_id else "gray",
+ facecolor='none', linestyle="dashed")
+ ax.add_patch(p)
+ # Refined ROI
+ if class_id:
+ ry1, rx1, ry2, rx2 = refined_rois[id]
+ p = patches.Rectangle((rx1, ry1), rx2 - rx1, ry2 - ry1, linewidth=2,
+ edgecolor=color, facecolor='none')
+ ax.add_patch(p)
+ # Connect the top-left corners of the anchor and proposal for easy visualization
+ ax.add_line(lines.Line2D([x1, rx1], [y1, ry1], color=color))
+
+ # Label
+ label = class_names[class_id]
+ ax.text(rx1, ry1 + 8, "{}".format(label),
+ color='w', size=11, backgroundcolor="none")
+
+ # Mask
+ m = utils.unmold_mask(mask[id], rois[id]
+ [:4].astype(np.int32), image.shape)
+ masked_image = apply_mask(masked_image, m, color)
+
+ ax.imshow(masked_image)
+
+ # Print stats
+ print("Positive ROIs: ", class_ids[class_ids > 0].shape[0])
+ print("Negative ROIs: ", class_ids[class_ids == 0].shape[0])
+ print("Positive Ratio: {:.2f}".format(
+ class_ids[class_ids > 0].shape[0] / class_ids.shape[0]))
+
+
+# TODO: Replace with matplotlib equivalent?
+def draw_box(image, box, color):
+    """Draw 2-pixel-wide bounding boxes on the given image array.
+ color: list of 3 int values for RGB.
+ """
+ y1, x1, y2, x2 = box
+ image[y1:y1 + 2, x1:x2] = color
+ image[y2:y2 + 2, x1:x2] = color
+ image[y1:y2, x1:x1 + 2] = color
+ image[y1:y2, x2:x2 + 2] = color
+ return image
+
+
+def display_top_masks(image, mask, class_ids, class_names, limit=4):
+ """Display the given image and the top few class masks."""
+ to_display = []
+ titles = []
+ to_display.append(image)
+ titles.append("H x W={}x{}".format(image.shape[0], image.shape[1]))
+ # Pick top prominent classes in this image
+ unique_class_ids = np.unique(class_ids)
+ mask_area = [np.sum(mask[:, :, np.where(class_ids == i)[0]])
+ for i in unique_class_ids]
+ top_ids = [v[0] for v in sorted(zip(unique_class_ids, mask_area),
+ key=lambda r: r[1], reverse=True) if v[1] > 0]
+ # Generate images and titles
+ for i in range(limit):
+ class_id = top_ids[i] if i < len(top_ids) else -1
+ # Pull masks of instances belonging to the same class.
+ m = mask[:, :, np.where(class_ids == class_id)[0]]
+ m = np.sum(m * np.arange(1, m.shape[-1] + 1), -1)
+ to_display.append(m)
+ titles.append(class_names[class_id] if class_id != -1 else "-")
+ display_images(to_display, titles=titles, cols=limit + 1, cmap="Blues_r")
+
+
+def plot_precision_recall(AP, precisions, recalls):
+ """Draw the precision-recall curve.
+
+ AP: Average precision at IoU >= 0.5
+ precisions: list of precision values
+ recalls: list of recall values
+ """
+ # Plot the Precision-Recall curve
+ _, ax = plt.subplots(1)
+ ax.set_title("Precision-Recall Curve. AP@50 = {:.3f}".format(AP))
+ ax.set_ylim(0, 1.1)
+ ax.set_xlim(0, 1.1)
+ _ = ax.plot(recalls, precisions)
+
+
+def plot_overlaps(gt_class_ids, pred_class_ids, pred_scores,
+ overlaps, class_names, threshold=0.5):
+ """Draw a grid showing how ground truth objects are classified.
+ gt_class_ids: [N] int. Ground truth class IDs
+    pred_class_ids: [N] int. Predicted class IDs
+ pred_scores: [N] float. The probability scores of predicted classes
+ overlaps: [pred_boxes, gt_boxes] IoU overlaps of predictions and GT boxes.
+ class_names: list of all class names in the dataset
+    threshold: Float. IoU threshold above which a prediction is labeled as a
+        match or a wrong class in the grid.
+ """
+ gt_class_ids = gt_class_ids[gt_class_ids != 0]
+ pred_class_ids = pred_class_ids[pred_class_ids != 0]
+
+ plt.figure(figsize=(12, 10))
+ plt.imshow(overlaps, interpolation='nearest', cmap=plt.cm.Blues)
+ plt.yticks(np.arange(len(pred_class_ids)),
+ ["{} ({:.2f})".format(class_names[int(id)], pred_scores[i])
+ for i, id in enumerate(pred_class_ids)])
+ plt.xticks(np.arange(len(gt_class_ids)),
+ [class_names[int(id)] for id in gt_class_ids], rotation=90)
+
+ thresh = overlaps.max() / 2.
+ for i, j in itertools.product(range(overlaps.shape[0]),
+ range(overlaps.shape[1])):
+ text = ""
+ if overlaps[i, j] > threshold:
+ text = "match" if gt_class_ids[j] == pred_class_ids[i] else "wrong"
+ color = ("white" if overlaps[i, j] > thresh
+ else "black" if overlaps[i, j] > 0
+ else "grey")
+ plt.text(j, i, "{:.3f}\n{}".format(overlaps[i, j], text),
+ horizontalalignment="center", verticalalignment="center",
+ fontsize=9, color=color)
+
+ plt.tight_layout()
+ plt.xlabel("Ground Truth")
+ plt.ylabel("Predictions")
+
+
+def draw_boxes(image, boxes=None, refined_boxes=None,
+ masks=None, captions=None, visibilities=None,
+ title="", ax=None):
+ """Draw bounding boxes and segmentation masks with different
+ customizations.
+
+ boxes: [N, (y1, x1, y2, x2, class_id)] in image coordinates.
+ refined_boxes: Like boxes, but draw with solid lines to show
+ that they're the result of refining 'boxes'.
+ masks: [N, height, width]
+ captions: List of N titles to display on each box
+ visibilities: (optional) List of values of 0, 1, or 2. Determine how
+ prominent each bounding box should be.
+ title: An optional title to show over the image
+ ax: (optional) Matplotlib axis to draw on.
+ """
+ # Number of boxes
+ assert boxes is not None or refined_boxes is not None
+ N = boxes.shape[0] if boxes is not None else refined_boxes.shape[0]
+
+ # Matplotlib Axis
+ if not ax:
+ _, ax = plt.subplots(1, figsize=(12, 12))
+
+ # Generate random colors
+ colors = random_colors(N)
+
+ # Show area outside image boundaries.
+ margin = image.shape[0] // 10
+ ax.set_ylim(image.shape[0] + margin, -margin)
+ ax.set_xlim(-margin, image.shape[1] + margin)
+ ax.axis('off')
+
+ ax.set_title(title)
+
+ masked_image = image.astype(np.uint32).copy()
+ for i in range(N):
+ # Box visibility
+ visibility = visibilities[i] if visibilities is not None else 1
+ if visibility == 0:
+ color = "gray"
+ style = "dotted"
+ alpha = 0.5
+ elif visibility == 1:
+ color = colors[i]
+ style = "dotted"
+ alpha = 1
+ elif visibility == 2:
+ color = colors[i]
+ style = "solid"
+ alpha = 1
+
+ # Boxes
+ if boxes is not None:
+ if not np.any(boxes[i]):
+ # Skip this instance. Has no bbox. Likely lost in cropping.
+ continue
+ y1, x1, y2, x2 = boxes[i]
+ p = patches.Rectangle((x1, y1), x2 - x1, y2 - y1, linewidth=2,
+ alpha=alpha, linestyle=style,
+ edgecolor=color, facecolor='none')
+ ax.add_patch(p)
+
+ # Refined boxes
+ if refined_boxes is not None and visibility > 0:
+ ry1, rx1, ry2, rx2 = refined_boxes[i].astype(np.int32)
+ p = patches.Rectangle((rx1, ry1), rx2 - rx1, ry2 - ry1, linewidth=2,
+ edgecolor=color, facecolor='none')
+ ax.add_patch(p)
+ # Connect the top-left corners of the anchor and proposal
+ if boxes is not None:
+ ax.add_line(lines.Line2D([x1, rx1], [y1, ry1], color=color))
+
+ # Captions
+ if captions is not None:
+ caption = captions[i]
+ # If there are refined boxes, display captions on them
+ if refined_boxes is not None:
+ y1, x1, y2, x2 = ry1, rx1, ry2, rx2
+ ax.text(x1, y1, caption, size=11, verticalalignment='top',
+ color='w', backgroundcolor="none",
+ bbox={'facecolor': color, 'alpha': 0.5,
+ 'pad': 2, 'edgecolor': 'none'})
+
+ # Masks
+ if masks is not None:
+ mask = masks[:, :, i]
+ masked_image = apply_mask(masked_image, mask, color)
+ # Mask Polygon
+ # Pad to ensure proper polygons for masks that touch image edges.
+ padded_mask = np.zeros(
+ (mask.shape[0] + 2, mask.shape[1] + 2), dtype=np.uint8)
+ padded_mask[1:-1, 1:-1] = mask
+ contours = find_contours(padded_mask, 0.5)
+ for verts in contours:
+ # Subtract the padding and flip (y, x) to (x, y)
+ verts = np.fliplr(verts) - 1
+ p = Polygon(verts, facecolor="none", edgecolor=color)
+ ax.add_patch(p)
+ ax.imshow(masked_image.astype(np.uint8))
+
+
+def display_table(table):
+ """Display values in a table format.
+ table: an iterable of rows, and each row is an iterable of values.
+ """
+ html = ""
+ for row in table:
+ row_html = ""
+ for col in row:
+            row_html += "<td>{:40}</td>".format(str(col))
+        html += "<tr>" + row_html + "</tr>"
+    html = "<table>" + html + "</table>"
+ IPython.display.display(IPython.display.HTML(html))
+
+
+def display_weight_stats(model):
+ """Scans all the weights in the model and returns a list of tuples
+ that contain stats about each weight.
+ """
+ layers = model.get_trainable_layers()
+ table = [["WEIGHT NAME", "SHAPE", "MIN", "MAX", "STD"]]
+ for l in layers:
+ weight_values = l.get_weights() # list of Numpy arrays
+ weight_tensors = l.weights # list of TF tensors
+ for i, w in enumerate(weight_values):
+ weight_name = weight_tensors[i].name
+ # Detect problematic layers. Exclude biases of conv layers.
+ alert = ""
+ if w.min() == w.max() and not (l.__class__.__name__ == "Conv2D" and i == 1):
+ alert += "*** dead?"
+ if np.abs(w.min()) > 1000 or np.abs(w.max()) > 1000:
+ alert += "*** Overflow?"
+ # Add row
+ table.append([
+ weight_name + alert,
+ str(w.shape),
+ "{:+9.4f}".format(w.min()),
+ "{:+10.4f}".format(w.max()),
+ "{:+9.4f}".format(w.std()),
+ ])
+ display_table(table)
diff --git a/mask_rcnn/requirements.txt b/mask_rcnn/requirements.txt
new file mode 100644
index 00000000..22e883b7
--- /dev/null
+++ b/mask_rcnn/requirements.txt
@@ -0,0 +1,12 @@
+numpy
+scipy
+Pillow
+cython
+matplotlib
+scikit-image
+tensorflow-gpu>=1.3.0,<2.0
+keras==2.2.5
+opencv-python
+h5py
+imgaug
+IPython[all]
\ No newline at end of file
diff --git a/mask_rcnn/score.py b/mask_rcnn/score.py
new file mode 100644
index 00000000..ad9bc731
--- /dev/null
+++ b/mask_rcnn/score.py
@@ -0,0 +1,300 @@
+from mrcnn.model import log
+import mrcnn.model as modellib
+from mrcnn.visualize import display_images
+import mrcnn.visualize as visualize
+import mrcnn.utils as utils
+from mrcnn.config import Config
+import sys
+import math
+import re
+import time
+import numpy as np
+import tensorflow as tf
+import matplotlib
+import matplotlib.pyplot as plt
+import matplotlib.patches as patches
+import os
+import json
+import datetime
+import skimage.draw
+import skimage.io
+import cv2
+import argparse
+
+# Device to load the neural network on.
+# Useful if you're training a model on the same
+# machine, in which case use CPU and leave the
+# GPU for training.
+DEVICE = "/cpu:0" # /cpu:0 or /gpu:0
+
+ACCEPTED_EXTENSIONS = ['.jpg', '.jpeg', '.png', '.gif']
+CLASS_NAMES = ['BG', 'outerbox', 'innerbox', 'item_sq', 'item_rect', 'item_rect_slim', 'item_circ']
+ITEM_NAMES = CLASS_NAMES[3:]
+
+class PPConfig(Config):
+    """Configuration for the pointless packaging dataset.
+    Derives from the base Config class and overrides some values.
+    """
+    # Give the configuration a recognizable name
+    NAME = "pointless_package"
+
+    # Number of images to process per GPU. Increase if your GPU has enough
+    # memory to handle more than one image at a time.
+    IMAGES_PER_GPU = 1
+
+    # Number of classes (including background)
+    # Background + outerbox + innerbox + item_sq + item_rect + item_rect_slim + item_circ
+    NUM_CLASSES = 1 + 6
+
+    # Number of training steps per epoch
+    STEPS_PER_EPOCH = 100
+
+    # Skip detections with < 75% confidence
+    DETECTION_MIN_CONFIDENCE = 0.75
+
+class PPDataset(utils.Dataset):
+
+ def load_dataset(self, dataset_dir, subset):
+        """Load a subset of the pointless packaging dataset.
+ dataset_dir: Root directory of the dataset.
+ subset: Subset to load: train or val
+ """
+        # Add classes. There are six foreground classes.
+ self.add_class("pointless_package", 1, "outerbox")
+ self.add_class("pointless_package", 2, "innerbox")
+ self.add_class("pointless_package", 3, "item_sq")
+ self.add_class("pointless_package", 4, "item_rect")
+ self.add_class("pointless_package", 5, "item_rect_slim")
+ self.add_class("pointless_package", 6, "item_circ")
+
+ # Train or validation dataset?
+ assert subset in ["train", "val"]
+ dataset_dir = os.path.join(dataset_dir, subset)
+
+ # Load annotations
+ # VGG Image Annotator (up to version 1.6) saves each image in the form:
+ # { 'filename': '28503151_5b5b7ec140_b.jpg',
+ # 'regions': {
+ # '0': {
+ # 'region_attributes': {},
+ # 'shape_attributes': {
+ # 'all_points_x': [...],
+ # 'all_points_y': [...],
+ # 'name': 'polygon'}},
+ # ... more regions ...
+ # },
+ # 'size': 100202
+ # }
+ # We mostly care about the x and y coordinates of each region
+ # Note: In VIA 2.0, regions was changed from a dict to a list.
+ annotations = json.load(
+ open(os.path.join(dataset_dir, "via_region_data.json")))
+ annotations = list(annotations.values()) # don't need the dict keys
+
+ # The VIA tool saves images in the JSON even if they don't have any
+ # annotations. Skip unannotated images.
+ annotations = [a for a in annotations if a['regions']]
+
+ # Add images
+ for a in annotations:
+            # Get the x, y coordinates of the points of the polygons that make
+            # up the outline of each object instance. These are stored in the
+            # shape_attributes (see JSON format above).
+ # The if condition is needed to support VIA versions 1.x and 2.x.
+ if type(a['regions']) is dict:
+ polygons = [r['shape_attributes']
+ for r in a['regions'].values()]
+ else:
+ polygons = [r['shape_attributes'] for r in a['regions']]
+
+            # load_mask() needs the image size to convert polygons to masks.
+            # Unfortunately, VIA doesn't include it in the JSON, so we must read
+            # the image. This is only manageable since the dataset is tiny.
+ image_path = os.path.join(dataset_dir, a['filename'])
+ image = skimage.io.imread(image_path)
+ height, width = image.shape[:2]
+
+ class_list = [r['region_attributes'] for r in a['regions']]
+
+ self.add_image(
+ "pointless_package",
+ image_id=a['filename'], # use file name as a unique image id
+ path=image_path,
+ width=width, height=height,
+ class_list=class_list,
+ polygons=polygons)
+
+ def load_mask(self, image_id):
+ """Generate instance masks for an image.
+ Returns:
+ masks: A bool array of shape [height, width, instance count] with
+ one mask per instance.
+ class_ids: a 1D array of class IDs of the instance masks.
+ """
+ class_ids = list()
+ # If not a pointless_package dataset image, delegate to parent class.
+ image_info = self.image_info[image_id]
+ # if image_info["source"] != "pointless_package":
+ # return super(self.__class__, self).load_mask(image_id)
+
+ # Convert polygons to a bitmap mask of shape
+ # [height, width, instance_count]
+ info = self.image_info[image_id]
+ # print("\n\n\nIMAGE INFO:", info, "\n\n\n\n")
+
+ for box_type in info['class_list']:
+ # print(box_type['name'])
+ class_ids.append(self.class_names.index(str(box_type['name'])))
+ # print(class_ids)
+ # print(self.class_names)
+
+ mask = np.zeros([info["height"], info["width"], len(info["polygons"])],
+ dtype=np.uint8)
+ for i, p in enumerate(info["polygons"]):
+ # Get indexes of pixels inside the polygon and set them to 1
+ rr, cc = skimage.draw.polygon(p['all_points_y'], p['all_points_x'])
+ mask[rr, cc, i] = 1
+        # Return the mask and an array with the class ID of each instance.
+ return mask.astype(np.bool), np.asarray(class_ids, dtype=np.int32)
+
+ def image_reference(self, image_id):
+ """Return the path of the image."""
+ info = self.image_info[image_id]
+ if info["source"] == "pointless_package":
+ return info["path"]
+ else:
+ super(self.__class__, self).image_reference(image_id)
+
+config = PPConfig()
+ROOT_DIR = os.getcwd()
+PP_DIR = os.path.join(ROOT_DIR, "./")
+
+# Override the training configurations with a few
+# changes for inferencing.
+class InferenceConfig(config.__class__):
+ # Run detection on one image at a time
+ GPU_COUNT = 1
+ IMAGES_PER_GPU = 1
+
+config = InferenceConfig()
+
+def get_ax(rows=1, cols=1, size=16):
+ """Return a Matplotlib Axes array to be used in
+    all visualizations in this script. Provide a
+ central point to control graph sizes.
+
+ Adjust the size attribute to control how big to render images
+ """
+ _, ax = plt.subplots(rows, cols, figsize=(size*cols, size*rows))
+ return ax
+
+description = "Simple script that takes a trained MASK R-CNN model (.h5) and a pointless packaging image (or a directory of images), then generates a score of the packaging based purely on the area of the package relative to the item inside, using the provided model."
+
+def parse_args():
+ parser = argparse.ArgumentParser(description=description)
+ parser.add_argument('-m', '--model', required=True,
+ help='Absolute/Relative path to the MASK R-CNN Model', dest='model_src')
+ g = parser.add_mutually_exclusive_group()
+ g.add_argument('-i', '--img', required=False,
+ help='Absolute/Relative path of the image. Cannot include --dir argument.', dest='img_src')
+ g.add_argument('-d', '--dir', required=False,
+ help='Absolute/Relative path of the directory containing the images. Cannot include --img argument.', dest='dir_src')
+ parser.add_argument('-v', '--visualize', action='store_true',
+ help='Visualize the image.', dest='vis_arg')
+
+ return parser.parse_args()
+
+def main():
+ args = parse_args()
+    file_only = args.img_src is not None
+
+    if args.img_src is None and args.dir_src is None:
+        print("Please provide an image (--img) or a directory of images (--dir).")
+        raise SystemExit
+
+    if not os.path.isfile(args.model_src):
+        print("Model file does not exist. Please provide a model.")
+        raise SystemExit
+
+    if file_only:
+        if not os.path.isfile(args.img_src):
+            print("Please enter a valid image.")
+            raise SystemExit
+    else:
+        if not os.path.isdir(args.dir_src):
+            print("Please enter a valid directory.")
+            raise SystemExit
+
+    if os.path.splitext(args.model_src)[1] != '.h5':
+        print("Not a valid model. Please enter .h5 models only.")
+        raise SystemExit
+
+ ### SETUP MODEL ###
+    target_height = 300  # input images are scaled so their height becomes 300 px
+
+    # Create model in inference mode
+ with tf.device(DEVICE):
+ model = modellib.MaskRCNN(mode="inference", model_dir='./models/',
+ config=config)
+
+ # Load weights
+ print("Loading weights ", args.model_src)
+ model.load_weights(args.model_src, by_name=True)
+
+ ### RUN INFERENCE ###
+ if file_only:
+ files = [args.img_src]
+ else:
+        try:
+            # Get all files in the given directory
+            files = os.listdir(args.dir_src)
+        except NotADirectoryError:
+            print("Invalid directory:", args.dir_src)
+            raise
+
+ print("\n\n----------------------")
+ print(" PACKAGING SCORES ")
+ print("----------------------")
+
+    for file in files:
+        if os.path.splitext(file)[1].lower() not in ACCEPTED_EXTENSIONS:
+            # Not a supported image type; skip it.
+            continue
+        # With --dir, `files` holds bare file names, so join them with the
+        # directory path; with --img the entry is already a usable path.
+        img_path = file if file_only else os.path.join(args.dir_src, file)
+        image = cv2.imread(img_path)
+        image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+
+        # Scale the image so its height becomes `target_height` while keeping the
+        # aspect ratio. Note that cv2.resize expects dsize as (width, height).
+        orig_dim = image.shape
+        new_dim = (int((target_height / orig_dim[0]) * orig_dim[1]), target_height)
+        image = cv2.resize(image, new_dim, interpolation=cv2.INTER_AREA)
+        if orig_dim[0] > target_height:
+            print("Image resized from", orig_dim[:2], " ->", image.shape[:2])
+
+ # Run object detection
+ results = model.detect([image], verbose=0)
+
+ # Display results
+ r = results[0]
+
+ N = r['rois'].shape[0]
+ class_ids = r['class_ids']
+ masks = r['masks']
+
+ class_names = np.asarray(CLASS_NAMES)
+
+ # area_occupation = [masks[:, :, i].sum() for i in range(N)]
+ area_occupation = masks.sum(axis=0).sum(axis=0)
+ map_items_to_area = list(map(
+ lambda x, y: x+': '+str(y), class_names[class_ids], area_occupation))
+ print("{}: (ITEM: AREA) ->".format(os.path.basename(file)), map_items_to_area, "{}".format(
+ "" if set(ITEM_NAMES) & set(class_names[class_ids]) else "-> NO ITEMS FOUND!"))
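+
+        # Illustrative idea for a future scoring function (not wired in), assuming
+        # at most one detection per class: score = item area / outer box area.
+        #   name_to_area = dict(zip(class_names[class_ids], area_occupation))
+        #   item_area = sum(v for k, v in name_to_area.items() if k in ITEM_NAMES)
+        #   outer_area = name_to_area.get('outerbox', 0)
+        #   score = item_area / outer_area if outer_area else None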
+
+ if args.vis_arg:
+ visualize.display_instances(image, r['rois'], r['masks'], r['class_ids'],
+ CLASS_NAMES, r['scores'],
+ title="Predictions")
+
+ print("\n\nDone.\n")
+
+if __name__ == "__main__":
+ main()
diff --git a/mask_rcnn/test_images/IMG_0.jpg b/mask_rcnn/test_images/IMG_0.jpg
new file mode 100644
index 00000000..57b9d110
Binary files /dev/null and b/mask_rcnn/test_images/IMG_0.jpg differ
diff --git a/mask_rcnn/test_images/IMG_1.jpg b/mask_rcnn/test_images/IMG_1.jpg
new file mode 100644
index 00000000..eac21b38
Binary files /dev/null and b/mask_rcnn/test_images/IMG_1.jpg differ
diff --git a/mask_rcnn/test_images/IMG_2.jpg b/mask_rcnn/test_images/IMG_2.jpg
new file mode 100644
index 00000000..a67f55cb
Binary files /dev/null and b/mask_rcnn/test_images/IMG_2.jpg differ
diff --git a/mask_rcnn/test_images/IMG_26.jpg b/mask_rcnn/test_images/IMG_26.jpg
new file mode 100644
index 00000000..b927984e
Binary files /dev/null and b/mask_rcnn/test_images/IMG_26.jpg differ
diff --git a/mask_rcnn/test_images/IMG_3.jpg b/mask_rcnn/test_images/IMG_3.jpg
new file mode 100644
index 00000000..0258c891
Binary files /dev/null and b/mask_rcnn/test_images/IMG_3.jpg differ
diff --git a/mask_rcnn/test_images/IMG_4.jpg b/mask_rcnn/test_images/IMG_4.jpg
new file mode 100644
index 00000000..089831a3
Binary files /dev/null and b/mask_rcnn/test_images/IMG_4.jpg differ
diff --git a/mask_rcnn/test_images/IMG_7.jpg b/mask_rcnn/test_images/IMG_7.jpg
new file mode 100644
index 00000000..a19209ef
Binary files /dev/null and b/mask_rcnn/test_images/IMG_7.jpg differ
diff --git a/mask_rcnn/test_images/IMG_8.jpg b/mask_rcnn/test_images/IMG_8.jpg
new file mode 100644
index 00000000..d846986b
Binary files /dev/null and b/mask_rcnn/test_images/IMG_8.jpg differ
diff --git a/mask_rcnn/test_images/IMG_9.jpg b/mask_rcnn/test_images/IMG_9.jpg
new file mode 100644
index 00000000..0df3d43f
Binary files /dev/null and b/mask_rcnn/test_images/IMG_9.jpg differ
diff --git a/mask_rcnn/tf_servable/README.md b/mask_rcnn/tf_servable/README.md
new file mode 100644
index 00000000..9d87f2af
--- /dev/null
+++ b/mask_rcnn/tf_servable/README.md
@@ -0,0 +1,50 @@
+# CREDIT FOR THIS LIBRARY: https://github.com/bendangnuksung/mrcnn_serving_ready
+
+### MRCNN Model conversion
+Script to convert a [MatterPort Mask_RCNN](https://github.com/matterport/Mask_RCNN) Keras model to a TensorFlow frozen graph and a TensorFlow Serving model.
+It also covers inference with GRPC or the REST API using TensorFlow Model Server.
+
+
+### How to Run
+1. Modify the path variables in 'user_config.py'
+2. Run main.py
+ ```bash
+ python3 main.py
+ ```
+
+#### For Custom Config class
+If you have a different config class, you can replace the existing config in 'main.py':
+```python
+# main.py
+# Current config load
+config = get_config()
+
+# replace it with your config class
+config = your_custom_config_class
+
+```
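+
+For example, a minimal sketch for this project's six packaging/item classes
+(the class name below is illustrative, not part of this repo):
+```python
+from mrcnn.config import Config
+
+class PointlessPackageConfig(Config):
+    NAME = "pointless_package"
+    NUM_CLASSES = 1 + 6   # background + outerbox, innerbox and the four item classes
+    GPU_COUNT = 1
+    IMAGES_PER_GPU = 1
+
+config = PointlessPackageConfig()
+```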
+
+### Inferencing
+Follow these steps once you have converted the model to a `saved_model` using the code above.
+
+#### Tensorflow Model Server with GRPC and RESTAPI
+
+1. First run your `saved_model.pb` in Tensorflow Model Server, using:
+ ```bash
+ tensorflow_model_server --port=8500 --rest_api_port=8501 --model_name=mask --model_base_path=/path/to/saved_model/
+ ```
+2. Modify the variables and add your Config Class if needed in `inferencing/saved_model_config.py`. No need to change if the saved_model is the default COCO model.
+3. Then run the `inferencing/saved_model_inference.py` with the image path:
+ ```bash
+ # Set Python Path
+ export PYTHONPATH=$PYTHONPATH:$pwd
+
+ # Run Inference with GRPC
+ python3 inferencing/saved_model_inference.py -t grpc -p test_image/monalisa.jpg
+
+ # Run Inference with RESTAPI
+ python3 inferencing/saved_model_inference.py -t restapi -p test_image/monalisa.jpg
+ ```
+
+### Acknowledgement
+Thanks to [@rahulgullan](https://github.com/rahulgullan) for RESTAPI client code.
\ No newline at end of file
diff --git a/mask_rcnn/tf_servable/coco.py b/mask_rcnn/tf_servable/coco.py
new file mode 100644
index 00000000..5d172b5c
--- /dev/null
+++ b/mask_rcnn/tf_servable/coco.py
@@ -0,0 +1,534 @@
+"""
+Mask R-CNN
+Configurations and data loading code for MS COCO.
+
+Copyright (c) 2017 Matterport, Inc.
+Licensed under the MIT License (see LICENSE for details)
+Written by Waleed Abdulla
+
+------------------------------------------------------------
+
+Usage: import the module (see Jupyter notebooks for examples), or run from
+ the command line as such:
+
+ # Train a new model starting from pre-trained COCO weights
+ python3 coco.py train --dataset=/path/to/coco/ --model=coco
+
+ # Train a new model starting from ImageNet weights. Also auto download COCO dataset
+ python3 coco.py train --dataset=/path/to/coco/ --model=imagenet --download=True
+
+ # Continue training a model that you had trained earlier
+ python3 coco.py train --dataset=/path/to/coco/ --model=/path/to/weights.h5
+
+ # Continue training the last model you trained
+ python3 coco.py train --dataset=/path/to/coco/ --model=last
+
+    # Run COCO evaluation on the last model you trained
+ python3 coco.py evaluate --dataset=/path/to/coco/ --model=last
+"""
+
+import os
+import sys
+import time
+import numpy as np
+import imgaug # https://github.com/aleju/imgaug (pip3 install imgaug)
+
+# Download and install the Python COCO tools from https://github.com/waleedka/coco
+# That's a fork from the original https://github.com/pdollar/coco with a bug
+# fix for Python 3.
+# I submitted a pull request https://github.com/cocodataset/cocoapi/pull/50
+# If the PR is merged then use the original repo.
+# Note: Edit PythonAPI/Makefile and replace "python" with "python3".
+from pycocotools.coco import COCO
+from pycocotools.cocoeval import COCOeval
+from pycocotools import mask as maskUtils
+
+import zipfile
+import urllib.request
+import shutil
+
+# Root directory of the project
+ROOT_DIR = os.path.abspath("../../")
+
+# Import Mask RCNN
+sys.path.append(ROOT_DIR) # To find local version of the library
+from mrcnn.config import Config
+from mrcnn import model as modellib, utils
+
+# Path to trained weights file
+COCO_MODEL_PATH = os.path.join(ROOT_DIR, "mask_rcnn_coco.h5")
+
+# Directory to save logs and model checkpoints, if not provided
+# through the command line argument --logs
+DEFAULT_LOGS_DIR = os.path.join(ROOT_DIR, "logs")
+DEFAULT_DATASET_YEAR = "2014"
+
+############################################################
+# Configurations
+############################################################
+
+
+class CocoConfig(Config):
+ """Configuration for training on MS COCO.
+ Derives from the base Config class and overrides values specific
+ to the COCO dataset.
+ """
+ # Give the configuration a recognizable name
+ NAME = "coco"
+
+ # We use a GPU with 12GB memory, which can fit two images.
+ # Adjust down if you use a smaller GPU.
+ IMAGES_PER_GPU = 2
+
+ # Uncomment to train on 8 GPUs (default is 1)
+ # GPU_COUNT = 8
+
+ # Number of classes (including background)
+ NUM_CLASSES = 1 + 80 # COCO has 80 classes
+
+
+############################################################
+# Dataset
+############################################################
+
+class CocoDataset(utils.Dataset):
+ def load_coco(self, dataset_dir, subset, year=DEFAULT_DATASET_YEAR, class_ids=None,
+ class_map=None, return_coco=False, auto_download=False):
+ """Load a subset of the COCO dataset.
+ dataset_dir: The root directory of the COCO dataset.
+ subset: What to load (train, val, minival, valminusminival)
+ year: What dataset year to load (2014, 2017) as a string, not an integer
+ class_ids: If provided, only loads images that have the given classes.
+        class_map: TODO: Not implemented yet. Supports mapping classes from
+ different datasets to the same class ID.
+ return_coco: If True, returns the COCO object.
+ auto_download: Automatically download and unzip MS-COCO images and annotations
+ """
+
+ if auto_download is True:
+ self.auto_download(dataset_dir, subset, year)
+
+ coco = COCO("{}/annotations/instances_{}{}.json".format(dataset_dir, subset, year))
+ if subset == "minival" or subset == "valminusminival":
+ subset = "val"
+ image_dir = "{}/{}{}".format(dataset_dir, subset, year)
+
+ # Load all classes or a subset?
+ if not class_ids:
+ # All classes
+ class_ids = sorted(coco.getCatIds())
+
+ # All images or a subset?
+ if class_ids:
+ image_ids = []
+ for id in class_ids:
+ image_ids.extend(list(coco.getImgIds(catIds=[id])))
+ # Remove duplicates
+ image_ids = list(set(image_ids))
+ else:
+ # All images
+ image_ids = list(coco.imgs.keys())
+
+ # Add classes
+ for i in class_ids:
+ self.add_class("coco", i, coco.loadCats(i)[0]["name"])
+
+ # Add images
+ for i in image_ids:
+ self.add_image(
+ "coco", image_id=i,
+ path=os.path.join(image_dir, coco.imgs[i]['file_name']),
+ width=coco.imgs[i]["width"],
+ height=coco.imgs[i]["height"],
+ annotations=coco.loadAnns(coco.getAnnIds(
+ imgIds=[i], catIds=class_ids, iscrowd=None)))
+ if return_coco:
+ return coco
+
+ def auto_download(self, dataDir, dataType, dataYear):
+ """Download the COCO dataset/annotations if requested.
+ dataDir: The root directory of the COCO dataset.
+ dataType: What to load (train, val, minival, valminusminival)
+ dataYear: What dataset year to load (2014, 2017) as a string, not an integer
+ Note:
+ For 2014, use "train", "val", "minival", or "valminusminival"
+ For 2017, only "train" and "val" annotations are available
+ """
+
+ # Setup paths and file names
+ if dataType == "minival" or dataType == "valminusminival":
+ imgDir = "{}/{}{}".format(dataDir, "val", dataYear)
+ imgZipFile = "{}/{}{}.zip".format(dataDir, "val", dataYear)
+ imgURL = "http://images.cocodataset.org/zips/{}{}.zip".format("val", dataYear)
+ else:
+ imgDir = "{}/{}{}".format(dataDir, dataType, dataYear)
+ imgZipFile = "{}/{}{}.zip".format(dataDir, dataType, dataYear)
+ imgURL = "http://images.cocodataset.org/zips/{}{}.zip".format(dataType, dataYear)
+ # print("Image paths:"); print(imgDir); print(imgZipFile); print(imgURL)
+
+ # Create main folder if it doesn't exist yet
+ if not os.path.exists(dataDir):
+ os.makedirs(dataDir)
+
+ # Download images if not available locally
+ if not os.path.exists(imgDir):
+ os.makedirs(imgDir)
+ print("Downloading images to " + imgZipFile + " ...")
+ with urllib.request.urlopen(imgURL) as resp, open(imgZipFile, 'wb') as out:
+ shutil.copyfileobj(resp, out)
+ print("... done downloading.")
+ print("Unzipping " + imgZipFile)
+ with zipfile.ZipFile(imgZipFile, "r") as zip_ref:
+ zip_ref.extractall(dataDir)
+ print("... done unzipping")
+ print("Will use images in " + imgDir)
+
+ # Setup annotations data paths
+ annDir = "{}/annotations".format(dataDir)
+ if dataType == "minival":
+ annZipFile = "{}/instances_minival2014.json.zip".format(dataDir)
+ annFile = "{}/instances_minival2014.json".format(annDir)
+ annURL = "https://dl.dropboxusercontent.com/s/o43o90bna78omob/instances_minival2014.json.zip?dl=0"
+ unZipDir = annDir
+ elif dataType == "valminusminival":
+ annZipFile = "{}/instances_valminusminival2014.json.zip".format(dataDir)
+ annFile = "{}/instances_valminusminival2014.json".format(annDir)
+ annURL = "https://dl.dropboxusercontent.com/s/s3tw5zcg7395368/instances_valminusminival2014.json.zip?dl=0"
+ unZipDir = annDir
+ else:
+ annZipFile = "{}/annotations_trainval{}.zip".format(dataDir, dataYear)
+ annFile = "{}/instances_{}{}.json".format(annDir, dataType, dataYear)
+ annURL = "http://images.cocodataset.org/annotations/annotations_trainval{}.zip".format(dataYear)
+ unZipDir = dataDir
+ # print("Annotations paths:"); print(annDir); print(annFile); print(annZipFile); print(annURL)
+
+ # Download annotations if not available locally
+ if not os.path.exists(annDir):
+ os.makedirs(annDir)
+ if not os.path.exists(annFile):
+ if not os.path.exists(annZipFile):
+ print("Downloading zipped annotations to " + annZipFile + " ...")
+ with urllib.request.urlopen(annURL) as resp, open(annZipFile, 'wb') as out:
+ shutil.copyfileobj(resp, out)
+ print("... done downloading.")
+ print("Unzipping " + annZipFile)
+ with zipfile.ZipFile(annZipFile, "r") as zip_ref:
+ zip_ref.extractall(unZipDir)
+ print("... done unzipping")
+ print("Will use annotations in " + annFile)
+
+ def load_mask(self, image_id):
+ """Load instance masks for the given image.
+
+ Different datasets use different ways to store masks. This
+ function converts the different mask format to one format
+ in the form of a bitmap [height, width, instances].
+
+ Returns:
+ masks: A bool array of shape [height, width, instance count] with
+ one mask per instance.
+ class_ids: a 1D array of class IDs of the instance masks.
+ """
+ # If not a COCO image, delegate to parent class.
+ image_info = self.image_info[image_id]
+ if image_info["source"] != "coco":
+ return super(CocoDataset, self).load_mask(image_id)
+
+ instance_masks = []
+ class_ids = []
+ annotations = self.image_info[image_id]["annotations"]
+ # Build mask of shape [height, width, instance_count] and list
+ # of class IDs that correspond to each channel of the mask.
+ for annotation in annotations:
+ class_id = self.map_source_class_id(
+ "coco.{}".format(annotation['category_id']))
+ if class_id:
+ m = self.annToMask(annotation, image_info["height"],
+ image_info["width"])
+ # Some objects are so small that they're less than 1 pixel area
+ # and end up rounded out. Skip those objects.
+ if m.max() < 1:
+ continue
+ # Is it a crowd? If so, use a negative class ID.
+ if annotation['iscrowd']:
+ # Use negative class ID for crowds
+ class_id *= -1
+ # For crowd masks, annToMask() sometimes returns a mask
+ # smaller than the given dimensions. If so, resize it.
+ if m.shape[0] != image_info["height"] or m.shape[1] != image_info["width"]:
+ m = np.ones([image_info["height"], image_info["width"]], dtype=bool)
+ instance_masks.append(m)
+ class_ids.append(class_id)
+
+ # Pack instance masks into an array
+ if class_ids:
+ mask = np.stack(instance_masks, axis=2).astype(np.bool)
+ class_ids = np.array(class_ids, dtype=np.int32)
+ return mask, class_ids
+ else:
+ # Call super class to return an empty mask
+ return super(CocoDataset, self).load_mask(image_id)
+
+ def image_reference(self, image_id):
+ """Return a link to the image in the COCO Website."""
+ info = self.image_info[image_id]
+ if info["source"] == "coco":
+ return "http://cocodataset.org/#explore?id={}".format(info["id"])
+ else:
+ super(CocoDataset, self).image_reference(image_id)
+
+ # The following two functions are from pycocotools with a few changes.
+
+ def annToRLE(self, ann, height, width):
+ """
+ Convert annotation which can be polygons, uncompressed RLE to RLE.
+ :return: binary mask (numpy 2D array)
+ """
+ segm = ann['segmentation']
+ if isinstance(segm, list):
+ # polygon -- a single object might consist of multiple parts
+ # we merge all parts into one mask rle code
+ rles = maskUtils.frPyObjects(segm, height, width)
+ rle = maskUtils.merge(rles)
+ elif isinstance(segm['counts'], list):
+ # uncompressed RLE
+ rle = maskUtils.frPyObjects(segm, height, width)
+ else:
+ # rle
+ rle = ann['segmentation']
+ return rle
+
+ def annToMask(self, ann, height, width):
+ """
+ Convert annotation which can be polygons, uncompressed RLE, or RLE to binary mask.
+ :return: binary mask (numpy 2D array)
+ """
+ rle = self.annToRLE(ann, height, width)
+ m = maskUtils.decode(rle)
+ return m
+
+
+############################################################
+# COCO Evaluation
+############################################################
+
+def build_coco_results(dataset, image_ids, rois, class_ids, scores, masks):
+    """Arrange results to match COCO specs in http://cocodataset.org/#format
+ """
+ # If no results, return an empty list
+ if rois is None:
+ return []
+
+ results = []
+ for image_id in image_ids:
+ # Loop through detections
+ for i in range(rois.shape[0]):
+ class_id = class_ids[i]
+ score = scores[i]
+ bbox = np.around(rois[i], 1)
+ mask = masks[:, :, i]
+
+ result = {
+ "image_id": image_id,
+ "category_id": dataset.get_source_class_id(class_id, "coco"),
+ "bbox": [bbox[1], bbox[0], bbox[3] - bbox[1], bbox[2] - bbox[0]],
+ "score": score,
+ "segmentation": maskUtils.encode(np.asfortranarray(mask))
+ }
+ results.append(result)
+ return results
+
+
+def evaluate_coco(model, dataset, coco, eval_type="bbox", limit=0, image_ids=None):
+ """Runs official COCO evaluation.
+    dataset: A Dataset object with validation data
+ eval_type: "bbox" or "segm" for bounding box or segmentation evaluation
+ limit: if not 0, it's the number of images to use for evaluation
+ """
+ # Pick COCO images from the dataset
+ image_ids = image_ids or dataset.image_ids
+
+ # Limit to a subset
+ if limit:
+ image_ids = image_ids[:limit]
+
+ # Get corresponding COCO image IDs.
+ coco_image_ids = [dataset.image_info[id]["id"] for id in image_ids]
+
+ t_prediction = 0
+ t_start = time.time()
+
+ results = []
+ for i, image_id in enumerate(image_ids):
+ # Load image
+ image = dataset.load_image(image_id)
+
+ # Run detection
+ t = time.time()
+ r = model.detect([image], verbose=0)[0]
+ t_prediction += (time.time() - t)
+
+ # Convert results to COCO format
+ # Cast masks to uint8 because COCO tools errors out on bool
+ image_results = build_coco_results(dataset, coco_image_ids[i:i + 1],
+ r["rois"], r["class_ids"],
+ r["scores"],
+ r["masks"].astype(np.uint8))
+ results.extend(image_results)
+
+ # Load results. This modifies results with additional attributes.
+ coco_results = coco.loadRes(results)
+
+ # Evaluate
+ cocoEval = COCOeval(coco, coco_results, eval_type)
+ cocoEval.params.imgIds = coco_image_ids
+ cocoEval.evaluate()
+ cocoEval.accumulate()
+ cocoEval.summarize()
+
+ print("Prediction time: {}. Average {}/image".format(
+ t_prediction, t_prediction / len(image_ids)))
+ print("Total time: ", time.time() - t_start)
+
+
+############################################################
+# Training
+############################################################
+
+
+if __name__ == '__main__':
+ import argparse
+
+ # Parse command line arguments
+ parser = argparse.ArgumentParser(
+ description='Train Mask R-CNN on MS COCO.')
+ parser.add_argument("command",
+                        metavar="<command>",
+ help="'train' or 'evaluate' on MS COCO")
+ parser.add_argument('--dataset', required=True,
+ metavar="/path/to/coco/",
+ help='Directory of the MS-COCO dataset')
+ parser.add_argument('--year', required=False,
+ default=DEFAULT_DATASET_YEAR,
+                        metavar="<year>",
+ help='Year of the MS-COCO dataset (2014 or 2017) (default=2014)')
+ parser.add_argument('--model', required=True,
+ metavar="/path/to/weights.h5",
+ help="Path to weights .h5 file or 'coco'")
+ parser.add_argument('--logs', required=False,
+ default=DEFAULT_LOGS_DIR,
+ metavar="/path/to/logs/",
+ help='Logs and checkpoints directory (default=logs/)')
+ parser.add_argument('--limit', required=False,
+ default=500,
+                        metavar="<image count>",
+ help='Images to use for evaluation (default=500)')
+ parser.add_argument('--download', required=False,
+ default=False,
+                        metavar="<True|False>",
+ help='Automatically download and unzip MS-COCO files (default=False)',
+ type=bool)
+ args = parser.parse_args()
+ print("Command: ", args.command)
+ print("Model: ", args.model)
+ print("Dataset: ", args.dataset)
+ print("Year: ", args.year)
+ print("Logs: ", args.logs)
+ print("Auto Download: ", args.download)
+
+ # Configurations
+ if args.command == "train":
+ config = CocoConfig()
+ else:
+ class InferenceConfig(CocoConfig):
+ # Set batch size to 1 since we'll be running inference on
+ # one image at a time. Batch size = GPU_COUNT * IMAGES_PER_GPU
+ GPU_COUNT = 1
+ IMAGES_PER_GPU = 1
+ DETECTION_MIN_CONFIDENCE = 0
+ config = InferenceConfig()
+ config.display()
+
+ # Create model
+ if args.command == "train":
+ model = modellib.MaskRCNN(mode="training", config=config,
+ model_dir=args.logs)
+ else:
+ model = modellib.MaskRCNN(mode="inference", config=config,
+ model_dir=args.logs)
+
+ # Select weights file to load
+ if args.model.lower() == "coco":
+ model_path = COCO_MODEL_PATH
+ elif args.model.lower() == "last":
+ # Find last trained weights
+ model_path = model.find_last()
+ elif args.model.lower() == "imagenet":
+ # Start from ImageNet trained weights
+ model_path = model.get_imagenet_weights()
+ else:
+ model_path = args.model
+
+ # Load weights
+ print("Loading weights ", model_path)
+ model.load_weights(model_path, by_name=True)
+
+ # Train or evaluate
+ if args.command == "train":
+ # Training dataset. Use the training set and 35K from the
+        # validation set, as in the Mask R-CNN paper.
+ dataset_train = CocoDataset()
+ dataset_train.load_coco(args.dataset, "train", year=args.year, auto_download=args.download)
+ if args.year in '2014':
+ dataset_train.load_coco(args.dataset, "valminusminival", year=args.year, auto_download=args.download)
+ dataset_train.prepare()
+
+ # Validation dataset
+ dataset_val = CocoDataset()
+ val_type = "val" if args.year in '2017' else "minival"
+ dataset_val.load_coco(args.dataset, val_type, year=args.year, auto_download=args.download)
+ dataset_val.prepare()
+
+ # Image Augmentation
+ # Right/Left flip 50% of the time
+ augmentation = imgaug.augmenters.Fliplr(0.5)
+
+ # *** This training schedule is an example. Update to your needs ***
+
+ # Training - Stage 1
+ print("Training network heads")
+ model.train(dataset_train, dataset_val,
+ learning_rate=config.LEARNING_RATE,
+ epochs=40,
+ layers='heads',
+ augmentation=augmentation)
+
+ # Training - Stage 2
+ # Finetune layers from ResNet stage 4 and up
+ print("Fine tune Resnet stage 4 and up")
+ model.train(dataset_train, dataset_val,
+ learning_rate=config.LEARNING_RATE,
+ epochs=120,
+ layers='4+',
+ augmentation=augmentation)
+
+ # Training - Stage 3
+ # Fine tune all layers
+ print("Fine tune all layers")
+ model.train(dataset_train, dataset_val,
+ learning_rate=config.LEARNING_RATE / 10,
+ epochs=160,
+ layers='all',
+ augmentation=augmentation)
+
+ elif args.command == "evaluate":
+ # Validation dataset
+ dataset_val = CocoDataset()
+ val_type = "val" if args.year in '2017' else "minival"
+ coco = dataset_val.load_coco(args.dataset, val_type, year=args.year, return_coco=True, auto_download=args.download)
+ dataset_val.prepare()
+ print("Running COCO evaluation on {} images.".format(args.limit))
+ evaluate_coco(model, dataset_val, coco, "bbox", limit=int(args.limit))
+ else:
+ print("'{}' is not recognized. "
+ "Use 'train' or 'evaluate'".format(args.command))
diff --git a/mask_rcnn/tf_servable/config.py b/mask_rcnn/tf_servable/config.py
new file mode 100644
index 00000000..90286026
--- /dev/null
+++ b/mask_rcnn/tf_servable/config.py
@@ -0,0 +1,67 @@
+import numpy as np
+
+
+class mask_config():
+ def __init__(self, NUMBER_OF_CLASSES):
+        self.NUM_CLASSES = 1 + NUMBER_OF_CLASSES  # Background + tags
+        self.NAME = None  # Override in sub-classes
+        self.GPU_COUNT = 1
+        self.IMAGES_PER_GPU = 1
+        self.STEPS_PER_EPOCH = 1000
+ self.VALIDATION_STEPS = 50
+ self.BACKBONE = "resnet101"
+ self.COMPUTE_BACKBONE_SHAPE = None
+ self.BACKBONE_STRIDES = [4, 8, 16, 32, 64]
+ self.FPN_CLASSIF_FC_LAYERS_SIZE = 1024
+ self.TOP_DOWN_PYRAMID_SIZE = 256
+ self.RPN_ANCHOR_SCALES = (32, 64, 128, 256, 512)
+ self.RPN_ANCHOR_RATIOS = [0.5, 1, 2]
+ self.RPN_ANCHOR_STRIDE = 1
+ self.RPN_NMS_THRESHOLD = 0.7
+ self.RPN_TRAIN_ANCHORS_PER_IMAGE = 256
+ self.POST_NMS_ROIS_TRAINING = 2000
+ self.POST_NMS_ROIS_INFERENCE = 1000
+ self.USE_MINI_MASK = True
+ self.MINI_MASK_SHAPE = (56, 56) # (height, width) of the mini-mask
+ self.IMAGE_RESIZE_MODE = "square"
+ self.IMAGE_MIN_DIM = 800
+ self.IMAGE_MAX_DIM = 1024
+ self.IMAGE_MIN_SCALE = 0
+ self.MEAN_PIXEL = np.array([123.7, 116.8, 103.9])
+ self.TRAIN_ROIS_PER_IMAGE = 200
+ self.ROI_POSITIVE_RATIO = 0.33
+ self.POOL_SIZE = 7
+ self.MASK_POOL_SIZE = 14
+ self.MASK_SHAPE = [28, 28]
+ self.MAX_GT_INSTANCES = 100
+ self.RPN_BBOX_STD_DEV = np.array([0.1, 0.1, 0.2, 0.2])
+ self.BBOX_STD_DEV = np.array([0.1, 0.1, 0.2, 0.2])
+ self.DETECTION_MAX_INSTANCES = 100
+ self.DETECTION_NMS_THRESHOLD = 0.3
+ self.LEARNING_RATE = 0.001
+ self.LEARNING_MOMENTUM = 0.9
+ self.WEIGHT_DECAY = 0.0001
+ self.LOSS_WEIGHTS = {"rpn_class_loss": 1., "rpn_bbox_loss": 1., "mrcnn_class_loss": 1., "mrcnn_bbox_loss": 1.,
+ "mrcnn_mask_loss": 1.}
+ self.USE_RPN_ROIS = True
+ self.TRAIN_BN = False # Defaulting to False since batch size is often small
+ self.GRADIENT_CLIP_NORM = 5.0
+
+ self.BATCH_SIZE = self.IMAGES_PER_GPU * self.GPU_COUNT
+
+ # Input image size
+ if self.IMAGE_RESIZE_MODE == "crop":
+ self.IMAGE_SHAPE = np.array([self.IMAGE_MIN_DIM, self.IMAGE_MIN_DIM, 3])
+ else:
+ self.IMAGE_SHAPE = np.array([self.IMAGE_MAX_DIM, self.IMAGE_MAX_DIM, 3])
+
+ # Image meta data length
+ # See compose_image_meta() for details
+ self.IMAGE_META_SIZE = 1 + 3 + 3 + 4 + 1 + self.NUM_CLASSES
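+
+
+# Illustrative sketch (not used elsewhere in the project): with the six
+# packaging classes this repo detects, NUM_CLASSES = 1 + 6 = 7 and
+# IMAGE_META_SIZE = 1 + 3 + 3 + 4 + 1 + 7 = 19.
+if __name__ == "__main__":
+    cfg = mask_config(NUMBER_OF_CLASSES=6)
+    print(cfg.NUM_CLASSES)      # 7
+    print(cfg.IMAGE_META_SIZE)  # 19
+    print(cfg.IMAGE_SHAPE)      # [1024 1024 3]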
diff --git a/mask_rcnn/tf_servable/frozen_model/.gitkeep b/mask_rcnn/tf_servable/frozen_model/.gitkeep
new file mode 100644
index 00000000..74c20143
--- /dev/null
+++ b/mask_rcnn/tf_servable/frozen_model/.gitkeep
@@ -0,0 +1 @@
+DUMMY
\ No newline at end of file
diff --git a/mask_rcnn/tf_servable/inferencing/config.py b/mask_rcnn/tf_servable/inferencing/config.py
new file mode 100644
index 00000000..5bffb33d
--- /dev/null
+++ b/mask_rcnn/tf_servable/inferencing/config.py
@@ -0,0 +1,236 @@
+"""
+Mask R-CNN
+Base Configurations class.
+
+Copyright (c) 2017 Matterport, Inc.
+Licensed under the MIT License (see LICENSE for details)
+Written by Waleed Abdulla
+"""
+
+import numpy as np
+
+
+# Base Configuration Class
+# Don't use this class directly. Instead, sub-class it and override
+# the configurations you need to change.
+
+class Config(object):
+ """Base configuration class. For custom configurations, create a
+ sub-class that inherits from this one and override properties
+ that need to be changed.
+ """
+ # Name the configurations. For example, 'COCO', 'Experiment 3', ...etc.
+ # Useful if your code needs to do things differently depending on which
+ # experiment is running.
+ NAME = None # Override in sub-classes
+
+ # NUMBER OF GPUs to use. When using only a CPU, this needs to be set to 1.
+ GPU_COUNT = 1
+
+ # Number of images to train with on each GPU. A 12GB GPU can typically
+ # handle 2 images of 1024x1024px.
+ # Adjust based on your GPU memory and image sizes. Use the highest
+ # number that your GPU can handle for best performance.
+ IMAGES_PER_GPU = 2
+
+ # Number of training steps per epoch
+ # This doesn't need to match the size of the training set. Tensorboard
+ # updates are saved at the end of each epoch, so setting this to a
+ # smaller number means getting more frequent TensorBoard updates.
+ # Validation stats are also calculated at each epoch end and they
+ # might take a while, so don't set this too small to avoid spending
+ # a lot of time on validation stats.
+ STEPS_PER_EPOCH = 1000
+
+ # Number of validation steps to run at the end of every training epoch.
+ # A bigger number improves accuracy of validation stats, but slows
+ # down the training.
+ VALIDATION_STEPS = 50
+
+ # Backbone network architecture
+ # Supported values are: resnet50, resnet101.
+ # You can also provide a callable that should have the signature
+ # of model.resnet_graph. If you do so, you need to supply a callable
+ # to COMPUTE_BACKBONE_SHAPE as well
+ BACKBONE = "resnet101"
+
+ # Only useful if you supply a callable to BACKBONE. Should compute
+ # the shape of each layer of the FPN Pyramid.
+ # See model.compute_backbone_shapes
+ COMPUTE_BACKBONE_SHAPE = None
+
+ # The strides of each layer of the FPN Pyramid. These values
+ # are based on a Resnet101 backbone.
+ BACKBONE_STRIDES = [4, 8, 16, 32, 64]
+
+ # Size of the fully-connected layers in the classification graph
+ FPN_CLASSIF_FC_LAYERS_SIZE = 1024
+
+ # Size of the top-down layers used to build the feature pyramid
+ TOP_DOWN_PYRAMID_SIZE = 256
+
+ # Number of classification classes (including background)
+ NUM_CLASSES = 1 # Override in sub-classes
+
+ # Length of square anchor side in pixels
+ RPN_ANCHOR_SCALES = (32, 64, 128, 256, 512)
+
+ # Ratios of anchors at each cell (width/height)
+ # A value of 1 represents a square anchor, and 0.5 is a wide anchor
+ RPN_ANCHOR_RATIOS = [0.5, 1, 2]
+
+ # Anchor stride
+ # If 1 then anchors are created for each cell in the backbone feature map.
+ # If 2, then anchors are created for every other cell, and so on.
+ RPN_ANCHOR_STRIDE = 1
+
+ # Non-max suppression threshold to filter RPN proposals.
+    # You can increase this during training to generate more proposals.
+ RPN_NMS_THRESHOLD = 0.7
+
+ # How many anchors per image to use for RPN training
+ RPN_TRAIN_ANCHORS_PER_IMAGE = 256
+
+ # ROIs kept after tf.nn.top_k and before non-maximum suppression
+ PRE_NMS_LIMIT = 6000
+
+ # ROIs kept after non-maximum suppression (training and inference)
+ POST_NMS_ROIS_TRAINING = 2000
+ POST_NMS_ROIS_INFERENCE = 1000
+
+ # If enabled, resizes instance masks to a smaller size to reduce
+ # memory load. Recommended when using high-resolution images.
+ USE_MINI_MASK = False
+ MINI_MASK_SHAPE = (56, 56) # (height, width) of the mini-mask
+
+ # Input image resizing
+ # Generally, use the "square" resizing mode for training and predicting
+ # and it should work well in most cases. In this mode, images are scaled
+ # up such that the small side is = IMAGE_MIN_DIM, but ensuring that the
+ # scaling doesn't make the long side > IMAGE_MAX_DIM. Then the image is
+ # padded with zeros to make it a square so multiple images can be put
+ # in one batch.
+ # Available resizing modes:
+ # none: No resizing or padding. Return the image unchanged.
+ # square: Resize and pad with zeros to get a square image
+ # of size [max_dim, max_dim].
+ # pad64: Pads width and height with zeros to make them multiples of 64.
+ # If IMAGE_MIN_DIM or IMAGE_MIN_SCALE are not None, then it scales
+ # up before padding. IMAGE_MAX_DIM is ignored in this mode.
+ # The multiple of 64 is needed to ensure smooth scaling of feature
+ # maps up and down the 6 levels of the FPN pyramid (2**6=64).
+ # crop: Picks random crops from the image. First, scales the image based
+ # on IMAGE_MIN_DIM and IMAGE_MIN_SCALE, then picks a random crop of
+ # size IMAGE_MIN_DIM x IMAGE_MIN_DIM. Can be used in training only.
+ # IMAGE_MAX_DIM is not used in this mode.
+ IMAGE_RESIZE_MODE = "square"
+ IMAGE_MIN_DIM = 800
+ IMAGE_MAX_DIM = 1024
+    # Minimum scaling ratio. Checked after IMAGE_MIN_DIM and can force further
+    # up scaling. For example, if set to 2 then images are scaled up to double
+    # the width and height, or more, even if IMAGE_MIN_DIM doesn't require it.
+ # However, in 'square' mode, it can be overruled by IMAGE_MAX_DIM.
+ IMAGE_MIN_SCALE = 0
+ # Number of color channels per image. RGB = 3, grayscale = 1, RGB-D = 4
+ # Changing this requires other changes in the code. See the WIKI for more
+ # details: https://github.com/matterport/Mask_RCNN/wiki
+ IMAGE_CHANNEL_COUNT = 3
+
+ # Image mean (RGB)
+ MEAN_PIXEL = np.array([123.7, 116.8, 103.9])
+
+ # Number of ROIs per image to feed to classifier/mask heads
+ # The Mask RCNN paper uses 512 but often the RPN doesn't generate
+ # enough positive proposals to fill this and keep a positive:negative
+ # ratio of 1:3. You can increase the number of proposals by adjusting
+ # the RPN NMS threshold.
+ TRAIN_ROIS_PER_IMAGE = 200
+
+ # Percent of positive ROIs used to train classifier/mask heads
+ ROI_POSITIVE_RATIO = 0.33
+
+ # Pooled ROIs
+ POOL_SIZE = 7
+ MASK_POOL_SIZE = 14
+
+ # Shape of output mask
+ # To change this you also need to change the neural network mask branch
+ MASK_SHAPE = [28, 28]
+
+ # Maximum number of ground truth instances to use in one image
+ MAX_GT_INSTANCES = 100
+
+ # Bounding box refinement standard deviation for RPN and final detections.
+ RPN_BBOX_STD_DEV = np.array([0.1, 0.1, 0.2, 0.2])
+ BBOX_STD_DEV = np.array([0.1, 0.1, 0.2, 0.2])
+
+ # Max number of final detections
+ DETECTION_MAX_INSTANCES = 100
+
+ # Minimum probability value to accept a detected instance
+ # ROIs below this threshold are skipped
+ DETECTION_MIN_CONFIDENCE = 0.7
+
+ # Non-maximum suppression threshold for detection
+ DETECTION_NMS_THRESHOLD = 0.3
+
+ # Learning rate and momentum
+ # The Mask RCNN paper uses lr=0.02, but on TensorFlow it causes
+ # weights to explode. Likely due to differences in optimizer
+ # implementation.
+ LEARNING_RATE = 0.001
+ LEARNING_MOMENTUM = 0.9
+
+ # Weight decay regularization
+ WEIGHT_DECAY = 0.0001
+
+ # Loss weights for more precise optimization.
+ # Can be used for R-CNN training setup.
+ LOSS_WEIGHTS = {
+ "rpn_class_loss": 1.,
+ "rpn_bbox_loss": 1.,
+ "mrcnn_class_loss": 1.,
+ "mrcnn_bbox_loss": 1.,
+ "mrcnn_mask_loss": 1.
+ }
+
+ # Use RPN ROIs or externally generated ROIs for training
+ # Keep this True for most situations. Set to False if you want to train
+ # the head branches on ROI generated by code rather than the ROIs from
+ # the RPN. For example, to debug the classifier head without having to
+ # train the RPN.
+ USE_RPN_ROIS = True
+
+ # Train or freeze batch normalization layers
+ # None: Train BN layers. This is the normal mode
+ # False: Freeze BN layers. Good when using a small batch size
+ # True: (don't use). Set layer in training mode even when predicting
+ TRAIN_BN = False # Defaulting to False since batch size is often small
+
+ # Gradient norm clipping
+ GRADIENT_CLIP_NORM = 5.0
+
+ def __init__(self):
+ """Set values of computed attributes."""
+ # Effective batch size
+ self.BATCH_SIZE = self.IMAGES_PER_GPU * self.GPU_COUNT
+
+ # Input image size
+ if self.IMAGE_RESIZE_MODE == "crop":
+ self.IMAGE_SHAPE = np.array([self.IMAGE_MIN_DIM, self.IMAGE_MIN_DIM,
+ self.IMAGE_CHANNEL_COUNT])
+ else:
+ self.IMAGE_SHAPE = np.array([self.IMAGE_MAX_DIM, self.IMAGE_MAX_DIM,
+ self.IMAGE_CHANNEL_COUNT])
+
+ # Image meta data length
+ # See compose_image_meta() for details
+ self.IMAGE_META_SIZE = 1 + 3 + 3 + 4 + 1 + self.NUM_CLASSES
+
+ def display(self):
+ """Display Configuration values."""
+ print("\nConfigurations:")
+ for a in dir(self):
+ if not a.startswith("__") and not callable(getattr(self, a)):
+ print("{:30} {}".format(a, getattr(self, a)))
+ print("\n")
diff --git a/mask_rcnn/tf_servable/inferencing/saved_model_config.py b/mask_rcnn/tf_servable/inferencing/saved_model_config.py
new file mode 100644
index 00000000..e8b9caa7
--- /dev/null
+++ b/mask_rcnn/tf_servable/inferencing/saved_model_config.py
@@ -0,0 +1,50 @@
+# Your inference config class.
+# Replace this with your own config, e.g.:
+# MY_INFERENCE_CONFIG = YOUR_CONFIG_CLASS
+# import coco
+# class InferenceConfig(coco.CocoConfig):
+# GPU_COUNT = 1
+# IMAGES_PER_GPU = 1
+# coco_config = InferenceConfig()
+import config
+class PPConfig(config.Config):
+ """Configuration for training on the toy dataset.
+ Derives from the base Config class and overrides some values.
+ """
+ # Give the configuration a recognizable name
+ NAME = "pointless_package"
+
+    # Run inference on one image at a time
+    GPU_COUNT = 1
+    IMAGES_PER_GPU = 1
+
+    # Number of classes (background + the 6 packaging classes). This must match
+    # the class count the servable model was exported with; 1 + 6 assumes the
+    # CLASS_NAMES list used in saved_model_inference.py.
+    NUM_CLASSES = 1 + 6
+
+    # Skip detections with < 75% confidence
+    DETECTION_MIN_CONFIDENCE = 0.75
+
+MY_INFERENCE_CONFIG = PPConfig()
+
+
+# Tensorflow Model server variable
+ADDRESS = 'localhost'
+PORT_NO_GRPC = 8500
+PORT_NO_RESTAPI = 8501
+MODEL_NAME = 'mask'
+REST_API_URL = "http://%s:%s/v1/models/%s:predict" % (ADDRESS, PORT_NO_RESTAPI, MODEL_NAME)
+
+
+# TF variable name
+OUTPUT_DETECTION = 'mrcnn_detection/Reshape_1'
+OUTPUT_CLASS = 'mrcnn_class/Reshape_1'
+OUTPUT_BBOX = 'mrcnn_bbox/Reshape'
+OUTPUT_MASK = 'mrcnn_mask/Reshape_1'
+INPUT_IMAGE = 'input_image'
+INPUT_IMAGE_META = 'input_image_meta'
+INPUT_ANCHORS = 'input_anchors'
+OUTPUT_NAME = 'predict_images'
+
+
+# Signature name
+SIGNATURE_NAME = 'serving_default'
+
+# GRPC config
+GRPC_MAX_RECEIVE_MESSAGE_LENGTH = 4096 * 4096 * 3  # Maximum message size (bytes) the gRPC channel will accept
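+
+# With the defaults above, REST_API_URL resolves to
+# "http://localhost:8501/v1/models/mask:predict".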
diff --git a/mask_rcnn/tf_servable/inferencing/saved_model_inference.py b/mask_rcnn/tf_servable/inferencing/saved_model_inference.py
new file mode 100644
index 00000000..ffd9988c
--- /dev/null
+++ b/mask_rcnn/tf_servable/inferencing/saved_model_inference.py
@@ -0,0 +1,138 @@
+import cv2
+import grpc
+from tensorflow_serving.apis import prediction_service_pb2_grpc
+from tensorflow_serving.apis import predict_pb2
+import numpy as np
+import tensorflow as tf
+import saved_model_config
+from saved_model_preprocess import ForwardModel
+import requests
+import json
+import visualize
+
+host = saved_model_config.ADDRESS
+PORT_GRPC = saved_model_config.PORT_NO_GRPC
+RESTAPI_URL = saved_model_config.REST_API_URL
+
+channel = grpc.insecure_channel(str(host) + ':' + str(PORT_GRPC), options=[('grpc.max_receive_message_length', saved_model_config.GRPC_MAX_RECEIVE_MESSAGE_LENGTH)])
+
+stub = prediction_service_pb2_grpc.PredictionServiceStub(channel)
+
+
+request = predict_pb2.PredictRequest()
+request.model_spec.name = saved_model_config.MODEL_NAME
+request.model_spec.signature_name = saved_model_config.SIGNATURE_NAME
+
+model_config = saved_model_config.MY_INFERENCE_CONFIG
+preprocess_obj = ForwardModel(model_config)
+
+
+def detect_mask_single_image_using_grpc(image):
+ images = np.expand_dims(image, axis=0)
+ molded_images, image_metas, windows = preprocess_obj.mold_inputs(images)
+ molded_images = molded_images.astype(np.float32)
+ image_metas = image_metas.astype(np.float32)
+ # Validate image sizes
+ # All images in a batch MUST be of the same size
+ image_shape = molded_images[0].shape
+ for g in molded_images[1:]:
+ assert g.shape == image_shape, \
+ "After resizing, all images must have the same size. Check IMAGE_RESIZE_MODE and image sizes."
+
+ # Anchors
+ anchors = preprocess_obj.get_anchors(image_shape)
+ anchors = np.broadcast_to(anchors, (images.shape[0],) + anchors.shape)
+
+ request.inputs[saved_model_config.INPUT_IMAGE].CopyFrom(
+ tf.contrib.util.make_tensor_proto(molded_images, shape=molded_images.shape))
+ request.inputs[saved_model_config.INPUT_IMAGE_META].CopyFrom(
+ tf.contrib.util.make_tensor_proto(image_metas, shape=image_metas.shape))
+ request.inputs[saved_model_config.INPUT_ANCHORS].CopyFrom(
+ tf.contrib.util.make_tensor_proto(anchors, shape=anchors.shape))
+
+ result = stub.Predict(request, 60.)
+ result_dict = preprocess_obj.result_to_dict(images, molded_images, windows, result)[0]
+ return result_dict
+
+
+def detect_mask_single_image_using_restapi(image):
+ images = np.expand_dims(image, axis=0)
+ molded_images, image_metas, windows = preprocess_obj.mold_inputs(images)
+
+ molded_images = molded_images.astype(np.float32)
+
+ image_shape = molded_images[0].shape
+
+ for g in molded_images[1:]:
+ assert g.shape == image_shape, \
+ "After resizing, all images must have the same size. Check IMAGE_RESIZE_MODE and image sizes."
+
+ anchors = preprocess_obj.get_anchors(image_shape)
+ anchors = np.broadcast_to(anchors, (images.shape[0],) + anchors.shape)
+
+ # response body format row wise.
+ data = {'signature_name': saved_model_config.SIGNATURE_NAME,
+ 'instances': [{saved_model_config.INPUT_IMAGE: molded_images[0].tolist(),
+ saved_model_config.INPUT_IMAGE_META: image_metas[0].tolist(),
+ saved_model_config.INPUT_ANCHORS: anchors[0].tolist()}]}
+
+ response = requests.post(RESTAPI_URL, data=json.dumps(data), headers={"content-type":"application/json"})
+ result = json.loads(response.text)
+ result = result['predictions'][0]
+
+ result_dict = preprocess_obj.result_to_dict(images, molded_images, windows, result, is_restapi=True)[0]
+ return result_dict
+
+
+if __name__ == '__main__':
+ import argparse
+ import os
+ parser = argparse.ArgumentParser()
+ parser.add_argument('-p', '--path', help='Path to Image', required=True)
+ parser.add_argument('-t', '--type', help='Type of call [restapi, grpc]', default='restapi')
+ args = vars(parser.parse_args())
+ image_path = args['path']
+ call_type = args['type']
+
+ if not os.path.exists(image_path):
+ print(image_path, " -- Does not exist")
+ exit()
+
+    image = cv2.imread(image_path)
+    if image is None:
+        print("Image path is not a readable image")
+        exit()
+    # OpenCV loads images as BGR; the model expects RGB
+    image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+
+ if call_type == 'restapi':
+ result = detect_mask_single_image_using_restapi(image)
+ else:
+ result = detect_mask_single_image_using_grpc(image)
+
+ print(result)
+ r = result
+
+ N = r['rois'].shape[0]
+ class_ids = r['class']
+ masks = r['mask']
+
+ CLASS_NAMES = ['BG', 'outerbox', 'innerbox', 'item_sq',
+ 'item_rect', 'item_rect_slim', 'item_circ']
+
+ class_names = np.asarray(CLASS_NAMES)
+ ITEM_NAMES = CLASS_NAMES[3:]
+ # area_occupation = [masks[:, :, i].sum() for i in range(N)]
+ area_occupation = masks.sum(axis=0).sum(axis=0)
+ map_items_to_area = list(map(
+ lambda x, y: x+': '+str(y), class_names[class_ids], area_occupation))
+ print("{}: (ITEM: AREA) ->".format('IMAGE'), map_items_to_area, "{}".format(
+ "" if set(ITEM_NAMES) & set(class_names[class_ids]) else "-> NO ITEMS FOUND!"))
+
+ visualize.display_instances(image, r['rois'], r['mask'], r['class'],
+ CLASS_NAMES, r['scores'],
+ title="Predictions")
+
+ print("*" * 60)
+ print("RESULTS:")
+ print(result)
+ print("*" * 60)
diff --git a/mask_rcnn/tf_servable/inferencing/saved_model_preprocess.py b/mask_rcnn/tf_servable/inferencing/saved_model_preprocess.py
new file mode 100644
index 00000000..d43ddfb5
--- /dev/null
+++ b/mask_rcnn/tf_servable/inferencing/saved_model_preprocess.py
@@ -0,0 +1,243 @@
+import saved_model_config
+import saved_model_utils
+import numpy as np
+import math
+
+
+def compose_image_meta(image_id, original_image_shape, image_shape,
+ window, scale, active_class_ids):
+ """Takes attributes of an image and puts them in one 1D array.
+ image_id: An int ID of the image. Useful for debugging.
+ original_image_shape: [H, W, C] before resizing or padding.
+ image_shape: [H, W, C] after resizing and padding
+ window: (y1, x1, y2, x2) in pixels. The area of the image where the real
+ image is (excluding the padding)
+ scale: The scaling factor applied to the original image (float32)
+ active_class_ids: List of class_ids available in the dataset from which
+        the image came. Useful if training on images from multiple datasets
+        where not all classes are present in all datasets.
+ """
+ meta = np.array(
+ [image_id] + # size=1
+ list(original_image_shape) + # size=3
+ list(image_shape) + # size=3
+        list(window) +           # size=4 (y1, x1, y2, x2) in image coordinates
+ [scale] + # size=1
+ list(active_class_ids) # size=num_classes
+ )
+ return meta
+
+
+def mold_image(images, config):
+ """Expects an RGB image (or array of images) and subtracts
+ the mean pixel and converts it to float. Expects image
+ colors in RGB order.
+ """
+ return images.astype(np.float32) - config.MEAN_PIXEL
+
+
+def compute_backbone_shapes(config, image_shape):
+ """Computes the width and height of each stage of the backbone network.
+
+ Returns:
+ [N, (height, width)]. Where N is the number of stages
+ """
+ if callable(config.BACKBONE):
+ return config.COMPUTE_BACKBONE_SHAPE(image_shape)
+
+ # Currently supports ResNet only
+ assert config.BACKBONE in ["resnet50", "resnet101"]
+ return np.array(
+ [[int(math.ceil(image_shape[0] / stride)),
+ int(math.ceil(image_shape[1] / stride))]
+ for stride in config.BACKBONE_STRIDES])
+
+
+class ForwardModel:
+ def __init__(self, config):
+ self.config = config
+ self.outputs = {
+ 'detection': 'mrcnn_detection/Reshape_1',
+ 'class': 'mrcnn_class/Reshape_1',
+ 'box': 'mrcnn_bbox/Reshape',
+ 'mask': 'mrcnn_mask/Reshape_1'}
+
+ # self.build_outputs()
+
+ def mold_inputs(self, images):
+ """Takes a list of images and modifies them to the format expected
+ as an input to the neural network.
+ images: List of image matrices [height,width,depth]. Images can have
+ different sizes.
+
+ Returns 3 Numpy matrices:
+ molded_images: [N, h, w, 3]. Images resized and normalized.
+ image_metas: [N, length of meta data]. Details about each image.
+ windows: [N, (y1, x1, y2, x2)]. The portion of the image that has the
+ original image (padding excluded).
+ """
+ molded_images = []
+ image_metas = []
+ windows = []
+ for image in images:
+ # Resize image
+ # TODO: move resizing to mold_image()
+ molded_image, window, scale, padding, crop = saved_model_utils.resize_image(
+ image,
+ min_dim=self.config.IMAGE_MIN_DIM,
+ min_scale=self.config.IMAGE_MIN_SCALE,
+ max_dim=self.config.IMAGE_MAX_DIM,
+ mode=self.config.IMAGE_RESIZE_MODE)
+ molded_image = mold_image(molded_image, self.config)
+ # Build image_meta
+ image_meta = compose_image_meta(
+ 0, image.shape, molded_image.shape, window, scale,
+ np.zeros([self.config.NUM_CLASSES], dtype=np.int32))
+ # Append
+ molded_images.append(molded_image)
+ windows.append(window)
+ image_metas.append(image_meta)
+ # Pack into arrays
+ molded_images = np.stack(molded_images)
+ image_metas = np.stack(image_metas)
+ windows = np.stack(windows)
+ return molded_images, image_metas, windows
+
+ def get_anchors(self, image_shape):
+ """Returns anchor pyramid for the given image size."""
+ backbone_shapes = compute_backbone_shapes(self.config, image_shape)
+ # Cache anchors and reuse if image shape is the same
+ if not hasattr(self, "_anchor_cache"):
+ self._anchor_cache = {}
+        if tuple(image_shape) not in self._anchor_cache:
+ # Generate Anchors
+ a = saved_model_utils.generate_pyramid_anchors(
+ self.config.RPN_ANCHOR_SCALES,
+ self.config.RPN_ANCHOR_RATIOS,
+ backbone_shapes,
+ self.config.BACKBONE_STRIDES,
+ self.config.RPN_ANCHOR_STRIDE)
+ # Keep a copy of the latest anchors in pixel coordinates because
+ # it's used in inspect_model notebooks.
+            # TODO: Remove this after the notebooks are refactored to not use it
+ self.anchors = a
+ # Normalize coordinates
+ self._anchor_cache[tuple(image_shape)] = saved_model_utils.norm_boxes(a, image_shape[:2])
+ return self._anchor_cache[tuple(image_shape)]
+
+ def unmold_detections(self, detections, mrcnn_mask, original_image_shape,
+ image_shape, window):
+ """Reformats the detections of one image from the format of the neural
+ network output to a format suitable for use in the rest of the
+ application.
+
+ detections: [N, (y1, x1, y2, x2, class_id, score)] in normalized coordinates
+ mrcnn_mask: [N, height, width, num_classes]
+ original_image_shape: [H, W, C] Original image shape before resizing
+ image_shape: [H, W, C] Shape of the image after resizing and padding
+ window: [y1, x1, y2, x2] Pixel coordinates of box in the image where the real
+ image is excluding the padding.
+
+ Returns:
+ boxes: [N, (y1, x1, y2, x2)] Bounding boxes in pixels
+ class_ids: [N] Integer class IDs for each bounding box
+ scores: [N] Float probability scores of the class_id
+ masks: [height, width, num_instances] Instance masks
+ """
+ # How many detections do we have?
+ # Detections array is padded with zeros. Find the first class_id == 0.
+ zero_ix = np.where(detections[:, 4] == 0)[0]
+ N = zero_ix[0] if zero_ix.shape[0] > 0 else detections.shape[0]
+
+ # Extract boxes, class_ids, scores, and class-specific masks
+ boxes = detections[:N, :4]
+ class_ids = detections[:N, 4].astype(np.int32)
+ scores = detections[:N, 5]
+ masks = mrcnn_mask[np.arange(N), :, :, class_ids]
+
+ # Translate normalized coordinates in the resized image to pixel
+ # coordinates in the original image before resizing
+ window = saved_model_utils.norm_boxes(window, image_shape[:2])
+ wy1, wx1, wy2, wx2 = window
+ shift = np.array([wy1, wx1, wy1, wx1])
+ wh = wy2 - wy1 # window height
+ ww = wx2 - wx1 # window width
+ scale = np.array([wh, ww, wh, ww])
+ # Convert boxes to normalized coordinates on the window
+ boxes = np.divide(boxes - shift, scale)
+ # Convert boxes to pixel coordinates on the original image
+ boxes = saved_model_utils.denorm_boxes(boxes, original_image_shape[:2])
+
+ # Filter out detections with zero area. Happens in early training when
+ # network weights are still random
+ exclude_ix = np.where(
+ (boxes[:, 2] - boxes[:, 0]) * (boxes[:, 3] - boxes[:, 1]) <= 0)[0]
+ if exclude_ix.shape[0] > 0:
+ boxes = np.delete(boxes, exclude_ix, axis=0)
+ class_ids = np.delete(class_ids, exclude_ix, axis=0)
+ scores = np.delete(scores, exclude_ix, axis=0)
+ masks = np.delete(masks, exclude_ix, axis=0)
+ N = class_ids.shape[0]
+
+ # Resize masks to original image size and set boundary threshold.
+ full_masks = []
+ for i in range(N):
+ # Convert neural network mask to full size mask
+ full_mask = saved_model_utils.unmold_mask(masks[i], boxes[i], original_image_shape)
+ full_masks.append(full_mask)
+ full_masks = np.stack(full_masks, axis=-1)\
+ if full_masks else np.empty(original_image_shape[:2] + (0,))
+
+ return boxes, class_ids, scores, full_masks
+
+ def format_output(self, result_dict):
+ mask_shape = result_dict.outputs[saved_model_config.OUTPUT_MASK].tensor_shape.dim
+ mask_shape = tuple(d.size for d in mask_shape)
+ mask = np.array(result_dict.outputs[saved_model_config.OUTPUT_MASK].float_val)
+ mask = np.reshape(mask, mask_shape)
+
+ detection_shape = result_dict.outputs[saved_model_config.OUTPUT_DETECTION].tensor_shape.dim
+ detection_shape = tuple(d.size for d in detection_shape)
+ detection = np.array(result_dict.outputs[saved_model_config.OUTPUT_DETECTION].float_val)
+ detection = np.reshape(detection, detection_shape)
+
+ result_dict = {'detection': detection, 'mask': mask}
+
+ return result_dict
+
+ def format_restapi_output(self, result_dict):
+ mask = result_dict[saved_model_config.OUTPUT_MASK]
+ mask = np.array(mask)
+ mask = np.expand_dims(mask, axis=0)
+
+ detection = result_dict[saved_model_config.OUTPUT_DETECTION]
+ detection = np.array(detection)
+ detection = np.expand_dims(detection, axis=0)
+
+ result_dict = {'detection': detection, 'mask': mask}
+ return result_dict
+
+ def result_to_dict(self, images, molded_images, windows, result_dict, is_restapi=False):
+ if is_restapi:
+ result_dict = self.format_restapi_output(result_dict)
+ else:
+ result_dict = self.format_output(result_dict)
+ results = []
+ for i, image in enumerate(images):
+ # print('detection len',len(result_dict['detection']))
+ # print('mask len ',len(result_dict['mask']))
+ final_rois, final_class_ids, final_scores, final_masks = \
+ self.unmold_detections(result_dict['detection'][i], result_dict['mask'][i],
+ image.shape, molded_images[i].shape,
+ windows[i])
+ results.append({
+ "rois": final_rois,
+ "class": final_class_ids,
+ "scores": final_scores,
+ "mask": final_masks,
+ })
+ # print('rois:', final_rois.shape)
+ # print('class:', final_class_ids.shape)
+ # print('scores:', final_scores.shape)
+            # print('final mask shape:', final_masks.shape)
+ return results
\ No newline at end of file
diff --git a/mask_rcnn/tf_servable/inferencing/saved_model_utils.py b/mask_rcnn/tf_servable/inferencing/saved_model_utils.py
new file mode 100644
index 00000000..a6823fea
--- /dev/null
+++ b/mask_rcnn/tf_servable/inferencing/saved_model_utils.py
@@ -0,0 +1,879 @@
+import random
+import cv2
+import numpy as np
+import tensorflow as tf
+import scipy
+import skimage.color
+import skimage.transform
+import urllib.request
+import shutil
+import warnings
+
+
+COCO_MODEL_URL = "https://github.com/matterport/Mask_RCNN/releases/download/v2.0/mask_rcnn_coco.h5"
+
+
+############################################################
+# Bounding Boxes
+############################################################
+
+def extract_bboxes(mask):
+ """Compute bounding boxes from masks.
+ mask: [height, width, num_instances]. Mask pixels are either 1 or 0.
+
+ Returns: bbox array [num_instances, (y1, x1, y2, x2)].
+ """
+ boxes = np.zeros([mask.shape[-1], 4], dtype=np.int32)
+ for i in range(mask.shape[-1]):
+ m = mask[:, :, i]
+ # Bounding box.
+        horizontal_indices = np.where(np.any(m, axis=0))[0]
+        vertical_indices = np.where(np.any(m, axis=1))[0]
+        if horizontal_indices.shape[0]:
+            x1, x2 = horizontal_indices[[0, -1]]
+            y1, y2 = vertical_indices[[0, -1]]
+ # x2 and y2 should not be part of the box. Increment by 1.
+ x2 += 1
+ y2 += 1
+ else:
+ # No mask for this instance. Might happen due to
+ # resizing or cropping. Set bbox to zeros
+ x1, x2, y1, y2 = 0, 0, 0, 0
+ boxes[i] = np.array([y1, x1, y2, x2])
+ return boxes.astype(np.int32)
+
+
+def compute_iou(box, boxes, box_area, boxes_area):
+ """Calculates IoU of the given box with the array of the given boxes.
+ box: 1D vector [y1, x1, y2, x2]
+ boxes: [boxes_count, (y1, x1, y2, x2)]
+ box_area: float. the area of 'box'
+ boxes_area: array of length boxes_count.
+
+ Note: the areas are passed in rather than calculated here for
+ efficiency. Calculate once in the caller to avoid duplicate work.
+ """
+ # Calculate intersection areas
+ y1 = np.maximum(box[0], boxes[:, 0])
+ y2 = np.minimum(box[2], boxes[:, 2])
+ x1 = np.maximum(box[1], boxes[:, 1])
+ x2 = np.minimum(box[3], boxes[:, 3])
+ intersection = np.maximum(x2 - x1, 0) * np.maximum(y2 - y1, 0)
+ union = box_area + boxes_area[:] - intersection[:]
+ iou = intersection / union
+ return iou
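+
+# Worked example: box = [0, 0, 10, 10] against boxes = [[5, 5, 15, 15]] gives an
+# intersection of 5 * 5 = 25 and a union of 100 + 100 - 25 = 175, so IoU ~= 0.143.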
+
+
+def compute_overlaps(boxes1, boxes2):
+ """Computes IoU overlaps between two sets of boxes.
+ boxes1, boxes2: [N, (y1, x1, y2, x2)].
+
+ For better performance, pass the largest set first and the smaller second.
+ """
+ # Areas of anchors and GT boxes
+ area1 = (boxes1[:, 2] - boxes1[:, 0]) * (boxes1[:, 3] - boxes1[:, 1])
+ area2 = (boxes2[:, 2] - boxes2[:, 0]) * (boxes2[:, 3] - boxes2[:, 1])
+
+ # Compute overlaps to generate matrix [boxes1 count, boxes2 count]
+ # Each cell contains the IoU value.
+ overlaps = np.zeros((boxes1.shape[0], boxes2.shape[0]))
+ for i in range(overlaps.shape[1]):
+ box2 = boxes2[i]
+ overlaps[:, i] = compute_iou(box2, boxes1, area2[i], area1)
+ return overlaps
+
+
+def compute_overlaps_masks(masks1, masks2):
+ """Computes IoU overlaps between two sets of masks.
+ masks1, masks2: [Height, Width, instances]
+ """
+
+ # If either set of masks is empty return empty result
+    if masks1.shape[-1] == 0 or masks2.shape[-1] == 0:
+        return np.zeros((masks1.shape[-1], masks2.shape[-1]))
+ # flatten masks and compute their areas
+ masks1 = np.reshape(masks1 > .5, (-1, masks1.shape[-1])).astype(np.float32)
+ masks2 = np.reshape(masks2 > .5, (-1, masks2.shape[-1])).astype(np.float32)
+ area1 = np.sum(masks1, axis=0)
+ area2 = np.sum(masks2, axis=0)
+
+ # intersections and union
+ intersections = np.dot(masks1.T, masks2)
+ union = area1[:, None] + area2[None, :] - intersections
+ overlaps = intersections / union
+
+ return overlaps
+
+
+def non_max_suppression(boxes, scores, threshold):
+ """Performs non-maximum suppression and returns indices of kept boxes.
+    boxes: [N, (y1, x1, y2, x2)]. Notice that (y2, x2) lies outside the box.
+ scores: 1-D array of box scores.
+ threshold: Float. IoU threshold to use for filtering.
+ """
+ assert boxes.shape[0] > 0
+ if boxes.dtype.kind != "f":
+ boxes = boxes.astype(np.float32)
+
+ # Compute box areas
+ y1 = boxes[:, 0]
+ x1 = boxes[:, 1]
+ y2 = boxes[:, 2]
+ x2 = boxes[:, 3]
+ area = (y2 - y1) * (x2 - x1)
+
+    # Get indices of boxes sorted by scores (highest first)
+ ixs = scores.argsort()[::-1]
+
+ pick = []
+ while len(ixs) > 0:
+ # Pick top box and add its index to the list
+ i = ixs[0]
+ pick.append(i)
+ # Compute IoU of the picked box with the rest
+ iou = compute_iou(boxes[i], boxes[ixs[1:]], area[i], area[ixs[1:]])
+ # Identify boxes with IoU over the threshold. This
+ # returns indices into ixs[1:], so add 1 to get
+ # indices into ixs.
+ remove_ixs = np.where(iou > threshold)[0] + 1
+ # Remove indices of the picked and overlapped boxes.
+ ixs = np.delete(ixs, remove_ixs)
+ ixs = np.delete(ixs, 0)
+ return np.array(pick, dtype=np.int32)
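+
+# Example: with two fully overlapping boxes scored [0.9, 0.8] and threshold 0.5,
+# their IoU of 1.0 exceeds the threshold, so only the higher-scoring box's index
+# is returned.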
+
+
+def apply_box_deltas(boxes, deltas):
+ """Applies the given deltas to the given boxes.
+ boxes: [N, (y1, x1, y2, x2)]. Note that (y2, x2) is outside the box.
+ deltas: [N, (dy, dx, log(dh), log(dw))]
+ """
+ boxes = boxes.astype(np.float32)
+ # Convert to y, x, h, w
+ height = boxes[:, 2] - boxes[:, 0]
+ width = boxes[:, 3] - boxes[:, 1]
+ center_y = boxes[:, 0] + 0.5 * height
+ center_x = boxes[:, 1] + 0.5 * width
+ # Apply deltas
+ center_y += deltas[:, 0] * height
+ center_x += deltas[:, 1] * width
+ height *= np.exp(deltas[:, 2])
+ width *= np.exp(deltas[:, 3])
+ # Convert back to y1, x1, y2, x2
+ y1 = center_y - 0.5 * height
+ x1 = center_x - 0.5 * width
+ y2 = y1 + height
+ x2 = x1 + width
+ return np.stack([y1, x1, y2, x2], axis=1)
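+
+# Worked example: a box [0, 0, 100, 100] with deltas [0.1, 0.1, 0, 0] keeps its
+# 100x100 size but shifts its center by 10 px in y and x, giving [10, 10, 110, 110].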
+
+
+def box_refinement_graph(box, gt_box):
+ """Compute refinement needed to transform box to gt_box.
+ box and gt_box are [N, (y1, x1, y2, x2)]
+ """
+ box = tf.cast(box, tf.float32)
+ gt_box = tf.cast(gt_box, tf.float32)
+
+ height = box[:, 2] - box[:, 0]
+ width = box[:, 3] - box[:, 1]
+ center_y = box[:, 0] + 0.5 * height
+ center_x = box[:, 1] + 0.5 * width
+
+ gt_height = gt_box[:, 2] - gt_box[:, 0]
+ gt_width = gt_box[:, 3] - gt_box[:, 1]
+ gt_center_y = gt_box[:, 0] + 0.5 * gt_height
+ gt_center_x = gt_box[:, 1] + 0.5 * gt_width
+
+ dy = (gt_center_y - center_y) / height
+ dx = (gt_center_x - center_x) / width
+ dh = tf.log(gt_height / height)
+ dw = tf.log(gt_width / width)
+
+ result = tf.stack([dy, dx, dh, dw], axis=1)
+ return result
+
+
+def box_refinement(box, gt_box):
+ """Compute refinement needed to transform box to gt_box.
+ box and gt_box are [N, (y1, x1, y2, x2)]. (y2, x2) is
+ assumed to be outside the box.
+ """
+ box = box.astype(np.float32)
+ gt_box = gt_box.astype(np.float32)
+
+ height = box[:, 2] - box[:, 0]
+ width = box[:, 3] - box[:, 1]
+ center_y = box[:, 0] + 0.5 * height
+ center_x = box[:, 1] + 0.5 * width
+
+ gt_height = gt_box[:, 2] - gt_box[:, 0]
+ gt_width = gt_box[:, 3] - gt_box[:, 1]
+ gt_center_y = gt_box[:, 0] + 0.5 * gt_height
+ gt_center_x = gt_box[:, 1] + 0.5 * gt_width
+
+ dy = (gt_center_y - center_y) / height
+ dx = (gt_center_x - center_x) / width
+ dh = np.log(gt_height / height)
+ dw = np.log(gt_width / width)
+
+ return np.stack([dy, dx, dh, dw], axis=1)
+
+
+############################################################
+# Dataset
+############################################################
+
+class Dataset(object):
+ """The base class for dataset classes.
+ To use it, create a new class that adds functions specific to the dataset
+ you want to use. For example:
+
+ class CatsAndDogsDataset(Dataset):
+ def load_cats_and_dogs(self):
+ ...
+ def load_mask(self, image_id):
+ ...
+ def image_reference(self, image_id):
+ ...
+
+ See COCODataset and ShapesDataset as examples.
+ """
+
+ def __init__(self, class_map=None):
+ self._image_ids = []
+ self.image_info = []
+ # Background is always the first class
+ self.class_info = [{"source": "", "id": 0, "name": "BG"}]
+ self.source_class_ids = {}
+
+ def add_class(self, source, class_id, class_name):
+ assert "." not in source, "Source name cannot contain a dot"
+ # Does the class exist already?
+ for info in self.class_info:
+ if info['source'] == source and info["id"] == class_id:
+ # source.class_id combination already available, skip
+ return
+ # Add the class
+ self.class_info.append({
+ "source": source,
+ "id": class_id,
+ "name": class_name,
+ })
+
+ def add_image(self, source, image_id, path, **kwargs):
+ image_info = {
+ "id": image_id,
+ "source": source,
+ "path": path,
+ }
+ image_info.update(kwargs)
+ self.image_info.append(image_info)
+
+ def image_reference(self, image_id):
+ """Return a link to the image in its source Website or details about
+ the image that help looking it up or debugging it.
+
+ Override for your dataset, but pass to this function
+ if you encounter images not in your dataset.
+ """
+ return ""
+
+ def prepare(self, class_map=None):
+ """Prepares the Dataset class for use.
+
+ TODO: class map is not supported yet. When done, it should handle mapping
+ classes from different datasets to the same class ID.
+ """
+
+ def clean_name(name):
+ """Returns a shorter version of object names for cleaner display."""
+ return ",".join(name.split(",")[:1])
+
+ # Build (or rebuild) everything else from the info dicts.
+ self.num_classes = len(self.class_info)
+ self.class_ids = np.arange(self.num_classes)
+ self.class_names = [clean_name(c["name"]) for c in self.class_info]
+ self.num_images = len(self.image_info)
+ self._image_ids = np.arange(self.num_images)
+
+ # Mapping from source class and image IDs to internal IDs
+ self.class_from_source_map = {"{}.{}".format(info['source'], info['id']): id
+ for info, id in zip(self.class_info, self.class_ids)}
+ self.image_from_source_map = {"{}.{}".format(info['source'], info['id']): id
+ for info, id in zip(self.image_info, self.image_ids)}
+
+ # Map sources to class_ids they support
+ self.sources = list(set([i['source'] for i in self.class_info]))
+ self.source_class_ids = {}
+ # Loop over datasets
+ for source in self.sources:
+ self.source_class_ids[source] = []
+ # Find classes that belong to this dataset
+ for i, info in enumerate(self.class_info):
+ # Include BG class in all datasets
+ if i == 0 or source == info['source']:
+ self.source_class_ids[source].append(i)
+
+ def map_source_class_id(self, source_class_id):
+ """Takes a source class ID and returns the int class ID assigned to it.
+
+ For example:
+ dataset.map_source_class_id("coco.12") -> 23
+ """
+ return self.class_from_source_map[source_class_id]
+
+ def get_source_class_id(self, class_id, source):
+ """Map an internal class ID to the corresponding class ID in the source dataset."""
+ info = self.class_info[class_id]
+ assert info['source'] == source
+ return info['id']
+
+ def append_data(self, class_info, image_info):
+ self.external_to_class_id = {}
+ for i, c in enumerate(self.class_info):
+ for ds, id in c["map"]:
+ self.external_to_class_id[ds + str(id)] = i
+
+ # Map external image IDs to internal ones.
+ self.external_to_image_id = {}
+ for i, info in enumerate(self.image_info):
+ self.external_to_image_id[info["ds"] + str(info["id"])] = i
+
+ @property
+ def image_ids(self):
+ return self._image_ids
+
+ def source_image_link(self, image_id):
+ """Returns the path or URL to the image.
+ Override this to return a URL to the image if it's available online for easy
+ debugging.
+ """
+ return self.image_info[image_id]["path"]
+
+ def load_image(self, image_id):
+ """Load the specified image and return a [H,W,3] Numpy array.
+ """
+ # Load image
+ image = cv2.imread(self.image_info[image_id]['path'])
+ # image = skimage.io.imread(self.image_info[image_id]['path'])
+ # If grayscale. Convert to RGB for consistency.
+ if image.ndim != 3:
+ image = skimage.color.gray2rgb(image)
+ # If has an alpha channel, remove it for consistency
+ if image.shape[-1] == 4:
+ image = image[..., :3]
+ return image
+
+ def load_mask(self, image_id):
+ """Load instance masks for the given image.
+
+ Different datasets use different ways to store masks. Override this
+        method to load instance masks and return them in the form of an
+ array of binary masks of shape [height, width, instances].
+
+ Returns:
+ masks: A bool array of shape [height, width, instance count] with
+ a binary mask per instance.
+ class_ids: a 1D array of class IDs of the instance masks.
+ """
+ # Override this function to load a mask from your dataset.
+ # Otherwise, it returns an empty mask.
+ mask = np.empty([0, 0, 0])
+ class_ids = np.empty([0], np.int32)
+ return mask, class_ids
+
+
+def resize_image(image, min_dim=None, max_dim=None, min_scale=None, mode="square"):
+ """Resizes an image keeping the aspect ratio unchanged.
+
+ min_dim: if provided, resizes the image such that it's smaller
+ dimension == min_dim
+ max_dim: if provided, ensures that the image longest side doesn't
+ exceed this value.
+ min_scale: if provided, ensure that the image is scaled up by at least
+ this percent even if min_dim doesn't require it.
+ mode: Resizing mode.
+ none: No resizing. Return the image unchanged.
+ square: Resize and pad with zeros to get a square image
+ of size [max_dim, max_dim].
+ pad64: Pads width and height with zeros to make them multiples of 64.
+ If min_dim or min_scale are provided, it scales the image up
+ before padding. max_dim is ignored in this mode.
+ The multiple of 64 is needed to ensure smooth scaling of feature
+ maps up and down the 6 levels of the FPN pyramid (2**6=64).
+ crop: Picks random crops from the image. First, scales the image based
+ on min_dim and min_scale, then picks a random crop of
+ size min_dim x min_dim. Can be used in training only.
+ max_dim is not used in this mode.
+
+ Returns:
+ image: the resized image
+ window: (y1, x1, y2, x2). If max_dim is provided, padding might
+ be inserted in the returned image. If so, this window is the
+ coordinates of the image part of the full image (excluding
+ the padding). The x2, y2 pixels are not included.
+ scale: The scale factor used to resize the image
+ padding: Padding added to the image [(top, bottom), (left, right), (0, 0)]
+ """
+ # Keep track of image dtype and return results in the same dtype
+ image_dtype = image.dtype
+ # Default window (y1, x1, y2, x2) and default scale == 1.
+ h, w = image.shape[:2]
+ window = (0, 0, h, w)
+ scale = 1
+ padding = [(0, 0), (0, 0), (0, 0)]
+ crop = None
+
+ if mode == "none":
+ return image, window, scale, padding, crop
+
+ # Scale?
+ if min_dim:
+ # Scale up but not down
+ scale = max(1, min_dim / min(h, w))
+ if min_scale and scale < min_scale:
+ scale = min_scale
+
+ # Does it exceed max dim?
+ if max_dim and mode == "square":
+ image_max = max(h, w)
+ if round(image_max * scale) > max_dim:
+ scale = max_dim / image_max
+
+ # Resize image using bilinear interpolation
+ if scale != 1:
+ # image = skimage.transform.resize(
+ # image, (round(h * scale), round(w * scale)),
+ # order=1, mode="constant", preserve_range=True)
+ image = cv2.resize(image, (round(w * scale), round(h * scale)))
+
+ # Need padding or cropping?
+ if mode == "square":
+ # Get new height and width
+ h, w = image.shape[:2]
+ top_pad = (max_dim - h) // 2
+ bottom_pad = max_dim - h - top_pad
+ left_pad = (max_dim - w) // 2
+ right_pad = max_dim - w - left_pad
+ padding = [(top_pad, bottom_pad), (left_pad, right_pad), (0, 0)]
+ image = np.pad(image, padding, mode='constant', constant_values=0)
+ window = (top_pad, left_pad, h + top_pad, w + left_pad)
+ elif mode == "pad64":
+ h, w = image.shape[:2]
+ # Both sides must be divisible by 64
+ assert min_dim % 64 == 0, "Minimum dimension must be a multiple of 64"
+ # Height
+ if h % 64 > 0:
+ max_h = h - (h % 64) + 64
+ top_pad = (max_h - h) // 2
+ bottom_pad = max_h - h - top_pad
+ else:
+ top_pad = bottom_pad = 0
+ # Width
+ if w % 64 > 0:
+ max_w = w - (w % 64) + 64
+ left_pad = (max_w - w) // 2
+ right_pad = max_w - w - left_pad
+ else:
+ left_pad = right_pad = 0
+ padding = [(top_pad, bottom_pad), (left_pad, right_pad), (0, 0)]
+ image = np.pad(image, padding, mode='constant', constant_values=0)
+ window = (top_pad, left_pad, h + top_pad, w + left_pad)
+ elif mode == "crop":
+ # Pick a random crop
+ h, w = image.shape[:2]
+ y = random.randint(0, (h - min_dim))
+ x = random.randint(0, (w - min_dim))
+ crop = (y, x, min_dim, min_dim)
+ image = image[y:y + min_dim, x:x + min_dim]
+ window = (0, 0, min_dim, min_dim)
+ else:
+ raise Exception("Mode {} not supported".format(mode))
+ return image.astype(image_dtype), window, scale, padding, crop
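+
+# Worked example ("square" mode, min_dim=800, max_dim=1024): a 600x800 image is
+# first scaled by 800/600 ~= 1.33, but that would make the long side ~1067 px,
+# so the scale is capped at 1024/800 = 1.28. The 768x1024 result is then padded
+# with 128 px of zeros above and below, and the returned window is (128, 0, 896, 1024).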
+
+
+def resize_mask(mask, scale, padding, crop=None):
+ """Resizes a mask using the given scale and padding.
+ Typically, you get the scale and padding from resize_image() to
+ ensure both, the image and the mask, are resized consistently.
+
+ scale: mask scaling factor
+ padding: Padding to add to the mask in the form
+ [(top, bottom), (left, right), (0, 0)]
+ """
+ # Suppress warning from scipy 0.13.0, the output shape of zoom() is
+ # calculated with round() instead of int()
+ with warnings.catch_warnings():
+ warnings.simplefilter("ignore")
+ mask = scipy.ndimage.zoom(mask, zoom=[scale, scale, 1], order=0)
+ if crop is not None:
+ y, x, h, w = crop
+ mask = mask[y:y + h, x:x + w]
+ else:
+ mask = np.pad(mask, padding, mode='constant', constant_values=0)
+ return mask
+
+
+def minimize_mask(bbox, mask, mini_shape):
+ """Resize masks to a smaller version to reduce memory load.
+ Mini-masks can be resized back to image scale using expand_masks()
+
+ See inspect_data.ipynb notebook for more details.
+ """
+ mini_mask = np.zeros(mini_shape + (mask.shape[-1],), dtype=bool)
+ for i in range(mask.shape[-1]):
+ # Pick slice and cast to bool in case load_mask() returned wrong dtype
+ m = mask[:, :, i].astype(bool)
+ y1, x1, y2, x2 = bbox[i][:4]
+ m = m[y1:y2, x1:x2]
+ if m.size == 0:
+ raise Exception("Invalid bounding box with area of zero")
+ # Resize with bilinear interpolation
+ m = skimage.transform.resize(m, mini_shape, order=1, mode="constant")
+ mini_mask[:, :, i] = np.around(m).astype(np.bool)
+ return mini_mask
+
+
+def expand_mask(bbox, mini_mask, image_shape):
+ """Resizes mini masks back to image size. Reverses the change
+ of minimize_mask().
+
+ See inspect_data.ipynb notebook for more details.
+ """
+ mask = np.zeros(image_shape[:2] + (mini_mask.shape[-1],), dtype=bool)
+ for i in range(mask.shape[-1]):
+ m = mini_mask[:, :, i]
+ y1, x1, y2, x2 = bbox[i][:4]
+ h = y2 - y1
+ w = x2 - x1
+ # Resize with bilinear interpolation
+ m = skimage.transform.resize(m, (h, w), order=1, mode="constant")
+ mask[y1:y2, x1:x2, i] = np.around(m).astype(np.bool)
+ return mask
+
+
+def unmold_mask(mask, bbox, image_shape):
+ """Converts a mask generated by the neural network to a format similar
+ to its original shape.
+ mask: [height, width] of type float. A small, typically 28x28 mask.
+ bbox: [y1, x1, y2, x2]. The box to fit the mask in.
+
+ Returns a binary mask with the same size as the original image.
+ """
+ threshold = 0.5
+ y1, x1, y2, x2 = bbox
+ # mask = skimage.transform.resize(mask, (y2 - y1, x2 - x1), order=1, mode="constant")
+ mask = cv2.resize(mask, (x2 - x1, y2 - y1))
+ mask = np.where(mask >= threshold, 1, 0).astype(np.bool)
+
+ # Put the mask in the right location.
+ full_mask = np.zeros(image_shape[:2], dtype=np.bool)
+ full_mask[y1:y2, x1:x2] = mask
+ return full_mask
+
+
+############################################################
+# Anchors
+############################################################
+
+def generate_anchors(scales, ratios, shape, feature_stride, anchor_stride):
+ """
+ scales: 1D array of anchor sizes in pixels. Example: [32, 64, 128]
+ ratios: 1D array of anchor ratios of width/height. Example: [0.5, 1, 2]
+ shape: [height, width] spatial shape of the feature map over which
+ to generate anchors.
+ feature_stride: Stride of the feature map relative to the image in pixels.
+ anchor_stride: Stride of anchors on the feature map. For example, if the
+ value is 2 then generate anchors for every other feature map pixel.
+ """
+ # Get all combinations of scales and ratios
+ scales, ratios = np.meshgrid(np.array(scales), np.array(ratios))
+ scales = scales.flatten()
+ ratios = ratios.flatten()
+
+ # Enumerate heights and widths from scales and ratios
+ heights = scales / np.sqrt(ratios)
+ widths = scales * np.sqrt(ratios)
+
+ # Enumerate shifts in feature space
+ shifts_y = np.arange(0, shape[0], anchor_stride) * feature_stride
+ shifts_x = np.arange(0, shape[1], anchor_stride) * feature_stride
+ shifts_x, shifts_y = np.meshgrid(shifts_x, shifts_y)
+
+ # Enumerate combinations of shifts, widths, and heights
+ box_widths, box_centers_x = np.meshgrid(widths, shifts_x)
+ box_heights, box_centers_y = np.meshgrid(heights, shifts_y)
+
+ # Reshape to get a list of (y, x) and a list of (h, w)
+ box_centers = np.stack(
+ [box_centers_y, box_centers_x], axis=2).reshape([-1, 2])
+ box_sizes = np.stack([box_heights, box_widths], axis=2).reshape([-1, 2])
+
+ # Convert to corner coordinates (y1, x1, y2, x2)
+ boxes = np.concatenate([box_centers - 0.5 * box_sizes,
+ box_centers + 0.5 * box_sizes], axis=1)
+ return boxes
+
+
+def generate_pyramid_anchors(scales, ratios, feature_shapes, feature_strides,
+ anchor_stride):
+ """Generate anchors at different levels of a feature pyramid. Each scale
+ is associated with a level of the pyramid, but each ratio is used in
+ all levels of the pyramid.
+
+ Returns:
+ anchors: [N, (y1, x1, y2, x2)]. All generated anchors in one array. Sorted
+ with the same order of the given scales. So, anchors of scale[0] come
+ first, then anchors of scale[1], and so on.
+ """
+ # Anchors
+ # [anchor_count, (y1, x1, y2, x2)]
+ anchors = []
+ for i in range(len(scales)):
+ anchors.append(generate_anchors(scales[i], ratios, feature_shapes[i],
+ feature_strides[i], anchor_stride))
+ return np.concatenate(anchors, axis=0)
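+
+# With this project's defaults (five scales, three ratios, anchor stride 1 and
+# 1024x1024 inputs) the pyramid holds 3 * (256^2 + 128^2 + 64^2 + 32^2 + 16^2)
+# = 261,888 anchors.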
+
+
+############################################################
+# Miscellaneous
+############################################################
+
+def trim_zeros(x):
+ """It's common to have tensors larger than the available data and
+ pad with zeros. This function removes rows that are all zeros.
+
+ x: [rows, columns].
+ """
+ assert len(x.shape) == 2
+ return x[~np.all(x == 0, axis=1)]
+
+
+def compute_matches(gt_boxes, gt_class_ids, gt_masks,
+ pred_boxes, pred_class_ids, pred_scores, pred_masks,
+ iou_threshold=0.5, score_threshold=0.0):
+ """Finds matches between prediction and ground truth instances.
+
+ Returns:
+ gt_match: 1-D array. For each GT box it has the index of the matched
+ predicted box.
+ pred_match: 1-D array. For each predicted box, it has the index of
+ the matched ground truth box.
+ overlaps: [pred_boxes, gt_boxes] IoU overlaps.
+ """
+ # Trim zero padding
+ # TODO: cleaner to do zero unpadding upstream
+ gt_boxes = trim_zeros(gt_boxes)
+ gt_masks = gt_masks[..., :gt_boxes.shape[0]]
+ pred_boxes = trim_zeros(pred_boxes)
+ pred_scores = pred_scores[:pred_boxes.shape[0]]
+ # Sort predictions by score from high to low
+ indices = np.argsort(pred_scores)[::-1]
+ pred_boxes = pred_boxes[indices]
+ pred_class_ids = pred_class_ids[indices]
+ pred_scores = pred_scores[indices]
+ pred_masks = pred_masks[..., indices]
+
+ # Compute IoU overlaps [pred_masks, gt_masks]
+ overlaps = compute_overlaps_masks(pred_masks, gt_masks)
+
+ # Loop through predictions and find matching ground truth boxes
+ match_count = 0
+ pred_match = -1 * np.ones([pred_boxes.shape[0]])
+ gt_match = -1 * np.ones([gt_boxes.shape[0]])
+ for i in range(len(pred_boxes)):
+ # Find best matching ground truth box
+ # 1. Sort matches by score
+ sorted_ixs = np.argsort(overlaps[i])[::-1]
+ # 2. Remove low scores
+ low_score_idx = np.where(overlaps[i, sorted_ixs] < score_threshold)[0]
+ if low_score_idx.size > 0:
+ sorted_ixs = sorted_ixs[:low_score_idx[0]]
+ # 3. Find the match
+ for j in sorted_ixs:
+ # If ground truth box is already matched, go to next one
+            if gt_match[j] > -1:
+ continue
+ # If we reach IoU smaller than the threshold, end the loop
+ iou = overlaps[i, j]
+ if iou < iou_threshold:
+ break
+ # Do we have a match?
+ if pred_class_ids[i] == gt_class_ids[j]:
+ match_count += 1
+ gt_match[j] = i
+ pred_match[i] = j
+ break
+
+ return gt_match, pred_match, overlaps
+
+
+def compute_ap(gt_boxes, gt_class_ids, gt_masks,
+ pred_boxes, pred_class_ids, pred_scores, pred_masks,
+ iou_threshold=0.5):
+ """Compute Average Precision at a set IoU threshold (default 0.5).
+
+ Returns:
+ mAP: Mean Average Precision
+ precisions: List of precisions at different class score thresholds.
+ recalls: List of recall values at different class score thresholds.
+ overlaps: [pred_boxes, gt_boxes] IoU overlaps.
+ """
+ # Get matches and overlaps
+ gt_match, pred_match, overlaps = compute_matches(
+ gt_boxes, gt_class_ids, gt_masks,
+ pred_boxes, pred_class_ids, pred_scores, pred_masks,
+ iou_threshold)
+
+ # Compute precision and recall at each prediction box step
+ precisions = np.cumsum(pred_match > -1) / (np.arange(len(pred_match)) + 1)
+ recalls = np.cumsum(pred_match > -1).astype(np.float32) / len(gt_match)
+
+ # Pad with start and end values to simplify the math
+ precisions = np.concatenate([[0], precisions, [0]])
+ recalls = np.concatenate([[0], recalls, [1]])
+
+ # Ensure precision values decrease but don't increase. This way, the
+ # precision value at each recall threshold is the maximum it can be
+ # for all following recall thresholds, as specified by the VOC paper.
+ for i in range(len(precisions) - 2, -1, -1):
+ precisions[i] = np.maximum(precisions[i], precisions[i + 1])
+
+ # Compute mean AP over recall range
+ indices = np.where(recalls[:-1] != recalls[1:])[0] + 1
+ mAP = np.sum((recalls[indices] - recalls[indices - 1]) *
+ precisions[indices])
+
+ return mAP, precisions, recalls, overlaps
+
+
+def compute_ap_range(gt_box, gt_class_id, gt_mask,
+ pred_box, pred_class_id, pred_score, pred_mask,
+ iou_thresholds=None, verbose=1):
+ """Compute AP over a range or IoU thresholds. Default range is 0.5-0.95."""
+ # Default is 0.5 to 0.95 with increments of 0.05
+ iou_thresholds = iou_thresholds or np.arange(0.5, 1.0, 0.05)
+
+ # Compute AP over range of IoU thresholds
+ AP = []
+ for iou_threshold in iou_thresholds:
+ ap, precisions, recalls, overlaps = \
+ compute_ap(gt_box, gt_class_id, gt_mask,
+ pred_box, pred_class_id, pred_score, pred_mask,
+ iou_threshold=iou_threshold)
+ if verbose:
+ print("AP @{:.2f}:\t {:.3f}".format(iou_threshold, ap))
+ AP.append(ap)
+ AP = np.array(AP).mean()
+ if verbose:
+ print("AP @{:.2f}-{:.2f}:\t {:.3f}".format(
+ iou_thresholds[0], iou_thresholds[-1], AP))
+ return AP
+
+
+def compute_recall(pred_boxes, gt_boxes, iou):
+ """Compute the recall at the given IoU threshold. It's an indication
+ of how many GT boxes were found by the given prediction boxes.
+
+ pred_boxes: [N, (y1, x1, y2, x2)] in image coordinates
+ gt_boxes: [N, (y1, x1, y2, x2)] in image coordinates
+ """
+ # Measure overlaps
+ overlaps = compute_overlaps(pred_boxes, gt_boxes)
+ iou_max = np.max(overlaps, axis=1)
+ iou_argmax = np.argmax(overlaps, axis=1)
+ positive_ids = np.where(iou_max >= iou)[0]
+ matched_gt_boxes = iou_argmax[positive_ids]
+
+ recall = len(set(matched_gt_boxes)) / gt_boxes.shape[0]
+ return recall, positive_ids
+
+
+# ## Batch Slicing
+# Some custom layers support a batch size of 1 only, and require a lot of work
+# to support batches greater than 1. This function slices an input tensor
+# across the batch dimension and feeds batches of size 1. Effectively,
+# an easy way to support batches > 1 quickly with little code modification.
+# In the long run, it's more efficient to modify the code to support large
+# batches and get rid of this function. Consider this a temporary solution
+def batch_slice(inputs, graph_fn, batch_size, names=None):
+ """Splits inputs into slices and feeds each slice to a copy of the given
+ computation graph and then combines the results. It allows you to run a
+ graph on a batch of inputs even if the graph is written to support one
+ instance only.
+
+ inputs: list of tensors. All must have the same first dimension length
+ graph_fn: A function that returns a TF tensor that's part of a graph.
+ batch_size: number of slices to divide the data into.
+ names: If provided, assigns names to the resulting tensors.
+ """
+ if not isinstance(inputs, list):
+ inputs = [inputs]
+
+ outputs = []
+ for i in range(batch_size):
+ inputs_slice = [x[i] for x in inputs]
+ output_slice = graph_fn(*inputs_slice)
+ if not isinstance(output_slice, (tuple, list)):
+ output_slice = [output_slice]
+ outputs.append(output_slice)
+ # Change outputs from a list of slices where each is
+ # a list of outputs to a list of outputs and each has
+ # a list of slices
+ outputs = list(zip(*outputs))
+
+ if names is None:
+ names = [None] * len(outputs)
+
+ result = [tf.stack(o, axis=0, name=n)
+ for o, n in zip(outputs, names)]
+ if len(result) == 1:
+ result = result[0]
+
+ return result
+
+
+def download_trained_weights(coco_model_path, verbose=1):
+ """Download COCO trained weights from Releases.
+
+ coco_model_path: local path of COCO trained weights
+ """
+ if verbose > 0:
+ print("Downloading pretrained model to " + coco_model_path + " ...")
+ with urllib.request.urlopen(COCO_MODEL_URL) as resp, open(coco_model_path, 'wb') as out:
+ shutil.copyfileobj(resp, out)
+ if verbose > 0:
+ print("... done downloading pretrained model!")
+
+
+def norm_boxes(boxes, shape):
+ """Converts boxes from pixel coordinates to normalized coordinates.
+ boxes: [N, (y1, x1, y2, x2)] in pixel coordinates
+ shape: [..., (height, width)] in pixels
+
+ Note: In pixel coordinates (y2, x2) is outside the box. But in normalized
+ coordinates it's inside the box.
+
+ Returns:
+ [N, (y1, x1, y2, x2)] in normalized coordinates
+ """
+ h, w = shape
+ scale = np.array([h - 1, w - 1, h - 1, w - 1])
+ shift = np.array([0, 0, 1, 1])
+ return np.divide((boxes - shift), scale).astype(np.float32)
+
+
+def denorm_boxes(boxes, shape):
+ """Converts boxes from normalized coordinates to pixel coordinates.
+ boxes: [N, (y1, x1, y2, x2)] in normalized coordinates
+ shape: [..., (height, width)] in pixels
+
+ Note: In pixel coordinates (y2, x2) is outside the box. But in normalized
+ coordinates it's inside the box.
+
+ Returns:
+ [N, (y1, x1, y2, x2)] in pixel coordinates
+ """
+ h, w = shape
+ scale = np.array([h - 1, w - 1, h - 1, w - 1])
+ shift = np.array([0, 0, 1, 1])
+ return np.around(np.multiply(boxes, scale) + shift).astype(np.int32)
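+
+# Example (illustrative): for a 100x200 image, the full-image pixel box
+# round-trips through the normalized representation.
+#   nb = norm_boxes(np.array([[0, 0, 100, 200]]), (100, 200))  # [[0., 0., 1., 1.]]
+#   denorm_boxes(nb, (100, 200))                               # [[0, 0, 100, 200]]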
diff --git a/mask_rcnn/tf_servable/inferencing/visualize.py b/mask_rcnn/tf_servable/inferencing/visualize.py
new file mode 100644
index 00000000..80e5ef58
--- /dev/null
+++ b/mask_rcnn/tf_servable/inferencing/visualize.py
@@ -0,0 +1,502 @@
+"""
+Mask R-CNN
+Display and Visualization Functions.
+
+Copyright (c) 2017 Matterport, Inc.
+Licensed under the MIT License (see LICENSE for details)
+Written by Waleed Abdulla
+"""
+import warnings
+warnings.filterwarnings('ignore', category=DeprecationWarning)
+warnings.filterwarnings('ignore', category=FutureWarning)
+import os
+import sys
+import random
+import itertools
+import colorsys
+
+import numpy as np
+from skimage.measure import find_contours
+import matplotlib.pyplot as plt
+from matplotlib import patches, lines
+from matplotlib.patches import Polygon
+import IPython.display
+
+# Root directory of the project
+ROOT_DIR = os.path.abspath("../")
+
+# Import Mask RCNN
+sys.path.append(ROOT_DIR) # To find local version of the library
+from mrcnn import utils
+
+
+############################################################
+# Visualization
+############################################################
+
+def display_images(images, titles=None, cols=4, cmap=None, norm=None,
+ interpolation=None):
+ """Display the given set of images, optionally with titles.
+ images: list or array of image tensors in HWC format.
+ titles: optional. A list of titles to display with each image.
+ cols: number of images per row
+ cmap: Optional. Color map to use. For example, "Blues".
+ norm: Optional. A Normalize instance to map values to colors.
+ interpolation: Optional. Image interpolation to use for display.
+ """
+ titles = titles if titles is not None else [""] * len(images)
+ rows = len(images) // cols + 1
+ plt.figure(figsize=(14, 14 * rows // cols))
+ i = 1
+ for image, title in zip(images, titles):
+ plt.subplot(rows, cols, i)
+ plt.title(title, fontsize=9)
+ plt.axis('off')
+ plt.imshow(image.astype(np.uint8), cmap=cmap,
+ norm=norm, interpolation=interpolation)
+ i += 1
+ plt.show()
+
+
+def random_colors(N, bright=True):
+ """
+ Generate random colors.
+ To get visually distinct colors, generate them in HSV space then
+ convert to RGB.
+ """
+ brightness = 1.0 if bright else 0.7
+ hsv = [(i / N, 1, brightness) for i in range(N)]
+ colors = list(map(lambda c: colorsys.hsv_to_rgb(*c), hsv))
+ random.shuffle(colors)
+ return colors
+
+
+def apply_mask(image, mask, color, alpha=0.5):
+ """Apply the given mask to the image.
+ """
+ for c in range(3):
+ image[:, :, c] = np.where(mask == 1,
+ image[:, :, c] *
+ (1 - alpha) + alpha * color[c] * 255,
+ image[:, :, c])
+ return image
+
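+# Example (illustrative): blending a full red mask at alpha=0.5 pushes the red
+# channel of masked pixels to value*(1-0.5) + 0.5*1.0*255.
+#   img = np.zeros((4, 4, 3), dtype=np.float32)
+#   m = np.ones((4, 4), dtype=np.uint8)
+#   apply_mask(img, m, color=(1.0, 0.0, 0.0), alpha=0.5)  # red channel -> 127.5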
+
+def display_instances(image, boxes, masks, class_ids, class_names,
+ scores=None, title="",
+ figsize=(16, 16), ax=None,
+ show_mask=True, show_bbox=True,
+ colors=None, captions=None):
+ """
+ boxes: [num_instance, (y1, x1, y2, x2, class_id)] in image coordinates.
+ masks: [height, width, num_instances]
+ class_ids: [num_instances]
+ class_names: list of class names of the dataset
+ scores: (optional) confidence scores for each box
+ title: (optional) Figure title
+ show_mask, show_bbox: To show masks and bounding boxes or not
+ figsize: (optional) the size of the image
+ colors: (optional) An array of colors to use with each object
+ captions: (optional) A list of strings to use as captions for each object
+ """
+ # Number of instances
+ N = boxes.shape[0]
+ if not N:
+ print("\n*** No instances to display *** \n")
+ else:
+ assert boxes.shape[0] == masks.shape[-1] == class_ids.shape[0]
+
+ # If no axis is passed, create one and automatically call show()
+ auto_show = False
+ if not ax:
+ _, ax = plt.subplots(1, figsize=figsize)
+ auto_show = True
+
+ # Generate random colors
+ colors = colors or random_colors(N)
+
+ # Show area outside image boundaries.
+ height, width = image.shape[:2]
+ ax.set_ylim(height + 10, -10)
+ ax.set_xlim(-10, width + 10)
+ ax.axis('off')
+ ax.set_title(title)
+
+ masked_image = image.astype(np.uint32).copy()
+ for i in range(N):
+ color = colors[i]
+
+ # Bounding box
+ if not np.any(boxes[i]):
+ # Skip this instance. Has no bbox. Likely lost in image cropping.
+ continue
+ y1, x1, y2, x2 = boxes[i]
+ if show_bbox:
+ p = patches.Rectangle((x1, y1), x2 - x1, y2 - y1, linewidth=2,
+ alpha=0.7, linestyle="dashed",
+ edgecolor=color, facecolor='none')
+ ax.add_patch(p)
+
+ # Label
+ if not captions:
+ class_id = class_ids[i]
+ score = scores[i] if scores is not None else None
+ label = class_names[class_id]
+ caption = "{} {:.3f}".format(label, score) if score else label
+ else:
+ caption = captions[i]
+ ax.text(x1, y1 + 8, caption,
+ color='w', size=11, backgroundcolor="none")
+
+ # Mask
+ mask = masks[:, :, i]
+ if show_mask:
+ masked_image = apply_mask(masked_image, mask, color)
+
+ # Mask Polygon
+ # Pad to ensure proper polygons for masks that touch image edges.
+ padded_mask = np.zeros(
+ (mask.shape[0] + 2, mask.shape[1] + 2), dtype=np.uint8)
+ padded_mask[1:-1, 1:-1] = mask
+ contours = find_contours(padded_mask, 0.5)
+ for verts in contours:
+ # Subtract the padding and flip (y, x) to (x, y)
+ verts = np.fliplr(verts) - 1
+ p = Polygon(verts, facecolor="none", edgecolor=color)
+ ax.add_patch(p)
+ ax.imshow(masked_image.astype(np.uint8))
+ if auto_show:
+ plt.show()
+
+
+def display_differences(image,
+ gt_box, gt_class_id, gt_mask,
+ pred_box, pred_class_id, pred_score, pred_mask,
+ class_names, title="", ax=None,
+ show_mask=True, show_box=True,
+ iou_threshold=0.5, score_threshold=0.5):
+ """Display ground truth and prediction instances on the same image."""
+ # Match predictions to ground truth
+ gt_match, pred_match, overlaps = utils.compute_matches(
+ gt_box, gt_class_id, gt_mask,
+ pred_box, pred_class_id, pred_score, pred_mask,
+ iou_threshold=iou_threshold, score_threshold=score_threshold)
+ # Ground truth = green. Predictions = red
+ colors = [(0, 1, 0, .8)] * len(gt_match)\
+ + [(1, 0, 0, 1)] * len(pred_match)
+ # Concatenate GT and predictions
+ class_ids = np.concatenate([gt_class_id, pred_class_id])
+ scores = np.concatenate([np.zeros([len(gt_match)]), pred_score])
+ boxes = np.concatenate([gt_box, pred_box])
+ masks = np.concatenate([gt_mask, pred_mask], axis=-1)
+ # Captions per instance show score/IoU
+ captions = ["" for m in gt_match] + ["{:.2f} / {:.2f}".format(
+ pred_score[i],
+ (overlaps[i, int(pred_match[i])]
+ if pred_match[i] > -1 else overlaps[i].max()))
+ for i in range(len(pred_match))]
+ # Set title if not provided
+ title = title or "Ground Truth and Detections\n GT=green, pred=red, captions: score/IoU"
+ # Display
+ display_instances(
+ image,
+ boxes, masks, class_ids,
+ class_names, scores, ax=ax,
+ show_bbox=show_box, show_mask=show_mask,
+ colors=colors, captions=captions,
+ title=title)
+
+
+def draw_rois(image, rois, refined_rois, mask, class_ids, class_names, limit=10):
+ """
+ rois: [n, (y1, x1, y2, x2)] list of anchors/ROIs in image coordinates.
+ refined_rois: [n, 4] the same anchors but refined to fit objects better.
+ """
+ masked_image = image.copy()
+
+ # Pick random anchors in case there are too many.
+ ids = np.arange(rois.shape[0], dtype=np.int32)
+ ids = np.random.choice(
+ ids, limit, replace=False) if ids.shape[0] > limit else ids
+
+ fig, ax = plt.subplots(1, figsize=(12, 12))
+ if rois.shape[0] > limit:
+ plt.title("Showing {} random ROIs out of {}".format(
+ len(ids), rois.shape[0]))
+ else:
+ plt.title("{} ROIs".format(len(ids)))
+
+ # Show area outside image boundaries.
+ ax.set_ylim(image.shape[0] + 20, -20)
+ ax.set_xlim(-50, image.shape[1] + 20)
+ ax.axis('off')
+
+ for i, id in enumerate(ids):
+ color = np.random.rand(3)
+ class_id = class_ids[id]
+ # ROI
+ y1, x1, y2, x2 = rois[id]
+ p = patches.Rectangle((x1, y1), x2 - x1, y2 - y1, linewidth=2,
+ edgecolor=color if class_id else "gray",
+ facecolor='none', linestyle="dashed")
+ ax.add_patch(p)
+ # Refined ROI
+ if class_id:
+ ry1, rx1, ry2, rx2 = refined_rois[id]
+ p = patches.Rectangle((rx1, ry1), rx2 - rx1, ry2 - ry1, linewidth=2,
+ edgecolor=color, facecolor='none')
+ ax.add_patch(p)
+ # Connect the top-left corners of the anchor and proposal for easy visualization
+ ax.add_line(lines.Line2D([x1, rx1], [y1, ry1], color=color))
+
+ # Label
+ label = class_names[class_id]
+ ax.text(rx1, ry1 + 8, "{}".format(label),
+ color='w', size=11, backgroundcolor="none")
+
+ # Mask
+ m = utils.unmold_mask(mask[id], rois[id]
+ [:4].astype(np.int32), image.shape)
+ masked_image = apply_mask(masked_image, m, color)
+
+ ax.imshow(masked_image)
+
+ # Print stats
+ print("Positive ROIs: ", class_ids[class_ids > 0].shape[0])
+ print("Negative ROIs: ", class_ids[class_ids == 0].shape[0])
+ print("Positive Ratio: {:.2f}".format(
+ class_ids[class_ids > 0].shape[0] / class_ids.shape[0]))
+
+
+# TODO: Replace with matplotlib equivalent?
+def draw_box(image, box, color):
+ """Draw 3-pixel width bounding boxes on the given image array.
+ color: list of 3 int values for RGB.
+ """
+ y1, x1, y2, x2 = box
+ image[y1:y1 + 2, x1:x2] = color
+ image[y2:y2 + 2, x1:x2] = color
+ image[y1:y2, x1:x1 + 2] = color
+ image[y1:y2, x2:x2 + 2] = color
+ return image
+
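+# Note (illustrative): draw_box modifies the image array in place and expects
+# integer pixel coordinates, e.g.
+#   draw_box(image, [10, 10, 50, 80], color=[255, 0, 0])
+# paints red edges along the rectangle spanning y 10-50, x 10-80.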
+
+def display_top_masks(image, mask, class_ids, class_names, limit=4):
+ """Display the given image and the top few class masks."""
+ to_display = []
+ titles = []
+ to_display.append(image)
+ titles.append("H x W={}x{}".format(image.shape[0], image.shape[1]))
+ # Pick top prominent classes in this image
+ unique_class_ids = np.unique(class_ids)
+ mask_area = [np.sum(mask[:, :, np.where(class_ids == i)[0]])
+ for i in unique_class_ids]
+ top_ids = [v[0] for v in sorted(zip(unique_class_ids, mask_area),
+ key=lambda r: r[1], reverse=True) if v[1] > 0]
+ # Generate images and titles
+ for i in range(limit):
+ class_id = top_ids[i] if i < len(top_ids) else -1
+ # Pull masks of instances belonging to the same class.
+ m = mask[:, :, np.where(class_ids == class_id)[0]]
+ m = np.sum(m * np.arange(1, m.shape[-1] + 1), -1)
+ to_display.append(m)
+ titles.append(class_names[class_id] if class_id != -1 else "-")
+ display_images(to_display, titles=titles, cols=limit + 1, cmap="Blues_r")
+
+
+def plot_precision_recall(AP, precisions, recalls):
+ """Draw the precision-recall curve.
+
+ AP: Average precision at IoU >= 0.5
+ precisions: list of precision values
+ recalls: list of recall values
+ """
+ # Plot the Precision-Recall curve
+ _, ax = plt.subplots(1)
+ ax.set_title("Precision-Recall Curve. AP@50 = {:.3f}".format(AP))
+ ax.set_ylim(0, 1.1)
+ ax.set_xlim(0, 1.1)
+ _ = ax.plot(recalls, precisions)
+
+
+def plot_overlaps(gt_class_ids, pred_class_ids, pred_scores,
+ overlaps, class_names, threshold=0.5):
+ """Draw a grid showing how ground truth objects are classified.
+ gt_class_ids: [N] int. Ground truth class IDs
+ pred_class_id: [N] int. Predicted class IDs
+ pred_scores: [N] float. The probability scores of predicted classes
+ overlaps: [pred_boxes, gt_boxes] IoU overlaps of predictions and GT boxes.
+ class_names: list of all class names in the dataset
+ threshold: Float. The prediction probability required to predict a class
+ """
+ gt_class_ids = gt_class_ids[gt_class_ids != 0]
+ pred_class_ids = pred_class_ids[pred_class_ids != 0]
+
+ plt.figure(figsize=(12, 10))
+ plt.imshow(overlaps, interpolation='nearest', cmap=plt.cm.Blues)
+ plt.yticks(np.arange(len(pred_class_ids)),
+ ["{} ({:.2f})".format(class_names[int(id)], pred_scores[i])
+ for i, id in enumerate(pred_class_ids)])
+ plt.xticks(np.arange(len(gt_class_ids)),
+ [class_names[int(id)] for id in gt_class_ids], rotation=90)
+
+ thresh = overlaps.max() / 2.
+ for i, j in itertools.product(range(overlaps.shape[0]),
+ range(overlaps.shape[1])):
+ text = ""
+ if overlaps[i, j] > threshold:
+ text = "match" if gt_class_ids[j] == pred_class_ids[i] else "wrong"
+ color = ("white" if overlaps[i, j] > thresh
+ else "black" if overlaps[i, j] > 0
+ else "grey")
+ plt.text(j, i, "{:.3f}\n{}".format(overlaps[i, j], text),
+ horizontalalignment="center", verticalalignment="center",
+ fontsize=9, color=color)
+
+ plt.tight_layout()
+ plt.xlabel("Ground Truth")
+ plt.ylabel("Predictions")
+
+
+def draw_boxes(image, boxes=None, refined_boxes=None,
+ masks=None, captions=None, visibilities=None,
+ title="", ax=None):
+ """Draw bounding boxes and segmentation masks with different
+ customizations.
+
+ boxes: [N, (y1, x1, y2, x2, class_id)] in image coordinates.
+ refined_boxes: Like boxes, but draw with solid lines to show
+ that they're the result of refining 'boxes'.
+ masks: [N, height, width]
+ captions: List of N titles to display on each box
+ visibilities: (optional) List of values of 0, 1, or 2. Determine how
+ prominent each bounding box should be.
+ title: An optional title to show over the image
+ ax: (optional) Matplotlib axis to draw on.
+ """
+ # Number of boxes
+ assert boxes is not None or refined_boxes is not None
+ N = boxes.shape[0] if boxes is not None else refined_boxes.shape[0]
+
+ # Matplotlib Axis
+ if not ax:
+ _, ax = plt.subplots(1, figsize=(12, 12))
+
+ # Generate random colors
+ colors = random_colors(N)
+
+ # Show area outside image boundaries.
+ margin = image.shape[0] // 10
+ ax.set_ylim(image.shape[0] + margin, -margin)
+ ax.set_xlim(-margin, image.shape[1] + margin)
+ ax.axis('off')
+
+ ax.set_title(title)
+
+ masked_image = image.astype(np.uint32).copy()
+ for i in range(N):
+ # Box visibility
+ visibility = visibilities[i] if visibilities is not None else 1
+ if visibility == 0:
+ color = "gray"
+ style = "dotted"
+ alpha = 0.5
+ elif visibility == 1:
+ color = colors[i]
+ style = "dotted"
+ alpha = 1
+ elif visibility == 2:
+ color = colors[i]
+ style = "solid"
+ alpha = 1
+
+ # Boxes
+ if boxes is not None:
+ if not np.any(boxes[i]):
+ # Skip this instance. Has no bbox. Likely lost in cropping.
+ continue
+ y1, x1, y2, x2 = boxes[i]
+ p = patches.Rectangle((x1, y1), x2 - x1, y2 - y1, linewidth=2,
+ alpha=alpha, linestyle=style,
+ edgecolor=color, facecolor='none')
+ ax.add_patch(p)
+
+ # Refined boxes
+ if refined_boxes is not None and visibility > 0:
+ ry1, rx1, ry2, rx2 = refined_boxes[i].astype(np.int32)
+ p = patches.Rectangle((rx1, ry1), rx2 - rx1, ry2 - ry1, linewidth=2,
+ edgecolor=color, facecolor='none')
+ ax.add_patch(p)
+ # Connect the top-left corners of the anchor and proposal
+ if boxes is not None:
+ ax.add_line(lines.Line2D([x1, rx1], [y1, ry1], color=color))
+
+ # Captions
+ if captions is not None:
+ caption = captions[i]
+ # If there are refined boxes, display captions on them
+ if refined_boxes is not None:
+ y1, x1, y2, x2 = ry1, rx1, ry2, rx2
+ ax.text(x1, y1, caption, size=11, verticalalignment='top',
+ color='w', backgroundcolor="none",
+ bbox={'facecolor': color, 'alpha': 0.5,
+ 'pad': 2, 'edgecolor': 'none'})
+
+ # Masks
+ if masks is not None:
+ mask = masks[:, :, i]
+ masked_image = apply_mask(masked_image, mask, color)
+ # Mask Polygon
+ # Pad to ensure proper polygons for masks that touch image edges.
+ padded_mask = np.zeros(
+ (mask.shape[0] + 2, mask.shape[1] + 2), dtype=np.uint8)
+ padded_mask[1:-1, 1:-1] = mask
+ contours = find_contours(padded_mask, 0.5)
+ for verts in contours:
+ # Subtract the padding and flip (y, x) to (x, y)
+ verts = np.fliplr(verts) - 1
+ p = Polygon(verts, facecolor="none", edgecolor=color)
+ ax.add_patch(p)
+ ax.imshow(masked_image.astype(np.uint8))
+
+
+def display_table(table):
+ """Display values in a table format.
+ table: an iterable of rows, and each row is an iterable of values.
+ """
+ html = ""
+ for row in table:
+ row_html = ""
+ for col in row:
+ row_html += "
{:40}
".format(str(col))
+ html += "
" + row_html + "
"
+ html = "
" + html + "
"
+ IPython.display.display(IPython.display.HTML(html))
+
+
+def display_weight_stats(model):
+ """Scans all the weights in the model and returns a list of tuples
+ that contain stats about each weight.
+ """
+ layers = model.get_trainable_layers()
+ table = [["WEIGHT NAME", "SHAPE", "MIN", "MAX", "STD"]]
+ for l in layers:
+ weight_values = l.get_weights() # list of Numpy arrays
+ weight_tensors = l.weights # list of TF tensors
+ for i, w in enumerate(weight_values):
+ weight_name = weight_tensors[i].name
+ # Detect problematic layers. Exclude biases of conv layers.
+ alert = ""
+ if w.min() == w.max() and not (l.__class__.__name__ == "Conv2D" and i == 1):
+ alert += "*** dead?"
+ if np.abs(w.min()) > 1000 or np.abs(w.max()) > 1000:
+ alert += "*** Overflow?"
+ # Add row
+ table.append([
+ weight_name + alert,
+ str(w.shape),
+ "{:+9.4f}".format(w.min()),
+ "{:+10.4f}".format(w.max()),
+ "{:+9.4f}".format(w.std()),
+ ])
+ display_table(table)
diff --git a/mask_rcnn/tf_servable/main.py b/mask_rcnn/tf_servable/main.py
new file mode 100644
index 00000000..25700221
--- /dev/null
+++ b/mask_rcnn/tf_servable/main.py
@@ -0,0 +1,118 @@
+from user_config import *
+import tensorflow as tf
+import keras.backend as K
+from tensorflow.python.saved_model import signature_constants
+from tensorflow.python.saved_model import tag_constants
+import os
+from config import mask_config
+from model import MaskRCNN
+
+sess = tf.Session()
+K.set_session(sess)
+
+
+def get_config():
+ if is_coco:
+ import coco
+ class InferenceConfig(coco.CocoConfig):
+ GPU_COUNT = 1
+ IMAGES_PER_GPU = 1
+
+ config = InferenceConfig()
+
+ else:
+ config = mask_config(NUMBER_OF_CLASSES)
+
+ return config
+
+
+def freeze_session(session, keep_var_names=None, output_names=None, clear_devices=True):
+ graph = session.graph
+
+ with graph.as_default():
+ freeze_var_names = list(set(v.op.name for v in tf.global_variables()).difference(keep_var_names or []))
+
+ output_names = output_names or []
+ input_graph_def = graph.as_graph_def()
+
+ if clear_devices:
+ for node in input_graph_def.node:
+ node.device = ""
+
+ frozen_graph = tf.graph_util.convert_variables_to_constants(
+ session, input_graph_def, output_names, freeze_var_names)
+ return frozen_graph
+
+
+def freeze_model(model, name):
+ frozen_graph = freeze_session(
+ sess,
+ output_names=[out.op.name for out in model.outputs][:4])
+ directory = PATH_TO_SAVE_FROZEN_PB
+ tf.train.write_graph(frozen_graph, directory, name, as_text=False)
+ print("*"*80)
+ print("Finish converting keras model to Frozen PB")
+ print('PATH: ', PATH_TO_SAVE_FROZEN_PB)
+ print("*" * 80)
+
+
+def make_serving_ready(model_path, save_serve_path, version_number):
+ import tensorflow as tf
+
+ export_dir = os.path.join(save_serve_path, str(version_number))
+ graph_pb = model_path
+
+ builder = tf.saved_model.builder.SavedModelBuilder(export_dir)
+
+ with tf.gfile.GFile(graph_pb, "rb") as f:
+ graph_def = tf.GraphDef()
+ graph_def.ParseFromString(f.read())
+
+ sigs = {}
+
+ with tf.Session(graph=tf.Graph()) as sess:
+ # name="" is important to ensure we don't get spurious prefixing
+ tf.import_graph_def(graph_def, name="")
+ g = tf.get_default_graph()
+ input_image = g.get_tensor_by_name("input_image:0")
+ input_image_meta = g.get_tensor_by_name("input_image_meta:0")
+ input_anchors = g.get_tensor_by_name("input_anchors:0")
+
+ output_detection = g.get_tensor_by_name("mrcnn_detection/Reshape_1:0")
+ output_mask = g.get_tensor_by_name("mrcnn_mask/Reshape_1:0")
+
+ sigs[signature_constants.DEFAULT_SERVING_SIGNATURE_DEF_KEY] = \
+ tf.saved_model.signature_def_utils.predict_signature_def(
+ {"input_image": input_image, 'input_image_meta': input_image_meta, 'input_anchors': input_anchors},
+ {"mrcnn_detection/Reshape_1": output_detection, 'mrcnn_mask/Reshape_1': output_mask})
+
+ builder.add_meta_graph_and_variables(sess,
+ [tag_constants.SERVING],
+ signature_def_map=sigs)
+
+ builder.save()
+ print("*" * 80)
+ print("FINISH CONVERTING FROZEN PB TO SERVING READY")
+ print("PATH:", PATH_TO_SAVE_TENSORFLOW_SERVING_MODEL)
+ print("*" * 80)
+
+
+# Load Mask RCNN config
+# you can also load your own config in here.
+# config = your_custom_config_class
+config = get_config()
+
+
+# LOAD MODEL
+model = MaskRCNN(mode="inference", model_dir=MODEL_DIR, config=config)
+model.load_weights(H5_WEIGHT_PATH, by_name=True)
+
+# Converting keras model to PB frozen graph
+freeze_model(model.keras_model, FROZEN_NAME)
+
+# Now convert frozen graph to Tensorflow Serving Ready
+make_serving_ready(os.path.join(PATH_TO_SAVE_FROZEN_PB, FROZEN_NAME),
+ PATH_TO_SAVE_TENSORFLOW_SERVING_MODEL,
+ VERSION_NUMBER)
+
+print("COMPLETED")
\ No newline at end of file
diff --git a/mask_rcnn/tf_servable/model.py b/mask_rcnn/tf_servable/model.py
new file mode 100644
index 00000000..5dcf67e0
--- /dev/null
+++ b/mask_rcnn/tf_servable/model.py
@@ -0,0 +1,2882 @@
+
+import utils
+import keras.backend as K
+import tensorflow as tf
+import os
+import random
+import datetime
+import re
+import math
+import logging
+from collections import OrderedDict
+import multiprocessing
+import numpy as np
+import skimage.transform
+import keras
+import keras.layers as KL
+import keras.engine as KE
+import keras.models as KM
+from tensorflow.python.saved_model import signature_constants
+from tensorflow.python.saved_model import tag_constants
+
+# Requires TensorFlow 1.3+ and Keras 2.0.8+.
+from distutils.version import LooseVersion
+
+assert LooseVersion(tf.__version__) >= LooseVersion("1.3")
+assert LooseVersion(keras.__version__) >= LooseVersion('2.0.8')
+
+
+############################################################
+# Utility Functions
+############################################################
+
+def log(text, array=None):
+ """Prints a text message. And, optionally, if a Numpy array is provided it
+ prints its shape, min, and max values.
+ """
+ if array is not None:
+ text = text.ljust(25)
+ # Format stats only when the array is non-empty to avoid formatting errors
+ if array.size:
+ text += ("shape: {:20} min: {:10.5f} max: {:10.5f} {}".format(
+ str(array.shape), array.min(), array.max(), array.dtype))
+ else:
+ text += ("shape: {:20} min: {:10} max: {:10} {}".format(
+ str(array.shape), "", "", array.dtype))
+ print(text)
+
+
+class BatchNorm(KL.BatchNormalization):
+ """Extends the Keras BatchNormalization class to allow a central place
+ to make changes if needed.
+
+ Batch normalization has a negative effect on training if batches are small
+ so this layer is often frozen (via setting in Config class) and functions
+ as linear layer.
+ """
+
+ def call(self, inputs, training=None):
+ """
+ Note about training values:
+ None: Train BN layers. This is the normal mode
+ False: Freeze BN layers. Good when batch size is small
+ True: (don't use). Set layer in training mode even when making inferences
+ """
+ return super(self.__class__, self).call(inputs, training=training)
+
+
+def compute_backbone_shapes(config, image_shape):
+ """Computes the width and height of each stage of the backbone network.
+
+ Returns:
+ [N, (height, width)]. Where N is the number of stages
+ """
+ if callable(config.BACKBONE):
+ return config.COMPUTE_BACKBONE_SHAPE(image_shape)
+
+ # Currently supports ResNet only
+ assert config.BACKBONE in ["resnet50", "resnet101"]
+ return np.array(
+ [[int(math.ceil(image_shape[0] / stride)),
+ int(math.ceil(image_shape[1] / stride))]
+ for stride in config.BACKBONE_STRIDES])
+
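+# Example (illustrative, assuming the default BACKBONE_STRIDES of
+# [4, 8, 16, 32, 64]): a 1024x1024 input yields stage shapes
+# [[256, 256], [128, 128], [64, 64], [32, 32], [16, 16]].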
+
+############################################################
+# Resnet Graph
+############################################################
+
+# Code adopted from:
+# https://github.com/fchollet/deep-learning-models/blob/master/resnet50.py
+
+def identity_block(input_tensor, kernel_size, filters, stage, block,
+ use_bias=True, train_bn=True):
+ """The identity_block is the block that has no conv layer at shortcut
+ # Arguments
+ input_tensor: input tensor
+ kernel_size: default 3, the kernel size of middle conv layer at main path
+ filters: list of integers, the nb_filters of 3 conv layer at main path
+ stage: integer, current stage label, used for generating layer names
+ block: 'a','b'..., current block label, used for generating layer names
+ use_bias: Boolean. To use or not use a bias in conv layers.
+ train_bn: Boolean. Train or freeze Batch Norm layers
+ """
+ nb_filter1, nb_filter2, nb_filter3 = filters
+ conv_name_base = 'res' + str(stage) + block + '_branch'
+ bn_name_base = 'bn' + str(stage) + block + '_branch'
+
+ x = KL.Conv2D(nb_filter1, (1, 1), name=conv_name_base + '2a',
+ use_bias=use_bias)(input_tensor)
+ x = BatchNorm(name=bn_name_base + '2a')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+
+ x = KL.Conv2D(nb_filter2, (kernel_size, kernel_size), padding='same',
+ name=conv_name_base + '2b', use_bias=use_bias)(x)
+ x = BatchNorm(name=bn_name_base + '2b')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+
+ x = KL.Conv2D(nb_filter3, (1, 1), name=conv_name_base + '2c',
+ use_bias=use_bias)(x)
+ x = BatchNorm(name=bn_name_base + '2c')(x, training=train_bn)
+
+ x = KL.Add()([x, input_tensor])
+ x = KL.Activation('relu', name='res' + str(stage) + block + '_out')(x)
+ return x
+
+
+def conv_block(input_tensor, kernel_size, filters, stage, block,
+ strides=(2, 2), use_bias=True, train_bn=True):
+ """conv_block is the block that has a conv layer at shortcut
+ # Arguments
+ input_tensor: input tensor
+ kernel_size: default 3, the kernel size of middle conv layer at main path
+ filters: list of integers, the nb_filters of 3 conv layer at main path
+ stage: integer, current stage label, used for generating layer names
+ block: 'a','b'..., current block label, used for generating layer names
+ use_bias: Boolean. To use or not use a bias in conv layers.
+ train_bn: Boolean. Train or freeze Batch Norm layers
+ Note that from stage 3, the first conv layer at main path is with subsample=(2,2)
+ And the shortcut should have subsample=(2,2) as well
+ """
+ nb_filter1, nb_filter2, nb_filter3 = filters
+ conv_name_base = 'res' + str(stage) + block + '_branch'
+ bn_name_base = 'bn' + str(stage) + block + '_branch'
+
+ x = KL.Conv2D(nb_filter1, (1, 1), strides=strides,
+ name=conv_name_base + '2a', use_bias=use_bias)(input_tensor)
+ x = BatchNorm(name=bn_name_base + '2a')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+
+ x = KL.Conv2D(nb_filter2, (kernel_size, kernel_size), padding='same',
+ name=conv_name_base + '2b', use_bias=use_bias)(x)
+ x = BatchNorm(name=bn_name_base + '2b')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+
+ x = KL.Conv2D(nb_filter3, (1, 1), name=conv_name_base +
+ '2c', use_bias=use_bias)(x)
+ x = BatchNorm(name=bn_name_base + '2c')(x, training=train_bn)
+
+ shortcut = KL.Conv2D(nb_filter3, (1, 1), strides=strides,
+ name=conv_name_base + '1', use_bias=use_bias)(input_tensor)
+ shortcut = BatchNorm(name=bn_name_base + '1')(shortcut, training=train_bn)
+
+ x = KL.Add()([x, shortcut])
+ x = KL.Activation('relu', name='res' + str(stage) + block + '_out')(x)
+ return x
+
+
+def resnet_graph(input_image, architecture, stage5=False, train_bn=True):
+ """Build a ResNet graph.
+ architecture: Can be resnet50 or resnet101
+ stage5: Boolean. If False, stage5 of the network is not created
+ train_bn: Boolean. Train or freeze Batch Norm layers
+ """
+ assert architecture in ["resnet50", "resnet101"]
+ # Stage 1
+ x = KL.ZeroPadding2D((3, 3))(input_image)
+ x = KL.Conv2D(64, (7, 7), strides=(2, 2), name='conv1', use_bias=True)(x)
+ x = BatchNorm(name='bn_conv1')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+ C1 = x = KL.MaxPooling2D((3, 3), strides=(2, 2), padding="same")(x)
+ # Stage 2
+ x = conv_block(x, 3, [64, 64, 256], stage=2, block='a', strides=(1, 1), train_bn=train_bn)
+ x = identity_block(x, 3, [64, 64, 256], stage=2, block='b', train_bn=train_bn)
+ C2 = x = identity_block(x, 3, [64, 64, 256], stage=2, block='c', train_bn=train_bn)
+ # Stage 3
+ x = conv_block(x, 3, [128, 128, 512], stage=3, block='a', train_bn=train_bn)
+ x = identity_block(x, 3, [128, 128, 512], stage=3, block='b', train_bn=train_bn)
+ x = identity_block(x, 3, [128, 128, 512], stage=3, block='c', train_bn=train_bn)
+ C3 = x = identity_block(x, 3, [128, 128, 512], stage=3, block='d', train_bn=train_bn)
+ # Stage 4
+ x = conv_block(x, 3, [256, 256, 1024], stage=4, block='a', train_bn=train_bn)
+ block_count = {"resnet50": 5, "resnet101": 22}[architecture]
+ for i in range(block_count):
+ x = identity_block(x, 3, [256, 256, 1024], stage=4, block=chr(98 + i), train_bn=train_bn)
+ C4 = x
+ # Stage 5
+ if stage5:
+ x = conv_block(x, 3, [512, 512, 2048], stage=5, block='a', train_bn=train_bn)
+ x = identity_block(x, 3, [512, 512, 2048], stage=5, block='b', train_bn=train_bn)
+ C5 = x = identity_block(x, 3, [512, 512, 2048], stage=5, block='c', train_bn=train_bn)
+ else:
+ C5 = None
+ return [C1, C2, C3, C4, C5]
+
+
+############################################################
+# Proposal Layer
+############################################################
+
+def apply_box_deltas_graph(boxes, deltas):
+ """Applies the given deltas to the given boxes.
+ boxes: [N, (y1, x1, y2, x2)] boxes to update
+ deltas: [N, (dy, dx, log(dh), log(dw))] refinements to apply
+ """
+ # Convert to y, x, h, w
+ height = boxes[:, 2] - boxes[:, 0]
+ width = boxes[:, 3] - boxes[:, 1]
+ center_y = boxes[:, 0] + 0.5 * height
+ center_x = boxes[:, 1] + 0.5 * width
+ # Apply deltas
+ center_y += deltas[:, 0] * height
+ center_x += deltas[:, 1] * width
+ height *= tf.exp(deltas[:, 2])
+ width *= tf.exp(deltas[:, 3])
+ # Convert back to y1, x1, y2, x2
+ y1 = center_y - 0.5 * height
+ x1 = center_x - 0.5 * width
+ y2 = y1 + height
+ x2 = x1 + width
+ result = tf.stack([y1, x1, y2, x2], axis=1, name="apply_box_deltas_out")
+ return result
+
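+# Example (illustrative): a box [0, 0, 10, 10] with deltas
+# [0, 0, log(2), log(2)] keeps its center at (5, 5) and doubles each side,
+# giving [-5, -5, 15, 15] (clipping to the window happens separately).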
+
+def clip_boxes_graph(boxes, window):
+ """
+ boxes: [N, (y1, x1, y2, x2)]
+ window: [4] in the form y1, x1, y2, x2
+ """
+ # Split
+ wy1, wx1, wy2, wx2 = tf.split(window, 4)
+ y1, x1, y2, x2 = tf.split(boxes, 4, axis=1)
+ # Clip
+ y1 = tf.maximum(tf.minimum(y1, wy2), wy1)
+ x1 = tf.maximum(tf.minimum(x1, wx2), wx1)
+ y2 = tf.maximum(tf.minimum(y2, wy2), wy1)
+ x2 = tf.maximum(tf.minimum(x2, wx2), wx1)
+ clipped = tf.concat([y1, x1, y2, x2], axis=1, name="clipped_boxes")
+ clipped.set_shape((clipped.shape[0], 4))
+ return clipped
+
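+# Example (illustrative): clipping [-0.1, 0.2, 1.3, 0.9] to the normalized
+# window [0, 0, 1, 1] yields [0.0, 0.2, 1.0, 0.9].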
+
+class ProposalLayer(KE.Layer):
+ """Receives anchor scores and selects a subset to pass as proposals
+ to the second stage. Filtering is done based on anchor scores and
+ non-max suppression to remove overlaps. It also applies bounding
+ box refinement deltas to anchors.
+
+ Inputs:
+ rpn_probs: [batch, anchors, (bg prob, fg prob)]
+ rpn_bbox: [batch, anchors, (dy, dx, log(dh), log(dw))]
+ anchors: [batch, (y1, x1, y2, x2)] anchors in normalized coordinates
+
+ Returns:
+ Proposals in normalized coordinates [batch, rois, (y1, x1, y2, x2)]
+ """
+
+ def __init__(self, proposal_count, nms_threshold, config=None, **kwargs):
+ super(ProposalLayer, self).__init__(**kwargs)
+ self.config = config
+ self.proposal_count = proposal_count
+ self.nms_threshold = nms_threshold
+
+ def call(self, inputs):
+ # Box Scores. Use the foreground class confidence. [Batch, num_rois, 1]
+ scores = inputs[0][:, :, 1]
+ # Box deltas [batch, num_rois, 4]
+ deltas = inputs[1]
+ deltas = deltas * np.reshape(self.config.RPN_BBOX_STD_DEV, [1, 1, 4])
+ # Anchors
+ anchors = inputs[2]
+
+ # Improve performance by trimming to top anchors by score
+ # and doing the rest on the smaller subset.
+ pre_nms_limit = tf.minimum(6000, tf.shape(anchors)[1])
+ ix = tf.nn.top_k(scores, pre_nms_limit, sorted=True,
+ name="top_anchors").indices
+ scores = utils.batch_slice([scores, ix], lambda x, y: tf.gather(x, y),
+ self.config.IMAGES_PER_GPU)
+ deltas = utils.batch_slice([deltas, ix], lambda x, y: tf.gather(x, y),
+ self.config.IMAGES_PER_GPU)
+ pre_nms_anchors = utils.batch_slice([anchors, ix], lambda a, x: tf.gather(a, x),
+ self.config.IMAGES_PER_GPU,
+ names=["pre_nms_anchors"])
+
+ # Apply deltas to anchors to get refined anchors.
+ # [batch, N, (y1, x1, y2, x2)]
+ boxes = utils.batch_slice([pre_nms_anchors, deltas],
+ lambda x, y: apply_box_deltas_graph(x, y),
+ self.config.IMAGES_PER_GPU,
+ names=["refined_anchors"])
+
+ # Clip to image boundaries. Since we're in normalized coordinates,
+ # clip to 0..1 range. [batch, N, (y1, x1, y2, x2)]
+ window = np.array([0, 0, 1, 1], dtype=np.float32)
+ boxes = utils.batch_slice(boxes,
+ lambda x: clip_boxes_graph(x, window),
+ self.config.IMAGES_PER_GPU,
+ names=["refined_anchors_clipped"])
+
+ # Filter out small boxes
+ # According to Xinlei Chen's paper, this reduces detection accuracy
+ # for small objects, so we're skipping it.
+
+ # Non-max suppression
+ def nms(boxes, scores):
+ indices = tf.image.non_max_suppression(
+ boxes, scores, self.proposal_count,
+ self.nms_threshold, name="rpn_non_max_suppression")
+ proposals = tf.gather(boxes, indices)
+ # Pad if needed
+ padding = tf.maximum(self.proposal_count - tf.shape(proposals)[0], 0)
+ proposals = tf.pad(proposals, [(0, padding), (0, 0)])
+ return proposals
+
+ proposals = utils.batch_slice([boxes, scores], nms,
+ self.config.IMAGES_PER_GPU)
+ return proposals
+
+ def compute_output_shape(self, input_shape):
+ return (None, self.proposal_count, 4)
+
+
+############################################################
+# ROIAlign Layer
+############################################################
+
+def log2_graph(x):
+ """Implementation of Log2. TF doesn't have a native implementation."""
+ return tf.log(x) / tf.log(2.0)
+
+
+class PyramidROIAlign(KE.Layer):
+ """Implements ROI Pooling on multiple levels of the feature pyramid.
+
+ Params:
+ - pool_shape: [height, width] of the output pooled regions. Usually [7, 7]
+
+ Inputs:
+ - boxes: [batch, num_boxes, (y1, x1, y2, x2)] in normalized
+ coordinates. Possibly padded with zeros if not enough
+ boxes to fill the array.
+ - image_meta: [batch, (meta data)] Image details. See compose_image_meta()
+ - Feature maps: List of feature maps from different levels of the pyramid.
+ Each is [batch, height, width, channels]
+
+ Output:
+ Pooled regions in the shape: [batch, num_boxes, height, width, channels].
+ The width and height are those specified by pool_shape in the layer
+ constructor.
+ """
+
+ def __init__(self, pool_shape, **kwargs):
+ super(PyramidROIAlign, self).__init__(**kwargs)
+ self.pool_shape = tuple(pool_shape)
+
+ def call(self, inputs):
+ # Crop boxes [batch, num_boxes, (y1, x1, y2, x2)] in normalized coords
+ boxes = inputs[0]
+
+ # Image meta
+ # Holds details about the image. See compose_image_meta()
+ image_meta = inputs[1]
+
+ # Feature Maps. List of feature maps from different level of the
+ # feature pyramid. Each is [batch, height, width, channels]
+ feature_maps = inputs[2:]
+
+ # Assign each ROI to a level in the pyramid based on the ROI area.
+ y1, x1, y2, x2 = tf.split(boxes, 4, axis=2)
+ h = y2 - y1
+ w = x2 - x1
+ # Use shape of first image. Images in a batch must have the same size.
+ image_shape = parse_image_meta_graph(image_meta)['image_shape'][0]
+ # Equation 1 in the Feature Pyramid Networks paper. Account for
+ # the fact that our coordinates are normalized here.
+ # e.g. a 224x224 ROI (in pixels) maps to P4
+ image_area = tf.cast(image_shape[0] * image_shape[1], tf.float32)
+ roi_level = log2_graph(tf.sqrt(h * w) / (224.0 / tf.sqrt(image_area)))
+ roi_level = tf.minimum(5, tf.maximum(
+ 2, 4 + tf.cast(tf.round(roi_level), tf.int32)))
+ roi_level = tf.squeeze(roi_level, 2)
+
+ # Loop through levels and apply ROI pooling to each. P2 to P5.
+ pooled = []
+ box_to_level = []
+ for i, level in enumerate(range(2, 6)):
+ ix = tf.where(tf.equal(roi_level, level))
+ level_boxes = tf.gather_nd(boxes, ix)
+
+ # Box indices for crop_and_resize.
+ box_indices = tf.cast(ix[:, 0], tf.int32)
+
+ # Keep track of which box is mapped to which level
+ box_to_level.append(ix)
+
+ # Stop gradient propagation to ROI proposals
+ level_boxes = tf.stop_gradient(level_boxes)
+ box_indices = tf.stop_gradient(box_indices)
+
+ # Crop and Resize
+ # From Mask R-CNN paper: "We sample four regular locations, so
+ # that we can evaluate either max or average pooling. In fact,
+ # interpolating only a single value at each bin center (without
+ # pooling) is nearly as effective."
+ #
+ # Here we use the simplified approach of a single value per bin,
+ # which is how it's done in tf.crop_and_resize()
+ # Result: [batch * num_boxes, pool_height, pool_width, channels]
+ pooled.append(tf.image.crop_and_resize(
+ feature_maps[i], level_boxes, box_indices, self.pool_shape,
+ method="bilinear"))
+
+ # Pack pooled features into one tensor
+ pooled = tf.concat(pooled, axis=0)
+
+ # Pack box_to_level mapping into one array and add another
+ # column representing the order of pooled boxes
+ box_to_level = tf.concat(box_to_level, axis=0)
+ box_range = tf.expand_dims(tf.range(tf.shape(box_to_level)[0]), 1)
+ box_to_level = tf.concat([tf.cast(box_to_level, tf.int32), box_range],
+ axis=1)
+
+ # Rearrange pooled features to match the order of the original boxes
+ # Sort box_to_level by batch then box index
+ # TF doesn't have a way to sort by two columns, so merge them and sort.
+ sorting_tensor = box_to_level[:, 0] * 100000 + box_to_level[:, 1]
+ ix = tf.nn.top_k(sorting_tensor, k=tf.shape(
+ box_to_level)[0]).indices[::-1]
+ ix = tf.gather(box_to_level[:, 2], ix)
+ pooled = tf.gather(pooled, ix)
+
+ # Re-add the batch dimension
+ pooled = tf.expand_dims(pooled, 0)
+ return pooled
+
+ def compute_output_shape(self, input_shape):
+ return input_shape[0][:2] + self.pool_shape + (input_shape[2][-1],)
+
+
+############################################################
+# Detection Target Layer
+############################################################
+
+def overlaps_graph(boxes1, boxes2):
+ """Computes IoU overlaps between two sets of boxes.
+ boxes1, boxes2: [N, (y1, x1, y2, x2)].
+ """
+ # 1. Tile boxes2 and repeat boxes1. This allows us to compare
+ # every boxes1 against every boxes2 without loops.
+ # TF doesn't have an equivalent to np.repeat() so simulate it
+ # using tf.tile() and tf.reshape.
+ b1 = tf.reshape(tf.tile(tf.expand_dims(boxes1, 1),
+ [1, 1, tf.shape(boxes2)[0]]), [-1, 4])
+ b2 = tf.tile(boxes2, [tf.shape(boxes1)[0], 1])
+ # 2. Compute intersections
+ b1_y1, b1_x1, b1_y2, b1_x2 = tf.split(b1, 4, axis=1)
+ b2_y1, b2_x1, b2_y2, b2_x2 = tf.split(b2, 4, axis=1)
+ y1 = tf.maximum(b1_y1, b2_y1)
+ x1 = tf.maximum(b1_x1, b2_x1)
+ y2 = tf.minimum(b1_y2, b2_y2)
+ x2 = tf.minimum(b1_x2, b2_x2)
+ intersection = tf.maximum(x2 - x1, 0) * tf.maximum(y2 - y1, 0)
+ # 3. Compute unions
+ b1_area = (b1_y2 - b1_y1) * (b1_x2 - b1_x1)
+ b2_area = (b2_y2 - b2_y1) * (b2_x2 - b2_x1)
+ union = b1_area + b2_area - intersection
+ # 4. Compute IoU and reshape to [boxes1, boxes2]
+ iou = intersection / union
+ overlaps = tf.reshape(iou, [tf.shape(boxes1)[0], tf.shape(boxes2)[0]])
+ return overlaps
+
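+# Example (illustrative): for boxes1 = [[0, 0, 2, 2]] and boxes2 = [[1, 1, 3, 3]]
+# the result is a [1, 1] matrix with IoU = 1 / (4 + 4 - 1) = 1/7.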
+
+def detection_targets_graph(proposals, gt_class_ids, gt_boxes, gt_masks, config):
+ """Generates detection targets for one image. Subsamples proposals and
+ generates target class IDs, bounding box deltas, and masks for each.
+
+ Inputs:
+ proposals: [N, (y1, x1, y2, x2)] in normalized coordinates. Might
+ be zero padded if there are not enough proposals.
+ gt_class_ids: [MAX_GT_INSTANCES] int class IDs
+ gt_boxes: [MAX_GT_INSTANCES, (y1, x1, y2, x2)] in normalized coordinates.
+ gt_masks: [height, width, MAX_GT_INSTANCES] of boolean type.
+
+ Returns: Target ROIs and corresponding class IDs, bounding box shifts,
+ and masks.
+ rois: [TRAIN_ROIS_PER_IMAGE, (y1, x1, y2, x2)] in normalized coordinates
+ class_ids: [TRAIN_ROIS_PER_IMAGE]. Integer class IDs. Zero padded.
+ deltas: [TRAIN_ROIS_PER_IMAGE, NUM_CLASSES, (dy, dx, log(dh), log(dw))]
+ Class-specific bbox refinements.
+ masks: [TRAIN_ROIS_PER_IMAGE, height, width]. Masks cropped to bbox
+ boundaries and resized to neural network output size.
+
+ Note: Returned arrays might be zero padded if not enough target ROIs.
+ """
+ # Assertions
+ asserts = [
+ tf.Assert(tf.greater(tf.shape(proposals)[0], 0), [proposals],
+ name="roi_assertion"),
+ ]
+ with tf.control_dependencies(asserts):
+ proposals = tf.identity(proposals)
+
+ # Remove zero padding
+ proposals, _ = trim_zeros_graph(proposals, name="trim_proposals")
+ gt_boxes, non_zeros = trim_zeros_graph(gt_boxes, name="trim_gt_boxes")
+ gt_class_ids = tf.boolean_mask(gt_class_ids, non_zeros,
+ name="trim_gt_class_ids")
+ gt_masks = tf.gather(gt_masks, tf.where(non_zeros)[:, 0], axis=2,
+ name="trim_gt_masks")
+
+ # Handle COCO crowds
+ # A crowd box in COCO is a bounding box around several instances. Exclude
+ # them from training. A crowd box is given a negative class ID.
+ crowd_ix = tf.where(gt_class_ids < 0)[:, 0]
+ non_crowd_ix = tf.where(gt_class_ids > 0)[:, 0]
+ crowd_boxes = tf.gather(gt_boxes, crowd_ix)
+ crowd_masks = tf.gather(gt_masks, crowd_ix, axis=2)
+ gt_class_ids = tf.gather(gt_class_ids, non_crowd_ix)
+ gt_boxes = tf.gather(gt_boxes, non_crowd_ix)
+ gt_masks = tf.gather(gt_masks, non_crowd_ix, axis=2)
+
+ # Compute overlaps matrix [proposals, gt_boxes]
+ overlaps = overlaps_graph(proposals, gt_boxes)
+
+ # Compute overlaps with crowd boxes [anchors, crowds]
+ crowd_overlaps = overlaps_graph(proposals, crowd_boxes)
+ crowd_iou_max = tf.reduce_max(crowd_overlaps, axis=1)
+ no_crowd_bool = (crowd_iou_max < 0.001)
+
+ # Determine positive and negative ROIs
+ roi_iou_max = tf.reduce_max(overlaps, axis=1)
+ # 1. Positive ROIs are those with >= 0.5 IoU with a GT box
+ positive_roi_bool = (roi_iou_max >= 0.5)
+ positive_indices = tf.where(positive_roi_bool)[:, 0]
+ # 2. Negative ROIs are those with < 0.5 with every GT box. Skip crowds.
+ negative_indices = tf.where(tf.logical_and(roi_iou_max < 0.5, no_crowd_bool))[:, 0]
+
+ # Subsample ROIs. Aim for 33% positive
+ # Positive ROIs
+ positive_count = int(config.TRAIN_ROIS_PER_IMAGE *
+ config.ROI_POSITIVE_RATIO)
+ positive_indices = tf.random_shuffle(positive_indices)[:positive_count]
+ positive_count = tf.shape(positive_indices)[0]
+ # Negative ROIs. Add enough to maintain positive:negative ratio.
+ r = 1.0 / config.ROI_POSITIVE_RATIO
+ negative_count = tf.cast(r * tf.cast(positive_count, tf.float32), tf.int32) - positive_count
+ negative_indices = tf.random_shuffle(negative_indices)[:negative_count]
+ # Gather selected ROIs
+ positive_rois = tf.gather(proposals, positive_indices)
+ negative_rois = tf.gather(proposals, negative_indices)
+
+ # Assign positive ROIs to GT boxes.
+ positive_overlaps = tf.gather(overlaps, positive_indices)
+ roi_gt_box_assignment = tf.cond(
+ tf.greater(tf.shape(positive_overlaps)[1], 0),
+ true_fn=lambda: tf.argmax(positive_overlaps, axis=1),
+ false_fn=lambda: tf.cast(tf.constant([]), tf.int64)
+ )
+ roi_gt_boxes = tf.gather(gt_boxes, roi_gt_box_assignment)
+ roi_gt_class_ids = tf.gather(gt_class_ids, roi_gt_box_assignment)
+
+ # Compute bbox refinement for positive ROIs
+ deltas = utils.box_refinement_graph(positive_rois, roi_gt_boxes)
+ deltas /= config.BBOX_STD_DEV
+
+ # Assign positive ROIs to GT masks
+ # Permute masks to [N, height, width, 1]
+ transposed_masks = tf.expand_dims(tf.transpose(gt_masks, [2, 0, 1]), -1)
+ # Pick the right mask for each ROI
+ roi_masks = tf.gather(transposed_masks, roi_gt_box_assignment)
+
+ # Compute mask targets
+ boxes = positive_rois
+ if config.USE_MINI_MASK:
+ # Transform ROI coordinates from normalized image space
+ # to normalized mini-mask space.
+ y1, x1, y2, x2 = tf.split(positive_rois, 4, axis=1)
+ gt_y1, gt_x1, gt_y2, gt_x2 = tf.split(roi_gt_boxes, 4, axis=1)
+ gt_h = gt_y2 - gt_y1
+ gt_w = gt_x2 - gt_x1
+ y1 = (y1 - gt_y1) / gt_h
+ x1 = (x1 - gt_x1) / gt_w
+ y2 = (y2 - gt_y1) / gt_h
+ x2 = (x2 - gt_x1) / gt_w
+ boxes = tf.concat([y1, x1, y2, x2], 1)
+ box_ids = tf.range(0, tf.shape(roi_masks)[0])
+ masks = tf.image.crop_and_resize(tf.cast(roi_masks, tf.float32), boxes,
+ box_ids,
+ config.MASK_SHAPE)
+ # Remove the extra dimension from masks.
+ masks = tf.squeeze(masks, axis=3)
+
+ # Threshold mask pixels at 0.5 to have GT masks be 0 or 1 to use with
+ # binary cross entropy loss.
+ masks = tf.round(masks)
+
+ # Append negative ROIs and pad bbox deltas and masks that
+ # are not used for negative ROIs with zeros.
+ rois = tf.concat([positive_rois, negative_rois], axis=0)
+ N = tf.shape(negative_rois)[0]
+ P = tf.maximum(config.TRAIN_ROIS_PER_IMAGE - tf.shape(rois)[0], 0)
+ rois = tf.pad(rois, [(0, P), (0, 0)])
+ roi_gt_boxes = tf.pad(roi_gt_boxes, [(0, N + P), (0, 0)])
+ roi_gt_class_ids = tf.pad(roi_gt_class_ids, [(0, N + P)])
+ deltas = tf.pad(deltas, [(0, N + P), (0, 0)])
+ masks = tf.pad(masks, [[0, N + P], (0, 0), (0, 0)])
+
+ return rois, roi_gt_class_ids, deltas, masks
+
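+# Example (illustrative, assuming the library defaults TRAIN_ROIS_PER_IMAGE=200
+# and ROI_POSITIVE_RATIO=0.33): at most 66 positive ROIs are kept and up to 134
+# negatives are added, i.e. roughly a 1:2 positive:negative ratio before padding.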
+
+class DetectionTargetLayer(KE.Layer):
+ """Subsamples proposals and generates target box refinement, class_ids,
+ and masks for each.
+
+ Inputs:
+ proposals: [batch, N, (y1, x1, y2, x2)] in normalized coordinates. Might
+ be zero padded if there are not enough proposals.
+ gt_class_ids: [batch, MAX_GT_INSTANCES] Integer class IDs.
+ gt_boxes: [batch, MAX_GT_INSTANCES, (y1, x1, y2, x2)] in normalized
+ coordinates.
+ gt_masks: [batch, height, width, MAX_GT_INSTANCES] of boolean type
+
+ Returns: Target ROIs and corresponding class IDs, bounding box shifts,
+ and masks.
+ rois: [batch, TRAIN_ROIS_PER_IMAGE, (y1, x1, y2, x2)] in normalized
+ coordinates
+ target_class_ids: [batch, TRAIN_ROIS_PER_IMAGE]. Integer class IDs.
+ target_deltas: [batch, TRAIN_ROIS_PER_IMAGE, NUM_CLASSES,
+ (dy, dx, log(dh), log(dw), class_id)]
+ Class-specific bbox refinements.
+ target_mask: [batch, TRAIN_ROIS_PER_IMAGE, height, width]
+ Masks cropped to bbox boundaries and resized to neural
+ network output size.
+
+ Note: Returned arrays might be zero padded if not enough target ROIs.
+ """
+
+ def __init__(self, config, **kwargs):
+ super(DetectionTargetLayer, self).__init__(**kwargs)
+ self.config = config
+
+ def call(self, inputs):
+ proposals = inputs[0]
+ gt_class_ids = inputs[1]
+ gt_boxes = inputs[2]
+ gt_masks = inputs[3]
+
+ # Slice the batch and run a graph for each slice
+ # TODO: Rename target_bbox to target_deltas for clarity
+ names = ["rois", "target_class_ids", "target_bbox", "target_mask"]
+ outputs = utils.batch_slice(
+ [proposals, gt_class_ids, gt_boxes, gt_masks],
+ lambda w, x, y, z: detection_targets_graph(
+ w, x, y, z, self.config),
+ self.config.IMAGES_PER_GPU, names=names)
+ return outputs
+
+ def compute_output_shape(self, input_shape):
+ return [
+ (None, self.config.TRAIN_ROIS_PER_IMAGE, 4), # rois
+ (None, 1), # class_ids
+ (None, self.config.TRAIN_ROIS_PER_IMAGE, 4), # deltas
+ (None, self.config.TRAIN_ROIS_PER_IMAGE, self.config.MASK_SHAPE[0],
+ self.config.MASK_SHAPE[1]) # masks
+ ]
+
+ def compute_mask(self, inputs, mask=None):
+ return [None, None, None, None]
+
+
+############################################################
+# Detection Layer
+############################################################
+
+def refine_detections_graph(rois, probs, deltas, window, config):
+ """Refine classified proposals and filter overlaps and return final
+ detections.
+
+ Inputs:
+ rois: [N, (y1, x1, y2, x2)] in normalized coordinates
+ probs: [N, num_classes]. Class probabilities.
+ deltas: [N, num_classes, (dy, dx, log(dh), log(dw))]. Class-specific
+ bounding box deltas.
+ window: (y1, x1, y2, x2) in image coordinates. The part of the image
+ that contains the image excluding the padding.
+
+ Returns detections shaped: [N, (y1, x1, y2, x2, class_id, score)] where
+ coordinates are normalized.
+ """
+ # Class IDs per ROI
+ class_ids = tf.argmax(probs, axis=1, output_type=tf.int32)
+ # Class probability of the top class of each ROI
+ indices = tf.stack([tf.range(probs.shape[0]), class_ids], axis=1)
+ class_scores = tf.gather_nd(probs, indices)
+ # Class-specific bounding box deltas
+ deltas_specific = tf.gather_nd(deltas, indices)
+ # Apply bounding box deltas
+ # Shape: [boxes, (y1, x1, y2, x2)] in normalized coordinates
+ refined_rois = apply_box_deltas_graph(
+ rois, deltas_specific * config.BBOX_STD_DEV)
+ # Clip boxes to image window
+ refined_rois = clip_boxes_graph(refined_rois, window)
+
+ # TODO: Filter out boxes with zero area
+
+ # Filter out background boxes
+ keep = tf.where(class_ids > 0)[:, 0]
+ # Filter out low confidence boxes
+ if config.DETECTION_MIN_CONFIDENCE:
+ conf_keep = tf.where(class_scores >= config.DETECTION_MIN_CONFIDENCE)[:, 0]
+ keep = tf.sets.set_intersection(tf.expand_dims(keep, 0),
+ tf.expand_dims(conf_keep, 0))
+ keep = tf.sparse_tensor_to_dense(keep)[0]
+
+ # Apply per-class NMS
+ # 1. Prepare variables
+ pre_nms_class_ids = tf.gather(class_ids, keep)
+ pre_nms_scores = tf.gather(class_scores, keep)
+ pre_nms_rois = tf.gather(refined_rois, keep)
+ unique_pre_nms_class_ids = tf.unique(pre_nms_class_ids)[0]
+
+ def nms_keep_map(class_id):
+ """Apply Non-Maximum Suppression on ROIs of the given class."""
+ # Indices of ROIs of the given class
+ ixs = tf.where(tf.equal(pre_nms_class_ids, class_id))[:, 0]
+ # Apply NMS
+ class_keep = tf.image.non_max_suppression(
+ tf.gather(pre_nms_rois, ixs),
+ tf.gather(pre_nms_scores, ixs),
+ max_output_size=config.DETECTION_MAX_INSTANCES,
+ iou_threshold=config.DETECTION_NMS_THRESHOLD)
+ # Map indices
+ class_keep = tf.gather(keep, tf.gather(ixs, class_keep))
+ # Pad with -1 so returned tensors have the same shape
+ gap = config.DETECTION_MAX_INSTANCES - tf.shape(class_keep)[0]
+ class_keep = tf.pad(class_keep, [(0, gap)],
+ mode='CONSTANT', constant_values=-1)
+ # Set shape so map_fn() can infer result shape
+ class_keep.set_shape([config.DETECTION_MAX_INSTANCES])
+ return class_keep
+
+ # 2. Map over class IDs
+ nms_keep = tf.map_fn(nms_keep_map, unique_pre_nms_class_ids,
+ dtype=tf.int64)
+ # 3. Merge results into one list, and remove -1 padding
+ nms_keep = tf.reshape(nms_keep, [-1])
+ nms_keep = tf.gather(nms_keep, tf.where(nms_keep > -1)[:, 0])
+ # 4. Compute intersection between keep and nms_keep
+ keep = tf.sets.set_intersection(tf.expand_dims(keep, 0),
+ tf.expand_dims(nms_keep, 0))
+ keep = tf.sparse_tensor_to_dense(keep)[0]
+ # Keep top detections
+ roi_count = config.DETECTION_MAX_INSTANCES
+ class_scores_keep = tf.gather(class_scores, keep)
+ num_keep = tf.minimum(tf.shape(class_scores_keep)[0], roi_count)
+ top_ids = tf.nn.top_k(class_scores_keep, k=num_keep, sorted=True)[1]
+ keep = tf.gather(keep, top_ids)
+
+ # Arrange output as [N, (y1, x1, y2, x2, class_id, score)]
+ # Coordinates are normalized.
+ detections = tf.concat([
+ tf.gather(refined_rois, keep),
+ tf.to_float(tf.gather(class_ids, keep))[..., tf.newaxis],
+ tf.gather(class_scores, keep)[..., tf.newaxis]
+ ], axis=1)
+
+ # Pad with zeros if detections < DETECTION_MAX_INSTANCES
+ gap = config.DETECTION_MAX_INSTANCES - tf.shape(detections)[0]
+ detections = tf.pad(detections, [(0, gap), (0, 0)], "CONSTANT")
+ return detections
+
+
+class DetectionLayer(KE.Layer):
+ """Takes classified proposal boxes and their bounding box deltas and
+ returns the final detection boxes.
+
+ Returns:
+ [batch, num_detections, (y1, x1, y2, x2, class_id, class_score)] where
+ coordinates are normalized.
+ """
+
+ def __init__(self, config=None, **kwargs):
+ super(DetectionLayer, self).__init__(**kwargs)
+ self.config = config
+
+ def call(self, inputs):
+ rois = inputs[0]
+ mrcnn_class = inputs[1]
+ mrcnn_bbox = inputs[2]
+ image_meta = inputs[3]
+
+ # Get windows of images in normalized coordinates. Windows are the area
+ # in the image that excludes the padding.
+ # Use the shape of the first image in the batch to normalize the window
+ # because we know that all images get resized to the same size.
+ m = parse_image_meta_graph(image_meta)
+ image_shape = m['image_shape'][0]
+ window = norm_boxes_graph(m['window'], image_shape[:2])
+
+ # Run detection refinement graph on each item in the batch
+ detections_batch = utils.batch_slice(
+ [rois, mrcnn_class, mrcnn_bbox, window],
+ lambda x, y, w, z: refine_detections_graph(x, y, w, z, self.config),
+ self.config.IMAGES_PER_GPU)
+
+ # Reshape output
+ # [batch, num_detections, (y1, x1, y2, x2, class_id, class_score)] in
+ # normalized coordinates
+ return tf.reshape(
+ detections_batch,
+ [self.config.BATCH_SIZE, self.config.DETECTION_MAX_INSTANCES, 6])
+
+ def compute_output_shape(self, input_shape):
+ return (None, self.config.DETECTION_MAX_INSTANCES, 6)
+
+
+############################################################
+# Region Proposal Network (RPN)
+############################################################
+
+def rpn_graph(feature_map, anchors_per_location, anchor_stride):
+ """Builds the computation graph of Region Proposal Network.
+
+ feature_map: backbone features [batch, height, width, depth]
+ anchors_per_location: number of anchors per pixel in the feature map
+ anchor_stride: Controls the density of anchors. Typically 1 (anchors for
+ every pixel in the feature map), or 2 (every other pixel).
+
+ Returns:
+ rpn_logits: [batch, H, W, 2] Anchor classifier logits (before softmax)
+ rpn_probs: [batch, H, W, 2] Anchor classifier probabilities.
+ rpn_bbox: [batch, H, W, (dy, dx, log(dh), log(dw))] Deltas to be
+ applied to anchors.
+ """
+ # TODO: check if stride of 2 causes alignment issues if the feature map
+ # is not even.
+ # Shared convolutional base of the RPN
+ shared = KL.Conv2D(512, (3, 3), padding='same', activation='relu',
+ strides=anchor_stride,
+ name='rpn_conv_shared')(feature_map)
+
+ # Anchor Score. [batch, height, width, anchors per location * 2].
+ x = KL.Conv2D(2 * anchors_per_location, (1, 1), padding='valid',
+ activation='linear', name='rpn_class_raw')(shared)
+
+ # Reshape to [batch, anchors, 2]
+ rpn_class_logits = KL.Lambda(
+ lambda t: tf.reshape(t, [tf.shape(t)[0], -1, 2]))(x)
+
+ # Softmax on last dimension of BG/FG.
+ rpn_probs = KL.Activation(
+ "softmax", name="rpn_class_xxx")(rpn_class_logits)
+
+ # Bounding box refinement. [batch, H, W, anchors per location * depth]
+ # where depth is [x, y, log(w), log(h)]
+ x = KL.Conv2D(anchors_per_location * 4, (1, 1), padding="valid",
+ activation='linear', name='rpn_bbox_pred')(shared)
+
+ # Reshape to [batch, anchors, 4]
+ rpn_bbox = KL.Lambda(lambda t: tf.reshape(t, [tf.shape(t)[0], -1, 4]))(x)
+
+ return [rpn_class_logits, rpn_probs, rpn_bbox]
+
+
+def build_rpn_model(anchor_stride, anchors_per_location, depth):
+ """Builds a Keras model of the Region Proposal Network.
+ It wraps the RPN graph so it can be used multiple times with shared
+ weights.
+
+ anchors_per_location: number of anchors per pixel in the feature map
+ anchor_stride: Controls the density of anchors. Typically 1 (anchors for
+ every pixel in the feature map), or 2 (every other pixel).
+ depth: Depth of the backbone feature map.
+
+ Returns a Keras Model object. The model outputs, when called, are:
+ rpn_logits: [batch, H, W, 2] Anchor classifier logits (before softmax)
+ rpn_probs: [batch, H, W, 2] Anchor classifier probabilities.
+ rpn_bbox: [batch, H, W, (dy, dx, log(dh), log(dw))] Deltas to be
+ applied to anchors.
+ """
+ input_feature_map = KL.Input(shape=[None, None, depth],
+ name="input_rpn_feature_map")
+ outputs = rpn_graph(input_feature_map, anchors_per_location, anchor_stride)
+ return KM.Model([input_feature_map], outputs, name="rpn_model")
+
+
+############################################################
+# Feature Pyramid Network Heads
+############################################################
+
+def fpn_classifier_graph(rois, feature_maps, image_meta,
+ pool_size, num_classes, train_bn=True,
+ fc_layers_size=1024):
+ """Builds the computation graph of the feature pyramid network classifier
+ and regressor heads.
+
+ rois: [batch, num_rois, (y1, x1, y2, x2)] Proposal boxes in normalized
+ coordinates.
+ feature_maps: List of feature maps from different layers of the pyramid,
+ [P2, P3, P4, P5]. Each has a different resolution.
+ - image_meta: [batch, (meta data)] Image details. See compose_image_meta()
+ pool_size: The width of the square feature map generated from ROI Pooling.
+ num_classes: number of classes, which determines the depth of the results
+ train_bn: Boolean. Train or freeze Batch Norm layers
+ fc_layers_size: Size of the 2 FC layers
+
+ Returns:
+ logits: [batch, num_rois, NUM_CLASSES] classifier logits (before softmax)
+ probs: [batch, num_rois, NUM_CLASSES] classifier probabilities
+ bbox_deltas: [batch, num_rois, NUM_CLASSES, (dy, dx, log(dh), log(dw))] Deltas to apply to
+ proposal boxes
+ """
+ # ROI Pooling
+ # Shape: [batch, num_boxes, pool_height, pool_width, channels]
+ x = PyramidROIAlign([pool_size, pool_size],
+ name="roi_align_classifier")([rois, image_meta] + feature_maps)
+ # Two FC layers of size fc_layers_size (implemented with Conv2D for consistency)
+ x = KL.TimeDistributed(KL.Conv2D(fc_layers_size, (pool_size, pool_size), padding="valid"),
+ name="mrcnn_class_conv1")(x)
+ x = KL.TimeDistributed(BatchNorm(), name='mrcnn_class_bn1')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+ x = KL.TimeDistributed(KL.Conv2D(fc_layers_size, (1, 1)),
+ name="mrcnn_class_conv2")(x)
+ x = KL.TimeDistributed(BatchNorm(), name='mrcnn_class_bn2')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+
+ shared = KL.Lambda(lambda x: K.squeeze(K.squeeze(x, 3), 2),
+ name="pool_squeeze")(x)
+
+ # Classifier head
+ mrcnn_class_logits = KL.TimeDistributed(KL.Dense(num_classes),
+ name='mrcnn_class_logits')(shared)
+ mrcnn_probs = KL.TimeDistributed(KL.Activation("softmax"),
+ name="mrcnn_class")(mrcnn_class_logits)
+
+ # BBox head
+ # [batch, boxes, num_classes * (dy, dx, log(dh), log(dw))]
+ x = KL.TimeDistributed(KL.Dense(num_classes * 4, activation='linear'),
+ name='mrcnn_bbox_fc')(shared)
+ # Reshape to [batch, boxes, num_classes, (dy, dx, log(dh), log(dw))]
+ s = K.int_shape(x)
+ mrcnn_bbox = KL.Reshape((s[1], num_classes, 4), name="mrcnn_bbox")(x)
+
+ return mrcnn_class_logits, mrcnn_probs, mrcnn_bbox
+
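+ # Shape flow through the classifier head, for reference: PyramidROIAlign yields
+ # [batch, num_rois, pool_size, pool_size, channels]; the first TimeDistributed
+ # Conv2D uses a kernel equal to pool_size, so each ROI collapses to
+ # [1, 1, fc_layers_size]; pool_squeeze drops the two 1x1 axes, and the Dense
+ # heads then operate on [batch, num_rois, fc_layers_size].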
+
+def build_fpn_mask_graph(rois, feature_maps, image_meta,
+ pool_size, num_classes, train_bn=True):
+ """Builds the computation graph of the mask head of Feature Pyramid Network.
+
+ rois: [batch, num_rois, (y1, x1, y2, x2)] Proposal boxes in normalized
+ coordinates.
+ feature_maps: List of feature maps from different layers of the pyramid,
+ [P2, P3, P4, P5]. Each has a different resolution.
+ image_meta: [batch, (meta data)] Image details. See compose_image_meta()
+ pool_size: The width of the square feature map generated from ROI Pooling.
+ num_classes: number of classes, which determines the depth of the results
+ train_bn: Boolean. Train or freeze Batch Norm layers
+
+ Returns: Masks [batch, roi_count, height, width, num_classes]
+ """
+ # ROI Pooling
+ # Shape: [batch, boxes, pool_height, pool_width, channels]
+ x = PyramidROIAlign([pool_size, pool_size],
+ name="roi_align_mask")([rois, image_meta] + feature_maps)
+
+ # Conv layers
+ x = KL.TimeDistributed(KL.Conv2D(256, (3, 3), padding="same"),
+ name="mrcnn_mask_conv1")(x)
+ x = KL.TimeDistributed(BatchNorm(),
+ name='mrcnn_mask_bn1')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+
+ x = KL.TimeDistributed(KL.Conv2D(256, (3, 3), padding="same"),
+ name="mrcnn_mask_conv2")(x)
+ x = KL.TimeDistributed(BatchNorm(),
+ name='mrcnn_mask_bn2')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+
+ x = KL.TimeDistributed(KL.Conv2D(256, (3, 3), padding="same"),
+ name="mrcnn_mask_conv3")(x)
+ x = KL.TimeDistributed(BatchNorm(),
+ name='mrcnn_mask_bn3')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+
+ x = KL.TimeDistributed(KL.Conv2D(256, (3, 3), padding="same"),
+ name="mrcnn_mask_conv4")(x)
+ x = KL.TimeDistributed(BatchNorm(),
+ name='mrcnn_mask_bn4')(x, training=train_bn)
+ x = KL.Activation('relu')(x)
+
+ x = KL.TimeDistributed(KL.Conv2DTranspose(256, (2, 2), strides=2, activation="relu"),
+ name="mrcnn_mask_deconv")(x)
+ x = KL.TimeDistributed(KL.Conv2D(num_classes, (1, 1), strides=1, activation="sigmoid"),
+ name="mrcnn_mask")(x)
+ return x
+
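+ # Note on output resolution: the single stride-2 Conv2DTranspose doubles the
+ # pooled size, so with the usual MASK_POOL_SIZE of 14 the masks come out as
+ # [batch, roi_count, 28, 28, num_classes] (the standard 28x28 Mask R-CNN masks).
+ # The 14/28 numbers assume that default; they scale with pool_size.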
+
+############################################################
+# Loss Functions
+############################################################
+
+def smooth_l1_loss(y_true, y_pred):
+ """Implements Smooth-L1 loss.
+ y_true and y_pred are typically: [N, 4], but could be any shape.
+ """
+ diff = K.abs(y_true - y_pred)
+ less_than_one = K.cast(K.less(diff, 1.0), "float32")
+ loss = (less_than_one * 0.5 * diff ** 2) + (1 - less_than_one) * (diff - 0.5)
+ return loss
+
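+ # Quick sanity check of the piecewise definition above (plain arithmetic):
+ #   |diff| = 0.4 -> loss = 0.5 * 0.4**2 = 0.08   (quadratic branch)
+ #   |diff| = 2.0 -> loss = 2.0 - 0.5    = 1.5    (linear branch)
+ # Both branches give 0.5 at |diff| = 1, so the loss is continuous there.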
+
+def rpn_class_loss_graph(rpn_match, rpn_class_logits):
+ """RPN anchor classifier loss.
+
+ rpn_match: [batch, anchors, 1]. Anchor match type. 1=positive,
+ -1=negative, 0=neutral anchor.
+ rpn_class_logits: [batch, anchors, 2]. RPN classifier logits for FG/BG.
+ """
+ # Squeeze last dim to simplify
+ rpn_match = tf.squeeze(rpn_match, -1)
+ # Get anchor classes. Convert the -1/+1 match to 0/1 values.
+ anchor_class = K.cast(K.equal(rpn_match, 1), tf.int32)
+ # Positive and Negative anchors contribute to the loss,
+ # but neutral anchors (match value = 0) don't.
+ indices = tf.where(K.not_equal(rpn_match, 0))
+ # Pick rows that contribute to the loss and filter out the rest.
+ rpn_class_logits = tf.gather_nd(rpn_class_logits, indices)
+ anchor_class = tf.gather_nd(anchor_class, indices)
+ # Cross entropy loss
+ loss = K.sparse_categorical_crossentropy(target=anchor_class,
+ output=rpn_class_logits,
+ from_logits=True)
+ loss = K.switch(tf.size(loss) > 0, K.mean(loss), tf.constant(0.0))
+ return loss
+
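+ # Illustration of the selection above (made-up values): for
+ #   rpn_match    = [ 1, -1,  0,  1]
+ # the conversion and filtering give
+ #   anchor_class = [ 1,  0,  0,  1]     # -1/+1 mapped to 0/1
+ #   kept indices = anchors 0, 1, 3      # the neutral anchor (2) is dropped
+ # so only positive and negative anchors enter the cross-entropy.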
+
+def rpn_bbox_loss_graph(config, target_bbox, rpn_match, rpn_bbox):
+ """Return the RPN bounding box loss graph.
+
+ config: the model config object.
+ target_bbox: [batch, max positive anchors, (dy, dx, log(dh), log(dw))].
+ Uses 0 padding to fill in unused bbox deltas.
+ rpn_match: [batch, anchors, 1]. Anchor match type. 1=positive,
+ -1=negative, 0=neutral anchor.
+ rpn_bbox: [batch, anchors, (dy, dx, log(dh), log(dw))]
+ """
+ # Positive anchors contribute to the loss, but negative and
+ # neutral anchors (match value of 0 or -1) don't.
+ rpn_match = K.squeeze(rpn_match, -1)
+ indices = tf.where(K.equal(rpn_match, 1))
+
+ # Pick bbox deltas that contribute to the loss
+ rpn_bbox = tf.gather_nd(rpn_bbox, indices)
+
+ # Trim target bounding box deltas to the same length as rpn_bbox.
+ batch_counts = K.sum(K.cast(K.equal(rpn_match, 1), tf.int32), axis=1)
+ target_bbox = batch_pack_graph(target_bbox, batch_counts,
+ config.IMAGES_PER_GPU)
+
+ # TODO: use smooth_l1_loss() rather than reimplementing here
+ # to reduce code duplication
+ diff = K.abs(target_bbox - rpn_bbox)
+ less_than_one = K.cast(K.less(diff, 1.0), "float32")
+ loss = (less_than_one * 0.5 * diff ** 2) + (1 - less_than_one) * (diff - 0.5)
+
+ loss = K.switch(tf.size(loss) > 0, K.mean(loss), tf.constant(0.0))
+ return loss
+
+
+def mrcnn_class_loss_graph(target_class_ids, pred_class_logits,
+ active_class_ids):
+ """Loss for the classifier head of Mask RCNN.
+
+ target_class_ids: [batch, num_rois]. Integer class IDs. Uses zero
+ padding to fill in the array.
+ pred_class_logits: [batch, num_rois, num_classes]
+ active_class_ids: [batch, num_classes]. Has a value of 1 for
+ classes that are in the dataset of the image, and 0
+ for classes that are not in the dataset.
+ """
+ # During model building, Keras calls this function with
+ # target_class_ids of type float32. Unclear why. Cast it
+ # to int to get around it.
+ target_class_ids = tf.cast(target_class_ids, 'int64')
+
+ # Find predictions of classes that are not in the dataset.
+ pred_class_ids = tf.argmax(pred_class_logits, axis=2)
+ # TODO: Update this line to work with batch > 1. Right now it assumes all
+ # images in a batch have the same active_class_ids
+ pred_active = tf.gather(active_class_ids[0], pred_class_ids)
+
+ # Loss
+ loss = tf.nn.sparse_softmax_cross_entropy_with_logits(
+ labels=target_class_ids, logits=pred_class_logits)
+
+ # Erase losses of predictions of classes that are not in the active
+ # classes of the image.
+ loss = loss * pred_active
+
+ # Compute loss mean. Use only predictions that contribute
+ # to the loss to get a correct mean.
+ loss = tf.reduce_sum(loss) / tf.reduce_sum(pred_active)
+ return loss
+
+
+def mrcnn_bbox_loss_graph(target_bbox, target_class_ids, pred_bbox):
+ """Loss for Mask R-CNN bounding box refinement.
+
+ target_bbox: [batch, num_rois, (dy, dx, log(dh), log(dw))]
+ target_class_ids: [batch, num_rois]. Integer class IDs.
+ pred_bbox: [batch, num_rois, num_classes, (dy, dx, log(dh), log(dw))]
+ """
+ # Reshape to merge batch and roi dimensions for simplicity.
+ target_class_ids = K.reshape(target_class_ids, (-1,))
+ target_bbox = K.reshape(target_bbox, (-1, 4))
+ pred_bbox = K.reshape(pred_bbox, (-1, K.int_shape(pred_bbox)[2], 4))
+
+ # Only positive ROIs contribute to the loss. And only
+ # the right class_id of each ROI. Get their indices.
+ positive_roi_ix = tf.where(target_class_ids > 0)[:, 0]
+ positive_roi_class_ids = tf.cast(
+ tf.gather(target_class_ids, positive_roi_ix), tf.int64)
+ indices = tf.stack([positive_roi_ix, positive_roi_class_ids], axis=1)
+
+ # Gather the deltas (predicted and true) that contribute to loss
+ target_bbox = tf.gather(target_bbox, positive_roi_ix)
+ pred_bbox = tf.gather_nd(pred_bbox, indices)
+
+ # Smooth-L1 Loss
+ loss = K.switch(tf.size(target_bbox) > 0,
+ smooth_l1_loss(y_true=target_bbox, y_pred=pred_bbox),
+ tf.constant(0.0))
+ loss = K.mean(loss)
+ return loss
+
+
+def mrcnn_mask_loss_graph(target_masks, target_class_ids, pred_masks):
+ """Mask binary cross-entropy loss for the masks head.
+
+ target_masks: [batch, num_rois, height, width].
+ A float32 tensor of values 0 or 1. Uses zero padding to fill array.
+ target_class_ids: [batch, num_rois]. Integer class IDs. Zero padded.
+ pred_masks: [batch, proposals, height, width, num_classes] float32 tensor
+ with values from 0 to 1.
+ """
+ # Reshape for simplicity. Merge first two dimensions into one.
+ target_class_ids = K.reshape(target_class_ids, (-1,))
+ mask_shape = tf.shape(target_masks)
+ target_masks = K.reshape(target_masks, (-1, mask_shape[2], mask_shape[3]))
+ pred_shape = tf.shape(pred_masks)
+ pred_masks = K.reshape(pred_masks,
+ (-1, pred_shape[2], pred_shape[3], pred_shape[4]))
+ # Permute predicted masks to [N, num_classes, height, width]
+ pred_masks = tf.transpose(pred_masks, [0, 3, 1, 2])
+
+ # Only positive ROIs contribute to the loss. And only
+ # the class specific mask of each ROI.
+ positive_ix = tf.where(target_class_ids > 0)[:, 0]
+ positive_class_ids = tf.cast(
+ tf.gather(target_class_ids, positive_ix), tf.int64)
+ indices = tf.stack([positive_ix, positive_class_ids], axis=1)
+
+ # Gather the masks (predicted and true) that contribute to loss
+ y_true = tf.gather(target_masks, positive_ix)
+ y_pred = tf.gather_nd(pred_masks, indices)
+
+ # Compute binary cross entropy. If no positive ROIs, then return 0.
+ # shape: [batch, roi, num_classes]
+ loss = K.switch(tf.size(y_true) > 0,
+ K.binary_crossentropy(target=y_true, output=y_pred),
+ tf.constant(0.0))
+ loss = K.mean(loss)
+ return loss
+
+
+############################################################
+# Data Generator
+############################################################
+
+def load_image_gt(dataset, config, image_id, augment=False, augmentation=None,
+ use_mini_mask=False):
+ """Load and return ground truth data for an image (image, mask, bounding boxes).
+
+ augment: (deprecated. Use augmentation instead). If true, apply random
+ image augmentation. Currently, only horizontal flipping is offered.
+ augmentation: Optional. An imgaug (https://github.com/aleju/imgaug) augmentation.
+ For example, passing imgaug.augmenters.Fliplr(0.5) flips images
+ right/left 50% of the time.
+ use_mini_mask: If False, returns full-size masks that are the same height
+ and width as the original image. These can be big, for example
+ 1024x1024x100 (for 100 instances). Mini masks are smaller, typically,
+ 224x224 and are generated by extracting the bounding box of the
+ object and resizing it to MINI_MASK_SHAPE.
+
+ Returns:
+ image: [height, width, 3]
+ shape: the original shape of the image before resizing and cropping.
+ class_ids: [instance_count] Integer class IDs
+ bbox: [instance_count, (y1, x1, y2, x2)]
+ mask: [height, width, instance_count]. The height and width are those
+ of the image unless use_mini_mask is True, in which case they are
+ defined in MINI_MASK_SHAPE.
+ """
+ # Load image and mask
+ image = dataset.load_image(image_id)
+ mask, class_ids = dataset.load_mask(image_id)
+ original_shape = image.shape
+ image, window, scale, padding, crop = utils.resize_image(
+ image,
+ min_dim=config.IMAGE_MIN_DIM,
+ min_scale=config.IMAGE_MIN_SCALE,
+ max_dim=config.IMAGE_MAX_DIM,
+ mode=config.IMAGE_RESIZE_MODE)
+ mask = utils.resize_mask(mask, scale, padding, crop)
+
+ # Random horizontal flips.
+ # TODO: will be removed in a future update in favor of augmentation
+ if augment:
+ logging.warning("'augment' is deprecated. Use 'augmentation' instead.")
+ if random.randint(0, 1):
+ image = np.fliplr(image)
+ mask = np.fliplr(mask)
+
+ # Augmentation
+ # This requires the imgaug lib (https://github.com/aleju/imgaug)
+ if augmentation:
+ import imgaug
+
+ # Augmenters that are safe to apply to masks
+ # Some, such as Affine, have settings that make them unsafe, so always
+ # test your augmentation on masks
+ MASK_AUGMENTERS = ["Sequential", "SomeOf", "OneOf", "Sometimes",
+ "Fliplr", "Flipud", "CropAndPad",
+ "Affine", "PiecewiseAffine"]
+
+ def hook(images, augmenter, parents, default):
+ """Determines which augmenters to apply to masks."""
+ return augmenter.__class__.__name__ in MASK_AUGMENTERS
+
+ # Store shapes before augmentation to compare
+ image_shape = image.shape
+ mask_shape = mask.shape
+ # Make augmenters deterministic to apply similarly to images and masks
+ det = augmentation.to_deterministic()
+ image = det.augment_image(image)
+ # Change mask to np.uint8 because imgaug doesn't support np.bool
+ mask = det.augment_image(mask.astype(np.uint8),
+ hooks=imgaug.HooksImages(activator=hook))
+ # Verify that shapes didn't change
+ assert image.shape == image_shape, "Augmentation shouldn't change image size"
+ assert mask.shape == mask_shape, "Augmentation shouldn't change mask size"
+ # Change mask back to bool
+ mask = mask.astype(np.bool)
+
+ # Some masks can end up empty (all zeros) if the corresponding instance was
+ # cropped out during augmentation/resizing, so filter those instances out here.
+ _idx = np.sum(mask, axis=(0, 1)) > 0
+ mask = mask[:, :, _idx]
+ class_ids = class_ids[_idx]
+ # Bounding boxes. Note that some boxes might be all zeros
+ # if the corresponding mask got cropped out.
+ # bbox: [num_instances, (y1, x1, y2, x2)]
+ bbox = utils.extract_bboxes(mask)
+
+ # Active classes
+ # Different datasets have different classes, so track the
+ # classes supported in the dataset of this image.
+ active_class_ids = np.zeros([dataset.num_classes], dtype=np.int32)
+ source_class_ids = dataset.source_class_ids[dataset.image_info[image_id]["source"]]
+ active_class_ids[source_class_ids] = 1
+
+ # Resize masks to smaller size to reduce memory usage
+ if use_mini_mask:
+ mask = utils.minimize_mask(bbox, mask, config.MINI_MASK_SHAPE)
+
+ # Image meta data
+ image_meta = compose_image_meta(image_id, original_shape, image.shape,
+ window, scale, active_class_ids)
+
+ return image, image_meta, class_ids, bbox, mask
+
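+ # Typical call (a sketch; `dataset` is assumed to be a prepared utils.Dataset
+ # subclass and `config` the model config used throughout this file):
+ #
+ #   image, image_meta, class_ids, bbox, mask = load_image_gt(
+ #       dataset, config, image_id=0, use_mini_mask=config.USE_MINI_MASK)
+ #   # image: [H, W, 3], bbox: [num_instances, 4],
+ #   # mask: [H, W, num_instances] (or MINI_MASK_SHAPE when mini masks are on)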
+
+def build_detection_targets(rpn_rois, gt_class_ids, gt_boxes, gt_masks, config):
+ """Generate targets for training Stage 2 classifier and mask heads.
+ This is not used in normal training. It's useful for debugging or to train
+ the Mask RCNN heads without using the RPN head.
+
+ Inputs:
+ rpn_rois: [N, (y1, x1, y2, x2)] proposal boxes.
+ gt_class_ids: [instance count] Integer class IDs
+ gt_boxes: [instance count, (y1, x1, y2, x2)]
+ gt_masks: [height, width, instance count] Ground truth masks. Can be full
+ size or mini-masks.
+
+ Returns:
+ rois: [TRAIN_ROIS_PER_IMAGE, (y1, x1, y2, x2)]
+ class_ids: [TRAIN_ROIS_PER_IMAGE]. Integer class IDs.
+ bboxes: [TRAIN_ROIS_PER_IMAGE, NUM_CLASSES, (y, x, log(h), log(w))]. Class-specific
+ bbox refinements.
+ masks: [TRAIN_ROIS_PER_IMAGE, height, width, NUM_CLASSES]. Class-specific masks cropped
+ to bbox boundaries and resized to neural network output size.
+ """
+ assert rpn_rois.shape[0] > 0
+ assert gt_class_ids.dtype == np.int32, "Expected int but got {}".format(
+ gt_class_ids.dtype)
+ assert gt_boxes.dtype == np.int32, "Expected int but got {}".format(
+ gt_boxes.dtype)
+ assert gt_masks.dtype == np.bool_, "Expected bool but got {}".format(
+ gt_masks.dtype)
+
+ # It's common to add GT Boxes to ROIs but we don't do that here because
+ # according to XinLei Chen's paper, it doesn't help.
+
+ # Trim empty padding in gt_boxes and gt_masks parts
+ instance_ids = np.where(gt_class_ids > 0)[0]
+ assert instance_ids.shape[0] > 0, "Image must contain instances."
+ gt_class_ids = gt_class_ids[instance_ids]
+ gt_boxes = gt_boxes[instance_ids]
+ gt_masks = gt_masks[:, :, instance_ids]
+
+ # Compute areas of ROIs and ground truth boxes.
+ rpn_roi_area = (rpn_rois[:, 2] - rpn_rois[:, 0]) * \
+ (rpn_rois[:, 3] - rpn_rois[:, 1])
+ gt_box_area = (gt_boxes[:, 2] - gt_boxes[:, 0]) * \
+ (gt_boxes[:, 3] - gt_boxes[:, 1])
+
+ # Compute overlaps [rpn_rois, gt_boxes]
+ overlaps = np.zeros((rpn_rois.shape[0], gt_boxes.shape[0]))
+ for i in range(overlaps.shape[1]):
+ gt = gt_boxes[i]
+ overlaps[:, i] = utils.compute_iou(
+ gt, rpn_rois, gt_box_area[i], rpn_roi_area)
+
+ # Assign ROIs to GT boxes
+ rpn_roi_iou_argmax = np.argmax(overlaps, axis=1)
+ rpn_roi_iou_max = overlaps[np.arange(
+ overlaps.shape[0]), rpn_roi_iou_argmax]
+ # GT box assigned to each ROI
+ rpn_roi_gt_boxes = gt_boxes[rpn_roi_iou_argmax]
+ rpn_roi_gt_class_ids = gt_class_ids[rpn_roi_iou_argmax]
+
+ # Positive ROIs are those with >= 0.5 IoU with a GT box.
+ fg_ids = np.where(rpn_roi_iou_max > 0.5)[0]
+
+ # Negative ROIs are those with max IoU 0.1-0.5 (hard example mining)
+ # TODO: To hard example mine or not to hard example mine, that's the question
+ # bg_ids = np.where((rpn_roi_iou_max >= 0.1) & (rpn_roi_iou_max < 0.5))[0]
+ bg_ids = np.where(rpn_roi_iou_max < 0.5)[0]
+
+ # Subsample ROIs. Aim for 33% foreground.
+ # FG
+ fg_roi_count = int(config.TRAIN_ROIS_PER_IMAGE * config.ROI_POSITIVE_RATIO)
+ if fg_ids.shape[0] > fg_roi_count:
+ keep_fg_ids = np.random.choice(fg_ids, fg_roi_count, replace=False)
+ else:
+ keep_fg_ids = fg_ids
+ # BG
+ remaining = config.TRAIN_ROIS_PER_IMAGE - keep_fg_ids.shape[0]
+ if bg_ids.shape[0] > remaining:
+ keep_bg_ids = np.random.choice(bg_ids, remaining, replace=False)
+ else:
+ keep_bg_ids = bg_ids
+ # Combine indices of ROIs to keep
+ keep = np.concatenate([keep_fg_ids, keep_bg_ids])
+ # Need more?
+ remaining = config.TRAIN_ROIS_PER_IMAGE - keep.shape[0]
+ if remaining > 0:
+ # Looks like we don't have enough samples to maintain the desired
+ # balance. Reduce requirements and fill in the rest. This is
+ # likely different from the Mask RCNN paper.
+
+ # There is a small chance we have neither fg nor bg samples.
+ if keep.shape[0] == 0:
+ # Pick bg regions with easier IoU threshold
+ bg_ids = np.where(rpn_roi_iou_max < 0.5)[0]
+ assert bg_ids.shape[0] >= remaining
+ keep_bg_ids = np.random.choice(bg_ids, remaining, replace=False)
+ assert keep_bg_ids.shape[0] == remaining
+ keep = np.concatenate([keep, keep_bg_ids])
+ else:
+ # Fill the rest with repeated bg rois.
+ keep_extra_ids = np.random.choice(
+ keep_bg_ids, remaining, replace=True)
+ keep = np.concatenate([keep, keep_extra_ids])
+ assert keep.shape[0] == config.TRAIN_ROIS_PER_IMAGE, \
+ "keep doesn't match ROI batch size {}, {}".format(
+ keep.shape[0], config.TRAIN_ROIS_PER_IMAGE)
+
+ # Reset the gt boxes assigned to BG ROIs.
+ rpn_roi_gt_boxes[keep_bg_ids, :] = 0
+ rpn_roi_gt_class_ids[keep_bg_ids] = 0
+
+ # For each kept ROI, assign a class_id, and for FG ROIs also add bbox refinement.
+ rois = rpn_rois[keep]
+ roi_gt_boxes = rpn_roi_gt_boxes[keep]
+ roi_gt_class_ids = rpn_roi_gt_class_ids[keep]
+ roi_gt_assignment = rpn_roi_iou_argmax[keep]
+
+ # Class-aware bbox deltas. [y, x, log(h), log(w)]
+ bboxes = np.zeros((config.TRAIN_ROIS_PER_IMAGE,
+ config.NUM_CLASSES, 4), dtype=np.float32)
+ pos_ids = np.where(roi_gt_class_ids > 0)[0]
+ bboxes[pos_ids, roi_gt_class_ids[pos_ids]] = utils.box_refinement(
+ rois[pos_ids], roi_gt_boxes[pos_ids, :4])
+ # Normalize bbox refinements
+ bboxes /= config.BBOX_STD_DEV
+
+ # Generate class-specific target masks
+ masks = np.zeros((config.TRAIN_ROIS_PER_IMAGE, config.MASK_SHAPE[0], config.MASK_SHAPE[1], config.NUM_CLASSES),
+ dtype=np.float32)
+ for i in pos_ids:
+ class_id = roi_gt_class_ids[i]
+ assert class_id > 0, "class id must be greater than 0"
+ gt_id = roi_gt_assignment[i]
+ class_mask = gt_masks[:, :, gt_id]
+
+ if config.USE_MINI_MASK:
+ # Create a mask placeholder, the size of the image
+ placeholder = np.zeros(config.IMAGE_SHAPE[:2], dtype=bool)
+ # GT box
+ gt_y1, gt_x1, gt_y2, gt_x2 = gt_boxes[gt_id]
+ gt_w = gt_x2 - gt_x1
+ gt_h = gt_y2 - gt_y1
+ # Resize mini mask to size of GT box
+ placeholder[gt_y1:gt_y2, gt_x1:gt_x2] = \
+ np.round(skimage.transform.resize(
+ class_mask, (gt_h, gt_w), order=1, mode="constant")).astype(bool)
+ # Place the resized mini mask in the placeholder
+ class_mask = placeholder
+
+ # Pick part of the mask and resize it
+ y1, x1, y2, x2 = rois[i].astype(np.int32)
+ m = class_mask[y1:y2, x1:x2]
+ mask = skimage.transform.resize(m, config.MASK_SHAPE, order=1, mode="constant")
+ masks[i, :, :, class_id] = mask
+
+ return rois, roi_gt_class_ids, bboxes, masks
+
+
+def build_rpn_targets(image_shape, anchors, gt_class_ids, gt_boxes, config):
+ """Given the anchors and GT boxes, compute overlaps and identify positive
+ anchors and deltas to refine them to match their corresponding GT boxes.
+
+ anchors: [num_anchors, (y1, x1, y2, x2)]
+ gt_class_ids: [num_gt_boxes] Integer class IDs.
+ gt_boxes: [num_gt_boxes, (y1, x1, y2, x2)]
+
+ Returns:
+ rpn_match: [N] (int32) matches between anchors and GT boxes.
+ 1 = positive anchor, -1 = negative anchor, 0 = neutral
+ rpn_bbox: [N, (dy, dx, log(dh), log(dw))] Anchor bbox deltas.
+ """
+ # RPN Match: 1 = positive anchor, -1 = negative anchor, 0 = neutral
+ rpn_match = np.zeros([anchors.shape[0]], dtype=np.int32)
+ # RPN bounding boxes: [max anchors per image, (dy, dx, log(dh), log(dw))]
+ rpn_bbox = np.zeros((config.RPN_TRAIN_ANCHORS_PER_IMAGE, 4))
+
+ # Handle COCO crowds
+ # A crowd box in COCO is a bounding box around several instances. Exclude
+ # them from training. A crowd box is given a negative class ID.
+ crowd_ix = np.where(gt_class_ids < 0)[0]
+ if crowd_ix.shape[0] > 0:
+ # Filter out crowds from ground truth class IDs and boxes
+ non_crowd_ix = np.where(gt_class_ids > 0)[0]
+ crowd_boxes = gt_boxes[crowd_ix]
+ gt_class_ids = gt_class_ids[non_crowd_ix]
+ gt_boxes = gt_boxes[non_crowd_ix]
+ # Compute overlaps with crowd boxes [anchors, crowds]
+ crowd_overlaps = utils.compute_overlaps(anchors, crowd_boxes)
+ crowd_iou_max = np.amax(crowd_overlaps, axis=1)
+ no_crowd_bool = (crowd_iou_max < 0.001)
+ else:
+ # No crowd boxes, so no anchor intersects a crowd
+ no_crowd_bool = np.ones([anchors.shape[0]], dtype=bool)
+
+ # Compute overlaps [num_anchors, num_gt_boxes]
+ overlaps = utils.compute_overlaps(anchors, gt_boxes)
+
+ # Match anchors to GT Boxes
+ # If an anchor overlaps a GT box with IoU >= 0.7 then it's positive.
+ # If an anchor overlaps a GT box with IoU < 0.3 then it's negative.
+ # Neutral anchors are those that don't match the conditions above,
+ # and they don't influence the loss function.
+ # However, don't keep any GT box unmatched (rare, but happens). Instead,
+ # match it to the closest anchor (even if its max IoU is < 0.3).
+ #
+ # 1. Set negative anchors first. They get overwritten below if a GT box is
+ # matched to them. Skip boxes in crowd areas.
+ anchor_iou_argmax = np.argmax(overlaps, axis=1)
+ anchor_iou_max = overlaps[np.arange(overlaps.shape[0]), anchor_iou_argmax]
+ rpn_match[(anchor_iou_max < 0.3) & (no_crowd_bool)] = -1
+ # 2. Set an anchor for each GT box (regardless of IoU value).
+ # TODO: If multiple anchors have the same IoU match all of them
+ gt_iou_argmax = np.argmax(overlaps, axis=0)
+ rpn_match[gt_iou_argmax] = 1
+ # 3. Set anchors with high overlap as positive.
+ rpn_match[anchor_iou_max >= 0.7] = 1
+
+ # Subsample to balance positive and negative anchors
+ # Don't let positives be more than half the anchors
+ ids = np.where(rpn_match == 1)[0]
+ extra = len(ids) - (config.RPN_TRAIN_ANCHORS_PER_IMAGE // 2)
+ if extra > 0:
+ # Reset the extra ones to neutral
+ ids = np.random.choice(ids, extra, replace=False)
+ rpn_match[ids] = 0
+ # Same for negative proposals
+ ids = np.where(rpn_match == -1)[0]
+ extra = len(ids) - (config.RPN_TRAIN_ANCHORS_PER_IMAGE -
+ np.sum(rpn_match == 1))
+ if extra > 0:
+ # Reset the extra ones to neutral
+ ids = np.random.choice(ids, extra, replace=False)
+ rpn_match[ids] = 0
+
+ # For positive anchors, compute shift and scale needed to transform them
+ # to match the corresponding GT boxes.
+ ids = np.where(rpn_match == 1)[0]
+ ix = 0 # index into rpn_bbox
+ # TODO: use box_refinement() rather than duplicating the code here
+ for i, a in zip(ids, anchors[ids]):
+ # Closest gt box (it might have IoU < 0.7)
+ gt = gt_boxes[anchor_iou_argmax[i]]
+
+ # Convert coordinates to center plus width/height.
+ # GT Box
+ gt_h = gt[2] - gt[0]
+ gt_w = gt[3] - gt[1]
+ gt_center_y = gt[0] + 0.5 * gt_h
+ gt_center_x = gt[1] + 0.5 * gt_w
+ # Anchor
+ a_h = a[2] - a[0]
+ a_w = a[3] - a[1]
+ a_center_y = a[0] + 0.5 * a_h
+ a_center_x = a[1] + 0.5 * a_w
+
+ # Compute the bbox refinement that the RPN should predict.
+ rpn_bbox[ix] = [
+ (gt_center_y - a_center_y) / a_h,
+ (gt_center_x - a_center_x) / a_w,
+ np.log(gt_h / a_h),
+ np.log(gt_w / a_w),
+ ]
+ # Normalize
+ rpn_bbox[ix] /= config.RPN_BBOX_STD_DEV
+ ix += 1
+
+ return rpn_match, rpn_bbox
+
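+ # The deltas computed above use the standard R-CNN box parameterization, so a
+ # decoder (e.g. the proposal layer) can invert them roughly as:
+ #   center_y = a_center_y + dy * a_h
+ #   center_x = a_center_x + dx * a_w
+ #   h = a_h * exp(dh_log);  w = a_w * exp(dw_log)
+ # after first multiplying the stored deltas back by RPN_BBOX_STD_DEV, since
+ # they were normalized by it just above.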
+
+def generate_random_rois(image_shape, count, gt_class_ids, gt_boxes):
+ """Generates ROI proposals similar to what a region proposal network
+ would generate.
+
+ image_shape: [Height, Width, Depth]
+ count: Number of ROIs to generate
+ gt_class_ids: [N] Integer ground truth class IDs
+ gt_boxes: [N, (y1, x1, y2, x2)] Ground truth boxes in pixels.
+
+ Returns: [count, (y1, x1, y2, x2)] ROI boxes in pixels.
+ """
+ # placeholder
+ rois = np.zeros((count, 4), dtype=np.int32)
+
+ # Generate random ROIs around GT boxes (90% of count)
+ rois_per_box = int(0.9 * count / gt_boxes.shape[0])
+ for i in range(gt_boxes.shape[0]):
+ gt_y1, gt_x1, gt_y2, gt_x2 = gt_boxes[i]
+ h = gt_y2 - gt_y1
+ w = gt_x2 - gt_x1
+ # random boundaries
+ r_y1 = max(gt_y1 - h, 0)
+ r_y2 = min(gt_y2 + h, image_shape[0])
+ r_x1 = max(gt_x1 - w, 0)
+ r_x2 = min(gt_x2 + w, image_shape[1])
+
+ # To avoid generating boxes with zero area, we generate double what
+ # we need and filter out the extra. If we get fewer valid boxes
+ # than we need, we loop and try again.
+ while True:
+ y1y2 = np.random.randint(r_y1, r_y2, (rois_per_box * 2, 2))
+ x1x2 = np.random.randint(r_x1, r_x2, (rois_per_box * 2, 2))
+ # Filter out zero area boxes
+ threshold = 1
+ y1y2 = y1y2[np.abs(y1y2[:, 0] - y1y2[:, 1]) >=
+ threshold][:rois_per_box]
+ x1x2 = x1x2[np.abs(x1x2[:, 0] - x1x2[:, 1]) >=
+ threshold][:rois_per_box]
+ if y1y2.shape[0] == rois_per_box and x1x2.shape[0] == rois_per_box:
+ break
+
+ # Sort on axis 1 to ensure x1 <= x2 and y1 <= y2 and then reshape
+ # into x1, y1, x2, y2 order
+ x1, x2 = np.split(np.sort(x1x2, axis=1), 2, axis=1)
+ y1, y2 = np.split(np.sort(y1y2, axis=1), 2, axis=1)
+ box_rois = np.hstack([y1, x1, y2, x2])
+ rois[rois_per_box * i:rois_per_box * (i + 1)] = box_rois
+
+ # Generate random ROIs anywhere in the image (10% of count)
+ remaining_count = count - (rois_per_box * gt_boxes.shape[0])
+ # To avoid generating boxes with zero area, we generate double what
+ # we need and filter out the extra. If we get fewer valid boxes
+ # than we need, we loop and try again.
+ while True:
+ y1y2 = np.random.randint(0, image_shape[0], (remaining_count * 2, 2))
+ x1x2 = np.random.randint(0, image_shape[1], (remaining_count * 2, 2))
+ # Filter out zero area boxes
+ threshold = 1
+ y1y2 = y1y2[np.abs(y1y2[:, 0] - y1y2[:, 1]) >=
+ threshold][:remaining_count]
+ x1x2 = x1x2[np.abs(x1x2[:, 0] - x1x2[:, 1]) >=
+ threshold][:remaining_count]
+ if y1y2.shape[0] == remaining_count and x1x2.shape[0] == remaining_count:
+ break
+
+ # Sort on axis 1 to ensure x1 <= x2 and y1 <= y2 and then reshape
+ # into x1, y1, x2, y2 order
+ x1, x2 = np.split(np.sort(x1x2, axis=1), 2, axis=1)
+ y1, y2 = np.split(np.sort(y1y2, axis=1), 2, axis=1)
+ global_rois = np.hstack([y1, x1, y2, x2])
+ rois[-remaining_count:] = global_rois
+ return rois
+
+
+def data_generator(dataset, config, shuffle=True, augment=False, augmentation=None,
+ random_rois=0, batch_size=1, detection_targets=False,
+ no_augmentation_sources=None):
+ """A generator that returns images and corresponding target class ids,
+ bounding box deltas, and masks.
+
+ dataset: The Dataset object to pick data from
+ config: The model config object
+ shuffle: If True, shuffles the samples before every epoch
+ augment: (deprecated. Use augmentation instead). If true, apply random
+ image augmentation. Currently, only horizontal flipping is offered.
+ augmentation: Optional. An imgaug (https://github.com/aleju/imgaug) augmentation.
+ For example, passing imgaug.augmenters.Fliplr(0.5) flips images
+ right/left 50% of the time.
+ random_rois: If > 0 then generate proposals to be used to train the
+ network classifier and mask heads. Useful if training
+ the Mask RCNN part without the RPN.
+ batch_size: How many images to return in each call
+ detection_targets: If True, generate detection targets (class IDs, bbox
+ deltas, and masks). Typically for debugging or visualizations because
+ in training detection targets are generated by DetectionTargetLayer.
+ no_augmentation_sources: Optional. List of sources to exclude for
+ augmentation. A source is string that identifies a dataset and is
+ defined in the Dataset class.
+
+ Returns a Python generator. Upon calling next() on it, the
+ generator returns two lists, inputs and outputs. The contents
+ of the lists differ depending on the received arguments:
+ inputs list:
+ - images: [batch, H, W, C]
+ - image_meta: [batch, (meta data)] Image details. See compose_image_meta()
+ - rpn_match: [batch, N] Integer (1=positive anchor, -1=negative, 0=neutral)
+ - rpn_bbox: [batch, N, (dy, dx, log(dh), log(dw))] Anchor bbox deltas.
+ - gt_class_ids: [batch, MAX_GT_INSTANCES] Integer class IDs
+ - gt_boxes: [batch, MAX_GT_INSTANCES, (y1, x1, y2, x2)]
+ - gt_masks: [batch, height, width, MAX_GT_INSTANCES]. The height and width
+ are those of the image unless use_mini_mask is True, in which
+ case they are defined in MINI_MASK_SHAPE.
+
+ outputs list: Usually empty in regular training. But if detection_targets
+ is True then the outputs list contains target class_ids, bbox deltas,
+ and masks.
+ """
+ b = 0 # batch item index
+ image_index = -1
+ image_ids = np.copy(dataset.image_ids)
+ error_count = 0
+ no_augmentation_sources = no_augmentation_sources or []
+
+ # Anchors
+ # [anchor_count, (y1, x1, y2, x2)]
+ backbone_shapes = compute_backbone_shapes(config, config.IMAGE_SHAPE)
+ anchors = utils.generate_pyramid_anchors(config.RPN_ANCHOR_SCALES,
+ config.RPN_ANCHOR_RATIOS,
+ backbone_shapes,
+ config.BACKBONE_STRIDES,
+ config.RPN_ANCHOR_STRIDE)
+
+ # Keras requires a generator to run indefinitely.
+ while True:
+ try:
+ # Increment index to pick next image. Shuffle if at the start of an epoch.
+ image_index = (image_index + 1) % len(image_ids)
+ if shuffle and image_index == 0:
+ np.random.shuffle(image_ids)
+
+ # Get GT bounding boxes and masks for image.
+ image_id = image_ids[image_index]
+
+ # If the image source is not to be augmented pass None as augmentation
+ if dataset.image_info[image_id]['source'] in no_augmentation_sources:
+ image, image_meta, gt_class_ids, gt_boxes, gt_masks = \
+ load_image_gt(dataset, config, image_id, augment=augment,
+ augmentation=None,
+ use_mini_mask=config.USE_MINI_MASK)
+ else:
+ image, image_meta, gt_class_ids, gt_boxes, gt_masks = \
+ load_image_gt(dataset, config, image_id, augment=augment,
+ augmentation=augmentation,
+ use_mini_mask=config.USE_MINI_MASK)
+
+ # Skip images that have no instances. This can happen in cases
+ # where we train on a subset of classes and the image doesn't
+ # have any of the classes we care about.
+ if not np.any(gt_class_ids > 0):
+ continue
+
+ # RPN Targets
+ rpn_match, rpn_bbox = build_rpn_targets(image.shape, anchors,
+ gt_class_ids, gt_boxes, config)
+
+ # Mask R-CNN Targets
+ if random_rois:
+ rpn_rois = generate_random_rois(
+ image.shape, random_rois, gt_class_ids, gt_boxes)
+ if detection_targets:
+ rois, mrcnn_class_ids, mrcnn_bbox, mrcnn_mask = \
+ build_detection_targets(
+ rpn_rois, gt_class_ids, gt_boxes, gt_masks, config)
+
+ # Init batch arrays
+ if b == 0:
+ batch_image_meta = np.zeros(
+ (batch_size,) + image_meta.shape, dtype=image_meta.dtype)
+ batch_rpn_match = np.zeros(
+ [batch_size, anchors.shape[0], 1], dtype=rpn_match.dtype)
+ batch_rpn_bbox = np.zeros(
+ [batch_size, config.RPN_TRAIN_ANCHORS_PER_IMAGE, 4], dtype=rpn_bbox.dtype)
+ batch_images = np.zeros(
+ (batch_size,) + image.shape, dtype=np.float32)
+ batch_gt_class_ids = np.zeros(
+ (batch_size, config.MAX_GT_INSTANCES), dtype=np.int32)
+ batch_gt_boxes = np.zeros(
+ (batch_size, config.MAX_GT_INSTANCES, 4), dtype=np.int32)
+ batch_gt_masks = np.zeros(
+ (batch_size, gt_masks.shape[0], gt_masks.shape[1],
+ config.MAX_GT_INSTANCES), dtype=gt_masks.dtype)
+ if random_rois:
+ batch_rpn_rois = np.zeros(
+ (batch_size, rpn_rois.shape[0], 4), dtype=rpn_rois.dtype)
+ if detection_targets:
+ batch_rois = np.zeros(
+ (batch_size,) + rois.shape, dtype=rois.dtype)
+ batch_mrcnn_class_ids = np.zeros(
+ (batch_size,) + mrcnn_class_ids.shape, dtype=mrcnn_class_ids.dtype)
+ batch_mrcnn_bbox = np.zeros(
+ (batch_size,) + mrcnn_bbox.shape, dtype=mrcnn_bbox.dtype)
+ batch_mrcnn_mask = np.zeros(
+ (batch_size,) + mrcnn_mask.shape, dtype=mrcnn_mask.dtype)
+
+ # If more instances than fit in the array, sub-sample from them.
+ if gt_boxes.shape[0] > config.MAX_GT_INSTANCES:
+ ids = np.random.choice(
+ np.arange(gt_boxes.shape[0]), config.MAX_GT_INSTANCES, replace=False)
+ gt_class_ids = gt_class_ids[ids]
+ gt_boxes = gt_boxes[ids]
+ gt_masks = gt_masks[:, :, ids]
+
+ # Add to batch
+ batch_image_meta[b] = image_meta
+ batch_rpn_match[b] = rpn_match[:, np.newaxis]
+ batch_rpn_bbox[b] = rpn_bbox
+ batch_images[b] = mold_image(image.astype(np.float32), config)
+ batch_gt_class_ids[b, :gt_class_ids.shape[0]] = gt_class_ids
+ batch_gt_boxes[b, :gt_boxes.shape[0]] = gt_boxes
+ batch_gt_masks[b, :, :, :gt_masks.shape[-1]] = gt_masks
+ if random_rois:
+ batch_rpn_rois[b] = rpn_rois
+ if detection_targets:
+ batch_rois[b] = rois
+ batch_mrcnn_class_ids[b] = mrcnn_class_ids
+ batch_mrcnn_bbox[b] = mrcnn_bbox
+ batch_mrcnn_mask[b] = mrcnn_mask
+ b += 1
+
+ # Batch full?
+ if b >= batch_size:
+ inputs = [batch_images, batch_image_meta, batch_rpn_match, batch_rpn_bbox,
+ batch_gt_class_ids, batch_gt_boxes, batch_gt_masks]
+ outputs = []
+
+ if random_rois:
+ inputs.extend([batch_rpn_rois])
+ if detection_targets:
+ inputs.extend([batch_rois])
+ # Keras requires that output and targets have the same number of dimensions
+ batch_mrcnn_class_ids = np.expand_dims(
+ batch_mrcnn_class_ids, -1)
+ outputs.extend(
+ [batch_mrcnn_class_ids, batch_mrcnn_bbox, batch_mrcnn_mask])
+
+ yield inputs, outputs
+
+ # start a new batch
+ b = 0
+ except (GeneratorExit, KeyboardInterrupt):
+ raise
+ except:
+ # Log it and skip the image
+ logging.exception("Error processing image {}".format(
+ dataset.image_info[image_id]))
+ error_count += 1
+ if error_count > 5:
+ raise
+
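+ # Minimal usage sketch (assumes `train_dataset` and `config` are already set
+ # up; this mirrors how train() below feeds the generator to fit_generator):
+ #
+ #   gen = data_generator(train_dataset, config, shuffle=True,
+ #                        batch_size=config.BATCH_SIZE)
+ #   inputs, outputs = next(gen)
+ #   # inputs[0] is the batch of molded images; outputs is [] in normal training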
+
+############################################################
+# MaskRCNN Class
+############################################################
+
+class MaskRCNN():
+ """Encapsulates the Mask RCNN model functionality.
+
+ The actual Keras model is in the keras_model property.
+ """
+
+ def __init__(self, mode, config, model_dir):
+ """
+ mode: Either "training" or "inference"
+ config: A Sub-class of the Config class
+ model_dir: Directory to save training logs and trained weights
+ """
+ assert mode in ['training', 'inference']
+ self.mode = mode
+ self.config = config
+ self.model_dir = model_dir
+ self.set_log_dir()
+ self.keras_model = self.build(mode=mode, config=config)
+
+ def build(self, mode, config):
+ """Build Mask R-CNN architecture.
+ input_shape: The shape of the input image.
+ mode: Either "training" or "inference". The inputs and
+ outputs of the model differ accordingly.
+ """
+ assert mode in ['training', 'inference']
+
+ # Image size must be divisible by 2 multiple times
+ h, w = config.IMAGE_SHAPE[:2]
+ if h / 2 ** 6 != int(h / 2 ** 6) or w / 2 ** 6 != int(w / 2 ** 6):
+ raise Exception("Image size must be divisible by 2 at least 6 times "
+ "to avoid fractions when downscaling and upscaling. "
+ "For example, use 256, 320, 384, 448, 512, ... etc. ")
+
+ # Inputs
+ input_image = KL.Input(
+ shape=[None, None, 3], name="input_image")
+ input_image_meta = KL.Input(shape=[config.IMAGE_META_SIZE],
+ name="input_image_meta")
+ if mode == "training":
+ # RPN GT
+ input_rpn_match = KL.Input(
+ shape=[None, 1], name="input_rpn_match", dtype=tf.int32)
+ input_rpn_bbox = KL.Input(
+ shape=[None, 4], name="input_rpn_bbox", dtype=tf.float32)
+
+ # Detection GT (class IDs, bounding boxes, and masks)
+ # 1. GT Class IDs (zero padded)
+ input_gt_class_ids = KL.Input(
+ shape=[None], name="input_gt_class_ids", dtype=tf.int32)
+ # 2. GT Boxes in pixels (zero padded)
+ # [batch, MAX_GT_INSTANCES, (y1, x1, y2, x2)] in image coordinates
+ input_gt_boxes = KL.Input(
+ shape=[None, 4], name="input_gt_boxes", dtype=tf.float32)
+ # Normalize coordinates
+ gt_boxes = KL.Lambda(lambda x: norm_boxes_graph(
+ x, K.shape(input_image)[1:3]))(input_gt_boxes)
+ # 3. GT Masks (zero padded)
+ # [batch, height, width, MAX_GT_INSTANCES]
+ if config.USE_MINI_MASK:
+ input_gt_masks = KL.Input(
+ shape=[config.MINI_MASK_SHAPE[0],
+ config.MINI_MASK_SHAPE[1], None],
+ name="input_gt_masks", dtype=bool)
+ else:
+ input_gt_masks = KL.Input(
+ shape=[config.IMAGE_SHAPE[0], config.IMAGE_SHAPE[1], None],
+ name="input_gt_masks", dtype=bool)
+ elif mode == "inference":
+ # Anchors in normalized coordinates
+ input_anchors = KL.Input(shape=[None, 4], name="input_anchors")
+
+ # Build the shared convolutional layers.
+ # Bottom-up Layers
+ # Returns a list of the last layers of each stage, 5 in total.
+ # Stage 1 (C1) isn't used by the FPN, so it is discarded when unpacking below.
+ if callable(config.BACKBONE):
+ _, C2, C3, C4, C5 = config.BACKBONE(input_image, stage5=True,
+ train_bn=config.TRAIN_BN)
+ else:
+ _, C2, C3, C4, C5 = resnet_graph(input_image, config.BACKBONE,
+ stage5=True, train_bn=config.TRAIN_BN)
+ # Top-down Layers
+ # TODO: add assert to verify feature map sizes match what's in config
+ P5 = KL.Conv2D(config.TOP_DOWN_PYRAMID_SIZE, (1, 1), name='fpn_c5p5')(C5)
+ P4 = KL.Add(name="fpn_p4add")([
+ KL.UpSampling2D(size=(2, 2), name="fpn_p5upsampled")(P5),
+ KL.Conv2D(config.TOP_DOWN_PYRAMID_SIZE, (1, 1), name='fpn_c4p4')(C4)])
+ P3 = KL.Add(name="fpn_p3add")([
+ KL.UpSampling2D(size=(2, 2), name="fpn_p4upsampled")(P4),
+ KL.Conv2D(config.TOP_DOWN_PYRAMID_SIZE, (1, 1), name='fpn_c3p3')(C3)])
+ P2 = KL.Add(name="fpn_p2add")([
+ KL.UpSampling2D(size=(2, 2), name="fpn_p3upsampled")(P3),
+ KL.Conv2D(config.TOP_DOWN_PYRAMID_SIZE, (1, 1), name='fpn_c2p2')(C2)])
+ # Attach 3x3 conv to all P layers to get the final feature maps.
+ P2 = KL.Conv2D(config.TOP_DOWN_PYRAMID_SIZE, (3, 3), padding="SAME", name="fpn_p2")(P2)
+ P3 = KL.Conv2D(config.TOP_DOWN_PYRAMID_SIZE, (3, 3), padding="SAME", name="fpn_p3")(P3)
+ P4 = KL.Conv2D(config.TOP_DOWN_PYRAMID_SIZE, (3, 3), padding="SAME", name="fpn_p4")(P4)
+ P5 = KL.Conv2D(config.TOP_DOWN_PYRAMID_SIZE, (3, 3), padding="SAME", name="fpn_p5")(P5)
+ # P6 is used for the 5th anchor scale in RPN. Generated by
+ # subsampling from P5 with stride of 2.
+ P6 = KL.MaxPooling2D(pool_size=(1, 1), strides=2, name="fpn_p6")(P5)
+
+ # Note that P6 is used in RPN, but not in the classifier heads.
+ rpn_feature_maps = [P2, P3, P4, P5, P6]
+ mrcnn_feature_maps = [P2, P3, P4, P5]
+
+ # Anchors
+ if mode == "training":
+ anchors = self.get_anchors(config.IMAGE_SHAPE)
+ # Duplicate across the batch dimension because Keras requires it
+ # TODO: can this be optimized to avoid duplicating the anchors?
+ anchors = np.broadcast_to(anchors, (config.BATCH_SIZE,) + anchors.shape)
+ # A hack to get around Keras's bad support for constants
+ anchors = KL.Lambda(lambda x: tf.Variable(anchors), name="anchors")(input_image)
+ else:
+ anchors = input_anchors
+
+ # RPN Model
+ rpn = build_rpn_model(config.RPN_ANCHOR_STRIDE,
+ len(config.RPN_ANCHOR_RATIOS), config.TOP_DOWN_PYRAMID_SIZE)
+ # Loop through pyramid layers
+ layer_outputs = [] # list of lists
+ for p in rpn_feature_maps:
+ layer_outputs.append(rpn([p]))
+ # Concatenate layer outputs
+ # Convert from list of lists of level outputs to list of lists
+ # of outputs across levels.
+ # e.g. [[a1, b1, c1], [a2, b2, c2]] => [[a1, a2], [b1, b2], [c1, c2]]
+ output_names = ["rpn_class_logits", "rpn_class", "rpn_bbox"]
+ outputs = list(zip(*layer_outputs))
+ outputs = [KL.Concatenate(axis=1, name=n)(list(o))
+ for o, n in zip(outputs, output_names)]
+
+ rpn_class_logits, rpn_class, rpn_bbox = outputs
+
+ # Generate proposals
+ # Proposals are [batch, N, (y1, x1, y2, x2)] in normalized coordinates
+ # and zero padded.
+ proposal_count = config.POST_NMS_ROIS_TRAINING if mode == "training" \
+ else config.POST_NMS_ROIS_INFERENCE
+ rpn_rois = ProposalLayer(
+ proposal_count=proposal_count,
+ nms_threshold=config.RPN_NMS_THRESHOLD,
+ name="ROI",
+ config=config)([rpn_class, rpn_bbox, anchors])
+
+ if mode == "training":
+ # Class ID mask to mark class IDs supported by the dataset the image
+ # came from.
+ active_class_ids = KL.Lambda(
+ lambda x: parse_image_meta_graph(x)["active_class_ids"]
+ )(input_image_meta)
+
+ if not config.USE_RPN_ROIS:
+ # Ignore predicted ROIs and use ROIs provided as an input.
+ input_rois = KL.Input(shape=[config.POST_NMS_ROIS_TRAINING, 4],
+ name="input_roi", dtype=np.int32)
+ # Normalize coordinates
+ target_rois = KL.Lambda(lambda x: norm_boxes_graph(
+ x, K.shape(input_image)[1:3]))(input_rois)
+ else:
+ target_rois = rpn_rois
+
+ # Generate detection targets
+ # Subsamples proposals and generates target outputs for training
+ # Note that proposal class IDs, gt_boxes, and gt_masks are zero
+ # padded. Equally, returned rois and targets are zero padded.
+ rois, target_class_ids, target_bbox, target_mask = \
+ DetectionTargetLayer(config, name="proposal_targets")([
+ target_rois, input_gt_class_ids, gt_boxes, input_gt_masks])
+
+ # Network Heads
+ # TODO: verify that this handles zero padded ROIs
+ mrcnn_class_logits, mrcnn_class, mrcnn_bbox = \
+ fpn_classifier_graph(rois, mrcnn_feature_maps, input_image_meta,
+ config.POOL_SIZE, config.NUM_CLASSES,
+ train_bn=config.TRAIN_BN,
+ fc_layers_size=config.FPN_CLASSIF_FC_LAYERS_SIZE)
+
+ mrcnn_mask = build_fpn_mask_graph(rois, mrcnn_feature_maps,
+ input_image_meta,
+ config.MASK_POOL_SIZE,
+ config.NUM_CLASSES,
+ train_bn=config.TRAIN_BN)
+
+ # TODO: clean up (use tf.identify if necessary)
+ output_rois = KL.Lambda(lambda x: x * 1, name="output_rois")(rois)
+
+ # Losses
+ rpn_class_loss = KL.Lambda(lambda x: rpn_class_loss_graph(*x), name="rpn_class_loss")(
+ [input_rpn_match, rpn_class_logits])
+ rpn_bbox_loss = KL.Lambda(lambda x: rpn_bbox_loss_graph(config, *x), name="rpn_bbox_loss")(
+ [input_rpn_bbox, input_rpn_match, rpn_bbox])
+ class_loss = KL.Lambda(lambda x: mrcnn_class_loss_graph(*x), name="mrcnn_class_loss")(
+ [target_class_ids, mrcnn_class_logits, active_class_ids])
+ bbox_loss = KL.Lambda(lambda x: mrcnn_bbox_loss_graph(*x), name="mrcnn_bbox_loss")(
+ [target_bbox, target_class_ids, mrcnn_bbox])
+ mask_loss = KL.Lambda(lambda x: mrcnn_mask_loss_graph(*x), name="mrcnn_mask_loss")(
+ [target_mask, target_class_ids, mrcnn_mask])
+
+ # Model
+ inputs = [input_image, input_image_meta,
+ input_rpn_match, input_rpn_bbox, input_gt_class_ids, input_gt_boxes, input_gt_masks]
+ if not config.USE_RPN_ROIS:
+ inputs.append(input_rois)
+ outputs = [rpn_class_logits, rpn_class, rpn_bbox,
+ mrcnn_class_logits, mrcnn_class, mrcnn_bbox, mrcnn_mask,
+ rpn_rois, output_rois,
+ rpn_class_loss, rpn_bbox_loss, class_loss, bbox_loss, mask_loss]
+ model = KM.Model(inputs, outputs, name='mask_rcnn')
+ else:
+ # Network Heads
+ # Proposal classifier and BBox regressor heads
+ mrcnn_class_logits, mrcnn_class, mrcnn_bbox = \
+ fpn_classifier_graph(rpn_rois, mrcnn_feature_maps, input_image_meta,
+ config.POOL_SIZE, config.NUM_CLASSES,
+ train_bn=config.TRAIN_BN,
+ fc_layers_size=config.FPN_CLASSIF_FC_LAYERS_SIZE)
+
+ # Detections
+ # output is [batch, num_detections, (y1, x1, y2, x2, class_id, score)] in
+ # normalized coordinates
+ detections = DetectionLayer(config, name="mrcnn_detection")(
+ [rpn_rois, mrcnn_class, mrcnn_bbox, input_image_meta])
+
+ # Create masks for detections
+ detection_boxes = KL.Lambda(lambda x: x[..., :4])(detections)
+ mrcnn_mask = build_fpn_mask_graph(detection_boxes, mrcnn_feature_maps,
+ input_image_meta,
+ config.MASK_POOL_SIZE,
+ config.NUM_CLASSES,
+ train_bn=config.TRAIN_BN)
+
+ model = KM.Model([input_image, input_image_meta, input_anchors],
+ [detections, mrcnn_class, mrcnn_bbox,
+ mrcnn_mask, rpn_rois, rpn_class, rpn_bbox],
+ name='mask_rcnn')
+
+ return model
+
+ def find_last(self):
+ """Finds the last checkpoint file of the last trained model in the
+ model directory.
+ Returns:
+ The path of the last checkpoint file
+ """
+ # Get directory names. Each directory corresponds to a model
+ dir_names = next(os.walk(self.model_dir))[1]
+ print("dirnames", dir_names)
+ key = self.config.NAME.lower()
+ print("key", key)
+ dir_names = filter(lambda f: f.startswith(key), dir_names)
+ dir_names = sorted(dir_names)
+ if not dir_names:
+ import errno
+ raise FileNotFoundError(
+ errno.ENOENT,
+ "Could not find model directory under {}".format(self.model_dir))
+ # Pick last directory
+ dir_name = os.path.join(self.model_dir, dir_names[-1])
+ # Find the last checkpoint
+ checkpoints = next(os.walk(dir_name))[2]
+ checkpoints = filter(lambda f: f.startswith("mask_rcnn"), checkpoints)
+ checkpoints = sorted(checkpoints)
+ if not checkpoints:
+ import errno
+ raise FileNotFoundError(
+ errno.ENOENT, "Could not find weight files in {}".format(dir_name))
+ checkpoint = os.path.join(dir_name, checkpoints[-1])
+ return checkpoint
+
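+ # Common pattern when resuming training (a sketch; assumes `model` was created
+ # in "training" mode with the same config and model_dir):
+ #
+ #   weights_path = model.find_last()
+ #   model.load_weights(weights_path, by_name=True)
+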
+ def load_weights(self, filepath, by_name=False, exclude=None):
+ """Modified version of the corresponding Keras function with
+ the addition of multi-GPU support and the ability to exclude
+ some layers from loading.
+ exclude: list of layer names to exclude
+ """
+ import h5py
+ # Conditional import to support versions of Keras before 2.2
+ # TODO: remove in about 6 months (end of 2018)
+ try:
+ from keras.engine import saving
+ except ImportError:
+ # Keras before 2.2 used the 'topology' namespace.
+ from keras.engine import topology as saving
+
+ if exclude:
+ by_name = True
+
+ if h5py is None:
+ raise ImportError('`load_weights` requires h5py.')
+ f = h5py.File(filepath, mode='r')
+ if 'layer_names' not in f.attrs and 'model_weights' in f:
+ f = f['model_weights']
+
+ # In multi-GPU training, we wrap the model. Get layers
+ # of the inner model because they have the weights.
+ keras_model = self.keras_model
+ layers = keras_model.inner_model.layers if hasattr(keras_model, "inner_model") \
+ else keras_model.layers
+
+ # Exclude some layers
+ if exclude:
+ layers = filter(lambda l: l.name not in exclude, layers)
+
+ if by_name:
+ saving.load_weights_from_hdf5_group_by_name(f, layers)
+ else:
+ saving.load_weights_from_hdf5_group(f, layers)
+ if hasattr(f, 'close'):
+ f.close()
+
+ # Update the log directory
+ self.set_log_dir(filepath)
+
+ def get_imagenet_weights(self):
+ """Downloads ImageNet trained weights from Keras.
+ Returns path to weights file.
+ """
+ from keras.utils.data_utils import get_file
+ TF_WEIGHTS_PATH_NO_TOP = 'https://github.com/fchollet/deep-learning-models/' \
+ 'releases/download/v0.2/' \
+ 'resnet50_weights_tf_dim_ordering_tf_kernels_notop.h5'
+ weights_path = get_file('resnet50_weights_tf_dim_ordering_tf_kernels_notop.h5',
+ TF_WEIGHTS_PATH_NO_TOP,
+ cache_subdir='models',
+ md5_hash='a268eb855778b3df3c7506639542a6af')
+ return weights_path
+
+ def compile(self, learning_rate, momentum):
+ """Gets the model ready for training. Adds losses, regularization, and
+ metrics. Then calls the Keras compile() function.
+ """
+ # Optimizer object
+ optimizer = keras.optimizers.SGD(
+ lr=learning_rate, momentum=momentum,
+ clipnorm=self.config.GRADIENT_CLIP_NORM)
+ # Add Losses
+ # First, clear previously set losses to avoid duplication
+ self.keras_model._losses = []
+ self.keras_model._per_input_losses = {}
+ loss_names = [
+ "rpn_class_loss", "rpn_bbox_loss",
+ "mrcnn_class_loss", "mrcnn_bbox_loss", "mrcnn_mask_loss"]
+ for name in loss_names:
+ layer = self.keras_model.get_layer(name)
+ if layer.output in self.keras_model.losses:
+ continue
+ loss = (
+ tf.reduce_mean(layer.output, keepdims=True)
+ * self.config.LOSS_WEIGHTS.get(name, 1.))
+ self.keras_model.add_loss(loss)
+
+ # Add L2 Regularization
+ # Skip gamma and beta weights of batch normalization layers.
+ reg_losses = [
+ keras.regularizers.l2(self.config.WEIGHT_DECAY)(w) / tf.cast(tf.size(w), tf.float32)
+ for w in self.keras_model.trainable_weights
+ if 'gamma' not in w.name and 'beta' not in w.name]
+ self.keras_model.add_loss(tf.add_n(reg_losses))
+
+ # Compile
+ self.keras_model.compile(
+ optimizer=optimizer,
+ loss=[None] * len(self.keras_model.outputs))
+
+ # Add metrics for losses
+ for name in loss_names:
+ if name in self.keras_model.metrics_names:
+ continue
+ layer = self.keras_model.get_layer(name)
+ self.keras_model.metrics_names.append(name)
+ loss = (
+ tf.reduce_mean(layer.output, keepdims=True)
+ * self.config.LOSS_WEIGHTS.get(name, 1.))
+ self.keras_model.metrics_tensors.append(loss)
+
+ def set_trainable(self, layer_regex, keras_model=None, indent=0, verbose=1):
+ """Sets model layers as trainable if their names match
+ the given regular expression.
+ """
+ # Print message on the first call (but not on recursive calls)
+ if verbose > 0 and keras_model is None:
+ log("Selecting layers to train")
+
+ keras_model = keras_model or self.keras_model
+
+ # In multi-GPU training, we wrap the model. Get layers
+ # of the inner model because they have the weights.
+ layers = keras_model.inner_model.layers if hasattr(keras_model, "inner_model") \
+ else keras_model.layers
+
+ for layer in layers:
+ # Is the layer a model?
+ if layer.__class__.__name__ == 'Model':
+ print("In model: ", layer.name)
+ self.set_trainable(
+ layer_regex, keras_model=layer, indent=indent + 4)
+ continue
+
+ if not layer.weights:
+ continue
+ # Is it trainable?
+ trainable = bool(re.fullmatch(layer_regex, layer.name))
+ # Update layer. If layer is a container, update inner layer.
+ if layer.__class__.__name__ == 'TimeDistributed':
+ layer.layer.trainable = trainable
+ else:
+ layer.trainable = trainable
+ # Print trainable layer names
+ if trainable and verbose > 0:
+ log("{}{:20} ({})".format(" " * indent, layer.name,
+ layer.__class__.__name__))
+
+ def set_log_dir(self, model_path=None):
+ """Sets the model log directory and epoch counter.
+
+ model_path: If None, or a format different from what this code uses,
+ then set a new log directory and start epochs from 0. Otherwise,
+ extract the log directory and the epoch counter from the file
+ name.
+ """
+ # Set date and epoch counter as if starting a new model
+ self.epoch = 0
+ now = datetime.datetime.now()
+
+ # If we have a model path with date and epochs use them
+ if model_path:
+ # Continue from where we left off. Get epoch and date from the file name
+ # A sample model path might look like:
+ # /path/to/logs/coco20171029T2315/mask_rcnn_coco_0001.h5
+ regex = r".*/[\w-]+(\d{4})(\d{2})(\d{2})T(\d{2})(\d{2})/mask\_rcnn\_[\w-]+(\d{4})\.h5"
+ m = re.match(regex, model_path)
+ if m:
+ now = datetime.datetime(int(m.group(1)), int(m.group(2)), int(m.group(3)),
+ int(m.group(4)), int(m.group(5)))
+ # Epoch number in file is 1-based, and in Keras code it's 0-based.
+ # So, adjust for that then increment by one to start from the next epoch
+ self.epoch = int(m.group(6)) - 1 + 1
+ print('Re-starting from epoch %d' % self.epoch)
+
+ # Directory for training logs. Restored because train() below relies on
+ # self.log_dir and self.checkpoint_path being set here.
+ self.log_dir = os.path.join(self.model_dir, "{}{:%Y%m%dT%H%M}".format(
+ self.config.NAME.lower(), now))
+
+ # Create log_dir if it doesn't exist
+ if not os.path.exists(self.log_dir):
+ os.makedirs(self.log_dir)
+
+ # Path to save after each epoch. Include placeholders that get filled by Keras.
+ self.checkpoint_path = os.path.join(self.log_dir, "mask_rcnn_{}_*epoch*.h5".format(
+ self.config.NAME.lower()))
+ self.checkpoint_path = self.checkpoint_path.replace(
+ "*epoch*", "{epoch:04d}")
+
+ def train(self, train_dataset, val_dataset, learning_rate, epochs, layers,
+ augmentation=None, custom_callbacks=None, no_augmentation_sources=None):
+ """Train the model.
+ train_dataset, val_dataset: Training and validation Dataset objects.
+ learning_rate: The learning rate to train with
+ epochs: Number of training epochs. Note that previous training epochs
+ are considered to be done already, so this actually determines
+ the epochs to train in total rather than in this particular
+ call.
+ layers: Allows selecting which layers to train. It can be:
+ - A regular expression to match layer names to train
+ - One of these predefined values:
+ heads: The RPN, classifier and mask heads of the network
+ all: All the layers
+ 3+: Train Resnet stage 3 and up
+ 4+: Train Resnet stage 4 and up
+ 5+: Train Resnet stage 5 and up
+ augmentation: Optional. An imgaug (https://github.com/aleju/imgaug)
+ augmentation. For example, passing imgaug.augmenters.Fliplr(0.5)
+ flips images right/left 50% of the time. You can pass complex
+ augmentations as well. This augmentation applies 50% of the
+ time, and when it does it flips images right/left half the time
+ and adds a Gaussian blur with a random sigma in range 0 to 5.
+
+ augmentation = imgaug.augmenters.Sometimes(0.5, [
+ imgaug.augmenters.Fliplr(0.5),
+ imgaug.augmenters.GaussianBlur(sigma=(0.0, 5.0))
+ ])
+ custom_callbacks: Optional. Add custom callbacks to be called
+ with the keras fit_generator method. Must be list of type keras.callbacks.
+ no_augmentation_sources: Optional. List of sources to exclude for
+ augmentation. A source is a string that identifies a dataset and is
+ defined in the Dataset class.
+ """
+ assert self.mode == "training", "Create model in training mode."
+
+ # Pre-defined layer regular expressions
+ layer_regex = {
+ # all layers but the backbone
+ "heads": r"(mrcnn\_.*)|(rpn\_.*)|(fpn\_.*)",
+ # From a specific Resnet stage and up
+ "3+": r"(res3.*)|(bn3.*)|(res4.*)|(bn4.*)|(res5.*)|(bn5.*)|(mrcnn\_.*)|(rpn\_.*)|(fpn\_.*)",
+ "4+": r"(res4.*)|(bn4.*)|(res5.*)|(bn5.*)|(mrcnn\_.*)|(rpn\_.*)|(fpn\_.*)",
+ "5+": r"(res5.*)|(bn5.*)|(mrcnn\_.*)|(rpn\_.*)|(fpn\_.*)",
+ # All layers
+ "all": ".*",
+ }
+ if layers in layer_regex.keys():
+ layers = layer_regex[layers]
+
+ # Data generators
+ train_generator = data_generator(train_dataset, self.config, shuffle=True,
+ augmentation=augmentation,
+ batch_size=self.config.BATCH_SIZE,
+ no_augmentation_sources=no_augmentation_sources)
+ val_generator = data_generator(val_dataset, self.config, shuffle=True,
+ batch_size=self.config.BATCH_SIZE)
+
+ # Callbacks
+ callbacks = [
+ keras.callbacks.TensorBoard(log_dir=self.log_dir,
+ histogram_freq=0, write_graph=True, write_images=False),
+ keras.callbacks.ModelCheckpoint(self.checkpoint_path,
+ verbose=0, save_weights_only=True),
+ ]
+
+ # Add custom callbacks to the list
+ if custom_callbacks:
+ callbacks += custom_callbacks
+
+ # Train
+ log("\nStarting at epoch {}. LR={}\n".format(self.epoch, learning_rate))
+ log("Checkpoint Path: {}".format(self.checkpoint_path))
+ self.set_trainable(layers)
+ self.compile(learning_rate, self.config.LEARNING_MOMENTUM)
+
+ # Work-around for Windows: Keras fails on Windows when using
+ # multiprocessing workers. See discussion here:
+ # https://github.com/matterport/Mask_RCNN/issues/13#issuecomment-353124009
+ if os.name == 'nt':
+ workers = 0
+ else:
+ workers = multiprocessing.cpu_count()
+
+ self.keras_model.fit_generator(
+ train_generator,
+ initial_epoch=self.epoch,
+ epochs=epochs,
+ steps_per_epoch=self.config.STEPS_PER_EPOCH,
+ callbacks=callbacks,
+ validation_data=val_generator,
+ validation_steps=self.config.VALIDATION_STEPS,
+ max_queue_size=100,
+ workers=workers,
+ use_multiprocessing=True,
+ )
+ self.epoch = max(self.epoch, epochs)
+
+ def mold_inputs(self, images):
+ """Takes a list of images and modifies them to the format expected
+ as an input to the neural network.
+ images: List of image matrices [height,width,depth]. Images can have
+ different sizes.
+
+ Returns 3 Numpy matrices:
+ molded_images: [N, h, w, 3]. Images resized and normalized.
+ image_metas: [N, length of meta data]. Details about each image.
+ windows: [N, (y1, x1, y2, x2)]. The portion of the image that has the
+ original image (padding excluded).
+ """
+ molded_images = []
+ image_metas = []
+ windows = []
+ for image in images:
+ # Resize image
+ # TODO: move resizing to mold_image()
+ molded_image, window, scale, padding, crop = utils.resize_image(
+ image,
+ min_dim=self.config.IMAGE_MIN_DIM,
+ min_scale=self.config.IMAGE_MIN_SCALE,
+ max_dim=self.config.IMAGE_MAX_DIM,
+ mode=self.config.IMAGE_RESIZE_MODE)
+ molded_image = mold_image(molded_image, self.config)
+ # Build image_meta
+ image_meta = compose_image_meta(
+ 0, image.shape, molded_image.shape, window, scale,
+ np.zeros([self.config.NUM_CLASSES], dtype=np.int32))
+ # Append
+ molded_images.append(molded_image)
+ windows.append(window)
+ image_metas.append(image_meta)
+ # Pack into arrays
+ molded_images = np.stack(molded_images)
+ image_metas = np.stack(image_metas)
+ windows = np.stack(windows)
+ return molded_images, image_metas, windows
+
+ def unmold_detections(self, detections, mrcnn_mask, original_image_shape,
+ image_shape, window):
+ """Reformats the detections of one image from the format of the neural
+ network output to a format suitable for use in the rest of the
+ application.
+
+ detections: [N, (y1, x1, y2, x2, class_id, score)] in normalized coordinates
+ mrcnn_mask: [N, height, width, num_classes]
+ original_image_shape: [H, W, C] Original image shape before resizing
+ image_shape: [H, W, C] Shape of the image after resizing and padding
+ window: [y1, x1, y2, x2] Pixel coordinates of box in the image where the real
+ image is excluding the padding.
+
+ Returns:
+ boxes: [N, (y1, x1, y2, x2)] Bounding boxes in pixels
+ class_ids: [N] Integer class IDs for each bounding box
+ scores: [N] Float probability scores of the class_id
+ masks: [height, width, num_instances] Instance masks
+ """
+ # How many detections do we have?
+ # Detections array is padded with zeros. Find the first class_id == 0.
+ zero_ix = np.where(detections[:, 4] == 0)[0]
+ N = zero_ix[0] if zero_ix.shape[0] > 0 else detections.shape[0]
+
+ # Extract boxes, class_ids, scores, and class-specific masks
+ boxes = detections[:N, :4]
+ class_ids = detections[:N, 4].astype(np.int32)
+ scores = detections[:N, 5]
+ masks = mrcnn_mask[np.arange(N), :, :, class_ids]
+
+ # Translate normalized coordinates in the resized image to pixel
+ # coordinates in the original image before resizing
+ window = utils.norm_boxes(window, image_shape[:2])
+ wy1, wx1, wy2, wx2 = window
+ shift = np.array([wy1, wx1, wy1, wx1])
+ wh = wy2 - wy1 # window height
+ ww = wx2 - wx1 # window width
+ scale = np.array([wh, ww, wh, ww])
+ # Convert boxes to normalized coordinates on the window
+ boxes = np.divide(boxes - shift, scale)
+ # Convert boxes to pixel coordinates on the original image
+ boxes = utils.denorm_boxes(boxes, original_image_shape[:2])
+
+ # Filter out detections with zero area. Happens in early training when
+ # network weights are still random
+ exclude_ix = np.where(
+ (boxes[:, 2] - boxes[:, 0]) * (boxes[:, 3] - boxes[:, 1]) <= 0)[0]
+ if exclude_ix.shape[0] > 0:
+ boxes = np.delete(boxes, exclude_ix, axis=0)
+ class_ids = np.delete(class_ids, exclude_ix, axis=0)
+ scores = np.delete(scores, exclude_ix, axis=0)
+ masks = np.delete(masks, exclude_ix, axis=0)
+ N = class_ids.shape[0]
+
+ # Resize masks to original image size and set boundary threshold.
+ full_masks = []
+ for i in range(N):
+ # Convert neural network mask to full size mask
+ full_mask = utils.unmold_mask(masks[i], boxes[i], original_image_shape)
+ full_masks.append(full_mask)
+ full_masks = np.stack(full_masks, axis=-1) \
+ if full_masks else np.empty(original_image_shape[:2] + (0,))
+
+ return boxes, class_ids, scores, full_masks
+
+ def detect(self, images, verbose=0):
+ """Runs the detection pipeline.
+
+ images: List of images, potentially of different sizes.
+
+ Returns a list of dicts, one dict per image. The dict contains:
+ rois: [N, (y1, x1, y2, x2)] detection bounding boxes
+ class_ids: [N] int class IDs
+ scores: [N] float probability scores for the class IDs
+ masks: [H, W, N] instance binary masks
+ """
+ assert self.mode == "inference", "Create model in inference mode."
+ assert len(
+ images) == self.config.BATCH_SIZE, "len(images) must be equal to BATCH_SIZE"
+
+ if verbose:
+ log("Processing {} images".format(len(images)))
+ for image in images:
+ log("image", image)
+
+ # Mold inputs to format expected by the neural network
+ molded_images, image_metas, windows = self.mold_inputs(images)
+
+ # Validate image sizes
+ # All images in a batch MUST be of the same size
+ image_shape = molded_images[0].shape
+ for g in molded_images[1:]:
+ assert g.shape == image_shape, \
+ "After resizing, all images must have the same size. Check IMAGE_RESIZE_MODE and image sizes."
+
+ # Anchors
+ anchors = self.get_anchors(image_shape)
+ # Duplicate across the batch dimension because Keras requires it
+ # TODO: can this be optimized to avoid duplicating the anchors?
+ anchors = np.broadcast_to(anchors, (self.config.BATCH_SIZE,) + anchors.shape)
+ if verbose:
+ print('image shape:', image_shape)
+ print('anchors shape:', anchors.shape)
+ print('Config batch size:', self.config.BATCH_SIZE)
+ print('molded_images shape:', molded_images.shape)
+ print('image_metas shape:', image_metas.shape)
+
+ if verbose:
+ log("molded_images", molded_images)
+ log("image_metas", image_metas)
+ log("anchors", anchors)
+ # Run object detection
+ detections, _, _, mrcnn_mask, _, _, _ = \
+ self.keras_model.predict([molded_images, image_metas, anchors], verbose=0)
+ print("#" * 70)
+ print(detections)
+ print(mrcnn_mask)
+ # Process detections
+ results = []
+ for i, image in enumerate(images):
+ final_rois, final_class_ids, final_scores, final_masks = \
+ self.unmold_detections(detections[i], mrcnn_mask[i],
+ image.shape, molded_images[i].shape,
+ windows[i])
+ results.append({
+ "rois": final_rois,
+ "class_ids": final_class_ids,
+ "scores": final_scores,
+ "masks": final_masks,
+ })
+ if verbose:
+ log("final_masks", final_masks)
+ return results
+
+ def detect_molded(self, molded_images, image_metas, verbose=0):
+ """Runs the detection pipeline, but expect inputs that are
+ molded already. Used mostly for debugging and inspecting
+ the model.
+
+ molded_images: List of images loaded using load_image_gt()
+ image_metas: image meta data, also returned by load_image_gt()
+
+ Returns a list of dicts, one dict per image. The dict contains:
+ rois: [N, (y1, x1, y2, x2)] detection bounding boxes
+ class_ids: [N] int class IDs
+ scores: [N] float probability scores for the class IDs
+ masks: [H, W, N] instance binary masks
+ """
+ assert self.mode == "inference", "Create model in inference mode."
+ assert len(molded_images) == self.config.BATCH_SIZE, \
+ "Number of images must be equal to BATCH_SIZE"
+
+ if verbose:
+ log("Processing {} images".format(len(molded_images)))
+ for image in molded_images:
+ log("image", image)
+
+ # Validate image sizes
+ # All images in a batch MUST be of the same size
+ image_shape = molded_images[0].shape
+ for g in molded_images[1:]:
+ assert g.shape == image_shape, "Images must have the same size"
+
+ # Anchors
+ anchors = self.get_anchors(image_shape)
+ # Duplicate across the batch dimension because Keras requires it
+ # TODO: can this be optimized to avoid duplicating the anchors?
+ anchors = np.broadcast_to(anchors, (self.config.BATCH_SIZE,) + anchors.shape)
+
+ if verbose:
+ log("molded_images", molded_images)
+ log("image_metas", image_metas)
+ log("anchors", anchors)
+ # Run object detection
+ detections, _, _, mrcnn_mask, _, _, _ = \
+ self.keras_model.predict([molded_images, image_metas, anchors], verbose=0)
+ # Process detections
+ results = []
+ for i, image in enumerate(molded_images):
+ window = [0, 0, image.shape[0], image.shape[1]]
+ final_rois, final_class_ids, final_scores, final_masks = \
+ self.unmold_detections(detections[i], mrcnn_mask[i],
+ image.shape, molded_images[i].shape,
+ window)
+ results.append({
+ "rois": final_rois,
+ "class_ids": final_class_ids,
+ "scores": final_scores,
+ "masks": final_masks,
+ })
+ return results
+
+ def get_anchors(self, image_shape):
+ """Returns anchor pyramid for the given image size."""
+ backbone_shapes = compute_backbone_shapes(self.config, image_shape)
+ # Cache anchors and reuse if image shape is the same
+ if not hasattr(self, "_anchor_cache"):
+ self._anchor_cache = {}
+ if not tuple(image_shape) in self._anchor_cache:
+ # Generate Anchors
+ a = utils.generate_pyramid_anchors(
+ self.config.RPN_ANCHOR_SCALES,
+ self.config.RPN_ANCHOR_RATIOS,
+ backbone_shapes,
+ self.config.BACKBONE_STRIDES,
+ self.config.RPN_ANCHOR_STRIDE)
+ # Keep a copy of the latest anchors in pixel coordinates because
+ # it's used in inspect_model notebooks.
+ # TODO: Remove this after the notebooks are refactored to not use it
+ self.anchors = a
+ # Normalize coordinates
+ self._anchor_cache[tuple(image_shape)] = utils.norm_boxes(a, image_shape[:2])
+ return self._anchor_cache[tuple(image_shape)]
+
+ def ancestor(self, tensor, name, checked=None):
+ """Finds the ancestor of a TF tensor in the computation graph.
+ tensor: TensorFlow symbolic tensor.
+ name: Name of ancestor tensor to find
+ checked: For internal use. A list of tensors that were already
+ searched to avoid loops in traversing the graph.
+ """
+ checked = checked if checked is not None else []
+ # Put a limit on how deep we go to avoid very long loops
+ if len(checked) > 500:
+ return None
+ # Convert name to a regex and allow matching a number prefix
+ # because Keras adds them automatically
+ if isinstance(name, str):
+ name = re.compile(name.replace("/", r"(\_\d+)*/"))
+
+ parents = tensor.op.inputs
+ for p in parents:
+ if p in checked:
+ continue
+ if bool(re.fullmatch(name, p.name)):
+ return p
+ checked.append(p)
+ a = self.ancestor(p, name, checked)
+ if a is not None:
+ return a
+ return None
+
+ def find_trainable_layer(self, layer):
+ """If a layer is encapsulated by another layer, this function
+ digs through the encapsulation and returns the layer that holds
+ the weights.
+ """
+ if layer.__class__.__name__ == 'TimeDistributed':
+ return self.find_trainable_layer(layer.layer)
+ return layer
+
+ def get_trainable_layers(self):
+ """Returns a list of layers that have weights."""
+ layers = []
+ # Loop through all layers
+ for l in self.keras_model.layers:
+ # If layer is a wrapper, find inner trainable layer
+ l = self.find_trainable_layer(l)
+ # Include layer if it has weights
+ if l.get_weights():
+ layers.append(l)
+ return layers
+
+ def run_graph(self, images, outputs, image_metas=None):
+ """Runs a sub-set of the computation graph that computes the given
+ outputs.
+
+ image_metas: If provided, the images are assumed to be already
+ molded (i.e. resized, padded, and normalized)
+
+ outputs: List of tuples (name, tensor) to compute. The tensors are
+ symbolic TensorFlow tensors and the names are for easy tracking.
+
+ Returns an ordered dict of results. Keys are the names received in the
+ input and values are Numpy arrays.
+ """
+ model = self.keras_model
+
+ # Organize desired outputs into an ordered dict
+ outputs = OrderedDict(outputs)
+ for o in outputs.values():
+ assert o is not None
+
+ # Build a Keras function to run parts of the computation graph
+ inputs = model.inputs
+ if model.uses_learning_phase and not isinstance(K.learning_phase(), int):
+ inputs += [K.learning_phase()]
+ kf = K.function(model.inputs, list(outputs.values()))
+
+ # Prepare inputs
+ if image_metas is None:
+ molded_images, image_metas, _ = self.mold_inputs(images)
+ else:
+ molded_images = images
+ image_shape = molded_images[0].shape
+ # Anchors
+ anchors = self.get_anchors(image_shape)
+ # Duplicate across the batch dimension because Keras requires it
+ # TODO: can this be optimized to avoid duplicating the anchors?
+ anchors = np.broadcast_to(anchors, (self.config.BATCH_SIZE,) + anchors.shape)
+ model_in = [molded_images, image_metas, anchors]
+
+ # Run inference
+ if model.uses_learning_phase and not isinstance(K.learning_phase(), int):
+ model_in.append(0.)
+ outputs_np = kf(model_in)
+
+ # Pack the generated Numpy arrays into a dict and log the results.
+ outputs_np = OrderedDict([(k, v)
+ for k, v in zip(outputs.keys(), outputs_np)])
+ for k, v in outputs_np.items():
+ log(k, v)
+ return outputs_np
+
+
+############################################################
+# Data Formatting
+############################################################
+
+def compose_image_meta(image_id, original_image_shape, image_shape,
+ window, scale, active_class_ids):
+ """Takes attributes of an image and puts them in one 1D array.
+
+ image_id: An int ID of the image. Useful for debugging.
+ original_image_shape: [H, W, C] before resizing or padding.
+ image_shape: [H, W, C] after resizing and padding
+ window: (y1, x1, y2, x2) in pixels. The area of the image where the real
+ image is (excluding the padding)
+ scale: The scaling factor applied to the original image (float32)
+ active_class_ids: List of class_ids available in the dataset from which
+ the image came. Useful if training on images from multiple datasets
+ where not all classes are present in all datasets.
+ """
+ meta = np.array(
+ [image_id] + # size=1
+ list(original_image_shape) + # size=3
+ list(image_shape) + # size=3
+ list(window) +                  # size=4 (y1, x1, y2, x2) in image coordinates
+ [scale] + # size=1
+ list(active_class_ids) # size=num_classes
+ )
+ return meta
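+
+# Note: the resulting meta vector has length
+# 1 + 3 + 3 + 4 + 1 + NUM_CLASSES = 12 + NUM_CLASSES, which is exactly what
+# parse_image_meta() / parse_image_meta_graph() below unpack.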
+
+
+def parse_image_meta(meta):
+ """Parses an array that contains image attributes to its components.
+ See compose_image_meta() for more details.
+
+ meta: [batch, meta length] where meta length depends on NUM_CLASSES
+
+ Returns a dict of the parsed values.
+ """
+ image_id = meta[:, 0]
+ original_image_shape = meta[:, 1:4]
+ image_shape = meta[:, 4:7]
+ window = meta[:, 7:11]  # (y1, x1, y2, x2) window of the image in pixels
+ scale = meta[:, 11]
+ active_class_ids = meta[:, 12:]
+ return {
+ "image_id": image_id.astype(np.int32),
+ "original_image_shape": original_image_shape.astype(np.int32),
+ "image_shape": image_shape.astype(np.int32),
+ "window": window.astype(np.int32),
+ "scale": scale.astype(np.float32),
+ "active_class_ids": active_class_ids.astype(np.int32),
+ }
+
+
+def parse_image_meta_graph(meta):
+ """Parses a tensor that contains image attributes to its components.
+ See compose_image_meta() for more details.
+
+ meta: [batch, meta length] where meta length depends on NUM_CLASSES
+
+ Returns a dict of the parsed tensors.
+ """
+ image_id = meta[:, 0]
+ original_image_shape = meta[:, 1:4]
+ image_shape = meta[:, 4:7]
+ window = meta[:, 7:11]  # (y1, x1, y2, x2) window of the image in pixels
+ scale = meta[:, 11]
+ active_class_ids = meta[:, 12:]
+ return {
+ "image_id": image_id,
+ "original_image_shape": original_image_shape,
+ "image_shape": image_shape,
+ "window": window,
+ "scale": scale,
+ "active_class_ids": active_class_ids,
+ }
+
+
+def mold_image(images, config):
+ """Expects an RGB image (or array of images) and subtracts
+ the mean pixel and converts it to float. Expects image
+ colors in RGB order.
+ """
+ return images.astype(np.float32) - config.MEAN_PIXEL
+
+
+def unmold_image(normalized_images, config):
+ """Takes a image normalized with mold() and returns the original."""
+ return (normalized_images + config.MEAN_PIXEL).astype(np.uint8)
+
+
+############################################################
+# Miscellaneous Graph Functions
+############################################################
+
+def trim_zeros_graph(boxes, name=None):
+ """Often boxes are represented with matrices of shape [N, 4] and
+ are padded with zeros. This removes zero boxes.
+
+ boxes: [N, 4] matrix of boxes.
+ non_zeros: [N] a 1D boolean mask identifying the rows to keep
+ """
+ non_zeros = tf.cast(tf.reduce_sum(tf.abs(boxes), axis=1), tf.bool)
+ boxes = tf.boolean_mask(boxes, non_zeros, name=name)
+ return boxes, non_zeros
+
+
+def batch_pack_graph(x, counts, num_rows):
+ """Picks different number of values from each row
+ in x depending on the values in counts.
+ """
+ outputs = []
+ for i in range(num_rows):
+ outputs.append(x[i, :counts[i]])
+ return tf.concat(outputs, axis=0)
+
+
+def norm_boxes_graph(boxes, shape):
+ """Converts boxes from pixel coordinates to normalized coordinates.
+ boxes: [..., (y1, x1, y2, x2)] in pixel coordinates
+ shape: [..., (height, width)] in pixels
+
+ Note: In pixel coordinates (y2, x2) is outside the box. But in normalized
+ coordinates it's inside the box.
+
+ Returns:
+ [..., (y1, x1, y2, x2)] in normalized coordinates
+ """
+ h, w = tf.split(tf.cast(shape, tf.float32), 2)
+ scale = tf.concat([h, w, h, w], axis=-1) - tf.constant(1.0)
+ shift = tf.constant([0., 0., 1., 1.])
+ return tf.divide(boxes - shift, scale)
+
+
+def denorm_boxes_graph(boxes, shape):
+ """Converts boxes from normalized coordinates to pixel coordinates.
+ boxes: [..., (y1, x1, y2, x2)] in normalized coordinates
+ shape: [..., (height, width)] in pixels
+
+ Note: In pixel coordinates (y2, x2) is outside the box. But in normalized
+ coordinates it's inside the box.
+
+ Returns:
+ [..., (y1, x1, y2, x2)] in pixel coordinates
+ """
+ h, w = tf.split(tf.cast(shape, tf.float32), 2)
+ scale = tf.concat([h, w, h, w], axis=-1) - tf.constant(1.0)
+ shift = tf.constant([0., 0., 1., 1.])
+ return tf.cast(tf.round(tf.multiply(boxes, scale) + shift), tf.int32)
diff --git a/mask_rcnn/tf_servable/user_config.py b/mask_rcnn/tf_servable/user_config.py
new file mode 100644
index 00000000..ff4b22a6
--- /dev/null
+++ b/mask_rcnn/tf_servable/user_config.py
@@ -0,0 +1,24 @@
+import os
+# User-defined parameters
+
+# Set to True to use the provided COCO weights
+is_coco = False
+
+# Path to the trained Keras model weights (.h5)
+H5_WEIGHT_PATH = '../models/mask_rcnn_final.h5'
+MODEL_DIR = os.path.dirname(H5_WEIGHT_PATH)
+
+# Path where the frozen PB will be saved
+PATH_TO_SAVE_FROZEN_PB = 'frozen_model/'
+
+# File name of the frozen PB
+FROZEN_NAME = 'mask_frozen_graph.pb'
+
+# Path where the TensorFlow Serving model will be saved
+PATH_TO_SAVE_TENSORFLOW_SERVING_MODEL = '../models/serving_model/'
+
+# Version of the serving model
+VERSION_NUMBER = 1
+
+# Number of classes the model was trained on
+NUMBER_OF_CLASSES = 6
diff --git a/mask_rcnn/tf_servable/utils.py b/mask_rcnn/tf_servable/utils.py
new file mode 100644
index 00000000..026edf70
--- /dev/null
+++ b/mask_rcnn/tf_servable/utils.py
@@ -0,0 +1,884 @@
+import sys
+import os
+import math
+import random
+import cv2
+import numpy as np
+import tensorflow as tf
+import scipy.ndimage
+import skimage.color
+# import skimage.io
+import skimage.transform
+import urllib.request
+import shutil
+import warnings
+
+# URL from which to download the latest COCO trained weights
+COCO_MODEL_URL = "https://github.com/matterport/Mask_RCNN/releases/download/v2.0/mask_rcnn_coco.h5"
+
+
+############################################################
+# Bounding Boxes
+############################################################
+
+def extract_bboxes(mask):
+ """Compute bounding boxes from masks.
+ mask: [height, width, num_instances]. Mask pixels are either 1 or 0.
+
+ Returns: bbox array [num_instances, (y1, x1, y2, x2)].
+ """
+ boxes = np.zeros([mask.shape[-1], 4], dtype=np.int32)
+ for i in range(mask.shape[-1]):
+ m = mask[:, :, i]
+ # Bounding box.
+ horizontal_indicies = np.where(np.any(m, axis=0))[0]
+ vertical_indicies = np.where(np.any(m, axis=1))[0]
+ if horizontal_indicies.shape[0]:
+ x1, x2 = horizontal_indicies[[0, -1]]
+ y1, y2 = vertical_indicies[[0, -1]]
+ # x2 and y2 should not be part of the box. Increment by 1.
+ x2 += 1
+ y2 += 1
+ else:
+ # No mask for this instance. Might happen due to
+ # resizing or cropping. Set bbox to zeros
+ x1, x2, y1, y2 = 0, 0, 0, 0
+ boxes[i] = np.array([y1, x1, y2, x2])
+ return boxes.astype(np.int32)
+
+
+def compute_iou(box, boxes, box_area, boxes_area):
+ """Calculates IoU of the given box with the array of the given boxes.
+ box: 1D vector [y1, x1, y2, x2]
+ boxes: [boxes_count, (y1, x1, y2, x2)]
+ box_area: float. the area of 'box'
+ boxes_area: array of length boxes_count.
+
+ Note: the areas are passed in rather than calculated here for
+ efficiency. Calculate once in the caller to avoid duplicate work.
+ """
+ # Calculate intersection areas
+ y1 = np.maximum(box[0], boxes[:, 0])
+ y2 = np.minimum(box[2], boxes[:, 2])
+ x1 = np.maximum(box[1], boxes[:, 1])
+ x2 = np.minimum(box[3], boxes[:, 3])
+ intersection = np.maximum(x2 - x1, 0) * np.maximum(y2 - y1, 0)
+ union = box_area + boxes_area[:] - intersection[:]
+ iou = intersection / union
+ return iou
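+
+# Worked example (sketch): comparing a box against itself and against a
+# half-overlapping box of the same size:
+#   box = np.array([0, 0, 10, 10])
+#   boxes = np.array([[0, 0, 10, 10], [5, 5, 15, 15]])
+#   compute_iou(box, boxes, 100, np.array([100, 100]))
+#   -> array([1.0, 0.142857...])   # 25 / (100 + 100 - 25)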
+
+
+def compute_overlaps(boxes1, boxes2):
+ """Computes IoU overlaps between two sets of boxes.
+ boxes1, boxes2: [N, (y1, x1, y2, x2)].
+
+ For better performance, pass the largest set first and the smaller second.
+ """
+ # Areas of anchors and GT boxes
+ area1 = (boxes1[:, 2] - boxes1[:, 0]) * (boxes1[:, 3] - boxes1[:, 1])
+ area2 = (boxes2[:, 2] - boxes2[:, 0]) * (boxes2[:, 3] - boxes2[:, 1])
+
+ # Compute overlaps to generate matrix [boxes1 count, boxes2 count]
+ # Each cell contains the IoU value.
+ overlaps = np.zeros((boxes1.shape[0], boxes2.shape[0]))
+ for i in range(overlaps.shape[1]):
+ box2 = boxes2[i]
+ overlaps[:, i] = compute_iou(box2, boxes1, area2[i], area1)
+ return overlaps
+
+
+def compute_overlaps_masks(masks1, masks2):
+ """Computes IoU overlaps between two sets of masks.
+ masks1, masks2: [Height, Width, instances]
+ """
+
+ # If either set of masks is empty return an empty result
+ if masks1.shape[-1] == 0 or masks2.shape[-1] == 0:
+ return np.zeros((masks1.shape[-1], masks2.shape[-1]))
+ # flatten masks and compute their areas
+ masks1 = np.reshape(masks1 > .5, (-1, masks1.shape[-1])).astype(np.float32)
+ masks2 = np.reshape(masks2 > .5, (-1, masks2.shape[-1])).astype(np.float32)
+ area1 = np.sum(masks1, axis=0)
+ area2 = np.sum(masks2, axis=0)
+
+ # intersections and union
+ intersections = np.dot(masks1.T, masks2)
+ union = area1[:, None] + area2[None, :] - intersections
+ overlaps = intersections / union
+
+ return overlaps
+
+
+def non_max_suppression(boxes, scores, threshold):
+ """Performs non-maximum suppression and returns indices of kept boxes.
+ boxes: [N, (y1, x1, y2, x2)]. Notice that (y2, x2) lays outside the box.
+ scores: 1-D array of box scores.
+ threshold: Float. IoU threshold to use for filtering.
+ """
+ assert boxes.shape[0] > 0
+ if boxes.dtype.kind != "f":
+ boxes = boxes.astype(np.float32)
+
+ # Compute box areas
+ y1 = boxes[:, 0]
+ x1 = boxes[:, 1]
+ y2 = boxes[:, 2]
+ x2 = boxes[:, 3]
+ area = (y2 - y1) * (x2 - x1)
+
+ # Get indices of boxes sorted by scores (highest first)
+ ixs = scores.argsort()[::-1]
+
+ pick = []
+ while len(ixs) > 0:
+ # Pick top box and add its index to the list
+ i = ixs[0]
+ pick.append(i)
+ # Compute IoU of the picked box with the rest
+ iou = compute_iou(boxes[i], boxes[ixs[1:]], area[i], area[ixs[1:]])
+ # Identify boxes with IoU over the threshold. This
+ # returns indices into ixs[1:], so add 1 to get
+ # indices into ixs.
+ remove_ixs = np.where(iou > threshold)[0] + 1
+ # Remove indices of the picked and overlapped boxes.
+ ixs = np.delete(ixs, remove_ixs)
+ ixs = np.delete(ixs, 0)
+ return np.array(pick, dtype=np.int32)
+
+
+def apply_box_deltas(boxes, deltas):
+ """Applies the given deltas to the given boxes.
+ boxes: [N, (y1, x1, y2, x2)]. Note that (y2, x2) is outside the box.
+ deltas: [N, (dy, dx, log(dh), log(dw))]
+ """
+ boxes = boxes.astype(np.float32)
+ # Convert to y, x, h, w
+ height = boxes[:, 2] - boxes[:, 0]
+ width = boxes[:, 3] - boxes[:, 1]
+ center_y = boxes[:, 0] + 0.5 * height
+ center_x = boxes[:, 1] + 0.5 * width
+ # Apply deltas
+ center_y += deltas[:, 0] * height
+ center_x += deltas[:, 1] * width
+ height *= np.exp(deltas[:, 2])
+ width *= np.exp(deltas[:, 3])
+ # Convert back to y1, x1, y2, x2
+ y1 = center_y - 0.5 * height
+ x1 = center_x - 0.5 * width
+ y2 = y1 + height
+ x2 = x1 + width
+ return np.stack([y1, x1, y2, x2], axis=1)
+
+
+def box_refinement_graph(box, gt_box):
+ """Compute refinement needed to transform box to gt_box.
+ box and gt_box are [N, (y1, x1, y2, x2)]
+ """
+ box = tf.cast(box, tf.float32)
+ gt_box = tf.cast(gt_box, tf.float32)
+
+ height = box[:, 2] - box[:, 0]
+ width = box[:, 3] - box[:, 1]
+ center_y = box[:, 0] + 0.5 * height
+ center_x = box[:, 1] + 0.5 * width
+
+ gt_height = gt_box[:, 2] - gt_box[:, 0]
+ gt_width = gt_box[:, 3] - gt_box[:, 1]
+ gt_center_y = gt_box[:, 0] + 0.5 * gt_height
+ gt_center_x = gt_box[:, 1] + 0.5 * gt_width
+
+ dy = (gt_center_y - center_y) / height
+ dx = (gt_center_x - center_x) / width
+ dh = tf.log(gt_height / height)
+ dw = tf.log(gt_width / width)
+
+ result = tf.stack([dy, dx, dh, dw], axis=1)
+ return result
+
+
+def box_refinement(box, gt_box):
+ """Compute refinement needed to transform box to gt_box.
+ box and gt_box are [N, (y1, x1, y2, x2)]. (y2, x2) is
+ assumed to be outside the box.
+ """
+ box = box.astype(np.float32)
+ gt_box = gt_box.astype(np.float32)
+
+ height = box[:, 2] - box[:, 0]
+ width = box[:, 3] - box[:, 1]
+ center_y = box[:, 0] + 0.5 * height
+ center_x = box[:, 1] + 0.5 * width
+
+ gt_height = gt_box[:, 2] - gt_box[:, 0]
+ gt_width = gt_box[:, 3] - gt_box[:, 1]
+ gt_center_y = gt_box[:, 0] + 0.5 * gt_height
+ gt_center_x = gt_box[:, 1] + 0.5 * gt_width
+
+ dy = (gt_center_y - center_y) / height
+ dx = (gt_center_x - center_x) / width
+ dh = np.log(gt_height / height)
+ dw = np.log(gt_width / width)
+
+ return np.stack([dy, dx, dh, dw], axis=1)
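+
+# Worked example (sketch): identical boxes need no refinement:
+#   box_refinement(np.array([[0, 0, 10, 10]]), np.array([[0, 0, 10, 10]]))
+#   -> array([[0., 0., 0., 0.]], dtype=float32)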
+
+
+############################################################
+# Dataset
+############################################################
+
+class Dataset(object):
+ """The base class for dataset classes.
+ To use it, create a new class that adds functions specific to the dataset
+ you want to use. For example:
+
+ class CatsAndDogsDataset(Dataset):
+ def load_cats_and_dogs(self):
+ ...
+ def load_mask(self, image_id):
+ ...
+ def image_reference(self, image_id):
+ ...
+
+ See COCODataset and ShapesDataset as examples.
+ """
+
+ def __init__(self, class_map=None):
+ self._image_ids = []
+ self.image_info = []
+ # Background is always the first class
+ self.class_info = [{"source": "", "id": 0, "name": "BG"}]
+ self.source_class_ids = {}
+
+ def add_class(self, source, class_id, class_name):
+ assert "." not in source, "Source name cannot contain a dot"
+ # Does the class exist already?
+ for info in self.class_info:
+ if info['source'] == source and info["id"] == class_id:
+ # source.class_id combination already available, skip
+ return
+ # Add the class
+ self.class_info.append({
+ "source": source,
+ "id": class_id,
+ "name": class_name,
+ })
+
+ def add_image(self, source, image_id, path, **kwargs):
+ image_info = {
+ "id": image_id,
+ "source": source,
+ "path": path,
+ }
+ image_info.update(kwargs)
+ self.image_info.append(image_info)
+
+ def image_reference(self, image_id):
+ """Return a link to the image in its source Website or details about
+ the image that help looking it up or debugging it.
+
+ Override for your dataset, but pass to this function
+ if you encounter images not in your dataset.
+ """
+ return ""
+
+ def prepare(self, class_map=None):
+ """Prepares the Dataset class for use.
+
+ TODO: class map is not supported yet. When done, it should handle mapping
+ classes from different datasets to the same class ID.
+ """
+
+ def clean_name(name):
+ """Returns a shorter version of object names for cleaner display."""
+ return ",".join(name.split(",")[:1])
+
+ # Build (or rebuild) everything else from the info dicts.
+ self.num_classes = len(self.class_info)
+ self.class_ids = np.arange(self.num_classes)
+ self.class_names = [clean_name(c["name"]) for c in self.class_info]
+ self.num_images = len(self.image_info)
+ self._image_ids = np.arange(self.num_images)
+
+ # Mapping from source class and image IDs to internal IDs
+ self.class_from_source_map = {"{}.{}".format(info['source'], info['id']): id
+ for info, id in zip(self.class_info, self.class_ids)}
+ self.image_from_source_map = {"{}.{}".format(info['source'], info['id']): id
+ for info, id in zip(self.image_info, self.image_ids)}
+
+ # Map sources to class_ids they support
+ self.sources = list(set([i['source'] for i in self.class_info]))
+ self.source_class_ids = {}
+ # Loop over datasets
+ for source in self.sources:
+ self.source_class_ids[source] = []
+ # Find classes that belong to this dataset
+ for i, info in enumerate(self.class_info):
+ # Include BG class in all datasets
+ if i == 0 or source == info['source']:
+ self.source_class_ids[source].append(i)
+
+ def map_source_class_id(self, source_class_id):
+ """Takes a source class ID and returns the int class ID assigned to it.
+
+ For example:
+ dataset.map_source_class_id("coco.12") -> 23
+ """
+ return self.class_from_source_map[source_class_id]
+
+ def get_source_class_id(self, class_id, source):
+ """Map an internal class ID to the corresponding class ID in the source dataset."""
+ info = self.class_info[class_id]
+ assert info['source'] == source
+ return info['id']
+
+ def append_data(self, class_info, image_info):
+ self.external_to_class_id = {}
+ for i, c in enumerate(self.class_info):
+ for ds, id in c["map"]:
+ self.external_to_class_id[ds + str(id)] = i
+
+ # Map external image IDs to internal ones.
+ self.external_to_image_id = {}
+ for i, info in enumerate(self.image_info):
+ self.external_to_image_id[info["ds"] + str(info["id"])] = i
+
+ @property
+ def image_ids(self):
+ return self._image_ids
+
+ def source_image_link(self, image_id):
+ """Returns the path or URL to the image.
+ Override this to return a URL to the image if it's available online for easy
+ debugging.
+ """
+ return self.image_info[image_id]["path"]
+
+ def load_image(self, image_id):
+ """Load the specified image and return a [H,W,3] Numpy array.
+ """
+ # Load image
+ image = cv2.imread(self.image_info[image_id]['path'])
+ # image = skimage.io.imread(self.image_info[image_id]['path'])
+ # If grayscale. Convert to RGB for consistency.
+ if image.ndim != 3:
+ image = skimage.color.gray2rgb(image)
+ # If has an alpha channel, remove it for consistency
+ if image.shape[-1] == 4:
+ image = image[..., :3]
+ return image
+
+ def load_mask(self, image_id):
+ """Load instance masks for the given image.
+
+ Different datasets use different ways to store masks. Override this
+ method to load instance masks and return them in the form of an
+ array of binary masks of shape [height, width, instances].
+
+ Returns:
+ masks: A bool array of shape [height, width, instance count] with
+ a binary mask per instance.
+ class_ids: a 1D array of class IDs of the instance masks.
+ """
+ # Override this function to load a mask from your dataset.
+ # Otherwise, it returns an empty mask.
+ mask = np.empty([0, 0, 0])
+ class_ids = np.empty([0], np.int32)
+ return mask, class_ids
+
+
+def resize_image(image, min_dim=None, max_dim=None, min_scale=None, mode="square"):
+ """Resizes an image keeping the aspect ratio unchanged.
+
+ min_dim: if provided, resizes the image such that it's smaller
+ dimension == min_dim
+ max_dim: if provided, ensures that the image longest side doesn't
+ exceed this value.
+ min_scale: if provided, ensure that the image is scaled up by at least
+ this percent even if min_dim doesn't require it.
+ mode: Resizing mode.
+ none: No resizing. Return the image unchanged.
+ square: Resize and pad with zeros to get a square image
+ of size [max_dim, max_dim].
+ pad64: Pads width and height with zeros to make them multiples of 64.
+ If min_dim or min_scale are provided, it scales the image up
+ before padding. max_dim is ignored in this mode.
+ The multiple of 64 is needed to ensure smooth scaling of feature
+ maps up and down the 6 levels of the FPN pyramid (2**6=64).
+ crop: Picks random crops from the image. First, scales the image based
+ on min_dim and min_scale, then picks a random crop of
+ size min_dim x min_dim. Can be used in training only.
+ max_dim is not used in this mode.
+
+ Returns:
+ image: the resized image
+ window: (y1, x1, y2, x2). If max_dim is provided, padding might
+ be inserted in the returned image. If so, this window is the
+ coordinates of the image part of the full image (excluding
+ the padding). The x2, y2 pixels are not included.
+ scale: The scale factor used to resize the image
+ padding: Padding added to the image [(top, bottom), (left, right), (0, 0)]
+ """
+ # Keep track of image dtype and return results in the same dtype
+ image_dtype = image.dtype
+ # Default window (y1, x1, y2, x2) and default scale == 1.
+ h, w = image.shape[:2]
+ window = (0, 0, h, w)
+ scale = 1
+ padding = [(0, 0), (0, 0), (0, 0)]
+ crop = None
+
+ if mode == "none":
+ return image, window, scale, padding, crop
+
+ # Scale?
+ if min_dim:
+ # Scale up but not down
+ scale = max(1, min_dim / min(h, w))
+ if min_scale and scale < min_scale:
+ scale = min_scale
+
+ # Does it exceed max dim?
+ if max_dim and mode == "square":
+ image_max = max(h, w)
+ if round(image_max * scale) > max_dim:
+ scale = max_dim / image_max
+
+ # Resize image using bilinear interpolation
+ if scale != 1:
+ image = skimage.transform.resize(
+ image, (round(h * scale), round(w * scale)),
+ order=1, mode="constant", preserve_range=True)
+
+ # Need padding or cropping?
+ if mode == "square":
+ # Get new height and width
+ h, w = image.shape[:2]
+ top_pad = (max_dim - h) // 2
+ bottom_pad = max_dim - h - top_pad
+ left_pad = (max_dim - w) // 2
+ right_pad = max_dim - w - left_pad
+ padding = [(top_pad, bottom_pad), (left_pad, right_pad), (0, 0)]
+ image = np.pad(image, padding, mode='constant', constant_values=0)
+ window = (top_pad, left_pad, h + top_pad, w + left_pad)
+ elif mode == "pad64":
+ h, w = image.shape[:2]
+ # Both sides must be divisible by 64
+ assert min_dim % 64 == 0, "Minimum dimension must be a multiple of 64"
+ # Height
+ if h % 64 > 0:
+ max_h = h - (h % 64) + 64
+ top_pad = (max_h - h) // 2
+ bottom_pad = max_h - h - top_pad
+ else:
+ top_pad = bottom_pad = 0
+ # Width
+ if w % 64 > 0:
+ max_w = w - (w % 64) + 64
+ left_pad = (max_w - w) // 2
+ right_pad = max_w - w - left_pad
+ else:
+ left_pad = right_pad = 0
+ padding = [(top_pad, bottom_pad), (left_pad, right_pad), (0, 0)]
+ image = np.pad(image, padding, mode='constant', constant_values=0)
+ window = (top_pad, left_pad, h + top_pad, w + left_pad)
+ elif mode == "crop":
+ # Pick a random crop
+ h, w = image.shape[:2]
+ y = random.randint(0, (h - min_dim))
+ x = random.randint(0, (w - min_dim))
+ crop = (y, x, min_dim, min_dim)
+ image = image[y:y + min_dim, x:x + min_dim]
+ window = (0, 0, min_dim, min_dim)
+ else:
+ raise Exception("Mode {} not supported".format(mode))
+ return image.astype(image_dtype), window, scale, padding, crop
+
+
+def resize_mask(mask, scale, padding, crop=None):
+ """Resizes a mask using the given scale and padding.
+ Typically, you get the scale and padding from resize_image() to
+ ensure both, the image and the mask, are resized consistently.
+
+ scale: mask scaling factor
+ padding: Padding to add to the mask in the form
+ [(top, bottom), (left, right), (0, 0)]
+ """
+ # Suppress warning from scipy 0.13.0, the output shape of zoom() is
+ # calculated with round() instead of int()
+ with warnings.catch_warnings():
+ warnings.simplefilter("ignore")
+ mask = scipy.ndimage.zoom(mask, zoom=[scale, scale, 1], order=0)
+ if crop is not None:
+ y, x, h, w = crop
+ mask = mask[y:y + h, x:x + w]
+ else:
+ mask = np.pad(mask, padding, mode='constant', constant_values=0)
+ return mask
+
+
+def minimize_mask(bbox, mask, mini_shape):
+ """Resize masks to a smaller version to reduce memory load.
+ Mini-masks can be resized back to image scale using expand_masks()
+
+ See inspect_data.ipynb notebook for more details.
+ """
+ mini_mask = np.zeros(mini_shape + (mask.shape[-1],), dtype=bool)
+ for i in range(mask.shape[-1]):
+ # Pick slice and cast to bool in case load_mask() returned wrong dtype
+ m = mask[:, :, i].astype(bool)
+ y1, x1, y2, x2 = bbox[i][:4]
+ m = m[y1:y2, x1:x2]
+ if m.size == 0:
+ raise Exception("Invalid bounding box with area of zero")
+ # Resize with bilinear interpolation
+ m = skimage.transform.resize(m, mini_shape, order=1, mode="constant")
+ mini_mask[:, :, i] = np.around(m).astype(np.bool)
+ return mini_mask
+
+
+def expand_mask(bbox, mini_mask, image_shape):
+ """Resizes mini masks back to image size. Reverses the change
+ of minimize_mask().
+
+ See inspect_data.ipynb notebook for more details.
+ """
+ mask = np.zeros(image_shape[:2] + (mini_mask.shape[-1],), dtype=bool)
+ for i in range(mask.shape[-1]):
+ m = mini_mask[:, :, i]
+ y1, x1, y2, x2 = bbox[i][:4]
+ h = y2 - y1
+ w = x2 - x1
+ # Resize with bilinear interpolation
+ m = skimage.transform.resize(m, (h, w), order=1, mode="constant")
+ mask[y1:y2, x1:x2, i] = np.around(m).astype(np.bool)
+ return mask
+
+
+# TODO: Build and use this function to reduce code duplication
+
+
+def unmold_mask(mask, bbox, image_shape):
+ """Converts a mask generated by the neural network to a format similar
+ to its original shape.
+ mask: [height, width] of type float. A small, typically 28x28 mask.
+ bbox: [y1, x1, y2, x2]. The box to fit the mask in.
+
+ Returns a binary mask with the same size as the original image.
+ """
+ threshold = 0.5
+ y1, x1, y2, x2 = bbox
+ mask = skimage.transform.resize(mask, (y2 - y1, x2 - x1), order=1, mode="constant")
+ mask = np.where(mask >= threshold, 1, 0).astype(np.bool)
+
+ # Put the mask in the right location.
+ full_mask = np.zeros(image_shape[:2], dtype=np.bool)
+ full_mask[y1:y2, x1:x2] = mask
+ return full_mask
+
+
+############################################################
+# Anchors
+############################################################
+
+def generate_anchors(scales, ratios, shape, feature_stride, anchor_stride):
+ """
+ scales: 1D array of anchor sizes in pixels. Example: [32, 64, 128]
+ ratios: 1D array of anchor ratios of width/height. Example: [0.5, 1, 2]
+ shape: [height, width] spatial shape of the feature map over which
+ to generate anchors.
+ feature_stride: Stride of the feature map relative to the image in pixels.
+ anchor_stride: Stride of anchors on the feature map. For example, if the
+ value is 2 then generate anchors for every other feature map pixel.
+ """
+ # Get all combinations of scales and ratios
+ scales, ratios = np.meshgrid(np.array(scales), np.array(ratios))
+ scales = scales.flatten()
+ ratios = ratios.flatten()
+
+ # Enumerate heights and widths from scales and ratios
+ heights = scales / np.sqrt(ratios)
+ widths = scales * np.sqrt(ratios)
+
+ # Enumerate shifts in feature space
+ shifts_y = np.arange(0, shape[0], anchor_stride) * feature_stride
+ shifts_x = np.arange(0, shape[1], anchor_stride) * feature_stride
+ shifts_x, shifts_y = np.meshgrid(shifts_x, shifts_y)
+
+ # Enumerate combinations of shifts, widths, and heights
+ box_widths, box_centers_x = np.meshgrid(widths, shifts_x)
+ box_heights, box_centers_y = np.meshgrid(heights, shifts_y)
+
+ # Reshape to get a list of (y, x) and a list of (h, w)
+ box_centers = np.stack(
+ [box_centers_y, box_centers_x], axis=2).reshape([-1, 2])
+ box_sizes = np.stack([box_heights, box_widths], axis=2).reshape([-1, 2])
+
+ # Convert to corner coordinates (y1, x1, y2, x2)
+ boxes = np.concatenate([box_centers - 0.5 * box_sizes,
+ box_centers + 0.5 * box_sizes], axis=1)
+ return boxes
+
+
+def generate_pyramid_anchors(scales, ratios, feature_shapes, feature_strides,
+ anchor_stride):
+ """Generate anchors at different levels of a feature pyramid. Each scale
+ is associated with a level of the pyramid, but each ratio is used in
+ all levels of the pyramid.
+
+ Returns:
+ anchors: [N, (y1, x1, y2, x2)]. All generated anchors in one array. Sorted
+ with the same order of the given scales. So, anchors of scale[0] come
+ first, then anchors of scale[1], and so on.
+ """
+ # Anchors
+ # [anchor_count, (y1, x1, y2, x2)]
+ anchors = []
+ for i in range(len(scales)):
+ anchors.append(generate_anchors(scales[i], ratios, feature_shapes[i],
+ feature_strides[i], anchor_stride))
+ return np.concatenate(anchors, axis=0)
+
+
+############################################################
+# Miscellaneous
+############################################################
+
+def trim_zeros(x):
+ """It's common to have tensors larger than the available data and
+ pad with zeros. This function removes rows that are all zeros.
+
+ x: [rows, columns].
+ """
+ assert len(x.shape) == 2
+ return x[~np.all(x == 0, axis=1)]
+
+
+def compute_matches(gt_boxes, gt_class_ids, gt_masks,
+ pred_boxes, pred_class_ids, pred_scores, pred_masks,
+ iou_threshold=0.5, score_threshold=0.0):
+ """Finds matches between prediction and ground truth instances.
+
+ Returns:
+ gt_match: 1-D array. For each GT box it has the index of the matched
+ predicted box.
+ pred_match: 1-D array. For each predicted box, it has the index of
+ the matched ground truth box.
+ overlaps: [pred_boxes, gt_boxes] IoU overlaps.
+ """
+ # Trim zero padding
+ # TODO: cleaner to do zero unpadding upstream
+ gt_boxes = trim_zeros(gt_boxes)
+ gt_masks = gt_masks[..., :gt_boxes.shape[0]]
+ pred_boxes = trim_zeros(pred_boxes)
+ pred_scores = pred_scores[:pred_boxes.shape[0]]
+ # Sort predictions by score from high to low
+ indices = np.argsort(pred_scores)[::-1]
+ pred_boxes = pred_boxes[indices]
+ pred_class_ids = pred_class_ids[indices]
+ pred_scores = pred_scores[indices]
+ pred_masks = pred_masks[..., indices]
+
+ # Compute IoU overlaps [pred_masks, gt_masks]
+ overlaps = compute_overlaps_masks(pred_masks, gt_masks)
+
+ # Loop through predictions and find matching ground truth boxes
+ match_count = 0
+ pred_match = -1 * np.ones([pred_boxes.shape[0]])
+ gt_match = -1 * np.ones([gt_boxes.shape[0]])
+ for i in range(len(pred_boxes)):
+ # Find best matching ground truth box
+ # 1. Sort matches by score
+ sorted_ixs = np.argsort(overlaps[i])[::-1]
+ # 2. Remove low scores
+ low_score_idx = np.where(overlaps[i, sorted_ixs] < score_threshold)[0]
+ if low_score_idx.size > 0:
+ sorted_ixs = sorted_ixs[:low_score_idx[0]]
+ # 3. Find the match
+ for j in sorted_ixs:
+ # If ground truth box is already matched, go to next one
+ if gt_match[j] > -1:
+ continue
+ # If we reach IoU smaller than the threshold, end the loop
+ iou = overlaps[i, j]
+ if iou < iou_threshold:
+ break
+ # Do we have a match?
+ if pred_class_ids[i] == gt_class_ids[j]:
+ match_count += 1
+ gt_match[j] = i
+ pred_match[i] = j
+ break
+
+ return gt_match, pred_match, overlaps
+
+
+def compute_ap(gt_boxes, gt_class_ids, gt_masks,
+ pred_boxes, pred_class_ids, pred_scores, pred_masks,
+ iou_threshold=0.5):
+ """Compute Average Precision at a set IoU threshold (default 0.5).
+
+ Returns:
+ mAP: Mean Average Precision
+ precisions: List of precisions at different class score thresholds.
+ recalls: List of recall values at different class score thresholds.
+ overlaps: [pred_boxes, gt_boxes] IoU overlaps.
+ """
+ # Get matches and overlaps
+ gt_match, pred_match, overlaps = compute_matches(
+ gt_boxes, gt_class_ids, gt_masks,
+ pred_boxes, pred_class_ids, pred_scores, pred_masks,
+ iou_threshold)
+
+ # Compute precision and recall at each prediction box step
+ precisions = np.cumsum(pred_match > -1) / (np.arange(len(pred_match)) + 1)
+ recalls = np.cumsum(pred_match > -1).astype(np.float32) / len(gt_match)
+
+ # Pad with start and end values to simplify the math
+ precisions = np.concatenate([[0], precisions, [0]])
+ recalls = np.concatenate([[0], recalls, [1]])
+
+ # Ensure precision values decrease but don't increase. This way, the
+ # precision value at each recall threshold is the maximum it can be
+ # for all following recall thresholds, as specified by the VOC paper.
+ for i in range(len(precisions) - 2, -1, -1):
+ precisions[i] = np.maximum(precisions[i], precisions[i + 1])
+
+ # Compute mean AP over recall range
+ indices = np.where(recalls[:-1] != recalls[1:])[0] + 1
+ mAP = np.sum((recalls[indices] - recalls[indices - 1]) *
+ precisions[indices])
+
+ return mAP, precisions, recalls, overlaps
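+
+# Illustrative per-image evaluation (a sketch; `r` is the dict returned by
+# MaskRCNN.detect() and the gt_* arrays come from the validation annotations):
+#   AP, precisions, recalls, overlaps = compute_ap(
+#       gt_bbox, gt_class_id, gt_mask,
+#       r["rois"], r["class_ids"], r["scores"], r["masks"])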
+
+
+def compute_ap_range(gt_box, gt_class_id, gt_mask,
+ pred_box, pred_class_id, pred_score, pred_mask,
+ iou_thresholds=None, verbose=1):
+ """Compute AP over a range or IoU thresholds. Default range is 0.5-0.95."""
+ # Default is 0.5 to 0.95 with increments of 0.05
+ iou_thresholds = iou_thresholds or np.arange(0.5, 1.0, 0.05)
+
+ # Compute AP over range of IoU thresholds
+ AP = []
+ for iou_threshold in iou_thresholds:
+ ap, precisions, recalls, overlaps = \
+ compute_ap(gt_box, gt_class_id, gt_mask,
+ pred_box, pred_class_id, pred_score, pred_mask,
+ iou_threshold=iou_threshold)
+ if verbose:
+ print("AP @{:.2f}:\t {:.3f}".format(iou_threshold, ap))
+ AP.append(ap)
+ AP = np.array(AP).mean()
+ if verbose:
+ print("AP @{:.2f}-{:.2f}:\t {:.3f}".format(
+ iou_thresholds[0], iou_thresholds[-1], AP))
+ return AP
+
+
+def compute_recall(pred_boxes, gt_boxes, iou):
+ """Compute the recall at the given IoU threshold. It's an indication
+ of how many GT boxes were found by the given prediction boxes.
+
+ pred_boxes: [N, (y1, x1, y2, x2)] in image coordinates
+ gt_boxes: [N, (y1, x1, y2, x2)] in image coordinates
+ """
+ # Measure overlaps
+ overlaps = compute_overlaps(pred_boxes, gt_boxes)
+ iou_max = np.max(overlaps, axis=1)
+ iou_argmax = np.argmax(overlaps, axis=1)
+ positive_ids = np.where(iou_max >= iou)[0]
+ matched_gt_boxes = iou_argmax[positive_ids]
+
+ recall = len(set(matched_gt_boxes)) / gt_boxes.shape[0]
+ return recall, positive_ids
+
+
+# ## Batch Slicing
+# Some custom layers support a batch size of 1 only, and require a lot of work
+# to support batches greater than 1. This function slices an input tensor
+# across the batch dimension and feeds batches of size 1. Effectively,
+# an easy way to support batches > 1 quickly with little code modification.
+# In the long run, it's more efficient to modify the code to support large
+# batches and get rid of this function. Consider this a temporary solution.
+def batch_slice(inputs, graph_fn, batch_size, names=None):
+ """Splits inputs into slices and feeds each slice to a copy of the given
+ computation graph and then combines the results. It allows you to run a
+ graph on a batch of inputs even if the graph is written to support one
+ instance only.
+
+ inputs: list of tensors. All must have the same first dimension length
+ graph_fn: A function that returns a TF tensor that's part of a graph.
+ batch_size: number of slices to divide the data into.
+ names: If provided, assigns names to the resulting tensors.
+ """
+ if not isinstance(inputs, list):
+ inputs = [inputs]
+
+ outputs = []
+ for i in range(batch_size):
+ inputs_slice = [x[i] for x in inputs]
+ output_slice = graph_fn(*inputs_slice)
+ if not isinstance(output_slice, (tuple, list)):
+ output_slice = [output_slice]
+ outputs.append(output_slice)
+ # Change outputs from a list of slices where each is
+ # a list of outputs to a list of outputs and each has
+ # a list of slices
+ outputs = list(zip(*outputs))
+
+ if names is None:
+ names = [None] * len(outputs)
+
+ result = [tf.stack(o, axis=0, name=n)
+ for o, n in zip(outputs, names)]
+ if len(result) == 1:
+ result = result[0]
+
+ return result
+
+
+def download_trained_weights(coco_model_path, verbose=1):
+ """Download COCO trained weights from Releases.
+
+ coco_model_path: local path of COCO trained weights
+ """
+ if verbose > 0:
+ print("Downloading pretrained model to " + coco_model_path + " ...")
+ with urllib.request.urlopen(COCO_MODEL_URL) as resp, open(coco_model_path, 'wb') as out:
+ shutil.copyfileobj(resp, out)
+ if verbose > 0:
+ print("... done downloading pretrained model!")
+
+
+def norm_boxes(boxes, shape):
+ """Converts boxes from pixel coordinates to normalized coordinates.
+ boxes: [N, (y1, x1, y2, x2)] in pixel coordinates
+ shape: [..., (height, width)] in pixels
+
+ Note: In pixel coordinates (y2, x2) is outside the box. But in normalized
+ coordinates it's inside the box.
+
+ Returns:
+ [N, (y1, x1, y2, x2)] in normalized coordinates
+ """
+ h, w = shape
+ scale = np.array([h - 1, w - 1, h - 1, w - 1])
+ shift = np.array([0, 0, 1, 1])
+ return np.divide((boxes - shift), scale).astype(np.float32)
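+
+# Worked example (sketch): for shape (1024, 1024), the full-image pixel box
+# maps onto the unit square:
+#   norm_boxes(np.array([[0, 0, 1024, 1024]]), (1024, 1024))
+#   -> array([[0., 0., 1., 1.]], dtype=float32)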
+
+
+def denorm_boxes(boxes, shape):
+ """Converts boxes from normalized coordinates to pixel coordinates.
+ boxes: [N, (y1, x1, y2, x2)] in normalized coordinates
+ shape: [..., (height, width)] in pixels
+
+ Note: In pixel coordinates (y2, x2) is outside the box. But in normalized
+ coordinates it's inside the box.
+
+ Returns:
+ [N, (y1, x1, y2, x2)] in pixel coordinates
+ """
+ h, w = shape
+ scale = np.array([h - 1, w - 1, h - 1, w - 1])
+ shift = np.array([0, 0, 1, 1])
+ return np.around(np.multiply(boxes, scale) + shift).astype(np.int32)
diff --git a/mask_rcnn/trainer.py b/mask_rcnn/trainer.py
new file mode 100644
index 00000000..ea63806a
--- /dev/null
+++ b/mask_rcnn/trainer.py
@@ -0,0 +1,239 @@
+"""
+Mask R-CNN
+Trainer for the pointless packaging dataset (adapted from the Matterport balloon sample).
+
+Copyright (c) 2018 Matterport, Inc.
+Licensed under the MIT License (see LICENSE for details)
+Written by Waleed Abdulla
+
+------------------------------------------------------------
+
+Usage: place the training/validation images and their VIA annotations
+ (via_region_data.json) under dataset/train and dataset/val, then run:
+
+ python3 trainer.py
+
+The script trains all layers for 5 epochs and saves the resulting weights
+to models/mask_rcnn_final.h5.
+"""
+
+from mrcnn import model as modellib, utils
+from mrcnn.config import Config
+import os
+import sys
+import json
+import datetime
+import numpy as np
+import skimage.draw
+import skimage.io
+
+# Root directory of the project
+ROOT_DIR = os.path.abspath("../../")
+
+# Import Mask RCNN
+sys.path.append(ROOT_DIR) # To find local version of the library
+
+# Path to trained weights file
+COCO_WEIGHTS_PATH = os.path.join(ROOT_DIR, "mask_rcnn_coco.h5")
+
+# Directory to save logs and model checkpoints, if not provided
+# through the command line argument --logs
+DEFAULT_LOGS_DIR = os.path.join(ROOT_DIR, "logs")
+
+############################################################
+# Configurations
+############################################################
+
+
+class PPConfig(Config):
+ """Configuration for training on the toy dataset.
+ Derives from the base Config class and overrides some values.
+ """
+ # Give the configuration a recognizable name
+ NAME = "pointless_package"
+
+ # A 12GB GPU can fit two 1024x1024 images, but we train with one
+ # image per GPU here. Adjust to your GPU memory.
+ IMAGES_PER_GPU = 1
+
+ # Number of classes (including background)
+ NUM_CLASSES = 1 + 6 # Background + outerbox + innerbox + item_sq + item_rect + item_rect_slim + item_circ
+
+ # Number of training steps per epoch
+ STEPS_PER_EPOCH = 100
+
+ # Skip detections with < 90% confidence
+ DETECTION_MIN_CONFIDENCE = 0.9
+
+
+MY_ABS_PATH = "./"
+config = PPConfig()
+config.display()
+
+print("Loading Mask R-CNN model...")
+my_model_dir = MY_ABS_PATH + 'models/'
+model = modellib.MaskRCNN(
+ mode="training", config=config, model_dir=my_model_dir)
+
+# Optionally load the COCO weights (currently disabled):
+# model.load_weights('./models/mask_rcnn_coco.h5',
+# by_name=True,
+# exclude=["mrcnn_class_logits", "mrcnn_bbox_fc", "mrcnn_bbox", "mrcnn_mask"])
+
+# model.keras_model.summary()
+
+############################################################
+# Dataset
+############################################################
+
+class PPDataset(utils.Dataset):
+
+ def load_dataset(self, dataset_dir, subset):
+ """Load a subset of the Balloon dataset.
+ dataset_dir: Root directory of the dataset.
+ subset: Subset to load: train or val
+ """
+ # Add classes. We have six classes to add.
+ self.add_class("pointless_package", 1, "outerbox")
+ self.add_class("pointless_package", 2, "innerbox")
+ self.add_class("pointless_package", 3, "item_sq")
+ self.add_class("pointless_package", 4, "item_rect")
+ self.add_class("pointless_package", 5, "item_rect_slim")
+ self.add_class("pointless_package", 6, "item_circ")
+
+ # Train or validation dataset?
+ assert subset in ["train", "val"]
+ dataset_dir = os.path.join(dataset_dir, subset)
+
+ # Load annotations
+ # VGG Image Annotator (up to version 1.6) saves each image in the form:
+ # { 'filename': '28503151_5b5b7ec140_b.jpg',
+ # 'regions': {
+ # '0': {
+ # 'region_attributes': {},
+ # 'shape_attributes': {
+ # 'all_points_x': [...],
+ # 'all_points_y': [...],
+ # 'name': 'polygon'}},
+ # ... more regions ...
+ # },
+ # 'size': 100202
+ # }
+ # We mostly care about the x and y coordinates of each region
+ # Note: In VIA 2.0, regions was changed from a dict to a list.
+ annotations = json.load(
+ open(os.path.join(dataset_dir, "via_region_data.json")))
+ annotations = list(annotations.values()) # don't need the dict keys
+
+ # The VIA tool saves images in the JSON even if they don't have any
+ # annotations. Skip unannotated images.
+ annotations = [a for a in annotations if a['regions']]
+
+ # Add images
+ for a in annotations:
+ # Get the x, y coordinates of points of the polygons that make up
+ # the outline of each object instance. These are stored in the
+ # shape_attributes (see json format above)
+ # The if condition is needed to support VIA versions 1.x and 2.x.
+ if type(a['regions']) is dict:
+ polygons = [r['shape_attributes']
+ for r in a['regions'].values()]
+ else:
+ polygons = [r['shape_attributes'] for r in a['regions']]
+
+ # load_mask() needs the image size to convert polygons to masks.
+ # Unfortunately, VIA doesn't include it in JSON, so we must read
+ # the image. This is only manageable since the dataset is tiny.
+ image_path = os.path.join(dataset_dir, a['filename'])
+ image = skimage.io.imread(image_path)
+ height, width = image.shape[:2]
+
+ class_list = [r['region_attributes'] for r in a['regions']]
+
+ self.add_image(
+ "pointless_package",
+ image_id=a['filename'], # use file name as a unique image id
+ path=image_path,
+ width=width, height=height,
+ class_list=class_list,
+ polygons=polygons)
+
+ def load_mask(self, image_id):
+ """Generate instance masks for an image.
+ Returns:
+ masks: A bool array of shape [height, width, instance count] with
+ one mask per instance.
+ class_ids: a 1D array of class IDs of the instance masks.
+ """
+ class_ids = list()
+ # If not a pointless_package dataset image, delegate to parent class.
+ image_info = self.image_info[image_id]
+ # if image_info["source"] != "pointless_package":
+ # return super(self.__class__, self).load_mask(image_id)
+
+ # Convert polygons to a bitmap mask of shape
+ # [height, width, instance_count]
+ info = self.image_info[image_id]
+ # print("\n\n\nIMAGE INFO:", info, "\n\n\n\n")
+
+ for box_type in info['class_list']:
+ # print(box_type['name'])
+ class_ids.append(self.class_names.index(str(box_type['name'])))
+ # print(class_ids)
+ # print(self.class_names)
+
+ mask = np.zeros([info["height"], info["width"], len(info["polygons"])],
+ dtype=np.uint8)
+ for i, p in enumerate(info["polygons"]):
+ # Get indexes of pixels inside the polygon and set them to 1
+ rr, cc = skimage.draw.polygon(p['all_points_y'], p['all_points_x'])
+ mask[rr, cc, i] = 1
+ # Return mask, and the array of class IDs of each instance, one per
+ # polygon, looked up from the region's class name above.
+ return mask.astype(np.bool), np.asarray(class_ids, dtype=np.int32)
+
+ def image_reference(self, image_id):
+ """Return the path of the image."""
+ info = self.image_info[image_id]
+ if info["source"] == "pointless_package":
+ return info["path"]
+ else:
+ return super(self.__class__, self).image_reference(image_id)
+
+
+my_dataset_dir = MY_ABS_PATH + 'dataset/'
+
+train_set = PPDataset()
+train_set.load_dataset(
+ my_dataset_dir, "train")
+train_set.prepare()
+print('Train: %d' % len(train_set.image_ids))
+# prepare test/val set
+test_set = PPDataset()
+test_set.load_dataset(
+ my_dataset_dir, "val")
+test_set.prepare()
+print('Test: %d' % len(test_set.image_ids))
+
+
+# Train the network weights. With layers='all', every layer is fine-tuned,
+# not just the output 'heads'.
+model.train(train_set, test_set, learning_rate=config.LEARNING_RATE,
+ epochs=5, layers='all')
+
+history = model.keras_model.history.history
+
+model.get_trainable_layers()
+
+
+model_path = MY_ABS_PATH + 'models/mask_rcnn_final.h5'
+model.keras_model.save_weights(model_path)
diff --git a/mask_rcnn/trainer_voc.py b/mask_rcnn/trainer_voc.py
new file mode 100644
index 00000000..9da9428b
--- /dev/null
+++ b/mask_rcnn/trainer_voc.py
@@ -0,0 +1,198 @@
+from xml.etree import ElementTree
+from os import listdir
+from mrcnn.config import Config
+from mrcnn import model as modellib
+from mrcnn import visualize
+import mrcnn
+from mrcnn.utils import Dataset
+from mrcnn.model import MaskRCNN
+
+import numpy as np
+from numpy import zeros
+from numpy import asarray
+import colorsys
+import argparse
+import imutils
+import random
+import cv2
+import os
+import time
+
+from matplotlib import pyplot
+from matplotlib.patches import Rectangle
+from keras.models import load_model
+
+# Training configuration, inheriting from the base Config class
+
+MY_ABS_PATH = "./"
+PP_LABELS=[]
+
+class PPConfig(Config):
+ """Configuration for training on the toy dataset.
+ Derives from the base Config class and overrides some values.
+ """
+ # Give the configuration a recognizable name
+ NAME = "pointless_package"
+
+    # A GPU with 12GB memory can typically fit two images; we keep it at one
+    # image per GPU to be safe. Adjust to match your GPU memory.
+ IMAGES_PER_GPU = 1
+
+ # Number of classes (including background)
+ NUM_CLASSES = 1 + 3 # Background + outerbox + innerbox + product
+
+ # Number of training steps per epoch
+ STEPS_PER_EPOCH = 100
+
+ # Skip detections with < 90% confidence
+ DETECTION_MIN_CONFIDENCE = 0.9
+
+config = PPConfig()
+config.display()
+
+print("Loading Mask R-CNN model...")
+my_model_dir = MY_ABS_PATH + 'models/'
+model = modellib.MaskRCNN(
+ mode="training", config=config, model_dir=my_model_dir)
+
+# Load the COCO pre-trained weights, excluding the output layers that depend
+# on the number of classes
+model.load_weights('./models/mask_rcnn_coco.h5',
+ by_name=True,
+ exclude=["mrcnn_class_logits", "mrcnn_bbox_fc", "mrcnn_bbox", "mrcnn_mask"])
+
+model.keras_model.summary()
+
+
+class PPDataset(Dataset):
+ # load the dataset definitions
+ def load_dataset(self, dataset_dir, is_train=True):
+
+        # Add our three classes: outerbox, innerbox, and product.
+ self.add_class("dataset", 1, "outerbox")
+ self.add_class("dataset", 2, "innerbox")
+ self.add_class("dataset", 3, "product")
+
+ # define data locations for images and annotations
+ images_dir = dataset_dir + 'images/'
+ annotations_dir = dataset_dir + 'annotations/'
+
+        # Iterate through all files in the folder to add
+        # the images and their annotations to the dataset.
+ for filename in listdir(images_dir):
+
+ # extract image id
+ image_id = filename[:-4]
+
+ # skip bad images
+ if image_id in ['00090']:
+ continue
+ # skip all images after 150 if we are building the train set
+ if is_train and int(image_id[4:]) >= 150:
+ continue
+ # skip all images before 150 if we are building the test/val set
+ if not is_train and int(image_id[4:]) < 150:
+ continue
+
+ # setting image file
+ img_path = images_dir + filename
+
+ # setting annotations file
+ ann_path = annotations_dir + image_id + '.xml'
+
+ # adding images and annotations to dataset
+ self.add_image('dataset', image_id=image_id,
+ path=img_path, annotation=ann_path)
+
+ # extract bounding boxes from an annotation file
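+    # The annotation files are expected to follow the standard PASCAL-VOC
+    # layout, e.g. (illustrative values only):
+    #   <annotation>
+    #     <size><width>300</width><height>400</height></size>
+    #     <object>
+    #       <name>outerbox</name>
+    #       <bndbox>
+    #         <xmin>10</xmin><ymin>20</ymin><xmax>200</xmax><ymax>300</ymax>
+    #       </bndbox>
+    #     </object>
+    #   </annotation>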
+ def extract_boxes(self, filename):
+
+ # load and parse the file
+ tree = ElementTree.parse(filename)
+ # get the root of the document
+ root = tree.getroot()
+ # extract each bounding box
+ boxes = list()
+ for box in root.findall('.//object'):
+ name = box.find('name').text
+ xmin = int(box.find('.//bndbox').find('xmin').text)
+ ymin = int(box.find('.//bndbox').find('ymin').text)
+ xmax = int(box.find('.//bndbox').find('xmax').text)
+ ymax = int(box.find('.//bndbox').find('ymax').text)
+ coors = [xmin, ymin, xmax, ymax, name]
+ boxes.append(coors)
+
+ # for i, product in enumerate(root.findall('.//object')):
+ # name = product.find('name').text
+ # print(name)
+
+ # extract image dimensions
+ width = int(root.find('.//size/width').text)
+ height = int(root.find('.//size/height').text)
+ return boxes, width, height
+
+    # load the masks for an image
+    def load_mask(self, image_id):
+        """Generate instance masks for an image.
+        Returns:
+         masks: A bool array of shape [height, width, instance count] with
+             one mask per instance.
+         class_ids: a 1D array of class IDs of the instance masks.
+        """
+ # get details of image
+ info = self.image_info[image_id]
+
+        # define annotation file location
+ path = info['annotation']
+
+ # load XML
+ boxes, w, h = self.extract_boxes(path)
+
+ # create one array for all masks, each on a different channel
+ masks = zeros([h, w, len(boxes)], dtype=np.uint8)
+
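+        # NOTE: with box-only VOC annotations these masks are filled
+        # rectangles covering each bounding box, not tight object outlines.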
+ # create masks
+ class_ids = list()
+ for i in range(len(boxes)):
+ box = boxes[i]
+ row_s, row_e = box[1], box[3]
+ col_s, col_e = box[0], box[2]
+ masks[row_s:row_e, col_s:col_e, i] = 1
+ class_ids.append(self.class_names.index(box[4]))
+ return masks, asarray(class_ids, dtype=np.int32)
+
+    # load an image reference
+    def image_reference(self, image_id):
+        """Return the path of the image."""
+ info = self.image_info[image_id]
+ print(info)
+ return info['path']
+
+
+my_dataset_dir = MY_ABS_PATH + 'dataset/'
+
+train_set = PPDataset()
+train_set.load_dataset(
+ my_dataset_dir, is_train=True)
+train_set.prepare()
+print('Train: %d' % len(train_set.image_ids))
+# prepare test/val set
+test_set = PPDataset()
+test_set.load_dataset(
+ my_dataset_dir, is_train=False)
+test_set.prepare()
+print('Test: %d' % len(test_set.image_ids))
+
+
+# Train only the head layers (RPN, classifier and mask branches);
+# the COCO-pretrained backbone weights stay frozen at this stage.
+model.train(train_set, test_set, learning_rate=config.LEARNING_RATE,
+ epochs=5, layers='heads')
+
+history = model.keras_model.history.history
+
+model.get_trainable_layers()
+
+
+model_path = MY_ABS_PATH + 'models/mask_rcnn_' + str(time.time()) + '.h5'
+model.keras_model.save_weights(model_path)
diff --git a/opencv_attempts/BoxDetect.py b/opencv_attempts/BoxDetect.py
new file mode 100644
index 00000000..9997f0a2
--- /dev/null
+++ b/opencv_attempts/BoxDetect.py
@@ -0,0 +1,54 @@
+import numpy as np
+import cv2
+import matplotlib.pyplot as plt
+import sys
+
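+# Usage: python3 BoxDetect.py <name of an image in images/, without the .jpg
+# extension>, e.g. `python3 BoxDetect.py 5` reads images/5.jpg.
+# Defaults to images/box_1.jpg when no argument is given.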
+path = 'images/'
+inf_addr = 'box_1'
+print(sys.argv)
+addr = (path+inf_addr+'.jpg') if len(sys.argv) < 2 else (path +
+ sys.argv[1]+'.jpg')
+
+img = cv2.imread(addr, 0)  # read as grayscale
+
+BINS = 20
+np_hist, _ = np.histogram(img, bins=BINS)
+print(np_hist)
+
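+# cv2.calcHist treats the upper bound of the range as exclusive, so nudge dmax
+# just past the maximum pixel value to make the OpenCV histogram comparable to
+# np.histogram, whose last bin includes its right edge.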
+dmin, dmax, _, _ = cv2.minMaxLoc(img)
+if np.issubdtype(img.dtype, np.floating):
+ dmax += np.finfo(img.dtype).eps
+else:
+ dmax += 1
+
+cv_hist = cv2.calcHist([img], [0], None, [BINS], [dmin, dmax]).flatten()
+
+# data = np.reshape(img, (-1, 3))
+# print(data.shape)
+# data = np.float32(data)
+
+# criteria = (cv2.TERM_CRITERIA_EPS + cv2.TERM_CRITERIA_MAX_ITER, 10, 1.0)
+# flags = cv2.KMEANS_RANDOM_CENTERS
+# compactness, labels, centers = cv2.kmeans(data, 1, None, criteria, 10, flags)
+
+# centers[0] = centers[0].astype(int)
+
+
+# img = cv2.cvtColor(img, cv2.COLOR_BGR2HSV)
+# canvas = np.zeros(img.shape)
+
+# img_blur = cv2.GaussianBlur(img, (7,7), 0)
+
+# min_color = np.array(centers[0]-20)
+# max_color = np.array(centers[0]+20)
+
+# mask1 = cv2.inRange(img_blur, min_color, max_color)
+
+plt.plot(np_hist, '-', label='numpy')
+plt.plot(cv_hist, '-', label='opencv')
+
+plt.legend()
+plt.show()
+# cv2.imshow('',mask1)
+cv2.waitKey(0)
+cv2.destroyAllWindows()
diff --git a/opencv_attempts/countours.py b/opencv_attempts/countours.py
new file mode 100644
index 00000000..a3ab2ee0
--- /dev/null
+++ b/opencv_attempts/countours.py
@@ -0,0 +1,44 @@
+import numpy as np
+import cv2
+import matplotlib.pyplot as plt
+import sys
+import random
+
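+# Usage: python3 countours.py <name of an image in images/, without the .jpg
+# extension>, e.g. `python3 countours.py 5`. Defaults to images/box_1.jpg.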
+path = 'images/'
+inf_addr = 'box_1'
+print(sys.argv)
+addr = (path+inf_addr+'.jpg') if len(sys.argv) < 2 else (path + sys.argv[1]+'.jpg')
+
+img = cv2.imread(addr)
+img_gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
+img_gray = cv2.GaussianBlur(img_gray, (7, 7), 3)
+canvas = np.zeros(img.shape, dtype=np.uint8)
+
+canny_edges = cv2.Canny(img_gray, 1, 100)
+# canny_edges = cv2.dilate(canny_edges, None, iterations=2)
+# canny_edges = cv2.erode(canny_edges, None, iterations=2)
+
+canny_contours, hierarchy = cv2.findContours(canny_edges, cv2.RETR_TREE, cv2.CHAIN_APPROX_NONE)
+
+# cv2.drawContours(canvas, canny_contours, -1, (255, 255, 255), 2)
+
+
+cntsSorted = sorted(
+ canny_contours, key=lambda x: cv2.contourArea(x), reverse=True)
+# cntsSorted = sorted(cnts, key=lambda x: cv2.arcLength(x, True), reverse=True)
+cnt_max = cv2.contourArea(cntsSorted[0])
+""" DRAW CONTOUR IMAGE """
+for i, c in enumerate(cntsSorted):
+ if 0 < cv2.contourArea(c) <= cnt_max:
+ color = random.randint(1, 1000) % 255
+        cv2.drawContours(canvas, [c], -1, (color, color, color), 1)
+        print("Color:", color, "Area:", cv2.contourArea(c))
+        cv2.imshow('CannyCanvas', canvas)
+        cv2.waitKey(200)
+
+# cv2.drawContours(img, contours, 5, (0,255,0), 3)
+
+cv2.imshow('',img)
+# cv2.imshow('CannyEdges', canny_edges)
+cv2.waitKey(0)
+cv2.destroyAllWindows()
diff --git a/opencv_attempts/detect.py b/opencv_attempts/detect.py
new file mode 100644
index 00000000..404cfec6
--- /dev/null
+++ b/opencv_attempts/detect.py
@@ -0,0 +1,83 @@
+import numpy as np
+import cv2
+import matplotlib.pyplot as plt
+
+import sys
+
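+# Usage: python3 detect.py <name of an image in images/, without the .jpg
+# extension>, e.g. `python3 detect.py 5`. Defaults to images/box_1.jpg.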
+path = 'images/'
+inf_addr = 'box_1'
+print(sys.argv)
+addr = (path+inf_addr+'.jpg') if len(sys.argv) < 2 else (path + sys.argv[1]+'.jpg')
+
+
+img = cv2.imread(addr)
+
+Z = img.reshape((-1, 3))
+
+# convert to np.float32
+Z = np.float32(Z)
+
+# define criteria, number of clusters(K) and apply kmeans()
+criteria = (cv2.TERM_CRITERIA_EPS + cv2.TERM_CRITERIA_MAX_ITER, 10, 1.0)
+K = 3
+ret, label, center = cv2.kmeans(
+ Z, K, None, criteria, 10, cv2.KMEANS_RANDOM_CENTERS)
+
+# Now convert back into uint8, and make original image
+center = np.uint8(center)
+res = center[label.flatten()]
+res2 = res.reshape((img.shape))
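+# res2 is the colour-quantized image: every pixel has been replaced by the
+# nearest of the K cluster centres found by k-means.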
+
+
+img_gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
+# img_gray = res2
+
+# kernel = np.array([[-1, -1, -1], [-1, 9, -1], [-1, -1, -1]])
+# img_gray = cv2.filter2D(img_gray, -1, kernel)
+
+img_gray = cv2.GaussianBlur(img_gray, (7, 7), 3)
+img_gray2 = img_gray.copy()
+
+canvas = np.zeros(shape=img.shape)
+
+edged = cv2.Canny(img_gray, 0, 65)
+edged = cv2.dilate(edged, None, iterations=1)
+edged = cv2.erode(edged, None, iterations=1)
+
+ret, thresh = cv2.threshold(img_gray2, 127, 255, 0)
+
+cnts, hierarchy = cv2.findContours(
+ edged.copy(), cv2.RETR_TREE, cv2.CHAIN_APPROX_SIMPLE)
+
+
+# contours, _ = cv2.findContours(
+# thresh, cv2.RETR_TREE, cv2.CHAIN_APPROX_SIMPLE)
+
+cv2.drawContours(img, cnts, -1, (0, 255, 0), 3)
+ddepth = -1
+ind = 2
+kernel_size = 3 + 2 * (ind % 5)
+kernel = np.ones((kernel_size, kernel_size), dtype=np.float32)
+kernel /= (kernel_size * kernel_size)
+
+dst = cv2.filter2D(img, ddepth, kernel)
+
+# cnts = cnts[0] if imutils.is_cv2() else cnts[1]
+cntsSorted = sorted(cnts, key=lambda x: cv2.contourArea(x), reverse=True)
+# cntsSorted = sorted(cnts, key=lambda x: cv2.arcLength(x, True), reverse=True)
+
+""" DRAW CONTOUR IMAGE """
+for i, c in enumerate(cntsSorted):
+    cv2.drawContours(canvas, [c], -1, (255, 255, 255), 2)
+    print(cv2.contourArea(c))
+    cv2.imshow('Canny', canvas)
+    cv2.waitKey(100)
+
+# cv2.imshow("Custom Filter", dst)
+
+# cv2.imshow('', img)
+# cv2.imshow('Threshold Contours', thresh)
+cv2.imshow('Color Quantization', res2)
+cv2.waitKey(0)
+cv2.destroyAllWindows()
+
diff --git a/opencv_attempts/images/1.jpg b/opencv_attempts/images/1.jpg
new file mode 100644
index 00000000..1c2ccd99
Binary files /dev/null and b/opencv_attempts/images/1.jpg differ
diff --git a/opencv_attempts/images/10.jpg b/opencv_attempts/images/10.jpg
new file mode 100644
index 00000000..928f06cb
Binary files /dev/null and b/opencv_attempts/images/10.jpg differ
diff --git a/opencv_attempts/images/11.jpg b/opencv_attempts/images/11.jpg
new file mode 100644
index 00000000..a0ae6cf3
Binary files /dev/null and b/opencv_attempts/images/11.jpg differ
diff --git a/opencv_attempts/images/12.jpg b/opencv_attempts/images/12.jpg
new file mode 100644
index 00000000..1640f87e
Binary files /dev/null and b/opencv_attempts/images/12.jpg differ
diff --git a/opencv_attempts/images/13.jpg b/opencv_attempts/images/13.jpg
new file mode 100644
index 00000000..a3dca8f6
Binary files /dev/null and b/opencv_attempts/images/13.jpg differ
diff --git a/opencv_attempts/images/14.jpg b/opencv_attempts/images/14.jpg
new file mode 100644
index 00000000..d7c8faff
Binary files /dev/null and b/opencv_attempts/images/14.jpg differ
diff --git a/opencv_attempts/images/15.jpg b/opencv_attempts/images/15.jpg
new file mode 100644
index 00000000..fd667ea6
Binary files /dev/null and b/opencv_attempts/images/15.jpg differ
diff --git a/opencv_attempts/images/16.jpg b/opencv_attempts/images/16.jpg
new file mode 100644
index 00000000..782024eb
Binary files /dev/null and b/opencv_attempts/images/16.jpg differ
diff --git a/opencv_attempts/images/17.jpg b/opencv_attempts/images/17.jpg
new file mode 100644
index 00000000..2c820657
Binary files /dev/null and b/opencv_attempts/images/17.jpg differ
diff --git a/opencv_attempts/images/18.jpg b/opencv_attempts/images/18.jpg
new file mode 100644
index 00000000..33f123af
Binary files /dev/null and b/opencv_attempts/images/18.jpg differ
diff --git a/opencv_attempts/images/19.jpg b/opencv_attempts/images/19.jpg
new file mode 100644
index 00000000..98fa6ff2
Binary files /dev/null and b/opencv_attempts/images/19.jpg differ
diff --git a/opencv_attempts/images/2.jpg b/opencv_attempts/images/2.jpg
new file mode 100644
index 00000000..c7e8400c
Binary files /dev/null and b/opencv_attempts/images/2.jpg differ
diff --git a/opencv_attempts/images/20.jpg b/opencv_attempts/images/20.jpg
new file mode 100644
index 00000000..288a6a96
Binary files /dev/null and b/opencv_attempts/images/20.jpg differ
diff --git a/opencv_attempts/images/21.jpg b/opencv_attempts/images/21.jpg
new file mode 100644
index 00000000..47eb3ad8
Binary files /dev/null and b/opencv_attempts/images/21.jpg differ
diff --git a/opencv_attempts/images/3.jpg b/opencv_attempts/images/3.jpg
new file mode 100644
index 00000000..d11c31f8
Binary files /dev/null and b/opencv_attempts/images/3.jpg differ
diff --git a/opencv_attempts/images/4.jpg b/opencv_attempts/images/4.jpg
new file mode 100644
index 00000000..0c651d1e
Binary files /dev/null and b/opencv_attempts/images/4.jpg differ
diff --git a/opencv_attempts/images/5.jpg b/opencv_attempts/images/5.jpg
new file mode 100644
index 00000000..290b658e
Binary files /dev/null and b/opencv_attempts/images/5.jpg differ
diff --git a/opencv_attempts/images/6.jpg b/opencv_attempts/images/6.jpg
new file mode 100644
index 00000000..c2462720
Binary files /dev/null and b/opencv_attempts/images/6.jpg differ
diff --git a/opencv_attempts/images/7.jpg b/opencv_attempts/images/7.jpg
new file mode 100644
index 00000000..82052589
Binary files /dev/null and b/opencv_attempts/images/7.jpg differ
diff --git a/opencv_attempts/images/8.jpg b/opencv_attempts/images/8.jpg
new file mode 100644
index 00000000..b5133d9c
Binary files /dev/null and b/opencv_attempts/images/8.jpg differ
diff --git a/opencv_attempts/images/9.jpg b/opencv_attempts/images/9.jpg
new file mode 100644
index 00000000..66e89582
Binary files /dev/null and b/opencv_attempts/images/9.jpg differ
diff --git a/opencv_attempts/watershed.py b/opencv_attempts/watershed.py
new file mode 100644
index 00000000..0c84051b
--- /dev/null
+++ b/opencv_attempts/watershed.py
@@ -0,0 +1,39 @@
+import numpy as np
+import cv2 as cv
+from matplotlib import pyplot as plt
+import sys
+
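+# Usage: python3 watershed.py <file name of an image in images/, including the
+# extension>, e.g. `python3 watershed.py 5.jpg`. Defaults to images/box_1.jpg.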
+path = 'images/'
+inf_addr = 'box_1'
+print(sys.argv)
+addr = (path+inf_addr+'.jpg') if len(sys.argv) < 2 else (path + sys.argv[1])
+
+img = cv.imread(addr)
+gray = cv.cvtColor(img, cv.COLOR_BGR2GRAY)
+ret, thresh = cv.threshold(gray, 0, 255, cv.THRESH_BINARY_INV+cv.THRESH_OTSU)
+
+# noise removal
+kernel = np.ones((3, 3), np.uint8)
+opening = cv.morphologyEx(thresh, cv.MORPH_OPEN, kernel, iterations=2)
+# sure background area
+sure_bg = cv.dilate(opening, kernel, iterations=3)
+# Finding sure foreground area
+dist_transform = cv.distanceTransform(opening, cv.DIST_L2, 5)
+ret, sure_fg = cv.threshold(dist_transform, 0.7*dist_transform.max(), 255, 0)
+# Finding unknown region
+sure_fg = np.uint8(sure_fg)
+unknown = cv.subtract(sure_bg, sure_fg)
+
+# Marker labelling
+ret, markers = cv.connectedComponents(sure_fg)
+# Add one to all labels so that sure background is not 0, but 1
+markers = markers+1
+# Now, mark the region of unknown with zero
+markers[unknown == 255] = 0
+
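+# cv.watershed marks boundary pixels between segments with -1; colour them
+# blue (BGR [255, 0, 0]) so the borders stand out in the displayed image.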
+markers = cv.watershed(img, markers)
+img[markers == -1] = [255, 0, 0]
+
+cv.imshow('', img)
+cv.waitKey(0)
+cv.destroyAllWindows()
diff --git a/yoosuf_scripts/rename.py b/yoosuf_scripts/rename.py
new file mode 100644
index 00000000..a2d3f0f0
--- /dev/null
+++ b/yoosuf_scripts/rename.py
@@ -0,0 +1,70 @@
+
+'''
+Simple Python script to rename all files in a directory to the
+ECS 193A naming convention (IMG_<n>.jpg).
+'''
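+# Example (hypothetical paths):
+#   python3 rename.py --dir raw_photos/ --newdir dataset/train/ --start 0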
+
+
+import argparse
+
+import io
+import os
+import shutil
+import random
+
+def parse_args():
+ '''
+ Get command line args.
+ '''
+
+ parser = argparse.ArgumentParser()
+ parser.add_argument('--dir', required=True, help='path to \
+ directory with images', dest='dir')
+
+ parser.add_argument('--newdir', required=True, help='path to \
+ new directory with renamed images', dest='new_dir')
+
+ parser.add_argument('--start', required=True, help='naming \
+ starting number', dest='num_start', type=int)
+
+ args = parser.parse_args()
+
+ return args
+
+def rename(files, nums_start):
+ '''
+ Renames the files in a directory.
+ '''
+
+def main():
+
+ args = parse_args()
+
+ try:
+ files = os.listdir(args.dir)
+    except (FileNotFoundError, NotADirectoryError):
+        print("No such directory:", args.dir)
+ raise
+
+ new_directory = args.new_dir
+
+ # randomize the files
+ random.shuffle(files)
+
+ #os.mkdir(new_directory)
+ shutil.copytree(args.dir, new_directory)
+
+ current_index = args.num_start
+
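+    # NOTE: every copied file is renamed to IMG_<n>.jpg regardless of its
+    # original extension, so the source directory should contain JPEGs only.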
+ for file in files:
+ full_name = os.path.join(new_directory, file)
+        new_name = os.path.join(new_directory,
+                                'IMG_' + str(current_index) + '.jpg')
+
+ current_index += 1
+ os.rename(full_name, new_name)
+
+ print("Rename successful!")
+
+if __name__ == "__main__":
+ main()
diff --git a/yoosuf_scripts/resize.py b/yoosuf_scripts/resize.py
new file mode 100644
index 00000000..2d92386b
--- /dev/null
+++ b/yoosuf_scripts/resize.py
@@ -0,0 +1,88 @@
+import argparse
+import io
+import os
+import sys
+import shutil
+import cv2
+
+width = 300
+accepted_extensions = ['.jpg', '.jpeg', '.png', '.gif']
+
+description = "Simple script that takes a directory of images and resizes them to width of " + str(width) + "px while still maintaining the aspect ratio."
+
+def parse_args():
+ parser = argparse.ArgumentParser(description=description)
+ parser.add_argument('--src', required=True, help='Path to the directory with source images', dest='src')
+ parser.add_argument('--dest', required=False, help='[Optional] New target directory. If supplied, a new directory will be created and all images will be copied and resized in this directory.', dest='dest')
+
+ return parser.parse_args()
+
+def query_yes_no():
+ print("\n* You have NOT specified a destination.\nThe script will rewrite images to the same directory and original images will not be saved.\nAre you sure you want to continue?\n")
+
+ yes = {'yes', 'y', 'ye', ''}
+ no = {'no', 'n'}
+ print("Please respond with 'y' or 'n':", end=' ')
+ while True:
+ choice = input().lower()
+ if choice in yes:
+ return True
+ elif choice in no:
+ return False
+ else:
+ print("Please respond with 'y' or 'n':", end=' ')
+
+def main():
+ args = parse_args()
+ source_dir = args.src # source directory name
+ dest_dir = args.dest # destination directory name
+ op_dir = source_dir # operation directory
+
+    if not os.path.isdir(source_dir):
+        print("Please enter a valid source directory.")
+        raise NotADirectoryError(source_dir)
+
+    if dest_dir is None and not query_yes_no():
+        print("Script aborted.")
+        raise SystemExit
+
+    if dest_dir is not None:
+        # Copy all files from the source to the destination directory and
+        # operate on the copies instead of the originals.
+        shutil.copytree(source_dir, dest_dir)
+        op_dir = dest_dir
+
+    try:
+        # Get all files in the operation directory
+        files = os.listdir(op_dir)
+    except (FileNotFoundError, NotADirectoryError):
+        print("Invalid directory:", op_dir)
+        raise
+
+ """ Check if absolute path """
+ file_path = ''
+ if os.path.isabs(op_dir) == False:
+ file_path = './' + op_dir + '/'
+
+ resized = 0
+ total_img = 0
+
+    for file in files:
+        img_name = file_path + file
+        # only process recognised image extensions
+        if os.path.splitext(img_name)[1].lower() in accepted_extensions:
+            img = cv2.imread(img_name)
+            orig_dim = img.shape  # (height, width, channels)
+            total_img += 1
+            if orig_dim[1] < 301:
+                print("Did not resize", file, "with dimensions", orig_dim[:2])
+                continue
+            # cv2.resize takes dsize as (width, height): fix the width at
+            # `width` px and scale the height to keep the aspect ratio.
+            new_dim = (width, int((width / orig_dim[1]) * orig_dim[0]))
+            resized_img = cv2.resize(img, new_dim, interpolation=cv2.INTER_AREA)
+            cv2.imwrite(img_name, resized_img)
+            resized += 1
+            print("Resized", file, "from", orig_dim[:2], "->", resized_img.shape[:2])
+
+ print(f"\nImages Resized: {resized} out of {total_img} images.")
+ print("Done!")
+
+if __name__ == "__main__":
+ main()