Skip to content

Object Detection Mask R-CNN model: Examples

These are example predictions from the model; the images are from the COCO dataset.

Horse with Guard

Horse with Guard Segmented

JSON outputs:

{
    "labels":
        ["horse 100%", "person 99%", "person 99%", "person 99%", "person 98%", "person 93%", "person 92%", "frisbee 90%", "umbrella 89%", "person 53%"],
    "boxes": [
        [127.11386108398438, 247.31301879882812, 465.427978515625, 480.0],
        [254.72451782226562, 164.79159545898438, 335.8401184082031, 401.29840087890625],
        [0.9573012590408325, 279.462646484375, 75.12348175048828, 479.47015380859375],
        [49.450260162353516, 275.5840759277344, 79.73651123046875, 369.51434326171875],
        [114.95684051513672, 268.72479248046875, 149.48388671875, 397.9055480957031],
        [512.51806640625, 279.2389831542969, 561.9500732421875, 382.5887145996094],
        [560.3663330078125, 272.36761474609375, 598.057373046875, 356.83721923828125],
        [306.2652587890625, 147.22177124023438, 315.6444396972656, 168.5187225341797],
        [507.4710388183594, 267.3088684082031, 571.6740112304688, 296.2601623535156],
        [594.297607421875, 264.638427734375, 614.7077026367188, 345.806396484375]
    ]
}

Cat and Fruits

Cat and Fruits Segmented

JSON outputs:

{
    "labels":
        ["cat 100%", "bowl 98%", "bowl 97%", "bowl 87%", "bowl 85%", "spoon 83%", "bowl 73%"],
    "boxes": [
        [216.59927368164062, 240.20263671875, 407.5367736816406, 379.2315979003906],
        [134.87890625, 55.9307746887207, 245.2788543701172, 120.02284240722656],
        [233.0037841796875, 57.83541488647461, 345.0400695800781, 124.89885711669922],
        [208.5238494873047, 26.521167755126953, 306.4939880371094, 66.13530731201172],
        [328.00067138671875, 69.58489990234375, 475.267578125, 137.90792846679688],
        [352.06707763671875, 43.44765853881836, 444.8140563964844, 97.2989730834961],
        [344.8138122558594, 47.5083122253418, 483.6903991699219, 101.86201477050781]
    ]
}

Cars

Cars Segmented

JSON outputs:

{
    "labels":
        ["car 100%", "bus 100%", "car 100%", "traffic light 99%", "car 99%", "person 99%", "person 98%", "traffic light 96%", "person 93%", "traffic light 91%", "traffic light 83%", "truck 80%", "handbag 80%", "car 70%", "traffic light 59%"],
    "boxes": [
        [69.4033432006836, 426.4164733886719, 149.56976318359375, 481.8005065917969],
        [310.7447509765625, 345.19073486328125, 477.2540283203125, 433.0453796386719],
        [177.8173065185547, 427.03253173828125, 302.9234619140625, 499.82196044921875],
        [268.3243103027344, 223.73086547851562, 284.3643798828125, 269.1820068359375],
        [146.38888549804688, 406.3042297363281, 227.71038818359375, 457.7203063964844],
        [331.662109375, 403.6127014160156, 351.7901916503906, 471.7012939453125],
        [345.9764404296875, 402.6434020996094, 372.4714050292969, 476.3934020996094],
        [188.65028381347656, 268.1125793457031, 205.47999572753906, 300.27154541015625],
        [301.6253662109375, 402.1319580078125, 324.9884948730469, 471.702880859375],
        [152.59521484375, 353.8171691894531, 165.1454315185547, 377.0882873535156],
        [393.2215576171875, 340.48114013671875, 406.4432373046875, 379.64910888671875],
        [370.30169677734375, 393.1182861328125, 626.0230712890625, 517.6090698242188],
        [350.5939025878906, 440.16851806640625, 373.4088439941406, 459.9479675292969],
        [368.0306701660156, 391.2562561035156, 630.3673095703125, 518.3442993164062],
        [179.05198669433594, 274.235595703125, 189.63931274414062, 302.0262756347656]
    ]
}

Apartment

Apartment Segmented

JSON outputs:

{
    "labels":
        ["chair 100%", "tv 99%", "couch 98%", "book 98%", "chair 97%", "book 96%", "book 93%", "book 89%", "book 89%", "book 85%", "book 85%", "potted plant 85%", "book 83%", "book 78%", "sink 74%", "book 74%", "dining table 71%", "kite 65%", "book 62%", "book 56%", "potted plant 51%"],
    "boxes": [
        [397.0080871582031, 227.0098419189453, 434.8014221191406, 272.74005126953125],
        [294.5870056152344, 162.546875, 348.7562255859375, 229.76153564453125],
        [439.57012939453125, 234.3487091064453, 638.8670654296875, 425.19976806640625],
        [83.99020385742188, 50.07662582397461, 106.09722900390625, 95.44261169433594],
        [371.9010925292969, 228.10035705566406, 395.4789123535156, 273.06939697265625],
        [102.85154724121094, 66.02977752685547, 117.60905456542969, 101.30097961425781],
        [148.7110595703125, 74.6741943359375, 161.63345336914062, 112.49417114257812],
        [133.4478302001953, 67.26869201660156, 146.62644958496094, 107.57303619384766],
        [127.7191162109375, 69.1695327758789, 136.9913330078125, 106.4194564819336],
        [159.2508087158203, 77.82789611816406, 175.79454040527344, 115.42021179199219],
        [119.92369079589844, 67.9338607788086, 130.61831665039062, 104.94882202148438],
        [347.1818542480469, 225.17445373535156, 374.7388610839844, 261.9774169921875],
        [140.70831298828125, 72.62095642089844, 154.50926208496094, 110.36141204833984],
        [153.75611877441406, 76.79235076904297, 168.7827606201172, 113.96331787109375],
        [289.7503662109375, 243.23162841796875, 308.880859375, 249.50302124023438],
        [113.4874496459961, 70.3045883178711, 120.75492095947266, 101.65245819091797],
        [377.31414794921875, 227.15528869628906, 418.45599365234375, 267.8934020996094],
        [414.75921630859375, 27.752643585205078, 443.8397521972656, 55.12297821044922],
        [117.49675750732422, 70.71876525878906, 124.38624572753906, 102.8495101928711],
        [115.36309051513672, 66.74239349365234, 137.70584106445312, 104.43795013427734],
        [589.8953247070312, 159.18565368652344, 637.3837280273438, 302.1114807128906]
    ]
}

Dog and Birds

Dog and Birds Segmented

JSON outputs:

{
    "labels":
        ["bird 100%", "dog 99%", "bird 99%", "bird 99%", "bird 98%", "bird 98%", "person 57%"],
    "boxes": [
        [124.48042297363281, 91.6610107421875, 194.98130798339844, 143.6868438720703],
        [241.64671325683594, 136.6213836669922, 505.2481384277344, 471.4105529785156],
        [448.51885986328125, 2.485529899597168, 484.5710144042969, 25.771272659301758],
        [125.61963653564453, 125.44010162353516, 177.6766815185547, 213.96636962890625],
        [493.65057373046875, 0.17544308304786682, 532.5198974609375, 15.87779712677002],
        [357.76556396484375, 69.29669952392578, 426.5431823730469, 110.34757995605469],
        [139.05882263183594, 375.3800354003906, 348.6045837402344, 476.62109375]
    ]
}

Hot Dog Stand

Hot Dog Stand Segmented

JSON outputs:

{
    "labels":
        ["cat 100%", "bowl 98%", "bowl 97%", "bowl 87%", "bowl 85%", "spoon 83%", "bowl 73%"],
    "boxes": [
        [216.59927368164062, 240.20263671875, 407.5367736816406, 379.2315979003906],
        [134.87890625, 55.9307746887207, 245.2788543701172, 120.02284240722656],
        [233.0037841796875, 57.83541488647461, 345.0400695800781, 124.89885711669922],
        [208.5238494873047, 26.521167755126953, 306.4939880371094, 66.13530731201172],
        [328.00067138671875, 69.58489990234375, 475.267578125, 137.90792846679688],
        [352.06707763671875, 43.44765853881836, 444.8140563964844, 97.2989730834961],
        [344.8138122558594, 47.5083122253418, 483.6903991699219, 101.86201477050781]
    ]
}