## Image 1

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.3585329055786133,
"label": "water_sport, aquatics"
},
{
"score": 0.0551958903670311,
"label": "Delawarean, Delawarian"
},
{
"score": 0.04279031604528427,
"label": "dip, plunge"
},
{
"score": 0.025119218975305557,
"label": "sport, athletics"
},
{
"score": 0.024944499135017395,
"label": "swimming, swim"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.9670101404190063,
"label": "bicycle",
"box": {
"xmin": 777,
"ymin": 269,
"xmax": 851,
"ymax": 401
}
},
{
"score": 0.9972262978553772,
"label": "bicycle",
"box": {
"xmin": 3,
"ymin": 1067,
"xmax": 620,
"ymax": 1426
}
},
{
"score": 0.9987988471984863,
"label": "person",
"box": {
"xmin": 1046,
"ymin": 151,
"xmax": 1420,
"ymax": 724
}
},
{
"score": 0.9972848892211914,
"label": "person",
"box": {
"xmin": 1228,
"ymin": 783,
"xmax": 1314,
"ymax": 1020
}
},
{
"score": 0.9924046397209167,
"label": "person",
"box": {
"xmin": 1173,
"ymin": 748,
"xmax": 1247,
"ymax": 948
}
},
{
"score": 0.9862789511680603,
"label": "person",
"box": {
"xmin": 1351,
"ymin": 180,
"xmax": 1406,
"ymax": 350
}
},
{
"score": 0.993550181388855,
"label": "person",
"box": {
"xmin": 466,
"ymin": 617,
"xmax": 627,
"ymax": 808
}
},
{
"score": 0.9819428324699402,
"label": "person",
"box": {
"xmin": 1346,
"ymin": 739,
"xmax": 1408,
"ymax": 909
}
},
{
"score": 0.9766739010810852,
"label": "person",
"box": {
"xmin": 207,
"ymin": 269,
"xmax": 352,
"ymax": 421
}
},
{
"score": 0.9229204654693604,
"label": "person",
"box": {
"xmin": 1273,
"ymin": 177,
"xmax": 1318,
"ymax": 310
}
},
{
"score": 0.9874098896980286,
"label": "person",
"box": {
"xmin": 1227,
"ymin": 175,
"xmax": 1269,
"ymax": 306
}
},
{
"score": 0.9742178320884705,
"label": "surfboard",
"box": {
"xmin": 480,
"ymin": 1,
"xmax": 616,
"ymax": 245
}
},
{
"score": 0.9985004663467407,
"label": "person",
"box": {
"xmin": 169,
"ymin": 748,
"xmax": 465,
"ymax": 1347
}
},
{
"score": 0.9135106205940247,
"label": "boat",
"box": {
"xmin": 4,
"ymin": 10,
"xmax": 215,
"ymax": 108
}
},
{
"score": 0.984155535697937,
"label": "person",
"box": {
"xmin": 541,
"ymin": 442,
"xmax": 956,
"ymax": 1017
}
},
{
"score": 0.9939020872116089,
"label": "surfboard",
"box": {
"xmin": 377,
"ymin": 353,
"xmax": 1050,
"ymax": 1057
}
},
{
"score": 0.9974502921104431,
"label": "person",
"box": {
"xmin": 733,
"ymin": 145,
"xmax": 1076,
"ymax": 711
}
},
{
"score": 0.9994043111801147,
"label": "person",
"box": {
"xmin": 812,
"ymin": 852,
"xmax": 1069,
"ymax": 1431
}
}
]
</pre>
</details>

## Image 2

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.1708015501499176,
"label": "student, pupil, educatee"
},
{
"score": 0.12263857573270798,
"label": "pageboy"
},
{
"score": 0.08322908729314804,
"label": "tasset, tasse"
},
{
"score": 0.03783860057592392,
"label": "halter"
},
{
"score": 0.031336382031440735,
"label": "Spandau"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.9963523149490356,
"label": "person",
"box": {
"xmin": 215,
"ymin": 8,
"xmax": 1328,
"ymax": 1775
}
}
]
</pre>
</details>

## Image 3

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.3932889699935913,
"label": "ballet_skirt, tutu"
},
{
"score": 0.10553930699825287,
"label": "tugboat, tug, towboat, tower"
},
{
"score": 0.053816571831703186,
"label": "costume"
},
{
"score": 0.026449749246239662,
"label": "costume"
},
{
"score": 0.023851439356803894,
"label": "fancy_dress, masquerade, masquerade_costume"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.9526549577713013,
"label": "handbag",
"box": {
"xmin": 994,
"ymin": 694,
"xmax": 1074,
"ymax": 833
}
},
{
"score": 0.9050776362419128,
"label": "handbag",
"box": {
"xmin": 1085,
"ymin": 743,
"xmax": 1161,
"ymax": 830
}
},
{
"score": 0.996862530708313,
"label": "backpack",
"box": {
"xmin": 325,
"ymin": 655,
"xmax": 425,
"ymax": 809
}
},
{
"score": 0.9659021496772766,
"label": "person",
"box": {
"xmin": 484,
"ymin": 740,
"xmax": 527,
"ymax": 868
}
},
{
"score": 0.9855809807777405,
"label": "backpack",
"box": {
"xmin": 100,
"ymin": 672,
"xmax": 197,
"ymax": 783
}
},
{
"score": 0.9058822989463806,
"label": "person",
"box": {
"xmin": 551,
"ymin": 711,
"xmax": 605,
"ymax": 803
}
},
{
"score": 0.9988893866539001,
"label": "person",
"box": {
"xmin": 315,
"ymin": 597,
"xmax": 463,
"ymax": 1017
}
},
{
"score": 0.9977328777313232,
"label": "person",
"box": {
"xmin": 94,
"ymin": 594,
"xmax": 283,
"ymax": 1055
}
},
{
"score": 0.9985538125038147,
"label": "person",
"box": {
"xmin": 431,
"ymin": 464,
"xmax": 1017,
"ymax": 1758
}
},
{
"score": 0.9157671928405762,
"label": "person",
"box": {
"xmin": 514,
"ymin": 721,
"xmax": 567,
"ymax": 853
}
},
{
"score": 0.9396088719367981,
"label": "person",
"box": {
"xmin": 1375,
"ymin": 774,
"xmax": 1440,
"ymax": 940
}
},
{
"score": 0.9938980937004089,
"label": "person",
"box": {
"xmin": 914,
"ymin": 663,
"xmax": 995,
"ymax": 851
}
},
{
"score": 0.9829141497612,
"label": "person",
"box": {
"xmin": 865,
"ymin": 680,
"xmax": 929,
"ymax": 814
}
},
{
"score": 0.9993380904197693,
"label": "person",
"box": {
"xmin": 979,
"ymin": 634,
"xmax": 1120,
"ymax": 1001
}
}
]
</pre>
</details>

## Image 4

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.5473794937133789,
"label": "bow, bowknot"
},
{
"score": 0.2602613866329193,
"label": "rib"
},
{
"score": 0.02672475017607212,
"label": "gift_wrapping"
},
{
"score": 0.010764000937342644,
"label": "package, parcel"
},
{
"score": 0.00281360256485641,
"label": "wraparound"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[]
</pre>
</details>

## Image 5

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.15340560674667358,
"label": "mountain_bike, all-terrain_bike, off-roader"
},
{
"score": 0.14019626379013062,
"label": "bicycling"
},
{
"score": 0.0887056514620781,
"label": "dune_cycling"
},
{
"score": 0.05705874413251877,
"label": "safety_belt, life_belt, safety_harness"
},
{
"score": 0.03170625492930412,
"label": "rhymer, rhymester, versifier, poetizer, poetiser"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.997163712978363,
"label": "person",
"box": {
"xmin": 594,
"ymin": 288,
"xmax": 949,
"ymax": 694
}
},
{
"score": 0.9979368448257446,
"label": "bicycle",
"box": {
"xmin": 528,
"ymin": 446,
"xmax": 1108,
"ymax": 814
}
}
]
</pre>
</details>

## Image 6

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.2950187623500824,
"label": "call_forwarding"
},
{
"score": 0.12219228595495224,
"label": "voice_mail, voicemail"
},
{
"score": 0.10082340240478516,
"label": "telephone, telephony"
},
{
"score": 0.05075190216302872,
"label": "cadet, plebe"
},
{
"score": 0.03081812709569931,
"label": "collect_call"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.998989999294281,
"label": "person",
"box": {
"xmin": 58,
"ymin": 927,
"xmax": 1210,
"ymax": 2040
}
}
]
</pre>
</details>

## Image 7

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.051966048777103424,
"label": "pile_driver"
},
{
"score": 0.04113095998764038,
"label": "B-complex_vitamin, B_complex, vitamin_B_complex, vitamin_B, B_vitamin, B"
},
{
"score": 0.036562610417604446,
"label": "ice_water"
},
{
"score": 0.035076212137937546,
"label": "vitamin_B1, thiamine, thiamin, aneurin, antiberiberi_factor"
},
{
"score": 0.03246167302131653,
"label": "vitamin_K3, menadione"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[]
</pre>
</details>

## Image 8

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.1020277887582779,
"label": "yellow-leaf_sickle_pine, Falcatifolium_taxoides"
},
{
"score": 0.07703261077404022,
"label": "fir, fir_tree, true_fir"
},
{
"score": 0.057639602571725845,
"label": "she-oak"
},
{
"score": 0.0543302446603775,
"label": "arborescent_plant"
},
{
"score": 0.03553837165236473,
"label": "silver_fir"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[]
</pre>
</details>

## Image 9

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.4498935341835022,
"label": "book"
},
{
"score": 0.15459826588630676,
"label": "philodendron"
},
{
"score": 0.048068154603242874,
"label": "collection, aggregation, accumulation, assemblage"
},
{
"score": 0.026179153472185135,
"label": "green, greenness, viridity"
},
{
"score": 0.022521227598190308,
"label": "cryptocoryne, water_trumpet"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.9774452447891235,
"label": "book",
"box": {
"xmin": 404,
"ymin": 1384,
"xmax": 1073,
"ymax": 1606
}
},
{
"score": 0.9523172974586487,
"label": "book",
"box": {
"xmin": 277,
"ymin": 683,
"xmax": 896,
"ymax": 921
}
},
{
"score": 0.935616135597229,
"label": "book",
"box": {
"xmin": 401,
"ymin": 1491,
"xmax": 1081,
"ymax": 1753
}
},
{
"score": 0.9563809037208557,
"label": "book",
"box": {
"xmin": 22,
"ymin": 326,
"xmax": 342,
"ymax": 648
}
},
{
"score": 0.9457127451896667,
"label": "book",
"box": {
"xmin": 161,
"ymin": 1170,
"xmax": 1020,
"ymax": 1446
}
}
]
</pre>
</details>

## Image 10

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.5738916993141174,
"label": "imprint"
},
{
"score": 0.26790598034858704,
"label": "spit, tongue"
},
{
"score": 0.02013584040105343,
"label": "riparian_forest"
},
{
"score": 0.012678979896008968,
"label": "ridge_tile"
},
{
"score": 0.0050319829024374485,
"label": "drumlin"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[]
</pre>
</details>

## Image 11

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.24498172104358673,
"label": "fatigues"
},
{
"score": 0.11273926496505737,
"label": "battle_dress"
},
{
"score": 0.04571410268545151,
"label": "sangoma"
},
{
"score": 0.03706562891602516,
"label": "first_lieutenant, 1st_lieutenant"
},
{
"score": 0.036624155938625336,
"label": "licentiate"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.9995110034942627,
"label": "person",
"box": {
"xmin": 25,
"ymin": 580,
"xmax": 1148,
"ymax": 2048
}
}
]
</pre>
</details>

## Image 12

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.10919874906539917,
"label": "pill_bottle"
},
{
"score": 0.08866381645202637,
"label": "ski_boot"
},
{
"score": 0.08700862526893616,
"label": "hat, chapeau, lid"
},
{
"score": 0.050055038183927536,
"label": "cloche"
},
{
"score": 0.04304906725883484,
"label": "beanie, beany"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.99952232837677,
"label": "person",
"box": {
"xmin": 0,
"ymin": 11,
"xmax": 1283,
"ymax": 2263
}
}
]
</pre>
</details>

## Image 13

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.1646043062210083,
"label": "sweat_pants, sweatpants"
},
{
"score": 0.09391571581363678,
"label": "long_sleeve"
},
{
"score": 0.05163830146193504,
"label": "web_site, website, internet_site, site"
},
{
"score": 0.05139746144413948,
"label": "sleeping_car, sleeper, wagon-lit"
},
{
"score": 0.04919322952628136,
"label": "grey, gray"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.9963856935501099,
"label": "sports ball",
"box": {
"xmin": 968,
"ymin": 331,
"xmax": 1042,
"ymax": 411
}
},
{
"score": 0.9982948899269104,
"label": "person",
"box": {
"xmin": 270,
"ymin": 559,
"xmax": 975,
"ymax": 1772
}
}
]
</pre>
</details>

## Image 14

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.19194857776165009,
"label": "Black, Black_person, blackamoor, Negro, Negroid"
},
{
"score": 0.07137732207775116,
"label": "hot_pants"
},
{
"score": 0.07008359581232071,
"label": "wrongdoer, offender"
},
{
"score": 0.061084289103746414,
"label": "Andorran"
},
{
"score": 0.026485782116651535,
"label": "Scandinavian, Norse, Northman"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.9905648231506348,
"label": "person",
"box": {
"xmin": 16,
"ymin": 73,
"xmax": 963,
"ymax": 1895
}
}
]
</pre>
</details>

## Image 15

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.04893031716346741,
"label": "planter"
},
{
"score": 0.04559663310647011,
"label": "cellist, violoncellist"
},
{
"score": 0.03605553135275841,
"label": "third_rail"
},
{
"score": 0.024815652519464493,
"label": "brassiere, bra, bandeau"
},
{
"score": 0.023524468764662743,
"label": "foundation_garment, foundation"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.9935477375984192,
"label": "sports ball",
"box": {
"xmin": 976,
"ymin": 193,
"xmax": 1034,
"ymax": 250
}
},
{
"score": 0.9993860721588135,
"label": "person",
"box": {
"xmin": 81,
"ymin": 483,
"xmax": 1022,
"ymax": 1571
}
}
]
</pre>
</details>

## Image 16

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.0881146639585495,
"label": "ginger_ale, ginger_pop"
},
{
"score": 0.055923692882061005,
"label": "pile_driver"
},
{
"score": 0.04174800217151642,
"label": "complexion, skin_color, skin_colour"
},
{
"score": 0.032528575509786606,
"label": "courtier"
},
{
"score": 0.025789018720388412,
"label": "babu, baboo"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.9992997646331787,
"label": "bottle",
"box": {
"xmin": 0,
"ymin": 406,
"xmax": 663,
"ymax": 1276
}
},
{
"score": 0.9984581470489502,
"label": "person",
"box": {
"xmin": 1,
"ymin": 362,
"xmax": 1281,
"ymax": 2251
}
}
]
</pre>
</details>

## Image 17

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.11748626828193665,
"label": "gum_ball"
},
{
"score": 0.06464188545942307,
"label": "crevice, cranny, crack, fissure, chap"
},
{
"score": 0.028064390644431114,
"label": "Hakham"
},
{
"score": 0.02634829469025135,
"label": "neon_lamp, neon_induction_lamp, neon_tube"
},
{
"score": 0.02446410059928894,
"label": "glow_tube"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.9458110332489014,
"label": "person",
"box": {
"xmin": 188,
"ymin": 914,
"xmax": 518,
"ymax": 1310
}
}
]
</pre>
</details>

## Image 18

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.4500826597213745,
"label": "loop"
},
{
"score": 0.038537003099918365,
"label": "coil, spiral, volute, whorl, helix"
},
{
"score": 0.03499343618750572,
"label": "maze, labyrinth"
},
{
"score": 0.032819539308547974,
"label": "funnel, funnel_shape"
},
{
"score": 0.027387460693717003,
"label": "trireme"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[]
</pre>
</details>

## Image 19

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.06875976920127869,
"label": "chocolate_milk"
},
{
"score": 0.04325872287154198,
"label": "Red_Delicious"
},
{
"score": 0.040120914578437805,
"label": "vinegar, acetum"
},
{
"score": 0.0395379401743412,
"label": "Japanese_banana, Musa_basjoo"
},
{
"score": 0.03130943700671196,
"label": "conserve, preserve, conserves, preserves"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.9981312155723572,
"label": "apple",
"box": {
"xmin": 462,
"ymin": 461,
"xmax": 835,
"ymax": 907
}
},
{
"score": 0.9967857599258423,
"label": "banana",
"box": {
"xmin": 0,
"ymin": 832,
"xmax": 456,
"ymax": 1747
}
},
{
"score": 0.9837309122085571,
"label": "bottle",
"box": {
"xmin": 760,
"ymin": 615,
"xmax": 1098,
"ymax": 1763
}
}
]
</pre>
</details>

## Image 20

### Results
- microsoft/beit-base-patch16-224-pt22k-ft22k
<details>
<summary>Raw output</summary>
<pre>
[
{
"score": 0.8516464829444885,
"label": "reckoner, ready_reckoner"
},
{
"score": 0.04170207679271698,
"label": "vehicle"
},
{
"score": 0.030337227508425713,
"label": "lemon"
},
{
"score": 0.017466070130467415,
"label": "lodestone, loadstone"
},
{
"score": 0.004754251800477505,
"label": "envelope"
}
]
</pre>
</details>

- facebook/detr-resnet-50
<details>
<summary>Raw output</summary>
<pre>
[]
</pre>
</details>