"input_tensor": [[[ [0.23, 0.25, 0.26, ...], [0.22, 0.24, 0.26, ...], ...], ...]], "shape": [1, 3, 640, 640 ], "dtype": "float32", "normalized": true } # output { "image": "image_01.jpg", "detections": [ { "class_id": 0, "class_name": "person", "confidence": 0.87, "bbox_xywh": [233.0, 328.5, 242.0, 567.0] } ] }