{
  "routes": [
    "GET /:type/:os/:runtime   — model file URLs (type = video|image)",
    "GET /runtimes             — list all runtime keys"
  ],
  "queryParams": {
    "compute": "(int or SM-version) GPU compute — e.g. 806 or combined 806-10800 (matches model capabilities)",
    "tensorrt_version": "(string) TensorRT version — optional if compute includes it or OS map applies"
  },
  "examples": [
    "/video/linux/onnx",
    "/video/linux/onnx16",
    "/video/mac/coreml",
    "/video/windows/tensorrt?compute=809",
    "/video/linux/openvino",
    "/image/windows/onnx",
    "/image/windows/onnx16",
    "/image/mac/coreml",
    "/image/windows/openvino",
    "/image/windows/openvino16",
    "/image/windows/onnx_qnn",
    "/image/linux/tensorrt?compute=809&tensorrt_version=10800",
    "/image/windows/tensorrt?compute=806-10800"
  ]
}