Correctly calculate input data type for OV (#20066)

* Correctly calculate input data type for OV * Formatting
2025-09-14 17:52:10 +02:00 · 2025-09-14 07:15:41 -06:00 · 2025-09-14 07:15:41 -06:00 · ff0430964c
commit ff0430964c
parent c74e86dff2
2 changed files with 38 additions and 12 deletions
--- a/frigate/detectors/detection_runners.py
+++ b/frigate/detectors/detection_runners.py
@ -149,7 +149,8 @@ class OpenVINOModelRunner(BaseModelRunner):
        # Create reusable inference request
        self.infer_request = self.compiled_model.create_infer_request()
        input_shape = self.compiled_model.inputs[0].get_shape()
-        self.input_tensor = ov.Tensor(ov.Type.f32, input_shape)
+        input_element_type = self.compiled_model.inputs[0].get_element_type()
        self.input_tensor = ov.Tensor(input_element_type, input_shape)
    def get_input_names(self) -> list[str]:
        """Get input names for the model."""
@ -161,20 +162,44 @@ class OpenVINOModelRunner(BaseModelRunner):
        # Assuming NCHW format, width is the last dimension
        return int(input_shape[-1])
-    def run(self, input_data: np.ndarray) -> list[np.ndarray]:
+    def run(self, inputs: dict[str, Any]) -> list[np.ndarray]:
        """Run inference with the model.
        Args:
-            input_data: Input tensor data
+            inputs: Dictionary mapping input names to input data
        Returns:
            List of output tensors
        """
-        # Copy input data to pre-allocated tensor
+        # Handle single input case for backward compatibility
-        np.copyto(self.input_tensor.data, input_data)
+        if len(inputs) == 1 and len(self.compiled_model.inputs) == 1:
            # Single input case - use the pre-allocated tensor for efficiency
            input_data = list(inputs.values())[0]
            np.copyto(self.input_tensor.data, input_data)
            self.infer_request.infer(self.input_tensor)
        else:
            # Multiple inputs case - set each input by name
            for input_name, input_data in inputs.items():
                # Find the input by name
                input_port = None
                for port in self.compiled_model.inputs:
                    if port.get_any_name() == input_name:
                        input_port = port
                        break
-        # Run inference
+                if input_port is None:
-        self.infer_request.infer(self.input_tensor)
+                    raise ValueError(f"Input '{input_name}' not found in model")
                # Create tensor with the correct element type
                input_element_type = input_port.get_element_type()
                input_tensor = ov.Tensor(input_element_type, input_data.shape)
                np.copyto(input_tensor.data, input_data)
                # Set the input tensor
                self.infer_request.set_input_tensor(input_tensor)
            # Run inference
            self.infer_request.infer()
        # Get all output tensors
        outputs = []
--- a/frigate/detectors/plugins/openvino.py
+++ b/frigate/detectors/plugins/openvino.py
@ -141,16 +141,17 @@ class OvDetector(DetectionApi):
                "images": tensor_input,
                "orig_target_sizes": np.array([[self.h, self.w]], dtype=np.int64),
            }
-            outputs = self.runner.run_with_named_inputs(inputs)
+            outputs = self.runner.run(inputs)
            tensor_output = (
-                outputs["output0"],
+                outputs[0],
-                outputs["output1"],
+                outputs[1],
-                outputs["output2"],
+                outputs[2],
            )
            return post_process_dfine(tensor_output, self.w, self.h)
        # Run inference using the runner
-        outputs = self.runner.run(tensor_input)
+        input_name = self.runner.get_input_names()[0]
        outputs = self.runner.run({input_name: tensor_input})
        detections = np.zeros((20, 6), np.float32)