Add support for RF-DETR models (#17298)

* Add support for rf-detr models * Add docs for rf-detr model * Cleanup
2025-10-27 10:52:11 +01:00 · 2025-03-21 18:55:46 -06:00 · 2025-03-21 18:55:46 -06:00 · 48e4c44b32
commit 48e4c44b32
parent 4e83237d47
4 changed files with 97 additions and 5 deletions
--- a/docs/docs/configuration/object_detectors.md
+++ b/docs/docs/configuration/object_detectors.md
@ -342,7 +342,7 @@ Note that the labelmap uses a subset of the complete COCO label set that has onl
 #### D-FINE
-[D-FINE](https://github.com/Peterande/D-FINE) is the [current state of the art](https://paperswithcode.com/sota/real-time-object-detection-on-coco?p=d-fine-redefine-regression-task-in-detrs-as) at the time of writing. The ONNX exported models are supported, but not included by default. See [the models section](#downloading-d-fine-model) for more information on downloading the D-FINE model for use in Frigate.
+[D-FINE](https://github.com/Peterande/D-FINE) is a DETR based model. The ONNX exported models are supported, but not included by default. See [the models section](#downloading-d-fine-model) for more information on downloading the D-FINE model for use in Frigate.
 After placing the downloaded onnx model in your config/model_cache folder, you can use the following configuration:
@ -647,9 +647,29 @@ model:
 Note that the labelmap uses a subset of the complete COCO label set that has only 80 objects.
 #### RF-DETR
 [RF-DETR](https://github.com/roboflow/rf-detr) is a DETR-based model. The ONNX exported models are supported, but not included by default. See [the models section](#downloading-rf-detr-model) for more information on downloading the RF-DETR model for use in Frigate.
 After placing the downloaded onnx model in your `config/model_cache` folder, you can use the following configuration:
 ```
 detectors:
  onnx:
    type: onnx
 model:
  model_type: rfdetr
  width: 560
  height: 560
  input_tensor: nchw
  input_dtype: float
  path: /config/model_cache/rfdetr.onnx
 ```
 #### D-FINE
-[D-FINE](https://github.com/Peterande/D-FINE) is the [current state of the art](https://paperswithcode.com/sota/real-time-object-detection-on-coco?p=d-fine-redefine-regression-task-in-detrs-as) at the time of writing. The ONNX exported models are supported, but not included by default. See [the models section](#downloading-d-fine-model) for more information on downloading the D-FINE model for use in Frigate.
+[D-FINE](https://github.com/Peterande/D-FINE) is a DETR based model. The ONNX exported models are supported, but not included by default. See [the models section](#downloading-d-fine-model) for more information on downloading the D-FINE model for use in Frigate.
 After placing the downloaded onnx model in your config/model_cache folder, you can use the following configuration:
@ -873,6 +893,16 @@ Make sure you change the batch size to 1 before exporting.
 :::
 ### Downloading RF-DETR Model
 To export as ONNX:
 1. `pip3 install rfdetr`
 2. `python`
 3. `from rfdetr import RFDETRBase`
 4. `x = RFDETRBase()`
 5. `x.export()`
 ### Downloading YOLO-NAS Model
 You can build and download a compatible model with pre-trained weights using [this notebook](https://github.com/blakeblackshear/frigate/blob/dev/notebooks/YOLO_NAS_Pretrained_Export.ipynb) [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/blakeblackshear/frigate/blob/dev/notebooks/YOLO_NAS_Pretrained_Export.ipynb).
--- a/frigate/detectors/detector_config.py
+++ b/frigate/detectors/detector_config.py
@ -33,11 +33,12 @@ class InputDTypeEnum(str, Enum):
 class ModelTypeEnum(str, Enum):
     """Identifiers of the model architectures a detector can be configured with.

     The ``str`` mixin makes every member compare equal to its raw string
     value, so values read from configuration can be matched directly.

     Each member name is declared exactly once: ``Enum`` raises ``TypeError``
     at class-creation time when a name is reused.
     """

     dfine = "dfine"
     rfdetr = "rfdetr"
     ssd = "ssd"
     yolox = "yolox"
     yolov9 = "yolov9"
     yolonas = "yolonas"
     yologeneric = "yolo-generic"
--- a/frigate/detectors/plugins/onnx.py
+++ b/frigate/detectors/plugins/onnx.py
@ -12,6 +12,7 @@ from frigate.detectors.detector_config import (
 from frigate.util.model import (
    get_ort_providers,
    post_process_dfine,
    post_process_rfdetr,
    post_process_yolov9,
 )
@ -73,7 +74,9 @@ class ONNXDetector(DetectionApi):
        model_input_name = self.model.get_inputs()[0].name
        tensor_output = self.model.run(None, {model_input_name: tensor_input})
-        if self.onnx_model_type == ModelTypeEnum.yolonas:
+        if self.onnx_model_type == ModelTypeEnum.rfdetr:
            return post_process_rfdetr(tensor_output)
        elif self.onnx_model_type == ModelTypeEnum.yolonas:
            predictions = tensor_output[0]
            detections = np.zeros((20, 6), np.float32)
--- a/frigate/util/model.py
+++ b/frigate/util/model.py
@ -13,7 +13,11 @@ logger = logging.getLogger(__name__)
 ### Post Processing
-def post_process_dfine(tensor_output: np.ndarray, width, height) -> np.ndarray:
+
 def post_process_dfine(
    tensor_output: np.ndarray, width: int, height: int
 ) -> np.ndarray:
    class_ids = tensor_output[0][tensor_output[2] > 0.4]
    boxes = tensor_output[1][tensor_output[2] > 0.4]
    scores = tensor_output[2][tensor_output[2] > 0.4]
@ -41,6 +45,60 @@ def post_process_dfine(tensor_output: np.ndarray, width, height) -> np.ndarray:
    return detections
 def post_process_rfdetr(tensor_output: list[np.ndarray, np.ndarray]) -> np.ndarray:
     """Turn raw RF-DETR outputs into a fixed-size ``(20, 6)`` detection array.

     Args:
         tensor_output: Model outputs. Index 0 holds the boxes as
             ``[x_center, y_center, width, height]`` and index 1 holds the
             raw per-class scores. Only the first batch entry is read.

     Returns:
         A ``float32`` array of shape ``(20, 6)``. Every populated row is
         ``[class_id, confidence, y_min, x_min, y_max, x_max]``; rows that
         are not populated stay zero.
     """
     boxes = tensor_output[0]
     raw_scores = tensor_output[1]
     detections = np.zeros((20, 6), np.float32)

     # softmax over the class axis; subtracting the max keeps exp() stable
     exp = np.exp(raw_scores - np.max(raw_scores, axis=-1, keepdims=True))
     all_scores = exp / np.sum(exp, axis=-1, keepdims=True)

     # best class per detection, ignoring class index 0
     # NOTE(review): index 0 is presumably a background / no-object slot - confirm
     class_scores = all_scores[0, :, 1:]
     scores = np.max(class_scores, axis=-1)
     labels = np.argmax(class_scores, axis=-1)

     keep = scores > 0.4

     # nothing passed the threshold: skip NMS and return the empty result
     if not np.any(keep):
         return detections

     filtered_boxes = boxes[0, keep]
     filtered_scores = scores[keep]
     filtered_labels = labels[keep]

     # convert boxes from [x_center, y_center, width, height] to corners
     x_center, y_center, w, h = (
         filtered_boxes[:, 0],
         filtered_boxes[:, 1],
         filtered_boxes[:, 2],
         filtered_boxes[:, 3],
     )
     x_min = x_center - w / 2
     y_min = y_center - h / 2
     x_max = x_center + w / 2
     y_max = y_center + h / 2
     corner_boxes = np.stack([x_min, y_min, x_max, y_max], axis=-1)

     # cv2.dnn.NMSBoxes takes rectangles as [x, y, width, height] (top-left
     # origin), so it must not be given the corner representation
     nms_boxes = np.stack([x_min, y_min, w, h], axis=-1)
     indices = cv2.dnn.NMSBoxes(
         nms_boxes, filtered_scores, score_threshold=0.4, nms_threshold=0.4
     )

     # the result may come back as an empty tuple or an (N, 1) array depending
     # on the OpenCV version; normalise to a flat index array, capped at 20
     indices = np.asarray(indices, dtype=int).reshape(-1)[:20]
     count = len(indices)

     detections[:count, 0] = filtered_labels[indices]
     detections[:count, 1] = filtered_scores[indices]
     # output order is y_min, x_min, y_max, x_max
     detections[:count, 2:] = corner_boxes[indices][:, [1, 0, 3, 2]]

     return detections
 def post_process_yolov9(predictions: np.ndarray, width, height) -> np.ndarray:
    predictions = np.squeeze(predictions).T
    scores = np.max(predictions[:, 4:], axis=1)