Unverified Commit 96c05330 authored by Martin Weinelt's avatar Martin Weinelt
Browse files

frigate: disable failing onnxruntime optimization

Recent onnxruntime versions have a failing optimization with FP16
embedding models used in Frigate.
parent da71ac00
Loading
Loading
Loading
Loading
+19 −0
Original line number Diff line number Diff line
Disable the SimplifiedLayerNormFusion optimization for onnxruntime embedding
models to prevent a crash when using FP16 models (like jina-clip-v1) with newer
onnxruntime versions.

https://github.com/microsoft/onnxruntime/issues/26717#issuecomment-3800462654


diff --git a/frigate/embeddings/onnx/runner.py b/frigate/embeddings/onnx/runner.py
index c34c97a8d..dca91daae 100644
--- a/frigate/embeddings/onnx/runner.py
+++ b/frigate/embeddings/onnx/runner.py
@@ -52,6 +52,7 @@ class ONNXModelRunner:
                 model_path,
                 providers=providers,
                 provider_options=options,
+                disabled_optimizers=["SimplifiedLayerNormFusion"],
             )
 
     def get_input_names(self) -> list[str]:
+3 −0
Original line number Diff line number Diff line
@@ -84,6 +84,7 @@ python3Packages.buildPythonApplication rec {
      hash = "sha256-1+n0n0yCtjfAHkXzsZdIF0iCVdPGmsG7l8/VTqBVEjU=";
    })
    ./ffmpeg.patch
    # https://github.com/blakeblackshear/frigate/pull/21876
    ./ai-edge-litert.patch
    (fetchpatch {
      # peewee-migrate 0.14.x compat
@@ -95,6 +96,8 @@ python3Packages.buildPythonApplication rec {
      ];
      hash = "sha256-RrmwjE4SHJIUOYfqcCtMy9Pht7UXhHcoAZlFQv9aQFw=";
    })
    # https://github.com/microsoft/onnxruntime/issues/26717
    ./onnxruntime-compat.patch
  ];

  postPatch = ''