refactor

2026-02-10 19:07:55 +03:00 · 2025-03-11 18:35:21 -04:00
parent f5e44f12e1
commit ec0fa4d52b
22 changed files with 132 additions and 105 deletions
--- a/machine-learning/export/onnx/Dockerfile
+++ b/machine-learning/export/onnx/Dockerfile
--- a/machine-learning/export/onnx/conda-lock.yml
+++ b/machine-learning/export/onnx/conda-lock.yml
--- a/machine-learning/export/onnx/env.dev.yaml
+++ b/machine-learning/export/onnx/env.dev.yaml
--- a/machine-learning/export/onnx/env.yaml
+++ b/machine-learning/export/onnx/env.yaml
--- a/machine-learning/export/onnx/models/init.py
+++ b/machine-learning/export/onnx/models/init.py
--- a/machine-learning/export/onnx/models/mclip.py
+++ b/machine-learning/export/onnx/models/mclip.py
--- a/machine-learning/export/onnx/models/openclip.py
+++ b/machine-learning/export/onnx/models/openclip.py
--- a/machine-learning/export/onnx/models/optimize.py
+++ b/machine-learning/export/onnx/models/optimize.py
--- a/machine-learning/export/onnx/models/util.py
+++ b/machine-learning/export/onnx/models/util.py
--- a/machine-learning/export/onnx/run.py
+++ b/machine-learning/export/onnx/run.py
--- a/machine-learning/export/rknpu/ViT-B-32__openai/README.md
+++ b/machine-learning/export/rknpu/ViT-B-32__openai/README.md
@@ -0,0 +1,11 @@
+---
+tags:
+ - immich
+ - clip
+---
+# Model Description
+
+This repo contains ONNX exports for the CLIP model [openai/clip-vit-base-patch32](https://huggingface.co/openai/clip-vit-base-patch32). 
+It splits the visual and textual encoders into separate models for generating image and text embeddings.
+
+This repo is specifically intended for use with [Immich](https://immich.app/), a self-hosted photo library.
--- a/machine-learning/export/rknpu/build_rknn.py
+++ b/machine-learning/export/rknpu/build_rknn.py
@@ -0,0 +1,69 @@
+import argparse
+from pathlib import Path
+
+from rknn.api import RKNN
+
+parser = argparse.ArgumentParser("ONNX to RKNN model converter")
+parser.add_argument(
+    "model", help="Directory of the model that will be exported to RKNN ex:ViT-B-32__openai.", type=Path
+)
+parser.add_argument("target_platform", help="target platform ex:rk3566", type=str)
+args = parser.parse_args()
+
+
+def ConvertModel(model_dir: Path, target_platform: str, dynamic_input=None):
+    input_path = model_dir / "model.onnx"
+    print(f"Converting model {input_path}")
+    rknn = RKNN(verbose=False)
+
+    rknn.config(
+        target_platform=target_platform,
+        dynamic_input=dynamic_input,
+        enable_flash_attention=True,
+        # remove_reshape=True,
+        # model_pruning=True
+    )
+    ret = rknn.load_onnx(model=input_path.as_posix())
+
+    if ret != 0:
+        print("Load failed!")
+        exit(ret)
+
+    ret = rknn.build(do_quantization=False)
+
+    if ret != 0:
+        print("Build failed!")
+        exit(ret)
+
+    output_path = model_dir / "rknpu" / target_platform / "model.rknn"
+    output_path.parent.mkdir(parents=True, exist_ok=True)
+    print(f"Exporting model {model_dir} to {output_path}")
+    ret = rknn.export_rknn(output_path.as_posix())
+    if ret != 0:
+        print("Export rknn model failed!")
+        exit(ret)
+
+
+textual = args.model / "textual"
+visual = args.model / "visual"
+detection = args.model / "detection"
+recognition = args.model / "recognition"
+
+is_dir = [textual.is_dir(), visual.is_dir(), detection.is_dir(), recognition.is_dir()]
+if not any(is_dir):
+    print("Unknown model")
+    exit(1)
+
+is_textual, is_visual, is_detection, is_recognition = is_dir
+
+if is_textual:
+    ConvertModel(textual, target_platform=args.target_platform)
+
+if is_visual:
+    ConvertModel(visual, target_platform=args.target_platform)
+
+if is_detection:
+    ConvertModel(detection, args.target_platform, [[[1, 3, 640, 640]]])
+
+if is_recognition:
+    ConvertModel(recognition, args.target_platform, [[[1, 3, 112, 112]]])
--- a/machine-learning/export/rknpu/convert.sh
+++ b/machine-learning/export/rknpu/convert.sh
@@ -0,0 +1,13 @@
+#!/bin/bash
+
+python3 build_rknn.py "$1" "$2" > immich_to_rknn2.log
+
+# if "No lowering found for" found in log file, return error status 1
+if grep -q "No lowering found for" immich_to_rknn2.log; then
+    echo -e "\e[31mSome operations are not supported by RKNN, please check the log file for details.\e[0m"
+    exit 1
+else
+    echo -e "\e[32mConversion completed successfully.\e[0m"
+    rm immich_to_rknn2.log
+    exit 0
+fi
--- a/machine-learning/export/rknpu/requirements.txt
+++ b/machine-learning/export/rknpu/requirements.txt
@@ -0,0 +1 @@
+rknn-toolkit2==2.3.0