mirror of
https://github.com/immich-app/immich.git
synced 2025-06-16 20:14:42 -04:00
58 lines
1.6 KiB
Python
58 lines
1.6 KiB
Python
from __future__ import annotations
|
|
|
|
from pathlib import Path
|
|
from typing import Any
|
|
|
|
import numpy as np
|
|
import onnxruntime as ort
|
|
from numpy.typing import NDArray
|
|
|
|
from app.schemas import SessionNode
|
|
from rknn.rknnpool import rknnPoolExecutor
|
|
|
|
from ..config import log
|
|
|
|
|
|
def runInfrence(rknn_lite, input):
|
|
outputs = rknn_lite.inference(inputs=[input], data_format="nchw")
|
|
|
|
return outputs
|
|
|
|
|
|
class RknnSession:
|
|
def __init__(self, model_path: Path | str):
|
|
self.model_path = Path(model_path)
|
|
self.ort_model_path = str(self.model_path).replace(".rknn", ".onnx")
|
|
self.tpe = 1 if "textual" in str(self.model_path) else 2
|
|
|
|
log.info(f"Loading RKNN model from {self.model_path} with {self.tpe} threads.")
|
|
self.rknnpool = rknnPoolExecutor(rknnModel=self.model_path.as_posix(), TPEs=self.tpe, func=runInfrence)
|
|
|
|
self.ort_session = ort.InferenceSession(
|
|
self.ort_model_path,
|
|
)
|
|
self.inputs = self.ort_session.get_inputs()
|
|
self.outputs = self.ort_session.get_outputs()
|
|
|
|
del self.ort_session
|
|
|
|
def __del__(self):
|
|
self.rknnpool.release()
|
|
|
|
def get_inputs(self) -> list[SessionNode]:
|
|
return self.inputs
|
|
|
|
def get_outputs(self) -> list[SessionNode]:
|
|
return self.outputs
|
|
|
|
def run(
|
|
self,
|
|
output_names: list[str] | None,
|
|
input_feed: dict[str, NDArray[np.float32]] | dict[str, NDArray[np.int32]],
|
|
run_options: Any = None,
|
|
):
|
|
input_data = [np.ascontiguousarray(v) for v in input_feed.values()][0]
|
|
self.rknnpool.put(input_data)
|
|
outputs = self.rknnpool.get()[0]
|
|
return outputs
|