mirror of
				https://github.com/immich-app/immich.git
				synced 2025-10-25 15:52:33 -04:00 
			
		
		
		
	
		
			
				
	
	
		
			68 lines
		
	
	
		
			2.3 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			68 lines
		
	
	
		
			2.3 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| from typing import Any
 | |
| 
 | |
| from aiocache.backends.memory import SimpleMemoryCache
 | |
| from aiocache.lock import OptimisticLock
 | |
| from aiocache.plugins import TimingPlugin
 | |
| 
 | |
| from app.models import from_model_type
 | |
| 
 | |
| from ..schemas import ModelType, has_profiling
 | |
| from .base import InferenceModel
 | |
| 
 | |
| 
 | |
class ModelCache:
    """In-memory store of inference models that builds a model the first time it is requested."""

    def __init__(
        self,
        revalidate: bool = False,
        timeout: int | None = None,
        profiling: bool = False,
    ) -> None:
        """
        Args:
            revalidate: When True, a cache hit refreshes the entry's TTL so models in active use stay in memory.
                Defaults to False.
            timeout: Timeout handed to the underlying cache. Disabled if None. Defaults to None.
            profiling: When True, attaches a TimingPlugin to the cache to collect metrics for cache operations,
                adding slight overhead. Defaults to False.
        """

        self.revalidate_enable = revalidate
        self.cache = SimpleMemoryCache(
            timeout=timeout,
            plugins=[TimingPlugin()] if profiling else [],
            namespace=None,
        )

    async def get(self, model_name: str, model_type: ModelType, **model_kwargs: Any) -> InferenceModel:
        """
        Args:
            model_name: Name of model in the model hub used for the task.
            model_type: Model type or task, which determines which model zoo is used.
            **model_kwargs: Forwarded to the model factory on a cache miss. The optional `mode` entry is part
                of the cache key, and the optional `ttl` entry is the expiry applied to the cached model.

        Returns:
            model: The requested model.
        """

        mode = model_kwargs.get("mode", "")
        ttl = model_kwargs.get("ttl", None)
        key = f"{model_name}{model_type.value}{mode}"

        async with OptimisticLock(self.cache, key) as lock:
            model: InferenceModel | None = await self.cache.get(key)
            if model is not None:
                # Cache hit: optionally push the expiry back so an active model is not evicted.
                if self.revalidate_enable:
                    await self.revalidate(key, ttl)
            else:
                # Cache miss: build the model and store it through the lock.
                model = from_model_type(model_type, model_name, **model_kwargs)
                await lock.cas(model, ttl=ttl)
        return model

    async def get_profiling(self) -> dict[str, float] | None:
        """Returns the cache's profiling data, or None when `has_profiling` reports the cache has none."""

        return self.cache.profiling if has_profiling(self.cache) else None

    async def revalidate(self, key: str, ttl: int | None) -> None:
        """
        Resets the expiry of `key` to `ttl`.

        Does nothing when `ttl` is None or when `key` is absent from the cache's `_handlers` mapping
        (presumably the registry of entries that currently have an expiry scheduled; confirm against aiocache).
        """

        if ttl is None or key not in self.cache._handlers:
            return
        await self.cache.expire(key, ttl)
 |