2024-01-26 02:26:27 +02:00
|
|
|
import concurrent.futures
|
2023-08-30 10:22:01 +02:00
|
|
|
import logging
|
2023-08-25 06:28:51 +02:00
|
|
|
import os
|
2023-12-14 21:51:24 +02:00
|
|
|
import sys
|
2023-06-25 05:18:09 +02:00
|
|
|
from pathlib import Path
|
2023-12-14 21:51:24 +02:00
|
|
|
from socket import socket
|
2023-06-25 05:18:09 +02:00
|
|
|
|
2023-12-14 21:51:24 +02:00
|
|
|
from gunicorn.arbiter import Arbiter
|
2023-06-18 05:49:19 +02:00
|
|
|
from pydantic import BaseSettings
|
2023-08-30 10:22:01 +02:00
|
|
|
from rich.console import Console
|
|
|
|
from rich.logging import RichHandler
|
2023-12-14 21:51:24 +02:00
|
|
|
from uvicorn import Server
|
|
|
|
from uvicorn.workers import UvicornWorker
|
2023-06-18 05:49:19 +02:00
|
|
|
|
2023-06-25 05:18:09 +02:00
|
|
|
from .schemas import ModelType
|
|
|
|
|
|
|
|
|
2023-06-18 05:49:19 +02:00
|
|
|
class Settings(BaseSettings):
    """Machine-learning service configuration.

    Values are read from the environment with the ``MACHINE_LEARNING_``
    prefix (see inner ``Config``), falling back to the defaults below.
    """

    # Directory where downloaded model files are stored.
    cache_folder: str = "/cache"
    # Seconds an idle model stays loaded before being evicted.
    model_ttl: int = 300
    # Polling interval (seconds) for the TTL eviction check.
    model_ttl_poll_s: int = 10
    # Bind address and port for the HTTP server.
    host: str = "0.0.0.0"
    port: int = 3003
    workers: int = 1
    # When true, test runs exercise the full (slow) code paths.
    test_full: bool = False
    # Thread pool size for request handling; os.cpu_count() can return
    # None, in which case we fall back to 4.
    request_threads: int = os.cpu_count() or 4
    # ONNX Runtime threading knobs; 0 lets the runtime choose.
    model_inter_op_threads: int = 0
    model_intra_op_threads: int = 0
    # Enable ARM NN acceleration where available.
    ann: bool = True

    class Config:
        # Environment variables are read as e.g. MACHINE_LEARNING_PORT.
        env_prefix = "MACHINE_LEARNING_"
        case_sensitive = False
|
|
|
|
|
|
|
|
|
2023-08-30 10:22:01 +02:00
|
|
|
class LogSettings(BaseSettings):
    """Logging configuration, read from unprefixed environment variables.

    Unlike ``Settings``, there is no env prefix, so the variables are
    ``LOG_LEVEL`` and ``NO_COLOR``.
    """

    # Name of the minimum level to emit; resolved via LOG_LEVELS below
    # (case-insensitive, unknown values fall back to "info").
    log_level: str = "info"
    # Disable ANSI colors in console output.
    no_color: bool = False

    class Config:
        case_sensitive = False
|
|
|
|
|
|
|
|
|
2023-08-25 06:28:51 +02:00
|
|
|
_clean_name = str.maketrans(":\\/", "___", ".")
|
|
|
|
|
|
|
|
|
2023-11-12 03:04:49 +02:00
|
|
|
def clean_name(model_name: str) -> str:
    """Return a filesystem-safe version of *model_name*.

    Keeps only the final path segment (text after the last "/") and
    sanitizes it via the module-level ``_clean_name`` table.
    """
    _, _, basename = model_name.rpartition("/")
    return basename.translate(_clean_name)
|
|
|
|
|
|
|
|
|
2023-06-25 05:18:09 +02:00
|
|
|
def get_cache_dir(model_name: str, model_type: ModelType) -> Path:
    """Return the on-disk cache directory for a model of the given type."""
    base = Path(settings.cache_folder)
    return base / model_type.value / clean_name(model_name)
|
|
|
|
|
|
|
|
|
|
|
|
def get_hf_model_name(model_name: str) -> str:
    """Return the Hugging Face repo id mirroring this model under immich-app."""
    return "immich-app/" + clean_name(model_name)
|
2023-06-25 05:18:09 +02:00
|
|
|
|
|
|
|
|
2023-08-30 10:22:01 +02:00
|
|
|
# Map of accepted LOG_LEVEL names (lowercase) to stdlib logging levels.
# Includes common aliases ("warn", "log", "verbose") so values from other
# ecosystems still resolve.
LOG_LEVELS: dict[str, int] = {
    # Fixed: "critical" previously mapped to logging.ERROR (40), which made
    # a "critical" setting still emit error-level records; CRITICAL is 50.
    "critical": logging.CRITICAL,
    "error": logging.ERROR,
    "warning": logging.WARNING,
    "warn": logging.WARNING,
    "info": logging.INFO,
    "log": logging.INFO,
    "debug": logging.DEBUG,
    "verbose": logging.DEBUG,
}
|
|
|
|
|
2023-06-18 05:49:19 +02:00
|
|
|
# Module-level singletons: settings are read from the environment once at
# import time and shared by the rest of the service.
settings = Settings()
log_settings = LogSettings()

# Resolve the configured level name case-insensitively; unknown names fall
# back to INFO rather than raising.
LOG_LEVEL = LOG_LEVELS.get(log_settings.log_level.lower(), logging.INFO)
|
|
|
|
|
2023-09-01 01:30:53 +02:00
|
|
|
|
|
|
|
class CustomRichHandler(RichHandler):
    """RichHandler preconfigured for this service's console output.

    Uses a standard-color console (honoring the NO_COLOR setting), enables
    rich tracebacks, and suppresses frames from the web-framework modules
    listed in ``self.excluded``.
    """

    def __init__(self) -> None:
        console = Console(color_system="standard", no_color=log_settings.no_color)
        # Module-name substrings whose frames are hidden from tracebacks.
        self.excluded = ["uvicorn", "starlette", "fastapi"]
        super().__init__(
            show_path=False,
            omit_repeated_times=False,
            console=console,
            rich_tracebacks=True,
            # concurrent.futures frames are also noise in async stacks.
            tracebacks_suppress=[*self.excluded, concurrent.futures],
            # Only dump local variables when running at debug level.
            tracebacks_show_locals=LOG_LEVEL == logging.DEBUG,
        )

    # hack to exclude certain modules from rich tracebacks
    def emit(self, record: logging.LogRecord) -> None:
        """Emit a record, first tagging excluded frames for omission.

        Walks the exception traceback (if any) and plants the magic
        ``_rich_traceback_omit`` local in frames whose filename contains an
        excluded module name, which rich's traceback renderer skips.
        """
        if record.exc_info is not None:
            tb = record.exc_info[2]
            while tb is not None:
                if any(excluded in tb.tb_frame.f_code.co_filename for excluded in self.excluded):
                    tb.tb_frame.f_locals["_rich_traceback_omit"] = True
                tb = tb.tb_next

        return super().emit(record)
|
|
|
|
|
|
|
|
|
|
|
|
# Shared application logger; level comes from the LOG_LEVEL env setting.
log = logging.getLogger("ml.log")
log.setLevel(LOG_LEVEL)
|
2023-12-14 21:51:24 +02:00
|
|
|
|
|
|
|
|
|
|
|
# patches this issue https://github.com/encode/uvicorn/discussions/1803
|
|
|
|
class CustomUvicornServer(Server):
    """Uvicorn Server whose shutdown closes listener sockets explicitly.

    Works around https://github.com/encode/uvicorn/discussions/1803 by
    closing the passed-in sockets ourselves instead of forwarding them to
    the base-class shutdown.
    """

    async def shutdown(self, sockets: list[socket] | None = None) -> None:
        if sockets:
            for listener in sockets:
                listener.close()
        # Intentionally call the base shutdown without sockets; they are
        # already closed above.
        await super().shutdown()
|
|
|
|
|
|
|
|
|
|
|
|
class CustomUvicornWorker(UvicornWorker):
    """Gunicorn worker that serves the app through CustomUvicornServer.

    Mirrors UvicornWorker._serve but substitutes the patched server class
    so the socket-shutdown fix above takes effect.
    """

    async def _serve(self) -> None:
        # self.wsgi is the loaded application provided by gunicorn's
        # worker machinery — TODO confirm against the UvicornWorker base.
        self.config.app = self.wsgi
        server = CustomUvicornServer(config=self.config)
        self._install_sigquit_handler()
        await server.serve(sockets=self.sockets)
        # If the server never reached the started state, exit with
        # gunicorn's boot-error code so the arbiter handles it as a
        # failed worker boot.
        if not server.started:
            sys.exit(Arbiter.WORKER_BOOT_ERROR)
|