chore(ml): uv ()

* poetry to uv

* update ci

* remove caching

* add typeshed to dev

* no need for `--non-interactive`

* move backends to extras

* oopsie

* update ci
Mert 2025-03-09 22:30:16 -04:00 committed by GitHub
parent 573d9a7733
commit 6da77600e5
8 changed files with 2748 additions and 3834 deletions


@@ -41,8 +41,8 @@ jobs:
         with:
           token: ${{ steps.generate-token.outputs.token }}
-      - name: Install Poetry
-        run: pipx install poetry
+      - name: Install uv
+        uses: astral-sh/setup-uv@v5
       - name: Bump version
         run: misc/release/pump-version.sh -s "${{ inputs.serverBump }}" -m "${{ inputs.mobileBump }}"
@@ -74,7 +74,7 @@ jobs:
         with:
           app-id: ${{ secrets.PUSH_O_MATIC_APP_ID }}
           private-key: ${{ secrets.PUSH_O_MATIC_APP_KEY }}
       - name: Checkout
         uses: actions/checkout@v4
         with:


@@ -380,27 +380,28 @@ jobs:
         working-directory: ./machine-learning
     steps:
       - uses: actions/checkout@v4
-      - name: Install poetry
-        run: pipx install poetry
+      - name: Install uv
+        uses: astral-sh/setup-uv@v5
       - uses: actions/setup-python@v5
-        with:
-          python-version: 3.11
-          cache: 'poetry'
+      # TODO: add caching when supported (https://github.com/actions/setup-python/pull/818)
+      # with:
+      #   python-version: 3.11
+      #   cache: 'uv'
       - name: Install dependencies
         run: |
-          poetry install --with dev --with cpu
+          uv sync --extra cpu
       - name: Lint with ruff
         run: |
-          poetry run ruff check --output-format=github app export
+          uv run ruff check --output-format=github app export
       - name: Check black formatting
         run: |
-          poetry run black --check app export
+          uv run black --check app export
       - name: Run mypy type checking
         run: |
-          poetry run mypy --install-types --non-interactive --strict app/
+          uv run mypy --strict app/
       - name: Run tests and coverage
         run: |
-          poetry run pytest app --cov=app --cov-report term-missing
+          uv run pytest app --cov=app --cov-report term-missing
   shellcheck:
     name: ShellCheck
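Read as a local workflow, the new steps above map one-to-one onto uv commands. A minimal sketch, assuming you are inside the `machine-learning` directory (flags mirror the CI lines; `--output-format=github` is only useful in CI):

```sh
uv sync --extra cpu                                    # install locked deps into .venv
uv run ruff check app export                           # lint
uv run black --check app export                        # formatting check
uv run mypy --strict app/                              # type check; stubs now come from the types group
uv run pytest app --cov=app --cov-report term-missing  # tests with coverage
```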


@@ -19,20 +19,16 @@ FROM builder-${DEVICE} AS builder
 ARG DEVICE
 ENV PYTHONDONTWRITEBYTECODE=1 \
-    PYTHONUNBUFFERED=1 \
-    PIP_NO_CACHE_DIR=true \
-    VIRTUAL_ENV="/opt/venv" \
-    PATH="/opt/venv/bin:${PATH}"
+    PYTHONUNBUFFERED=1
 WORKDIR /usr/src/app
 RUN apt-get update && apt-get install -y --no-install-recommends g++
-RUN pip install --upgrade pip && pip install poetry
-RUN poetry config installer.max-workers 10 && \
-    poetry config virtualenvs.create false
-RUN python3 -m venv /opt/venv
-COPY poetry.lock pyproject.toml ./
-RUN poetry install --sync --no-interaction --no-ansi --no-root --with ${DEVICE} --without dev
+COPY --from=ghcr.io/astral-sh/uv:latest /uv /uvx /bin/
+RUN --mount=type=cache,target=/root/.cache/uv \
+    --mount=type=bind,source=uv.lock,target=uv.lock \
+    --mount=type=bind,source=pyproject.toml,target=pyproject.toml \
+    uv sync --frozen --extra ${DEVICE} --no-dev --no-editable --no-install-project --compile-bytecode --no-progress
 FROM python:3.11-slim-bookworm@sha256:614c8691ab74150465ec9123378cd4dde7a6e57be9e558c3108df40664667a4c AS prod-cpu
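The `--mount=type=cache` and `--mount=type=bind` options in the new builder stage require BuildKit, so the bind mounts replace the old `COPY poetry.lock pyproject.toml` step and the uv download cache survives across builds. A sketch of a build that exercises them (the `immich-ml:dev` tag is a placeholder; `DEVICE` selects which extra uv installs, per the pyproject below):

```sh
# Build the CPU variant; cuda, openvino, and armnn are the other extras
DOCKER_BUILDKIT=1 docker build --build-arg DEVICE=cpu -t immich-ml:dev .
```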
@@ -93,7 +89,7 @@ WORKDIR /usr/src/app
 ENV TRANSFORMERS_CACHE=/cache \
     PYTHONDONTWRITEBYTECODE=1 \
     PYTHONUNBUFFERED=1 \
-    PATH="/opt/venv/bin:$PATH" \
+    PATH="/usr/src/app/.venv/bin:$PATH" \
     PYTHONPATH=/usr/src \
     DEVICE=${DEVICE}
@@ -102,7 +98,7 @@ RUN echo "hard core 0" >> /etc/security/limits.conf && \
     echo "fs.suid_dumpable 0" >> /etc/sysctl.conf && \
     echo 'ulimit -S -c 0 > /dev/null 2>&1' >> /etc/profile
-COPY --from=builder /opt/venv /opt/venv
+COPY --from=builder /usr/src/app/.venv /usr/src/app/.venv
 COPY ann/ann.py /usr/src/ann/ann.py
 COPY start.sh log_conf.json gunicorn_conf.py ./
 COPY app .
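`uv sync` creates the environment at `.venv` inside the project by default, which is why both the runtime `PATH` and the `COPY --from=builder` line move from `/opt/venv` to `/usr/src/app/.venv`. A quick sanity check against a built image (reusing the placeholder tag from the sketch above):

```sh
# A venv interpreter reports the venv root as its prefix
docker run --rm immich-ml:dev python -c 'import sys; print(sys.prefix)'
# expected output: /usr/src/app/.venv
```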


@@ -5,13 +5,12 @@
 # Setup
-This project uses [Poetry](https://python-poetry.org/docs/#installation), so be sure to install it first.
-Running `poetry install --no-root --with dev --with cpu` will install everything you need in an isolated virtual environment.
-CUDA and OpenVINO are supported as acceleration APIs. To use them, you can replace `--with cpu` with either of `--with cuda` or `--with openvino`. In the case of CUDA, a [compute capability](https://developer.nvidia.com/cuda-gpus) of 5.2 or higher is required.
-To add or remove dependencies, you can use the commands `poetry add $PACKAGE_NAME` and `poetry remove $PACKAGE_NAME`, respectively.
-Be sure to commit the `poetry.lock` and `pyproject.toml` files with `poetry lock --no-update` to reflect any changes in dependencies.
+This project uses [uv](https://docs.astral.sh/uv/getting-started/installation/), so be sure to install it first.
+Running `uv sync --extra cpu` will install everything you need in an isolated virtual environment.
+CUDA and OpenVINO are supported as acceleration APIs. To use them, you can replace `--extra cpu` with either of `--extra cuda` or `--extra openvino`. In the case of CUDA, a [compute capability](https://developer.nvidia.com/cuda-gpus) of 5.2 or higher is required.
+To add or remove dependencies, you can use the commands `uv add $PACKAGE_NAME` and `uv remove $PACKAGE_NAME`, respectively.
+Be sure to commit the `uv.lock` and `pyproject.toml` files with `uv lock` to reflect any changes in dependencies.
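Taken together, the new instructions boil down to this sketch of the dependency workflow (`$PACKAGE_NAME` is a placeholder, as in the README itself):

```sh
uv sync --extra cpu        # create .venv and install everything, including dev tools
uv add "$PACKAGE_NAME"     # add a dependency; uv.lock is updated automatically
uv remove "$PACKAGE_NAME"  # remove it again
uv lock                    # re-resolve and rewrite uv.lock after manual pyproject edits
```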
 # Load Testing
@@ -19,22 +18,25 @@ To measure inference throughput and latency, you can use [Locust](https://locust.
 Locust works by querying the model endpoints and aggregating their statistics, meaning the app must be deployed.
 You can change the models or adjust options like score thresholds through the Locust UI.
 To get started, you can simply run `locust --web-host 127.0.0.1` and open `localhost:8089` in a browser to access the UI. See the [Locust documentation](https://docs.locust.io/en/stable/index.html) for more info on running Locust.
 Note that in Locust's jargon, concurrency is measured in `users`, and each user runs one task at a time. To achieve a particular per-endpoint concurrency, multiply that number by the number of endpoints to be queried. For example, if there are 3 endpoints and you want each of them to receive 8 requests at a time, you should set the number of users to 24.
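Applying that arithmetic on the command line, a hedged example (`--users` and `--spawn-rate` are standard Locust options; adjust the numbers to your endpoint count):

```sh
# 3 endpoints x 8 concurrent requests each => 24 users
locust --web-host 127.0.0.1 --users 24 --spawn-rate 24
```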
 # Facial Recognition
 ## Acknowledgements
 This project utilizes facial recognition models from the [InsightFace](https://github.com/deepinsight/insightface/tree/master/model_zoo) project. We appreciate the work put into developing these models, which have been beneficial to the machine learning part of this project.
 ### Used Models
-* antelopev2
-* buffalo_l
-* buffalo_m
-* buffalo_s
+- antelopev2
+- buffalo_l
+- buffalo_m
+- buffalo_s
 ## License and Use Restrictions
 We have received permission to use the InsightFace facial recognition models in our project, as granted via email by Jia Guo (guojia@insightface.ai) on 18th March 2023. However, it's important to note that this permission does not extend to the redistribution or commercial use of their models by third parties. Users and developers interested in using these models should review the licensing terms provided in the InsightFace GitHub repository.
 For more information on the capabilities of the InsightFace models and to ensure compliance with their license, please refer to their [official repository](https://github.com/deepinsight/insightface). Adhering to the specified licensing terms is crucial for the respectful and lawful use of their work.

File diff suppressed because it is too large


@@ -1,72 +1,77 @@
-[tool.poetry]
+[project]
 name = "machine-learning"
 version = "1.129.0"
 description = ""
-authors = ["Hau Tran <alex.tran1502@gmail.com>"]
+authors = [{ name = "Hau Tran", email = "alex.tran1502@gmail.com" }]
+requires-python = ">=3.10,<4.0"
 readme = "README.md"
-packages = [{include = "app"}]
+dependencies = [
+    "aiocache>=0.12.1,<1.0",
+    "fastapi>=0.95.2,<1.0",
+    "ftfy>=6.1.1",
+    "gunicorn>=21.1.0",
+    "huggingface-hub>=0.20.1,<1.0",
+    "insightface>=0.7.3,<1.0",
+    "opencv-python-headless>=4.7.0.72,<5.0",
+    "orjson>=3.9.5",
+    "pillow>=9.5.0,<11.0",
+    "pydantic>=2.0.0,<3",
+    "pydantic-settings>=2.5.2,<3",
+    "python-multipart>=0.0.6,<1.0",
+    "rich>=13.4.2",
+    "tokenizers>=0.15.0,<1.0",
+    "uvicorn[standard]>=0.22.0,<1.0",
+]

-[tool.poetry.dependencies]
-python = ">=3.10,<4.0"
-insightface = ">=0.7.3,<1.0"
-opencv-python-headless = ">=4.7.0.72,<5.0"
-pillow = ">=9.5.0,<11.0"
-fastapi = ">=0.95.2,<1.0"
-uvicorn = {extras = ["standard"], version = ">=0.22.0,<1.0"}
-pydantic = "^2.0.0"
-pydantic-settings = "^2.5.2"
-aiocache = ">=0.12.1,<1.0"
-rich = ">=13.4.2"
-ftfy = ">=6.1.1"
-python-multipart = ">=0.0.6,<1.0"
-orjson = ">=3.9.5"
-gunicorn = ">=21.1.0"
-huggingface-hub = ">=0.20.1,<1.0"
-tokenizers = ">=0.15.0,<1.0"
+[dependency-groups]
+test = [
+    "httpx>=0.24.1",
+    "pytest>=7.3.1",
+    "pytest-asyncio>=0.21.0",
+    "pytest-cov>=4.1.0",
+    "pytest-mock>=3.11.1",
+]
+types = [
+    "types-pyyaml>=6.0.12.20241230",
+    "types-requests>=2.32.0.20250306",
+    "types-setuptools>=75.8.2.20250305",
+    "types-simplejson>=3.20.0.20250218",
+    "types-ujson>=5.10.0.20240515",
+]
+lint = [
+    "black>=23.3.0",
+    "mypy>=1.3.0",
+    "ruff>=0.0.272",
+    { include-group = "types" },
+]
+dev = ["locust>=2.15.1", { include-group = "test" }, { include-group = "lint" }]

-[tool.poetry.group.dev.dependencies]
-mypy = ">=1.3.0"
-black = ">=23.3.0"
-pytest = ">=7.3.1"
-locust = ">=2.15.1"
-httpx = ">=0.24.1"
-pytest-asyncio = ">=0.21.0"
-pytest-cov = ">=4.1.0"
-ruff = ">=0.0.272"
-pytest-mock = ">=3.11.1"
+[project.optional-dependencies]
+cpu = ["onnxruntime>=1.15.0,<2"]
+cuda = ["onnxruntime-gpu>=1.17.0,<2"]
+openvino = ["onnxruntime-openvino>=1.17.1,<1.19.0"]
+armnn = ["onnxruntime>=1.15.0,<2"]

-[tool.poetry.group.cpu]
-optional = true
-
-[tool.poetry.group.cpu.dependencies]
-onnxruntime = "^1.15.0"
-
-[tool.poetry.group.cuda]
-optional = true
-
-[tool.poetry.group.cuda.dependencies]
-onnxruntime-gpu = {version = "^1.17.0", source = "cuda12"}
-
-[tool.poetry.group.openvino]
-optional = true
-
-[tool.poetry.group.openvino.dependencies]
-onnxruntime-openvino = ">=1.17.1,<1.19.0"
-
-[tool.poetry.group.armnn]
-optional = true
-
-[tool.poetry.group.armnn.dependencies]
-onnxruntime = "^1.15.0"
+[tool.uv]
+compile-bytecode = true

-[[tool.poetry.source]]
+[[tool.uv.index]]
 name = "cuda12"
 url = "https://aiinfra.pkgs.visualstudio.com/PublicPackages/_packaging/onnxruntime-cuda-12/pypi/simple/"
-priority = "explicit"
+explicit = true
+
+[tool.uv.sources]
+onnxruntime-gpu = { index = "cuda12" }
+
+[tool.hatch.build.targets.sdist]
+include = ["app"]
+
+[tool.hatch.build.targets.wheel]
+include = ["app"]

 [build-system]
-requires = ["poetry-core"]
-build-backend = "poetry.core.masonry.api"
+requires = ["hatchling"]
+build-backend = "hatchling.build"

 [tool.mypy]
 python_version = "3.11"
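As a sketch of how the groups and extras above are consumed at install time (uv syncs the `dev` group by default, so `--no-dev` yields the production-style install the Dockerfile uses):

```sh
uv sync --extra cpu                    # dev group plus CPU onnxruntime
uv sync --extra cuda                   # onnxruntime-gpu, resolved from the explicit cuda12 index
uv sync --frozen --extra cpu --no-dev  # lockfile-exact, no dev tools
```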

machine-learning/uv.lock (generated, new file, 2648 lines added)

File diff suppressed because it is too large


@@ -73,7 +73,7 @@ if [ "$CURRENT_SERVER" != "$NEXT_SERVER" ]; then
   npm --prefix web i --package-lock-only
   npm --prefix e2e version "$SERVER_PUMP"
   npm --prefix e2e i --package-lock-only
-  poetry --directory machine-learning version "$SERVER_PUMP"
+  uvx --from=toml-cli toml set --toml-path=pyproject.toml project.version "$SERVER_PUMP"
 fi
 if [ "$CURRENT_MOBILE" != "$NEXT_MOBILE" ]; then